{"current_steps": 1, "total_steps": 10853, "loss": 0.3834, "learning_rate": 9.208103130755065e-09, "epoch": 9.213617727000507e-05, "percentage": 0.01, "elapsed_time": "0:00:14", "remaining_time": "1 day, 19:29:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2, "total_steps": 10853, "loss": 0.3996, "learning_rate": 1.841620626151013e-08, "epoch": 0.00018427235454001014, "percentage": 0.02, "elapsed_time": "0:00:25", "remaining_time": "1 day, 14:34:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3, "total_steps": 10853, "loss": 0.4053, "learning_rate": 2.7624309392265195e-08, "epoch": 0.0002764085318100152, "percentage": 0.03, "elapsed_time": "0:00:36", "remaining_time": "1 day, 12:37:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4, "total_steps": 10853, "loss": 0.3794, "learning_rate": 3.683241252302026e-08, "epoch": 0.0003685447090800203, "percentage": 0.04, "elapsed_time": "0:00:47", "remaining_time": "1 day, 11:42:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5, "total_steps": 10853, "loss": 0.3735, "learning_rate": 4.604051565377533e-08, "epoch": 0.0004606808863500253, "percentage": 0.05, "elapsed_time": "0:00:57", "remaining_time": "1 day, 10:55:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6, "total_steps": 10853, "loss": 0.3882, "learning_rate": 5.524861878453039e-08, "epoch": 0.0005528170636200304, "percentage": 0.06, "elapsed_time": "0:01:08", "remaining_time": "1 day, 10:21:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7, "total_steps": 10853, "loss": 0.3758, "learning_rate": 6.445672191528546e-08, "epoch": 0.0006449532408900354, "percentage": 0.06, "elapsed_time": "0:01:19", "remaining_time": "1 day, 10:13:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8, "total_steps": 10853, "loss": 0.3758, "learning_rate": 7.366482504604052e-08, "epoch": 0.0007370894181600406, "percentage": 0.07, "elapsed_time": "0:01:30", "remaining_time": "1 day, 10:03:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9, "total_steps": 10853, "loss": 0.4019, "learning_rate": 8.287292817679558e-08, "epoch": 0.0008292255954300456, "percentage": 0.08, "elapsed_time": "0:01:40", "remaining_time": "1 day, 9:30:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10, "total_steps": 10853, "loss": 0.3827, "learning_rate": 9.208103130755066e-08, "epoch": 0.0009213617727000506, "percentage": 0.09, "elapsed_time": "0:01:49", "remaining_time": "1 day, 9:03:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11, "total_steps": 10853, "loss": 0.3846, "learning_rate": 1.0128913443830572e-07, "epoch": 0.0010134979499700557, "percentage": 0.1, "elapsed_time": "0:01:59", "remaining_time": "1 day, 8:42:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12, "total_steps": 10853, "loss": 0.3843, "learning_rate": 1.1049723756906078e-07, "epoch": 0.0011056341272400608, "percentage": 0.11, "elapsed_time": "0:02:08", "remaining_time": "1 day, 8:16:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13, "total_steps": 10853, "loss": 0.3511, "learning_rate": 1.1970534069981586e-07, "epoch": 0.001197770304510066, "percentage": 0.12, "elapsed_time": "0:02:18", "remaining_time": "1 day, 8:05:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14, "total_steps": 10853, "loss": 0.3672, "learning_rate": 1.2891344383057092e-07, "epoch": 0.0012899064817800709, "percentage": 0.13, "elapsed_time": "0:02:30", "remaining_time": "1 day, 8:22:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15, "total_steps": 10853, "loss": 0.3796, "learning_rate": 1.3812154696132598e-07, "epoch": 0.001382042659050076, "percentage": 0.14, "elapsed_time": "0:02:41", "remaining_time": "1 day, 8:23:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16, "total_steps": 10853, "loss": 0.3803, "learning_rate": 1.4732965009208104e-07, "epoch": 0.0014741788363200811, "percentage": 0.15, "elapsed_time": "0:02:53", "remaining_time": "1 day, 8:37:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17, "total_steps": 10853, "loss": 0.3716, "learning_rate": 1.5653775322283613e-07, "epoch": 0.001566315013590086, "percentage": 0.16, "elapsed_time": "0:03:03", "remaining_time": "1 day, 8:33:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18, "total_steps": 10853, "loss": 0.3838, "learning_rate": 1.6574585635359117e-07, "epoch": 0.0016584511908600912, "percentage": 0.17, "elapsed_time": "0:03:14", "remaining_time": "1 day, 8:30:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19, "total_steps": 10853, "loss": 0.3516, "learning_rate": 1.7495395948434625e-07, "epoch": 0.0017505873681300963, "percentage": 0.18, "elapsed_time": "0:03:24", "remaining_time": "1 day, 8:19:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20, "total_steps": 10853, "loss": 0.3971, "learning_rate": 1.8416206261510132e-07, "epoch": 0.0018427235454001013, "percentage": 0.18, "elapsed_time": "0:03:34", "remaining_time": "1 day, 8:20:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21, "total_steps": 10853, "loss": 0.3621, "learning_rate": 1.9337016574585635e-07, "epoch": 0.0019348597226701064, "percentage": 0.19, "elapsed_time": "0:03:47", "remaining_time": "1 day, 8:31:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22, "total_steps": 10853, "loss": 0.3671, "learning_rate": 2.0257826887661144e-07, "epoch": 0.0020269958999401113, "percentage": 0.2, "elapsed_time": "0:03:57", "remaining_time": "1 day, 8:25:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23, "total_steps": 10853, "loss": 0.3586, "learning_rate": 2.1178637200736653e-07, "epoch": 0.0021191320772101165, "percentage": 0.21, "elapsed_time": "0:04:06", "remaining_time": "1 day, 8:18:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24, "total_steps": 10853, "loss": 0.3351, "learning_rate": 2.2099447513812156e-07, "epoch": 0.0022112682544801216, "percentage": 0.22, "elapsed_time": "0:04:16", "remaining_time": "1 day, 8:09:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 25, "total_steps": 10853, "loss": 0.3547, "learning_rate": 2.3020257826887662e-07, "epoch": 0.0023034044317501268, "percentage": 0.23, "elapsed_time": "0:04:27", "remaining_time": "1 day, 8:10:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 26, "total_steps": 10853, "loss": 0.3643, "learning_rate": 2.394106813996317e-07, "epoch": 0.002395540609020132, "percentage": 0.24, "elapsed_time": "0:04:38", "remaining_time": "1 day, 8:12:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 27, "total_steps": 10853, "loss": 0.3735, "learning_rate": 2.486187845303868e-07, "epoch": 0.002487676786290137, "percentage": 0.25, "elapsed_time": "0:04:49", "remaining_time": "1 day, 8:13:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 28, "total_steps": 10853, "loss": 0.3538, "learning_rate": 2.5782688766114184e-07, "epoch": 0.0025798129635601417, "percentage": 0.26, "elapsed_time": "0:05:00", "remaining_time": "1 day, 8:14:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 29, "total_steps": 10853, "loss": 0.3466, "learning_rate": 2.670349907918969e-07, "epoch": 0.002671949140830147, "percentage": 0.27, "elapsed_time": "0:05:10", "remaining_time": "1 day, 8:14:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 30, "total_steps": 10853, "loss": 0.3678, "learning_rate": 2.7624309392265196e-07, "epoch": 0.002764085318100152, "percentage": 0.28, "elapsed_time": "0:05:21", "remaining_time": "1 day, 8:14:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 31, "total_steps": 10853, "loss": 0.3472, "learning_rate": 2.85451197053407e-07, "epoch": 0.002856221495370157, "percentage": 0.29, "elapsed_time": "0:05:32", "remaining_time": "1 day, 8:17:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 32, "total_steps": 10853, "loss": 0.3326, "learning_rate": 2.946593001841621e-07, "epoch": 0.0029483576726401623, "percentage": 0.29, "elapsed_time": "0:05:43", "remaining_time": "1 day, 8:17:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 33, "total_steps": 10853, "loss": 0.3714, "learning_rate": 3.0386740331491715e-07, "epoch": 0.0030404938499101674, "percentage": 0.3, "elapsed_time": "0:05:56", "remaining_time": "1 day, 8:29:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 34, "total_steps": 10853, "loss": 0.3392, "learning_rate": 3.1307550644567226e-07, "epoch": 0.003132630027180172, "percentage": 0.31, "elapsed_time": "0:06:06", "remaining_time": "1 day, 8:22:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 35, "total_steps": 10853, "loss": 0.3501, "learning_rate": 3.2228360957642727e-07, "epoch": 0.0032247662044501773, "percentage": 0.32, "elapsed_time": "0:06:17", "remaining_time": "1 day, 8:24:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 36, "total_steps": 10853, "loss": 0.3466, "learning_rate": 3.3149171270718233e-07, "epoch": 0.0033169023817201824, "percentage": 0.33, "elapsed_time": "0:06:27", "remaining_time": "1 day, 8:21:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 37, "total_steps": 10853, "loss": 0.3354, "learning_rate": 3.4069981583793745e-07, "epoch": 0.0034090385589901876, "percentage": 0.34, "elapsed_time": "0:06:39", "remaining_time": "1 day, 8:27:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 38, "total_steps": 10853, "loss": 0.3341, "learning_rate": 3.499079189686925e-07, "epoch": 0.0035011747362601927, "percentage": 0.35, "elapsed_time": "0:06:51", "remaining_time": "1 day, 8:31:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 39, "total_steps": 10853, "loss": 0.3518, "learning_rate": 3.591160220994475e-07, "epoch": 0.003593310913530198, "percentage": 0.36, "elapsed_time": "0:07:02", "remaining_time": "1 day, 8:30:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 40, "total_steps": 10853, "loss": 0.2944, "learning_rate": 3.6832412523020263e-07, "epoch": 0.0036854470908002025, "percentage": 0.37, "elapsed_time": "0:07:12", "remaining_time": "1 day, 8:28:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 41, "total_steps": 10853, "loss": 0.3516, "learning_rate": 3.775322283609577e-07, "epoch": 0.0037775832680702077, "percentage": 0.38, "elapsed_time": "0:07:23", "remaining_time": "1 day, 8:30:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 42, "total_steps": 10853, "loss": 0.2974, "learning_rate": 3.867403314917127e-07, "epoch": 0.003869719445340213, "percentage": 0.39, "elapsed_time": "0:07:36", "remaining_time": "1 day, 8:36:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 43, "total_steps": 10853, "loss": 0.3482, "learning_rate": 3.959484346224678e-07, "epoch": 0.003961855622610218, "percentage": 0.4, "elapsed_time": "0:07:47", "remaining_time": "1 day, 8:38:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 44, "total_steps": 10853, "loss": 0.2894, "learning_rate": 4.051565377532229e-07, "epoch": 0.004053991799880223, "percentage": 0.41, "elapsed_time": "0:07:58", "remaining_time": "1 day, 8:37:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 45, "total_steps": 10853, "loss": 0.3062, "learning_rate": 4.1436464088397794e-07, "epoch": 0.004146127977150228, "percentage": 0.41, "elapsed_time": "0:08:07", "remaining_time": "1 day, 8:32:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 46, "total_steps": 10853, "loss": 0.318, "learning_rate": 4.2357274401473305e-07, "epoch": 0.004238264154420233, "percentage": 0.42, "elapsed_time": "0:08:18", "remaining_time": "1 day, 8:30:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 47, "total_steps": 10853, "loss": 0.3012, "learning_rate": 4.3278084714548806e-07, "epoch": 0.0043304003316902385, "percentage": 0.43, "elapsed_time": "0:08:27", "remaining_time": "1 day, 8:24:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 48, "total_steps": 10853, "loss": 0.3069, "learning_rate": 4.419889502762431e-07, "epoch": 0.004422536508960243, "percentage": 0.44, "elapsed_time": "0:08:38", "remaining_time": "1 day, 8:25:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 49, "total_steps": 10853, "loss": 0.3099, "learning_rate": 4.5119705340699824e-07, "epoch": 0.004514672686230248, "percentage": 0.45, "elapsed_time": "0:08:50", "remaining_time": "1 day, 8:30:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 50, "total_steps": 10853, "loss": 0.3363, "learning_rate": 4.6040515653775325e-07, "epoch": 0.0046068088635002535, "percentage": 0.46, "elapsed_time": "0:09:02", "remaining_time": "1 day, 8:33:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 51, "total_steps": 10853, "loss": 0.2906, "learning_rate": 4.696132596685083e-07, "epoch": 0.004698945040770258, "percentage": 0.47, "elapsed_time": "0:09:14", "remaining_time": "1 day, 8:37:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 52, "total_steps": 10853, "loss": 0.3293, "learning_rate": 4.788213627992634e-07, "epoch": 0.004791081218040264, "percentage": 0.48, "elapsed_time": "0:09:25", "remaining_time": "1 day, 8:36:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 53, "total_steps": 10853, "loss": 0.2983, "learning_rate": 4.880294659300184e-07, "epoch": 0.0048832173953102685, "percentage": 0.49, "elapsed_time": "0:09:37", "remaining_time": "1 day, 8:42:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 54, "total_steps": 10853, "loss": 0.3062, "learning_rate": 4.972375690607735e-07, "epoch": 0.004975353572580274, "percentage": 0.5, "elapsed_time": "0:09:48", "remaining_time": "1 day, 8:43:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 55, "total_steps": 10853, "loss": 0.2957, "learning_rate": 5.064456721915287e-07, "epoch": 0.005067489749850279, "percentage": 0.51, "elapsed_time": "0:09:59", "remaining_time": "1 day, 8:41:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 56, "total_steps": 10853, "loss": 0.3123, "learning_rate": 5.156537753222837e-07, "epoch": 0.0051596259271202835, "percentage": 0.52, "elapsed_time": "0:10:09", "remaining_time": "1 day, 8:39:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 57, "total_steps": 10853, "loss": 0.3136, "learning_rate": 5.248618784530387e-07, "epoch": 0.005251762104390289, "percentage": 0.53, "elapsed_time": "0:10:21", "remaining_time": "1 day, 8:41:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 58, "total_steps": 10853, "loss": 0.2735, "learning_rate": 5.340699815837938e-07, "epoch": 0.005343898281660294, "percentage": 0.53, "elapsed_time": "0:10:32", "remaining_time": "1 day, 8:42:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 59, "total_steps": 10853, "loss": 0.2884, "learning_rate": 5.432780847145488e-07, "epoch": 0.005436034458930299, "percentage": 0.54, "elapsed_time": "0:10:42", "remaining_time": "1 day, 8:39:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 60, "total_steps": 10853, "loss": 0.2867, "learning_rate": 5.524861878453039e-07, "epoch": 0.005528170636200304, "percentage": 0.55, "elapsed_time": "0:10:53", "remaining_time": "1 day, 8:38:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 61, "total_steps": 10853, "loss": 0.298, "learning_rate": 5.61694290976059e-07, "epoch": 0.005620306813470309, "percentage": 0.56, "elapsed_time": "0:11:04", "remaining_time": "1 day, 8:40:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 62, "total_steps": 10853, "loss": 0.3088, "learning_rate": 5.70902394106814e-07, "epoch": 0.005712442990740314, "percentage": 0.57, "elapsed_time": "0:11:15", "remaining_time": "1 day, 8:40:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 63, "total_steps": 10853, "loss": 0.2788, "learning_rate": 5.80110497237569e-07, "epoch": 0.005804579168010319, "percentage": 0.58, "elapsed_time": "0:11:27", "remaining_time": "1 day, 8:41:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 64, "total_steps": 10853, "loss": 0.3007, "learning_rate": 5.893186003683242e-07, "epoch": 0.005896715345280325, "percentage": 0.59, "elapsed_time": "0:11:37", "remaining_time": "1 day, 8:38:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 65, "total_steps": 10853, "loss": 0.2784, "learning_rate": 5.985267034990793e-07, "epoch": 0.005988851522550329, "percentage": 0.6, "elapsed_time": "0:11:48", "remaining_time": "1 day, 8:39:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 66, "total_steps": 10853, "loss": 0.2824, "learning_rate": 6.077348066298343e-07, "epoch": 0.006080987699820335, "percentage": 0.61, "elapsed_time": "0:11:58", "remaining_time": "1 day, 8:37:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 67, "total_steps": 10853, "loss": 0.2809, "learning_rate": 6.169429097605894e-07, "epoch": 0.00617312387709034, "percentage": 0.62, "elapsed_time": "0:12:10", "remaining_time": "1 day, 8:40:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 68, "total_steps": 10853, "loss": 0.2803, "learning_rate": 6.261510128913445e-07, "epoch": 0.006265260054360344, "percentage": 0.63, "elapsed_time": "0:12:23", "remaining_time": "1 day, 8:44:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 69, "total_steps": 10853, "loss": 0.2722, "learning_rate": 6.353591160220995e-07, "epoch": 0.00635739623163035, "percentage": 0.64, "elapsed_time": "0:12:33", "remaining_time": "1 day, 8:42:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 70, "total_steps": 10853, "loss": 0.2856, "learning_rate": 6.445672191528545e-07, "epoch": 0.0064495324089003546, "percentage": 0.64, "elapsed_time": "0:12:42", "remaining_time": "1 day, 8:38:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 71, "total_steps": 10853, "loss": 0.2821, "learning_rate": 6.537753222836097e-07, "epoch": 0.00654166858617036, "percentage": 0.65, "elapsed_time": "0:12:54", "remaining_time": "1 day, 8:40:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 72, "total_steps": 10853, "loss": 0.2859, "learning_rate": 6.629834254143647e-07, "epoch": 0.006633804763440365, "percentage": 0.66, "elapsed_time": "0:13:04", "remaining_time": "1 day, 8:38:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 73, "total_steps": 10853, "loss": 0.2693, "learning_rate": 6.721915285451197e-07, "epoch": 0.0067259409407103695, "percentage": 0.67, "elapsed_time": "0:13:15", "remaining_time": "1 day, 8:36:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 74, "total_steps": 10853, "loss": 0.2678, "learning_rate": 6.813996316758749e-07, "epoch": 0.006818077117980375, "percentage": 0.68, "elapsed_time": "0:13:26", "remaining_time": "1 day, 8:36:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 75, "total_steps": 10853, "loss": 0.2752, "learning_rate": 6.906077348066299e-07, "epoch": 0.00691021329525038, "percentage": 0.69, "elapsed_time": "0:13:36", "remaining_time": "1 day, 8:35:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 76, "total_steps": 10853, "loss": 0.2893, "learning_rate": 6.99815837937385e-07, "epoch": 0.007002349472520385, "percentage": 0.7, "elapsed_time": "0:13:47", "remaining_time": "1 day, 8:35:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 77, "total_steps": 10853, "loss": 0.26, "learning_rate": 7.0902394106814e-07, "epoch": 0.00709448564979039, "percentage": 0.71, "elapsed_time": "0:13:57", "remaining_time": "1 day, 8:33:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 78, "total_steps": 10853, "loss": 0.2838, "learning_rate": 7.18232044198895e-07, "epoch": 0.007186621827060396, "percentage": 0.72, "elapsed_time": "0:14:08", "remaining_time": "1 day, 8:34:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 79, "total_steps": 10853, "loss": 0.2673, "learning_rate": 7.274401473296501e-07, "epoch": 0.0072787580043304, "percentage": 0.73, "elapsed_time": "0:14:20", "remaining_time": "1 day, 8:35:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 80, "total_steps": 10853, "loss": 0.2795, "learning_rate": 7.366482504604053e-07, "epoch": 0.007370894181600405, "percentage": 0.74, "elapsed_time": "0:14:31", "remaining_time": "1 day, 8:36:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 81, "total_steps": 10853, "loss": 0.274, "learning_rate": 7.458563535911603e-07, "epoch": 0.007463030358870411, "percentage": 0.75, "elapsed_time": "0:14:43", "remaining_time": "1 day, 8:38:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 82, "total_steps": 10853, "loss": 0.237, "learning_rate": 7.550644567219154e-07, "epoch": 0.007555166536140415, "percentage": 0.76, "elapsed_time": "0:14:54", "remaining_time": "1 day, 8:37:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 83, "total_steps": 10853, "loss": 0.2535, "learning_rate": 7.642725598526704e-07, "epoch": 0.007647302713410421, "percentage": 0.76, "elapsed_time": "0:15:06", "remaining_time": "1 day, 8:39:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 84, "total_steps": 10853, "loss": 0.2579, "learning_rate": 7.734806629834254e-07, "epoch": 0.007739438890680426, "percentage": 0.77, "elapsed_time": "0:15:16", "remaining_time": "1 day, 8:38:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 85, "total_steps": 10853, "loss": 0.2553, "learning_rate": 7.826887661141805e-07, "epoch": 0.00783157506795043, "percentage": 0.78, "elapsed_time": "0:15:27", "remaining_time": "1 day, 8:38:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 86, "total_steps": 10853, "loss": 0.2552, "learning_rate": 7.918968692449356e-07, "epoch": 0.007923711245220436, "percentage": 0.79, "elapsed_time": "0:15:36", "remaining_time": "1 day, 8:35:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 87, "total_steps": 10853, "loss": 0.2544, "learning_rate": 8.011049723756907e-07, "epoch": 0.008015847422490441, "percentage": 0.8, "elapsed_time": "0:15:47", "remaining_time": "1 day, 8:33:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 88, "total_steps": 10853, "loss": 0.2697, "learning_rate": 8.103130755064458e-07, "epoch": 0.008107983599760445, "percentage": 0.81, "elapsed_time": "0:15:56", "remaining_time": "1 day, 8:30:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 89, "total_steps": 10853, "loss": 0.2477, "learning_rate": 8.195211786372008e-07, "epoch": 0.008200119777030451, "percentage": 0.82, "elapsed_time": "0:16:05", "remaining_time": "1 day, 8:26:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 90, "total_steps": 10853, "loss": 0.2627, "learning_rate": 8.287292817679559e-07, "epoch": 0.008292255954300456, "percentage": 0.83, "elapsed_time": "0:16:16", "remaining_time": "1 day, 8:26:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 91, "total_steps": 10853, "loss": 0.2851, "learning_rate": 8.379373848987109e-07, "epoch": 0.00838439213157046, "percentage": 0.84, "elapsed_time": "0:16:26", "remaining_time": "1 day, 8:24:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 92, "total_steps": 10853, "loss": 0.2619, "learning_rate": 8.471454880294661e-07, "epoch": 0.008476528308840466, "percentage": 0.85, "elapsed_time": "0:16:37", "remaining_time": "1 day, 8:25:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 93, "total_steps": 10853, "loss": 0.2579, "learning_rate": 8.563535911602211e-07, "epoch": 0.008568664486110471, "percentage": 0.86, "elapsed_time": "0:16:48", "remaining_time": "1 day, 8:24:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 94, "total_steps": 10853, "loss": 0.2461, "learning_rate": 8.655616942909761e-07, "epoch": 0.008660800663380477, "percentage": 0.87, "elapsed_time": "0:16:59", "remaining_time": "1 day, 8:24:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 95, "total_steps": 10853, "loss": 0.2838, "learning_rate": 8.747697974217311e-07, "epoch": 0.008752936840650481, "percentage": 0.88, "elapsed_time": "0:17:11", "remaining_time": "1 day, 8:26:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 96, "total_steps": 10853, "loss": 0.255, "learning_rate": 8.839779005524863e-07, "epoch": 0.008845073017920486, "percentage": 0.88, "elapsed_time": "0:17:22", "remaining_time": "1 day, 8:27:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 97, "total_steps": 10853, "loss": 0.2563, "learning_rate": 8.931860036832413e-07, "epoch": 0.008937209195190492, "percentage": 0.89, "elapsed_time": "0:17:33", "remaining_time": "1 day, 8:27:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 98, "total_steps": 10853, "loss": 0.2482, "learning_rate": 9.023941068139965e-07, "epoch": 0.009029345372460496, "percentage": 0.9, "elapsed_time": "0:17:44", "remaining_time": "1 day, 8:27:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 99, "total_steps": 10853, "loss": 0.2524, "learning_rate": 9.116022099447515e-07, "epoch": 0.009121481549730501, "percentage": 0.91, "elapsed_time": "0:17:55", "remaining_time": "1 day, 8:26:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 100, "total_steps": 10853, "loss": 0.2371, "learning_rate": 9.208103130755065e-07, "epoch": 0.009213617727000507, "percentage": 0.92, "elapsed_time": "0:18:07", "remaining_time": "1 day, 8:28:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 101, "total_steps": 10853, "loss": 0.2508, "learning_rate": 9.300184162062616e-07, "epoch": 0.009305753904270513, "percentage": 0.93, "elapsed_time": "0:18:18", "remaining_time": "1 day, 8:28:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 102, "total_steps": 10853, "loss": 0.2719, "learning_rate": 9.392265193370166e-07, "epoch": 0.009397890081540516, "percentage": 0.94, "elapsed_time": "0:18:28", "remaining_time": "1 day, 8:27:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 103, "total_steps": 10853, "loss": 0.2406, "learning_rate": 9.484346224677716e-07, "epoch": 0.009490026258810522, "percentage": 0.95, "elapsed_time": "0:18:40", "remaining_time": "1 day, 8:29:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 104, "total_steps": 10853, "loss": 0.2594, "learning_rate": 9.576427255985269e-07, "epoch": 0.009582162436080528, "percentage": 0.96, "elapsed_time": "0:18:52", "remaining_time": "1 day, 8:30:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 105, "total_steps": 10853, "loss": 0.2578, "learning_rate": 9.66850828729282e-07, "epoch": 0.009674298613350531, "percentage": 0.97, "elapsed_time": "0:19:03", "remaining_time": "1 day, 8:30:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 106, "total_steps": 10853, "loss": 0.2449, "learning_rate": 9.760589318600369e-07, "epoch": 0.009766434790620537, "percentage": 0.98, "elapsed_time": "0:19:13", "remaining_time": "1 day, 8:29:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 107, "total_steps": 10853, "loss": 0.23, "learning_rate": 9.85267034990792e-07, "epoch": 0.009858570967890543, "percentage": 0.99, "elapsed_time": "0:19:23", "remaining_time": "1 day, 8:28:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 108, "total_steps": 10853, "loss": 0.2575, "learning_rate": 9.94475138121547e-07, "epoch": 0.009950707145160548, "percentage": 1.0, "elapsed_time": "0:19:33", "remaining_time": "1 day, 8:25:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 109, "total_steps": 10853, "loss": 0.2414, "learning_rate": 1.003683241252302e-06, "epoch": 0.010042843322430552, "percentage": 1.0, "elapsed_time": "0:19:43", "remaining_time": "1 day, 8:25:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 110, "total_steps": 10853, "loss": 0.2422, "learning_rate": 1.0128913443830573e-06, "epoch": 0.010134979499700558, "percentage": 1.01, "elapsed_time": "0:19:55", "remaining_time": "1 day, 8:25:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 111, "total_steps": 10853, "loss": 0.2504, "learning_rate": 1.0220994475138122e-06, "epoch": 0.010227115676970563, "percentage": 1.02, "elapsed_time": "0:20:05", "remaining_time": "1 day, 8:24:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 112, "total_steps": 10853, "loss": 0.2625, "learning_rate": 1.0313075506445673e-06, "epoch": 0.010319251854240567, "percentage": 1.03, "elapsed_time": "0:20:17", "remaining_time": "1 day, 8:26:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 113, "total_steps": 10853, "loss": 0.2717, "learning_rate": 1.0405156537753222e-06, "epoch": 0.010411388031510573, "percentage": 1.04, "elapsed_time": "0:20:29", "remaining_time": "1 day, 8:27:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 114, "total_steps": 10853, "loss": 0.2338, "learning_rate": 1.0497237569060774e-06, "epoch": 0.010503524208780578, "percentage": 1.05, "elapsed_time": "0:20:41", "remaining_time": "1 day, 8:28:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 115, "total_steps": 10853, "loss": 0.2571, "learning_rate": 1.0589318600368325e-06, "epoch": 0.010595660386050582, "percentage": 1.06, "elapsed_time": "0:20:52", "remaining_time": "1 day, 8:29:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 116, "total_steps": 10853, "loss": 0.2181, "learning_rate": 1.0681399631675876e-06, "epoch": 0.010687796563320588, "percentage": 1.07, "elapsed_time": "0:21:02", "remaining_time": "1 day, 8:27:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 117, "total_steps": 10853, "loss": 0.2413, "learning_rate": 1.0773480662983427e-06, "epoch": 0.010779932740590593, "percentage": 1.08, "elapsed_time": "0:21:13", "remaining_time": "1 day, 8:28:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 118, "total_steps": 10853, "loss": 0.2561, "learning_rate": 1.0865561694290976e-06, "epoch": 0.010872068917860599, "percentage": 1.09, "elapsed_time": "0:21:24", "remaining_time": "1 day, 8:27:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 119, "total_steps": 10853, "loss": 0.2393, "learning_rate": 1.0957642725598527e-06, "epoch": 0.010964205095130602, "percentage": 1.1, "elapsed_time": "0:21:35", "remaining_time": "1 day, 8:27:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 120, "total_steps": 10853, "loss": 0.2349, "learning_rate": 1.1049723756906078e-06, "epoch": 0.011056341272400608, "percentage": 1.11, "elapsed_time": "0:21:45", "remaining_time": "1 day, 8:26:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 121, "total_steps": 10853, "loss": 0.2315, "learning_rate": 1.114180478821363e-06, "epoch": 0.011148477449670614, "percentage": 1.11, "elapsed_time": "0:21:56", "remaining_time": "1 day, 8:26:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 122, "total_steps": 10853, "loss": 0.2442, "learning_rate": 1.123388581952118e-06, "epoch": 0.011240613626940617, "percentage": 1.12, "elapsed_time": "0:22:07", "remaining_time": "1 day, 8:25:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 123, "total_steps": 10853, "loss": 0.2427, "learning_rate": 1.132596685082873e-06, "epoch": 0.011332749804210623, "percentage": 1.13, "elapsed_time": "0:22:18", "remaining_time": "1 day, 8:25:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 124, "total_steps": 10853, "loss": 0.2507, "learning_rate": 1.141804788213628e-06, "epoch": 0.011424885981480629, "percentage": 1.14, "elapsed_time": "0:22:29", "remaining_time": "1 day, 8:25:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 125, "total_steps": 10853, "loss": 0.2491, "learning_rate": 1.1510128913443832e-06, "epoch": 0.011517022158750634, "percentage": 1.15, "elapsed_time": "0:22:40", "remaining_time": "1 day, 8:25:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 126, "total_steps": 10853, "loss": 0.2238, "learning_rate": 1.160220994475138e-06, "epoch": 0.011609158336020638, "percentage": 1.16, "elapsed_time": "0:22:50", "remaining_time": "1 day, 8:24:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 127, "total_steps": 10853, "loss": 0.2306, "learning_rate": 1.1694290976058934e-06, "epoch": 0.011701294513290644, "percentage": 1.17, "elapsed_time": "0:23:01", "remaining_time": "1 day, 8:24:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 128, "total_steps": 10853, "loss": 0.2529, "learning_rate": 1.1786372007366483e-06, "epoch": 0.01179343069056065, "percentage": 1.18, "elapsed_time": "0:23:12", "remaining_time": "1 day, 8:24:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 129, "total_steps": 10853, "loss": 0.2297, "learning_rate": 1.1878453038674034e-06, "epoch": 0.011885566867830653, "percentage": 1.19, "elapsed_time": "0:23:24", "remaining_time": "1 day, 8:25:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 130, "total_steps": 10853, "loss": 0.2428, "learning_rate": 1.1970534069981586e-06, "epoch": 0.011977703045100659, "percentage": 1.2, "elapsed_time": "0:23:35", "remaining_time": "1 day, 8:26:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 131, "total_steps": 10853, "loss": 0.2387, "learning_rate": 1.2062615101289135e-06, "epoch": 0.012069839222370664, "percentage": 1.21, "elapsed_time": "0:23:47", "remaining_time": "1 day, 8:27:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 132, "total_steps": 10853, "loss": 0.2606, "learning_rate": 1.2154696132596686e-06, "epoch": 0.01216197539964067, "percentage": 1.22, "elapsed_time": "0:23:58", "remaining_time": "1 day, 8:27:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 133, "total_steps": 10853, "loss": 0.2558, "learning_rate": 1.2246777163904237e-06, "epoch": 0.012254111576910674, "percentage": 1.23, "elapsed_time": "0:24:10", "remaining_time": "1 day, 8:27:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 134, "total_steps": 10853, "loss": 0.2131, "learning_rate": 1.2338858195211788e-06, "epoch": 0.01234624775418068, "percentage": 1.23, "elapsed_time": "0:24:20", "remaining_time": "1 day, 8:27:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 135, "total_steps": 10853, "loss": 0.2607, "learning_rate": 1.243093922651934e-06, "epoch": 0.012438383931450685, "percentage": 1.24, "elapsed_time": "0:24:31", "remaining_time": "1 day, 8:26:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 136, "total_steps": 10853, "loss": 0.2543, "learning_rate": 1.252302025782689e-06, "epoch": 0.012530520108720689, "percentage": 1.25, "elapsed_time": "0:24:43", "remaining_time": "1 day, 8:27:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 137, "total_steps": 10853, "loss": 0.2066, "learning_rate": 1.261510128913444e-06, "epoch": 0.012622656285990694, "percentage": 1.26, "elapsed_time": "0:24:55", "remaining_time": "1 day, 8:29:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 138, "total_steps": 10853, "loss": 0.2428, "learning_rate": 1.270718232044199e-06, "epoch": 0.0127147924632607, "percentage": 1.27, "elapsed_time": "0:25:05", "remaining_time": "1 day, 8:28:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 139, "total_steps": 10853, "loss": 0.2452, "learning_rate": 1.2799263351749542e-06, "epoch": 0.012806928640530704, "percentage": 1.28, "elapsed_time": "0:25:15", "remaining_time": "1 day, 8:27:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 140, "total_steps": 10853, "loss": 0.2375, "learning_rate": 1.289134438305709e-06, "epoch": 0.012899064817800709, "percentage": 1.29, "elapsed_time": "0:25:26", "remaining_time": "1 day, 8:27:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 141, "total_steps": 10853, "loss": 0.2296, "learning_rate": 1.2983425414364642e-06, "epoch": 0.012991200995070715, "percentage": 1.3, "elapsed_time": "0:25:38", "remaining_time": "1 day, 8:27:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 142, "total_steps": 10853, "loss": 0.2249, "learning_rate": 1.3075506445672193e-06, "epoch": 0.01308333717234072, "percentage": 1.31, "elapsed_time": "0:25:49", "remaining_time": "1 day, 8:27:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 143, "total_steps": 10853, "loss": 0.2336, "learning_rate": 1.3167587476979742e-06, "epoch": 0.013175473349610724, "percentage": 1.32, "elapsed_time": "0:25:58", "remaining_time": "1 day, 8:25:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 144, "total_steps": 10853, "loss": 0.2305, "learning_rate": 1.3259668508287293e-06, "epoch": 0.01326760952688073, "percentage": 1.33, "elapsed_time": "0:26:10", "remaining_time": "1 day, 8:26:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 145, "total_steps": 10853, "loss": 0.2524, "learning_rate": 1.3351749539594844e-06, "epoch": 0.013359745704150735, "percentage": 1.34, "elapsed_time": "0:26:21", "remaining_time": "1 day, 8:26:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 146, "total_steps": 10853, "loss": 0.2421, "learning_rate": 1.3443830570902393e-06, "epoch": 0.013451881881420739, "percentage": 1.35, "elapsed_time": "0:26:33", "remaining_time": "1 day, 8:27:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 147, "total_steps": 10853, "loss": 0.256, "learning_rate": 1.3535911602209945e-06, "epoch": 0.013544018058690745, "percentage": 1.35, "elapsed_time": "0:26:46", "remaining_time": "1 day, 8:29:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 148, "total_steps": 10853, "loss": 0.2283, "learning_rate": 1.3627992633517498e-06, "epoch": 0.01363615423596075, "percentage": 1.36, "elapsed_time": "0:26:56", "remaining_time": "1 day, 8:28:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 149, "total_steps": 10853, "loss": 0.231, "learning_rate": 1.372007366482505e-06, "epoch": 0.013728290413230756, "percentage": 1.37, "elapsed_time": "0:27:06", "remaining_time": "1 day, 8:27:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 150, "total_steps": 10853, "loss": 0.2265, "learning_rate": 1.3812154696132598e-06, "epoch": 0.01382042659050076, "percentage": 1.38, "elapsed_time": "0:27:17", "remaining_time": "1 day, 8:26:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 151, "total_steps": 10853, "loss": 0.2347, "learning_rate": 1.390423572744015e-06, "epoch": 0.013912562767770765, "percentage": 1.39, "elapsed_time": "0:27:27", "remaining_time": "1 day, 8:25:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 152, "total_steps": 10853, "loss": 0.2265, "learning_rate": 1.39963167587477e-06, "epoch": 0.01400469894504077, "percentage": 1.4, "elapsed_time": "0:27:37", "remaining_time": "1 day, 8:24:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 153, "total_steps": 10853, "loss": 0.2361, "learning_rate": 1.408839779005525e-06, "epoch": 0.014096835122310775, "percentage": 1.41, "elapsed_time": "0:27:46", "remaining_time": "1 day, 8:22:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 154, "total_steps": 10853, "loss": 0.2538, "learning_rate": 1.41804788213628e-06, "epoch": 0.01418897129958078, "percentage": 1.42, "elapsed_time": "0:27:57", "remaining_time": "1 day, 8:21:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 155, "total_steps": 10853, "loss": 0.2386, "learning_rate": 1.4272559852670352e-06, "epoch": 0.014281107476850786, "percentage": 1.43, "elapsed_time": "0:28:07", "remaining_time": "1 day, 8:20:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 156, "total_steps": 10853, "loss": 0.2503, "learning_rate": 1.43646408839779e-06, "epoch": 0.014373243654120791, "percentage": 1.44, "elapsed_time": "0:28:17", "remaining_time": "1 day, 8:19:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 157, "total_steps": 10853, "loss": 0.2439, "learning_rate": 1.4456721915285452e-06, "epoch": 0.014465379831390795, "percentage": 1.45, "elapsed_time": "0:28:28", "remaining_time": "1 day, 8:19:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 158, "total_steps": 10853, "loss": 0.2325, "learning_rate": 1.4548802946593003e-06, "epoch": 0.0145575160086608, "percentage": 1.46, "elapsed_time": "0:28:38", "remaining_time": "1 day, 8:18:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 159, "total_steps": 10853, "loss": 0.2056, "learning_rate": 1.4640883977900552e-06, "epoch": 0.014649652185930806, "percentage": 1.47, "elapsed_time": "0:28:48", "remaining_time": "1 day, 8:17:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 160, "total_steps": 10853, "loss": 0.2571, "learning_rate": 1.4732965009208105e-06, "epoch": 0.01474178836320081, "percentage": 1.47, "elapsed_time": "0:29:00", "remaining_time": "1 day, 8:18:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 161, "total_steps": 10853, "loss": 0.2195, "learning_rate": 1.4825046040515656e-06, "epoch": 0.014833924540470816, "percentage": 1.48, "elapsed_time": "0:29:10", "remaining_time": "1 day, 8:17:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 162, "total_steps": 10853, "loss": 0.2245, "learning_rate": 1.4917127071823205e-06, "epoch": 0.014926060717740821, "percentage": 1.49, "elapsed_time": "0:29:21", "remaining_time": "1 day, 8:17:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 163, "total_steps": 10853, "loss": 0.2298, "learning_rate": 1.5009208103130757e-06, "epoch": 0.015018196895010825, "percentage": 1.5, "elapsed_time": "0:29:32", "remaining_time": "1 day, 8:16:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 164, "total_steps": 10853, "loss": 0.2343, "learning_rate": 1.5101289134438308e-06, "epoch": 0.01511033307228083, "percentage": 1.51, "elapsed_time": "0:29:42", "remaining_time": "1 day, 8:16:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 165, "total_steps": 10853, "loss": 0.2271, "learning_rate": 1.5193370165745857e-06, "epoch": 0.015202469249550836, "percentage": 1.52, "elapsed_time": "0:29:54", "remaining_time": "1 day, 8:17:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 166, "total_steps": 10853, "loss": 0.221, "learning_rate": 1.5285451197053408e-06, "epoch": 0.015294605426820842, "percentage": 1.53, "elapsed_time": "0:30:05", "remaining_time": "1 day, 8:17:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 167, "total_steps": 10853, "loss": 0.2053, "learning_rate": 1.537753222836096e-06, "epoch": 0.015386741604090846, "percentage": 1.54, "elapsed_time": "0:30:15", "remaining_time": "1 day, 8:15:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 168, "total_steps": 10853, "loss": 0.2051, "learning_rate": 1.5469613259668508e-06, "epoch": 0.015478877781360851, "percentage": 1.55, "elapsed_time": "0:30:24", "remaining_time": "1 day, 8:14:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 169, "total_steps": 10853, "loss": 0.2238, "learning_rate": 1.556169429097606e-06, "epoch": 0.015571013958630857, "percentage": 1.56, "elapsed_time": "0:30:36", "remaining_time": "1 day, 8:14:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 170, "total_steps": 10853, "loss": 0.2422, "learning_rate": 1.565377532228361e-06, "epoch": 0.01566315013590086, "percentage": 1.57, "elapsed_time": "0:30:46", "remaining_time": "1 day, 8:13:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 171, "total_steps": 10853, "loss": 0.211, "learning_rate": 1.574585635359116e-06, "epoch": 0.015755286313170868, "percentage": 1.58, "elapsed_time": "0:30:56", "remaining_time": "1 day, 8:12:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 172, "total_steps": 10853, "loss": 0.2124, "learning_rate": 1.5837937384898713e-06, "epoch": 0.015847422490440872, "percentage": 1.58, "elapsed_time": "0:31:07", "remaining_time": "1 day, 8:12:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 173, "total_steps": 10853, "loss": 0.2183, "learning_rate": 1.5930018416206264e-06, "epoch": 0.015939558667710876, "percentage": 1.59, "elapsed_time": "0:31:17", "remaining_time": "1 day, 8:11:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 174, "total_steps": 10853, "loss": 0.2236, "learning_rate": 1.6022099447513815e-06, "epoch": 0.016031694844980883, "percentage": 1.6, "elapsed_time": "0:31:28", "remaining_time": "1 day, 8:12:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 175, "total_steps": 10853, "loss": 0.2141, "learning_rate": 1.6114180478821364e-06, "epoch": 0.016123831022250887, "percentage": 1.61, "elapsed_time": "0:31:39", "remaining_time": "1 day, 8:11:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 176, "total_steps": 10853, "loss": 0.2423, "learning_rate": 1.6206261510128915e-06, "epoch": 0.01621596719952089, "percentage": 1.62, "elapsed_time": "0:31:50", "remaining_time": "1 day, 8:11:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 177, "total_steps": 10853, "loss": 0.2346, "learning_rate": 1.6298342541436466e-06, "epoch": 0.016308103376790898, "percentage": 1.63, "elapsed_time": "0:32:00", "remaining_time": "1 day, 8:10:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 178, "total_steps": 10853, "loss": 0.2506, "learning_rate": 1.6390423572744015e-06, "epoch": 0.016400239554060902, "percentage": 1.64, "elapsed_time": "0:32:11", "remaining_time": "1 day, 8:10:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 179, "total_steps": 10853, "loss": 0.2216, "learning_rate": 1.6482504604051566e-06, "epoch": 0.016492375731330906, "percentage": 1.65, "elapsed_time": "0:32:22", "remaining_time": "1 day, 8:10:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 180, "total_steps": 10853, "loss": 0.2348, "learning_rate": 1.6574585635359118e-06, "epoch": 0.016584511908600913, "percentage": 1.66, "elapsed_time": "0:32:33", "remaining_time": "1 day, 8:10:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 181, "total_steps": 10853, "loss": 0.2321, "learning_rate": 1.6666666666666667e-06, "epoch": 0.016676648085870917, "percentage": 1.67, "elapsed_time": "0:32:44", "remaining_time": "1 day, 8:10:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 182, "total_steps": 10853, "loss": 0.2443, "learning_rate": 1.6758747697974218e-06, "epoch": 0.01676878426314092, "percentage": 1.68, "elapsed_time": "0:32:55", "remaining_time": "1 day, 8:10:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 183, "total_steps": 10853, "loss": 0.2121, "learning_rate": 1.685082872928177e-06, "epoch": 0.016860920440410928, "percentage": 1.69, "elapsed_time": "0:33:06", "remaining_time": "1 day, 8:10:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 184, "total_steps": 10853, "loss": 0.2287, "learning_rate": 1.6942909760589322e-06, "epoch": 0.016953056617680932, "percentage": 1.7, "elapsed_time": "0:33:16", "remaining_time": "1 day, 8:09:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 185, "total_steps": 10853, "loss": 0.2049, "learning_rate": 1.7034990791896871e-06, "epoch": 0.01704519279495094, "percentage": 1.7, "elapsed_time": "0:33:27", "remaining_time": "1 day, 8:09:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 186, "total_steps": 10853, "loss": 0.2424, "learning_rate": 1.7127071823204422e-06, "epoch": 0.017137328972220943, "percentage": 1.71, "elapsed_time": "0:33:37", "remaining_time": "1 day, 8:08:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 187, "total_steps": 10853, "loss": 0.2227, "learning_rate": 1.7219152854511971e-06, "epoch": 0.017229465149490947, "percentage": 1.72, "elapsed_time": "0:33:49", "remaining_time": "1 day, 8:08:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 188, "total_steps": 10853, "loss": 0.2431, "learning_rate": 1.7311233885819523e-06, "epoch": 0.017321601326760954, "percentage": 1.73, "elapsed_time": "0:34:00", "remaining_time": "1 day, 8:09:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 189, "total_steps": 10853, "loss": 0.2179, "learning_rate": 1.7403314917127074e-06, "epoch": 0.017413737504030958, "percentage": 1.74, "elapsed_time": "0:34:10", "remaining_time": "1 day, 8:08:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 190, "total_steps": 10853, "loss": 0.2518, "learning_rate": 1.7495395948434623e-06, "epoch": 0.017505873681300962, "percentage": 1.75, "elapsed_time": "0:34:22", "remaining_time": "1 day, 8:09:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 191, "total_steps": 10853, "loss": 0.2519, "learning_rate": 1.7587476979742174e-06, "epoch": 0.01759800985857097, "percentage": 1.76, "elapsed_time": "0:34:32", "remaining_time": "1 day, 8:08:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 192, "total_steps": 10853, "loss": 0.2122, "learning_rate": 1.7679558011049725e-06, "epoch": 0.017690146035840973, "percentage": 1.77, "elapsed_time": "0:34:44", "remaining_time": "1 day, 8:08:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 193, "total_steps": 10853, "loss": 0.218, "learning_rate": 1.7771639042357274e-06, "epoch": 0.017782282213110977, "percentage": 1.78, "elapsed_time": "0:34:56", "remaining_time": "1 day, 8:09:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 194, "total_steps": 10853, "loss": 0.2275, "learning_rate": 1.7863720073664825e-06, "epoch": 0.017874418390380984, "percentage": 1.79, "elapsed_time": "0:35:07", "remaining_time": "1 day, 8:09:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 195, "total_steps": 10853, "loss": 0.2265, "learning_rate": 1.7955801104972378e-06, "epoch": 0.017966554567650988, "percentage": 1.8, "elapsed_time": "0:35:19", "remaining_time": "1 day, 8:10:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 196, "total_steps": 10853, "loss": 0.2106, "learning_rate": 1.804788213627993e-06, "epoch": 0.01805869074492099, "percentage": 1.81, "elapsed_time": "0:35:29", "remaining_time": "1 day, 8:10:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 197, "total_steps": 10853, "loss": 0.2421, "learning_rate": 1.8139963167587479e-06, "epoch": 0.018150826922191, "percentage": 1.82, "elapsed_time": "0:35:40", "remaining_time": "1 day, 8:09:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 198, "total_steps": 10853, "loss": 0.2258, "learning_rate": 1.823204419889503e-06, "epoch": 0.018242963099461003, "percentage": 1.82, "elapsed_time": "0:35:50", "remaining_time": "1 day, 8:09:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 199, "total_steps": 10853, "loss": 0.2086, "learning_rate": 1.832412523020258e-06, "epoch": 0.018335099276731007, "percentage": 1.83, "elapsed_time": "0:36:00", "remaining_time": "1 day, 8:08:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 200, "total_steps": 10853, "loss": 0.2129, "learning_rate": 1.841620626151013e-06, "epoch": 0.018427235454001014, "percentage": 1.84, "elapsed_time": "0:36:12", "remaining_time": "1 day, 8:08:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 201, "total_steps": 10853, "loss": 0.2191, "learning_rate": 1.8508287292817681e-06, "epoch": 0.018519371631271018, "percentage": 1.85, "elapsed_time": "0:36:23", "remaining_time": "1 day, 8:08:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 202, "total_steps": 10853, "loss": 0.2061, "learning_rate": 1.8600368324125232e-06, "epoch": 0.018611507808541025, "percentage": 1.86, "elapsed_time": "0:36:33", "remaining_time": "1 day, 8:07:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 203, "total_steps": 10853, "loss": 0.2277, "learning_rate": 1.8692449355432781e-06, "epoch": 0.01870364398581103, "percentage": 1.87, "elapsed_time": "0:36:44", "remaining_time": "1 day, 8:07:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 204, "total_steps": 10853, "loss": 0.2065, "learning_rate": 1.8784530386740332e-06, "epoch": 0.018795780163081033, "percentage": 1.88, "elapsed_time": "0:36:54", "remaining_time": "1 day, 8:06:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 205, "total_steps": 10853, "loss": 0.2117, "learning_rate": 1.8876611418047884e-06, "epoch": 0.01888791634035104, "percentage": 1.89, "elapsed_time": "0:37:04", "remaining_time": "1 day, 8:06:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 206, "total_steps": 10853, "loss": 0.2241, "learning_rate": 1.8968692449355433e-06, "epoch": 0.018980052517621044, "percentage": 1.9, "elapsed_time": "0:37:15", "remaining_time": "1 day, 8:05:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 207, "total_steps": 10853, "loss": 0.2394, "learning_rate": 1.9060773480662986e-06, "epoch": 0.019072188694891048, "percentage": 1.91, "elapsed_time": "0:37:26", "remaining_time": "1 day, 8:05:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 208, "total_steps": 10853, "loss": 0.2147, "learning_rate": 1.9152854511970537e-06, "epoch": 0.019164324872161055, "percentage": 1.92, "elapsed_time": "0:37:36", "remaining_time": "1 day, 8:04:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 209, "total_steps": 10853, "loss": 0.2454, "learning_rate": 1.9244935543278086e-06, "epoch": 0.01925646104943106, "percentage": 1.93, "elapsed_time": "0:37:48", "remaining_time": "1 day, 8:05:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 210, "total_steps": 10853, "loss": 0.2281, "learning_rate": 1.933701657458564e-06, "epoch": 0.019348597226701063, "percentage": 1.93, "elapsed_time": "0:38:00", "remaining_time": "1 day, 8:06:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 211, "total_steps": 10853, "loss": 0.2011, "learning_rate": 1.942909760589319e-06, "epoch": 0.01944073340397107, "percentage": 1.94, "elapsed_time": "0:38:10", "remaining_time": "1 day, 8:05:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 212, "total_steps": 10853, "loss": 0.2198, "learning_rate": 1.9521178637200737e-06, "epoch": 0.019532869581241074, "percentage": 1.95, "elapsed_time": "0:38:21", "remaining_time": "1 day, 8:04:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 213, "total_steps": 10853, "loss": 0.2174, "learning_rate": 1.961325966850829e-06, "epoch": 0.019625005758511078, "percentage": 1.96, "elapsed_time": "0:38:32", "remaining_time": "1 day, 8:05:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 214, "total_steps": 10853, "loss": 0.2225, "learning_rate": 1.970534069981584e-06, "epoch": 0.019717141935781085, "percentage": 1.97, "elapsed_time": "0:38:42", "remaining_time": "1 day, 8:04:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 215, "total_steps": 10853, "loss": 0.2267, "learning_rate": 1.979742173112339e-06, "epoch": 0.01980927811305109, "percentage": 1.98, "elapsed_time": "0:38:52", "remaining_time": "1 day, 8:03:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 216, "total_steps": 10853, "loss": 0.2297, "learning_rate": 1.988950276243094e-06, "epoch": 0.019901414290321096, "percentage": 1.99, "elapsed_time": "0:39:04", "remaining_time": "1 day, 8:04:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 217, "total_steps": 10853, "loss": 0.2181, "learning_rate": 1.998158379373849e-06, "epoch": 0.0199935504675911, "percentage": 2.0, "elapsed_time": "0:39:15", "remaining_time": "1 day, 8:04:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 218, "total_steps": 10853, "loss": 0.2397, "learning_rate": 2.007366482504604e-06, "epoch": 0.020085686644861104, "percentage": 2.01, "elapsed_time": "0:39:27", "remaining_time": "1 day, 8:04:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 219, "total_steps": 10853, "loss": 0.2253, "learning_rate": 2.0165745856353593e-06, "epoch": 0.02017782282213111, "percentage": 2.02, "elapsed_time": "0:39:37", "remaining_time": "1 day, 8:03:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 220, "total_steps": 10853, "loss": 0.2252, "learning_rate": 2.0257826887661147e-06, "epoch": 0.020269958999401115, "percentage": 2.03, "elapsed_time": "0:39:47", "remaining_time": "1 day, 8:02:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 221, "total_steps": 10853, "loss": 0.2278, "learning_rate": 2.0349907918968696e-06, "epoch": 0.02036209517667112, "percentage": 2.04, "elapsed_time": "0:39:57", "remaining_time": "1 day, 8:02:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 222, "total_steps": 10853, "loss": 0.2124, "learning_rate": 2.0441988950276245e-06, "epoch": 0.020454231353941126, "percentage": 2.05, "elapsed_time": "0:40:09", "remaining_time": "1 day, 8:02:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 223, "total_steps": 10853, "loss": 0.2216, "learning_rate": 2.0534069981583794e-06, "epoch": 0.02054636753121113, "percentage": 2.05, "elapsed_time": "0:40:20", "remaining_time": "1 day, 8:03:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 224, "total_steps": 10853, "loss": 0.222, "learning_rate": 2.0626151012891347e-06, "epoch": 0.020638503708481134, "percentage": 2.06, "elapsed_time": "0:40:30", "remaining_time": "1 day, 8:02:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 225, "total_steps": 10853, "loss": 0.2043, "learning_rate": 2.0718232044198896e-06, "epoch": 0.02073063988575114, "percentage": 2.07, "elapsed_time": "0:40:41", "remaining_time": "1 day, 8:02:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 226, "total_steps": 10853, "loss": 0.222, "learning_rate": 2.0810313075506445e-06, "epoch": 0.020822776063021145, "percentage": 2.08, "elapsed_time": "0:40:53", "remaining_time": "1 day, 8:02:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 227, "total_steps": 10853, "loss": 0.2425, "learning_rate": 2.0902394106814e-06, "epoch": 0.02091491224029115, "percentage": 2.09, "elapsed_time": "0:41:04", "remaining_time": "1 day, 8:02:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 228, "total_steps": 10853, "loss": 0.223, "learning_rate": 2.0994475138121547e-06, "epoch": 0.021007048417561156, "percentage": 2.1, "elapsed_time": "0:41:15", "remaining_time": "1 day, 8:02:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 229, "total_steps": 10853, "loss": 0.2223, "learning_rate": 2.1086556169429096e-06, "epoch": 0.02109918459483116, "percentage": 2.11, "elapsed_time": "0:41:25", "remaining_time": "1 day, 8:01:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 230, "total_steps": 10853, "loss": 0.223, "learning_rate": 2.117863720073665e-06, "epoch": 0.021191320772101164, "percentage": 2.12, "elapsed_time": "0:41:34", "remaining_time": "1 day, 8:00:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 231, "total_steps": 10853, "loss": 0.2088, "learning_rate": 2.1270718232044203e-06, "epoch": 0.02128345694937117, "percentage": 2.13, "elapsed_time": "0:41:45", "remaining_time": "1 day, 7:59:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 232, "total_steps": 10853, "loss": 0.2183, "learning_rate": 2.136279926335175e-06, "epoch": 0.021375593126641175, "percentage": 2.14, "elapsed_time": "0:41:56", "remaining_time": "1 day, 8:00:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 233, "total_steps": 10853, "loss": 0.2218, "learning_rate": 2.14548802946593e-06, "epoch": 0.021467729303911182, "percentage": 2.15, "elapsed_time": "0:42:07", "remaining_time": "1 day, 7:59:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 234, "total_steps": 10853, "loss": 0.2167, "learning_rate": 2.1546961325966854e-06, "epoch": 0.021559865481181186, "percentage": 2.16, "elapsed_time": "0:42:18", "remaining_time": "1 day, 7:59:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 235, "total_steps": 10853, "loss": 0.2378, "learning_rate": 2.1639042357274403e-06, "epoch": 0.02165200165845119, "percentage": 2.17, "elapsed_time": "0:42:29", "remaining_time": "1 day, 8:00:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 236, "total_steps": 10853, "loss": 0.2294, "learning_rate": 2.1731123388581952e-06, "epoch": 0.021744137835721197, "percentage": 2.17, "elapsed_time": "0:42:40", "remaining_time": "1 day, 7:59:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 237, "total_steps": 10853, "loss": 0.1968, "learning_rate": 2.1823204419889505e-06, "epoch": 0.0218362740129912, "percentage": 2.18, "elapsed_time": "0:42:50", "remaining_time": "1 day, 7:59:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 238, "total_steps": 10853, "loss": 0.2228, "learning_rate": 2.1915285451197054e-06, "epoch": 0.021928410190261205, "percentage": 2.19, "elapsed_time": "0:43:02", "remaining_time": "1 day, 7:59:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 239, "total_steps": 10853, "loss": 0.224, "learning_rate": 2.2007366482504604e-06, "epoch": 0.022020546367531212, "percentage": 2.2, "elapsed_time": "0:43:12", "remaining_time": "1 day, 7:59:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 240, "total_steps": 10853, "loss": 0.2334, "learning_rate": 2.2099447513812157e-06, "epoch": 0.022112682544801216, "percentage": 2.21, "elapsed_time": "0:43:23", "remaining_time": "1 day, 7:58:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 241, "total_steps": 10853, "loss": 0.207, "learning_rate": 2.2191528545119706e-06, "epoch": 0.02220481872207122, "percentage": 2.22, "elapsed_time": "0:43:34", "remaining_time": "1 day, 7:58:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 242, "total_steps": 10853, "loss": 0.2236, "learning_rate": 2.228360957642726e-06, "epoch": 0.022296954899341227, "percentage": 2.23, "elapsed_time": "0:43:44", "remaining_time": "1 day, 7:57:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 243, "total_steps": 10853, "loss": 0.2244, "learning_rate": 2.237569060773481e-06, "epoch": 0.02238909107661123, "percentage": 2.24, "elapsed_time": "0:43:55", "remaining_time": "1 day, 7:57:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 244, "total_steps": 10853, "loss": 0.2098, "learning_rate": 2.246777163904236e-06, "epoch": 0.022481227253881235, "percentage": 2.25, "elapsed_time": "0:44:05", "remaining_time": "1 day, 7:57:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 245, "total_steps": 10853, "loss": 0.2038, "learning_rate": 2.255985267034991e-06, "epoch": 0.022573363431151242, "percentage": 2.26, "elapsed_time": "0:44:16", "remaining_time": "1 day, 7:57:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 246, "total_steps": 10853, "loss": 0.221, "learning_rate": 2.265193370165746e-06, "epoch": 0.022665499608421246, "percentage": 2.27, "elapsed_time": "0:44:27", "remaining_time": "1 day, 7:56:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 247, "total_steps": 10853, "loss": 0.2059, "learning_rate": 2.2744014732965013e-06, "epoch": 0.022757635785691253, "percentage": 2.28, "elapsed_time": "0:44:36", "remaining_time": "1 day, 7:55:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 248, "total_steps": 10853, "loss": 0.2116, "learning_rate": 2.283609576427256e-06, "epoch": 0.022849771962961257, "percentage": 2.29, "elapsed_time": "0:44:46", "remaining_time": "1 day, 7:54:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 249, "total_steps": 10853, "loss": 0.2044, "learning_rate": 2.292817679558011e-06, "epoch": 0.02294190814023126, "percentage": 2.29, "elapsed_time": "0:44:58", "remaining_time": "1 day, 7:55:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 250, "total_steps": 10853, "loss": 0.2265, "learning_rate": 2.3020257826887664e-06, "epoch": 0.02303404431750127, "percentage": 2.3, "elapsed_time": "0:45:09", "remaining_time": "1 day, 7:55:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 251, "total_steps": 10853, "loss": 0.2098, "learning_rate": 2.3112338858195213e-06, "epoch": 0.023126180494771272, "percentage": 2.31, "elapsed_time": "0:45:20", "remaining_time": "1 day, 7:55:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 252, "total_steps": 10853, "loss": 0.2274, "learning_rate": 2.320441988950276e-06, "epoch": 0.023218316672041276, "percentage": 2.32, "elapsed_time": "0:45:32", "remaining_time": "1 day, 7:55:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 253, "total_steps": 10853, "loss": 0.203, "learning_rate": 2.3296500920810315e-06, "epoch": 0.023310452849311283, "percentage": 2.33, "elapsed_time": "0:45:41", "remaining_time": "1 day, 7:54:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 254, "total_steps": 10853, "loss": 0.2124, "learning_rate": 2.338858195211787e-06, "epoch": 0.023402589026581287, "percentage": 2.34, "elapsed_time": "0:45:52", "remaining_time": "1 day, 7:53:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 255, "total_steps": 10853, "loss": 0.2284, "learning_rate": 2.3480662983425418e-06, "epoch": 0.02349472520385129, "percentage": 2.35, "elapsed_time": "0:46:01", "remaining_time": "1 day, 7:52:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 256, "total_steps": 10853, "loss": 0.2212, "learning_rate": 2.3572744014732967e-06, "epoch": 0.0235868613811213, "percentage": 2.36, "elapsed_time": "0:46:12", "remaining_time": "1 day, 7:52:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 257, "total_steps": 10853, "loss": 0.2158, "learning_rate": 2.366482504604052e-06, "epoch": 0.023678997558391302, "percentage": 2.37, "elapsed_time": "0:46:23", "remaining_time": "1 day, 7:52:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 258, "total_steps": 10853, "loss": 0.2223, "learning_rate": 2.375690607734807e-06, "epoch": 0.023771133735661306, "percentage": 2.38, "elapsed_time": "0:46:33", "remaining_time": "1 day, 7:52:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 259, "total_steps": 10853, "loss": 0.2355, "learning_rate": 2.384898710865562e-06, "epoch": 0.023863269912931313, "percentage": 2.39, "elapsed_time": "0:46:45", "remaining_time": "1 day, 7:52:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 260, "total_steps": 10853, "loss": 0.2093, "learning_rate": 2.394106813996317e-06, "epoch": 0.023955406090201317, "percentage": 2.4, "elapsed_time": "0:46:56", "remaining_time": "1 day, 7:52:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 261, "total_steps": 10853, "loss": 0.2299, "learning_rate": 2.403314917127072e-06, "epoch": 0.02404754226747132, "percentage": 2.4, "elapsed_time": "0:47:07", "remaining_time": "1 day, 7:52:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 262, "total_steps": 10853, "loss": 0.2235, "learning_rate": 2.412523020257827e-06, "epoch": 0.02413967844474133, "percentage": 2.41, "elapsed_time": "0:47:18", "remaining_time": "1 day, 7:52:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 263, "total_steps": 10853, "loss": 0.2314, "learning_rate": 2.4217311233885823e-06, "epoch": 0.024231814622011332, "percentage": 2.42, "elapsed_time": "0:47:31", "remaining_time": "1 day, 7:53:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 264, "total_steps": 10853, "loss": 0.192, "learning_rate": 2.430939226519337e-06, "epoch": 0.02432395079928134, "percentage": 2.43, "elapsed_time": "0:47:40", "remaining_time": "1 day, 7:52:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 265, "total_steps": 10853, "loss": 0.2218, "learning_rate": 2.440147329650092e-06, "epoch": 0.024416086976551343, "percentage": 2.44, "elapsed_time": "0:47:51", "remaining_time": "1 day, 7:52:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 266, "total_steps": 10853, "loss": 0.2003, "learning_rate": 2.4493554327808474e-06, "epoch": 0.024508223153821347, "percentage": 2.45, "elapsed_time": "0:48:01", "remaining_time": "1 day, 7:51:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 267, "total_steps": 10853, "loss": 0.2036, "learning_rate": 2.4585635359116027e-06, "epoch": 0.024600359331091354, "percentage": 2.46, "elapsed_time": "0:48:11", "remaining_time": "1 day, 7:50:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 268, "total_steps": 10853, "loss": 0.2168, "learning_rate": 2.4677716390423576e-06, "epoch": 0.02469249550836136, "percentage": 2.47, "elapsed_time": "0:48:22", "remaining_time": "1 day, 7:50:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 269, "total_steps": 10853, "loss": 0.2164, "learning_rate": 2.4769797421731125e-06, "epoch": 0.024784631685631362, "percentage": 2.48, "elapsed_time": "0:48:33", "remaining_time": "1 day, 7:50:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 270, "total_steps": 10853, "loss": 0.2136, "learning_rate": 2.486187845303868e-06, "epoch": 0.02487676786290137, "percentage": 2.49, "elapsed_time": "0:48:43", "remaining_time": "1 day, 7:49:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 271, "total_steps": 10853, "loss": 0.2217, "learning_rate": 2.4953959484346228e-06, "epoch": 0.024968904040171373, "percentage": 2.5, "elapsed_time": "0:48:54", "remaining_time": "1 day, 7:49:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 272, "total_steps": 10853, "loss": 0.2018, "learning_rate": 2.504604051565378e-06, "epoch": 0.025061040217441377, "percentage": 2.51, "elapsed_time": "0:49:05", "remaining_time": "1 day, 7:49:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 273, "total_steps": 10853, "loss": 0.2315, "learning_rate": 2.513812154696133e-06, "epoch": 0.025153176394711384, "percentage": 2.52, "elapsed_time": "0:49:15", "remaining_time": "1 day, 7:49:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 274, "total_steps": 10853, "loss": 0.2087, "learning_rate": 2.523020257826888e-06, "epoch": 0.025245312571981388, "percentage": 2.52, "elapsed_time": "0:49:27", "remaining_time": "1 day, 7:49:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 275, "total_steps": 10853, "loss": 0.2127, "learning_rate": 2.5322283609576432e-06, "epoch": 0.025337448749251392, "percentage": 2.53, "elapsed_time": "0:49:37", "remaining_time": "1 day, 7:48:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 276, "total_steps": 10853, "loss": 0.1973, "learning_rate": 2.541436464088398e-06, "epoch": 0.0254295849265214, "percentage": 2.54, "elapsed_time": "0:49:48", "remaining_time": "1 day, 7:48:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 277, "total_steps": 10853, "loss": 0.2099, "learning_rate": 2.550644567219153e-06, "epoch": 0.025521721103791403, "percentage": 2.55, "elapsed_time": "0:49:58", "remaining_time": "1 day, 7:47:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 278, "total_steps": 10853, "loss": 0.2243, "learning_rate": 2.5598526703499083e-06, "epoch": 0.025613857281061407, "percentage": 2.56, "elapsed_time": "0:50:08", "remaining_time": "1 day, 7:47:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 279, "total_steps": 10853, "loss": 0.2204, "learning_rate": 2.5690607734806632e-06, "epoch": 0.025705993458331414, "percentage": 2.57, "elapsed_time": "0:50:19", "remaining_time": "1 day, 7:47:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 280, "total_steps": 10853, "loss": 0.2211, "learning_rate": 2.578268876611418e-06, "epoch": 0.025798129635601418, "percentage": 2.58, "elapsed_time": "0:50:30", "remaining_time": "1 day, 7:47:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 281, "total_steps": 10853, "loss": 0.1965, "learning_rate": 2.5874769797421735e-06, "epoch": 0.025890265812871426, "percentage": 2.59, "elapsed_time": "0:50:42", "remaining_time": "1 day, 7:47:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 282, "total_steps": 10853, "loss": 0.2134, "learning_rate": 2.5966850828729284e-06, "epoch": 0.02598240199014143, "percentage": 2.6, "elapsed_time": "0:50:51", "remaining_time": "1 day, 7:46:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 283, "total_steps": 10853, "loss": 0.2039, "learning_rate": 2.6058931860036833e-06, "epoch": 0.026074538167411433, "percentage": 2.61, "elapsed_time": "0:51:01", "remaining_time": "1 day, 7:45:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 284, "total_steps": 10853, "loss": 0.2091, "learning_rate": 2.6151012891344386e-06, "epoch": 0.02616667434468144, "percentage": 2.62, "elapsed_time": "0:51:12", "remaining_time": "1 day, 7:45:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 285, "total_steps": 10853, "loss": 0.2127, "learning_rate": 2.6243093922651935e-06, "epoch": 0.026258810521951444, "percentage": 2.63, "elapsed_time": "0:51:22", "remaining_time": "1 day, 7:45:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 286, "total_steps": 10853, "loss": 0.2134, "learning_rate": 2.6335174953959484e-06, "epoch": 0.026350946699221448, "percentage": 2.64, "elapsed_time": "0:51:34", "remaining_time": "1 day, 7:45:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 287, "total_steps": 10853, "loss": 0.2229, "learning_rate": 2.6427255985267037e-06, "epoch": 0.026443082876491456, "percentage": 2.64, "elapsed_time": "0:51:45", "remaining_time": "1 day, 7:45:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 288, "total_steps": 10853, "loss": 0.2292, "learning_rate": 2.6519337016574586e-06, "epoch": 0.02653521905376146, "percentage": 2.65, "elapsed_time": "0:51:55", "remaining_time": "1 day, 7:44:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 289, "total_steps": 10853, "loss": 0.22, "learning_rate": 2.6611418047882135e-06, "epoch": 0.026627355231031463, "percentage": 2.66, "elapsed_time": "0:52:07", "remaining_time": "1 day, 7:45:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 290, "total_steps": 10853, "loss": 0.2194, "learning_rate": 2.670349907918969e-06, "epoch": 0.02671949140830147, "percentage": 2.67, "elapsed_time": "0:52:17", "remaining_time": "1 day, 7:44:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 291, "total_steps": 10853, "loss": 0.2239, "learning_rate": 2.6795580110497238e-06, "epoch": 0.026811627585571474, "percentage": 2.68, "elapsed_time": "0:52:28", "remaining_time": "1 day, 7:44:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 292, "total_steps": 10853, "loss": 0.2141, "learning_rate": 2.6887661141804787e-06, "epoch": 0.026903763762841478, "percentage": 2.69, "elapsed_time": "0:52:39", "remaining_time": "1 day, 7:44:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 293, "total_steps": 10853, "loss": 0.2224, "learning_rate": 2.697974217311234e-06, "epoch": 0.026995899940111485, "percentage": 2.7, "elapsed_time": "0:52:50", "remaining_time": "1 day, 7:44:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 294, "total_steps": 10853, "loss": 0.2214, "learning_rate": 2.707182320441989e-06, "epoch": 0.02708803611738149, "percentage": 2.71, "elapsed_time": "0:53:01", "remaining_time": "1 day, 7:44:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 295, "total_steps": 10853, "loss": 0.2179, "learning_rate": 2.716390423572744e-06, "epoch": 0.027180172294651497, "percentage": 2.72, "elapsed_time": "0:53:12", "remaining_time": "1 day, 7:44:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 296, "total_steps": 10853, "loss": 0.2196, "learning_rate": 2.7255985267034996e-06, "epoch": 0.0272723084719215, "percentage": 2.73, "elapsed_time": "0:53:24", "remaining_time": "1 day, 7:44:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 297, "total_steps": 10853, "loss": 0.2201, "learning_rate": 2.7348066298342545e-06, "epoch": 0.027364444649191504, "percentage": 2.74, "elapsed_time": "0:53:34", "remaining_time": "1 day, 7:44:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 298, "total_steps": 10853, "loss": 0.2109, "learning_rate": 2.74401473296501e-06, "epoch": 0.02745658082646151, "percentage": 2.75, "elapsed_time": "0:53:44", "remaining_time": "1 day, 7:43:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 299, "total_steps": 10853, "loss": 0.22, "learning_rate": 2.7532228360957647e-06, "epoch": 0.027548717003731515, "percentage": 2.75, "elapsed_time": "0:53:55", "remaining_time": "1 day, 7:43:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 300, "total_steps": 10853, "loss": 0.2002, "learning_rate": 2.7624309392265196e-06, "epoch": 0.02764085318100152, "percentage": 2.76, "elapsed_time": "0:54:06", "remaining_time": "1 day, 7:43:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 301, "total_steps": 10853, "loss": 0.2016, "learning_rate": 2.771639042357275e-06, "epoch": 0.027732989358271527, "percentage": 2.77, "elapsed_time": "0:54:17", "remaining_time": "1 day, 7:43:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 302, "total_steps": 10853, "loss": 0.2001, "learning_rate": 2.78084714548803e-06, "epoch": 0.02782512553554153, "percentage": 2.78, "elapsed_time": "0:54:27", "remaining_time": "1 day, 7:42:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 303, "total_steps": 10853, "loss": 0.2034, "learning_rate": 2.7900552486187847e-06, "epoch": 0.027917261712811534, "percentage": 2.79, "elapsed_time": "0:54:38", "remaining_time": "1 day, 7:42:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 304, "total_steps": 10853, "loss": 0.2161, "learning_rate": 2.79926335174954e-06, "epoch": 0.02800939789008154, "percentage": 2.8, "elapsed_time": "0:54:48", "remaining_time": "1 day, 7:42:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 305, "total_steps": 10853, "loss": 0.1892, "learning_rate": 2.808471454880295e-06, "epoch": 0.028101534067351545, "percentage": 2.81, "elapsed_time": "0:54:59", "remaining_time": "1 day, 7:41:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 306, "total_steps": 10853, "loss": 0.2128, "learning_rate": 2.81767955801105e-06, "epoch": 0.02819367024462155, "percentage": 2.82, "elapsed_time": "0:55:09", "remaining_time": "1 day, 7:41:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 307, "total_steps": 10853, "loss": 0.22, "learning_rate": 2.826887661141805e-06, "epoch": 0.028285806421891557, "percentage": 2.83, "elapsed_time": "0:55:19", "remaining_time": "1 day, 7:40:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 308, "total_steps": 10853, "loss": 0.1904, "learning_rate": 2.83609576427256e-06, "epoch": 0.02837794259916156, "percentage": 2.84, "elapsed_time": "0:55:30", "remaining_time": "1 day, 7:40:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 309, "total_steps": 10853, "loss": 0.2057, "learning_rate": 2.845303867403315e-06, "epoch": 0.028470078776431564, "percentage": 2.85, "elapsed_time": "0:55:41", "remaining_time": "1 day, 7:40:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 310, "total_steps": 10853, "loss": 0.2165, "learning_rate": 2.8545119705340703e-06, "epoch": 0.02856221495370157, "percentage": 2.86, "elapsed_time": "0:55:51", "remaining_time": "1 day, 7:39:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 311, "total_steps": 10853, "loss": 0.2277, "learning_rate": 2.8637200736648252e-06, "epoch": 0.028654351130971575, "percentage": 2.87, "elapsed_time": "0:56:03", "remaining_time": "1 day, 7:40:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 312, "total_steps": 10853, "loss": 0.2047, "learning_rate": 2.87292817679558e-06, "epoch": 0.028746487308241583, "percentage": 2.87, "elapsed_time": "0:56:14", "remaining_time": "1 day, 7:39:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 313, "total_steps": 10853, "loss": 0.2256, "learning_rate": 2.8821362799263355e-06, "epoch": 0.028838623485511587, "percentage": 2.88, "elapsed_time": "0:56:24", "remaining_time": "1 day, 7:39:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 314, "total_steps": 10853, "loss": 0.2202, "learning_rate": 2.8913443830570904e-06, "epoch": 0.02893075966278159, "percentage": 2.89, "elapsed_time": "0:56:34", "remaining_time": "1 day, 7:38:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 315, "total_steps": 10853, "loss": 0.2197, "learning_rate": 2.9005524861878453e-06, "epoch": 0.029022895840051598, "percentage": 2.9, "elapsed_time": "0:56:44", "remaining_time": "1 day, 7:38:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 316, "total_steps": 10853, "loss": 0.2082, "learning_rate": 2.9097605893186006e-06, "epoch": 0.0291150320173216, "percentage": 2.91, "elapsed_time": "0:56:55", "remaining_time": "1 day, 7:38:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 317, "total_steps": 10853, "loss": 0.2061, "learning_rate": 2.9189686924493555e-06, "epoch": 0.029207168194591605, "percentage": 2.92, "elapsed_time": "0:57:05", "remaining_time": "1 day, 7:37:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 318, "total_steps": 10853, "loss": 0.1971, "learning_rate": 2.9281767955801104e-06, "epoch": 0.029299304371861613, "percentage": 2.93, "elapsed_time": "0:57:17", "remaining_time": "1 day, 7:37:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 319, "total_steps": 10853, "loss": 0.2427, "learning_rate": 2.937384898710866e-06, "epoch": 0.029391440549131616, "percentage": 2.94, "elapsed_time": "0:57:27", "remaining_time": "1 day, 7:37:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 320, "total_steps": 10853, "loss": 0.2244, "learning_rate": 2.946593001841621e-06, "epoch": 0.02948357672640162, "percentage": 2.95, "elapsed_time": "0:57:39", "remaining_time": "1 day, 7:37:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 321, "total_steps": 10853, "loss": 0.2265, "learning_rate": 2.955801104972376e-06, "epoch": 0.029575712903671628, "percentage": 2.96, "elapsed_time": "0:57:50", "remaining_time": "1 day, 7:37:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 322, "total_steps": 10853, "loss": 0.2238, "learning_rate": 2.9650092081031313e-06, "epoch": 0.02966784908094163, "percentage": 2.97, "elapsed_time": "0:58:00", "remaining_time": "1 day, 7:37:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 323, "total_steps": 10853, "loss": 0.1929, "learning_rate": 2.974217311233886e-06, "epoch": 0.029759985258211635, "percentage": 2.98, "elapsed_time": "0:58:11", "remaining_time": "1 day, 7:37:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 324, "total_steps": 10853, "loss": 0.2134, "learning_rate": 2.983425414364641e-06, "epoch": 0.029852121435481643, "percentage": 2.99, "elapsed_time": "0:58:23", "remaining_time": "1 day, 7:37:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 325, "total_steps": 10853, "loss": 0.2066, "learning_rate": 2.9926335174953964e-06, "epoch": 0.029944257612751646, "percentage": 2.99, "elapsed_time": "0:58:33", "remaining_time": "1 day, 7:36:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 326, "total_steps": 10853, "loss": 0.1822, "learning_rate": 3.0018416206261513e-06, "epoch": 0.03003639379002165, "percentage": 3.0, "elapsed_time": "0:58:43", "remaining_time": "1 day, 7:36:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 327, "total_steps": 10853, "loss": 0.2225, "learning_rate": 3.0110497237569062e-06, "epoch": 0.030128529967291658, "percentage": 3.01, "elapsed_time": "0:58:55", "remaining_time": "1 day, 7:36:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 328, "total_steps": 10853, "loss": 0.2303, "learning_rate": 3.0202578268876615e-06, "epoch": 0.03022066614456166, "percentage": 3.02, "elapsed_time": "0:59:06", "remaining_time": "1 day, 7:36:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 329, "total_steps": 10853, "loss": 0.2327, "learning_rate": 3.0294659300184164e-06, "epoch": 0.03031280232183167, "percentage": 3.03, "elapsed_time": "0:59:17", "remaining_time": "1 day, 7:36:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 330, "total_steps": 10853, "loss": 0.2113, "learning_rate": 3.0386740331491713e-06, "epoch": 0.030404938499101673, "percentage": 3.04, "elapsed_time": "0:59:26", "remaining_time": "1 day, 7:35:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 331, "total_steps": 10853, "loss": 0.2292, "learning_rate": 3.0478821362799267e-06, "epoch": 0.030497074676371676, "percentage": 3.05, "elapsed_time": "0:59:37", "remaining_time": "1 day, 7:35:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 332, "total_steps": 10853, "loss": 0.2158, "learning_rate": 3.0570902394106816e-06, "epoch": 0.030589210853641684, "percentage": 3.06, "elapsed_time": "0:59:48", "remaining_time": "1 day, 7:35:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 333, "total_steps": 10853, "loss": 0.2161, "learning_rate": 3.0662983425414365e-06, "epoch": 0.030681347030911688, "percentage": 3.07, "elapsed_time": "0:59:59", "remaining_time": "1 day, 7:35:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 334, "total_steps": 10853, "loss": 0.2042, "learning_rate": 3.075506445672192e-06, "epoch": 0.03077348320818169, "percentage": 3.08, "elapsed_time": "1:00:10", "remaining_time": "1 day, 7:35:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 335, "total_steps": 10853, "loss": 0.2221, "learning_rate": 3.0847145488029467e-06, "epoch": 0.0308656193854517, "percentage": 3.09, "elapsed_time": "1:00:22", "remaining_time": "1 day, 7:35:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 336, "total_steps": 10853, "loss": 0.2091, "learning_rate": 3.0939226519337016e-06, "epoch": 0.030957755562721703, "percentage": 3.1, "elapsed_time": "1:00:34", "remaining_time": "1 day, 7:35:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 337, "total_steps": 10853, "loss": 0.22, "learning_rate": 3.103130755064457e-06, "epoch": 0.031049891739991706, "percentage": 3.11, "elapsed_time": "1:00:45", "remaining_time": "1 day, 7:35:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 338, "total_steps": 10853, "loss": 0.2012, "learning_rate": 3.112338858195212e-06, "epoch": 0.031142027917261714, "percentage": 3.11, "elapsed_time": "1:00:56", "remaining_time": "1 day, 7:35:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 339, "total_steps": 10853, "loss": 0.2362, "learning_rate": 3.1215469613259667e-06, "epoch": 0.031234164094531718, "percentage": 3.12, "elapsed_time": "1:01:07", "remaining_time": "1 day, 7:35:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 340, "total_steps": 10853, "loss": 0.2006, "learning_rate": 3.130755064456722e-06, "epoch": 0.03132630027180172, "percentage": 3.13, "elapsed_time": "1:01:17", "remaining_time": "1 day, 7:35:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 341, "total_steps": 10853, "loss": 0.217, "learning_rate": 3.139963167587477e-06, "epoch": 0.031418436449071725, "percentage": 3.14, "elapsed_time": "1:01:27", "remaining_time": "1 day, 7:34:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 342, "total_steps": 10853, "loss": 0.2124, "learning_rate": 3.149171270718232e-06, "epoch": 0.031510572626341736, "percentage": 3.15, "elapsed_time": "1:01:39", "remaining_time": "1 day, 7:34:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 343, "total_steps": 10853, "loss": 0.2098, "learning_rate": 3.1583793738489876e-06, "epoch": 0.03160270880361174, "percentage": 3.16, "elapsed_time": "1:01:49", "remaining_time": "1 day, 7:34:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 344, "total_steps": 10853, "loss": 0.2314, "learning_rate": 3.1675874769797425e-06, "epoch": 0.031694844980881744, "percentage": 3.17, "elapsed_time": "1:02:00", "remaining_time": "1 day, 7:34:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 345, "total_steps": 10853, "loss": 0.1965, "learning_rate": 3.176795580110498e-06, "epoch": 0.03178698115815175, "percentage": 3.18, "elapsed_time": "1:02:11", "remaining_time": "1 day, 7:34:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 346, "total_steps": 10853, "loss": 0.2225, "learning_rate": 3.1860036832412528e-06, "epoch": 0.03187911733542175, "percentage": 3.19, "elapsed_time": "1:02:22", "remaining_time": "1 day, 7:34:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 347, "total_steps": 10853, "loss": 0.2206, "learning_rate": 3.1952117863720077e-06, "epoch": 0.031971253512691755, "percentage": 3.2, "elapsed_time": "1:02:33", "remaining_time": "1 day, 7:33:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 348, "total_steps": 10853, "loss": 0.2035, "learning_rate": 3.204419889502763e-06, "epoch": 0.032063389689961766, "percentage": 3.21, "elapsed_time": "1:02:42", "remaining_time": "1 day, 7:33:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 349, "total_steps": 10853, "loss": 0.2145, "learning_rate": 3.213627992633518e-06, "epoch": 0.03215552586723177, "percentage": 3.22, "elapsed_time": "1:02:53", "remaining_time": "1 day, 7:32:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 350, "total_steps": 10853, "loss": 0.2112, "learning_rate": 3.222836095764273e-06, "epoch": 0.032247662044501774, "percentage": 3.22, "elapsed_time": "1:03:02", "remaining_time": "1 day, 7:31:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 351, "total_steps": 10853, "loss": 0.2056, "learning_rate": 3.232044198895028e-06, "epoch": 0.03233979822177178, "percentage": 3.23, "elapsed_time": "1:03:14", "remaining_time": "1 day, 7:32:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 352, "total_steps": 10853, "loss": 0.1955, "learning_rate": 3.241252302025783e-06, "epoch": 0.03243193439904178, "percentage": 3.24, "elapsed_time": "1:03:25", "remaining_time": "1 day, 7:31:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 353, "total_steps": 10853, "loss": 0.2054, "learning_rate": 3.250460405156538e-06, "epoch": 0.03252407057631179, "percentage": 3.25, "elapsed_time": "1:03:35", "remaining_time": "1 day, 7:31:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 354, "total_steps": 10853, "loss": 0.1981, "learning_rate": 3.2596685082872933e-06, "epoch": 0.032616206753581796, "percentage": 3.26, "elapsed_time": "1:03:46", "remaining_time": "1 day, 7:31:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 355, "total_steps": 10853, "loss": 0.2342, "learning_rate": 3.268876611418048e-06, "epoch": 0.0327083429308518, "percentage": 3.27, "elapsed_time": "1:03:56", "remaining_time": "1 day, 7:30:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 356, "total_steps": 10853, "loss": 0.2183, "learning_rate": 3.278084714548803e-06, "epoch": 0.032800479108121804, "percentage": 3.28, "elapsed_time": "1:04:07", "remaining_time": "1 day, 7:30:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 357, "total_steps": 10853, "loss": 0.2029, "learning_rate": 3.2872928176795584e-06, "epoch": 0.03289261528539181, "percentage": 3.29, "elapsed_time": "1:04:18", "remaining_time": "1 day, 7:30:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 358, "total_steps": 10853, "loss": 0.2214, "learning_rate": 3.2965009208103133e-06, "epoch": 0.03298475146266181, "percentage": 3.3, "elapsed_time": "1:04:30", "remaining_time": "1 day, 7:31:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 359, "total_steps": 10853, "loss": 0.2026, "learning_rate": 3.305709023941068e-06, "epoch": 0.03307688763993182, "percentage": 3.31, "elapsed_time": "1:04:40", "remaining_time": "1 day, 7:30:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 360, "total_steps": 10853, "loss": 0.2209, "learning_rate": 3.3149171270718235e-06, "epoch": 0.033169023817201826, "percentage": 3.32, "elapsed_time": "1:04:51", "remaining_time": "1 day, 7:30:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 361, "total_steps": 10853, "loss": 0.2119, "learning_rate": 3.3241252302025784e-06, "epoch": 0.03326115999447183, "percentage": 3.33, "elapsed_time": "1:05:02", "remaining_time": "1 day, 7:30:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 362, "total_steps": 10853, "loss": 0.2142, "learning_rate": 3.3333333333333333e-06, "epoch": 0.033353296171741834, "percentage": 3.34, "elapsed_time": "1:05:12", "remaining_time": "1 day, 7:29:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 363, "total_steps": 10853, "loss": 0.21, "learning_rate": 3.3425414364640887e-06, "epoch": 0.03344543234901184, "percentage": 3.34, "elapsed_time": "1:05:23", "remaining_time": "1 day, 7:29:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 364, "total_steps": 10853, "loss": 0.2179, "learning_rate": 3.3517495395948436e-06, "epoch": 0.03353756852628184, "percentage": 3.35, "elapsed_time": "1:05:35", "remaining_time": "1 day, 7:29:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 365, "total_steps": 10853, "loss": 0.2066, "learning_rate": 3.3609576427255985e-06, "epoch": 0.03362970470355185, "percentage": 3.36, "elapsed_time": "1:05:46", "remaining_time": "1 day, 7:29:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 366, "total_steps": 10853, "loss": 0.2008, "learning_rate": 3.370165745856354e-06, "epoch": 0.033721840880821856, "percentage": 3.37, "elapsed_time": "1:05:56", "remaining_time": "1 day, 7:29:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 367, "total_steps": 10853, "loss": 0.193, "learning_rate": 3.379373848987109e-06, "epoch": 0.03381397705809186, "percentage": 3.38, "elapsed_time": "1:06:08", "remaining_time": "1 day, 7:29:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 368, "total_steps": 10853, "loss": 0.1982, "learning_rate": 3.3885819521178644e-06, "epoch": 0.033906113235361864, "percentage": 3.39, "elapsed_time": "1:06:19", "remaining_time": "1 day, 7:29:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 369, "total_steps": 10853, "loss": 0.1977, "learning_rate": 3.3977900552486193e-06, "epoch": 0.03399824941263187, "percentage": 3.4, "elapsed_time": "1:06:30", "remaining_time": "1 day, 7:29:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 370, "total_steps": 10853, "loss": 0.2018, "learning_rate": 3.4069981583793742e-06, "epoch": 0.03409038558990188, "percentage": 3.41, "elapsed_time": "1:06:41", "remaining_time": "1 day, 7:29:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 371, "total_steps": 10853, "loss": 0.2088, "learning_rate": 3.416206261510129e-06, "epoch": 0.03418252176717188, "percentage": 3.42, "elapsed_time": "1:06:52", "remaining_time": "1 day, 7:29:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 372, "total_steps": 10853, "loss": 0.2105, "learning_rate": 3.4254143646408845e-06, "epoch": 0.034274657944441886, "percentage": 3.43, "elapsed_time": "1:07:03", "remaining_time": "1 day, 7:29:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 373, "total_steps": 10853, "loss": 0.2063, "learning_rate": 3.4346224677716394e-06, "epoch": 0.03436679412171189, "percentage": 3.44, "elapsed_time": "1:07:14", "remaining_time": "1 day, 7:29:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 374, "total_steps": 10853, "loss": 0.2128, "learning_rate": 3.4438305709023943e-06, "epoch": 0.034458930298981894, "percentage": 3.45, "elapsed_time": "1:07:25", "remaining_time": "1 day, 7:29:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 375, "total_steps": 10853, "loss": 0.2021, "learning_rate": 3.4530386740331496e-06, "epoch": 0.0345510664762519, "percentage": 3.46, "elapsed_time": "1:07:36", "remaining_time": "1 day, 7:28:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 376, "total_steps": 10853, "loss": 0.2257, "learning_rate": 3.4622467771639045e-06, "epoch": 0.03464320265352191, "percentage": 3.46, "elapsed_time": "1:07:47", "remaining_time": "1 day, 7:29:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 377, "total_steps": 10853, "loss": 0.2145, "learning_rate": 3.4714548802946594e-06, "epoch": 0.03473533883079191, "percentage": 3.47, "elapsed_time": "1:07:58", "remaining_time": "1 day, 7:28:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 378, "total_steps": 10853, "loss": 0.2079, "learning_rate": 3.4806629834254147e-06, "epoch": 0.034827475008061916, "percentage": 3.48, "elapsed_time": "1:08:07", "remaining_time": "1 day, 7:28:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 379, "total_steps": 10853, "loss": 0.1901, "learning_rate": 3.4898710865561696e-06, "epoch": 0.03491961118533192, "percentage": 3.49, "elapsed_time": "1:08:18", "remaining_time": "1 day, 7:27:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 380, "total_steps": 10853, "loss": 0.2007, "learning_rate": 3.4990791896869245e-06, "epoch": 0.035011747362601923, "percentage": 3.5, "elapsed_time": "1:08:29", "remaining_time": "1 day, 7:27:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 381, "total_steps": 10853, "loss": 0.2195, "learning_rate": 3.50828729281768e-06, "epoch": 0.03510388353987193, "percentage": 3.51, "elapsed_time": "1:08:41", "remaining_time": "1 day, 7:28:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 382, "total_steps": 10853, "loss": 0.2066, "learning_rate": 3.5174953959484348e-06, "epoch": 0.03519601971714194, "percentage": 3.52, "elapsed_time": "1:08:51", "remaining_time": "1 day, 7:27:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 383, "total_steps": 10853, "loss": 0.2093, "learning_rate": 3.5267034990791897e-06, "epoch": 0.03528815589441194, "percentage": 3.53, "elapsed_time": "1:09:01", "remaining_time": "1 day, 7:27:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 384, "total_steps": 10853, "loss": 0.2202, "learning_rate": 3.535911602209945e-06, "epoch": 0.035380292071681946, "percentage": 3.54, "elapsed_time": "1:09:12", "remaining_time": "1 day, 7:26:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 385, "total_steps": 10853, "loss": 0.2001, "learning_rate": 3.5451197053407e-06, "epoch": 0.03547242824895195, "percentage": 3.55, "elapsed_time": "1:09:22", "remaining_time": "1 day, 7:26:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 386, "total_steps": 10853, "loss": 0.2256, "learning_rate": 3.554327808471455e-06, "epoch": 0.03556456442622195, "percentage": 3.56, "elapsed_time": "1:09:34", "remaining_time": "1 day, 7:26:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 387, "total_steps": 10853, "loss": 0.199, "learning_rate": 3.56353591160221e-06, "epoch": 0.035656700603491964, "percentage": 3.57, "elapsed_time": "1:09:44", "remaining_time": "1 day, 7:25:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 388, "total_steps": 10853, "loss": 0.2078, "learning_rate": 3.572744014732965e-06, "epoch": 0.03574883678076197, "percentage": 3.58, "elapsed_time": "1:09:56", "remaining_time": "1 day, 7:26:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 389, "total_steps": 10853, "loss": 0.2103, "learning_rate": 3.58195211786372e-06, "epoch": 0.03584097295803197, "percentage": 3.58, "elapsed_time": "1:10:06", "remaining_time": "1 day, 7:25:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 390, "total_steps": 10853, "loss": 0.2152, "learning_rate": 3.5911602209944757e-06, "epoch": 0.035933109135301976, "percentage": 3.59, "elapsed_time": "1:10:16", "remaining_time": "1 day, 7:25:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 391, "total_steps": 10853, "loss": 0.1992, "learning_rate": 3.6003683241252306e-06, "epoch": 0.03602524531257198, "percentage": 3.6, "elapsed_time": "1:10:27", "remaining_time": "1 day, 7:25:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 392, "total_steps": 10853, "loss": 0.2187, "learning_rate": 3.609576427255986e-06, "epoch": 0.03611738148984198, "percentage": 3.61, "elapsed_time": "1:10:37", "remaining_time": "1 day, 7:24:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 393, "total_steps": 10853, "loss": 0.1978, "learning_rate": 3.618784530386741e-06, "epoch": 0.036209517667111994, "percentage": 3.62, "elapsed_time": "1:10:47", "remaining_time": "1 day, 7:24:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 394, "total_steps": 10853, "loss": 0.207, "learning_rate": 3.6279926335174957e-06, "epoch": 0.036301653844382, "percentage": 3.63, "elapsed_time": "1:10:57", "remaining_time": "1 day, 7:23:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 395, "total_steps": 10853, "loss": 0.2155, "learning_rate": 3.637200736648251e-06, "epoch": 0.036393790021652, "percentage": 3.64, "elapsed_time": "1:11:07", "remaining_time": "1 day, 7:22:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 396, "total_steps": 10853, "loss": 0.2142, "learning_rate": 3.646408839779006e-06, "epoch": 0.036485926198922006, "percentage": 3.65, "elapsed_time": "1:11:17", "remaining_time": "1 day, 7:22:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 397, "total_steps": 10853, "loss": 0.2167, "learning_rate": 3.655616942909761e-06, "epoch": 0.03657806237619201, "percentage": 3.66, "elapsed_time": "1:11:28", "remaining_time": "1 day, 7:22:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 398, "total_steps": 10853, "loss": 0.2194, "learning_rate": 3.664825046040516e-06, "epoch": 0.03667019855346201, "percentage": 3.67, "elapsed_time": "1:11:40", "remaining_time": "1 day, 7:22:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 399, "total_steps": 10853, "loss": 0.2089, "learning_rate": 3.674033149171271e-06, "epoch": 0.036762334730732024, "percentage": 3.68, "elapsed_time": "1:11:50", "remaining_time": "1 day, 7:22:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 400, "total_steps": 10853, "loss": 0.2106, "learning_rate": 3.683241252302026e-06, "epoch": 0.03685447090800203, "percentage": 3.69, "elapsed_time": "1:12:01", "remaining_time": "1 day, 7:22:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 401, "total_steps": 10853, "loss": 0.2099, "learning_rate": 3.6924493554327813e-06, "epoch": 0.03694660708527203, "percentage": 3.69, "elapsed_time": "1:12:13", "remaining_time": "1 day, 7:22:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 402, "total_steps": 10853, "loss": 0.2095, "learning_rate": 3.7016574585635362e-06, "epoch": 0.037038743262542036, "percentage": 3.7, "elapsed_time": "1:12:23", "remaining_time": "1 day, 7:22:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 403, "total_steps": 10853, "loss": 0.201, "learning_rate": 3.710865561694291e-06, "epoch": 0.03713087943981204, "percentage": 3.71, "elapsed_time": "1:12:35", "remaining_time": "1 day, 7:22:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 404, "total_steps": 10853, "loss": 0.2073, "learning_rate": 3.7200736648250464e-06, "epoch": 0.03722301561708205, "percentage": 3.72, "elapsed_time": "1:12:46", "remaining_time": "1 day, 7:22:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 405, "total_steps": 10853, "loss": 0.2214, "learning_rate": 3.7292817679558014e-06, "epoch": 0.037315151794352054, "percentage": 3.73, "elapsed_time": "1:12:56", "remaining_time": "1 day, 7:21:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 406, "total_steps": 10853, "loss": 0.2202, "learning_rate": 3.7384898710865563e-06, "epoch": 0.03740728797162206, "percentage": 3.74, "elapsed_time": "1:13:05", "remaining_time": "1 day, 7:20:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 407, "total_steps": 10853, "loss": 0.1994, "learning_rate": 3.7476979742173116e-06, "epoch": 0.03749942414889206, "percentage": 3.75, "elapsed_time": "1:13:17", "remaining_time": "1 day, 7:20:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 408, "total_steps": 10853, "loss": 0.1877, "learning_rate": 3.7569060773480665e-06, "epoch": 0.037591560326162066, "percentage": 3.76, "elapsed_time": "1:13:29", "remaining_time": "1 day, 7:21:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 409, "total_steps": 10853, "loss": 0.2068, "learning_rate": 3.7661141804788214e-06, "epoch": 0.03768369650343207, "percentage": 3.77, "elapsed_time": "1:13:39", "remaining_time": "1 day, 7:20:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 410, "total_steps": 10853, "loss": 0.2184, "learning_rate": 3.7753222836095767e-06, "epoch": 0.03777583268070208, "percentage": 3.78, "elapsed_time": "1:13:50", "remaining_time": "1 day, 7:20:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 411, "total_steps": 10853, "loss": 0.1949, "learning_rate": 3.7845303867403316e-06, "epoch": 0.037867968857972084, "percentage": 3.79, "elapsed_time": "1:14:01", "remaining_time": "1 day, 7:20:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 412, "total_steps": 10853, "loss": 0.1906, "learning_rate": 3.7937384898710865e-06, "epoch": 0.03796010503524209, "percentage": 3.8, "elapsed_time": "1:14:10", "remaining_time": "1 day, 7:19:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 413, "total_steps": 10853, "loss": 0.1814, "learning_rate": 3.802946593001842e-06, "epoch": 0.03805224121251209, "percentage": 3.81, "elapsed_time": "1:14:20", "remaining_time": "1 day, 7:19:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 414, "total_steps": 10853, "loss": 0.2248, "learning_rate": 3.812154696132597e-06, "epoch": 0.038144377389782096, "percentage": 3.81, "elapsed_time": "1:14:31", "remaining_time": "1 day, 7:19:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 415, "total_steps": 10853, "loss": 0.2128, "learning_rate": 3.8213627992633525e-06, "epoch": 0.038236513567052106, "percentage": 3.82, "elapsed_time": "1:14:40", "remaining_time": "1 day, 7:18:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 416, "total_steps": 10853, "loss": 0.1874, "learning_rate": 3.830570902394107e-06, "epoch": 0.03832864974432211, "percentage": 3.83, "elapsed_time": "1:14:50", "remaining_time": "1 day, 7:17:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 417, "total_steps": 10853, "loss": 0.2141, "learning_rate": 3.839779005524862e-06, "epoch": 0.038420785921592114, "percentage": 3.84, "elapsed_time": "1:15:02", "remaining_time": "1 day, 7:17:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 418, "total_steps": 10853, "loss": 0.2094, "learning_rate": 3.848987108655617e-06, "epoch": 0.03851292209886212, "percentage": 3.85, "elapsed_time": "1:15:12", "remaining_time": "1 day, 7:17:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 419, "total_steps": 10853, "loss": 0.1954, "learning_rate": 3.858195211786372e-06, "epoch": 0.03860505827613212, "percentage": 3.86, "elapsed_time": "1:15:21", "remaining_time": "1 day, 7:16:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 420, "total_steps": 10853, "loss": 0.2275, "learning_rate": 3.867403314917128e-06, "epoch": 0.038697194453402126, "percentage": 3.87, "elapsed_time": "1:15:33", "remaining_time": "1 day, 7:16:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 421, "total_steps": 10853, "loss": 0.2126, "learning_rate": 3.876611418047883e-06, "epoch": 0.038789330630672136, "percentage": 3.88, "elapsed_time": "1:15:46", "remaining_time": "1 day, 7:17:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 422, "total_steps": 10853, "loss": 0.2024, "learning_rate": 3.885819521178638e-06, "epoch": 0.03888146680794214, "percentage": 3.89, "elapsed_time": "1:15:55", "remaining_time": "1 day, 7:16:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 423, "total_steps": 10853, "loss": 0.2131, "learning_rate": 3.8950276243093926e-06, "epoch": 0.038973602985212144, "percentage": 3.9, "elapsed_time": "1:16:06", "remaining_time": "1 day, 7:16:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 424, "total_steps": 10853, "loss": 0.2113, "learning_rate": 3.9042357274401475e-06, "epoch": 0.03906573916248215, "percentage": 3.91, "elapsed_time": "1:16:18", "remaining_time": "1 day, 7:16:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 425, "total_steps": 10853, "loss": 0.2132, "learning_rate": 3.913443830570902e-06, "epoch": 0.03915787533975215, "percentage": 3.92, "elapsed_time": "1:16:29", "remaining_time": "1 day, 7:16:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 426, "total_steps": 10853, "loss": 0.2099, "learning_rate": 3.922651933701658e-06, "epoch": 0.039250011517022156, "percentage": 3.93, "elapsed_time": "1:16:40", "remaining_time": "1 day, 7:16:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 427, "total_steps": 10853, "loss": 0.2125, "learning_rate": 3.931860036832413e-06, "epoch": 0.039342147694292166, "percentage": 3.93, "elapsed_time": "1:16:51", "remaining_time": "1 day, 7:16:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 428, "total_steps": 10853, "loss": 0.2057, "learning_rate": 3.941068139963168e-06, "epoch": 0.03943428387156217, "percentage": 3.94, "elapsed_time": "1:17:02", "remaining_time": "1 day, 7:16:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 429, "total_steps": 10853, "loss": 0.1912, "learning_rate": 3.950276243093923e-06, "epoch": 0.039526420048832174, "percentage": 3.95, "elapsed_time": "1:17:14", "remaining_time": "1 day, 7:16:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 430, "total_steps": 10853, "loss": 0.2224, "learning_rate": 3.959484346224678e-06, "epoch": 0.03961855622610218, "percentage": 3.96, "elapsed_time": "1:17:25", "remaining_time": "1 day, 7:16:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 431, "total_steps": 10853, "loss": 0.2296, "learning_rate": 3.968692449355433e-06, "epoch": 0.03971069240337218, "percentage": 3.97, "elapsed_time": "1:17:35", "remaining_time": "1 day, 7:16:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 432, "total_steps": 10853, "loss": 0.2062, "learning_rate": 3.977900552486188e-06, "epoch": 0.03980282858064219, "percentage": 3.98, "elapsed_time": "1:17:46", "remaining_time": "1 day, 7:16:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 433, "total_steps": 10853, "loss": 0.2085, "learning_rate": 3.987108655616943e-06, "epoch": 0.039894964757912196, "percentage": 3.99, "elapsed_time": "1:17:56", "remaining_time": "1 day, 7:15:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 434, "total_steps": 10853, "loss": 0.1929, "learning_rate": 3.996316758747698e-06, "epoch": 0.0399871009351822, "percentage": 4.0, "elapsed_time": "1:18:07", "remaining_time": "1 day, 7:15:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 435, "total_steps": 10853, "loss": 0.2097, "learning_rate": 4.005524861878453e-06, "epoch": 0.040079237112452204, "percentage": 4.01, "elapsed_time": "1:18:18", "remaining_time": "1 day, 7:15:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 436, "total_steps": 10853, "loss": 0.2118, "learning_rate": 4.014732965009208e-06, "epoch": 0.04017137328972221, "percentage": 4.02, "elapsed_time": "1:18:29", "remaining_time": "1 day, 7:15:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 437, "total_steps": 10853, "loss": 0.2149, "learning_rate": 4.023941068139964e-06, "epoch": 0.04026350946699221, "percentage": 4.03, "elapsed_time": "1:18:40", "remaining_time": "1 day, 7:15:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 438, "total_steps": 10853, "loss": 0.2219, "learning_rate": 4.033149171270719e-06, "epoch": 0.04035564564426222, "percentage": 4.04, "elapsed_time": "1:18:51", "remaining_time": "1 day, 7:14:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 439, "total_steps": 10853, "loss": 0.1945, "learning_rate": 4.0423572744014736e-06, "epoch": 0.040447781821532226, "percentage": 4.04, "elapsed_time": "1:19:01", "remaining_time": "1 day, 7:14:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 440, "total_steps": 10853, "loss": 0.1891, "learning_rate": 4.051565377532229e-06, "epoch": 0.04053991799880223, "percentage": 4.05, "elapsed_time": "1:19:12", "remaining_time": "1 day, 7:14:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 441, "total_steps": 10853, "loss": 0.2175, "learning_rate": 4.060773480662984e-06, "epoch": 0.040632054176072234, "percentage": 4.06, "elapsed_time": "1:19:24", "remaining_time": "1 day, 7:14:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 442, "total_steps": 10853, "loss": 0.2064, "learning_rate": 4.069981583793739e-06, "epoch": 0.04072419035334224, "percentage": 4.07, "elapsed_time": "1:19:35", "remaining_time": "1 day, 7:14:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 443, "total_steps": 10853, "loss": 0.219, "learning_rate": 4.079189686924494e-06, "epoch": 0.04081632653061224, "percentage": 4.08, "elapsed_time": "1:19:46", "remaining_time": "1 day, 7:14:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 444, "total_steps": 10853, "loss": 0.203, "learning_rate": 4.088397790055249e-06, "epoch": 0.04090846270788225, "percentage": 4.09, "elapsed_time": "1:19:56", "remaining_time": "1 day, 7:14:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 445, "total_steps": 10853, "loss": 0.2131, "learning_rate": 4.097605893186004e-06, "epoch": 0.041000598885152256, "percentage": 4.1, "elapsed_time": "1:20:08", "remaining_time": "1 day, 7:14:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 446, "total_steps": 10853, "loss": 0.2029, "learning_rate": 4.106813996316759e-06, "epoch": 0.04109273506242226, "percentage": 4.11, "elapsed_time": "1:20:19", "remaining_time": "1 day, 7:14:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 447, "total_steps": 10853, "loss": 0.2069, "learning_rate": 4.1160220994475145e-06, "epoch": 0.041184871239692264, "percentage": 4.12, "elapsed_time": "1:20:32", "remaining_time": "1 day, 7:14:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 448, "total_steps": 10853, "loss": 0.2179, "learning_rate": 4.125230202578269e-06, "epoch": 0.04127700741696227, "percentage": 4.13, "elapsed_time": "1:20:43", "remaining_time": "1 day, 7:14:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 449, "total_steps": 10853, "loss": 0.2043, "learning_rate": 4.134438305709024e-06, "epoch": 0.04136914359423228, "percentage": 4.14, "elapsed_time": "1:20:54", "remaining_time": "1 day, 7:14:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 450, "total_steps": 10853, "loss": 0.2162, "learning_rate": 4.143646408839779e-06, "epoch": 0.04146127977150228, "percentage": 4.15, "elapsed_time": "1:21:05", "remaining_time": "1 day, 7:14:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 451, "total_steps": 10853, "loss": 0.2197, "learning_rate": 4.152854511970534e-06, "epoch": 0.041553415948772286, "percentage": 4.16, "elapsed_time": "1:21:16", "remaining_time": "1 day, 7:14:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 452, "total_steps": 10853, "loss": 0.24, "learning_rate": 4.162062615101289e-06, "epoch": 0.04164555212604229, "percentage": 4.16, "elapsed_time": "1:21:25", "remaining_time": "1 day, 7:13:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 453, "total_steps": 10853, "loss": 0.209, "learning_rate": 4.171270718232045e-06, "epoch": 0.041737688303312294, "percentage": 4.17, "elapsed_time": "1:21:36", "remaining_time": "1 day, 7:13:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 454, "total_steps": 10853, "loss": 0.1983, "learning_rate": 4.1804788213628e-06, "epoch": 0.0418298244805823, "percentage": 4.18, "elapsed_time": "1:21:47", "remaining_time": "1 day, 7:13:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 455, "total_steps": 10853, "loss": 0.2191, "learning_rate": 4.1896869244935545e-06, "epoch": 0.04192196065785231, "percentage": 4.19, "elapsed_time": "1:21:58", "remaining_time": "1 day, 7:13:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 456, "total_steps": 10853, "loss": 0.2023, "learning_rate": 4.1988950276243095e-06, "epoch": 0.04201409683512231, "percentage": 4.2, "elapsed_time": "1:22:08", "remaining_time": "1 day, 7:12:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 457, "total_steps": 10853, "loss": 0.2032, "learning_rate": 4.208103130755064e-06, "epoch": 0.042106233012392316, "percentage": 4.21, "elapsed_time": "1:22:19", "remaining_time": "1 day, 7:12:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 458, "total_steps": 10853, "loss": 0.2193, "learning_rate": 4.217311233885819e-06, "epoch": 0.04219836918966232, "percentage": 4.22, "elapsed_time": "1:22:30", "remaining_time": "1 day, 7:12:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 459, "total_steps": 10853, "loss": 0.221, "learning_rate": 4.226519337016575e-06, "epoch": 0.042290505366932324, "percentage": 4.23, "elapsed_time": "1:22:42", "remaining_time": "1 day, 7:12:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 460, "total_steps": 10853, "loss": 0.2258, "learning_rate": 4.23572744014733e-06, "epoch": 0.04238264154420233, "percentage": 4.24, "elapsed_time": "1:22:54", "remaining_time": "1 day, 7:13:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 461, "total_steps": 10853, "loss": 0.2027, "learning_rate": 4.244935543278086e-06, "epoch": 0.04247477772147234, "percentage": 4.25, "elapsed_time": "1:23:03", "remaining_time": "1 day, 7:12:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 462, "total_steps": 10853, "loss": 0.2351, "learning_rate": 4.2541436464088406e-06, "epoch": 0.04256691389874234, "percentage": 4.26, "elapsed_time": "1:23:13", "remaining_time": "1 day, 7:12:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 463, "total_steps": 10853, "loss": 0.2035, "learning_rate": 4.2633517495395955e-06, "epoch": 0.042659050076012346, "percentage": 4.27, "elapsed_time": "1:23:24", "remaining_time": "1 day, 7:11:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 464, "total_steps": 10853, "loss": 0.2234, "learning_rate": 4.27255985267035e-06, "epoch": 0.04275118625328235, "percentage": 4.28, "elapsed_time": "1:23:36", "remaining_time": "1 day, 7:12:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 465, "total_steps": 10853, "loss": 0.1724, "learning_rate": 4.281767955801105e-06, "epoch": 0.042843322430552354, "percentage": 4.28, "elapsed_time": "1:23:49", "remaining_time": "1 day, 7:12:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 466, "total_steps": 10853, "loss": 0.2288, "learning_rate": 4.29097605893186e-06, "epoch": 0.042935458607822365, "percentage": 4.29, "elapsed_time": "1:24:00", "remaining_time": "1 day, 7:12:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 467, "total_steps": 10853, "loss": 0.2017, "learning_rate": 4.300184162062616e-06, "epoch": 0.04302759478509237, "percentage": 4.3, "elapsed_time": "1:24:10", "remaining_time": "1 day, 7:12:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 468, "total_steps": 10853, "loss": 0.2096, "learning_rate": 4.309392265193371e-06, "epoch": 0.04311973096236237, "percentage": 4.31, "elapsed_time": "1:24:22", "remaining_time": "1 day, 7:12:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 469, "total_steps": 10853, "loss": 0.2148, "learning_rate": 4.318600368324126e-06, "epoch": 0.043211867139632376, "percentage": 4.32, "elapsed_time": "1:24:32", "remaining_time": "1 day, 7:11:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 470, "total_steps": 10853, "loss": 0.2164, "learning_rate": 4.327808471454881e-06, "epoch": 0.04330400331690238, "percentage": 4.33, "elapsed_time": "1:24:43", "remaining_time": "1 day, 7:11:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 471, "total_steps": 10853, "loss": 0.2054, "learning_rate": 4.3370165745856355e-06, "epoch": 0.043396139494172384, "percentage": 4.34, "elapsed_time": "1:24:55", "remaining_time": "1 day, 7:11:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 472, "total_steps": 10853, "loss": 0.2119, "learning_rate": 4.3462246777163904e-06, "epoch": 0.043488275671442395, "percentage": 4.35, "elapsed_time": "1:25:07", "remaining_time": "1 day, 7:12:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 473, "total_steps": 10853, "loss": 0.2158, "learning_rate": 4.355432780847146e-06, "epoch": 0.0435804118487124, "percentage": 4.36, "elapsed_time": "1:25:17", "remaining_time": "1 day, 7:11:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 474, "total_steps": 10853, "loss": 0.2089, "learning_rate": 4.364640883977901e-06, "epoch": 0.0436725480259824, "percentage": 4.37, "elapsed_time": "1:25:28", "remaining_time": "1 day, 7:11:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 475, "total_steps": 10853, "loss": 0.2184, "learning_rate": 4.373848987108656e-06, "epoch": 0.043764684203252406, "percentage": 4.38, "elapsed_time": "1:25:39", "remaining_time": "1 day, 7:11:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 476, "total_steps": 10853, "loss": 0.2198, "learning_rate": 4.383057090239411e-06, "epoch": 0.04385682038052241, "percentage": 4.39, "elapsed_time": "1:25:50", "remaining_time": "1 day, 7:11:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 477, "total_steps": 10853, "loss": 0.2047, "learning_rate": 4.392265193370166e-06, "epoch": 0.043948956557792414, "percentage": 4.4, "elapsed_time": "1:26:00", "remaining_time": "1 day, 7:10:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 478, "total_steps": 10853, "loss": 0.2104, "learning_rate": 4.401473296500921e-06, "epoch": 0.044041092735062425, "percentage": 4.4, "elapsed_time": "1:26:11", "remaining_time": "1 day, 7:10:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 479, "total_steps": 10853, "loss": 0.2169, "learning_rate": 4.4106813996316765e-06, "epoch": 0.04413322891233243, "percentage": 4.41, "elapsed_time": "1:26:22", "remaining_time": "1 day, 7:10:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 480, "total_steps": 10853, "loss": 0.2173, "learning_rate": 4.419889502762431e-06, "epoch": 0.04422536508960243, "percentage": 4.42, "elapsed_time": "1:26:33", "remaining_time": "1 day, 7:10:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 481, "total_steps": 10853, "loss": 0.1962, "learning_rate": 4.429097605893186e-06, "epoch": 0.044317501266872436, "percentage": 4.43, "elapsed_time": "1:26:44", "remaining_time": "1 day, 7:10:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 482, "total_steps": 10853, "loss": 0.218, "learning_rate": 4.438305709023941e-06, "epoch": 0.04440963744414244, "percentage": 4.44, "elapsed_time": "1:26:56", "remaining_time": "1 day, 7:10:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 483, "total_steps": 10853, "loss": 0.2183, "learning_rate": 4.447513812154696e-06, "epoch": 0.04450177362141245, "percentage": 4.45, "elapsed_time": "1:27:08", "remaining_time": "1 day, 7:10:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 484, "total_steps": 10853, "loss": 0.2013, "learning_rate": 4.456721915285452e-06, "epoch": 0.044593909798682455, "percentage": 4.46, "elapsed_time": "1:27:17", "remaining_time": "1 day, 7:10:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 485, "total_steps": 10853, "loss": 0.2002, "learning_rate": 4.465930018416207e-06, "epoch": 0.04468604597595246, "percentage": 4.47, "elapsed_time": "1:27:28", "remaining_time": "1 day, 7:09:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 486, "total_steps": 10853, "loss": 0.2209, "learning_rate": 4.475138121546962e-06, "epoch": 0.04477818215322246, "percentage": 4.48, "elapsed_time": "1:27:38", "remaining_time": "1 day, 7:09:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 487, "total_steps": 10853, "loss": 0.2046, "learning_rate": 4.484346224677717e-06, "epoch": 0.044870318330492466, "percentage": 4.49, "elapsed_time": "1:27:49", "remaining_time": "1 day, 7:09:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 488, "total_steps": 10853, "loss": 0.2199, "learning_rate": 4.493554327808472e-06, "epoch": 0.04496245450776247, "percentage": 4.5, "elapsed_time": "1:28:01", "remaining_time": "1 day, 7:09:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 489, "total_steps": 10853, "loss": 0.2117, "learning_rate": 4.502762430939227e-06, "epoch": 0.04505459068503248, "percentage": 4.51, "elapsed_time": "1:28:12", "remaining_time": "1 day, 7:09:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 490, "total_steps": 10853, "loss": 0.2126, "learning_rate": 4.511970534069982e-06, "epoch": 0.045146726862302484, "percentage": 4.51, "elapsed_time": "1:28:22", "remaining_time": "1 day, 7:09:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 491, "total_steps": 10853, "loss": 0.2079, "learning_rate": 4.521178637200737e-06, "epoch": 0.04523886303957249, "percentage": 4.52, "elapsed_time": "1:28:34", "remaining_time": "1 day, 7:09:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 492, "total_steps": 10853, "loss": 0.2047, "learning_rate": 4.530386740331492e-06, "epoch": 0.04533099921684249, "percentage": 4.53, "elapsed_time": "1:28:43", "remaining_time": "1 day, 7:08:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 493, "total_steps": 10853, "loss": 0.1852, "learning_rate": 4.539594843462248e-06, "epoch": 0.045423135394112496, "percentage": 4.54, "elapsed_time": "1:28:53", "remaining_time": "1 day, 7:07:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 494, "total_steps": 10853, "loss": 0.2038, "learning_rate": 4.5488029465930025e-06, "epoch": 0.04551527157138251, "percentage": 4.55, "elapsed_time": "1:29:03", "remaining_time": "1 day, 7:07:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 495, "total_steps": 10853, "loss": 0.196, "learning_rate": 4.5580110497237574e-06, "epoch": 0.04560740774865251, "percentage": 4.56, "elapsed_time": "1:29:13", "remaining_time": "1 day, 7:07:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 496, "total_steps": 10853, "loss": 0.1995, "learning_rate": 4.567219152854512e-06, "epoch": 0.045699543925922514, "percentage": 4.57, "elapsed_time": "1:29:24", "remaining_time": "1 day, 7:06:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 497, "total_steps": 10853, "loss": 0.2143, "learning_rate": 4.576427255985267e-06, "epoch": 0.04579168010319252, "percentage": 4.58, "elapsed_time": "1:29:34", "remaining_time": "1 day, 7:06:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 498, "total_steps": 10853, "loss": 0.1979, "learning_rate": 4.585635359116022e-06, "epoch": 0.04588381628046252, "percentage": 4.59, "elapsed_time": "1:29:45", "remaining_time": "1 day, 7:06:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 499, "total_steps": 10853, "loss": 0.2078, "learning_rate": 4.594843462246777e-06, "epoch": 0.045975952457732526, "percentage": 4.6, "elapsed_time": "1:29:56", "remaining_time": "1 day, 7:06:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 500, "total_steps": 10853, "loss": 0.1961, "learning_rate": 4.604051565377533e-06, "epoch": 0.04606808863500254, "percentage": 4.61, "elapsed_time": "1:30:06", "remaining_time": "1 day, 7:05:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 500, "total_steps": 10853, "eval_loss": 0.20690900087356567, "epoch": 0.04606808863500254, "percentage": 4.61, "elapsed_time": "1:35:06", "remaining_time": "1 day, 8:49:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 501, "total_steps": 10853, "loss": 0.2047, "learning_rate": 4.613259668508288e-06, "epoch": 0.04616022481227254, "percentage": 4.62, "elapsed_time": "1:35:16", "remaining_time": "1 day, 8:48:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 502, "total_steps": 10853, "loss": 0.2019, "learning_rate": 4.622467771639043e-06, "epoch": 0.046252360989542544, "percentage": 4.63, "elapsed_time": "1:35:28", "remaining_time": "1 day, 8:48:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 503, "total_steps": 10853, "loss": 0.1987, "learning_rate": 4.6316758747697975e-06, "epoch": 0.04634449716681255, "percentage": 4.63, "elapsed_time": "1:35:39", "remaining_time": "1 day, 8:48:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 504, "total_steps": 10853, "loss": 0.2127, "learning_rate": 4.640883977900552e-06, "epoch": 0.04643663334408255, "percentage": 4.64, "elapsed_time": "1:35:50", "remaining_time": "1 day, 8:48:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 505, "total_steps": 10853, "loss": 0.197, "learning_rate": 4.650092081031307e-06, "epoch": 0.046528769521352556, "percentage": 4.65, "elapsed_time": "1:36:01", "remaining_time": "1 day, 8:47:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 506, "total_steps": 10853, "loss": 0.1919, "learning_rate": 4.659300184162063e-06, "epoch": 0.04662090569862257, "percentage": 4.66, "elapsed_time": "1:36:11", "remaining_time": "1 day, 8:46:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 507, "total_steps": 10853, "loss": 0.1938, "learning_rate": 4.668508287292818e-06, "epoch": 0.04671304187589257, "percentage": 4.67, "elapsed_time": "1:36:23", "remaining_time": "1 day, 8:46:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 508, "total_steps": 10853, "loss": 0.2025, "learning_rate": 4.677716390423574e-06, "epoch": 0.046805178053162574, "percentage": 4.68, "elapsed_time": "1:36:33", "remaining_time": "1 day, 8:46:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 509, "total_steps": 10853, "loss": 0.2144, "learning_rate": 4.686924493554329e-06, "epoch": 0.04689731423043258, "percentage": 4.69, "elapsed_time": "1:36:44", "remaining_time": "1 day, 8:46:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 510, "total_steps": 10853, "loss": 0.2194, "learning_rate": 4.6961325966850835e-06, "epoch": 0.04698945040770258, "percentage": 4.7, "elapsed_time": "1:36:54", "remaining_time": "1 day, 8:45:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 511, "total_steps": 10853, "loss": 0.2092, "learning_rate": 4.7053406998158384e-06, "epoch": 0.04708158658497259, "percentage": 4.71, "elapsed_time": "1:37:06", "remaining_time": "1 day, 8:45:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 512, "total_steps": 10853, "loss": 0.2052, "learning_rate": 4.714548802946593e-06, "epoch": 0.0471737227622426, "percentage": 4.72, "elapsed_time": "1:37:17", "remaining_time": "1 day, 8:45:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 513, "total_steps": 10853, "loss": 0.207, "learning_rate": 4.723756906077348e-06, "epoch": 0.0472658589395126, "percentage": 4.73, "elapsed_time": "1:37:28", "remaining_time": "1 day, 8:44:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 514, "total_steps": 10853, "loss": 0.2169, "learning_rate": 4.732965009208104e-06, "epoch": 0.047357995116782604, "percentage": 4.74, "elapsed_time": "1:37:37", "remaining_time": "1 day, 8:43:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 515, "total_steps": 10853, "loss": 0.2123, "learning_rate": 4.742173112338859e-06, "epoch": 0.04745013129405261, "percentage": 4.75, "elapsed_time": "1:37:47", "remaining_time": "1 day, 8:43:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 516, "total_steps": 10853, "loss": 0.2213, "learning_rate": 4.751381215469614e-06, "epoch": 0.04754226747132261, "percentage": 4.75, "elapsed_time": "1:37:58", "remaining_time": "1 day, 8:42:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 517, "total_steps": 10853, "loss": 0.2248, "learning_rate": 4.760589318600369e-06, "epoch": 0.04763440364859262, "percentage": 4.76, "elapsed_time": "1:38:07", "remaining_time": "1 day, 8:41:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 518, "total_steps": 10853, "loss": 0.2067, "learning_rate": 4.769797421731124e-06, "epoch": 0.04772653982586263, "percentage": 4.77, "elapsed_time": "1:38:18", "remaining_time": "1 day, 8:41:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 519, "total_steps": 10853, "loss": 0.2121, "learning_rate": 4.7790055248618785e-06, "epoch": 0.04781867600313263, "percentage": 4.78, "elapsed_time": "1:38:28", "remaining_time": "1 day, 8:40:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 520, "total_steps": 10853, "loss": 0.2048, "learning_rate": 4.788213627992634e-06, "epoch": 0.047910812180402634, "percentage": 4.79, "elapsed_time": "1:38:39", "remaining_time": "1 day, 8:40:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 521, "total_steps": 10853, "loss": 0.2052, "learning_rate": 4.797421731123389e-06, "epoch": 0.04800294835767264, "percentage": 4.8, "elapsed_time": "1:38:49", "remaining_time": "1 day, 8:39:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 522, "total_steps": 10853, "loss": 0.2037, "learning_rate": 4.806629834254144e-06, "epoch": 0.04809508453494264, "percentage": 4.81, "elapsed_time": "1:39:00", "remaining_time": "1 day, 8:39:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 523, "total_steps": 10853, "loss": 0.2162, "learning_rate": 4.815837937384899e-06, "epoch": 0.04818722071221265, "percentage": 4.82, "elapsed_time": "1:39:13", "remaining_time": "1 day, 8:39:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 524, "total_steps": 10853, "loss": 0.1947, "learning_rate": 4.825046040515654e-06, "epoch": 0.04827935688948266, "percentage": 4.83, "elapsed_time": "1:39:23", "remaining_time": "1 day, 8:39:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 525, "total_steps": 10853, "loss": 0.2224, "learning_rate": 4.834254143646409e-06, "epoch": 0.04837149306675266, "percentage": 4.84, "elapsed_time": "1:39:35", "remaining_time": "1 day, 8:39:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 526, "total_steps": 10853, "loss": 0.2104, "learning_rate": 4.8434622467771645e-06, "epoch": 0.048463629244022664, "percentage": 4.85, "elapsed_time": "1:39:45", "remaining_time": "1 day, 8:38:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 527, "total_steps": 10853, "loss": 0.2112, "learning_rate": 4.852670349907919e-06, "epoch": 0.04855576542129267, "percentage": 4.86, "elapsed_time": "1:39:56", "remaining_time": "1 day, 8:38:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 528, "total_steps": 10853, "loss": 0.2075, "learning_rate": 4.861878453038674e-06, "epoch": 0.04864790159856268, "percentage": 4.87, "elapsed_time": "1:40:08", "remaining_time": "1 day, 8:38:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 529, "total_steps": 10853, "loss": 0.2143, "learning_rate": 4.871086556169429e-06, "epoch": 0.04874003777583268, "percentage": 4.87, "elapsed_time": "1:40:18", "remaining_time": "1 day, 8:37:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 530, "total_steps": 10853, "loss": 0.2131, "learning_rate": 4.880294659300184e-06, "epoch": 0.04883217395310269, "percentage": 4.88, "elapsed_time": "1:40:29", "remaining_time": "1 day, 8:37:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 531, "total_steps": 10853, "loss": 0.2198, "learning_rate": 4.889502762430939e-06, "epoch": 0.04892431013037269, "percentage": 4.89, "elapsed_time": "1:40:39", "remaining_time": "1 day, 8:36:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 532, "total_steps": 10853, "loss": 0.1981, "learning_rate": 4.898710865561695e-06, "epoch": 0.049016446307642694, "percentage": 4.9, "elapsed_time": "1:40:50", "remaining_time": "1 day, 8:36:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 533, "total_steps": 10853, "loss": 0.2105, "learning_rate": 4.90791896869245e-06, "epoch": 0.0491085824849127, "percentage": 4.91, "elapsed_time": "1:41:01", "remaining_time": "1 day, 8:36:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 534, "total_steps": 10853, "loss": 0.2274, "learning_rate": 4.9171270718232054e-06, "epoch": 0.04920071866218271, "percentage": 4.92, "elapsed_time": "1:41:12", "remaining_time": "1 day, 8:35:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 535, "total_steps": 10853, "loss": 0.2047, "learning_rate": 4.92633517495396e-06, "epoch": 0.04929285483945271, "percentage": 4.93, "elapsed_time": "1:41:23", "remaining_time": "1 day, 8:35:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 536, "total_steps": 10853, "loss": 0.1734, "learning_rate": 4.935543278084715e-06, "epoch": 0.04938499101672272, "percentage": 4.94, "elapsed_time": "1:41:33", "remaining_time": "1 day, 8:34:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 537, "total_steps": 10853, "loss": 0.2168, "learning_rate": 4.94475138121547e-06, "epoch": 0.04947712719399272, "percentage": 4.95, "elapsed_time": "1:41:43", "remaining_time": "1 day, 8:34:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 538, "total_steps": 10853, "loss": 0.2109, "learning_rate": 4.953959484346225e-06, "epoch": 0.049569263371262724, "percentage": 4.96, "elapsed_time": "1:41:54", "remaining_time": "1 day, 8:33:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 539, "total_steps": 10853, "loss": 0.2091, "learning_rate": 4.96316758747698e-06, "epoch": 0.04966139954853273, "percentage": 4.97, "elapsed_time": "1:42:06", "remaining_time": "1 day, 8:33:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 540, "total_steps": 10853, "loss": 0.2072, "learning_rate": 4.972375690607736e-06, "epoch": 0.04975353572580274, "percentage": 4.98, "elapsed_time": "1:42:17", "remaining_time": "1 day, 8:33:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 541, "total_steps": 10853, "loss": 0.2066, "learning_rate": 4.981583793738491e-06, "epoch": 0.04984567190307274, "percentage": 4.98, "elapsed_time": "1:42:28", "remaining_time": "1 day, 8:33:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 542, "total_steps": 10853, "loss": 0.2128, "learning_rate": 4.9907918968692455e-06, "epoch": 0.04993780808034275, "percentage": 4.99, "elapsed_time": "1:42:38", "remaining_time": "1 day, 8:32:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 543, "total_steps": 10853, "loss": 0.2015, "learning_rate": 5e-06, "epoch": 0.05002994425761275, "percentage": 5.0, "elapsed_time": "1:42:51", "remaining_time": "1 day, 8:32:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 544, "total_steps": 10853, "loss": 0.213, "learning_rate": 4.999999883937366e-06, "epoch": 0.050122080434882754, "percentage": 5.01, "elapsed_time": "1:43:02", "remaining_time": "1 day, 8:32:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 545, "total_steps": 10853, "loss": 0.2064, "learning_rate": 4.999999535749473e-06, "epoch": 0.050214216612152765, "percentage": 5.02, "elapsed_time": "1:43:11", "remaining_time": "1 day, 8:31:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 546, "total_steps": 10853, "loss": 0.2024, "learning_rate": 4.999998955436354e-06, "epoch": 0.05030635278942277, "percentage": 5.03, "elapsed_time": "1:43:21", "remaining_time": "1 day, 8:31:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 547, "total_steps": 10853, "loss": 0.2001, "learning_rate": 4.999998142998064e-06, "epoch": 0.05039848896669277, "percentage": 5.04, "elapsed_time": "1:43:33", "remaining_time": "1 day, 8:31:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 548, "total_steps": 10853, "loss": 0.2089, "learning_rate": 4.999997098434676e-06, "epoch": 0.050490625143962777, "percentage": 5.05, "elapsed_time": "1:43:45", "remaining_time": "1 day, 8:31:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 549, "total_steps": 10853, "loss": 0.2084, "learning_rate": 4.999995821746289e-06, "epoch": 0.05058276132123278, "percentage": 5.06, "elapsed_time": "1:43:56", "remaining_time": "1 day, 8:30:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 550, "total_steps": 10853, "loss": 0.2187, "learning_rate": 4.9999943129330204e-06, "epoch": 0.050674897498502784, "percentage": 5.07, "elapsed_time": "1:44:07", "remaining_time": "1 day, 8:30:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 551, "total_steps": 10853, "loss": 0.1944, "learning_rate": 4.999992571995011e-06, "epoch": 0.050767033675772795, "percentage": 5.08, "elapsed_time": "1:44:17", "remaining_time": "1 day, 8:29:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 552, "total_steps": 10853, "loss": 0.2001, "learning_rate": 4.999990598932423e-06, "epoch": 0.0508591698530428, "percentage": 5.09, "elapsed_time": "1:44:29", "remaining_time": "1 day, 8:29:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 553, "total_steps": 10853, "loss": 0.2018, "learning_rate": 4.999988393745438e-06, "epoch": 0.0509513060303128, "percentage": 5.1, "elapsed_time": "1:44:39", "remaining_time": "1 day, 8:29:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 554, "total_steps": 10853, "loss": 0.2369, "learning_rate": 4.999985956434263e-06, "epoch": 0.051043442207582806, "percentage": 5.1, "elapsed_time": "1:44:49", "remaining_time": "1 day, 8:28:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 555, "total_steps": 10853, "loss": 0.1985, "learning_rate": 4.999983286999121e-06, "epoch": 0.05113557838485281, "percentage": 5.11, "elapsed_time": "1:44:59", "remaining_time": "1 day, 8:28:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 556, "total_steps": 10853, "loss": 0.2056, "learning_rate": 4.999980385440262e-06, "epoch": 0.051227714562122814, "percentage": 5.12, "elapsed_time": "1:45:11", "remaining_time": "1 day, 8:28:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 557, "total_steps": 10853, "loss": 0.2036, "learning_rate": 4.999977251757956e-06, "epoch": 0.051319850739392825, "percentage": 5.13, "elapsed_time": "1:45:23", "remaining_time": "1 day, 8:28:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 558, "total_steps": 10853, "loss": 0.2105, "learning_rate": 4.999973885952492e-06, "epoch": 0.05141198691666283, "percentage": 5.14, "elapsed_time": "1:45:33", "remaining_time": "1 day, 8:27:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 559, "total_steps": 10853, "loss": 0.2136, "learning_rate": 4.9999702880241855e-06, "epoch": 0.05150412309393283, "percentage": 5.15, "elapsed_time": "1:45:44", "remaining_time": "1 day, 8:27:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 560, "total_steps": 10853, "loss": 0.2173, "learning_rate": 4.999966457973367e-06, "epoch": 0.051596259271202836, "percentage": 5.16, "elapsed_time": "1:45:54", "remaining_time": "1 day, 8:26:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 561, "total_steps": 10853, "loss": 0.2334, "learning_rate": 4.999962395800395e-06, "epoch": 0.05168839544847284, "percentage": 5.17, "elapsed_time": "1:46:04", "remaining_time": "1 day, 8:25:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 562, "total_steps": 10853, "loss": 0.2071, "learning_rate": 4.999958101505645e-06, "epoch": 0.05178053162574285, "percentage": 5.18, "elapsed_time": "1:46:16", "remaining_time": "1 day, 8:25:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 563, "total_steps": 10853, "loss": 0.2165, "learning_rate": 4.999953575089516e-06, "epoch": 0.051872667803012855, "percentage": 5.19, "elapsed_time": "1:46:27", "remaining_time": "1 day, 8:25:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 564, "total_steps": 10853, "loss": 0.2057, "learning_rate": 4.999948816552429e-06, "epoch": 0.05196480398028286, "percentage": 5.2, "elapsed_time": "1:46:38", "remaining_time": "1 day, 8:25:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 565, "total_steps": 10853, "loss": 0.2254, "learning_rate": 4.999943825894825e-06, "epoch": 0.05205694015755286, "percentage": 5.21, "elapsed_time": "1:46:49", "remaining_time": "1 day, 8:25:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 566, "total_steps": 10853, "loss": 0.2032, "learning_rate": 4.999938603117167e-06, "epoch": 0.052149076334822866, "percentage": 5.22, "elapsed_time": "1:46:59", "remaining_time": "1 day, 8:24:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 567, "total_steps": 10853, "loss": 0.2353, "learning_rate": 4.999933148219942e-06, "epoch": 0.05224121251209287, "percentage": 5.22, "elapsed_time": "1:47:11", "remaining_time": "1 day, 8:24:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 568, "total_steps": 10853, "loss": 0.2122, "learning_rate": 4.999927461203654e-06, "epoch": 0.05233334868936288, "percentage": 5.23, "elapsed_time": "1:47:22", "remaining_time": "1 day, 8:24:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 569, "total_steps": 10853, "loss": 0.2023, "learning_rate": 4.999921542068833e-06, "epoch": 0.052425484866632885, "percentage": 5.24, "elapsed_time": "1:47:34", "remaining_time": "1 day, 8:24:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 570, "total_steps": 10853, "loss": 0.1914, "learning_rate": 4.9999153908160285e-06, "epoch": 0.05251762104390289, "percentage": 5.25, "elapsed_time": "1:47:45", "remaining_time": "1 day, 8:23:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 571, "total_steps": 10853, "loss": 0.2155, "learning_rate": 4.999909007445809e-06, "epoch": 0.05260975722117289, "percentage": 5.26, "elapsed_time": "1:47:55", "remaining_time": "1 day, 8:23:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 572, "total_steps": 10853, "loss": 0.2156, "learning_rate": 4.99990239195877e-06, "epoch": 0.052701893398442896, "percentage": 5.27, "elapsed_time": "1:48:06", "remaining_time": "1 day, 8:23:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 573, "total_steps": 10853, "loss": 0.2128, "learning_rate": 4.999895544355525e-06, "epoch": 0.0527940295757129, "percentage": 5.28, "elapsed_time": "1:48:18", "remaining_time": "1 day, 8:23:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 574, "total_steps": 10853, "loss": 0.1973, "learning_rate": 4.9998884646367094e-06, "epoch": 0.05288616575298291, "percentage": 5.29, "elapsed_time": "1:48:29", "remaining_time": "1 day, 8:22:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 575, "total_steps": 10853, "loss": 0.2063, "learning_rate": 4.999881152802981e-06, "epoch": 0.052978301930252915, "percentage": 5.3, "elapsed_time": "1:48:41", "remaining_time": "1 day, 8:22:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 576, "total_steps": 10853, "loss": 0.2013, "learning_rate": 4.999873608855019e-06, "epoch": 0.05307043810752292, "percentage": 5.31, "elapsed_time": "1:48:51", "remaining_time": "1 day, 8:22:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 577, "total_steps": 10853, "loss": 0.2111, "learning_rate": 4.999865832793522e-06, "epoch": 0.05316257428479292, "percentage": 5.32, "elapsed_time": "1:49:02", "remaining_time": "1 day, 8:21:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 578, "total_steps": 10853, "loss": 0.2059, "learning_rate": 4.9998578246192155e-06, "epoch": 0.053254710462062926, "percentage": 5.33, "elapsed_time": "1:49:11", "remaining_time": "1 day, 8:21:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 579, "total_steps": 10853, "loss": 0.2221, "learning_rate": 4.9998495843328385e-06, "epoch": 0.05334684663933294, "percentage": 5.33, "elapsed_time": "1:49:22", "remaining_time": "1 day, 8:20:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 580, "total_steps": 10853, "loss": 0.2102, "learning_rate": 4.9998411119351605e-06, "epoch": 0.05343898281660294, "percentage": 5.34, "elapsed_time": "1:49:33", "remaining_time": "1 day, 8:20:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 581, "total_steps": 10853, "loss": 0.215, "learning_rate": 4.999832407426966e-06, "epoch": 0.053531118993872945, "percentage": 5.35, "elapsed_time": "1:49:44", "remaining_time": "1 day, 8:20:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 582, "total_steps": 10853, "loss": 0.2148, "learning_rate": 4.999823470809062e-06, "epoch": 0.05362325517114295, "percentage": 5.36, "elapsed_time": "1:49:55", "remaining_time": "1 day, 8:19:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 583, "total_steps": 10853, "loss": 0.1878, "learning_rate": 4.999814302082281e-06, "epoch": 0.05371539134841295, "percentage": 5.37, "elapsed_time": "1:50:06", "remaining_time": "1 day, 8:19:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 584, "total_steps": 10853, "loss": 0.2021, "learning_rate": 4.999804901247472e-06, "epoch": 0.053807527525682956, "percentage": 5.38, "elapsed_time": "1:50:18", "remaining_time": "1 day, 8:19:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 585, "total_steps": 10853, "loss": 0.2083, "learning_rate": 4.99979526830551e-06, "epoch": 0.05389966370295297, "percentage": 5.39, "elapsed_time": "1:50:29", "remaining_time": "1 day, 8:19:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 586, "total_steps": 10853, "loss": 0.1993, "learning_rate": 4.999785403257288e-06, "epoch": 0.05399179988022297, "percentage": 5.4, "elapsed_time": "1:50:39", "remaining_time": "1 day, 8:18:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 587, "total_steps": 10853, "loss": 0.1965, "learning_rate": 4.9997753061037225e-06, "epoch": 0.054083936057492975, "percentage": 5.41, "elapsed_time": "1:50:51", "remaining_time": "1 day, 8:18:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 588, "total_steps": 10853, "loss": 0.2219, "learning_rate": 4.9997649768457505e-06, "epoch": 0.05417607223476298, "percentage": 5.42, "elapsed_time": "1:51:02", "remaining_time": "1 day, 8:18:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 589, "total_steps": 10853, "loss": 0.2147, "learning_rate": 4.999754415484331e-06, "epoch": 0.05426820841203298, "percentage": 5.43, "elapsed_time": "1:51:12", "remaining_time": "1 day, 8:17:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 590, "total_steps": 10853, "loss": 0.2046, "learning_rate": 4.9997436220204455e-06, "epoch": 0.05436034458930299, "percentage": 5.44, "elapsed_time": "1:51:23", "remaining_time": "1 day, 8:17:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 591, "total_steps": 10853, "loss": 0.2243, "learning_rate": 4.9997325964550945e-06, "epoch": 0.054452480766573, "percentage": 5.45, "elapsed_time": "1:51:35", "remaining_time": "1 day, 8:17:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 592, "total_steps": 10853, "loss": 0.2069, "learning_rate": 4.999721338789304e-06, "epoch": 0.054544616943843, "percentage": 5.45, "elapsed_time": "1:51:45", "remaining_time": "1 day, 8:17:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 593, "total_steps": 10853, "loss": 0.2018, "learning_rate": 4.999709849024118e-06, "epoch": 0.054636753121113005, "percentage": 5.46, "elapsed_time": "1:51:56", "remaining_time": "1 day, 8:16:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 594, "total_steps": 10853, "loss": 0.1898, "learning_rate": 4.999698127160604e-06, "epoch": 0.05472888929838301, "percentage": 5.47, "elapsed_time": "1:52:07", "remaining_time": "1 day, 8:16:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 595, "total_steps": 10853, "loss": 0.2035, "learning_rate": 4.999686173199849e-06, "epoch": 0.05482102547565301, "percentage": 5.48, "elapsed_time": "1:52:18", "remaining_time": "1 day, 8:16:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 596, "total_steps": 10853, "loss": 0.2044, "learning_rate": 4.999673987142964e-06, "epoch": 0.05491316165292302, "percentage": 5.49, "elapsed_time": "1:52:28", "remaining_time": "1 day, 8:15:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 597, "total_steps": 10853, "loss": 0.2042, "learning_rate": 4.999661568991081e-06, "epoch": 0.05500529783019303, "percentage": 5.5, "elapsed_time": "1:52:38", "remaining_time": "1 day, 8:15:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 598, "total_steps": 10853, "loss": 0.2115, "learning_rate": 4.999648918745352e-06, "epoch": 0.05509743400746303, "percentage": 5.51, "elapsed_time": "1:52:48", "remaining_time": "1 day, 8:14:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 599, "total_steps": 10853, "loss": 0.2169, "learning_rate": 4.999636036406951e-06, "epoch": 0.055189570184733035, "percentage": 5.52, "elapsed_time": "1:52:58", "remaining_time": "1 day, 8:13:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 600, "total_steps": 10853, "loss": 0.2131, "learning_rate": 4.999622921977076e-06, "epoch": 0.05528170636200304, "percentage": 5.53, "elapsed_time": "1:53:10", "remaining_time": "1 day, 8:13:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 601, "total_steps": 10853, "loss": 0.1844, "learning_rate": 4.999609575456944e-06, "epoch": 0.05537384253927304, "percentage": 5.54, "elapsed_time": "1:53:20", "remaining_time": "1 day, 8:13:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 602, "total_steps": 10853, "loss": 0.2256, "learning_rate": 4.9995959968477926e-06, "epoch": 0.05546597871654305, "percentage": 5.55, "elapsed_time": "1:53:30", "remaining_time": "1 day, 8:12:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 603, "total_steps": 10853, "loss": 0.1867, "learning_rate": 4.9995821861508844e-06, "epoch": 0.05555811489381306, "percentage": 5.56, "elapsed_time": "1:53:41", "remaining_time": "1 day, 8:12:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 604, "total_steps": 10853, "loss": 0.1964, "learning_rate": 4.999568143367501e-06, "epoch": 0.05565025107108306, "percentage": 5.57, "elapsed_time": "1:53:51", "remaining_time": "1 day, 8:11:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 605, "total_steps": 10853, "loss": 0.2115, "learning_rate": 4.999553868498948e-06, "epoch": 0.055742387248353065, "percentage": 5.57, "elapsed_time": "1:54:01", "remaining_time": "1 day, 8:11:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 606, "total_steps": 10853, "loss": 0.1758, "learning_rate": 4.999539361546547e-06, "epoch": 0.05583452342562307, "percentage": 5.58, "elapsed_time": "1:54:11", "remaining_time": "1 day, 8:10:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 607, "total_steps": 10853, "loss": 0.2164, "learning_rate": 4.999524622511649e-06, "epoch": 0.05592665960289308, "percentage": 5.59, "elapsed_time": "1:54:22", "remaining_time": "1 day, 8:10:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 608, "total_steps": 10853, "loss": 0.2008, "learning_rate": 4.99950965139562e-06, "epoch": 0.05601879578016308, "percentage": 5.6, "elapsed_time": "1:54:32", "remaining_time": "1 day, 8:10:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 609, "total_steps": 10853, "loss": 0.2092, "learning_rate": 4.999494448199851e-06, "epoch": 0.05611093195743309, "percentage": 5.61, "elapsed_time": "1:54:42", "remaining_time": "1 day, 8:09:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 610, "total_steps": 10853, "loss": 0.1984, "learning_rate": 4.9994790129257535e-06, "epoch": 0.05620306813470309, "percentage": 5.62, "elapsed_time": "1:54:54", "remaining_time": "1 day, 8:09:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 611, "total_steps": 10853, "loss": 0.2162, "learning_rate": 4.999463345574761e-06, "epoch": 0.056295204311973095, "percentage": 5.63, "elapsed_time": "1:55:05", "remaining_time": "1 day, 8:09:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 612, "total_steps": 10853, "loss": 0.2137, "learning_rate": 4.999447446148328e-06, "epoch": 0.0563873404892431, "percentage": 5.64, "elapsed_time": "1:55:16", "remaining_time": "1 day, 8:09:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 613, "total_steps": 10853, "loss": 0.2129, "learning_rate": 4.999431314647929e-06, "epoch": 0.05647947666651311, "percentage": 5.65, "elapsed_time": "1:55:27", "remaining_time": "1 day, 8:08:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 614, "total_steps": 10853, "loss": 0.2007, "learning_rate": 4.999414951075065e-06, "epoch": 0.05657161284378311, "percentage": 5.66, "elapsed_time": "1:55:37", "remaining_time": "1 day, 8:08:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 615, "total_steps": 10853, "loss": 0.2108, "learning_rate": 4.999398355431253e-06, "epoch": 0.05666374902105312, "percentage": 5.67, "elapsed_time": "1:55:47", "remaining_time": "1 day, 8:07:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 616, "total_steps": 10853, "loss": 0.2098, "learning_rate": 4.999381527718036e-06, "epoch": 0.05675588519832312, "percentage": 5.68, "elapsed_time": "1:55:58", "remaining_time": "1 day, 8:07:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 617, "total_steps": 10853, "loss": 0.2076, "learning_rate": 4.999364467936974e-06, "epoch": 0.056848021375593125, "percentage": 5.69, "elapsed_time": "1:56:09", "remaining_time": "1 day, 8:07:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 618, "total_steps": 10853, "loss": 0.1909, "learning_rate": 4.999347176089653e-06, "epoch": 0.05694015755286313, "percentage": 5.69, "elapsed_time": "1:56:21", "remaining_time": "1 day, 8:07:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 619, "total_steps": 10853, "loss": 0.2081, "learning_rate": 4.999329652177677e-06, "epoch": 0.05703229373013314, "percentage": 5.7, "elapsed_time": "1:56:32", "remaining_time": "1 day, 8:06:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 620, "total_steps": 10853, "loss": 0.2152, "learning_rate": 4.9993118962026735e-06, "epoch": 0.05712442990740314, "percentage": 5.71, "elapsed_time": "1:56:42", "remaining_time": "1 day, 8:06:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 621, "total_steps": 10853, "loss": 0.1946, "learning_rate": 4.999293908166292e-06, "epoch": 0.05721656608467315, "percentage": 5.72, "elapsed_time": "1:56:54", "remaining_time": "1 day, 8:06:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 622, "total_steps": 10853, "loss": 0.1944, "learning_rate": 4.999275688070202e-06, "epoch": 0.05730870226194315, "percentage": 5.73, "elapsed_time": "1:57:04", "remaining_time": "1 day, 8:05:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 623, "total_steps": 10853, "loss": 0.2065, "learning_rate": 4.999257235916096e-06, "epoch": 0.057400838439213155, "percentage": 5.74, "elapsed_time": "1:57:16", "remaining_time": "1 day, 8:05:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 624, "total_steps": 10853, "loss": 0.1944, "learning_rate": 4.999238551705686e-06, "epoch": 0.057492974616483165, "percentage": 5.75, "elapsed_time": "1:57:26", "remaining_time": "1 day, 8:05:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 625, "total_steps": 10853, "loss": 0.2122, "learning_rate": 4.9992196354407075e-06, "epoch": 0.05758511079375317, "percentage": 5.76, "elapsed_time": "1:57:37", "remaining_time": "1 day, 8:04:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 626, "total_steps": 10853, "loss": 0.2187, "learning_rate": 4.999200487122917e-06, "epoch": 0.05767724697102317, "percentage": 5.77, "elapsed_time": "1:57:47", "remaining_time": "1 day, 8:04:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 627, "total_steps": 10853, "loss": 0.1956, "learning_rate": 4.999181106754093e-06, "epoch": 0.05776938314829318, "percentage": 5.78, "elapsed_time": "1:57:57", "remaining_time": "1 day, 8:03:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 628, "total_steps": 10853, "loss": 0.1927, "learning_rate": 4.999161494336033e-06, "epoch": 0.05786151932556318, "percentage": 5.79, "elapsed_time": "1:58:09", "remaining_time": "1 day, 8:03:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 629, "total_steps": 10853, "loss": 0.1986, "learning_rate": 4.99914164987056e-06, "epoch": 0.057953655502833185, "percentage": 5.8, "elapsed_time": "1:58:20", "remaining_time": "1 day, 8:03:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 630, "total_steps": 10853, "loss": 0.2119, "learning_rate": 4.999121573359516e-06, "epoch": 0.058045791680103195, "percentage": 5.8, "elapsed_time": "1:58:32", "remaining_time": "1 day, 8:03:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 631, "total_steps": 10853, "loss": 0.1911, "learning_rate": 4.999101264804765e-06, "epoch": 0.0581379278573732, "percentage": 5.81, "elapsed_time": "1:58:43", "remaining_time": "1 day, 8:03:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 632, "total_steps": 10853, "loss": 0.2053, "learning_rate": 4.9990807242081915e-06, "epoch": 0.0582300640346432, "percentage": 5.82, "elapsed_time": "1:58:54", "remaining_time": "1 day, 8:03:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 633, "total_steps": 10853, "loss": 0.2119, "learning_rate": 4.999059951571705e-06, "epoch": 0.05832220021191321, "percentage": 5.83, "elapsed_time": "1:59:04", "remaining_time": "1 day, 8:02:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 634, "total_steps": 10853, "loss": 0.2239, "learning_rate": 4.9990389468972336e-06, "epoch": 0.05841433638918321, "percentage": 5.84, "elapsed_time": "1:59:15", "remaining_time": "1 day, 8:02:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 635, "total_steps": 10853, "loss": 0.2233, "learning_rate": 4.999017710186725e-06, "epoch": 0.058506472566453215, "percentage": 5.85, "elapsed_time": "1:59:27", "remaining_time": "1 day, 8:02:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 636, "total_steps": 10853, "loss": 0.2056, "learning_rate": 4.998996241442155e-06, "epoch": 0.058598608743723225, "percentage": 5.86, "elapsed_time": "1:59:38", "remaining_time": "1 day, 8:02:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 637, "total_steps": 10853, "loss": 0.2078, "learning_rate": 4.998974540665514e-06, "epoch": 0.05869074492099323, "percentage": 5.87, "elapsed_time": "1:59:51", "remaining_time": "1 day, 8:02:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 638, "total_steps": 10853, "loss": 0.1947, "learning_rate": 4.998952607858818e-06, "epoch": 0.05878288109826323, "percentage": 5.88, "elapsed_time": "2:00:01", "remaining_time": "1 day, 8:01:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 639, "total_steps": 10853, "loss": 0.1999, "learning_rate": 4.998930443024103e-06, "epoch": 0.05887501727553324, "percentage": 5.89, "elapsed_time": "2:00:13", "remaining_time": "1 day, 8:01:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 640, "total_steps": 10853, "loss": 0.2139, "learning_rate": 4.9989080461634285e-06, "epoch": 0.05896715345280324, "percentage": 5.9, "elapsed_time": "2:00:25", "remaining_time": "1 day, 8:01:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 641, "total_steps": 10853, "loss": 0.1945, "learning_rate": 4.9988854172788725e-06, "epoch": 0.05905928963007325, "percentage": 5.91, "elapsed_time": "2:00:36", "remaining_time": "1 day, 8:01:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 642, "total_steps": 10853, "loss": 0.2146, "learning_rate": 4.998862556372537e-06, "epoch": 0.059151425807343255, "percentage": 5.92, "elapsed_time": "2:00:47", "remaining_time": "1 day, 8:01:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 643, "total_steps": 10853, "loss": 0.1872, "learning_rate": 4.998839463446543e-06, "epoch": 0.05924356198461326, "percentage": 5.92, "elapsed_time": "2:00:58", "remaining_time": "1 day, 8:00:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 644, "total_steps": 10853, "loss": 0.2128, "learning_rate": 4.998816138503038e-06, "epoch": 0.05933569816188326, "percentage": 5.93, "elapsed_time": "2:01:08", "remaining_time": "1 day, 8:00:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 645, "total_steps": 10853, "loss": 0.186, "learning_rate": 4.9987925815441835e-06, "epoch": 0.05942783433915327, "percentage": 5.94, "elapsed_time": "2:01:18", "remaining_time": "1 day, 7:59:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 646, "total_steps": 10853, "loss": 0.1814, "learning_rate": 4.99876879257217e-06, "epoch": 0.05951997051642327, "percentage": 5.95, "elapsed_time": "2:01:28", "remaining_time": "1 day, 7:59:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 647, "total_steps": 10853, "loss": 0.2033, "learning_rate": 4.9987447715892046e-06, "epoch": 0.05961210669369328, "percentage": 5.96, "elapsed_time": "2:01:38", "remaining_time": "1 day, 7:58:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 648, "total_steps": 10853, "loss": 0.1976, "learning_rate": 4.998720518597518e-06, "epoch": 0.059704242870963285, "percentage": 5.97, "elapsed_time": "2:01:49", "remaining_time": "1 day, 7:58:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 649, "total_steps": 10853, "loss": 0.2214, "learning_rate": 4.998696033599363e-06, "epoch": 0.05979637904823329, "percentage": 5.98, "elapsed_time": "2:02:01", "remaining_time": "1 day, 7:58:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 650, "total_steps": 10853, "loss": 0.1957, "learning_rate": 4.998671316597012e-06, "epoch": 0.05988851522550329, "percentage": 5.99, "elapsed_time": "2:02:11", "remaining_time": "1 day, 7:58:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 651, "total_steps": 10853, "loss": 0.1977, "learning_rate": 4.998646367592761e-06, "epoch": 0.0599806514027733, "percentage": 6.0, "elapsed_time": "2:02:22", "remaining_time": "1 day, 7:57:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 652, "total_steps": 10853, "loss": 0.2137, "learning_rate": 4.998621186588925e-06, "epoch": 0.0600727875800433, "percentage": 6.01, "elapsed_time": "2:02:32", "remaining_time": "1 day, 7:57:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 653, "total_steps": 10853, "loss": 0.198, "learning_rate": 4.998595773587844e-06, "epoch": 0.06016492375731331, "percentage": 6.02, "elapsed_time": "2:02:43", "remaining_time": "1 day, 7:57:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 654, "total_steps": 10853, "loss": 0.1983, "learning_rate": 4.998570128591875e-06, "epoch": 0.060257059934583315, "percentage": 6.03, "elapsed_time": "2:02:54", "remaining_time": "1 day, 7:56:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 655, "total_steps": 10853, "loss": 0.197, "learning_rate": 4.998544251603402e-06, "epoch": 0.06034919611185332, "percentage": 6.04, "elapsed_time": "2:03:05", "remaining_time": "1 day, 7:56:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 656, "total_steps": 10853, "loss": 0.2165, "learning_rate": 4.998518142624826e-06, "epoch": 0.06044133228912332, "percentage": 6.04, "elapsed_time": "2:03:16", "remaining_time": "1 day, 7:56:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 657, "total_steps": 10853, "loss": 0.1782, "learning_rate": 4.998491801658571e-06, "epoch": 0.06053346846639333, "percentage": 6.05, "elapsed_time": "2:03:25", "remaining_time": "1 day, 7:55:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 658, "total_steps": 10853, "loss": 0.1976, "learning_rate": 4.998465228707084e-06, "epoch": 0.06062560464366334, "percentage": 6.06, "elapsed_time": "2:03:37", "remaining_time": "1 day, 7:55:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 659, "total_steps": 10853, "loss": 0.2195, "learning_rate": 4.998438423772831e-06, "epoch": 0.06071774082093334, "percentage": 6.07, "elapsed_time": "2:03:47", "remaining_time": "1 day, 7:54:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 660, "total_steps": 10853, "loss": 0.2114, "learning_rate": 4.998411386858303e-06, "epoch": 0.060809876998203345, "percentage": 6.08, "elapsed_time": "2:03:57", "remaining_time": "1 day, 7:54:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 661, "total_steps": 10853, "loss": 0.1967, "learning_rate": 4.998384117966007e-06, "epoch": 0.06090201317547335, "percentage": 6.09, "elapsed_time": "2:04:09", "remaining_time": "1 day, 7:54:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 662, "total_steps": 10853, "loss": 0.2076, "learning_rate": 4.998356617098478e-06, "epoch": 0.06099414935274335, "percentage": 6.1, "elapsed_time": "2:04:20", "remaining_time": "1 day, 7:54:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 663, "total_steps": 10853, "loss": 0.2047, "learning_rate": 4.9983288842582665e-06, "epoch": 0.06108628553001336, "percentage": 6.11, "elapsed_time": "2:04:32", "remaining_time": "1 day, 7:54:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 664, "total_steps": 10853, "loss": 0.2026, "learning_rate": 4.9983009194479505e-06, "epoch": 0.06117842170728337, "percentage": 6.12, "elapsed_time": "2:04:42", "remaining_time": "1 day, 7:53:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 665, "total_steps": 10853, "loss": 0.2008, "learning_rate": 4.998272722670126e-06, "epoch": 0.06127055788455337, "percentage": 6.13, "elapsed_time": "2:04:53", "remaining_time": "1 day, 7:53:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 666, "total_steps": 10853, "loss": 0.1813, "learning_rate": 4.998244293927409e-06, "epoch": 0.061362694061823375, "percentage": 6.14, "elapsed_time": "2:05:01", "remaining_time": "1 day, 7:52:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 667, "total_steps": 10853, "loss": 0.219, "learning_rate": 4.998215633222441e-06, "epoch": 0.06145483023909338, "percentage": 6.15, "elapsed_time": "2:05:11", "remaining_time": "1 day, 7:51:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 668, "total_steps": 10853, "loss": 0.1977, "learning_rate": 4.998186740557882e-06, "epoch": 0.06154696641636338, "percentage": 6.15, "elapsed_time": "2:05:22", "remaining_time": "1 day, 7:51:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 669, "total_steps": 10853, "loss": 0.1914, "learning_rate": 4.998157615936416e-06, "epoch": 0.061639102593633394, "percentage": 6.16, "elapsed_time": "2:05:33", "remaining_time": "1 day, 7:51:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 670, "total_steps": 10853, "loss": 0.2087, "learning_rate": 4.998128259360747e-06, "epoch": 0.0617312387709034, "percentage": 6.17, "elapsed_time": "2:05:44", "remaining_time": "1 day, 7:51:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 671, "total_steps": 10853, "loss": 0.211, "learning_rate": 4.998098670833599e-06, "epoch": 0.0618233749481734, "percentage": 6.18, "elapsed_time": "2:05:54", "remaining_time": "1 day, 7:50:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 672, "total_steps": 10853, "loss": 0.1912, "learning_rate": 4.998068850357721e-06, "epoch": 0.061915511125443405, "percentage": 6.19, "elapsed_time": "2:06:05", "remaining_time": "1 day, 7:50:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 673, "total_steps": 10853, "loss": 0.1952, "learning_rate": 4.998038797935882e-06, "epoch": 0.06200764730271341, "percentage": 6.2, "elapsed_time": "2:06:15", "remaining_time": "1 day, 7:49:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 674, "total_steps": 10853, "loss": 0.2017, "learning_rate": 4.9980085135708715e-06, "epoch": 0.06209978347998341, "percentage": 6.21, "elapsed_time": "2:06:25", "remaining_time": "1 day, 7:49:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 675, "total_steps": 10853, "loss": 0.2049, "learning_rate": 4.997977997265501e-06, "epoch": 0.062191919657253424, "percentage": 6.22, "elapsed_time": "2:06:37", "remaining_time": "1 day, 7:49:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 676, "total_steps": 10853, "loss": 0.1861, "learning_rate": 4.997947249022605e-06, "epoch": 0.06228405583452343, "percentage": 6.23, "elapsed_time": "2:06:47", "remaining_time": "1 day, 7:48:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 677, "total_steps": 10853, "loss": 0.1935, "learning_rate": 4.997916268845038e-06, "epoch": 0.06237619201179343, "percentage": 6.24, "elapsed_time": "2:06:57", "remaining_time": "1 day, 7:48:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 678, "total_steps": 10853, "loss": 0.1959, "learning_rate": 4.997885056735677e-06, "epoch": 0.062468328189063435, "percentage": 6.25, "elapsed_time": "2:07:08", "remaining_time": "1 day, 7:47:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 679, "total_steps": 10853, "loss": 0.1987, "learning_rate": 4.99785361269742e-06, "epoch": 0.06256046436633345, "percentage": 6.26, "elapsed_time": "2:07:17", "remaining_time": "1 day, 7:47:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 680, "total_steps": 10853, "loss": 0.2098, "learning_rate": 4.9978219367331856e-06, "epoch": 0.06265260054360344, "percentage": 6.27, "elapsed_time": "2:07:30", "remaining_time": "1 day, 7:47:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 681, "total_steps": 10853, "loss": 0.2078, "learning_rate": 4.997790028845916e-06, "epoch": 0.06274473672087345, "percentage": 6.27, "elapsed_time": "2:07:40", "remaining_time": "1 day, 7:47:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 682, "total_steps": 10853, "loss": 0.2082, "learning_rate": 4.997757889038573e-06, "epoch": 0.06283687289814345, "percentage": 6.28, "elapsed_time": "2:07:50", "remaining_time": "1 day, 7:46:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 683, "total_steps": 10853, "loss": 0.1917, "learning_rate": 4.9977255173141405e-06, "epoch": 0.06292900907541346, "percentage": 6.29, "elapsed_time": "2:08:02", "remaining_time": "1 day, 7:46:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 684, "total_steps": 10853, "loss": 0.2071, "learning_rate": 4.997692913675626e-06, "epoch": 0.06302114525268347, "percentage": 6.3, "elapsed_time": "2:08:13", "remaining_time": "1 day, 7:46:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 685, "total_steps": 10853, "loss": 0.2097, "learning_rate": 4.997660078126055e-06, "epoch": 0.06311328142995347, "percentage": 6.31, "elapsed_time": "2:08:24", "remaining_time": "1 day, 7:46:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 686, "total_steps": 10853, "loss": 0.2119, "learning_rate": 4.997627010668477e-06, "epoch": 0.06320541760722348, "percentage": 6.32, "elapsed_time": "2:08:35", "remaining_time": "1 day, 7:45:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 687, "total_steps": 10853, "loss": 0.1931, "learning_rate": 4.997593711305963e-06, "epoch": 0.06329755378449348, "percentage": 6.33, "elapsed_time": "2:08:47", "remaining_time": "1 day, 7:45:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 688, "total_steps": 10853, "loss": 0.2016, "learning_rate": 4.997560180041604e-06, "epoch": 0.06338968996176349, "percentage": 6.34, "elapsed_time": "2:08:58", "remaining_time": "1 day, 7:45:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 689, "total_steps": 10853, "loss": 0.1991, "learning_rate": 4.997526416878513e-06, "epoch": 0.0634818261390335, "percentage": 6.35, "elapsed_time": "2:09:07", "remaining_time": "1 day, 7:44:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 690, "total_steps": 10853, "loss": 0.1901, "learning_rate": 4.997492421819825e-06, "epoch": 0.0635739623163035, "percentage": 6.36, "elapsed_time": "2:09:18", "remaining_time": "1 day, 7:44:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 691, "total_steps": 10853, "loss": 0.1964, "learning_rate": 4.997458194868697e-06, "epoch": 0.0636660984935735, "percentage": 6.37, "elapsed_time": "2:09:29", "remaining_time": "1 day, 7:44:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 692, "total_steps": 10853, "loss": 0.1942, "learning_rate": 4.997423736028308e-06, "epoch": 0.0637582346708435, "percentage": 6.38, "elapsed_time": "2:09:40", "remaining_time": "1 day, 7:43:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 693, "total_steps": 10853, "loss": 0.1803, "learning_rate": 4.997389045301856e-06, "epoch": 0.06385037084811351, "percentage": 6.39, "elapsed_time": "2:09:52", "remaining_time": "1 day, 7:44:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 694, "total_steps": 10853, "loss": 0.2028, "learning_rate": 4.997354122692561e-06, "epoch": 0.06394250702538351, "percentage": 6.39, "elapsed_time": "2:10:03", "remaining_time": "1 day, 7:43:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 695, "total_steps": 10853, "loss": 0.1639, "learning_rate": 4.997318968203668e-06, "epoch": 0.06403464320265352, "percentage": 6.4, "elapsed_time": "2:10:14", "remaining_time": "1 day, 7:43:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 696, "total_steps": 10853, "loss": 0.1952, "learning_rate": 4.99728358183844e-06, "epoch": 0.06412677937992353, "percentage": 6.41, "elapsed_time": "2:10:24", "remaining_time": "1 day, 7:43:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 697, "total_steps": 10853, "loss": 0.1902, "learning_rate": 4.9972479636001625e-06, "epoch": 0.06421891555719353, "percentage": 6.42, "elapsed_time": "2:10:35", "remaining_time": "1 day, 7:42:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 698, "total_steps": 10853, "loss": 0.1993, "learning_rate": 4.9972121134921435e-06, "epoch": 0.06431105173446354, "percentage": 6.43, "elapsed_time": "2:10:45", "remaining_time": "1 day, 7:42:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 699, "total_steps": 10853, "loss": 0.1968, "learning_rate": 4.99717603151771e-06, "epoch": 0.06440318791173354, "percentage": 6.44, "elapsed_time": "2:10:56", "remaining_time": "1 day, 7:42:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 700, "total_steps": 10853, "loss": 0.1962, "learning_rate": 4.997139717680214e-06, "epoch": 0.06449532408900355, "percentage": 6.45, "elapsed_time": "2:11:07", "remaining_time": "1 day, 7:41:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 701, "total_steps": 10853, "loss": 0.2103, "learning_rate": 4.9971031719830255e-06, "epoch": 0.06458746026627356, "percentage": 6.46, "elapsed_time": "2:11:17", "remaining_time": "1 day, 7:41:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 702, "total_steps": 10853, "loss": 0.1929, "learning_rate": 4.9970663944295396e-06, "epoch": 0.06467959644354355, "percentage": 6.47, "elapsed_time": "2:11:29", "remaining_time": "1 day, 7:41:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 703, "total_steps": 10853, "loss": 0.2004, "learning_rate": 4.99702938502317e-06, "epoch": 0.06477173262081357, "percentage": 6.48, "elapsed_time": "2:11:40", "remaining_time": "1 day, 7:41:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 704, "total_steps": 10853, "loss": 0.1955, "learning_rate": 4.996992143767353e-06, "epoch": 0.06486386879808356, "percentage": 6.49, "elapsed_time": "2:11:52", "remaining_time": "1 day, 7:41:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 705, "total_steps": 10853, "loss": 0.1971, "learning_rate": 4.996954670665547e-06, "epoch": 0.06495600497535357, "percentage": 6.5, "elapsed_time": "2:12:02", "remaining_time": "1 day, 7:40:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 706, "total_steps": 10853, "loss": 0.2186, "learning_rate": 4.996916965721232e-06, "epoch": 0.06504814115262358, "percentage": 6.51, "elapsed_time": "2:12:14", "remaining_time": "1 day, 7:40:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 707, "total_steps": 10853, "loss": 0.2043, "learning_rate": 4.996879028937906e-06, "epoch": 0.06514027732989358, "percentage": 6.51, "elapsed_time": "2:12:26", "remaining_time": "1 day, 7:40:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 708, "total_steps": 10853, "loss": 0.2042, "learning_rate": 4.996840860319094e-06, "epoch": 0.06523241350716359, "percentage": 6.52, "elapsed_time": "2:12:36", "remaining_time": "1 day, 7:40:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 709, "total_steps": 10853, "loss": 0.1927, "learning_rate": 4.996802459868341e-06, "epoch": 0.06532454968443359, "percentage": 6.53, "elapsed_time": "2:12:46", "remaining_time": "1 day, 7:39:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 710, "total_steps": 10853, "loss": 0.2088, "learning_rate": 4.996763827589209e-06, "epoch": 0.0654166858617036, "percentage": 6.54, "elapsed_time": "2:12:57", "remaining_time": "1 day, 7:39:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 711, "total_steps": 10853, "loss": 0.2067, "learning_rate": 4.996724963485288e-06, "epoch": 0.0655088220389736, "percentage": 6.55, "elapsed_time": "2:13:05", "remaining_time": "1 day, 7:38:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 712, "total_steps": 10853, "loss": 0.2011, "learning_rate": 4.996685867560186e-06, "epoch": 0.06560095821624361, "percentage": 6.56, "elapsed_time": "2:13:15", "remaining_time": "1 day, 7:38:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 713, "total_steps": 10853, "loss": 0.2104, "learning_rate": 4.996646539817531e-06, "epoch": 0.06569309439351362, "percentage": 6.57, "elapsed_time": "2:13:27", "remaining_time": "1 day, 7:37:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 714, "total_steps": 10853, "loss": 0.2188, "learning_rate": 4.996606980260977e-06, "epoch": 0.06578523057078361, "percentage": 6.58, "elapsed_time": "2:13:38", "remaining_time": "1 day, 7:37:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 715, "total_steps": 10853, "loss": 0.1866, "learning_rate": 4.9965671888941955e-06, "epoch": 0.06587736674805363, "percentage": 6.59, "elapsed_time": "2:13:49", "remaining_time": "1 day, 7:37:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 716, "total_steps": 10853, "loss": 0.2027, "learning_rate": 4.996527165720882e-06, "epoch": 0.06596950292532362, "percentage": 6.6, "elapsed_time": "2:14:01", "remaining_time": "1 day, 7:37:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 717, "total_steps": 10853, "loss": 0.184, "learning_rate": 4.996486910744753e-06, "epoch": 0.06606163910259363, "percentage": 6.61, "elapsed_time": "2:14:11", "remaining_time": "1 day, 7:37:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 718, "total_steps": 10853, "loss": 0.1791, "learning_rate": 4.996446423969546e-06, "epoch": 0.06615377527986364, "percentage": 6.62, "elapsed_time": "2:14:22", "remaining_time": "1 day, 7:36:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 719, "total_steps": 10853, "loss": 0.2073, "learning_rate": 4.9964057053990186e-06, "epoch": 0.06624591145713364, "percentage": 6.62, "elapsed_time": "2:14:34", "remaining_time": "1 day, 7:36:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 720, "total_steps": 10853, "loss": 0.201, "learning_rate": 4.996364755036954e-06, "epoch": 0.06633804763440365, "percentage": 6.63, "elapsed_time": "2:14:46", "remaining_time": "1 day, 7:36:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 721, "total_steps": 10853, "loss": 0.1882, "learning_rate": 4.996323572887153e-06, "epoch": 0.06643018381167365, "percentage": 6.64, "elapsed_time": "2:14:58", "remaining_time": "1 day, 7:36:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 722, "total_steps": 10853, "loss": 0.1845, "learning_rate": 4.996282158953439e-06, "epoch": 0.06652231998894366, "percentage": 6.65, "elapsed_time": "2:15:09", "remaining_time": "1 day, 7:36:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 723, "total_steps": 10853, "loss": 0.2094, "learning_rate": 4.996240513239658e-06, "epoch": 0.06661445616621367, "percentage": 6.66, "elapsed_time": "2:15:19", "remaining_time": "1 day, 7:36:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 724, "total_steps": 10853, "loss": 0.2001, "learning_rate": 4.9961986357496775e-06, "epoch": 0.06670659234348367, "percentage": 6.67, "elapsed_time": "2:15:29", "remaining_time": "1 day, 7:35:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 725, "total_steps": 10853, "loss": 0.1898, "learning_rate": 4.996156526487383e-06, "epoch": 0.06679872852075368, "percentage": 6.68, "elapsed_time": "2:15:40", "remaining_time": "1 day, 7:35:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 726, "total_steps": 10853, "loss": 0.1877, "learning_rate": 4.996114185456688e-06, "epoch": 0.06689086469802367, "percentage": 6.69, "elapsed_time": "2:15:50", "remaining_time": "1 day, 7:34:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 727, "total_steps": 10853, "loss": 0.1953, "learning_rate": 4.996071612661523e-06, "epoch": 0.06698300087529369, "percentage": 6.7, "elapsed_time": "2:16:00", "remaining_time": "1 day, 7:34:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 728, "total_steps": 10853, "loss": 0.2108, "learning_rate": 4.996028808105838e-06, "epoch": 0.06707513705256368, "percentage": 6.71, "elapsed_time": "2:16:10", "remaining_time": "1 day, 7:33:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 729, "total_steps": 10853, "loss": 0.1885, "learning_rate": 4.995985771793611e-06, "epoch": 0.0671672732298337, "percentage": 6.72, "elapsed_time": "2:16:21", "remaining_time": "1 day, 7:33:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 730, "total_steps": 10853, "loss": 0.1945, "learning_rate": 4.995942503728837e-06, "epoch": 0.0672594094071037, "percentage": 6.73, "elapsed_time": "2:16:32", "remaining_time": "1 day, 7:33:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 731, "total_steps": 10853, "loss": 0.2073, "learning_rate": 4.995899003915532e-06, "epoch": 0.0673515455843737, "percentage": 6.74, "elapsed_time": "2:16:44", "remaining_time": "1 day, 7:33:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 732, "total_steps": 10853, "loss": 0.2024, "learning_rate": 4.995855272357736e-06, "epoch": 0.06744368176164371, "percentage": 6.74, "elapsed_time": "2:16:54", "remaining_time": "1 day, 7:32:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 733, "total_steps": 10853, "loss": 0.2027, "learning_rate": 4.995811309059509e-06, "epoch": 0.06753581793891371, "percentage": 6.75, "elapsed_time": "2:17:06", "remaining_time": "1 day, 7:32:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 734, "total_steps": 10853, "loss": 0.1931, "learning_rate": 4.995767114024934e-06, "epoch": 0.06762795411618372, "percentage": 6.76, "elapsed_time": "2:17:17", "remaining_time": "1 day, 7:32:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 735, "total_steps": 10853, "loss": 0.2125, "learning_rate": 4.995722687258113e-06, "epoch": 0.06772009029345373, "percentage": 6.77, "elapsed_time": "2:17:28", "remaining_time": "1 day, 7:32:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 736, "total_steps": 10853, "loss": 0.1767, "learning_rate": 4.995678028763172e-06, "epoch": 0.06781222647072373, "percentage": 6.78, "elapsed_time": "2:17:38", "remaining_time": "1 day, 7:32:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 737, "total_steps": 10853, "loss": 0.1896, "learning_rate": 4.995633138544258e-06, "epoch": 0.06790436264799374, "percentage": 6.79, "elapsed_time": "2:17:49", "remaining_time": "1 day, 7:31:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 738, "total_steps": 10853, "loss": 0.1975, "learning_rate": 4.995588016605539e-06, "epoch": 0.06799649882526373, "percentage": 6.8, "elapsed_time": "2:18:01", "remaining_time": "1 day, 7:31:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 739, "total_steps": 10853, "loss": 0.2018, "learning_rate": 4.995542662951203e-06, "epoch": 0.06808863500253375, "percentage": 6.81, "elapsed_time": "2:18:12", "remaining_time": "1 day, 7:31:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 740, "total_steps": 10853, "loss": 0.2105, "learning_rate": 4.9954970775854626e-06, "epoch": 0.06818077117980376, "percentage": 6.82, "elapsed_time": "2:18:23", "remaining_time": "1 day, 7:31:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 741, "total_steps": 10853, "loss": 0.1922, "learning_rate": 4.99545126051255e-06, "epoch": 0.06827290735707375, "percentage": 6.83, "elapsed_time": "2:18:33", "remaining_time": "1 day, 7:30:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 742, "total_steps": 10853, "loss": 0.2023, "learning_rate": 4.99540521173672e-06, "epoch": 0.06836504353434376, "percentage": 6.84, "elapsed_time": "2:18:44", "remaining_time": "1 day, 7:30:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 743, "total_steps": 10853, "loss": 0.1969, "learning_rate": 4.995358931262246e-06, "epoch": 0.06845717971161376, "percentage": 6.85, "elapsed_time": "2:18:55", "remaining_time": "1 day, 7:30:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 744, "total_steps": 10853, "loss": 0.2191, "learning_rate": 4.995312419093427e-06, "epoch": 0.06854931588888377, "percentage": 6.86, "elapsed_time": "2:19:05", "remaining_time": "1 day, 7:29:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 745, "total_steps": 10853, "loss": 0.1987, "learning_rate": 4.995265675234583e-06, "epoch": 0.06864145206615377, "percentage": 6.86, "elapsed_time": "2:19:16", "remaining_time": "1 day, 7:29:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 746, "total_steps": 10853, "loss": 0.209, "learning_rate": 4.995218699690051e-06, "epoch": 0.06873358824342378, "percentage": 6.87, "elapsed_time": "2:19:26", "remaining_time": "1 day, 7:29:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 747, "total_steps": 10853, "loss": 0.1994, "learning_rate": 4.995171492464195e-06, "epoch": 0.06882572442069379, "percentage": 6.88, "elapsed_time": "2:19:37", "remaining_time": "1 day, 7:28:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 748, "total_steps": 10853, "loss": 0.2027, "learning_rate": 4.995124053561396e-06, "epoch": 0.06891786059796379, "percentage": 6.89, "elapsed_time": "2:19:47", "remaining_time": "1 day, 7:28:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 749, "total_steps": 10853, "loss": 0.1868, "learning_rate": 4.9950763829860615e-06, "epoch": 0.0690099967752338, "percentage": 6.9, "elapsed_time": "2:19:59", "remaining_time": "1 day, 7:28:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 750, "total_steps": 10853, "loss": 0.1966, "learning_rate": 4.995028480742616e-06, "epoch": 0.0691021329525038, "percentage": 6.91, "elapsed_time": "2:20:09", "remaining_time": "1 day, 7:28:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 751, "total_steps": 10853, "loss": 0.1893, "learning_rate": 4.9949803468355075e-06, "epoch": 0.0691942691297738, "percentage": 6.92, "elapsed_time": "2:20:19", "remaining_time": "1 day, 7:27:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 752, "total_steps": 10853, "loss": 0.2112, "learning_rate": 4.994931981269206e-06, "epoch": 0.06928640530704382, "percentage": 6.93, "elapsed_time": "2:20:30", "remaining_time": "1 day, 7:27:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 753, "total_steps": 10853, "loss": 0.1965, "learning_rate": 4.9948833840482e-06, "epoch": 0.06937854148431381, "percentage": 6.94, "elapsed_time": "2:20:41", "remaining_time": "1 day, 7:27:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 754, "total_steps": 10853, "loss": 0.2011, "learning_rate": 4.994834555177004e-06, "epoch": 0.06947067766158382, "percentage": 6.95, "elapsed_time": "2:20:52", "remaining_time": "1 day, 7:26:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 755, "total_steps": 10853, "loss": 0.2018, "learning_rate": 4.994785494660151e-06, "epoch": 0.06956281383885382, "percentage": 6.96, "elapsed_time": "2:21:02", "remaining_time": "1 day, 7:26:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 756, "total_steps": 10853, "loss": 0.2266, "learning_rate": 4.994736202502196e-06, "epoch": 0.06965495001612383, "percentage": 6.97, "elapsed_time": "2:21:13", "remaining_time": "1 day, 7:26:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 757, "total_steps": 10853, "loss": 0.2197, "learning_rate": 4.994686678707716e-06, "epoch": 0.06974708619339384, "percentage": 6.98, "elapsed_time": "2:21:22", "remaining_time": "1 day, 7:25:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 758, "total_steps": 10853, "loss": 0.1926, "learning_rate": 4.9946369232813104e-06, "epoch": 0.06983922237066384, "percentage": 6.98, "elapsed_time": "2:21:33", "remaining_time": "1 day, 7:25:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 759, "total_steps": 10853, "loss": 0.1856, "learning_rate": 4.994586936227598e-06, "epoch": 0.06993135854793385, "percentage": 6.99, "elapsed_time": "2:21:43", "remaining_time": "1 day, 7:24:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 760, "total_steps": 10853, "loss": 0.1985, "learning_rate": 4.99453671755122e-06, "epoch": 0.07002349472520385, "percentage": 7.0, "elapsed_time": "2:21:55", "remaining_time": "1 day, 7:24:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 761, "total_steps": 10853, "loss": 0.2043, "learning_rate": 4.994486267256839e-06, "epoch": 0.07011563090247386, "percentage": 7.01, "elapsed_time": "2:22:06", "remaining_time": "1 day, 7:24:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 762, "total_steps": 10853, "loss": 0.1854, "learning_rate": 4.994435585349139e-06, "epoch": 0.07020776707974385, "percentage": 7.02, "elapsed_time": "2:22:17", "remaining_time": "1 day, 7:24:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 763, "total_steps": 10853, "loss": 0.194, "learning_rate": 4.994384671832827e-06, "epoch": 0.07029990325701387, "percentage": 7.03, "elapsed_time": "2:22:27", "remaining_time": "1 day, 7:23:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 764, "total_steps": 10853, "loss": 0.2038, "learning_rate": 4.994333526712629e-06, "epoch": 0.07039203943428388, "percentage": 7.04, "elapsed_time": "2:22:38", "remaining_time": "1 day, 7:23:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 765, "total_steps": 10853, "loss": 0.1941, "learning_rate": 4.994282149993296e-06, "epoch": 0.07048417561155387, "percentage": 7.05, "elapsed_time": "2:22:50", "remaining_time": "1 day, 7:23:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 766, "total_steps": 10853, "loss": 0.1952, "learning_rate": 4.994230541679596e-06, "epoch": 0.07057631178882388, "percentage": 7.06, "elapsed_time": "2:23:00", "remaining_time": "1 day, 7:23:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 767, "total_steps": 10853, "loss": 0.1973, "learning_rate": 4.994178701776322e-06, "epoch": 0.07066844796609388, "percentage": 7.07, "elapsed_time": "2:23:11", "remaining_time": "1 day, 7:22:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 768, "total_steps": 10853, "loss": 0.1998, "learning_rate": 4.994126630288287e-06, "epoch": 0.07076058414336389, "percentage": 7.08, "elapsed_time": "2:23:21", "remaining_time": "1 day, 7:22:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 769, "total_steps": 10853, "loss": 0.1912, "learning_rate": 4.994074327220326e-06, "epoch": 0.0708527203206339, "percentage": 7.09, "elapsed_time": "2:23:31", "remaining_time": "1 day, 7:22:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 770, "total_steps": 10853, "loss": 0.1996, "learning_rate": 4.994021792577296e-06, "epoch": 0.0709448564979039, "percentage": 7.09, "elapsed_time": "2:23:42", "remaining_time": "1 day, 7:21:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 771, "total_steps": 10853, "loss": 0.2068, "learning_rate": 4.993969026364074e-06, "epoch": 0.07103699267517391, "percentage": 7.1, "elapsed_time": "2:23:53", "remaining_time": "1 day, 7:21:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 772, "total_steps": 10853, "loss": 0.198, "learning_rate": 4.993916028585559e-06, "epoch": 0.0711291288524439, "percentage": 7.11, "elapsed_time": "2:24:03", "remaining_time": "1 day, 7:21:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 773, "total_steps": 10853, "loss": 0.1984, "learning_rate": 4.993862799246672e-06, "epoch": 0.07122126502971392, "percentage": 7.12, "elapsed_time": "2:24:13", "remaining_time": "1 day, 7:20:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 774, "total_steps": 10853, "loss": 0.2117, "learning_rate": 4.9938093383523565e-06, "epoch": 0.07131340120698393, "percentage": 7.13, "elapsed_time": "2:24:24", "remaining_time": "1 day, 7:20:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 775, "total_steps": 10853, "loss": 0.2116, "learning_rate": 4.993755645907575e-06, "epoch": 0.07140553738425393, "percentage": 7.14, "elapsed_time": "2:24:36", "remaining_time": "1 day, 7:20:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 776, "total_steps": 10853, "loss": 0.2012, "learning_rate": 4.993701721917314e-06, "epoch": 0.07149767356152394, "percentage": 7.15, "elapsed_time": "2:24:46", "remaining_time": "1 day, 7:20:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 777, "total_steps": 10853, "loss": 0.2059, "learning_rate": 4.993647566386579e-06, "epoch": 0.07158980973879393, "percentage": 7.16, "elapsed_time": "2:24:57", "remaining_time": "1 day, 7:19:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 778, "total_steps": 10853, "loss": 0.1983, "learning_rate": 4.993593179320399e-06, "epoch": 0.07168194591606394, "percentage": 7.17, "elapsed_time": "2:25:07", "remaining_time": "1 day, 7:19:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 779, "total_steps": 10853, "loss": 0.2079, "learning_rate": 4.993538560723824e-06, "epoch": 0.07177408209333394, "percentage": 7.18, "elapsed_time": "2:25:20", "remaining_time": "1 day, 7:19:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 780, "total_steps": 10853, "loss": 0.2136, "learning_rate": 4.993483710601926e-06, "epoch": 0.07186621827060395, "percentage": 7.19, "elapsed_time": "2:25:31", "remaining_time": "1 day, 7:19:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 781, "total_steps": 10853, "loss": 0.1913, "learning_rate": 4.993428628959796e-06, "epoch": 0.07195835444787396, "percentage": 7.2, "elapsed_time": "2:25:40", "remaining_time": "1 day, 7:18:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 782, "total_steps": 10853, "loss": 0.201, "learning_rate": 4.993373315802551e-06, "epoch": 0.07205049062514396, "percentage": 7.21, "elapsed_time": "2:25:50", "remaining_time": "1 day, 7:18:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 783, "total_steps": 10853, "loss": 0.1903, "learning_rate": 4.993317771135324e-06, "epoch": 0.07214262680241397, "percentage": 7.21, "elapsed_time": "2:26:02", "remaining_time": "1 day, 7:18:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 784, "total_steps": 10853, "loss": 0.2212, "learning_rate": 4.993261994963275e-06, "epoch": 0.07223476297968397, "percentage": 7.22, "elapsed_time": "2:26:12", "remaining_time": "1 day, 7:17:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 785, "total_steps": 10853, "loss": 0.1948, "learning_rate": 4.99320598729158e-06, "epoch": 0.07232689915695398, "percentage": 7.23, "elapsed_time": "2:26:23", "remaining_time": "1 day, 7:17:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 786, "total_steps": 10853, "loss": 0.1928, "learning_rate": 4.993149748125441e-06, "epoch": 0.07241903533422399, "percentage": 7.24, "elapsed_time": "2:26:33", "remaining_time": "1 day, 7:17:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 787, "total_steps": 10853, "loss": 0.1938, "learning_rate": 4.99309327747008e-06, "epoch": 0.07251117151149399, "percentage": 7.25, "elapsed_time": "2:26:44", "remaining_time": "1 day, 7:16:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 788, "total_steps": 10853, "loss": 0.2087, "learning_rate": 4.99303657533074e-06, "epoch": 0.072603307688764, "percentage": 7.26, "elapsed_time": "2:26:55", "remaining_time": "1 day, 7:16:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 789, "total_steps": 10853, "loss": 0.2004, "learning_rate": 4.9929796417126855e-06, "epoch": 0.07269544386603399, "percentage": 7.27, "elapsed_time": "2:27:05", "remaining_time": "1 day, 7:16:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 790, "total_steps": 10853, "loss": 0.1968, "learning_rate": 4.992922476621203e-06, "epoch": 0.072787580043304, "percentage": 7.28, "elapsed_time": "2:27:16", "remaining_time": "1 day, 7:16:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 791, "total_steps": 10853, "loss": 0.2078, "learning_rate": 4.992865080061599e-06, "epoch": 0.07287971622057401, "percentage": 7.29, "elapsed_time": "2:27:27", "remaining_time": "1 day, 7:15:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 792, "total_steps": 10853, "loss": 0.2075, "learning_rate": 4.992807452039206e-06, "epoch": 0.07297185239784401, "percentage": 7.3, "elapsed_time": "2:27:39", "remaining_time": "1 day, 7:15:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 793, "total_steps": 10853, "loss": 0.2064, "learning_rate": 4.992749592559372e-06, "epoch": 0.07306398857511402, "percentage": 7.31, "elapsed_time": "2:27:51", "remaining_time": "1 day, 7:15:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 794, "total_steps": 10853, "loss": 0.2035, "learning_rate": 4.99269150162747e-06, "epoch": 0.07315612475238402, "percentage": 7.32, "elapsed_time": "2:28:02", "remaining_time": "1 day, 7:15:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 795, "total_steps": 10853, "loss": 0.2013, "learning_rate": 4.9926331792488935e-06, "epoch": 0.07324826092965403, "percentage": 7.33, "elapsed_time": "2:28:13", "remaining_time": "1 day, 7:15:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 796, "total_steps": 10853, "loss": 0.1991, "learning_rate": 4.992574625429059e-06, "epoch": 0.07334039710692403, "percentage": 7.33, "elapsed_time": "2:28:23", "remaining_time": "1 day, 7:14:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 797, "total_steps": 10853, "loss": 0.205, "learning_rate": 4.992515840173401e-06, "epoch": 0.07343253328419404, "percentage": 7.34, "elapsed_time": "2:28:34", "remaining_time": "1 day, 7:14:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 798, "total_steps": 10853, "loss": 0.2123, "learning_rate": 4.992456823487381e-06, "epoch": 0.07352466946146405, "percentage": 7.35, "elapsed_time": "2:28:45", "remaining_time": "1 day, 7:14:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 799, "total_steps": 10853, "loss": 0.206, "learning_rate": 4.992397575376474e-06, "epoch": 0.07361680563873405, "percentage": 7.36, "elapsed_time": "2:28:57", "remaining_time": "1 day, 7:14:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 800, "total_steps": 10853, "loss": 0.1954, "learning_rate": 4.992338095846185e-06, "epoch": 0.07370894181600406, "percentage": 7.37, "elapsed_time": "2:29:08", "remaining_time": "1 day, 7:14:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 801, "total_steps": 10853, "loss": 0.1823, "learning_rate": 4.992278384902036e-06, "epoch": 0.07380107799327405, "percentage": 7.38, "elapsed_time": "2:29:18", "remaining_time": "1 day, 7:13:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 802, "total_steps": 10853, "loss": 0.1972, "learning_rate": 4.992218442549571e-06, "epoch": 0.07389321417054406, "percentage": 7.39, "elapsed_time": "2:29:29", "remaining_time": "1 day, 7:13:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 803, "total_steps": 10853, "loss": 0.174, "learning_rate": 4.992158268794355e-06, "epoch": 0.07398535034781407, "percentage": 7.4, "elapsed_time": "2:29:39", "remaining_time": "1 day, 7:13:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 804, "total_steps": 10853, "loss": 0.1921, "learning_rate": 4.992097863641975e-06, "epoch": 0.07407748652508407, "percentage": 7.41, "elapsed_time": "2:29:50", "remaining_time": "1 day, 7:12:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 805, "total_steps": 10853, "loss": 0.2003, "learning_rate": 4.992037227098041e-06, "epoch": 0.07416962270235408, "percentage": 7.42, "elapsed_time": "2:30:01", "remaining_time": "1 day, 7:12:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 806, "total_steps": 10853, "loss": 0.2154, "learning_rate": 4.991976359168182e-06, "epoch": 0.07426175887962408, "percentage": 7.43, "elapsed_time": "2:30:11", "remaining_time": "1 day, 7:12:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 807, "total_steps": 10853, "loss": 0.2022, "learning_rate": 4.99191525985805e-06, "epoch": 0.07435389505689409, "percentage": 7.44, "elapsed_time": "2:30:23", "remaining_time": "1 day, 7:12:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 808, "total_steps": 10853, "loss": 0.1988, "learning_rate": 4.991853929173318e-06, "epoch": 0.0744460312341641, "percentage": 7.44, "elapsed_time": "2:30:36", "remaining_time": "1 day, 7:12:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 809, "total_steps": 10853, "loss": 0.1876, "learning_rate": 4.99179236711968e-06, "epoch": 0.0745381674114341, "percentage": 7.45, "elapsed_time": "2:30:45", "remaining_time": "1 day, 7:11:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 810, "total_steps": 10853, "loss": 0.1909, "learning_rate": 4.991730573702852e-06, "epoch": 0.07463030358870411, "percentage": 7.46, "elapsed_time": "2:30:57", "remaining_time": "1 day, 7:11:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 811, "total_steps": 10853, "loss": 0.2195, "learning_rate": 4.991668548928573e-06, "epoch": 0.0747224397659741, "percentage": 7.47, "elapsed_time": "2:31:09", "remaining_time": "1 day, 7:11:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 812, "total_steps": 10853, "loss": 0.2199, "learning_rate": 4.991606292802601e-06, "epoch": 0.07481457594324412, "percentage": 7.48, "elapsed_time": "2:31:20", "remaining_time": "1 day, 7:11:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 813, "total_steps": 10853, "loss": 0.2144, "learning_rate": 4.991543805330716e-06, "epoch": 0.07490671212051413, "percentage": 7.49, "elapsed_time": "2:31:32", "remaining_time": "1 day, 7:11:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 814, "total_steps": 10853, "loss": 0.1924, "learning_rate": 4.991481086518721e-06, "epoch": 0.07499884829778412, "percentage": 7.5, "elapsed_time": "2:31:43", "remaining_time": "1 day, 7:11:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 815, "total_steps": 10853, "loss": 0.1979, "learning_rate": 4.9914181363724394e-06, "epoch": 0.07509098447505413, "percentage": 7.51, "elapsed_time": "2:31:53", "remaining_time": "1 day, 7:10:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 816, "total_steps": 10853, "loss": 0.2131, "learning_rate": 4.991354954897715e-06, "epoch": 0.07518312065232413, "percentage": 7.52, "elapsed_time": "2:32:04", "remaining_time": "1 day, 7:10:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 817, "total_steps": 10853, "loss": 0.207, "learning_rate": 4.991291542100416e-06, "epoch": 0.07527525682959414, "percentage": 7.53, "elapsed_time": "2:32:15", "remaining_time": "1 day, 7:10:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 818, "total_steps": 10853, "loss": 0.1917, "learning_rate": 4.991227897986428e-06, "epoch": 0.07536739300686414, "percentage": 7.54, "elapsed_time": "2:32:25", "remaining_time": "1 day, 7:09:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 819, "total_steps": 10853, "loss": 0.2016, "learning_rate": 4.991164022561662e-06, "epoch": 0.07545952918413415, "percentage": 7.55, "elapsed_time": "2:32:35", "remaining_time": "1 day, 7:09:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 820, "total_steps": 10853, "loss": 0.1846, "learning_rate": 4.991099915832048e-06, "epoch": 0.07555166536140416, "percentage": 7.56, "elapsed_time": "2:32:45", "remaining_time": "1 day, 7:09:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 821, "total_steps": 10853, "loss": 0.2127, "learning_rate": 4.9910355778035394e-06, "epoch": 0.07564380153867416, "percentage": 7.56, "elapsed_time": "2:32:56", "remaining_time": "1 day, 7:08:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 822, "total_steps": 10853, "loss": 0.1968, "learning_rate": 4.990971008482109e-06, "epoch": 0.07573593771594417, "percentage": 7.57, "elapsed_time": "2:33:05", "remaining_time": "1 day, 7:08:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 823, "total_steps": 10853, "loss": 0.1904, "learning_rate": 4.990906207873753e-06, "epoch": 0.07582807389321417, "percentage": 7.58, "elapsed_time": "2:33:15", "remaining_time": "1 day, 7:07:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 824, "total_steps": 10853, "loss": 0.2, "learning_rate": 4.990841175984486e-06, "epoch": 0.07592021007048418, "percentage": 7.59, "elapsed_time": "2:33:27", "remaining_time": "1 day, 7:07:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 825, "total_steps": 10853, "loss": 0.1958, "learning_rate": 4.9907759128203485e-06, "epoch": 0.07601234624775419, "percentage": 7.6, "elapsed_time": "2:33:38", "remaining_time": "1 day, 7:07:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 826, "total_steps": 10853, "loss": 0.1939, "learning_rate": 4.9907104183874e-06, "epoch": 0.07610448242502418, "percentage": 7.61, "elapsed_time": "2:33:49", "remaining_time": "1 day, 7:07:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 827, "total_steps": 10853, "loss": 0.1983, "learning_rate": 4.990644692691721e-06, "epoch": 0.0761966186022942, "percentage": 7.62, "elapsed_time": "2:33:59", "remaining_time": "1 day, 7:06:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 828, "total_steps": 10853, "loss": 0.1936, "learning_rate": 4.990578735739413e-06, "epoch": 0.07628875477956419, "percentage": 7.63, "elapsed_time": "2:34:09", "remaining_time": "1 day, 7:06:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 829, "total_steps": 10853, "loss": 0.196, "learning_rate": 4.990512547536602e-06, "epoch": 0.0763808909568342, "percentage": 7.64, "elapsed_time": "2:34:20", "remaining_time": "1 day, 7:06:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 830, "total_steps": 10853, "loss": 0.1939, "learning_rate": 4.990446128089434e-06, "epoch": 0.07647302713410421, "percentage": 7.65, "elapsed_time": "2:34:31", "remaining_time": "1 day, 7:05:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 831, "total_steps": 10853, "loss": 0.1973, "learning_rate": 4.990379477404073e-06, "epoch": 0.07656516331137421, "percentage": 7.66, "elapsed_time": "2:34:42", "remaining_time": "1 day, 7:05:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 832, "total_steps": 10853, "loss": 0.2066, "learning_rate": 4.9903125954867114e-06, "epoch": 0.07665729948864422, "percentage": 7.67, "elapsed_time": "2:34:54", "remaining_time": "1 day, 7:05:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 833, "total_steps": 10853, "loss": 0.1749, "learning_rate": 4.990245482343556e-06, "epoch": 0.07674943566591422, "percentage": 7.68, "elapsed_time": "2:35:03", "remaining_time": "1 day, 7:05:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 834, "total_steps": 10853, "loss": 0.2042, "learning_rate": 4.990178137980841e-06, "epoch": 0.07684157184318423, "percentage": 7.68, "elapsed_time": "2:35:15", "remaining_time": "1 day, 7:05:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 835, "total_steps": 10853, "loss": 0.1887, "learning_rate": 4.990110562404817e-06, "epoch": 0.07693370802045423, "percentage": 7.69, "elapsed_time": "2:35:26", "remaining_time": "1 day, 7:04:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 836, "total_steps": 10853, "loss": 0.1925, "learning_rate": 4.990042755621759e-06, "epoch": 0.07702584419772424, "percentage": 7.7, "elapsed_time": "2:35:36", "remaining_time": "1 day, 7:04:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 837, "total_steps": 10853, "loss": 0.1917, "learning_rate": 4.989974717637963e-06, "epoch": 0.07711798037499425, "percentage": 7.71, "elapsed_time": "2:35:46", "remaining_time": "1 day, 7:04:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 838, "total_steps": 10853, "loss": 0.2083, "learning_rate": 4.989906448459748e-06, "epoch": 0.07721011655226424, "percentage": 7.72, "elapsed_time": "2:35:57", "remaining_time": "1 day, 7:03:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 839, "total_steps": 10853, "loss": 0.1941, "learning_rate": 4.98983794809345e-06, "epoch": 0.07730225272953425, "percentage": 7.73, "elapsed_time": "2:36:08", "remaining_time": "1 day, 7:03:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 840, "total_steps": 10853, "loss": 0.1952, "learning_rate": 4.989769216545431e-06, "epoch": 0.07739438890680425, "percentage": 7.74, "elapsed_time": "2:36:18", "remaining_time": "1 day, 7:03:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 841, "total_steps": 10853, "loss": 0.1889, "learning_rate": 4.9897002538220715e-06, "epoch": 0.07748652508407426, "percentage": 7.75, "elapsed_time": "2:36:29", "remaining_time": "1 day, 7:03:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 842, "total_steps": 10853, "loss": 0.2183, "learning_rate": 4.989631059929777e-06, "epoch": 0.07757866126134427, "percentage": 7.76, "elapsed_time": "2:36:42", "remaining_time": "1 day, 7:03:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 843, "total_steps": 10853, "loss": 0.1995, "learning_rate": 4.989561634874969e-06, "epoch": 0.07767079743861427, "percentage": 7.77, "elapsed_time": "2:36:52", "remaining_time": "1 day, 7:02:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 844, "total_steps": 10853, "loss": 0.2053, "learning_rate": 4.9894919786640964e-06, "epoch": 0.07776293361588428, "percentage": 7.78, "elapsed_time": "2:37:02", "remaining_time": "1 day, 7:02:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 845, "total_steps": 10853, "loss": 0.1962, "learning_rate": 4.989422091303625e-06, "epoch": 0.07785506979315428, "percentage": 7.79, "elapsed_time": "2:37:11", "remaining_time": "1 day, 7:01:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 846, "total_steps": 10853, "loss": 0.2039, "learning_rate": 4.989351972800045e-06, "epoch": 0.07794720597042429, "percentage": 7.8, "elapsed_time": "2:37:23", "remaining_time": "1 day, 7:01:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 847, "total_steps": 10853, "loss": 0.205, "learning_rate": 4.989281623159866e-06, "epoch": 0.0780393421476943, "percentage": 7.8, "elapsed_time": "2:37:35", "remaining_time": "1 day, 7:01:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 848, "total_steps": 10853, "loss": 0.2094, "learning_rate": 4.98921104238962e-06, "epoch": 0.0781314783249643, "percentage": 7.81, "elapsed_time": "2:37:46", "remaining_time": "1 day, 7:01:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 849, "total_steps": 10853, "loss": 0.2017, "learning_rate": 4.989140230495862e-06, "epoch": 0.0782236145022343, "percentage": 7.82, "elapsed_time": "2:37:56", "remaining_time": "1 day, 7:01:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 850, "total_steps": 10853, "loss": 0.1959, "learning_rate": 4.989069187485165e-06, "epoch": 0.0783157506795043, "percentage": 7.83, "elapsed_time": "2:38:07", "remaining_time": "1 day, 7:00:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 851, "total_steps": 10853, "loss": 0.1943, "learning_rate": 4.988997913364126e-06, "epoch": 0.07840788685677431, "percentage": 7.84, "elapsed_time": "2:38:18", "remaining_time": "1 day, 7:00:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 852, "total_steps": 10853, "loss": 0.2164, "learning_rate": 4.988926408139363e-06, "epoch": 0.07850002303404431, "percentage": 7.85, "elapsed_time": "2:38:31", "remaining_time": "1 day, 7:00:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 853, "total_steps": 10853, "loss": 0.2032, "learning_rate": 4.988854671817516e-06, "epoch": 0.07859215921131432, "percentage": 7.86, "elapsed_time": "2:38:43", "remaining_time": "1 day, 7:00:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 854, "total_steps": 10853, "loss": 0.1949, "learning_rate": 4.988782704405244e-06, "epoch": 0.07868429538858433, "percentage": 7.87, "elapsed_time": "2:38:54", "remaining_time": "1 day, 7:00:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 855, "total_steps": 10853, "loss": 0.2328, "learning_rate": 4.98871050590923e-06, "epoch": 0.07877643156585433, "percentage": 7.88, "elapsed_time": "2:39:05", "remaining_time": "1 day, 7:00:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 856, "total_steps": 10853, "loss": 0.2011, "learning_rate": 4.988638076336178e-06, "epoch": 0.07886856774312434, "percentage": 7.89, "elapsed_time": "2:39:14", "remaining_time": "1 day, 6:59:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 857, "total_steps": 10853, "loss": 0.2067, "learning_rate": 4.988565415692812e-06, "epoch": 0.07896070392039434, "percentage": 7.9, "elapsed_time": "2:39:24", "remaining_time": "1 day, 6:59:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 858, "total_steps": 10853, "loss": 0.1788, "learning_rate": 4.988492523985881e-06, "epoch": 0.07905284009766435, "percentage": 7.91, "elapsed_time": "2:39:33", "remaining_time": "1 day, 6:58:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 859, "total_steps": 10853, "loss": 0.2019, "learning_rate": 4.9884194012221496e-06, "epoch": 0.07914497627493436, "percentage": 7.91, "elapsed_time": "2:39:44", "remaining_time": "1 day, 6:58:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 860, "total_steps": 10853, "loss": 0.2019, "learning_rate": 4.98834604740841e-06, "epoch": 0.07923711245220436, "percentage": 7.92, "elapsed_time": "2:39:54", "remaining_time": "1 day, 6:58:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 861, "total_steps": 10853, "loss": 0.204, "learning_rate": 4.988272462551471e-06, "epoch": 0.07932924862947437, "percentage": 7.93, "elapsed_time": "2:40:07", "remaining_time": "1 day, 6:58:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 862, "total_steps": 10853, "loss": 0.1809, "learning_rate": 4.988198646658167e-06, "epoch": 0.07942138480674436, "percentage": 7.94, "elapsed_time": "2:40:19", "remaining_time": "1 day, 6:58:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 863, "total_steps": 10853, "loss": 0.2129, "learning_rate": 4.988124599735351e-06, "epoch": 0.07951352098401437, "percentage": 7.95, "elapsed_time": "2:40:31", "remaining_time": "1 day, 6:58:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 864, "total_steps": 10853, "loss": 0.1985, "learning_rate": 4.988050321789898e-06, "epoch": 0.07960565716128438, "percentage": 7.96, "elapsed_time": "2:40:42", "remaining_time": "1 day, 6:58:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 865, "total_steps": 10853, "loss": 0.1924, "learning_rate": 4.987975812828704e-06, "epoch": 0.07969779333855438, "percentage": 7.97, "elapsed_time": "2:40:52", "remaining_time": "1 day, 6:57:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 866, "total_steps": 10853, "loss": 0.1946, "learning_rate": 4.987901072858689e-06, "epoch": 0.07978992951582439, "percentage": 7.98, "elapsed_time": "2:41:03", "remaining_time": "1 day, 6:57:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 867, "total_steps": 10853, "loss": 0.2062, "learning_rate": 4.9878261018867915e-06, "epoch": 0.07988206569309439, "percentage": 7.99, "elapsed_time": "2:41:13", "remaining_time": "1 day, 6:57:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 868, "total_steps": 10853, "loss": 0.215, "learning_rate": 4.9877508999199724e-06, "epoch": 0.0799742018703644, "percentage": 8.0, "elapsed_time": "2:41:24", "remaining_time": "1 day, 6:56:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 869, "total_steps": 10853, "loss": 0.1872, "learning_rate": 4.987675466965215e-06, "epoch": 0.0800663380476344, "percentage": 8.01, "elapsed_time": "2:41:34", "remaining_time": "1 day, 6:56:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 870, "total_steps": 10853, "loss": 0.2051, "learning_rate": 4.987599803029522e-06, "epoch": 0.08015847422490441, "percentage": 8.02, "elapsed_time": "2:41:44", "remaining_time": "1 day, 6:55:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 871, "total_steps": 10853, "loss": 0.1988, "learning_rate": 4.98752390811992e-06, "epoch": 0.08025061040217442, "percentage": 8.03, "elapsed_time": "2:41:55", "remaining_time": "1 day, 6:55:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 872, "total_steps": 10853, "loss": 0.2103, "learning_rate": 4.987447782243456e-06, "epoch": 0.08034274657944442, "percentage": 8.03, "elapsed_time": "2:42:07", "remaining_time": "1 day, 6:55:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 873, "total_steps": 10853, "loss": 0.2106, "learning_rate": 4.9873714254071966e-06, "epoch": 0.08043488275671443, "percentage": 8.04, "elapsed_time": "2:42:16", "remaining_time": "1 day, 6:55:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 874, "total_steps": 10853, "loss": 0.2056, "learning_rate": 4.987294837618233e-06, "epoch": 0.08052701893398442, "percentage": 8.05, "elapsed_time": "2:42:27", "remaining_time": "1 day, 6:54:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 875, "total_steps": 10853, "loss": 0.2022, "learning_rate": 4.987218018883676e-06, "epoch": 0.08061915511125443, "percentage": 8.06, "elapsed_time": "2:42:39", "remaining_time": "1 day, 6:54:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 876, "total_steps": 10853, "loss": 0.2053, "learning_rate": 4.987140969210659e-06, "epoch": 0.08071129128852444, "percentage": 8.07, "elapsed_time": "2:42:49", "remaining_time": "1 day, 6:54:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 877, "total_steps": 10853, "loss": 0.2054, "learning_rate": 4.987063688606335e-06, "epoch": 0.08080342746579444, "percentage": 8.08, "elapsed_time": "2:42:59", "remaining_time": "1 day, 6:54:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 878, "total_steps": 10853, "loss": 0.1949, "learning_rate": 4.98698617707788e-06, "epoch": 0.08089556364306445, "percentage": 8.09, "elapsed_time": "2:43:10", "remaining_time": "1 day, 6:53:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 879, "total_steps": 10853, "loss": 0.183, "learning_rate": 4.98690843463249e-06, "epoch": 0.08098769982033445, "percentage": 8.1, "elapsed_time": "2:43:20", "remaining_time": "1 day, 6:53:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 880, "total_steps": 10853, "loss": 0.1962, "learning_rate": 4.986830461277384e-06, "epoch": 0.08107983599760446, "percentage": 8.11, "elapsed_time": "2:43:29", "remaining_time": "1 day, 6:52:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 881, "total_steps": 10853, "loss": 0.2063, "learning_rate": 4.986752257019804e-06, "epoch": 0.08117197217487447, "percentage": 8.12, "elapsed_time": "2:43:39", "remaining_time": "1 day, 6:52:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 882, "total_steps": 10853, "loss": 0.1873, "learning_rate": 4.9866738218670075e-06, "epoch": 0.08126410835214447, "percentage": 8.13, "elapsed_time": "2:43:51", "remaining_time": "1 day, 6:52:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 883, "total_steps": 10853, "loss": 0.1932, "learning_rate": 4.986595155826279e-06, "epoch": 0.08135624452941448, "percentage": 8.14, "elapsed_time": "2:44:00", "remaining_time": "1 day, 6:51:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 884, "total_steps": 10853, "loss": 0.2085, "learning_rate": 4.986516258904923e-06, "epoch": 0.08144838070668448, "percentage": 8.15, "elapsed_time": "2:44:12", "remaining_time": "1 day, 6:51:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 885, "total_steps": 10853, "loss": 0.1957, "learning_rate": 4.986437131110265e-06, "epoch": 0.08154051688395449, "percentage": 8.15, "elapsed_time": "2:44:24", "remaining_time": "1 day, 6:51:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 886, "total_steps": 10853, "loss": 0.2051, "learning_rate": 4.986357772449652e-06, "epoch": 0.08163265306122448, "percentage": 8.16, "elapsed_time": "2:44:34", "remaining_time": "1 day, 6:51:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 887, "total_steps": 10853, "loss": 0.2071, "learning_rate": 4.986278182930452e-06, "epoch": 0.0817247892384945, "percentage": 8.17, "elapsed_time": "2:44:45", "remaining_time": "1 day, 6:51:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 888, "total_steps": 10853, "loss": 0.2049, "learning_rate": 4.986198362560055e-06, "epoch": 0.0818169254157645, "percentage": 8.18, "elapsed_time": "2:44:57", "remaining_time": "1 day, 6:51:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 889, "total_steps": 10853, "loss": 0.1922, "learning_rate": 4.986118311345873e-06, "epoch": 0.0819090615930345, "percentage": 8.19, "elapsed_time": "2:45:08", "remaining_time": "1 day, 6:50:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 890, "total_steps": 10853, "loss": 0.1961, "learning_rate": 4.9860380292953375e-06, "epoch": 0.08200119777030451, "percentage": 8.2, "elapsed_time": "2:45:18", "remaining_time": "1 day, 6:50:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 891, "total_steps": 10853, "loss": 0.2077, "learning_rate": 4.985957516415903e-06, "epoch": 0.08209333394757451, "percentage": 8.21, "elapsed_time": "2:45:30", "remaining_time": "1 day, 6:50:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 892, "total_steps": 10853, "loss": 0.1845, "learning_rate": 4.985876772715047e-06, "epoch": 0.08218547012484452, "percentage": 8.22, "elapsed_time": "2:45:41", "remaining_time": "1 day, 6:50:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 893, "total_steps": 10853, "loss": 0.1991, "learning_rate": 4.985795798200265e-06, "epoch": 0.08227760630211453, "percentage": 8.23, "elapsed_time": "2:45:53", "remaining_time": "1 day, 6:50:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 894, "total_steps": 10853, "loss": 0.2053, "learning_rate": 4.9857145928790745e-06, "epoch": 0.08236974247938453, "percentage": 8.24, "elapsed_time": "2:46:04", "remaining_time": "1 day, 6:50:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 895, "total_steps": 10853, "loss": 0.2075, "learning_rate": 4.9856331567590175e-06, "epoch": 0.08246187865665454, "percentage": 8.25, "elapsed_time": "2:46:16", "remaining_time": "1 day, 6:49:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 896, "total_steps": 10853, "loss": 0.1784, "learning_rate": 4.985551489847654e-06, "epoch": 0.08255401483392454, "percentage": 8.26, "elapsed_time": "2:46:26", "remaining_time": "1 day, 6:49:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 897, "total_steps": 10853, "loss": 0.1867, "learning_rate": 4.985469592152567e-06, "epoch": 0.08264615101119455, "percentage": 8.26, "elapsed_time": "2:46:37", "remaining_time": "1 day, 6:49:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 898, "total_steps": 10853, "loss": 0.1986, "learning_rate": 4.985387463681361e-06, "epoch": 0.08273828718846456, "percentage": 8.27, "elapsed_time": "2:46:48", "remaining_time": "1 day, 6:49:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 899, "total_steps": 10853, "loss": 0.2064, "learning_rate": 4.985305104441661e-06, "epoch": 0.08283042336573455, "percentage": 8.28, "elapsed_time": "2:46:58", "remaining_time": "1 day, 6:48:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 900, "total_steps": 10853, "loss": 0.2084, "learning_rate": 4.9852225144411156e-06, "epoch": 0.08292255954300456, "percentage": 8.29, "elapsed_time": "2:47:09", "remaining_time": "1 day, 6:48:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 901, "total_steps": 10853, "loss": 0.1888, "learning_rate": 4.985139693687392e-06, "epoch": 0.08301469572027456, "percentage": 8.3, "elapsed_time": "2:47:19", "remaining_time": "1 day, 6:48:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 902, "total_steps": 10853, "loss": 0.2017, "learning_rate": 4.985056642188179e-06, "epoch": 0.08310683189754457, "percentage": 8.31, "elapsed_time": "2:47:30", "remaining_time": "1 day, 6:47:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 903, "total_steps": 10853, "loss": 0.1815, "learning_rate": 4.984973359951192e-06, "epoch": 0.08319896807481457, "percentage": 8.32, "elapsed_time": "2:47:40", "remaining_time": "1 day, 6:47:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 904, "total_steps": 10853, "loss": 0.188, "learning_rate": 4.984889846984159e-06, "epoch": 0.08329110425208458, "percentage": 8.33, "elapsed_time": "2:47:51", "remaining_time": "1 day, 6:47:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 905, "total_steps": 10853, "loss": 0.1874, "learning_rate": 4.984806103294837e-06, "epoch": 0.08338324042935459, "percentage": 8.34, "elapsed_time": "2:48:03", "remaining_time": "1 day, 6:47:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 906, "total_steps": 10853, "loss": 0.2091, "learning_rate": 4.9847221288910004e-06, "epoch": 0.08347537660662459, "percentage": 8.35, "elapsed_time": "2:48:15", "remaining_time": "1 day, 6:47:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 907, "total_steps": 10853, "loss": 0.1896, "learning_rate": 4.984637923780448e-06, "epoch": 0.0835675127838946, "percentage": 8.36, "elapsed_time": "2:48:24", "remaining_time": "1 day, 6:46:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 908, "total_steps": 10853, "loss": 0.2027, "learning_rate": 4.984553487970995e-06, "epoch": 0.0836596489611646, "percentage": 8.37, "elapsed_time": "2:48:34", "remaining_time": "1 day, 6:46:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 909, "total_steps": 10853, "loss": 0.2009, "learning_rate": 4.984468821470485e-06, "epoch": 0.0837517851384346, "percentage": 8.38, "elapsed_time": "2:48:45", "remaining_time": "1 day, 6:46:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 910, "total_steps": 10853, "loss": 0.2073, "learning_rate": 4.984383924286776e-06, "epoch": 0.08384392131570462, "percentage": 8.38, "elapsed_time": "2:48:56", "remaining_time": "1 day, 6:45:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 911, "total_steps": 10853, "loss": 0.2053, "learning_rate": 4.984298796427754e-06, "epoch": 0.08393605749297461, "percentage": 8.39, "elapsed_time": "2:49:06", "remaining_time": "1 day, 6:45:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 912, "total_steps": 10853, "loss": 0.2053, "learning_rate": 4.984213437901321e-06, "epoch": 0.08402819367024462, "percentage": 8.4, "elapsed_time": "2:49:19", "remaining_time": "1 day, 6:45:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 913, "total_steps": 10853, "loss": 0.2002, "learning_rate": 4.984127848715402e-06, "epoch": 0.08412032984751462, "percentage": 8.41, "elapsed_time": "2:49:29", "remaining_time": "1 day, 6:45:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 914, "total_steps": 10853, "loss": 0.1739, "learning_rate": 4.984042028877945e-06, "epoch": 0.08421246602478463, "percentage": 8.42, "elapsed_time": "2:49:37", "remaining_time": "1 day, 6:44:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 915, "total_steps": 10853, "loss": 0.1952, "learning_rate": 4.983955978396919e-06, "epoch": 0.08430460220205464, "percentage": 8.43, "elapsed_time": "2:49:48", "remaining_time": "1 day, 6:44:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 916, "total_steps": 10853, "loss": 0.2054, "learning_rate": 4.983869697280312e-06, "epoch": 0.08439673837932464, "percentage": 8.44, "elapsed_time": "2:49:59", "remaining_time": "1 day, 6:44:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 917, "total_steps": 10853, "loss": 0.1931, "learning_rate": 4.983783185536137e-06, "epoch": 0.08448887455659465, "percentage": 8.45, "elapsed_time": "2:50:11", "remaining_time": "1 day, 6:44:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 918, "total_steps": 10853, "loss": 0.1876, "learning_rate": 4.983696443172426e-06, "epoch": 0.08458101073386465, "percentage": 8.46, "elapsed_time": "2:50:20", "remaining_time": "1 day, 6:43:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 919, "total_steps": 10853, "loss": 0.1866, "learning_rate": 4.983609470197233e-06, "epoch": 0.08467314691113466, "percentage": 8.47, "elapsed_time": "2:50:30", "remaining_time": "1 day, 6:43:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 920, "total_steps": 10853, "loss": 0.196, "learning_rate": 4.983522266618633e-06, "epoch": 0.08476528308840466, "percentage": 8.48, "elapsed_time": "2:50:39", "remaining_time": "1 day, 6:42:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 921, "total_steps": 10853, "loss": 0.1916, "learning_rate": 4.983434832444724e-06, "epoch": 0.08485741926567467, "percentage": 8.49, "elapsed_time": "2:50:50", "remaining_time": "1 day, 6:42:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 922, "total_steps": 10853, "loss": 0.1942, "learning_rate": 4.983347167683623e-06, "epoch": 0.08494955544294468, "percentage": 8.5, "elapsed_time": "2:51:01", "remaining_time": "1 day, 6:42:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 923, "total_steps": 10853, "loss": 0.1998, "learning_rate": 4.98325927234347e-06, "epoch": 0.08504169162021467, "percentage": 8.5, "elapsed_time": "2:51:12", "remaining_time": "1 day, 6:41:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 924, "total_steps": 10853, "loss": 0.1958, "learning_rate": 4.983171146432427e-06, "epoch": 0.08513382779748468, "percentage": 8.51, "elapsed_time": "2:51:23", "remaining_time": "1 day, 6:41:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 925, "total_steps": 10853, "loss": 0.1969, "learning_rate": 4.983082789958675e-06, "epoch": 0.08522596397475468, "percentage": 8.52, "elapsed_time": "2:51:33", "remaining_time": "1 day, 6:41:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 926, "total_steps": 10853, "loss": 0.1979, "learning_rate": 4.9829942029304194e-06, "epoch": 0.08531810015202469, "percentage": 8.53, "elapsed_time": "2:51:43", "remaining_time": "1 day, 6:40:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 927, "total_steps": 10853, "loss": 0.1971, "learning_rate": 4.982905385355885e-06, "epoch": 0.0854102363292947, "percentage": 8.54, "elapsed_time": "2:51:53", "remaining_time": "1 day, 6:40:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 928, "total_steps": 10853, "loss": 0.199, "learning_rate": 4.982816337243318e-06, "epoch": 0.0855023725065647, "percentage": 8.55, "elapsed_time": "2:52:03", "remaining_time": "1 day, 6:40:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 929, "total_steps": 10853, "loss": 0.1991, "learning_rate": 4.982727058600987e-06, "epoch": 0.08559450868383471, "percentage": 8.56, "elapsed_time": "2:52:13", "remaining_time": "1 day, 6:39:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 930, "total_steps": 10853, "loss": 0.1841, "learning_rate": 4.98263754943718e-06, "epoch": 0.08568664486110471, "percentage": 8.57, "elapsed_time": "2:52:24", "remaining_time": "1 day, 6:39:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 931, "total_steps": 10853, "loss": 0.19, "learning_rate": 4.9825478097602115e-06, "epoch": 0.08577878103837472, "percentage": 8.58, "elapsed_time": "2:52:34", "remaining_time": "1 day, 6:39:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 932, "total_steps": 10853, "loss": 0.1975, "learning_rate": 4.982457839578411e-06, "epoch": 0.08587091721564473, "percentage": 8.59, "elapsed_time": "2:52:44", "remaining_time": "1 day, 6:38:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 933, "total_steps": 10853, "loss": 0.206, "learning_rate": 4.982367638900132e-06, "epoch": 0.08596305339291473, "percentage": 8.6, "elapsed_time": "2:52:55", "remaining_time": "1 day, 6:38:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 934, "total_steps": 10853, "loss": 0.1917, "learning_rate": 4.982277207733751e-06, "epoch": 0.08605518957018474, "percentage": 8.61, "elapsed_time": "2:53:06", "remaining_time": "1 day, 6:38:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 935, "total_steps": 10853, "loss": 0.2101, "learning_rate": 4.982186546087665e-06, "epoch": 0.08614732574745473, "percentage": 8.62, "elapsed_time": "2:53:17", "remaining_time": "1 day, 6:38:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 936, "total_steps": 10853, "loss": 0.1853, "learning_rate": 4.98209565397029e-06, "epoch": 0.08623946192472474, "percentage": 8.62, "elapsed_time": "2:53:27", "remaining_time": "1 day, 6:37:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 937, "total_steps": 10853, "loss": 0.1909, "learning_rate": 4.9820045313900675e-06, "epoch": 0.08633159810199474, "percentage": 8.63, "elapsed_time": "2:53:37", "remaining_time": "1 day, 6:37:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 938, "total_steps": 10853, "loss": 0.1798, "learning_rate": 4.981913178355456e-06, "epoch": 0.08642373427926475, "percentage": 8.64, "elapsed_time": "2:53:47", "remaining_time": "1 day, 6:37:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 939, "total_steps": 10853, "loss": 0.1792, "learning_rate": 4.981821594874939e-06, "epoch": 0.08651587045653476, "percentage": 8.65, "elapsed_time": "2:53:58", "remaining_time": "1 day, 6:36:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 940, "total_steps": 10853, "loss": 0.1908, "learning_rate": 4.981729780957021e-06, "epoch": 0.08660800663380476, "percentage": 8.66, "elapsed_time": "2:54:09", "remaining_time": "1 day, 6:36:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 941, "total_steps": 10853, "loss": 0.182, "learning_rate": 4.981637736610224e-06, "epoch": 0.08670014281107477, "percentage": 8.67, "elapsed_time": "2:54:20", "remaining_time": "1 day, 6:36:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 942, "total_steps": 10853, "loss": 0.1962, "learning_rate": 4.981545461843098e-06, "epoch": 0.08679227898834477, "percentage": 8.68, "elapsed_time": "2:54:31", "remaining_time": "1 day, 6:36:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 943, "total_steps": 10853, "loss": 0.1876, "learning_rate": 4.9814529566642065e-06, "epoch": 0.08688441516561478, "percentage": 8.69, "elapsed_time": "2:54:43", "remaining_time": "1 day, 6:36:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 944, "total_steps": 10853, "loss": 0.1981, "learning_rate": 4.981360221082143e-06, "epoch": 0.08697655134288479, "percentage": 8.7, "elapsed_time": "2:54:54", "remaining_time": "1 day, 6:36:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 945, "total_steps": 10853, "loss": 0.2034, "learning_rate": 4.9812672551055144e-06, "epoch": 0.08706868752015479, "percentage": 8.71, "elapsed_time": "2:55:05", "remaining_time": "1 day, 6:35:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 946, "total_steps": 10853, "loss": 0.201, "learning_rate": 4.981174058742955e-06, "epoch": 0.0871608236974248, "percentage": 8.72, "elapsed_time": "2:55:17", "remaining_time": "1 day, 6:35:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 947, "total_steps": 10853, "loss": 0.211, "learning_rate": 4.981080632003117e-06, "epoch": 0.0872529598746948, "percentage": 8.73, "elapsed_time": "2:55:27", "remaining_time": "1 day, 6:35:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 948, "total_steps": 10853, "loss": 0.1781, "learning_rate": 4.980986974894676e-06, "epoch": 0.0873450960519648, "percentage": 8.73, "elapsed_time": "2:55:39", "remaining_time": "1 day, 6:35:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 949, "total_steps": 10853, "loss": 0.1832, "learning_rate": 4.980893087426326e-06, "epoch": 0.08743723222923482, "percentage": 8.74, "elapsed_time": "2:55:49", "remaining_time": "1 day, 6:34:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 950, "total_steps": 10853, "loss": 0.2071, "learning_rate": 4.980798969606787e-06, "epoch": 0.08752936840650481, "percentage": 8.75, "elapsed_time": "2:55:59", "remaining_time": "1 day, 6:34:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 951, "total_steps": 10853, "loss": 0.1889, "learning_rate": 4.980704621444797e-06, "epoch": 0.08762150458377482, "percentage": 8.76, "elapsed_time": "2:56:10", "remaining_time": "1 day, 6:34:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 952, "total_steps": 10853, "loss": 0.2151, "learning_rate": 4.980610042949115e-06, "epoch": 0.08771364076104482, "percentage": 8.77, "elapsed_time": "2:56:22", "remaining_time": "1 day, 6:34:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 953, "total_steps": 10853, "loss": 0.1894, "learning_rate": 4.980515234128522e-06, "epoch": 0.08780577693831483, "percentage": 8.78, "elapsed_time": "2:56:33", "remaining_time": "1 day, 6:34:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 954, "total_steps": 10853, "loss": 0.1723, "learning_rate": 4.980420194991826e-06, "epoch": 0.08789791311558483, "percentage": 8.79, "elapsed_time": "2:56:44", "remaining_time": "1 day, 6:33:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 955, "total_steps": 10853, "loss": 0.2016, "learning_rate": 4.980324925547845e-06, "epoch": 0.08799004929285484, "percentage": 8.8, "elapsed_time": "2:56:55", "remaining_time": "1 day, 6:33:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 956, "total_steps": 10853, "loss": 0.1948, "learning_rate": 4.980229425805429e-06, "epoch": 0.08808218547012485, "percentage": 8.81, "elapsed_time": "2:57:07", "remaining_time": "1 day, 6:33:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 957, "total_steps": 10853, "loss": 0.1976, "learning_rate": 4.9801336957734435e-06, "epoch": 0.08817432164739485, "percentage": 8.82, "elapsed_time": "2:57:18", "remaining_time": "1 day, 6:33:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 958, "total_steps": 10853, "loss": 0.1884, "learning_rate": 4.980037735460778e-06, "epoch": 0.08826645782466486, "percentage": 8.83, "elapsed_time": "2:57:29", "remaining_time": "1 day, 6:33:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 959, "total_steps": 10853, "loss": 0.1905, "learning_rate": 4.9799415448763414e-06, "epoch": 0.08835859400193485, "percentage": 8.84, "elapsed_time": "2:57:40", "remaining_time": "1 day, 6:33:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 960, "total_steps": 10853, "loss": 0.1997, "learning_rate": 4.979845124029066e-06, "epoch": 0.08845073017920486, "percentage": 8.85, "elapsed_time": "2:57:52", "remaining_time": "1 day, 6:32:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 961, "total_steps": 10853, "loss": 0.1826, "learning_rate": 4.979748472927903e-06, "epoch": 0.08854286635647488, "percentage": 8.85, "elapsed_time": "2:58:04", "remaining_time": "1 day, 6:32:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 962, "total_steps": 10853, "loss": 0.1938, "learning_rate": 4.979651591581829e-06, "epoch": 0.08863500253374487, "percentage": 8.86, "elapsed_time": "2:58:15", "remaining_time": "1 day, 6:32:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 963, "total_steps": 10853, "loss": 0.1979, "learning_rate": 4.979554479999836e-06, "epoch": 0.08872713871101488, "percentage": 8.87, "elapsed_time": "2:58:24", "remaining_time": "1 day, 6:32:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 964, "total_steps": 10853, "loss": 0.1991, "learning_rate": 4.979457138190944e-06, "epoch": 0.08881927488828488, "percentage": 8.88, "elapsed_time": "2:58:36", "remaining_time": "1 day, 6:32:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 965, "total_steps": 10853, "loss": 0.1892, "learning_rate": 4.979359566164189e-06, "epoch": 0.08891141106555489, "percentage": 8.89, "elapsed_time": "2:58:47", "remaining_time": "1 day, 6:32:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 966, "total_steps": 10853, "loss": 0.2088, "learning_rate": 4.979261763928632e-06, "epoch": 0.0890035472428249, "percentage": 8.9, "elapsed_time": "2:58:58", "remaining_time": "1 day, 6:31:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 967, "total_steps": 10853, "loss": 0.2057, "learning_rate": 4.979163731493354e-06, "epoch": 0.0890956834200949, "percentage": 8.91, "elapsed_time": "2:59:08", "remaining_time": "1 day, 6:31:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 968, "total_steps": 10853, "loss": 0.1966, "learning_rate": 4.979065468867456e-06, "epoch": 0.08918781959736491, "percentage": 8.92, "elapsed_time": "2:59:18", "remaining_time": "1 day, 6:31:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 969, "total_steps": 10853, "loss": 0.1893, "learning_rate": 4.978966976060062e-06, "epoch": 0.0892799557746349, "percentage": 8.93, "elapsed_time": "2:59:29", "remaining_time": "1 day, 6:30:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 970, "total_steps": 10853, "loss": 0.1795, "learning_rate": 4.978868253080318e-06, "epoch": 0.08937209195190492, "percentage": 8.94, "elapsed_time": "2:59:39", "remaining_time": "1 day, 6:30:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 971, "total_steps": 10853, "loss": 0.1927, "learning_rate": 4.9787692999373895e-06, "epoch": 0.08946422812917491, "percentage": 8.95, "elapsed_time": "2:59:49", "remaining_time": "1 day, 6:30:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 972, "total_steps": 10853, "loss": 0.1886, "learning_rate": 4.978670116640465e-06, "epoch": 0.08955636430644492, "percentage": 8.96, "elapsed_time": "2:59:59", "remaining_time": "1 day, 6:29:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 973, "total_steps": 10853, "loss": 0.2073, "learning_rate": 4.978570703198754e-06, "epoch": 0.08964850048371494, "percentage": 8.97, "elapsed_time": "3:00:10", "remaining_time": "1 day, 6:29:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 974, "total_steps": 10853, "loss": 0.2001, "learning_rate": 4.978471059621486e-06, "epoch": 0.08974063666098493, "percentage": 8.97, "elapsed_time": "3:00:21", "remaining_time": "1 day, 6:29:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 975, "total_steps": 10853, "loss": 0.1871, "learning_rate": 4.978371185917913e-06, "epoch": 0.08983277283825494, "percentage": 8.98, "elapsed_time": "3:00:31", "remaining_time": "1 day, 6:29:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 976, "total_steps": 10853, "loss": 0.1865, "learning_rate": 4.978271082097309e-06, "epoch": 0.08992490901552494, "percentage": 8.99, "elapsed_time": "3:00:43", "remaining_time": "1 day, 6:28:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 977, "total_steps": 10853, "loss": 0.1827, "learning_rate": 4.978170748168968e-06, "epoch": 0.09001704519279495, "percentage": 9.0, "elapsed_time": "3:00:53", "remaining_time": "1 day, 6:28:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 978, "total_steps": 10853, "loss": 0.1955, "learning_rate": 4.978070184142207e-06, "epoch": 0.09010918137006496, "percentage": 9.01, "elapsed_time": "3:01:03", "remaining_time": "1 day, 6:28:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 979, "total_steps": 10853, "loss": 0.1902, "learning_rate": 4.977969390026362e-06, "epoch": 0.09020131754733496, "percentage": 9.02, "elapsed_time": "3:01:14", "remaining_time": "1 day, 6:28:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 980, "total_steps": 10853, "loss": 0.1904, "learning_rate": 4.9778683658307925e-06, "epoch": 0.09029345372460497, "percentage": 9.03, "elapsed_time": "3:01:23", "remaining_time": "1 day, 6:27:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 981, "total_steps": 10853, "loss": 0.1922, "learning_rate": 4.977767111564879e-06, "epoch": 0.09038558990187497, "percentage": 9.04, "elapsed_time": "3:01:35", "remaining_time": "1 day, 6:27:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 982, "total_steps": 10853, "loss": 0.1855, "learning_rate": 4.977665627238023e-06, "epoch": 0.09047772607914498, "percentage": 9.05, "elapsed_time": "3:01:45", "remaining_time": "1 day, 6:26:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 983, "total_steps": 10853, "loss": 0.1869, "learning_rate": 4.977563912859645e-06, "epoch": 0.09056986225641499, "percentage": 9.06, "elapsed_time": "3:01:56", "remaining_time": "1 day, 6:26:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 984, "total_steps": 10853, "loss": 0.1923, "learning_rate": 4.977461968439193e-06, "epoch": 0.09066199843368498, "percentage": 9.07, "elapsed_time": "3:02:07", "remaining_time": "1 day, 6:26:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 985, "total_steps": 10853, "loss": 0.1856, "learning_rate": 4.9773597939861294e-06, "epoch": 0.090754134610955, "percentage": 9.08, "elapsed_time": "3:02:18", "remaining_time": "1 day, 6:26:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 986, "total_steps": 10853, "loss": 0.1929, "learning_rate": 4.977257389509943e-06, "epoch": 0.09084627078822499, "percentage": 9.09, "elapsed_time": "3:02:30", "remaining_time": "1 day, 6:26:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 987, "total_steps": 10853, "loss": 0.1856, "learning_rate": 4.9771547550201414e-06, "epoch": 0.090938406965495, "percentage": 9.09, "elapsed_time": "3:02:41", "remaining_time": "1 day, 6:26:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 988, "total_steps": 10853, "loss": 0.1922, "learning_rate": 4.977051890526254e-06, "epoch": 0.09103054314276501, "percentage": 9.1, "elapsed_time": "3:02:51", "remaining_time": "1 day, 6:25:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 989, "total_steps": 10853, "loss": 0.194, "learning_rate": 4.976948796037831e-06, "epoch": 0.09112267932003501, "percentage": 9.11, "elapsed_time": "3:03:01", "remaining_time": "1 day, 6:25:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 990, "total_steps": 10853, "loss": 0.1924, "learning_rate": 4.976845471564447e-06, "epoch": 0.09121481549730502, "percentage": 9.12, "elapsed_time": "3:03:13", "remaining_time": "1 day, 6:25:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 991, "total_steps": 10853, "loss": 0.1917, "learning_rate": 4.976741917115695e-06, "epoch": 0.09130695167457502, "percentage": 9.13, "elapsed_time": "3:03:24", "remaining_time": "1 day, 6:25:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 992, "total_steps": 10853, "loss": 0.1842, "learning_rate": 4.976638132701188e-06, "epoch": 0.09139908785184503, "percentage": 9.14, "elapsed_time": "3:03:36", "remaining_time": "1 day, 6:25:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 993, "total_steps": 10853, "loss": 0.1788, "learning_rate": 4.976534118330565e-06, "epoch": 0.09149122402911503, "percentage": 9.15, "elapsed_time": "3:03:47", "remaining_time": "1 day, 6:24:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 994, "total_steps": 10853, "loss": 0.1901, "learning_rate": 4.9764298740134814e-06, "epoch": 0.09158336020638504, "percentage": 9.16, "elapsed_time": "3:03:59", "remaining_time": "1 day, 6:24:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 995, "total_steps": 10853, "loss": 0.1951, "learning_rate": 4.976325399759619e-06, "epoch": 0.09167549638365505, "percentage": 9.17, "elapsed_time": "3:04:11", "remaining_time": "1 day, 6:24:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 996, "total_steps": 10853, "loss": 0.1741, "learning_rate": 4.976220695578675e-06, "epoch": 0.09176763256092504, "percentage": 9.18, "elapsed_time": "3:04:21", "remaining_time": "1 day, 6:24:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 997, "total_steps": 10853, "loss": 0.2019, "learning_rate": 4.976115761480373e-06, "epoch": 0.09185976873819506, "percentage": 9.19, "elapsed_time": "3:04:32", "remaining_time": "1 day, 6:24:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 998, "total_steps": 10853, "loss": 0.2021, "learning_rate": 4.9760105974744576e-06, "epoch": 0.09195190491546505, "percentage": 9.2, "elapsed_time": "3:04:42", "remaining_time": "1 day, 6:23:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 999, "total_steps": 10853, "loss": 0.1871, "learning_rate": 4.97590520357069e-06, "epoch": 0.09204404109273506, "percentage": 9.2, "elapsed_time": "3:04:53", "remaining_time": "1 day, 6:23:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1000, "total_steps": 10853, "loss": 0.192, "learning_rate": 4.97579957977886e-06, "epoch": 0.09213617727000507, "percentage": 9.21, "elapsed_time": "3:05:02", "remaining_time": "1 day, 6:23:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1000, "total_steps": 10853, "eval_loss": 0.19303320348262787, "epoch": 0.09213617727000507, "percentage": 9.21, "elapsed_time": "3:10:01", "remaining_time": "1 day, 7:12:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1001, "total_steps": 10853, "loss": 0.1831, "learning_rate": 4.97569372610877e-06, "epoch": 0.09222831344727507, "percentage": 9.22, "elapsed_time": "3:10:13", "remaining_time": "1 day, 7:12:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1002, "total_steps": 10853, "loss": 0.1828, "learning_rate": 4.975587642570252e-06, "epoch": 0.09232044962454508, "percentage": 9.23, "elapsed_time": "3:10:25", "remaining_time": "1 day, 7:12:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1003, "total_steps": 10853, "loss": 0.1856, "learning_rate": 4.975481329173156e-06, "epoch": 0.09241258580181508, "percentage": 9.24, "elapsed_time": "3:10:36", "remaining_time": "1 day, 7:11:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1004, "total_steps": 10853, "loss": 0.1847, "learning_rate": 4.975374785927351e-06, "epoch": 0.09250472197908509, "percentage": 9.25, "elapsed_time": "3:10:47", "remaining_time": "1 day, 7:11:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1005, "total_steps": 10853, "loss": 0.1876, "learning_rate": 4.975268012842732e-06, "epoch": 0.0925968581563551, "percentage": 9.26, "elapsed_time": "3:10:58", "remaining_time": "1 day, 7:11:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1006, "total_steps": 10853, "loss": 0.1964, "learning_rate": 4.97516100992921e-06, "epoch": 0.0926889943336251, "percentage": 9.27, "elapsed_time": "3:11:08", "remaining_time": "1 day, 7:10:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1007, "total_steps": 10853, "loss": 0.2036, "learning_rate": 4.975053777196723e-06, "epoch": 0.09278113051089511, "percentage": 9.28, "elapsed_time": "3:11:19", "remaining_time": "1 day, 7:10:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1008, "total_steps": 10853, "loss": 0.2035, "learning_rate": 4.974946314655226e-06, "epoch": 0.0928732666881651, "percentage": 9.29, "elapsed_time": "3:11:30", "remaining_time": "1 day, 7:10:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1009, "total_steps": 10853, "loss": 0.1969, "learning_rate": 4.974838622314698e-06, "epoch": 0.09296540286543511, "percentage": 9.3, "elapsed_time": "3:11:41", "remaining_time": "1 day, 7:10:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1010, "total_steps": 10853, "loss": 0.2025, "learning_rate": 4.974730700185136e-06, "epoch": 0.09305753904270511, "percentage": 9.31, "elapsed_time": "3:11:52", "remaining_time": "1 day, 7:09:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1011, "total_steps": 10853, "loss": 0.2024, "learning_rate": 4.974622548276564e-06, "epoch": 0.09314967521997512, "percentage": 9.32, "elapsed_time": "3:12:04", "remaining_time": "1 day, 7:09:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1012, "total_steps": 10853, "loss": 0.1936, "learning_rate": 4.974514166599021e-06, "epoch": 0.09324181139724513, "percentage": 9.32, "elapsed_time": "3:12:14", "remaining_time": "1 day, 7:09:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1013, "total_steps": 10853, "loss": 0.1912, "learning_rate": 4.974405555162571e-06, "epoch": 0.09333394757451513, "percentage": 9.33, "elapsed_time": "3:12:26", "remaining_time": "1 day, 7:09:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1014, "total_steps": 10853, "loss": 0.2018, "learning_rate": 4.9742967139773e-06, "epoch": 0.09342608375178514, "percentage": 9.34, "elapsed_time": "3:12:37", "remaining_time": "1 day, 7:09:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1015, "total_steps": 10853, "loss": 0.1711, "learning_rate": 4.974187643053312e-06, "epoch": 0.09351821992905514, "percentage": 9.35, "elapsed_time": "3:12:47", "remaining_time": "1 day, 7:08:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1016, "total_steps": 10853, "loss": 0.1957, "learning_rate": 4.9740783424007355e-06, "epoch": 0.09361035610632515, "percentage": 9.36, "elapsed_time": "3:12:58", "remaining_time": "1 day, 7:08:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1017, "total_steps": 10853, "loss": 0.21, "learning_rate": 4.973968812029718e-06, "epoch": 0.09370249228359516, "percentage": 9.37, "elapsed_time": "3:13:08", "remaining_time": "1 day, 7:07:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1018, "total_steps": 10853, "loss": 0.175, "learning_rate": 4.973859051950431e-06, "epoch": 0.09379462846086516, "percentage": 9.38, "elapsed_time": "3:13:20", "remaining_time": "1 day, 7:07:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1019, "total_steps": 10853, "loss": 0.1994, "learning_rate": 4.973749062173065e-06, "epoch": 0.09388676463813517, "percentage": 9.39, "elapsed_time": "3:13:31", "remaining_time": "1 day, 7:07:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1020, "total_steps": 10853, "loss": 0.1969, "learning_rate": 4.973638842707831e-06, "epoch": 0.09397890081540516, "percentage": 9.4, "elapsed_time": "3:13:41", "remaining_time": "1 day, 7:07:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1021, "total_steps": 10853, "loss": 0.1752, "learning_rate": 4.973528393564965e-06, "epoch": 0.09407103699267517, "percentage": 9.41, "elapsed_time": "3:13:51", "remaining_time": "1 day, 7:06:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1022, "total_steps": 10853, "loss": 0.194, "learning_rate": 4.973417714754721e-06, "epoch": 0.09416317316994519, "percentage": 9.42, "elapsed_time": "3:14:02", "remaining_time": "1 day, 7:06:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1023, "total_steps": 10853, "loss": 0.1903, "learning_rate": 4.973306806287376e-06, "epoch": 0.09425530934721518, "percentage": 9.43, "elapsed_time": "3:14:13", "remaining_time": "1 day, 7:06:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1024, "total_steps": 10853, "loss": 0.1828, "learning_rate": 4.9731956681732284e-06, "epoch": 0.0943474455244852, "percentage": 9.44, "elapsed_time": "3:14:23", "remaining_time": "1 day, 7:05:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1025, "total_steps": 10853, "loss": 0.1931, "learning_rate": 4.973084300422597e-06, "epoch": 0.09443958170175519, "percentage": 9.44, "elapsed_time": "3:14:35", "remaining_time": "1 day, 7:05:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1026, "total_steps": 10853, "loss": 0.195, "learning_rate": 4.972972703045822e-06, "epoch": 0.0945317178790252, "percentage": 9.45, "elapsed_time": "3:14:46", "remaining_time": "1 day, 7:05:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1027, "total_steps": 10853, "loss": 0.1982, "learning_rate": 4.972860876053265e-06, "epoch": 0.0946238540562952, "percentage": 9.46, "elapsed_time": "3:14:56", "remaining_time": "1 day, 7:05:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1028, "total_steps": 10853, "loss": 0.1811, "learning_rate": 4.97274881945531e-06, "epoch": 0.09471599023356521, "percentage": 9.47, "elapsed_time": "3:15:08", "remaining_time": "1 day, 7:05:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1029, "total_steps": 10853, "loss": 0.2073, "learning_rate": 4.97263653326236e-06, "epoch": 0.09480812641083522, "percentage": 9.48, "elapsed_time": "3:15:20", "remaining_time": "1 day, 7:04:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1030, "total_steps": 10853, "loss": 0.1841, "learning_rate": 4.972524017484842e-06, "epoch": 0.09490026258810522, "percentage": 9.49, "elapsed_time": "3:15:31", "remaining_time": "1 day, 7:04:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1031, "total_steps": 10853, "loss": 0.1848, "learning_rate": 4.972411272133204e-06, "epoch": 0.09499239876537523, "percentage": 9.5, "elapsed_time": "3:15:42", "remaining_time": "1 day, 7:04:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1032, "total_steps": 10853, "loss": 0.1851, "learning_rate": 4.972298297217913e-06, "epoch": 0.09508453494264522, "percentage": 9.51, "elapsed_time": "3:15:53", "remaining_time": "1 day, 7:04:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1033, "total_steps": 10853, "loss": 0.1888, "learning_rate": 4.972185092749458e-06, "epoch": 0.09517667111991523, "percentage": 9.52, "elapsed_time": "3:16:03", "remaining_time": "1 day, 7:03:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1034, "total_steps": 10853, "loss": 0.1961, "learning_rate": 4.972071658738352e-06, "epoch": 0.09526880729718525, "percentage": 9.53, "elapsed_time": "3:16:14", "remaining_time": "1 day, 7:03:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1035, "total_steps": 10853, "loss": 0.1919, "learning_rate": 4.971957995195126e-06, "epoch": 0.09536094347445524, "percentage": 9.54, "elapsed_time": "3:16:25", "remaining_time": "1 day, 7:03:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1036, "total_steps": 10853, "loss": 0.1929, "learning_rate": 4.971844102130334e-06, "epoch": 0.09545307965172525, "percentage": 9.55, "elapsed_time": "3:16:36", "remaining_time": "1 day, 7:02:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1037, "total_steps": 10853, "loss": 0.1956, "learning_rate": 4.971729979554551e-06, "epoch": 0.09554521582899525, "percentage": 9.55, "elapsed_time": "3:16:47", "remaining_time": "1 day, 7:02:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1038, "total_steps": 10853, "loss": 0.186, "learning_rate": 4.9716156274783746e-06, "epoch": 0.09563735200626526, "percentage": 9.56, "elapsed_time": "3:16:58", "remaining_time": "1 day, 7:02:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1039, "total_steps": 10853, "loss": 0.2068, "learning_rate": 4.9715010459124205e-06, "epoch": 0.09572948818353527, "percentage": 9.57, "elapsed_time": "3:17:09", "remaining_time": "1 day, 7:02:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1040, "total_steps": 10853, "loss": 0.197, "learning_rate": 4.971386234867328e-06, "epoch": 0.09582162436080527, "percentage": 9.58, "elapsed_time": "3:17:19", "remaining_time": "1 day, 7:01:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1041, "total_steps": 10853, "loss": 0.1895, "learning_rate": 4.971271194353757e-06, "epoch": 0.09591376053807528, "percentage": 9.59, "elapsed_time": "3:17:30", "remaining_time": "1 day, 7:01:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1042, "total_steps": 10853, "loss": 0.1856, "learning_rate": 4.971155924382392e-06, "epoch": 0.09600589671534528, "percentage": 9.6, "elapsed_time": "3:17:39", "remaining_time": "1 day, 7:00:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1043, "total_steps": 10853, "loss": 0.1694, "learning_rate": 4.971040424963931e-06, "epoch": 0.09609803289261529, "percentage": 9.61, "elapsed_time": "3:17:48", "remaining_time": "1 day, 7:00:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1044, "total_steps": 10853, "loss": 0.1974, "learning_rate": 4.970924696109102e-06, "epoch": 0.09619016906988528, "percentage": 9.62, "elapsed_time": "3:18:00", "remaining_time": "1 day, 7:00:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1045, "total_steps": 10853, "loss": 0.214, "learning_rate": 4.970808737828648e-06, "epoch": 0.0962823052471553, "percentage": 9.63, "elapsed_time": "3:18:11", "remaining_time": "1 day, 7:00:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1046, "total_steps": 10853, "loss": 0.1959, "learning_rate": 4.970692550133337e-06, "epoch": 0.0963744414244253, "percentage": 9.64, "elapsed_time": "3:18:21", "remaining_time": "1 day, 6:59:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1047, "total_steps": 10853, "loss": 0.1924, "learning_rate": 4.970576133033958e-06, "epoch": 0.0964665776016953, "percentage": 9.65, "elapsed_time": "3:18:30", "remaining_time": "1 day, 6:59:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1048, "total_steps": 10853, "loss": 0.2013, "learning_rate": 4.970459486541318e-06, "epoch": 0.09655871377896531, "percentage": 9.66, "elapsed_time": "3:18:40", "remaining_time": "1 day, 6:58:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1049, "total_steps": 10853, "loss": 0.1947, "learning_rate": 4.970342610666249e-06, "epoch": 0.09665084995623531, "percentage": 9.67, "elapsed_time": "3:18:49", "remaining_time": "1 day, 6:58:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1050, "total_steps": 10853, "loss": 0.1769, "learning_rate": 4.970225505419602e-06, "epoch": 0.09674298613350532, "percentage": 9.67, "elapsed_time": "3:19:00", "remaining_time": "1 day, 6:58:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1051, "total_steps": 10853, "loss": 0.1953, "learning_rate": 4.970108170812252e-06, "epoch": 0.09683512231077533, "percentage": 9.68, "elapsed_time": "3:19:11", "remaining_time": "1 day, 6:57:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1052, "total_steps": 10853, "loss": 0.2071, "learning_rate": 4.969990606855093e-06, "epoch": 0.09692725848804533, "percentage": 9.69, "elapsed_time": "3:19:24", "remaining_time": "1 day, 6:57:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1053, "total_steps": 10853, "loss": 0.1821, "learning_rate": 4.969872813559039e-06, "epoch": 0.09701939466531534, "percentage": 9.7, "elapsed_time": "3:19:35", "remaining_time": "1 day, 6:57:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1054, "total_steps": 10853, "loss": 0.1987, "learning_rate": 4.9697547909350295e-06, "epoch": 0.09711153084258534, "percentage": 9.71, "elapsed_time": "3:19:46", "remaining_time": "1 day, 6:57:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1055, "total_steps": 10853, "loss": 0.1918, "learning_rate": 4.969636538994021e-06, "epoch": 0.09720366701985535, "percentage": 9.72, "elapsed_time": "3:19:57", "remaining_time": "1 day, 6:57:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1056, "total_steps": 10853, "loss": 0.2002, "learning_rate": 4.969518057746995e-06, "epoch": 0.09729580319712536, "percentage": 9.73, "elapsed_time": "3:20:07", "remaining_time": "1 day, 6:56:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1057, "total_steps": 10853, "loss": 0.1829, "learning_rate": 4.969399347204951e-06, "epoch": 0.09738793937439535, "percentage": 9.74, "elapsed_time": "3:20:19", "remaining_time": "1 day, 6:56:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1058, "total_steps": 10853, "loss": 0.192, "learning_rate": 4.969280407378912e-06, "epoch": 0.09748007555166537, "percentage": 9.75, "elapsed_time": "3:20:30", "remaining_time": "1 day, 6:56:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1059, "total_steps": 10853, "loss": 0.194, "learning_rate": 4.9691612382799215e-06, "epoch": 0.09757221172893536, "percentage": 9.76, "elapsed_time": "3:20:41", "remaining_time": "1 day, 6:55:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1060, "total_steps": 10853, "loss": 0.1909, "learning_rate": 4.969041839919044e-06, "epoch": 0.09766434790620537, "percentage": 9.77, "elapsed_time": "3:20:51", "remaining_time": "1 day, 6:55:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1061, "total_steps": 10853, "loss": 0.1922, "learning_rate": 4.968922212307367e-06, "epoch": 0.09775648408347537, "percentage": 9.78, "elapsed_time": "3:21:01", "remaining_time": "1 day, 6:55:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1062, "total_steps": 10853, "loss": 0.1923, "learning_rate": 4.968802355455995e-06, "epoch": 0.09784862026074538, "percentage": 9.79, "elapsed_time": "3:21:11", "remaining_time": "1 day, 6:54:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1063, "total_steps": 10853, "loss": 0.1751, "learning_rate": 4.96868226937606e-06, "epoch": 0.09794075643801539, "percentage": 9.79, "elapsed_time": "3:21:20", "remaining_time": "1 day, 6:54:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1064, "total_steps": 10853, "loss": 0.1931, "learning_rate": 4.96856195407871e-06, "epoch": 0.09803289261528539, "percentage": 9.8, "elapsed_time": "3:21:31", "remaining_time": "1 day, 6:54:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1065, "total_steps": 10853, "loss": 0.1906, "learning_rate": 4.968441409575117e-06, "epoch": 0.0981250287925554, "percentage": 9.81, "elapsed_time": "3:21:41", "remaining_time": "1 day, 6:53:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1066, "total_steps": 10853, "loss": 0.1857, "learning_rate": 4.968320635876473e-06, "epoch": 0.0982171649698254, "percentage": 9.82, "elapsed_time": "3:21:53", "remaining_time": "1 day, 6:53:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1067, "total_steps": 10853, "loss": 0.1943, "learning_rate": 4.968199632993994e-06, "epoch": 0.09830930114709541, "percentage": 9.83, "elapsed_time": "3:22:03", "remaining_time": "1 day, 6:53:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1068, "total_steps": 10853, "loss": 0.1981, "learning_rate": 4.968078400938912e-06, "epoch": 0.09840143732436542, "percentage": 9.84, "elapsed_time": "3:22:14", "remaining_time": "1 day, 6:52:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1069, "total_steps": 10853, "loss": 0.1969, "learning_rate": 4.967956939722485e-06, "epoch": 0.09849357350163541, "percentage": 9.85, "elapsed_time": "3:22:25", "remaining_time": "1 day, 6:52:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1070, "total_steps": 10853, "loss": 0.1858, "learning_rate": 4.967835249355991e-06, "epoch": 0.09858570967890543, "percentage": 9.86, "elapsed_time": "3:22:37", "remaining_time": "1 day, 6:52:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1071, "total_steps": 10853, "loss": 0.1859, "learning_rate": 4.967713329850728e-06, "epoch": 0.09867784585617542, "percentage": 9.87, "elapsed_time": "3:22:48", "remaining_time": "1 day, 6:52:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1072, "total_steps": 10853, "loss": 0.192, "learning_rate": 4.967591181218017e-06, "epoch": 0.09876998203344543, "percentage": 9.88, "elapsed_time": "3:22:58", "remaining_time": "1 day, 6:51:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1073, "total_steps": 10853, "loss": 0.195, "learning_rate": 4.967468803469199e-06, "epoch": 0.09886211821071544, "percentage": 9.89, "elapsed_time": "3:23:08", "remaining_time": "1 day, 6:51:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1074, "total_steps": 10853, "loss": 0.1767, "learning_rate": 4.967346196615638e-06, "epoch": 0.09895425438798544, "percentage": 9.9, "elapsed_time": "3:23:18", "remaining_time": "1 day, 6:51:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1075, "total_steps": 10853, "loss": 0.1846, "learning_rate": 4.967223360668716e-06, "epoch": 0.09904639056525545, "percentage": 9.91, "elapsed_time": "3:23:29", "remaining_time": "1 day, 6:50:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1076, "total_steps": 10853, "loss": 0.1973, "learning_rate": 4.9671002956398395e-06, "epoch": 0.09913852674252545, "percentage": 9.91, "elapsed_time": "3:23:40", "remaining_time": "1 day, 6:50:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1077, "total_steps": 10853, "loss": 0.1926, "learning_rate": 4.966977001540436e-06, "epoch": 0.09923066291979546, "percentage": 9.92, "elapsed_time": "3:23:51", "remaining_time": "1 day, 6:50:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1078, "total_steps": 10853, "loss": 0.1995, "learning_rate": 4.966853478381951e-06, "epoch": 0.09932279909706546, "percentage": 9.93, "elapsed_time": "3:24:01", "remaining_time": "1 day, 6:50:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1079, "total_steps": 10853, "loss": 0.1848, "learning_rate": 4.966729726175857e-06, "epoch": 0.09941493527433547, "percentage": 9.94, "elapsed_time": "3:24:12", "remaining_time": "1 day, 6:49:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1080, "total_steps": 10853, "loss": 0.1954, "learning_rate": 4.96660574493364e-06, "epoch": 0.09950707145160548, "percentage": 9.95, "elapsed_time": "3:24:23", "remaining_time": "1 day, 6:49:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1081, "total_steps": 10853, "loss": 0.2055, "learning_rate": 4.9664815346668165e-06, "epoch": 0.09959920762887547, "percentage": 9.96, "elapsed_time": "3:24:35", "remaining_time": "1 day, 6:49:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1082, "total_steps": 10853, "loss": 0.1972, "learning_rate": 4.966357095386915e-06, "epoch": 0.09969134380614549, "percentage": 9.97, "elapsed_time": "3:24:44", "remaining_time": "1 day, 6:48:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1083, "total_steps": 10853, "loss": 0.1825, "learning_rate": 4.966232427105493e-06, "epoch": 0.09978347998341548, "percentage": 9.98, "elapsed_time": "3:24:54", "remaining_time": "1 day, 6:48:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1084, "total_steps": 10853, "loss": 0.1679, "learning_rate": 4.9661075298341245e-06, "epoch": 0.0998756161606855, "percentage": 9.99, "elapsed_time": "3:25:05", "remaining_time": "1 day, 6:48:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1085, "total_steps": 10853, "loss": 0.1978, "learning_rate": 4.965982403584406e-06, "epoch": 0.0999677523379555, "percentage": 10.0, "elapsed_time": "3:25:17", "remaining_time": "1 day, 6:48:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1086, "total_steps": 10853, "loss": 0.2016, "learning_rate": 4.965857048367956e-06, "epoch": 0.1000598885152255, "percentage": 10.01, "elapsed_time": "3:25:28", "remaining_time": "1 day, 6:47:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1087, "total_steps": 10853, "loss": 0.1981, "learning_rate": 4.965731464196415e-06, "epoch": 0.10015202469249551, "percentage": 10.02, "elapsed_time": "3:25:39", "remaining_time": "1 day, 6:47:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1088, "total_steps": 10853, "loss": 0.2093, "learning_rate": 4.96560565108144e-06, "epoch": 0.10024416086976551, "percentage": 10.02, "elapsed_time": "3:25:49", "remaining_time": "1 day, 6:47:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1089, "total_steps": 10853, "loss": 0.1761, "learning_rate": 4.965479609034717e-06, "epoch": 0.10033629704703552, "percentage": 10.03, "elapsed_time": "3:26:00", "remaining_time": "1 day, 6:47:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1090, "total_steps": 10853, "loss": 0.2124, "learning_rate": 4.9653533380679455e-06, "epoch": 0.10042843322430553, "percentage": 10.04, "elapsed_time": "3:26:11", "remaining_time": "1 day, 6:46:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1091, "total_steps": 10853, "loss": 0.1835, "learning_rate": 4.965226838192852e-06, "epoch": 0.10052056940157553, "percentage": 10.05, "elapsed_time": "3:26:22", "remaining_time": "1 day, 6:46:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1092, "total_steps": 10853, "loss": 0.1779, "learning_rate": 4.965100109421182e-06, "epoch": 0.10061270557884554, "percentage": 10.06, "elapsed_time": "3:26:32", "remaining_time": "1 day, 6:46:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1093, "total_steps": 10853, "loss": 0.1769, "learning_rate": 4.9649731517647e-06, "epoch": 0.10070484175611553, "percentage": 10.07, "elapsed_time": "3:26:42", "remaining_time": "1 day, 6:45:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1094, "total_steps": 10853, "loss": 0.1934, "learning_rate": 4.964845965235196e-06, "epoch": 0.10079697793338555, "percentage": 10.08, "elapsed_time": "3:26:53", "remaining_time": "1 day, 6:45:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1095, "total_steps": 10853, "loss": 0.2077, "learning_rate": 4.964718549844479e-06, "epoch": 0.10088911411065554, "percentage": 10.09, "elapsed_time": "3:27:02", "remaining_time": "1 day, 6:45:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1096, "total_steps": 10853, "loss": 0.1839, "learning_rate": 4.964590905604379e-06, "epoch": 0.10098125028792555, "percentage": 10.1, "elapsed_time": "3:27:12", "remaining_time": "1 day, 6:44:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1097, "total_steps": 10853, "loss": 0.1921, "learning_rate": 4.964463032526749e-06, "epoch": 0.10107338646519556, "percentage": 10.11, "elapsed_time": "3:27:23", "remaining_time": "1 day, 6:44:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1098, "total_steps": 10853, "loss": 0.1873, "learning_rate": 4.9643349306234615e-06, "epoch": 0.10116552264246556, "percentage": 10.12, "elapsed_time": "3:27:34", "remaining_time": "1 day, 6:44:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1099, "total_steps": 10853, "loss": 0.1809, "learning_rate": 4.96420659990641e-06, "epoch": 0.10125765881973557, "percentage": 10.13, "elapsed_time": "3:27:45", "remaining_time": "1 day, 6:43:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1100, "total_steps": 10853, "loss": 0.1995, "learning_rate": 4.9640780403875095e-06, "epoch": 0.10134979499700557, "percentage": 10.14, "elapsed_time": "3:27:55", "remaining_time": "1 day, 6:43:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1101, "total_steps": 10853, "loss": 0.1965, "learning_rate": 4.963949252078698e-06, "epoch": 0.10144193117427558, "percentage": 10.14, "elapsed_time": "3:28:07", "remaining_time": "1 day, 6:43:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1102, "total_steps": 10853, "loss": 0.2028, "learning_rate": 4.963820234991934e-06, "epoch": 0.10153406735154559, "percentage": 10.15, "elapsed_time": "3:28:17", "remaining_time": "1 day, 6:43:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1103, "total_steps": 10853, "loss": 0.1775, "learning_rate": 4.963690989139196e-06, "epoch": 0.10162620352881559, "percentage": 10.16, "elapsed_time": "3:28:29", "remaining_time": "1 day, 6:42:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1104, "total_steps": 10853, "loss": 0.174, "learning_rate": 4.963561514532485e-06, "epoch": 0.1017183397060856, "percentage": 10.17, "elapsed_time": "3:28:41", "remaining_time": "1 day, 6:42:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1105, "total_steps": 10853, "loss": 0.1923, "learning_rate": 4.963431811183821e-06, "epoch": 0.1018104758833556, "percentage": 10.18, "elapsed_time": "3:28:51", "remaining_time": "1 day, 6:42:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1106, "total_steps": 10853, "loss": 0.1735, "learning_rate": 4.963301879105249e-06, "epoch": 0.1019026120606256, "percentage": 10.19, "elapsed_time": "3:29:02", "remaining_time": "1 day, 6:42:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1107, "total_steps": 10853, "loss": 0.1939, "learning_rate": 4.963171718308833e-06, "epoch": 0.10199474823789562, "percentage": 10.2, "elapsed_time": "3:29:13", "remaining_time": "1 day, 6:42:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1108, "total_steps": 10853, "loss": 0.184, "learning_rate": 4.963041328806656e-06, "epoch": 0.10208688441516561, "percentage": 10.21, "elapsed_time": "3:29:23", "remaining_time": "1 day, 6:41:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1109, "total_steps": 10853, "loss": 0.1919, "learning_rate": 4.962910710610827e-06, "epoch": 0.10217902059243562, "percentage": 10.22, "elapsed_time": "3:29:35", "remaining_time": "1 day, 6:41:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1110, "total_steps": 10853, "loss": 0.1765, "learning_rate": 4.962779863733475e-06, "epoch": 0.10227115676970562, "percentage": 10.23, "elapsed_time": "3:29:47", "remaining_time": "1 day, 6:41:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1111, "total_steps": 10853, "loss": 0.1892, "learning_rate": 4.962648788186747e-06, "epoch": 0.10236329294697563, "percentage": 10.24, "elapsed_time": "3:29:58", "remaining_time": "1 day, 6:41:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1112, "total_steps": 10853, "loss": 0.1818, "learning_rate": 4.9625174839828135e-06, "epoch": 0.10245542912424563, "percentage": 10.25, "elapsed_time": "3:30:10", "remaining_time": "1 day, 6:41:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1113, "total_steps": 10853, "loss": 0.1859, "learning_rate": 4.9623859511338664e-06, "epoch": 0.10254756530151564, "percentage": 10.26, "elapsed_time": "3:30:22", "remaining_time": "1 day, 6:41:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1114, "total_steps": 10853, "loss": 0.1938, "learning_rate": 4.962254189652119e-06, "epoch": 0.10263970147878565, "percentage": 10.26, "elapsed_time": "3:30:34", "remaining_time": "1 day, 6:40:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1115, "total_steps": 10853, "loss": 0.1842, "learning_rate": 4.962122199549806e-06, "epoch": 0.10273183765605565, "percentage": 10.27, "elapsed_time": "3:30:46", "remaining_time": "1 day, 6:40:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1116, "total_steps": 10853, "loss": 0.1868, "learning_rate": 4.96198998083918e-06, "epoch": 0.10282397383332566, "percentage": 10.28, "elapsed_time": "3:30:58", "remaining_time": "1 day, 6:40:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1117, "total_steps": 10853, "loss": 0.2017, "learning_rate": 4.961857533532521e-06, "epoch": 0.10291611001059565, "percentage": 10.29, "elapsed_time": "3:31:08", "remaining_time": "1 day, 6:40:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1118, "total_steps": 10853, "loss": 0.188, "learning_rate": 4.961724857642125e-06, "epoch": 0.10300824618786567, "percentage": 10.3, "elapsed_time": "3:31:19", "remaining_time": "1 day, 6:40:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1119, "total_steps": 10853, "loss": 0.1807, "learning_rate": 4.96159195318031e-06, "epoch": 0.10310038236513568, "percentage": 10.31, "elapsed_time": "3:31:28", "remaining_time": "1 day, 6:39:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1120, "total_steps": 10853, "loss": 0.1962, "learning_rate": 4.9614588201594175e-06, "epoch": 0.10319251854240567, "percentage": 10.32, "elapsed_time": "3:31:40", "remaining_time": "1 day, 6:39:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1121, "total_steps": 10853, "loss": 0.1967, "learning_rate": 4.961325458591809e-06, "epoch": 0.10328465471967568, "percentage": 10.33, "elapsed_time": "3:31:51", "remaining_time": "1 day, 6:39:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1122, "total_steps": 10853, "loss": 0.1847, "learning_rate": 4.961191868489866e-06, "epoch": 0.10337679089694568, "percentage": 10.34, "elapsed_time": "3:32:03", "remaining_time": "1 day, 6:39:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1123, "total_steps": 10853, "loss": 0.1841, "learning_rate": 4.961058049865994e-06, "epoch": 0.10346892707421569, "percentage": 10.35, "elapsed_time": "3:32:14", "remaining_time": "1 day, 6:38:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1124, "total_steps": 10853, "loss": 0.2036, "learning_rate": 4.960924002732616e-06, "epoch": 0.1035610632514857, "percentage": 10.36, "elapsed_time": "3:32:25", "remaining_time": "1 day, 6:38:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1125, "total_steps": 10853, "loss": 0.1765, "learning_rate": 4.9607897271021815e-06, "epoch": 0.1036531994287557, "percentage": 10.37, "elapsed_time": "3:32:36", "remaining_time": "1 day, 6:38:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1126, "total_steps": 10853, "loss": 0.2013, "learning_rate": 4.960655222987155e-06, "epoch": 0.10374533560602571, "percentage": 10.38, "elapsed_time": "3:32:46", "remaining_time": "1 day, 6:38:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1127, "total_steps": 10853, "loss": 0.1849, "learning_rate": 4.960520490400026e-06, "epoch": 0.1038374717832957, "percentage": 10.38, "elapsed_time": "3:32:57", "remaining_time": "1 day, 6:37:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1128, "total_steps": 10853, "loss": 0.1859, "learning_rate": 4.9603855293533045e-06, "epoch": 0.10392960796056572, "percentage": 10.39, "elapsed_time": "3:33:07", "remaining_time": "1 day, 6:37:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1129, "total_steps": 10853, "loss": 0.1922, "learning_rate": 4.960250339859523e-06, "epoch": 0.10402174413783571, "percentage": 10.4, "elapsed_time": "3:33:17", "remaining_time": "1 day, 6:37:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1130, "total_steps": 10853, "loss": 0.1816, "learning_rate": 4.960114921931231e-06, "epoch": 0.10411388031510573, "percentage": 10.41, "elapsed_time": "3:33:28", "remaining_time": "1 day, 6:36:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1131, "total_steps": 10853, "loss": 0.1926, "learning_rate": 4.959979275581005e-06, "epoch": 0.10420601649237574, "percentage": 10.42, "elapsed_time": "3:33:38", "remaining_time": "1 day, 6:36:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1132, "total_steps": 10853, "loss": 0.187, "learning_rate": 4.959843400821438e-06, "epoch": 0.10429815266964573, "percentage": 10.43, "elapsed_time": "3:33:47", "remaining_time": "1 day, 6:35:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1133, "total_steps": 10853, "loss": 0.1666, "learning_rate": 4.959707297665146e-06, "epoch": 0.10439028884691574, "percentage": 10.44, "elapsed_time": "3:33:58", "remaining_time": "1 day, 6:35:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1134, "total_steps": 10853, "loss": 0.1983, "learning_rate": 4.959570966124768e-06, "epoch": 0.10448242502418574, "percentage": 10.45, "elapsed_time": "3:34:09", "remaining_time": "1 day, 6:35:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1135, "total_steps": 10853, "loss": 0.187, "learning_rate": 4.959434406212959e-06, "epoch": 0.10457456120145575, "percentage": 10.46, "elapsed_time": "3:34:19", "remaining_time": "1 day, 6:35:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1136, "total_steps": 10853, "loss": 0.2021, "learning_rate": 4.959297617942403e-06, "epoch": 0.10466669737872576, "percentage": 10.47, "elapsed_time": "3:34:30", "remaining_time": "1 day, 6:34:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1137, "total_steps": 10853, "loss": 0.1852, "learning_rate": 4.959160601325797e-06, "epoch": 0.10475883355599576, "percentage": 10.48, "elapsed_time": "3:34:39", "remaining_time": "1 day, 6:34:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1138, "total_steps": 10853, "loss": 0.1921, "learning_rate": 4.959023356375866e-06, "epoch": 0.10485096973326577, "percentage": 10.49, "elapsed_time": "3:34:50", "remaining_time": "1 day, 6:34:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1139, "total_steps": 10853, "loss": 0.1953, "learning_rate": 4.9588858831053495e-06, "epoch": 0.10494310591053577, "percentage": 10.49, "elapsed_time": "3:35:02", "remaining_time": "1 day, 6:34:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1140, "total_steps": 10853, "loss": 0.1834, "learning_rate": 4.958748181527016e-06, "epoch": 0.10503524208780578, "percentage": 10.5, "elapsed_time": "3:35:13", "remaining_time": "1 day, 6:33:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1141, "total_steps": 10853, "loss": 0.1766, "learning_rate": 4.958610251653649e-06, "epoch": 0.10512737826507579, "percentage": 10.51, "elapsed_time": "3:35:25", "remaining_time": "1 day, 6:33:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1142, "total_steps": 10853, "loss": 0.1942, "learning_rate": 4.958472093498055e-06, "epoch": 0.10521951444234579, "percentage": 10.52, "elapsed_time": "3:35:36", "remaining_time": "1 day, 6:33:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1143, "total_steps": 10853, "loss": 0.1839, "learning_rate": 4.9583337070730625e-06, "epoch": 0.1053116506196158, "percentage": 10.53, "elapsed_time": "3:35:47", "remaining_time": "1 day, 6:33:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1144, "total_steps": 10853, "loss": 0.1908, "learning_rate": 4.958195092391521e-06, "epoch": 0.10540378679688579, "percentage": 10.54, "elapsed_time": "3:35:58", "remaining_time": "1 day, 6:32:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1145, "total_steps": 10853, "loss": 0.1772, "learning_rate": 4.958056249466301e-06, "epoch": 0.1054959229741558, "percentage": 10.55, "elapsed_time": "3:36:10", "remaining_time": "1 day, 6:32:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1146, "total_steps": 10853, "loss": 0.1931, "learning_rate": 4.957917178310293e-06, "epoch": 0.1055880591514258, "percentage": 10.56, "elapsed_time": "3:36:21", "remaining_time": "1 day, 6:32:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1147, "total_steps": 10853, "loss": 0.1966, "learning_rate": 4.957777878936411e-06, "epoch": 0.10568019532869581, "percentage": 10.57, "elapsed_time": "3:36:32", "remaining_time": "1 day, 6:32:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1148, "total_steps": 10853, "loss": 0.1931, "learning_rate": 4.957638351357587e-06, "epoch": 0.10577233150596582, "percentage": 10.58, "elapsed_time": "3:36:43", "remaining_time": "1 day, 6:32:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1149, "total_steps": 10853, "loss": 0.1823, "learning_rate": 4.957498595586779e-06, "epoch": 0.10586446768323582, "percentage": 10.59, "elapsed_time": "3:36:52", "remaining_time": "1 day, 6:31:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1150, "total_steps": 10853, "loss": 0.178, "learning_rate": 4.957358611636962e-06, "epoch": 0.10595660386050583, "percentage": 10.6, "elapsed_time": "3:37:04", "remaining_time": "1 day, 6:31:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1151, "total_steps": 10853, "loss": 0.1908, "learning_rate": 4.957218399521133e-06, "epoch": 0.10604874003777583, "percentage": 10.61, "elapsed_time": "3:37:15", "remaining_time": "1 day, 6:31:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1152, "total_steps": 10853, "loss": 0.1955, "learning_rate": 4.957077959252311e-06, "epoch": 0.10614087621504584, "percentage": 10.61, "elapsed_time": "3:37:25", "remaining_time": "1 day, 6:30:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1153, "total_steps": 10853, "loss": 0.1904, "learning_rate": 4.956937290843537e-06, "epoch": 0.10623301239231585, "percentage": 10.62, "elapsed_time": "3:37:36", "remaining_time": "1 day, 6:30:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1154, "total_steps": 10853, "loss": 0.2227, "learning_rate": 4.95679639430787e-06, "epoch": 0.10632514856958585, "percentage": 10.63, "elapsed_time": "3:37:46", "remaining_time": "1 day, 6:30:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1155, "total_steps": 10853, "loss": 0.1822, "learning_rate": 4.956655269658393e-06, "epoch": 0.10641728474685586, "percentage": 10.64, "elapsed_time": "3:37:57", "remaining_time": "1 day, 6:30:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1156, "total_steps": 10853, "loss": 0.1937, "learning_rate": 4.956513916908211e-06, "epoch": 0.10650942092412585, "percentage": 10.65, "elapsed_time": "3:38:08", "remaining_time": "1 day, 6:29:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1157, "total_steps": 10853, "loss": 0.1808, "learning_rate": 4.956372336070448e-06, "epoch": 0.10660155710139586, "percentage": 10.66, "elapsed_time": "3:38:18", "remaining_time": "1 day, 6:29:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1158, "total_steps": 10853, "loss": 0.1749, "learning_rate": 4.956230527158248e-06, "epoch": 0.10669369327866587, "percentage": 10.67, "elapsed_time": "3:38:28", "remaining_time": "1 day, 6:29:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1159, "total_steps": 10853, "loss": 0.1849, "learning_rate": 4.95608849018478e-06, "epoch": 0.10678582945593587, "percentage": 10.68, "elapsed_time": "3:38:38", "remaining_time": "1 day, 6:28:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1160, "total_steps": 10853, "loss": 0.2029, "learning_rate": 4.95594622516323e-06, "epoch": 0.10687796563320588, "percentage": 10.69, "elapsed_time": "3:38:49", "remaining_time": "1 day, 6:28:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1161, "total_steps": 10853, "loss": 0.2107, "learning_rate": 4.95580373210681e-06, "epoch": 0.10697010181047588, "percentage": 10.7, "elapsed_time": "3:38:58", "remaining_time": "1 day, 6:28:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1162, "total_steps": 10853, "loss": 0.2075, "learning_rate": 4.955661011028748e-06, "epoch": 0.10706223798774589, "percentage": 10.71, "elapsed_time": "3:39:10", "remaining_time": "1 day, 6:27:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1163, "total_steps": 10853, "loss": 0.1868, "learning_rate": 4.955518061942298e-06, "epoch": 0.1071543741650159, "percentage": 10.72, "elapsed_time": "3:39:20", "remaining_time": "1 day, 6:27:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1164, "total_steps": 10853, "loss": 0.2038, "learning_rate": 4.955374884860731e-06, "epoch": 0.1072465103422859, "percentage": 10.73, "elapsed_time": "3:39:31", "remaining_time": "1 day, 6:27:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1165, "total_steps": 10853, "loss": 0.2008, "learning_rate": 4.9552314797973426e-06, "epoch": 0.10733864651955591, "percentage": 10.73, "elapsed_time": "3:39:42", "remaining_time": "1 day, 6:27:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1166, "total_steps": 10853, "loss": 0.1886, "learning_rate": 4.955087846765446e-06, "epoch": 0.1074307826968259, "percentage": 10.74, "elapsed_time": "3:39:53", "remaining_time": "1 day, 6:26:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1167, "total_steps": 10853, "loss": 0.1911, "learning_rate": 4.954943985778379e-06, "epoch": 0.10752291887409592, "percentage": 10.75, "elapsed_time": "3:40:04", "remaining_time": "1 day, 6:26:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1168, "total_steps": 10853, "loss": 0.1988, "learning_rate": 4.954799896849499e-06, "epoch": 0.10761505505136591, "percentage": 10.76, "elapsed_time": "3:40:15", "remaining_time": "1 day, 6:26:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1169, "total_steps": 10853, "loss": 0.2008, "learning_rate": 4.954655579992184e-06, "epoch": 0.10770719122863592, "percentage": 10.77, "elapsed_time": "3:40:26", "remaining_time": "1 day, 6:26:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1170, "total_steps": 10853, "loss": 0.1905, "learning_rate": 4.954511035219835e-06, "epoch": 0.10779932740590593, "percentage": 10.78, "elapsed_time": "3:40:37", "remaining_time": "1 day, 6:25:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1171, "total_steps": 10853, "loss": 0.1893, "learning_rate": 4.954366262545871e-06, "epoch": 0.10789146358317593, "percentage": 10.79, "elapsed_time": "3:40:49", "remaining_time": "1 day, 6:25:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1172, "total_steps": 10853, "loss": 0.1841, "learning_rate": 4.954221261983736e-06, "epoch": 0.10798359976044594, "percentage": 10.8, "elapsed_time": "3:41:00", "remaining_time": "1 day, 6:25:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1173, "total_steps": 10853, "loss": 0.1942, "learning_rate": 4.954076033546892e-06, "epoch": 0.10807573593771594, "percentage": 10.81, "elapsed_time": "3:41:10", "remaining_time": "1 day, 6:25:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1174, "total_steps": 10853, "loss": 0.1924, "learning_rate": 4.953930577248825e-06, "epoch": 0.10816787211498595, "percentage": 10.82, "elapsed_time": "3:41:20", "remaining_time": "1 day, 6:24:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1175, "total_steps": 10853, "loss": 0.1795, "learning_rate": 4.95378489310304e-06, "epoch": 0.10826000829225596, "percentage": 10.83, "elapsed_time": "3:41:30", "remaining_time": "1 day, 6:24:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1176, "total_steps": 10853, "loss": 0.1859, "learning_rate": 4.953638981123063e-06, "epoch": 0.10835214446952596, "percentage": 10.84, "elapsed_time": "3:41:40", "remaining_time": "1 day, 6:24:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1177, "total_steps": 10853, "loss": 0.1685, "learning_rate": 4.9534928413224424e-06, "epoch": 0.10844428064679597, "percentage": 10.84, "elapsed_time": "3:41:51", "remaining_time": "1 day, 6:23:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1178, "total_steps": 10853, "loss": 0.1972, "learning_rate": 4.953346473714748e-06, "epoch": 0.10853641682406596, "percentage": 10.85, "elapsed_time": "3:42:03", "remaining_time": "1 day, 6:23:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1179, "total_steps": 10853, "loss": 0.1833, "learning_rate": 4.953199878313569e-06, "epoch": 0.10862855300133598, "percentage": 10.86, "elapsed_time": "3:42:14", "remaining_time": "1 day, 6:23:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1180, "total_steps": 10853, "loss": 0.1868, "learning_rate": 4.953053055132518e-06, "epoch": 0.10872068917860599, "percentage": 10.87, "elapsed_time": "3:42:24", "remaining_time": "1 day, 6:23:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1181, "total_steps": 10853, "loss": 0.1877, "learning_rate": 4.9529060041852264e-06, "epoch": 0.10881282535587598, "percentage": 10.88, "elapsed_time": "3:42:35", "remaining_time": "1 day, 6:22:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1182, "total_steps": 10853, "loss": 0.1765, "learning_rate": 4.9527587254853485e-06, "epoch": 0.108904961533146, "percentage": 10.89, "elapsed_time": "3:42:46", "remaining_time": "1 day, 6:22:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1183, "total_steps": 10853, "loss": 0.1975, "learning_rate": 4.952611219046559e-06, "epoch": 0.10899709771041599, "percentage": 10.9, "elapsed_time": "3:42:56", "remaining_time": "1 day, 6:22:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1184, "total_steps": 10853, "loss": 0.1746, "learning_rate": 4.952463484882553e-06, "epoch": 0.109089233887686, "percentage": 10.91, "elapsed_time": "3:43:06", "remaining_time": "1 day, 6:21:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1185, "total_steps": 10853, "loss": 0.1882, "learning_rate": 4.9523155230070495e-06, "epoch": 0.109181370064956, "percentage": 10.92, "elapsed_time": "3:43:17", "remaining_time": "1 day, 6:21:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1186, "total_steps": 10853, "loss": 0.1813, "learning_rate": 4.952167333433785e-06, "epoch": 0.10927350624222601, "percentage": 10.93, "elapsed_time": "3:43:27", "remaining_time": "1 day, 6:21:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1187, "total_steps": 10853, "loss": 0.1867, "learning_rate": 4.952018916176521e-06, "epoch": 0.10936564241949602, "percentage": 10.94, "elapsed_time": "3:43:38", "remaining_time": "1 day, 6:21:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1188, "total_steps": 10853, "loss": 0.1697, "learning_rate": 4.9518702712490355e-06, "epoch": 0.10945777859676602, "percentage": 10.95, "elapsed_time": "3:43:47", "remaining_time": "1 day, 6:20:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1189, "total_steps": 10853, "loss": 0.195, "learning_rate": 4.951721398665131e-06, "epoch": 0.10954991477403603, "percentage": 10.96, "elapsed_time": "3:43:58", "remaining_time": "1 day, 6:20:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1190, "total_steps": 10853, "loss": 0.1778, "learning_rate": 4.951572298438632e-06, "epoch": 0.10964205095130602, "percentage": 10.96, "elapsed_time": "3:44:08", "remaining_time": "1 day, 6:20:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1191, "total_steps": 10853, "loss": 0.182, "learning_rate": 4.95142297058338e-06, "epoch": 0.10973418712857604, "percentage": 10.97, "elapsed_time": "3:44:18", "remaining_time": "1 day, 6:19:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1192, "total_steps": 10853, "loss": 0.191, "learning_rate": 4.951273415113243e-06, "epoch": 0.10982632330584605, "percentage": 10.98, "elapsed_time": "3:44:28", "remaining_time": "1 day, 6:19:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1193, "total_steps": 10853, "loss": 0.1876, "learning_rate": 4.951123632042104e-06, "epoch": 0.10991845948311604, "percentage": 10.99, "elapsed_time": "3:44:38", "remaining_time": "1 day, 6:18:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1194, "total_steps": 10853, "loss": 0.1682, "learning_rate": 4.950973621383873e-06, "epoch": 0.11001059566038605, "percentage": 11.0, "elapsed_time": "3:44:47", "remaining_time": "1 day, 6:18:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1195, "total_steps": 10853, "loss": 0.2048, "learning_rate": 4.950823383152478e-06, "epoch": 0.11010273183765605, "percentage": 11.01, "elapsed_time": "3:44:57", "remaining_time": "1 day, 6:18:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1196, "total_steps": 10853, "loss": 0.1819, "learning_rate": 4.9506729173618675e-06, "epoch": 0.11019486801492606, "percentage": 11.02, "elapsed_time": "3:45:08", "remaining_time": "1 day, 6:17:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1197, "total_steps": 10853, "loss": 0.1729, "learning_rate": 4.950522224026012e-06, "epoch": 0.11028700419219607, "percentage": 11.03, "elapsed_time": "3:45:20", "remaining_time": "1 day, 6:17:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1198, "total_steps": 10853, "loss": 0.1789, "learning_rate": 4.950371303158905e-06, "epoch": 0.11037914036946607, "percentage": 11.04, "elapsed_time": "3:45:31", "remaining_time": "1 day, 6:17:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1199, "total_steps": 10853, "loss": 0.1733, "learning_rate": 4.950220154774559e-06, "epoch": 0.11047127654673608, "percentage": 11.05, "elapsed_time": "3:45:41", "remaining_time": "1 day, 6:17:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1200, "total_steps": 10853, "loss": 0.1753, "learning_rate": 4.950068778887007e-06, "epoch": 0.11056341272400608, "percentage": 11.06, "elapsed_time": "3:45:51", "remaining_time": "1 day, 6:16:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1201, "total_steps": 10853, "loss": 0.1912, "learning_rate": 4.949917175510307e-06, "epoch": 0.11065554890127609, "percentage": 11.07, "elapsed_time": "3:46:01", "remaining_time": "1 day, 6:16:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1202, "total_steps": 10853, "loss": 0.1807, "learning_rate": 4.949765344658532e-06, "epoch": 0.11074768507854608, "percentage": 11.08, "elapsed_time": "3:46:10", "remaining_time": "1 day, 6:16:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1203, "total_steps": 10853, "loss": 0.1897, "learning_rate": 4.949613286345781e-06, "epoch": 0.1108398212558161, "percentage": 11.08, "elapsed_time": "3:46:21", "remaining_time": "1 day, 6:15:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1204, "total_steps": 10853, "loss": 0.1855, "learning_rate": 4.9494610005861745e-06, "epoch": 0.1109319574330861, "percentage": 11.09, "elapsed_time": "3:46:33", "remaining_time": "1 day, 6:15:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1205, "total_steps": 10853, "loss": 0.1887, "learning_rate": 4.949308487393849e-06, "epoch": 0.1110240936103561, "percentage": 11.1, "elapsed_time": "3:46:45", "remaining_time": "1 day, 6:15:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1206, "total_steps": 10853, "loss": 0.2123, "learning_rate": 4.949155746782966e-06, "epoch": 0.11111622978762611, "percentage": 11.11, "elapsed_time": "3:46:57", "remaining_time": "1 day, 6:15:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1207, "total_steps": 10853, "loss": 0.1698, "learning_rate": 4.94900277876771e-06, "epoch": 0.11120836596489611, "percentage": 11.12, "elapsed_time": "3:47:07", "remaining_time": "1 day, 6:15:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1208, "total_steps": 10853, "loss": 0.1939, "learning_rate": 4.948849583362282e-06, "epoch": 0.11130050214216612, "percentage": 11.13, "elapsed_time": "3:47:18", "remaining_time": "1 day, 6:14:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1209, "total_steps": 10853, "loss": 0.2061, "learning_rate": 4.948696160580907e-06, "epoch": 0.11139263831943613, "percentage": 11.14, "elapsed_time": "3:47:28", "remaining_time": "1 day, 6:14:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1210, "total_steps": 10853, "loss": 0.1791, "learning_rate": 4.948542510437829e-06, "epoch": 0.11148477449670613, "percentage": 11.15, "elapsed_time": "3:47:38", "remaining_time": "1 day, 6:14:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1211, "total_steps": 10853, "loss": 0.1618, "learning_rate": 4.948388632947316e-06, "epoch": 0.11157691067397614, "percentage": 11.16, "elapsed_time": "3:47:49", "remaining_time": "1 day, 6:13:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1212, "total_steps": 10853, "loss": 0.1926, "learning_rate": 4.948234528123655e-06, "epoch": 0.11166904685124614, "percentage": 11.17, "elapsed_time": "3:48:01", "remaining_time": "1 day, 6:13:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1213, "total_steps": 10853, "loss": 0.1871, "learning_rate": 4.948080195981154e-06, "epoch": 0.11176118302851615, "percentage": 11.18, "elapsed_time": "3:48:10", "remaining_time": "1 day, 6:13:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1214, "total_steps": 10853, "loss": 0.1781, "learning_rate": 4.947925636534144e-06, "epoch": 0.11185331920578616, "percentage": 11.19, "elapsed_time": "3:48:21", "remaining_time": "1 day, 6:13:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1215, "total_steps": 10853, "loss": 0.1888, "learning_rate": 4.947770849796975e-06, "epoch": 0.11194545538305616, "percentage": 11.2, "elapsed_time": "3:48:32", "remaining_time": "1 day, 6:12:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1216, "total_steps": 10853, "loss": 0.1795, "learning_rate": 4.9476158357840194e-06, "epoch": 0.11203759156032617, "percentage": 11.2, "elapsed_time": "3:48:41", "remaining_time": "1 day, 6:12:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1217, "total_steps": 10853, "loss": 0.2044, "learning_rate": 4.9474605945096695e-06, "epoch": 0.11212972773759616, "percentage": 11.21, "elapsed_time": "3:48:51", "remaining_time": "1 day, 6:12:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1218, "total_steps": 10853, "loss": 0.1849, "learning_rate": 4.94730512598834e-06, "epoch": 0.11222186391486617, "percentage": 11.22, "elapsed_time": "3:49:02", "remaining_time": "1 day, 6:11:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1219, "total_steps": 10853, "loss": 0.1906, "learning_rate": 4.947149430234467e-06, "epoch": 0.11231400009213617, "percentage": 11.23, "elapsed_time": "3:49:12", "remaining_time": "1 day, 6:11:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1220, "total_steps": 10853, "loss": 0.1858, "learning_rate": 4.946993507262505e-06, "epoch": 0.11240613626940618, "percentage": 11.24, "elapsed_time": "3:49:21", "remaining_time": "1 day, 6:11:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1221, "total_steps": 10853, "loss": 0.1871, "learning_rate": 4.946837357086933e-06, "epoch": 0.11249827244667619, "percentage": 11.25, "elapsed_time": "3:49:34", "remaining_time": "1 day, 6:10:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1222, "total_steps": 10853, "loss": 0.2072, "learning_rate": 4.946680979722249e-06, "epoch": 0.11259040862394619, "percentage": 11.26, "elapsed_time": "3:49:44", "remaining_time": "1 day, 6:10:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1223, "total_steps": 10853, "loss": 0.1849, "learning_rate": 4.946524375182973e-06, "epoch": 0.1126825448012162, "percentage": 11.27, "elapsed_time": "3:49:55", "remaining_time": "1 day, 6:10:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1224, "total_steps": 10853, "loss": 0.1948, "learning_rate": 4.946367543483645e-06, "epoch": 0.1127746809784862, "percentage": 11.28, "elapsed_time": "3:50:06", "remaining_time": "1 day, 6:10:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1225, "total_steps": 10853, "loss": 0.1842, "learning_rate": 4.946210484638827e-06, "epoch": 0.11286681715575621, "percentage": 11.29, "elapsed_time": "3:50:17", "remaining_time": "1 day, 6:09:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1226, "total_steps": 10853, "loss": 0.1647, "learning_rate": 4.946053198663103e-06, "epoch": 0.11295895333302622, "percentage": 11.3, "elapsed_time": "3:50:27", "remaining_time": "1 day, 6:09:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1227, "total_steps": 10853, "loss": 0.2078, "learning_rate": 4.945895685571076e-06, "epoch": 0.11305108951029622, "percentage": 11.31, "elapsed_time": "3:50:38", "remaining_time": "1 day, 6:09:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1228, "total_steps": 10853, "loss": 0.1812, "learning_rate": 4.945737945377372e-06, "epoch": 0.11314322568756623, "percentage": 11.31, "elapsed_time": "3:50:49", "remaining_time": "1 day, 6:09:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1229, "total_steps": 10853, "loss": 0.1841, "learning_rate": 4.945579978096635e-06, "epoch": 0.11323536186483622, "percentage": 11.32, "elapsed_time": "3:51:00", "remaining_time": "1 day, 6:08:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1230, "total_steps": 10853, "loss": 0.1818, "learning_rate": 4.945421783743535e-06, "epoch": 0.11332749804210623, "percentage": 11.33, "elapsed_time": "3:51:11", "remaining_time": "1 day, 6:08:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1231, "total_steps": 10853, "loss": 0.1857, "learning_rate": 4.945263362332759e-06, "epoch": 0.11341963421937624, "percentage": 11.34, "elapsed_time": "3:51:22", "remaining_time": "1 day, 6:08:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1232, "total_steps": 10853, "loss": 0.1891, "learning_rate": 4.945104713879017e-06, "epoch": 0.11351177039664624, "percentage": 11.35, "elapsed_time": "3:51:33", "remaining_time": "1 day, 6:08:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1233, "total_steps": 10853, "loss": 0.1791, "learning_rate": 4.9449458383970386e-06, "epoch": 0.11360390657391625, "percentage": 11.36, "elapsed_time": "3:51:45", "remaining_time": "1 day, 6:08:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1234, "total_steps": 10853, "loss": 0.1794, "learning_rate": 4.944786735901576e-06, "epoch": 0.11369604275118625, "percentage": 11.37, "elapsed_time": "3:51:56", "remaining_time": "1 day, 6:07:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1235, "total_steps": 10853, "loss": 0.1932, "learning_rate": 4.944627406407401e-06, "epoch": 0.11378817892845626, "percentage": 11.38, "elapsed_time": "3:52:07", "remaining_time": "1 day, 6:07:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1236, "total_steps": 10853, "loss": 0.17, "learning_rate": 4.94446784992931e-06, "epoch": 0.11388031510572626, "percentage": 11.39, "elapsed_time": "3:52:18", "remaining_time": "1 day, 6:07:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1237, "total_steps": 10853, "loss": 0.1939, "learning_rate": 4.9443080664821156e-06, "epoch": 0.11397245128299627, "percentage": 11.4, "elapsed_time": "3:52:29", "remaining_time": "1 day, 6:07:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1238, "total_steps": 10853, "loss": 0.1994, "learning_rate": 4.944148056080654e-06, "epoch": 0.11406458746026628, "percentage": 11.41, "elapsed_time": "3:52:40", "remaining_time": "1 day, 6:07:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1239, "total_steps": 10853, "loss": 0.1876, "learning_rate": 4.943987818739782e-06, "epoch": 0.11415672363753628, "percentage": 11.42, "elapsed_time": "3:52:53", "remaining_time": "1 day, 6:07:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1240, "total_steps": 10853, "loss": 0.1894, "learning_rate": 4.943827354474378e-06, "epoch": 0.11424885981480629, "percentage": 11.43, "elapsed_time": "3:53:02", "remaining_time": "1 day, 6:06:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1241, "total_steps": 10853, "loss": 0.1729, "learning_rate": 4.943666663299341e-06, "epoch": 0.11434099599207628, "percentage": 11.43, "elapsed_time": "3:53:12", "remaining_time": "1 day, 6:06:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1242, "total_steps": 10853, "loss": 0.1855, "learning_rate": 4.943505745229592e-06, "epoch": 0.1144331321693463, "percentage": 11.44, "elapsed_time": "3:53:24", "remaining_time": "1 day, 6:06:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1243, "total_steps": 10853, "loss": 0.2035, "learning_rate": 4.943344600280071e-06, "epoch": 0.1145252683466163, "percentage": 11.45, "elapsed_time": "3:53:36", "remaining_time": "1 day, 6:06:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1244, "total_steps": 10853, "loss": 0.1993, "learning_rate": 4.943183228465742e-06, "epoch": 0.1146174045238863, "percentage": 11.46, "elapsed_time": "3:53:46", "remaining_time": "1 day, 6:05:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1245, "total_steps": 10853, "loss": 0.1691, "learning_rate": 4.943021629801586e-06, "epoch": 0.11470954070115631, "percentage": 11.47, "elapsed_time": "3:53:57", "remaining_time": "1 day, 6:05:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1246, "total_steps": 10853, "loss": 0.1846, "learning_rate": 4.9428598043026085e-06, "epoch": 0.11480167687842631, "percentage": 11.48, "elapsed_time": "3:54:08", "remaining_time": "1 day, 6:05:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1247, "total_steps": 10853, "loss": 0.1773, "learning_rate": 4.942697751983837e-06, "epoch": 0.11489381305569632, "percentage": 11.49, "elapsed_time": "3:54:18", "remaining_time": "1 day, 6:04:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1248, "total_steps": 10853, "loss": 0.1787, "learning_rate": 4.942535472860315e-06, "epoch": 0.11498594923296633, "percentage": 11.5, "elapsed_time": "3:54:30", "remaining_time": "1 day, 6:04:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1249, "total_steps": 10853, "loss": 0.1866, "learning_rate": 4.942372966947112e-06, "epoch": 0.11507808541023633, "percentage": 11.51, "elapsed_time": "3:54:41", "remaining_time": "1 day, 6:04:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1250, "total_steps": 10853, "loss": 0.1778, "learning_rate": 4.942210234259316e-06, "epoch": 0.11517022158750634, "percentage": 11.52, "elapsed_time": "3:54:51", "remaining_time": "1 day, 6:04:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1251, "total_steps": 10853, "loss": 0.1941, "learning_rate": 4.9420472748120365e-06, "epoch": 0.11526235776477634, "percentage": 11.53, "elapsed_time": "3:55:02", "remaining_time": "1 day, 6:04:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1252, "total_steps": 10853, "loss": 0.1731, "learning_rate": 4.941884088620405e-06, "epoch": 0.11535449394204635, "percentage": 11.54, "elapsed_time": "3:55:13", "remaining_time": "1 day, 6:03:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1253, "total_steps": 10853, "loss": 0.1819, "learning_rate": 4.941720675699573e-06, "epoch": 0.11544663011931634, "percentage": 11.55, "elapsed_time": "3:55:23", "remaining_time": "1 day, 6:03:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1254, "total_steps": 10853, "loss": 0.1838, "learning_rate": 4.941557036064714e-06, "epoch": 0.11553876629658635, "percentage": 11.55, "elapsed_time": "3:55:35", "remaining_time": "1 day, 6:03:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1255, "total_steps": 10853, "loss": 0.197, "learning_rate": 4.9413931697310215e-06, "epoch": 0.11563090247385636, "percentage": 11.56, "elapsed_time": "3:55:46", "remaining_time": "1 day, 6:03:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1256, "total_steps": 10853, "loss": 0.1999, "learning_rate": 4.941229076713709e-06, "epoch": 0.11572303865112636, "percentage": 11.57, "elapsed_time": "3:55:56", "remaining_time": "1 day, 6:02:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1257, "total_steps": 10853, "loss": 0.1699, "learning_rate": 4.9410647570280156e-06, "epoch": 0.11581517482839637, "percentage": 11.58, "elapsed_time": "3:56:09", "remaining_time": "1 day, 6:02:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1258, "total_steps": 10853, "loss": 0.1965, "learning_rate": 4.940900210689196e-06, "epoch": 0.11590731100566637, "percentage": 11.59, "elapsed_time": "3:56:20", "remaining_time": "1 day, 6:02:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1259, "total_steps": 10853, "loss": 0.1971, "learning_rate": 4.94073543771253e-06, "epoch": 0.11599944718293638, "percentage": 11.6, "elapsed_time": "3:56:31", "remaining_time": "1 day, 6:02:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1260, "total_steps": 10853, "loss": 0.1916, "learning_rate": 4.940570438113315e-06, "epoch": 0.11609158336020639, "percentage": 11.61, "elapsed_time": "3:56:42", "remaining_time": "1 day, 6:02:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1261, "total_steps": 10853, "loss": 0.19, "learning_rate": 4.940405211906872e-06, "epoch": 0.11618371953747639, "percentage": 11.62, "elapsed_time": "3:56:53", "remaining_time": "1 day, 6:01:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1262, "total_steps": 10853, "loss": 0.1901, "learning_rate": 4.9402397591085435e-06, "epoch": 0.1162758557147464, "percentage": 11.63, "elapsed_time": "3:57:04", "remaining_time": "1 day, 6:01:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1263, "total_steps": 10853, "loss": 0.2099, "learning_rate": 4.94007407973369e-06, "epoch": 0.1163679918920164, "percentage": 11.64, "elapsed_time": "3:57:14", "remaining_time": "1 day, 6:01:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1264, "total_steps": 10853, "loss": 0.1796, "learning_rate": 4.939908173797696e-06, "epoch": 0.1164601280692864, "percentage": 11.65, "elapsed_time": "3:57:25", "remaining_time": "1 day, 6:01:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1265, "total_steps": 10853, "loss": 0.1764, "learning_rate": 4.939742041315964e-06, "epoch": 0.11655226424655642, "percentage": 11.66, "elapsed_time": "3:57:35", "remaining_time": "1 day, 6:00:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1266, "total_steps": 10853, "loss": 0.1946, "learning_rate": 4.939575682303923e-06, "epoch": 0.11664440042382641, "percentage": 11.66, "elapsed_time": "3:57:45", "remaining_time": "1 day, 6:00:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1267, "total_steps": 10853, "loss": 0.1816, "learning_rate": 4.939409096777017e-06, "epoch": 0.11673653660109642, "percentage": 11.67, "elapsed_time": "3:57:55", "remaining_time": "1 day, 6:00:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1268, "total_steps": 10853, "loss": 0.1787, "learning_rate": 4.939242284750712e-06, "epoch": 0.11682867277836642, "percentage": 11.68, "elapsed_time": "3:58:05", "remaining_time": "1 day, 5:59:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1269, "total_steps": 10853, "loss": 0.182, "learning_rate": 4.9390752462405e-06, "epoch": 0.11692080895563643, "percentage": 11.69, "elapsed_time": "3:58:16", "remaining_time": "1 day, 5:59:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1270, "total_steps": 10853, "loss": 0.1925, "learning_rate": 4.938907981261889e-06, "epoch": 0.11701294513290643, "percentage": 11.7, "elapsed_time": "3:58:28", "remaining_time": "1 day, 5:59:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1271, "total_steps": 10853, "loss": 0.1858, "learning_rate": 4.938740489830409e-06, "epoch": 0.11710508131017644, "percentage": 11.71, "elapsed_time": "3:58:40", "remaining_time": "1 day, 5:59:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1272, "total_steps": 10853, "loss": 0.193, "learning_rate": 4.938572771961612e-06, "epoch": 0.11719721748744645, "percentage": 11.72, "elapsed_time": "3:58:50", "remaining_time": "1 day, 5:58:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1273, "total_steps": 10853, "loss": 0.1942, "learning_rate": 4.93840482767107e-06, "epoch": 0.11728935366471645, "percentage": 11.73, "elapsed_time": "3:59:01", "remaining_time": "1 day, 5:58:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1274, "total_steps": 10853, "loss": 0.1703, "learning_rate": 4.938236656974378e-06, "epoch": 0.11738148984198646, "percentage": 11.74, "elapsed_time": "3:59:11", "remaining_time": "1 day, 5:58:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1275, "total_steps": 10853, "loss": 0.1821, "learning_rate": 4.9380682598871505e-06, "epoch": 0.11747362601925646, "percentage": 11.75, "elapsed_time": "3:59:21", "remaining_time": "1 day, 5:58:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1276, "total_steps": 10853, "loss": 0.2, "learning_rate": 4.937899636425022e-06, "epoch": 0.11756576219652647, "percentage": 11.76, "elapsed_time": "3:59:33", "remaining_time": "1 day, 5:57:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1277, "total_steps": 10853, "loss": 0.1895, "learning_rate": 4.9377307866036506e-06, "epoch": 0.11765789837379648, "percentage": 11.77, "elapsed_time": "3:59:42", "remaining_time": "1 day, 5:57:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1278, "total_steps": 10853, "loss": 0.1887, "learning_rate": 4.9375617104387124e-06, "epoch": 0.11775003455106647, "percentage": 11.78, "elapsed_time": "3:59:52", "remaining_time": "1 day, 5:57:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1279, "total_steps": 10853, "loss": 0.1895, "learning_rate": 4.9373924079459076e-06, "epoch": 0.11784217072833648, "percentage": 11.78, "elapsed_time": "4:00:02", "remaining_time": "1 day, 5:56:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1280, "total_steps": 10853, "loss": 0.1948, "learning_rate": 4.937222879140955e-06, "epoch": 0.11793430690560648, "percentage": 11.79, "elapsed_time": "4:00:13", "remaining_time": "1 day, 5:56:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1281, "total_steps": 10853, "loss": 0.1793, "learning_rate": 4.937053124039597e-06, "epoch": 0.11802644308287649, "percentage": 11.8, "elapsed_time": "4:00:23", "remaining_time": "1 day, 5:56:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1282, "total_steps": 10853, "loss": 0.182, "learning_rate": 4.9368831426575925e-06, "epoch": 0.1181185792601465, "percentage": 11.81, "elapsed_time": "4:00:34", "remaining_time": "1 day, 5:56:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1283, "total_steps": 10853, "loss": 0.1837, "learning_rate": 4.9367129350107265e-06, "epoch": 0.1182107154374165, "percentage": 11.82, "elapsed_time": "4:00:45", "remaining_time": "1 day, 5:55:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1284, "total_steps": 10853, "loss": 0.1852, "learning_rate": 4.936542501114803e-06, "epoch": 0.11830285161468651, "percentage": 11.83, "elapsed_time": "4:00:56", "remaining_time": "1 day, 5:55:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1285, "total_steps": 10853, "loss": 0.17, "learning_rate": 4.936371840985645e-06, "epoch": 0.11839498779195651, "percentage": 11.84, "elapsed_time": "4:01:07", "remaining_time": "1 day, 5:55:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1286, "total_steps": 10853, "loss": 0.1717, "learning_rate": 4.9362009546391e-06, "epoch": 0.11848712396922652, "percentage": 11.85, "elapsed_time": "4:01:18", "remaining_time": "1 day, 5:55:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1287, "total_steps": 10853, "loss": 0.1647, "learning_rate": 4.9360298420910335e-06, "epoch": 0.11857926014649652, "percentage": 11.86, "elapsed_time": "4:01:29", "remaining_time": "1 day, 5:54:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1288, "total_steps": 10853, "loss": 0.1872, "learning_rate": 4.935858503357335e-06, "epoch": 0.11867139632376653, "percentage": 11.87, "elapsed_time": "4:01:41", "remaining_time": "1 day, 5:54:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1289, "total_steps": 10853, "loss": 0.19, "learning_rate": 4.935686938453912e-06, "epoch": 0.11876353250103654, "percentage": 11.88, "elapsed_time": "4:01:52", "remaining_time": "1 day, 5:54:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1290, "total_steps": 10853, "loss": 0.1942, "learning_rate": 4.935515147396695e-06, "epoch": 0.11885566867830653, "percentage": 11.89, "elapsed_time": "4:02:04", "remaining_time": "1 day, 5:54:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1291, "total_steps": 10853, "loss": 0.1719, "learning_rate": 4.935343130201633e-06, "epoch": 0.11894780485557654, "percentage": 11.9, "elapsed_time": "4:02:16", "remaining_time": "1 day, 5:54:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1292, "total_steps": 10853, "loss": 0.1981, "learning_rate": 4.935170886884701e-06, "epoch": 0.11903994103284654, "percentage": 11.9, "elapsed_time": "4:02:27", "remaining_time": "1 day, 5:54:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1293, "total_steps": 10853, "loss": 0.1832, "learning_rate": 4.934998417461888e-06, "epoch": 0.11913207721011655, "percentage": 11.91, "elapsed_time": "4:02:37", "remaining_time": "1 day, 5:53:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1294, "total_steps": 10853, "loss": 0.1683, "learning_rate": 4.9348257219492116e-06, "epoch": 0.11922421338738656, "percentage": 11.92, "elapsed_time": "4:02:48", "remaining_time": "1 day, 5:53:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1295, "total_steps": 10853, "loss": 0.2061, "learning_rate": 4.934652800362704e-06, "epoch": 0.11931634956465656, "percentage": 11.93, "elapsed_time": "4:02:59", "remaining_time": "1 day, 5:53:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1296, "total_steps": 10853, "loss": 0.1865, "learning_rate": 4.934479652718422e-06, "epoch": 0.11940848574192657, "percentage": 11.94, "elapsed_time": "4:03:11", "remaining_time": "1 day, 5:53:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1297, "total_steps": 10853, "loss": 0.1836, "learning_rate": 4.934306279032442e-06, "epoch": 0.11950062191919657, "percentage": 11.95, "elapsed_time": "4:03:21", "remaining_time": "1 day, 5:53:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1298, "total_steps": 10853, "loss": 0.1818, "learning_rate": 4.934132679320863e-06, "epoch": 0.11959275809646658, "percentage": 11.96, "elapsed_time": "4:03:33", "remaining_time": "1 day, 5:52:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1299, "total_steps": 10853, "loss": 0.2019, "learning_rate": 4.933958853599803e-06, "epoch": 0.11968489427373659, "percentage": 11.97, "elapsed_time": "4:03:44", "remaining_time": "1 day, 5:52:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1300, "total_steps": 10853, "loss": 0.191, "learning_rate": 4.9337848018854005e-06, "epoch": 0.11977703045100659, "percentage": 11.98, "elapsed_time": "4:03:56", "remaining_time": "1 day, 5:52:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1301, "total_steps": 10853, "loss": 0.1575, "learning_rate": 4.933610524193817e-06, "epoch": 0.1198691666282766, "percentage": 11.99, "elapsed_time": "4:04:06", "remaining_time": "1 day, 5:52:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1302, "total_steps": 10853, "loss": 0.1935, "learning_rate": 4.933436020541235e-06, "epoch": 0.1199613028055466, "percentage": 12.0, "elapsed_time": "4:04:17", "remaining_time": "1 day, 5:52:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1303, "total_steps": 10853, "loss": 0.1634, "learning_rate": 4.933261290943856e-06, "epoch": 0.1200534389828166, "percentage": 12.01, "elapsed_time": "4:04:28", "remaining_time": "1 day, 5:51:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1304, "total_steps": 10853, "loss": 0.1912, "learning_rate": 4.933086335417905e-06, "epoch": 0.1201455751600866, "percentage": 12.02, "elapsed_time": "4:04:39", "remaining_time": "1 day, 5:51:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1305, "total_steps": 10853, "loss": 0.1788, "learning_rate": 4.932911153979626e-06, "epoch": 0.12023771133735661, "percentage": 12.02, "elapsed_time": "4:04:48", "remaining_time": "1 day, 5:51:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1306, "total_steps": 10853, "loss": 0.1872, "learning_rate": 4.932735746645284e-06, "epoch": 0.12032984751462662, "percentage": 12.03, "elapsed_time": "4:04:59", "remaining_time": "1 day, 5:50:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1307, "total_steps": 10853, "loss": 0.1716, "learning_rate": 4.9325601134311665e-06, "epoch": 0.12042198369189662, "percentage": 12.04, "elapsed_time": "4:05:09", "remaining_time": "1 day, 5:50:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1308, "total_steps": 10853, "loss": 0.2076, "learning_rate": 4.932384254353581e-06, "epoch": 0.12051411986916663, "percentage": 12.05, "elapsed_time": "4:05:19", "remaining_time": "1 day, 5:50:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1309, "total_steps": 10853, "loss": 0.1822, "learning_rate": 4.932208169428855e-06, "epoch": 0.12060625604643663, "percentage": 12.06, "elapsed_time": "4:05:29", "remaining_time": "1 day, 5:49:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1310, "total_steps": 10853, "loss": 0.1814, "learning_rate": 4.932031858673338e-06, "epoch": 0.12069839222370664, "percentage": 12.07, "elapsed_time": "4:05:40", "remaining_time": "1 day, 5:49:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1311, "total_steps": 10853, "loss": 0.1932, "learning_rate": 4.931855322103403e-06, "epoch": 0.12079052840097665, "percentage": 12.08, "elapsed_time": "4:05:51", "remaining_time": "1 day, 5:49:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1312, "total_steps": 10853, "loss": 0.1805, "learning_rate": 4.9316785597354385e-06, "epoch": 0.12088266457824665, "percentage": 12.09, "elapsed_time": "4:06:01", "remaining_time": "1 day, 5:49:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1313, "total_steps": 10853, "loss": 0.1845, "learning_rate": 4.931501571585858e-06, "epoch": 0.12097480075551666, "percentage": 12.1, "elapsed_time": "4:06:11", "remaining_time": "1 day, 5:48:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1314, "total_steps": 10853, "loss": 0.1851, "learning_rate": 4.931324357671095e-06, "epoch": 0.12106693693278665, "percentage": 12.11, "elapsed_time": "4:06:23", "remaining_time": "1 day, 5:48:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1315, "total_steps": 10853, "loss": 0.1836, "learning_rate": 4.931146918007604e-06, "epoch": 0.12115907311005666, "percentage": 12.12, "elapsed_time": "4:06:33", "remaining_time": "1 day, 5:48:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1316, "total_steps": 10853, "loss": 0.1784, "learning_rate": 4.93096925261186e-06, "epoch": 0.12125120928732668, "percentage": 12.13, "elapsed_time": "4:06:45", "remaining_time": "1 day, 5:48:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1317, "total_steps": 10853, "loss": 0.1995, "learning_rate": 4.930791361500359e-06, "epoch": 0.12134334546459667, "percentage": 12.13, "elapsed_time": "4:06:57", "remaining_time": "1 day, 5:48:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1318, "total_steps": 10853, "loss": 0.1876, "learning_rate": 4.930613244689618e-06, "epoch": 0.12143548164186668, "percentage": 12.14, "elapsed_time": "4:07:08", "remaining_time": "1 day, 5:47:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1319, "total_steps": 10853, "loss": 0.1844, "learning_rate": 4.930434902196177e-06, "epoch": 0.12152761781913668, "percentage": 12.15, "elapsed_time": "4:07:19", "remaining_time": "1 day, 5:47:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1320, "total_steps": 10853, "loss": 0.1834, "learning_rate": 4.930256334036593e-06, "epoch": 0.12161975399640669, "percentage": 12.16, "elapsed_time": "4:07:29", "remaining_time": "1 day, 5:47:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1321, "total_steps": 10853, "loss": 0.1792, "learning_rate": 4.930077540227447e-06, "epoch": 0.12171189017367669, "percentage": 12.17, "elapsed_time": "4:07:41", "remaining_time": "1 day, 5:47:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1322, "total_steps": 10853, "loss": 0.1636, "learning_rate": 4.92989852078534e-06, "epoch": 0.1218040263509467, "percentage": 12.18, "elapsed_time": "4:07:52", "remaining_time": "1 day, 5:47:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1323, "total_steps": 10853, "loss": 0.1838, "learning_rate": 4.929719275726893e-06, "epoch": 0.12189616252821671, "percentage": 12.19, "elapsed_time": "4:08:03", "remaining_time": "1 day, 5:46:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1324, "total_steps": 10853, "loss": 0.1737, "learning_rate": 4.9295398050687505e-06, "epoch": 0.1219882987054867, "percentage": 12.2, "elapsed_time": "4:08:14", "remaining_time": "1 day, 5:46:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1325, "total_steps": 10853, "loss": 0.1867, "learning_rate": 4.929360108827575e-06, "epoch": 0.12208043488275672, "percentage": 12.21, "elapsed_time": "4:08:26", "remaining_time": "1 day, 5:46:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1326, "total_steps": 10853, "loss": 0.1873, "learning_rate": 4.929180187020053e-06, "epoch": 0.12217257106002671, "percentage": 12.22, "elapsed_time": "4:08:38", "remaining_time": "1 day, 5:46:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1327, "total_steps": 10853, "loss": 0.1845, "learning_rate": 4.9290000396628875e-06, "epoch": 0.12226470723729672, "percentage": 12.23, "elapsed_time": "4:08:48", "remaining_time": "1 day, 5:46:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1328, "total_steps": 10853, "loss": 0.1789, "learning_rate": 4.928819666772808e-06, "epoch": 0.12235684341456673, "percentage": 12.24, "elapsed_time": "4:09:00", "remaining_time": "1 day, 5:45:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1329, "total_steps": 10853, "loss": 0.1886, "learning_rate": 4.9286390683665615e-06, "epoch": 0.12244897959183673, "percentage": 12.25, "elapsed_time": "4:09:12", "remaining_time": "1 day, 5:45:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1330, "total_steps": 10853, "loss": 0.1816, "learning_rate": 4.9284582444609156e-06, "epoch": 0.12254111576910674, "percentage": 12.25, "elapsed_time": "4:09:24", "remaining_time": "1 day, 5:45:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1331, "total_steps": 10853, "loss": 0.1864, "learning_rate": 4.9282771950726605e-06, "epoch": 0.12263325194637674, "percentage": 12.26, "elapsed_time": "4:09:36", "remaining_time": "1 day, 5:45:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1332, "total_steps": 10853, "loss": 0.1797, "learning_rate": 4.928095920218606e-06, "epoch": 0.12272538812364675, "percentage": 12.27, "elapsed_time": "4:09:46", "remaining_time": "1 day, 5:45:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1333, "total_steps": 10853, "loss": 0.1858, "learning_rate": 4.927914419915585e-06, "epoch": 0.12281752430091676, "percentage": 12.28, "elapsed_time": "4:09:58", "remaining_time": "1 day, 5:45:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1334, "total_steps": 10853, "loss": 0.1894, "learning_rate": 4.927732694180448e-06, "epoch": 0.12290966047818676, "percentage": 12.29, "elapsed_time": "4:10:08", "remaining_time": "1 day, 5:44:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1335, "total_steps": 10853, "loss": 0.19, "learning_rate": 4.9275507430300694e-06, "epoch": 0.12300179665545677, "percentage": 12.3, "elapsed_time": "4:10:18", "remaining_time": "1 day, 5:44:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1336, "total_steps": 10853, "loss": 0.1768, "learning_rate": 4.927368566481343e-06, "epoch": 0.12309393283272677, "percentage": 12.31, "elapsed_time": "4:10:29", "remaining_time": "1 day, 5:44:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1337, "total_steps": 10853, "loss": 0.1661, "learning_rate": 4.927186164551184e-06, "epoch": 0.12318606900999678, "percentage": 12.32, "elapsed_time": "4:10:38", "remaining_time": "1 day, 5:43:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1338, "total_steps": 10853, "loss": 0.1896, "learning_rate": 4.927003537256528e-06, "epoch": 0.12327820518726679, "percentage": 12.33, "elapsed_time": "4:10:48", "remaining_time": "1 day, 5:43:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1339, "total_steps": 10853, "loss": 0.1783, "learning_rate": 4.926820684614333e-06, "epoch": 0.12337034136453678, "percentage": 12.34, "elapsed_time": "4:11:00", "remaining_time": "1 day, 5:43:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1340, "total_steps": 10853, "loss": 0.2, "learning_rate": 4.9266376066415764e-06, "epoch": 0.1234624775418068, "percentage": 12.35, "elapsed_time": "4:11:11", "remaining_time": "1 day, 5:43:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1341, "total_steps": 10853, "loss": 0.1778, "learning_rate": 4.926454303355256e-06, "epoch": 0.12355461371907679, "percentage": 12.36, "elapsed_time": "4:11:20", "remaining_time": "1 day, 5:42:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1342, "total_steps": 10853, "loss": 0.1868, "learning_rate": 4.926270774772392e-06, "epoch": 0.1236467498963468, "percentage": 12.37, "elapsed_time": "4:11:31", "remaining_time": "1 day, 5:42:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1343, "total_steps": 10853, "loss": 0.1689, "learning_rate": 4.926087020910027e-06, "epoch": 0.1237388860736168, "percentage": 12.37, "elapsed_time": "4:11:41", "remaining_time": "1 day, 5:42:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1344, "total_steps": 10853, "loss": 0.1915, "learning_rate": 4.925903041785221e-06, "epoch": 0.12383102225088681, "percentage": 12.38, "elapsed_time": "4:11:52", "remaining_time": "1 day, 5:42:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1345, "total_steps": 10853, "loss": 0.1874, "learning_rate": 4.925718837415055e-06, "epoch": 0.12392315842815682, "percentage": 12.39, "elapsed_time": "4:12:03", "remaining_time": "1 day, 5:41:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1346, "total_steps": 10853, "loss": 0.1769, "learning_rate": 4.925534407816634e-06, "epoch": 0.12401529460542682, "percentage": 12.4, "elapsed_time": "4:12:12", "remaining_time": "1 day, 5:41:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1347, "total_steps": 10853, "loss": 0.1737, "learning_rate": 4.925349753007083e-06, "epoch": 0.12410743078269683, "percentage": 12.41, "elapsed_time": "4:12:24", "remaining_time": "1 day, 5:41:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1348, "total_steps": 10853, "loss": 0.184, "learning_rate": 4.925164873003546e-06, "epoch": 0.12419956695996683, "percentage": 12.42, "elapsed_time": "4:12:34", "remaining_time": "1 day, 5:40:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1349, "total_steps": 10853, "loss": 0.1924, "learning_rate": 4.92497976782319e-06, "epoch": 0.12429170313723684, "percentage": 12.43, "elapsed_time": "4:12:45", "remaining_time": "1 day, 5:40:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1350, "total_steps": 10853, "loss": 0.1723, "learning_rate": 4.924794437483202e-06, "epoch": 0.12438383931450685, "percentage": 12.44, "elapsed_time": "4:12:56", "remaining_time": "1 day, 5:40:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1351, "total_steps": 10853, "loss": 0.1987, "learning_rate": 4.924608882000789e-06, "epoch": 0.12447597549177684, "percentage": 12.45, "elapsed_time": "4:13:08", "remaining_time": "1 day, 5:40:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1352, "total_steps": 10853, "loss": 0.1765, "learning_rate": 4.92442310139318e-06, "epoch": 0.12456811166904685, "percentage": 12.46, "elapsed_time": "4:13:20", "remaining_time": "1 day, 5:40:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1353, "total_steps": 10853, "loss": 0.1783, "learning_rate": 4.924237095677625e-06, "epoch": 0.12466024784631685, "percentage": 12.47, "elapsed_time": "4:13:31", "remaining_time": "1 day, 5:40:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1354, "total_steps": 10853, "loss": 0.191, "learning_rate": 4.924050864871396e-06, "epoch": 0.12475238402358686, "percentage": 12.48, "elapsed_time": "4:13:41", "remaining_time": "1 day, 5:39:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1355, "total_steps": 10853, "loss": 0.1873, "learning_rate": 4.923864408991782e-06, "epoch": 0.12484452020085687, "percentage": 12.49, "elapsed_time": "4:13:51", "remaining_time": "1 day, 5:39:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1356, "total_steps": 10853, "loss": 0.184, "learning_rate": 4.923677728056098e-06, "epoch": 0.12493665637812687, "percentage": 12.49, "elapsed_time": "4:14:01", "remaining_time": "1 day, 5:39:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1357, "total_steps": 10853, "loss": 0.1831, "learning_rate": 4.923490822081675e-06, "epoch": 0.12502879255539687, "percentage": 12.5, "elapsed_time": "4:14:11", "remaining_time": "1 day, 5:38:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1358, "total_steps": 10853, "loss": 0.1716, "learning_rate": 4.923303691085869e-06, "epoch": 0.1251209287326669, "percentage": 12.51, "elapsed_time": "4:14:22", "remaining_time": "1 day, 5:38:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1359, "total_steps": 10853, "loss": 0.1734, "learning_rate": 4.9231163350860535e-06, "epoch": 0.1252130649099369, "percentage": 12.52, "elapsed_time": "4:14:33", "remaining_time": "1 day, 5:38:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1360, "total_steps": 10853, "loss": 0.1706, "learning_rate": 4.922928754099626e-06, "epoch": 0.12530520108720689, "percentage": 12.53, "elapsed_time": "4:14:45", "remaining_time": "1 day, 5:38:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1361, "total_steps": 10853, "loss": 0.2038, "learning_rate": 4.9227409481440034e-06, "epoch": 0.1253973372644769, "percentage": 12.54, "elapsed_time": "4:14:57", "remaining_time": "1 day, 5:38:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1362, "total_steps": 10853, "loss": 0.1746, "learning_rate": 4.922552917236622e-06, "epoch": 0.1254894734417469, "percentage": 12.55, "elapsed_time": "4:15:08", "remaining_time": "1 day, 5:37:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1363, "total_steps": 10853, "loss": 0.1879, "learning_rate": 4.922364661394943e-06, "epoch": 0.1255816096190169, "percentage": 12.56, "elapsed_time": "4:15:16", "remaining_time": "1 day, 5:37:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1364, "total_steps": 10853, "loss": 0.1632, "learning_rate": 4.922176180636443e-06, "epoch": 0.1256737457962869, "percentage": 12.57, "elapsed_time": "4:15:26", "remaining_time": "1 day, 5:37:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1365, "total_steps": 10853, "loss": 0.1888, "learning_rate": 4.921987474978626e-06, "epoch": 0.12576588197355693, "percentage": 12.58, "elapsed_time": "4:15:36", "remaining_time": "1 day, 5:36:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1366, "total_steps": 10853, "loss": 0.1875, "learning_rate": 4.921798544439009e-06, "epoch": 0.12585801815082692, "percentage": 12.59, "elapsed_time": "4:15:49", "remaining_time": "1 day, 5:36:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1367, "total_steps": 10853, "loss": 0.1997, "learning_rate": 4.921609389035138e-06, "epoch": 0.12595015432809692, "percentage": 12.6, "elapsed_time": "4:16:00", "remaining_time": "1 day, 5:36:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1368, "total_steps": 10853, "loss": 0.1905, "learning_rate": 4.921420008784573e-06, "epoch": 0.12604229050536694, "percentage": 12.6, "elapsed_time": "4:16:12", "remaining_time": "1 day, 5:36:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1369, "total_steps": 10853, "loss": 0.1829, "learning_rate": 4.9212304037049015e-06, "epoch": 0.12613442668263694, "percentage": 12.61, "elapsed_time": "4:16:22", "remaining_time": "1 day, 5:36:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1370, "total_steps": 10853, "loss": 0.1732, "learning_rate": 4.921040573813726e-06, "epoch": 0.12622656285990694, "percentage": 12.62, "elapsed_time": "4:16:32", "remaining_time": "1 day, 5:35:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1371, "total_steps": 10853, "loss": 0.1855, "learning_rate": 4.9208505191286714e-06, "epoch": 0.12631869903717693, "percentage": 12.63, "elapsed_time": "4:16:43", "remaining_time": "1 day, 5:35:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1372, "total_steps": 10853, "loss": 0.209, "learning_rate": 4.920660239667387e-06, "epoch": 0.12641083521444696, "percentage": 12.64, "elapsed_time": "4:16:54", "remaining_time": "1 day, 5:35:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1373, "total_steps": 10853, "loss": 0.1883, "learning_rate": 4.920469735447538e-06, "epoch": 0.12650297139171696, "percentage": 12.65, "elapsed_time": "4:17:04", "remaining_time": "1 day, 5:35:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1374, "total_steps": 10853, "loss": 0.1812, "learning_rate": 4.920279006486815e-06, "epoch": 0.12659510756898695, "percentage": 12.66, "elapsed_time": "4:17:16", "remaining_time": "1 day, 5:34:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1375, "total_steps": 10853, "loss": 0.1908, "learning_rate": 4.920088052802924e-06, "epoch": 0.12668724374625698, "percentage": 12.67, "elapsed_time": "4:17:27", "remaining_time": "1 day, 5:34:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1376, "total_steps": 10853, "loss": 0.1756, "learning_rate": 4.919896874413597e-06, "epoch": 0.12677937992352697, "percentage": 12.68, "elapsed_time": "4:17:36", "remaining_time": "1 day, 5:34:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1377, "total_steps": 10853, "loss": 0.1696, "learning_rate": 4.919705471336585e-06, "epoch": 0.12687151610079697, "percentage": 12.69, "elapsed_time": "4:17:46", "remaining_time": "1 day, 5:33:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1378, "total_steps": 10853, "loss": 0.1979, "learning_rate": 4.919513843589661e-06, "epoch": 0.126963652278067, "percentage": 12.7, "elapsed_time": "4:17:57", "remaining_time": "1 day, 5:33:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1379, "total_steps": 10853, "loss": 0.1803, "learning_rate": 4.919321991190614e-06, "epoch": 0.127055788455337, "percentage": 12.71, "elapsed_time": "4:18:08", "remaining_time": "1 day, 5:33:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1380, "total_steps": 10853, "loss": 0.1933, "learning_rate": 4.919129914157261e-06, "epoch": 0.127147924632607, "percentage": 12.72, "elapsed_time": "4:18:19", "remaining_time": "1 day, 5:33:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1381, "total_steps": 10853, "loss": 0.1769, "learning_rate": 4.918937612507435e-06, "epoch": 0.127240060809877, "percentage": 12.72, "elapsed_time": "4:18:30", "remaining_time": "1 day, 5:33:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1382, "total_steps": 10853, "loss": 0.1717, "learning_rate": 4.918745086258992e-06, "epoch": 0.127332196987147, "percentage": 12.73, "elapsed_time": "4:18:40", "remaining_time": "1 day, 5:32:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1383, "total_steps": 10853, "loss": 0.1644, "learning_rate": 4.918552335429806e-06, "epoch": 0.127424333164417, "percentage": 12.74, "elapsed_time": "4:18:51", "remaining_time": "1 day, 5:32:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1384, "total_steps": 10853, "loss": 0.1759, "learning_rate": 4.918359360037776e-06, "epoch": 0.127516469341687, "percentage": 12.75, "elapsed_time": "4:19:03", "remaining_time": "1 day, 5:32:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1385, "total_steps": 10853, "loss": 0.1868, "learning_rate": 4.918166160100819e-06, "epoch": 0.12760860551895703, "percentage": 12.76, "elapsed_time": "4:19:14", "remaining_time": "1 day, 5:32:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1386, "total_steps": 10853, "loss": 0.1792, "learning_rate": 4.917972735636875e-06, "epoch": 0.12770074169622703, "percentage": 12.77, "elapsed_time": "4:19:25", "remaining_time": "1 day, 5:31:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1387, "total_steps": 10853, "loss": 0.1576, "learning_rate": 4.9177790866639005e-06, "epoch": 0.12779287787349702, "percentage": 12.78, "elapsed_time": "4:19:36", "remaining_time": "1 day, 5:31:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1388, "total_steps": 10853, "loss": 0.1748, "learning_rate": 4.917585213199878e-06, "epoch": 0.12788501405076702, "percentage": 12.79, "elapsed_time": "4:19:46", "remaining_time": "1 day, 5:31:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1389, "total_steps": 10853, "loss": 0.202, "learning_rate": 4.9173911152628095e-06, "epoch": 0.12797715022803705, "percentage": 12.8, "elapsed_time": "4:19:56", "remaining_time": "1 day, 5:31:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1390, "total_steps": 10853, "loss": 0.1892, "learning_rate": 4.917196792870715e-06, "epoch": 0.12806928640530704, "percentage": 12.81, "elapsed_time": "4:20:07", "remaining_time": "1 day, 5:30:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1391, "total_steps": 10853, "loss": 0.2017, "learning_rate": 4.917002246041638e-06, "epoch": 0.12816142258257704, "percentage": 12.82, "elapsed_time": "4:20:18", "remaining_time": "1 day, 5:30:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1392, "total_steps": 10853, "loss": 0.2083, "learning_rate": 4.916807474793643e-06, "epoch": 0.12825355875984706, "percentage": 12.83, "elapsed_time": "4:20:30", "remaining_time": "1 day, 5:30:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1393, "total_steps": 10853, "loss": 0.1898, "learning_rate": 4.916612479144812e-06, "epoch": 0.12834569493711706, "percentage": 12.84, "elapsed_time": "4:20:41", "remaining_time": "1 day, 5:30:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1394, "total_steps": 10853, "loss": 0.186, "learning_rate": 4.916417259113254e-06, "epoch": 0.12843783111438706, "percentage": 12.84, "elapsed_time": "4:20:51", "remaining_time": "1 day, 5:30:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1395, "total_steps": 10853, "loss": 0.1941, "learning_rate": 4.916221814717092e-06, "epoch": 0.12852996729165708, "percentage": 12.85, "elapsed_time": "4:21:02", "remaining_time": "1 day, 5:29:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1396, "total_steps": 10853, "loss": 0.1863, "learning_rate": 4.916026145974476e-06, "epoch": 0.12862210346892708, "percentage": 12.86, "elapsed_time": "4:21:13", "remaining_time": "1 day, 5:29:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1397, "total_steps": 10853, "loss": 0.1809, "learning_rate": 4.915830252903572e-06, "epoch": 0.12871423964619708, "percentage": 12.87, "elapsed_time": "4:21:25", "remaining_time": "1 day, 5:29:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1398, "total_steps": 10853, "loss": 0.1737, "learning_rate": 4.915634135522569e-06, "epoch": 0.12880637582346707, "percentage": 12.88, "elapsed_time": "4:21:37", "remaining_time": "1 day, 5:29:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1399, "total_steps": 10853, "loss": 0.1936, "learning_rate": 4.915437793849676e-06, "epoch": 0.1288985120007371, "percentage": 12.89, "elapsed_time": "4:21:49", "remaining_time": "1 day, 5:29:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1400, "total_steps": 10853, "loss": 0.176, "learning_rate": 4.915241227903125e-06, "epoch": 0.1289906481780071, "percentage": 12.9, "elapsed_time": "4:22:00", "remaining_time": "1 day, 5:29:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1401, "total_steps": 10853, "loss": 0.193, "learning_rate": 4.915044437701165e-06, "epoch": 0.1290827843552771, "percentage": 12.91, "elapsed_time": "4:22:11", "remaining_time": "1 day, 5:28:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1402, "total_steps": 10853, "loss": 0.1772, "learning_rate": 4.914847423262069e-06, "epoch": 0.12917492053254712, "percentage": 12.92, "elapsed_time": "4:22:23", "remaining_time": "1 day, 5:28:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1403, "total_steps": 10853, "loss": 0.1813, "learning_rate": 4.9146501846041304e-06, "epoch": 0.1292670567098171, "percentage": 12.93, "elapsed_time": "4:22:32", "remaining_time": "1 day, 5:28:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1404, "total_steps": 10853, "loss": 0.1751, "learning_rate": 4.914452721745662e-06, "epoch": 0.1293591928870871, "percentage": 12.94, "elapsed_time": "4:22:42", "remaining_time": "1 day, 5:28:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1405, "total_steps": 10853, "loss": 0.2063, "learning_rate": 4.914255034704998e-06, "epoch": 0.1294513290643571, "percentage": 12.95, "elapsed_time": "4:22:53", "remaining_time": "1 day, 5:27:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1406, "total_steps": 10853, "loss": 0.1864, "learning_rate": 4.914057123500495e-06, "epoch": 0.12954346524162713, "percentage": 12.95, "elapsed_time": "4:23:04", "remaining_time": "1 day, 5:27:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1407, "total_steps": 10853, "loss": 0.1817, "learning_rate": 4.913858988150528e-06, "epoch": 0.12963560141889713, "percentage": 12.96, "elapsed_time": "4:23:15", "remaining_time": "1 day, 5:27:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1408, "total_steps": 10853, "loss": 0.1638, "learning_rate": 4.9136606286734945e-06, "epoch": 0.12972773759616713, "percentage": 12.97, "elapsed_time": "4:23:26", "remaining_time": "1 day, 5:27:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1409, "total_steps": 10853, "loss": 0.1735, "learning_rate": 4.913462045087811e-06, "epoch": 0.12981987377343715, "percentage": 12.98, "elapsed_time": "4:23:37", "remaining_time": "1 day, 5:26:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1410, "total_steps": 10853, "loss": 0.1859, "learning_rate": 4.9132632374119185e-06, "epoch": 0.12991200995070715, "percentage": 12.99, "elapsed_time": "4:23:47", "remaining_time": "1 day, 5:26:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1411, "total_steps": 10853, "loss": 0.18, "learning_rate": 4.913064205664273e-06, "epoch": 0.13000414612797714, "percentage": 13.0, "elapsed_time": "4:23:58", "remaining_time": "1 day, 5:26:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1412, "total_steps": 10853, "loss": 0.1701, "learning_rate": 4.912864949863358e-06, "epoch": 0.13009628230524717, "percentage": 13.01, "elapsed_time": "4:24:09", "remaining_time": "1 day, 5:26:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1413, "total_steps": 10853, "loss": 0.1975, "learning_rate": 4.912665470027671e-06, "epoch": 0.13018841848251717, "percentage": 13.02, "elapsed_time": "4:24:20", "remaining_time": "1 day, 5:26:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1414, "total_steps": 10853, "loss": 0.1686, "learning_rate": 4.912465766175736e-06, "epoch": 0.13028055465978716, "percentage": 13.03, "elapsed_time": "4:24:31", "remaining_time": "1 day, 5:25:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1415, "total_steps": 10853, "loss": 0.1649, "learning_rate": 4.912265838326095e-06, "epoch": 0.13037269083705716, "percentage": 13.04, "elapsed_time": "4:24:41", "remaining_time": "1 day, 5:25:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1416, "total_steps": 10853, "loss": 0.1792, "learning_rate": 4.912065686497312e-06, "epoch": 0.13046482701432718, "percentage": 13.05, "elapsed_time": "4:24:52", "remaining_time": "1 day, 5:25:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1417, "total_steps": 10853, "loss": 0.1733, "learning_rate": 4.91186531070797e-06, "epoch": 0.13055696319159718, "percentage": 13.06, "elapsed_time": "4:25:04", "remaining_time": "1 day, 5:25:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1418, "total_steps": 10853, "loss": 0.1911, "learning_rate": 4.911664710976674e-06, "epoch": 0.13064909936886718, "percentage": 13.07, "elapsed_time": "4:25:15", "remaining_time": "1 day, 5:24:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1419, "total_steps": 10853, "loss": 0.1959, "learning_rate": 4.91146388732205e-06, "epoch": 0.1307412355461372, "percentage": 13.07, "elapsed_time": "4:25:27", "remaining_time": "1 day, 5:24:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1420, "total_steps": 10853, "loss": 0.1844, "learning_rate": 4.911262839762745e-06, "epoch": 0.1308333717234072, "percentage": 13.08, "elapsed_time": "4:25:38", "remaining_time": "1 day, 5:24:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1421, "total_steps": 10853, "loss": 0.1839, "learning_rate": 4.911061568317425e-06, "epoch": 0.1309255079006772, "percentage": 13.09, "elapsed_time": "4:25:48", "remaining_time": "1 day, 5:24:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1422, "total_steps": 10853, "loss": 0.1893, "learning_rate": 4.910860073004779e-06, "epoch": 0.1310176440779472, "percentage": 13.1, "elapsed_time": "4:25:59", "remaining_time": "1 day, 5:24:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1423, "total_steps": 10853, "loss": 0.1757, "learning_rate": 4.910658353843517e-06, "epoch": 0.13110978025521722, "percentage": 13.11, "elapsed_time": "4:26:10", "remaining_time": "1 day, 5:23:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1424, "total_steps": 10853, "loss": 0.163, "learning_rate": 4.910456410852367e-06, "epoch": 0.13120191643248721, "percentage": 13.12, "elapsed_time": "4:26:20", "remaining_time": "1 day, 5:23:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1425, "total_steps": 10853, "loss": 0.1723, "learning_rate": 4.91025424405008e-06, "epoch": 0.1312940526097572, "percentage": 13.13, "elapsed_time": "4:26:31", "remaining_time": "1 day, 5:23:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1426, "total_steps": 10853, "loss": 0.1911, "learning_rate": 4.910051853455426e-06, "epoch": 0.13138618878702724, "percentage": 13.14, "elapsed_time": "4:26:42", "remaining_time": "1 day, 5:23:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1427, "total_steps": 10853, "loss": 0.1988, "learning_rate": 4.909849239087199e-06, "epoch": 0.13147832496429723, "percentage": 13.15, "elapsed_time": "4:26:54", "remaining_time": "1 day, 5:23:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1428, "total_steps": 10853, "loss": 0.1951, "learning_rate": 4.90964640096421e-06, "epoch": 0.13157046114156723, "percentage": 13.16, "elapsed_time": "4:27:04", "remaining_time": "1 day, 5:22:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1429, "total_steps": 10853, "loss": 0.1812, "learning_rate": 4.9094433391052935e-06, "epoch": 0.13166259731883725, "percentage": 13.17, "elapsed_time": "4:27:16", "remaining_time": "1 day, 5:22:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1430, "total_steps": 10853, "loss": 0.1985, "learning_rate": 4.909240053529304e-06, "epoch": 0.13175473349610725, "percentage": 13.18, "elapsed_time": "4:27:27", "remaining_time": "1 day, 5:22:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1431, "total_steps": 10853, "loss": 0.1702, "learning_rate": 4.909036544255116e-06, "epoch": 0.13184686967337725, "percentage": 13.19, "elapsed_time": "4:27:38", "remaining_time": "1 day, 5:22:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1432, "total_steps": 10853, "loss": 0.1781, "learning_rate": 4.908832811301626e-06, "epoch": 0.13193900585064725, "percentage": 13.19, "elapsed_time": "4:27:49", "remaining_time": "1 day, 5:21:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1433, "total_steps": 10853, "loss": 0.1743, "learning_rate": 4.90862885468775e-06, "epoch": 0.13203114202791727, "percentage": 13.2, "elapsed_time": "4:27:59", "remaining_time": "1 day, 5:21:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1434, "total_steps": 10853, "loss": 0.1895, "learning_rate": 4.908424674432425e-06, "epoch": 0.13212327820518727, "percentage": 13.21, "elapsed_time": "4:28:11", "remaining_time": "1 day, 5:21:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1435, "total_steps": 10853, "loss": 0.1809, "learning_rate": 4.908220270554611e-06, "epoch": 0.13221541438245726, "percentage": 13.22, "elapsed_time": "4:28:22", "remaining_time": "1 day, 5:21:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1436, "total_steps": 10853, "loss": 0.1833, "learning_rate": 4.908015643073285e-06, "epoch": 0.1323075505597273, "percentage": 13.23, "elapsed_time": "4:28:31", "remaining_time": "1 day, 5:20:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1437, "total_steps": 10853, "loss": 0.1984, "learning_rate": 4.907810792007447e-06, "epoch": 0.13239968673699729, "percentage": 13.24, "elapsed_time": "4:28:42", "remaining_time": "1 day, 5:20:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1438, "total_steps": 10853, "loss": 0.1864, "learning_rate": 4.907605717376118e-06, "epoch": 0.13249182291426728, "percentage": 13.25, "elapsed_time": "4:28:52", "remaining_time": "1 day, 5:20:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1439, "total_steps": 10853, "loss": 0.1758, "learning_rate": 4.90740041919834e-06, "epoch": 0.13258395909153728, "percentage": 13.26, "elapsed_time": "4:29:04", "remaining_time": "1 day, 5:20:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1440, "total_steps": 10853, "loss": 0.1771, "learning_rate": 4.907194897493173e-06, "epoch": 0.1326760952688073, "percentage": 13.27, "elapsed_time": "4:29:15", "remaining_time": "1 day, 5:20:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1441, "total_steps": 10853, "loss": 0.1905, "learning_rate": 4.906989152279701e-06, "epoch": 0.1327682314460773, "percentage": 13.28, "elapsed_time": "4:29:26", "remaining_time": "1 day, 5:19:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1442, "total_steps": 10853, "loss": 0.1738, "learning_rate": 4.9067831835770275e-06, "epoch": 0.1328603676233473, "percentage": 13.29, "elapsed_time": "4:29:37", "remaining_time": "1 day, 5:19:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1443, "total_steps": 10853, "loss": 0.1854, "learning_rate": 4.906576991404276e-06, "epoch": 0.13295250380061732, "percentage": 13.3, "elapsed_time": "4:29:48", "remaining_time": "1 day, 5:19:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1444, "total_steps": 10853, "loss": 0.1985, "learning_rate": 4.9063705757805915e-06, "epoch": 0.13304463997788732, "percentage": 13.31, "elapsed_time": "4:29:59", "remaining_time": "1 day, 5:19:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1445, "total_steps": 10853, "loss": 0.1595, "learning_rate": 4.906163936725141e-06, "epoch": 0.13313677615515732, "percentage": 13.31, "elapsed_time": "4:30:10", "remaining_time": "1 day, 5:19:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1446, "total_steps": 10853, "loss": 0.1716, "learning_rate": 4.905957074257109e-06, "epoch": 0.13322891233242734, "percentage": 13.32, "elapsed_time": "4:30:21", "remaining_time": "1 day, 5:18:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1447, "total_steps": 10853, "loss": 0.1686, "learning_rate": 4.905749988395704e-06, "epoch": 0.13332104850969734, "percentage": 13.33, "elapsed_time": "4:30:33", "remaining_time": "1 day, 5:18:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1448, "total_steps": 10853, "loss": 0.1682, "learning_rate": 4.905542679160155e-06, "epoch": 0.13341318468696733, "percentage": 13.34, "elapsed_time": "4:30:43", "remaining_time": "1 day, 5:18:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1449, "total_steps": 10853, "loss": 0.1972, "learning_rate": 4.905335146569707e-06, "epoch": 0.13350532086423733, "percentage": 13.35, "elapsed_time": "4:30:53", "remaining_time": "1 day, 5:18:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1450, "total_steps": 10853, "loss": 0.1786, "learning_rate": 4.9051273906436335e-06, "epoch": 0.13359745704150736, "percentage": 13.36, "elapsed_time": "4:31:04", "remaining_time": "1 day, 5:17:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1451, "total_steps": 10853, "loss": 0.1753, "learning_rate": 4.904919411401222e-06, "epoch": 0.13368959321877735, "percentage": 13.37, "elapsed_time": "4:31:13", "remaining_time": "1 day, 5:17:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1452, "total_steps": 10853, "loss": 0.1685, "learning_rate": 4.9047112088617855e-06, "epoch": 0.13378172939604735, "percentage": 13.38, "elapsed_time": "4:31:23", "remaining_time": "1 day, 5:17:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1453, "total_steps": 10853, "loss": 0.183, "learning_rate": 4.904502783044654e-06, "epoch": 0.13387386557331737, "percentage": 13.39, "elapsed_time": "4:31:34", "remaining_time": "1 day, 5:16:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1454, "total_steps": 10853, "loss": 0.1997, "learning_rate": 4.90429413396918e-06, "epoch": 0.13396600175058737, "percentage": 13.4, "elapsed_time": "4:31:45", "remaining_time": "1 day, 5:16:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1455, "total_steps": 10853, "loss": 0.1874, "learning_rate": 4.904085261654736e-06, "epoch": 0.13405813792785737, "percentage": 13.41, "elapsed_time": "4:31:56", "remaining_time": "1 day, 5:16:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1456, "total_steps": 10853, "loss": 0.186, "learning_rate": 4.903876166120718e-06, "epoch": 0.13415027410512737, "percentage": 13.42, "elapsed_time": "4:32:07", "remaining_time": "1 day, 5:16:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1457, "total_steps": 10853, "loss": 0.1926, "learning_rate": 4.903666847386539e-06, "epoch": 0.1342424102823974, "percentage": 13.42, "elapsed_time": "4:32:18", "remaining_time": "1 day, 5:16:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1458, "total_steps": 10853, "loss": 0.1888, "learning_rate": 4.903457305471635e-06, "epoch": 0.1343345464596674, "percentage": 13.43, "elapsed_time": "4:32:31", "remaining_time": "1 day, 5:16:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1459, "total_steps": 10853, "loss": 0.1899, "learning_rate": 4.90324754039546e-06, "epoch": 0.13442668263693738, "percentage": 13.44, "elapsed_time": "4:32:40", "remaining_time": "1 day, 5:15:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1460, "total_steps": 10853, "loss": 0.1743, "learning_rate": 4.903037552177494e-06, "epoch": 0.1345188188142074, "percentage": 13.45, "elapsed_time": "4:32:49", "remaining_time": "1 day, 5:15:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1461, "total_steps": 10853, "loss": 0.1809, "learning_rate": 4.9028273408372315e-06, "epoch": 0.1346109549914774, "percentage": 13.46, "elapsed_time": "4:33:00", "remaining_time": "1 day, 5:15:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1462, "total_steps": 10853, "loss": 0.1636, "learning_rate": 4.902616906394193e-06, "epoch": 0.1347030911687474, "percentage": 13.47, "elapsed_time": "4:33:12", "remaining_time": "1 day, 5:14:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1463, "total_steps": 10853, "loss": 0.1743, "learning_rate": 4.9024062488679145e-06, "epoch": 0.13479522734601743, "percentage": 13.48, "elapsed_time": "4:33:24", "remaining_time": "1 day, 5:14:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1464, "total_steps": 10853, "loss": 0.1561, "learning_rate": 4.9021953682779585e-06, "epoch": 0.13488736352328742, "percentage": 13.49, "elapsed_time": "4:33:35", "remaining_time": "1 day, 5:14:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1465, "total_steps": 10853, "loss": 0.1925, "learning_rate": 4.901984264643904e-06, "epoch": 0.13497949970055742, "percentage": 13.5, "elapsed_time": "4:33:47", "remaining_time": "1 day, 5:14:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1466, "total_steps": 10853, "loss": 0.1992, "learning_rate": 4.9017729379853515e-06, "epoch": 0.13507163587782742, "percentage": 13.51, "elapsed_time": "4:33:59", "remaining_time": "1 day, 5:14:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1467, "total_steps": 10853, "loss": 0.2045, "learning_rate": 4.901561388321923e-06, "epoch": 0.13516377205509744, "percentage": 13.52, "elapsed_time": "4:34:11", "remaining_time": "1 day, 5:14:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1468, "total_steps": 10853, "loss": 0.1572, "learning_rate": 4.901349615673262e-06, "epoch": 0.13525590823236744, "percentage": 13.53, "elapsed_time": "4:34:22", "remaining_time": "1 day, 5:14:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1469, "total_steps": 10853, "loss": 0.1802, "learning_rate": 4.90113762005903e-06, "epoch": 0.13534804440963744, "percentage": 13.54, "elapsed_time": "4:34:32", "remaining_time": "1 day, 5:13:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1470, "total_steps": 10853, "loss": 0.1858, "learning_rate": 4.900925401498912e-06, "epoch": 0.13544018058690746, "percentage": 13.54, "elapsed_time": "4:34:43", "remaining_time": "1 day, 5:13:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1471, "total_steps": 10853, "loss": 0.1801, "learning_rate": 4.900712960012612e-06, "epoch": 0.13553231676417746, "percentage": 13.55, "elapsed_time": "4:34:56", "remaining_time": "1 day, 5:13:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1472, "total_steps": 10853, "loss": 0.1808, "learning_rate": 4.900500295619855e-06, "epoch": 0.13562445294144745, "percentage": 13.56, "elapsed_time": "4:35:07", "remaining_time": "1 day, 5:13:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1473, "total_steps": 10853, "loss": 0.1707, "learning_rate": 4.900287408340387e-06, "epoch": 0.13571658911871745, "percentage": 13.57, "elapsed_time": "4:35:16", "remaining_time": "1 day, 5:12:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1474, "total_steps": 10853, "loss": 0.1826, "learning_rate": 4.900074298193976e-06, "epoch": 0.13580872529598748, "percentage": 13.58, "elapsed_time": "4:35:28", "remaining_time": "1 day, 5:12:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1475, "total_steps": 10853, "loss": 0.1936, "learning_rate": 4.899860965200407e-06, "epoch": 0.13590086147325747, "percentage": 13.59, "elapsed_time": "4:35:40", "remaining_time": "1 day, 5:12:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1476, "total_steps": 10853, "loss": 0.1949, "learning_rate": 4.89964740937949e-06, "epoch": 0.13599299765052747, "percentage": 13.6, "elapsed_time": "4:35:51", "remaining_time": "1 day, 5:12:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1477, "total_steps": 10853, "loss": 0.1812, "learning_rate": 4.899433630751052e-06, "epoch": 0.1360851338277975, "percentage": 13.61, "elapsed_time": "4:36:02", "remaining_time": "1 day, 5:12:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1478, "total_steps": 10853, "loss": 0.1692, "learning_rate": 4.8992196293349435e-06, "epoch": 0.1361772700050675, "percentage": 13.62, "elapsed_time": "4:36:12", "remaining_time": "1 day, 5:12:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1479, "total_steps": 10853, "loss": 0.173, "learning_rate": 4.899005405151034e-06, "epoch": 0.1362694061823375, "percentage": 13.63, "elapsed_time": "4:36:23", "remaining_time": "1 day, 5:11:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1480, "total_steps": 10853, "loss": 0.1917, "learning_rate": 4.898790958219215e-06, "epoch": 0.1363615423596075, "percentage": 13.64, "elapsed_time": "4:36:35", "remaining_time": "1 day, 5:11:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1481, "total_steps": 10853, "loss": 0.194, "learning_rate": 4.898576288559396e-06, "epoch": 0.1364536785368775, "percentage": 13.65, "elapsed_time": "4:36:47", "remaining_time": "1 day, 5:11:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1482, "total_steps": 10853, "loss": 0.1869, "learning_rate": 4.898361396191512e-06, "epoch": 0.1365458147141475, "percentage": 13.66, "elapsed_time": "4:36:57", "remaining_time": "1 day, 5:11:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1483, "total_steps": 10853, "loss": 0.1878, "learning_rate": 4.898146281135514e-06, "epoch": 0.1366379508914175, "percentage": 13.66, "elapsed_time": "4:37:08", "remaining_time": "1 day, 5:11:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1484, "total_steps": 10853, "loss": 0.171, "learning_rate": 4.8979309434113745e-06, "epoch": 0.13673008706868753, "percentage": 13.67, "elapsed_time": "4:37:18", "remaining_time": "1 day, 5:10:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1485, "total_steps": 10853, "loss": 0.176, "learning_rate": 4.89771538303909e-06, "epoch": 0.13682222324595752, "percentage": 13.68, "elapsed_time": "4:37:29", "remaining_time": "1 day, 5:10:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1486, "total_steps": 10853, "loss": 0.1763, "learning_rate": 4.897499600038673e-06, "epoch": 0.13691435942322752, "percentage": 13.69, "elapsed_time": "4:37:39", "remaining_time": "1 day, 5:10:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1487, "total_steps": 10853, "loss": 0.181, "learning_rate": 4.8972835944301615e-06, "epoch": 0.13700649560049755, "percentage": 13.7, "elapsed_time": "4:37:50", "remaining_time": "1 day, 5:09:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1488, "total_steps": 10853, "loss": 0.1687, "learning_rate": 4.89706736623361e-06, "epoch": 0.13709863177776754, "percentage": 13.71, "elapsed_time": "4:38:01", "remaining_time": "1 day, 5:09:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1489, "total_steps": 10853, "loss": 0.1708, "learning_rate": 4.896850915469095e-06, "epoch": 0.13719076795503754, "percentage": 13.72, "elapsed_time": "4:38:11", "remaining_time": "1 day, 5:09:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1490, "total_steps": 10853, "loss": 0.1981, "learning_rate": 4.896634242156715e-06, "epoch": 0.13728290413230754, "percentage": 13.73, "elapsed_time": "4:38:22", "remaining_time": "1 day, 5:09:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1491, "total_steps": 10853, "loss": 0.2006, "learning_rate": 4.896417346316587e-06, "epoch": 0.13737504030957756, "percentage": 13.74, "elapsed_time": "4:38:33", "remaining_time": "1 day, 5:09:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1492, "total_steps": 10853, "loss": 0.176, "learning_rate": 4.8962002279688514e-06, "epoch": 0.13746717648684756, "percentage": 13.75, "elapsed_time": "4:38:42", "remaining_time": "1 day, 5:08:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1493, "total_steps": 10853, "loss": 0.1824, "learning_rate": 4.8959828871336665e-06, "epoch": 0.13755931266411756, "percentage": 13.76, "elapsed_time": "4:38:53", "remaining_time": "1 day, 5:08:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1494, "total_steps": 10853, "loss": 0.1798, "learning_rate": 4.895765323831212e-06, "epoch": 0.13765144884138758, "percentage": 13.77, "elapsed_time": "4:39:05", "remaining_time": "1 day, 5:08:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1495, "total_steps": 10853, "loss": 0.1865, "learning_rate": 4.895547538081691e-06, "epoch": 0.13774358501865758, "percentage": 13.77, "elapsed_time": "4:39:16", "remaining_time": "1 day, 5:08:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1496, "total_steps": 10853, "loss": 0.1798, "learning_rate": 4.895329529905322e-06, "epoch": 0.13783572119592757, "percentage": 13.78, "elapsed_time": "4:39:27", "remaining_time": "1 day, 5:07:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1497, "total_steps": 10853, "loss": 0.1779, "learning_rate": 4.895111299322348e-06, "epoch": 0.1379278573731976, "percentage": 13.79, "elapsed_time": "4:39:40", "remaining_time": "1 day, 5:07:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1498, "total_steps": 10853, "loss": 0.1718, "learning_rate": 4.894892846353032e-06, "epoch": 0.1380199935504676, "percentage": 13.8, "elapsed_time": "4:39:51", "remaining_time": "1 day, 5:07:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1499, "total_steps": 10853, "loss": 0.1769, "learning_rate": 4.8946741710176584e-06, "epoch": 0.1381121297277376, "percentage": 13.81, "elapsed_time": "4:40:01", "remaining_time": "1 day, 5:07:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1500, "total_steps": 10853, "loss": 0.1963, "learning_rate": 4.894455273336531e-06, "epoch": 0.1382042659050076, "percentage": 13.82, "elapsed_time": "4:40:12", "remaining_time": "1 day, 5:07:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1500, "total_steps": 10853, "eval_loss": 0.1832522302865982, "epoch": 0.1382042659050076, "percentage": 13.82, "elapsed_time": "4:45:13", "remaining_time": "1 day, 5:38:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1501, "total_steps": 10853, "loss": 0.1821, "learning_rate": 4.894236153329972e-06, "epoch": 0.13829640208227761, "percentage": 13.83, "elapsed_time": "4:45:25", "remaining_time": "1 day, 5:38:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1502, "total_steps": 10853, "loss": 0.164, "learning_rate": 4.894016811018329e-06, "epoch": 0.1383885382595476, "percentage": 13.84, "elapsed_time": "4:45:35", "remaining_time": "1 day, 5:38:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1503, "total_steps": 10853, "loss": 0.1967, "learning_rate": 4.893797246421968e-06, "epoch": 0.1384806744368176, "percentage": 13.85, "elapsed_time": "4:45:47", "remaining_time": "1 day, 5:37:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1504, "total_steps": 10853, "loss": 0.1844, "learning_rate": 4.893577459561274e-06, "epoch": 0.13857281061408763, "percentage": 13.86, "elapsed_time": "4:45:58", "remaining_time": "1 day, 5:37:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1505, "total_steps": 10853, "loss": 0.1896, "learning_rate": 4.893357450456657e-06, "epoch": 0.13866494679135763, "percentage": 13.87, "elapsed_time": "4:46:10", "remaining_time": "1 day, 5:37:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1506, "total_steps": 10853, "loss": 0.1719, "learning_rate": 4.893137219128542e-06, "epoch": 0.13875708296862763, "percentage": 13.88, "elapsed_time": "4:46:20", "remaining_time": "1 day, 5:37:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1507, "total_steps": 10853, "loss": 0.1735, "learning_rate": 4.892916765597378e-06, "epoch": 0.13884921914589762, "percentage": 13.89, "elapsed_time": "4:46:30", "remaining_time": "1 day, 5:36:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1508, "total_steps": 10853, "loss": 0.2017, "learning_rate": 4.892696089883636e-06, "epoch": 0.13894135532316765, "percentage": 13.89, "elapsed_time": "4:46:42", "remaining_time": "1 day, 5:36:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1509, "total_steps": 10853, "loss": 0.1845, "learning_rate": 4.8924751920078045e-06, "epoch": 0.13903349150043764, "percentage": 13.9, "elapsed_time": "4:46:52", "remaining_time": "1 day, 5:36:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1510, "total_steps": 10853, "loss": 0.1673, "learning_rate": 4.892254071990393e-06, "epoch": 0.13912562767770764, "percentage": 13.91, "elapsed_time": "4:47:04", "remaining_time": "1 day, 5:36:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1511, "total_steps": 10853, "loss": 0.1638, "learning_rate": 4.892032729851934e-06, "epoch": 0.13921776385497767, "percentage": 13.92, "elapsed_time": "4:47:15", "remaining_time": "1 day, 5:35:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1512, "total_steps": 10853, "loss": 0.2006, "learning_rate": 4.891811165612979e-06, "epoch": 0.13930990003224766, "percentage": 13.93, "elapsed_time": "4:47:26", "remaining_time": "1 day, 5:35:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1513, "total_steps": 10853, "loss": 0.1741, "learning_rate": 4.8915893792941e-06, "epoch": 0.13940203620951766, "percentage": 13.94, "elapsed_time": "4:47:35", "remaining_time": "1 day, 5:35:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1514, "total_steps": 10853, "loss": 0.1853, "learning_rate": 4.891367370915889e-06, "epoch": 0.13949417238678768, "percentage": 13.95, "elapsed_time": "4:47:47", "remaining_time": "1 day, 5:35:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1515, "total_steps": 10853, "loss": 0.1853, "learning_rate": 4.89114514049896e-06, "epoch": 0.13958630856405768, "percentage": 13.96, "elapsed_time": "4:47:59", "remaining_time": "1 day, 5:35:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1516, "total_steps": 10853, "loss": 0.1713, "learning_rate": 4.890922688063949e-06, "epoch": 0.13967844474132768, "percentage": 13.97, "elapsed_time": "4:48:10", "remaining_time": "1 day, 5:34:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1517, "total_steps": 10853, "loss": 0.159, "learning_rate": 4.8907000136315075e-06, "epoch": 0.13977058091859768, "percentage": 13.98, "elapsed_time": "4:48:20", "remaining_time": "1 day, 5:34:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1518, "total_steps": 10853, "loss": 0.1646, "learning_rate": 4.890477117222313e-06, "epoch": 0.1398627170958677, "percentage": 13.99, "elapsed_time": "4:48:31", "remaining_time": "1 day, 5:34:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1519, "total_steps": 10853, "loss": 0.1712, "learning_rate": 4.890253998857061e-06, "epoch": 0.1399548532731377, "percentage": 14.0, "elapsed_time": "4:48:41", "remaining_time": "1 day, 5:33:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1520, "total_steps": 10853, "loss": 0.1763, "learning_rate": 4.890030658556467e-06, "epoch": 0.1400469894504077, "percentage": 14.01, "elapsed_time": "4:48:52", "remaining_time": "1 day, 5:33:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1521, "total_steps": 10853, "loss": 0.1778, "learning_rate": 4.88980709634127e-06, "epoch": 0.14013912562767772, "percentage": 14.01, "elapsed_time": "4:49:04", "remaining_time": "1 day, 5:33:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1522, "total_steps": 10853, "loss": 0.2014, "learning_rate": 4.889583312232227e-06, "epoch": 0.14023126180494772, "percentage": 14.02, "elapsed_time": "4:49:15", "remaining_time": "1 day, 5:33:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1523, "total_steps": 10853, "loss": 0.173, "learning_rate": 4.889359306250117e-06, "epoch": 0.1403233979822177, "percentage": 14.03, "elapsed_time": "4:49:27", "remaining_time": "1 day, 5:33:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1524, "total_steps": 10853, "loss": 0.1703, "learning_rate": 4.889135078415736e-06, "epoch": 0.1404155341594877, "percentage": 14.04, "elapsed_time": "4:49:37", "remaining_time": "1 day, 5:32:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1525, "total_steps": 10853, "loss": 0.2035, "learning_rate": 4.888910628749908e-06, "epoch": 0.14050767033675773, "percentage": 14.05, "elapsed_time": "4:49:49", "remaining_time": "1 day, 5:32:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1526, "total_steps": 10853, "loss": 0.1804, "learning_rate": 4.88868595727347e-06, "epoch": 0.14059980651402773, "percentage": 14.06, "elapsed_time": "4:49:59", "remaining_time": "1 day, 5:32:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1527, "total_steps": 10853, "loss": 0.1767, "learning_rate": 4.888461064007284e-06, "epoch": 0.14069194269129773, "percentage": 14.07, "elapsed_time": "4:50:08", "remaining_time": "1 day, 5:32:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1528, "total_steps": 10853, "loss": 0.1853, "learning_rate": 4.888235948972232e-06, "epoch": 0.14078407886856775, "percentage": 14.08, "elapsed_time": "4:50:20", "remaining_time": "1 day, 5:31:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1529, "total_steps": 10853, "loss": 0.1643, "learning_rate": 4.888010612189213e-06, "epoch": 0.14087621504583775, "percentage": 14.09, "elapsed_time": "4:50:30", "remaining_time": "1 day, 5:31:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1530, "total_steps": 10853, "loss": 0.191, "learning_rate": 4.8877850536791535e-06, "epoch": 0.14096835122310775, "percentage": 14.1, "elapsed_time": "4:50:40", "remaining_time": "1 day, 5:31:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1531, "total_steps": 10853, "loss": 0.1941, "learning_rate": 4.887559273462994e-06, "epoch": 0.14106048740037777, "percentage": 14.11, "elapsed_time": "4:50:52", "remaining_time": "1 day, 5:31:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1532, "total_steps": 10853, "loss": 0.1845, "learning_rate": 4.8873332715617e-06, "epoch": 0.14115262357764777, "percentage": 14.12, "elapsed_time": "4:51:03", "remaining_time": "1 day, 5:30:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1533, "total_steps": 10853, "loss": 0.1911, "learning_rate": 4.887107047996253e-06, "epoch": 0.14124475975491776, "percentage": 14.13, "elapsed_time": "4:51:14", "remaining_time": "1 day, 5:30:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1534, "total_steps": 10853, "loss": 0.1763, "learning_rate": 4.886880602787661e-06, "epoch": 0.14133689593218776, "percentage": 14.13, "elapsed_time": "4:51:24", "remaining_time": "1 day, 5:30:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1535, "total_steps": 10853, "loss": 0.172, "learning_rate": 4.886653935956949e-06, "epoch": 0.1414290321094578, "percentage": 14.14, "elapsed_time": "4:51:35", "remaining_time": "1 day, 5:30:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1536, "total_steps": 10853, "loss": 0.1664, "learning_rate": 4.88642704752516e-06, "epoch": 0.14152116828672778, "percentage": 14.15, "elapsed_time": "4:51:45", "remaining_time": "1 day, 5:29:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1537, "total_steps": 10853, "loss": 0.1725, "learning_rate": 4.886199937513365e-06, "epoch": 0.14161330446399778, "percentage": 14.16, "elapsed_time": "4:51:57", "remaining_time": "1 day, 5:29:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1538, "total_steps": 10853, "loss": 0.1811, "learning_rate": 4.885972605942647e-06, "epoch": 0.1417054406412678, "percentage": 14.17, "elapsed_time": "4:52:08", "remaining_time": "1 day, 5:29:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1539, "total_steps": 10853, "loss": 0.1725, "learning_rate": 4.8857450528341166e-06, "epoch": 0.1417975768185378, "percentage": 14.18, "elapsed_time": "4:52:17", "remaining_time": "1 day, 5:28:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1540, "total_steps": 10853, "loss": 0.1632, "learning_rate": 4.8855172782089015e-06, "epoch": 0.1418897129958078, "percentage": 14.19, "elapsed_time": "4:52:28", "remaining_time": "1 day, 5:28:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1541, "total_steps": 10853, "loss": 0.1759, "learning_rate": 4.88528928208815e-06, "epoch": 0.1419818491730778, "percentage": 14.2, "elapsed_time": "4:52:39", "remaining_time": "1 day, 5:28:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1542, "total_steps": 10853, "loss": 0.1786, "learning_rate": 4.885061064493033e-06, "epoch": 0.14207398535034782, "percentage": 14.21, "elapsed_time": "4:52:51", "remaining_time": "1 day, 5:28:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1543, "total_steps": 10853, "loss": 0.1732, "learning_rate": 4.884832625444738e-06, "epoch": 0.14216612152761782, "percentage": 14.22, "elapsed_time": "4:53:01", "remaining_time": "1 day, 5:28:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1544, "total_steps": 10853, "loss": 0.1662, "learning_rate": 4.8846039649644785e-06, "epoch": 0.1422582577048878, "percentage": 14.23, "elapsed_time": "4:53:13", "remaining_time": "1 day, 5:27:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1545, "total_steps": 10853, "loss": 0.1715, "learning_rate": 4.884375083073483e-06, "epoch": 0.14235039388215784, "percentage": 14.24, "elapsed_time": "4:53:23", "remaining_time": "1 day, 5:27:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1546, "total_steps": 10853, "loss": 0.1841, "learning_rate": 4.8841459797930045e-06, "epoch": 0.14244253005942784, "percentage": 14.24, "elapsed_time": "4:53:34", "remaining_time": "1 day, 5:27:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1547, "total_steps": 10853, "loss": 0.1917, "learning_rate": 4.8839166551443165e-06, "epoch": 0.14253466623669783, "percentage": 14.25, "elapsed_time": "4:53:45", "remaining_time": "1 day, 5:27:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1548, "total_steps": 10853, "loss": 0.1909, "learning_rate": 4.883687109148709e-06, "epoch": 0.14262680241396786, "percentage": 14.26, "elapsed_time": "4:53:56", "remaining_time": "1 day, 5:26:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1549, "total_steps": 10853, "loss": 0.1634, "learning_rate": 4.883457341827498e-06, "epoch": 0.14271893859123785, "percentage": 14.27, "elapsed_time": "4:54:07", "remaining_time": "1 day, 5:26:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1550, "total_steps": 10853, "loss": 0.1905, "learning_rate": 4.883227353202016e-06, "epoch": 0.14281107476850785, "percentage": 14.28, "elapsed_time": "4:54:17", "remaining_time": "1 day, 5:26:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1551, "total_steps": 10853, "loss": 0.1766, "learning_rate": 4.882997143293617e-06, "epoch": 0.14290321094577785, "percentage": 14.29, "elapsed_time": "4:54:26", "remaining_time": "1 day, 5:25:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1552, "total_steps": 10853, "loss": 0.177, "learning_rate": 4.882766712123677e-06, "epoch": 0.14299534712304787, "percentage": 14.3, "elapsed_time": "4:54:38", "remaining_time": "1 day, 5:25:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1553, "total_steps": 10853, "loss": 0.1902, "learning_rate": 4.882536059713592e-06, "epoch": 0.14308748330031787, "percentage": 14.31, "elapsed_time": "4:54:48", "remaining_time": "1 day, 5:25:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1554, "total_steps": 10853, "loss": 0.1828, "learning_rate": 4.882305186084777e-06, "epoch": 0.14317961947758787, "percentage": 14.32, "elapsed_time": "4:54:59", "remaining_time": "1 day, 5:25:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1555, "total_steps": 10853, "loss": 0.1784, "learning_rate": 4.88207409125867e-06, "epoch": 0.1432717556548579, "percentage": 14.33, "elapsed_time": "4:55:09", "remaining_time": "1 day, 5:24:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1556, "total_steps": 10853, "loss": 0.1802, "learning_rate": 4.881842775256726e-06, "epoch": 0.1433638918321279, "percentage": 14.34, "elapsed_time": "4:55:19", "remaining_time": "1 day, 5:24:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1557, "total_steps": 10853, "loss": 0.1722, "learning_rate": 4.8816112381004245e-06, "epoch": 0.14345602800939788, "percentage": 14.35, "elapsed_time": "4:55:28", "remaining_time": "1 day, 5:24:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1558, "total_steps": 10853, "loss": 0.183, "learning_rate": 4.881379479811263e-06, "epoch": 0.14354816418666788, "percentage": 14.36, "elapsed_time": "4:55:39", "remaining_time": "1 day, 5:23:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1559, "total_steps": 10853, "loss": 0.1727, "learning_rate": 4.881147500410761e-06, "epoch": 0.1436403003639379, "percentage": 14.36, "elapsed_time": "4:55:48", "remaining_time": "1 day, 5:23:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1560, "total_steps": 10853, "loss": 0.183, "learning_rate": 4.880915299920457e-06, "epoch": 0.1437324365412079, "percentage": 14.37, "elapsed_time": "4:55:57", "remaining_time": "1 day, 5:23:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1561, "total_steps": 10853, "loss": 0.1648, "learning_rate": 4.8806828783619106e-06, "epoch": 0.1438245727184779, "percentage": 14.38, "elapsed_time": "4:56:07", "remaining_time": "1 day, 5:22:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1562, "total_steps": 10853, "loss": 0.1858, "learning_rate": 4.880450235756704e-06, "epoch": 0.14391670889574792, "percentage": 14.39, "elapsed_time": "4:56:17", "remaining_time": "1 day, 5:22:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1563, "total_steps": 10853, "loss": 0.1709, "learning_rate": 4.880217372126436e-06, "epoch": 0.14400884507301792, "percentage": 14.4, "elapsed_time": "4:56:28", "remaining_time": "1 day, 5:22:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1564, "total_steps": 10853, "loss": 0.1833, "learning_rate": 4.8799842874927285e-06, "epoch": 0.14410098125028792, "percentage": 14.41, "elapsed_time": "4:56:38", "remaining_time": "1 day, 5:21:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1565, "total_steps": 10853, "loss": 0.1751, "learning_rate": 4.879750981877224e-06, "epoch": 0.14419311742755794, "percentage": 14.42, "elapsed_time": "4:56:50", "remaining_time": "1 day, 5:21:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1566, "total_steps": 10853, "loss": 0.1696, "learning_rate": 4.879517455301585e-06, "epoch": 0.14428525360482794, "percentage": 14.43, "elapsed_time": "4:57:00", "remaining_time": "1 day, 5:21:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1567, "total_steps": 10853, "loss": 0.1897, "learning_rate": 4.8792837077874945e-06, "epoch": 0.14437738978209794, "percentage": 14.44, "elapsed_time": "4:57:10", "remaining_time": "1 day, 5:21:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1568, "total_steps": 10853, "loss": 0.1905, "learning_rate": 4.8790497393566546e-06, "epoch": 0.14446952595936793, "percentage": 14.45, "elapsed_time": "4:57:22", "remaining_time": "1 day, 5:20:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1569, "total_steps": 10853, "loss": 0.1772, "learning_rate": 4.878815550030792e-06, "epoch": 0.14456166213663796, "percentage": 14.46, "elapsed_time": "4:57:31", "remaining_time": "1 day, 5:20:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1570, "total_steps": 10853, "loss": 0.174, "learning_rate": 4.878581139831649e-06, "epoch": 0.14465379831390796, "percentage": 14.47, "elapsed_time": "4:57:42", "remaining_time": "1 day, 5:20:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1571, "total_steps": 10853, "loss": 0.1878, "learning_rate": 4.87834650878099e-06, "epoch": 0.14474593449117795, "percentage": 14.48, "elapsed_time": "4:57:53", "remaining_time": "1 day, 5:20:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1572, "total_steps": 10853, "loss": 0.1783, "learning_rate": 4.8781116569006026e-06, "epoch": 0.14483807066844798, "percentage": 14.48, "elapsed_time": "4:58:04", "remaining_time": "1 day, 5:19:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1573, "total_steps": 10853, "loss": 0.1789, "learning_rate": 4.877876584212292e-06, "epoch": 0.14493020684571797, "percentage": 14.49, "elapsed_time": "4:58:17", "remaining_time": "1 day, 5:19:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1574, "total_steps": 10853, "loss": 0.1659, "learning_rate": 4.8776412907378845e-06, "epoch": 0.14502234302298797, "percentage": 14.5, "elapsed_time": "4:58:28", "remaining_time": "1 day, 5:19:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1575, "total_steps": 10853, "loss": 0.1903, "learning_rate": 4.8774057764992275e-06, "epoch": 0.14511447920025797, "percentage": 14.51, "elapsed_time": "4:58:38", "remaining_time": "1 day, 5:19:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1576, "total_steps": 10853, "loss": 0.1846, "learning_rate": 4.877170041518187e-06, "epoch": 0.145206615377528, "percentage": 14.52, "elapsed_time": "4:58:49", "remaining_time": "1 day, 5:19:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1577, "total_steps": 10853, "loss": 0.1805, "learning_rate": 4.876934085816654e-06, "epoch": 0.145298751554798, "percentage": 14.53, "elapsed_time": "4:59:00", "remaining_time": "1 day, 5:18:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1578, "total_steps": 10853, "loss": 0.1767, "learning_rate": 4.8766979094165346e-06, "epoch": 0.14539088773206799, "percentage": 14.54, "elapsed_time": "4:59:12", "remaining_time": "1 day, 5:18:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1579, "total_steps": 10853, "loss": 0.1773, "learning_rate": 4.8764615123397584e-06, "epoch": 0.145483023909338, "percentage": 14.55, "elapsed_time": "4:59:21", "remaining_time": "1 day, 5:18:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1580, "total_steps": 10853, "loss": 0.1836, "learning_rate": 4.876224894608275e-06, "epoch": 0.145575160086608, "percentage": 14.56, "elapsed_time": "4:59:32", "remaining_time": "1 day, 5:18:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1581, "total_steps": 10853, "loss": 0.1951, "learning_rate": 4.875988056244055e-06, "epoch": 0.145667296263878, "percentage": 14.57, "elapsed_time": "4:59:43", "remaining_time": "1 day, 5:17:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1582, "total_steps": 10853, "loss": 0.1713, "learning_rate": 4.875750997269088e-06, "epoch": 0.14575943244114803, "percentage": 14.58, "elapsed_time": "4:59:53", "remaining_time": "1 day, 5:17:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1583, "total_steps": 10853, "loss": 0.1803, "learning_rate": 4.875513717705385e-06, "epoch": 0.14585156861841803, "percentage": 14.59, "elapsed_time": "5:00:03", "remaining_time": "1 day, 5:17:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1584, "total_steps": 10853, "loss": 0.1804, "learning_rate": 4.875276217574978e-06, "epoch": 0.14594370479568802, "percentage": 14.6, "elapsed_time": "5:00:14", "remaining_time": "1 day, 5:16:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1585, "total_steps": 10853, "loss": 0.1776, "learning_rate": 4.875038496899919e-06, "epoch": 0.14603584097295802, "percentage": 14.6, "elapsed_time": "5:00:24", "remaining_time": "1 day, 5:16:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1586, "total_steps": 10853, "loss": 0.1859, "learning_rate": 4.874800555702278e-06, "epoch": 0.14612797715022804, "percentage": 14.61, "elapsed_time": "5:00:36", "remaining_time": "1 day, 5:16:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1587, "total_steps": 10853, "loss": 0.1852, "learning_rate": 4.874562394004152e-06, "epoch": 0.14622011332749804, "percentage": 14.62, "elapsed_time": "5:00:46", "remaining_time": "1 day, 5:16:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1588, "total_steps": 10853, "loss": 0.1743, "learning_rate": 4.874324011827651e-06, "epoch": 0.14631224950476804, "percentage": 14.63, "elapsed_time": "5:00:57", "remaining_time": "1 day, 5:15:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1589, "total_steps": 10853, "loss": 0.1961, "learning_rate": 4.874085409194911e-06, "epoch": 0.14640438568203806, "percentage": 14.64, "elapsed_time": "5:01:08", "remaining_time": "1 day, 5:15:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1590, "total_steps": 10853, "loss": 0.1683, "learning_rate": 4.873846586128083e-06, "epoch": 0.14649652185930806, "percentage": 14.65, "elapsed_time": "5:01:18", "remaining_time": "1 day, 5:15:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1591, "total_steps": 10853, "loss": 0.1814, "learning_rate": 4.873607542649347e-06, "epoch": 0.14658865803657806, "percentage": 14.66, "elapsed_time": "5:01:28", "remaining_time": "1 day, 5:15:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1592, "total_steps": 10853, "loss": 0.1835, "learning_rate": 4.873368278780893e-06, "epoch": 0.14668079421384805, "percentage": 14.67, "elapsed_time": "5:01:40", "remaining_time": "1 day, 5:14:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1593, "total_steps": 10853, "loss": 0.1687, "learning_rate": 4.87312879454494e-06, "epoch": 0.14677293039111808, "percentage": 14.68, "elapsed_time": "5:01:49", "remaining_time": "1 day, 5:14:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1594, "total_steps": 10853, "loss": 0.1999, "learning_rate": 4.872889089963723e-06, "epoch": 0.14686506656838808, "percentage": 14.69, "elapsed_time": "5:02:00", "remaining_time": "1 day, 5:14:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1595, "total_steps": 10853, "loss": 0.196, "learning_rate": 4.872649165059497e-06, "epoch": 0.14695720274565807, "percentage": 14.7, "elapsed_time": "5:02:10", "remaining_time": "1 day, 5:13:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1596, "total_steps": 10853, "loss": 0.1674, "learning_rate": 4.872409019854543e-06, "epoch": 0.1470493389229281, "percentage": 14.71, "elapsed_time": "5:02:20", "remaining_time": "1 day, 5:13:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1597, "total_steps": 10853, "loss": 0.1735, "learning_rate": 4.872168654371155e-06, "epoch": 0.1471414751001981, "percentage": 14.71, "elapsed_time": "5:02:31", "remaining_time": "1 day, 5:13:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1598, "total_steps": 10853, "loss": 0.1662, "learning_rate": 4.8719280686316524e-06, "epoch": 0.1472336112774681, "percentage": 14.72, "elapsed_time": "5:02:40", "remaining_time": "1 day, 5:12:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1599, "total_steps": 10853, "loss": 0.1887, "learning_rate": 4.871687262658373e-06, "epoch": 0.14732574745473812, "percentage": 14.73, "elapsed_time": "5:02:51", "remaining_time": "1 day, 5:12:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1600, "total_steps": 10853, "loss": 0.1807, "learning_rate": 4.871446236473676e-06, "epoch": 0.1474178836320081, "percentage": 14.74, "elapsed_time": "5:03:03", "remaining_time": "1 day, 5:12:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1601, "total_steps": 10853, "loss": 0.1689, "learning_rate": 4.871204990099941e-06, "epoch": 0.1475100198092781, "percentage": 14.75, "elapsed_time": "5:03:14", "remaining_time": "1 day, 5:12:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1602, "total_steps": 10853, "loss": 0.1768, "learning_rate": 4.870963523559567e-06, "epoch": 0.1476021559865481, "percentage": 14.76, "elapsed_time": "5:03:25", "remaining_time": "1 day, 5:12:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1603, "total_steps": 10853, "loss": 0.2019, "learning_rate": 4.8707218368749755e-06, "epoch": 0.14769429216381813, "percentage": 14.77, "elapsed_time": "5:03:36", "remaining_time": "1 day, 5:11:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1604, "total_steps": 10853, "loss": 0.1846, "learning_rate": 4.870479930068607e-06, "epoch": 0.14778642834108813, "percentage": 14.78, "elapsed_time": "5:03:47", "remaining_time": "1 day, 5:11:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1605, "total_steps": 10853, "loss": 0.1703, "learning_rate": 4.8702378031629204e-06, "epoch": 0.14787856451835812, "percentage": 14.79, "elapsed_time": "5:03:57", "remaining_time": "1 day, 5:11:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1606, "total_steps": 10853, "loss": 0.1724, "learning_rate": 4.869995456180399e-06, "epoch": 0.14797070069562815, "percentage": 14.8, "elapsed_time": "5:04:07", "remaining_time": "1 day, 5:11:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1607, "total_steps": 10853, "loss": 0.1831, "learning_rate": 4.869752889143544e-06, "epoch": 0.14806283687289815, "percentage": 14.81, "elapsed_time": "5:04:17", "remaining_time": "1 day, 5:10:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1608, "total_steps": 10853, "loss": 0.1707, "learning_rate": 4.8695101020748796e-06, "epoch": 0.14815497305016814, "percentage": 14.82, "elapsed_time": "5:04:27", "remaining_time": "1 day, 5:10:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1609, "total_steps": 10853, "loss": 0.1821, "learning_rate": 4.869267094996946e-06, "epoch": 0.14824710922743817, "percentage": 14.83, "elapsed_time": "5:04:39", "remaining_time": "1 day, 5:10:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1610, "total_steps": 10853, "loss": 0.173, "learning_rate": 4.869023867932309e-06, "epoch": 0.14833924540470816, "percentage": 14.83, "elapsed_time": "5:04:51", "remaining_time": "1 day, 5:10:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1611, "total_steps": 10853, "loss": 0.1802, "learning_rate": 4.868780420903549e-06, "epoch": 0.14843138158197816, "percentage": 14.84, "elapsed_time": "5:05:01", "remaining_time": "1 day, 5:09:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1612, "total_steps": 10853, "loss": 0.1892, "learning_rate": 4.868536753933273e-06, "epoch": 0.14852351775924816, "percentage": 14.85, "elapsed_time": "5:05:11", "remaining_time": "1 day, 5:09:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1613, "total_steps": 10853, "loss": 0.1802, "learning_rate": 4.868292867044104e-06, "epoch": 0.14861565393651818, "percentage": 14.86, "elapsed_time": "5:05:22", "remaining_time": "1 day, 5:09:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1614, "total_steps": 10853, "loss": 0.1893, "learning_rate": 4.868048760258688e-06, "epoch": 0.14870779011378818, "percentage": 14.87, "elapsed_time": "5:05:32", "remaining_time": "1 day, 5:09:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1615, "total_steps": 10853, "loss": 0.1895, "learning_rate": 4.86780443359969e-06, "epoch": 0.14879992629105818, "percentage": 14.88, "elapsed_time": "5:05:42", "remaining_time": "1 day, 5:08:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1616, "total_steps": 10853, "loss": 0.1775, "learning_rate": 4.8675598870897945e-06, "epoch": 0.1488920624683282, "percentage": 14.89, "elapsed_time": "5:05:52", "remaining_time": "1 day, 5:08:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1617, "total_steps": 10853, "loss": 0.1766, "learning_rate": 4.86731512075171e-06, "epoch": 0.1489841986455982, "percentage": 14.9, "elapsed_time": "5:06:02", "remaining_time": "1 day, 5:08:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1618, "total_steps": 10853, "loss": 0.1785, "learning_rate": 4.86707013460816e-06, "epoch": 0.1490763348228682, "percentage": 14.91, "elapsed_time": "5:06:13", "remaining_time": "1 day, 5:07:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1619, "total_steps": 10853, "loss": 0.1896, "learning_rate": 4.866824928681895e-06, "epoch": 0.1491684710001382, "percentage": 14.92, "elapsed_time": "5:06:24", "remaining_time": "1 day, 5:07:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1620, "total_steps": 10853, "loss": 0.1908, "learning_rate": 4.86657950299568e-06, "epoch": 0.14926060717740822, "percentage": 14.93, "elapsed_time": "5:06:35", "remaining_time": "1 day, 5:07:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1621, "total_steps": 10853, "loss": 0.1854, "learning_rate": 4.866333857572303e-06, "epoch": 0.1493527433546782, "percentage": 14.94, "elapsed_time": "5:06:45", "remaining_time": "1 day, 5:07:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1622, "total_steps": 10853, "loss": 0.157, "learning_rate": 4.866087992434573e-06, "epoch": 0.1494448795319482, "percentage": 14.95, "elapsed_time": "5:06:56", "remaining_time": "1 day, 5:06:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1623, "total_steps": 10853, "loss": 0.1824, "learning_rate": 4.865841907605319e-06, "epoch": 0.14953701570921824, "percentage": 14.95, "elapsed_time": "5:07:05", "remaining_time": "1 day, 5:06:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1624, "total_steps": 10853, "loss": 0.1777, "learning_rate": 4.865595603107388e-06, "epoch": 0.14962915188648823, "percentage": 14.96, "elapsed_time": "5:07:18", "remaining_time": "1 day, 5:06:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1625, "total_steps": 10853, "loss": 0.1883, "learning_rate": 4.865349078963652e-06, "epoch": 0.14972128806375823, "percentage": 14.97, "elapsed_time": "5:07:28", "remaining_time": "1 day, 5:06:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1626, "total_steps": 10853, "loss": 0.1851, "learning_rate": 4.865102335196999e-06, "epoch": 0.14981342424102825, "percentage": 14.98, "elapsed_time": "5:07:39", "remaining_time": "1 day, 5:05:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1627, "total_steps": 10853, "loss": 0.1826, "learning_rate": 4.8648553718303386e-06, "epoch": 0.14990556041829825, "percentage": 14.99, "elapsed_time": "5:07:48", "remaining_time": "1 day, 5:05:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1628, "total_steps": 10853, "loss": 0.1822, "learning_rate": 4.864608188886603e-06, "epoch": 0.14999769659556825, "percentage": 15.0, "elapsed_time": "5:07:59", "remaining_time": "1 day, 5:05:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1629, "total_steps": 10853, "loss": 0.1828, "learning_rate": 4.8643607863887435e-06, "epoch": 0.15008983277283824, "percentage": 15.01, "elapsed_time": "5:08:09", "remaining_time": "1 day, 5:04:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1630, "total_steps": 10853, "loss": 0.2041, "learning_rate": 4.8641131643597294e-06, "epoch": 0.15018196895010827, "percentage": 15.02, "elapsed_time": "5:08:20", "remaining_time": "1 day, 5:04:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1631, "total_steps": 10853, "loss": 0.1904, "learning_rate": 4.863865322822553e-06, "epoch": 0.15027410512737827, "percentage": 15.03, "elapsed_time": "5:08:31", "remaining_time": "1 day, 5:04:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1632, "total_steps": 10853, "loss": 0.1853, "learning_rate": 4.863617261800229e-06, "epoch": 0.15036624130464826, "percentage": 15.04, "elapsed_time": "5:08:43", "remaining_time": "1 day, 5:04:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1633, "total_steps": 10853, "loss": 0.1869, "learning_rate": 4.863368981315786e-06, "epoch": 0.1504583774819183, "percentage": 15.05, "elapsed_time": "5:08:55", "remaining_time": "1 day, 5:04:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1634, "total_steps": 10853, "loss": 0.1867, "learning_rate": 4.86312048139228e-06, "epoch": 0.15055051365918828, "percentage": 15.06, "elapsed_time": "5:09:05", "remaining_time": "1 day, 5:03:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1635, "total_steps": 10853, "loss": 0.1667, "learning_rate": 4.862871762052782e-06, "epoch": 0.15064264983645828, "percentage": 15.06, "elapsed_time": "5:09:16", "remaining_time": "1 day, 5:03:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1636, "total_steps": 10853, "loss": 0.1788, "learning_rate": 4.862622823320388e-06, "epoch": 0.15073478601372828, "percentage": 15.07, "elapsed_time": "5:09:28", "remaining_time": "1 day, 5:03:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1637, "total_steps": 10853, "loss": 0.1648, "learning_rate": 4.862373665218209e-06, "epoch": 0.1508269221909983, "percentage": 15.08, "elapsed_time": "5:09:39", "remaining_time": "1 day, 5:03:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1638, "total_steps": 10853, "loss": 0.1888, "learning_rate": 4.862124287769382e-06, "epoch": 0.1509190583682683, "percentage": 15.09, "elapsed_time": "5:09:50", "remaining_time": "1 day, 5:03:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1639, "total_steps": 10853, "loss": 0.1736, "learning_rate": 4.86187469099706e-06, "epoch": 0.1510111945455383, "percentage": 15.1, "elapsed_time": "5:10:00", "remaining_time": "1 day, 5:02:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1640, "total_steps": 10853, "loss": 0.1875, "learning_rate": 4.861624874924419e-06, "epoch": 0.15110333072280832, "percentage": 15.11, "elapsed_time": "5:10:11", "remaining_time": "1 day, 5:02:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1641, "total_steps": 10853, "loss": 0.1712, "learning_rate": 4.861374839574654e-06, "epoch": 0.15119546690007832, "percentage": 15.12, "elapsed_time": "5:10:23", "remaining_time": "1 day, 5:02:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1642, "total_steps": 10853, "loss": 0.193, "learning_rate": 4.861124584970981e-06, "epoch": 0.15128760307734831, "percentage": 15.13, "elapsed_time": "5:10:35", "remaining_time": "1 day, 5:02:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1643, "total_steps": 10853, "loss": 0.1775, "learning_rate": 4.860874111136637e-06, "epoch": 0.15137973925461834, "percentage": 15.14, "elapsed_time": "5:10:46", "remaining_time": "1 day, 5:02:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1644, "total_steps": 10853, "loss": 0.1907, "learning_rate": 4.860623418094877e-06, "epoch": 0.15147187543188834, "percentage": 15.15, "elapsed_time": "5:10:56", "remaining_time": "1 day, 5:01:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1645, "total_steps": 10853, "loss": 0.1903, "learning_rate": 4.8603725058689785e-06, "epoch": 0.15156401160915833, "percentage": 15.16, "elapsed_time": "5:11:08", "remaining_time": "1 day, 5:01:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1646, "total_steps": 10853, "loss": 0.1722, "learning_rate": 4.860121374482239e-06, "epoch": 0.15165614778642833, "percentage": 15.17, "elapsed_time": "5:11:19", "remaining_time": "1 day, 5:01:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1647, "total_steps": 10853, "loss": 0.1835, "learning_rate": 4.859870023957976e-06, "epoch": 0.15174828396369835, "percentage": 15.18, "elapsed_time": "5:11:30", "remaining_time": "1 day, 5:01:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1648, "total_steps": 10853, "loss": 0.1555, "learning_rate": 4.8596184543195265e-06, "epoch": 0.15184042014096835, "percentage": 15.18, "elapsed_time": "5:11:40", "remaining_time": "1 day, 5:00:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1649, "total_steps": 10853, "loss": 0.1959, "learning_rate": 4.859366665590251e-06, "epoch": 0.15193255631823835, "percentage": 15.19, "elapsed_time": "5:11:51", "remaining_time": "1 day, 5:00:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1650, "total_steps": 10853, "loss": 0.1843, "learning_rate": 4.859114657793526e-06, "epoch": 0.15202469249550837, "percentage": 15.2, "elapsed_time": "5:12:01", "remaining_time": "1 day, 5:00:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1651, "total_steps": 10853, "loss": 0.1683, "learning_rate": 4.858862430952751e-06, "epoch": 0.15211682867277837, "percentage": 15.21, "elapsed_time": "5:12:13", "remaining_time": "1 day, 5:00:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1652, "total_steps": 10853, "loss": 0.188, "learning_rate": 4.858609985091345e-06, "epoch": 0.15220896485004837, "percentage": 15.22, "elapsed_time": "5:12:26", "remaining_time": "1 day, 5:00:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1653, "total_steps": 10853, "loss": 0.1684, "learning_rate": 4.858357320232749e-06, "epoch": 0.15230110102731836, "percentage": 15.23, "elapsed_time": "5:12:38", "remaining_time": "1 day, 5:00:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1654, "total_steps": 10853, "loss": 0.1672, "learning_rate": 4.858104436400422e-06, "epoch": 0.1523932372045884, "percentage": 15.24, "elapsed_time": "5:12:48", "remaining_time": "1 day, 4:59:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1655, "total_steps": 10853, "loss": 0.1833, "learning_rate": 4.857851333617844e-06, "epoch": 0.15248537338185839, "percentage": 15.25, "elapsed_time": "5:12:59", "remaining_time": "1 day, 4:59:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1656, "total_steps": 10853, "loss": 0.1706, "learning_rate": 4.857598011908515e-06, "epoch": 0.15257750955912838, "percentage": 15.26, "elapsed_time": "5:13:08", "remaining_time": "1 day, 4:59:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1657, "total_steps": 10853, "loss": 0.186, "learning_rate": 4.857344471295958e-06, "epoch": 0.1526696457363984, "percentage": 15.27, "elapsed_time": "5:13:19", "remaining_time": "1 day, 4:58:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1658, "total_steps": 10853, "loss": 0.1812, "learning_rate": 4.857090711803713e-06, "epoch": 0.1527617819136684, "percentage": 15.28, "elapsed_time": "5:13:29", "remaining_time": "1 day, 4:58:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1659, "total_steps": 10853, "loss": 0.1638, "learning_rate": 4.856836733455341e-06, "epoch": 0.1528539180909384, "percentage": 15.29, "elapsed_time": "5:13:39", "remaining_time": "1 day, 4:58:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1660, "total_steps": 10853, "loss": 0.1753, "learning_rate": 4.8565825362744255e-06, "epoch": 0.15294605426820843, "percentage": 15.3, "elapsed_time": "5:13:51", "remaining_time": "1 day, 4:58:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1661, "total_steps": 10853, "loss": 0.1608, "learning_rate": 4.8563281202845666e-06, "epoch": 0.15303819044547842, "percentage": 15.3, "elapsed_time": "5:14:02", "remaining_time": "1 day, 4:57:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1662, "total_steps": 10853, "loss": 0.1871, "learning_rate": 4.85607348550939e-06, "epoch": 0.15313032662274842, "percentage": 15.31, "elapsed_time": "5:14:11", "remaining_time": "1 day, 4:57:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1663, "total_steps": 10853, "loss": 0.1832, "learning_rate": 4.855818631972535e-06, "epoch": 0.15322246280001842, "percentage": 15.32, "elapsed_time": "5:14:21", "remaining_time": "1 day, 4:57:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1664, "total_steps": 10853, "loss": 0.1684, "learning_rate": 4.855563559697668e-06, "epoch": 0.15331459897728844, "percentage": 15.33, "elapsed_time": "5:14:32", "remaining_time": "1 day, 4:56:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1665, "total_steps": 10853, "loss": 0.1647, "learning_rate": 4.855308268708469e-06, "epoch": 0.15340673515455844, "percentage": 15.34, "elapsed_time": "5:14:43", "remaining_time": "1 day, 4:56:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1666, "total_steps": 10853, "loss": 0.1803, "learning_rate": 4.8550527590286455e-06, "epoch": 0.15349887133182843, "percentage": 15.35, "elapsed_time": "5:14:53", "remaining_time": "1 day, 4:56:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1667, "total_steps": 10853, "loss": 0.168, "learning_rate": 4.85479703068192e-06, "epoch": 0.15359100750909846, "percentage": 15.36, "elapsed_time": "5:15:03", "remaining_time": "1 day, 4:56:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1668, "total_steps": 10853, "loss": 0.1746, "learning_rate": 4.854541083692036e-06, "epoch": 0.15368314368636846, "percentage": 15.37, "elapsed_time": "5:15:13", "remaining_time": "1 day, 4:55:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1669, "total_steps": 10853, "loss": 0.1695, "learning_rate": 4.854284918082759e-06, "epoch": 0.15377527986363845, "percentage": 15.38, "elapsed_time": "5:15:23", "remaining_time": "1 day, 4:55:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1670, "total_steps": 10853, "loss": 0.1782, "learning_rate": 4.854028533877874e-06, "epoch": 0.15386741604090845, "percentage": 15.39, "elapsed_time": "5:15:32", "remaining_time": "1 day, 4:55:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1671, "total_steps": 10853, "loss": 0.1767, "learning_rate": 4.8537719311011865e-06, "epoch": 0.15395955221817847, "percentage": 15.4, "elapsed_time": "5:15:43", "remaining_time": "1 day, 4:54:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1672, "total_steps": 10853, "loss": 0.1781, "learning_rate": 4.853515109776522e-06, "epoch": 0.15405168839544847, "percentage": 15.41, "elapsed_time": "5:15:53", "remaining_time": "1 day, 4:54:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1673, "total_steps": 10853, "loss": 0.1655, "learning_rate": 4.8532580699277256e-06, "epoch": 0.15414382457271847, "percentage": 15.42, "elapsed_time": "5:16:04", "remaining_time": "1 day, 4:54:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1674, "total_steps": 10853, "loss": 0.1713, "learning_rate": 4.853000811578665e-06, "epoch": 0.1542359607499885, "percentage": 15.42, "elapsed_time": "5:16:16", "remaining_time": "1 day, 4:54:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1675, "total_steps": 10853, "loss": 0.1772, "learning_rate": 4.852743334753226e-06, "epoch": 0.1543280969272585, "percentage": 15.43, "elapsed_time": "5:16:28", "remaining_time": "1 day, 4:54:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1676, "total_steps": 10853, "loss": 0.1827, "learning_rate": 4.852485639475314e-06, "epoch": 0.1544202331045285, "percentage": 15.44, "elapsed_time": "5:16:39", "remaining_time": "1 day, 4:53:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1677, "total_steps": 10853, "loss": 0.1753, "learning_rate": 4.852227725768857e-06, "epoch": 0.1545123692817985, "percentage": 15.45, "elapsed_time": "5:16:48", "remaining_time": "1 day, 4:53:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1678, "total_steps": 10853, "loss": 0.1828, "learning_rate": 4.8519695936578045e-06, "epoch": 0.1546045054590685, "percentage": 15.46, "elapsed_time": "5:16:59", "remaining_time": "1 day, 4:53:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1679, "total_steps": 10853, "loss": 0.1808, "learning_rate": 4.851711243166121e-06, "epoch": 0.1546966416363385, "percentage": 15.47, "elapsed_time": "5:17:09", "remaining_time": "1 day, 4:52:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1680, "total_steps": 10853, "loss": 0.1898, "learning_rate": 4.851452674317795e-06, "epoch": 0.1547887778136085, "percentage": 15.48, "elapsed_time": "5:17:20", "remaining_time": "1 day, 4:52:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1681, "total_steps": 10853, "loss": 0.1635, "learning_rate": 4.851193887136835e-06, "epoch": 0.15488091399087853, "percentage": 15.49, "elapsed_time": "5:17:32", "remaining_time": "1 day, 4:52:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1682, "total_steps": 10853, "loss": 0.1802, "learning_rate": 4.850934881647271e-06, "epoch": 0.15497305016814852, "percentage": 15.5, "elapsed_time": "5:17:43", "remaining_time": "1 day, 4:52:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1683, "total_steps": 10853, "loss": 0.2002, "learning_rate": 4.850675657873149e-06, "epoch": 0.15506518634541852, "percentage": 15.51, "elapsed_time": "5:17:54", "remaining_time": "1 day, 4:52:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1684, "total_steps": 10853, "loss": 0.1796, "learning_rate": 4.850416215838539e-06, "epoch": 0.15515732252268855, "percentage": 15.52, "elapsed_time": "5:18:04", "remaining_time": "1 day, 4:51:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1685, "total_steps": 10853, "loss": 0.1758, "learning_rate": 4.850156555567531e-06, "epoch": 0.15524945869995854, "percentage": 15.53, "elapsed_time": "5:18:16", "remaining_time": "1 day, 4:51:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1686, "total_steps": 10853, "loss": 0.1774, "learning_rate": 4.849896677084234e-06, "epoch": 0.15534159487722854, "percentage": 15.53, "elapsed_time": "5:18:27", "remaining_time": "1 day, 4:51:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1687, "total_steps": 10853, "loss": 0.2034, "learning_rate": 4.849636580412778e-06, "epoch": 0.15543373105449854, "percentage": 15.54, "elapsed_time": "5:18:37", "remaining_time": "1 day, 4:51:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1688, "total_steps": 10853, "loss": 0.1867, "learning_rate": 4.849376265577312e-06, "epoch": 0.15552586723176856, "percentage": 15.55, "elapsed_time": "5:18:48", "remaining_time": "1 day, 4:50:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1689, "total_steps": 10853, "loss": 0.2, "learning_rate": 4.849115732602006e-06, "epoch": 0.15561800340903856, "percentage": 15.56, "elapsed_time": "5:19:00", "remaining_time": "1 day, 4:50:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1690, "total_steps": 10853, "loss": 0.1634, "learning_rate": 4.848854981511053e-06, "epoch": 0.15571013958630855, "percentage": 15.57, "elapsed_time": "5:19:11", "remaining_time": "1 day, 4:50:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1691, "total_steps": 10853, "loss": 0.1763, "learning_rate": 4.848594012328661e-06, "epoch": 0.15580227576357858, "percentage": 15.58, "elapsed_time": "5:19:23", "remaining_time": "1 day, 4:50:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1692, "total_steps": 10853, "loss": 0.1853, "learning_rate": 4.848332825079063e-06, "epoch": 0.15589441194084858, "percentage": 15.59, "elapsed_time": "5:19:34", "remaining_time": "1 day, 4:50:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1693, "total_steps": 10853, "loss": 0.1715, "learning_rate": 4.848071419786509e-06, "epoch": 0.15598654811811857, "percentage": 15.6, "elapsed_time": "5:19:44", "remaining_time": "1 day, 4:49:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1694, "total_steps": 10853, "loss": 0.1743, "learning_rate": 4.847809796475271e-06, "epoch": 0.1560786842953886, "percentage": 15.61, "elapsed_time": "5:19:55", "remaining_time": "1 day, 4:49:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1695, "total_steps": 10853, "loss": 0.1714, "learning_rate": 4.8475479551696405e-06, "epoch": 0.1561708204726586, "percentage": 15.62, "elapsed_time": "5:20:04", "remaining_time": "1 day, 4:49:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1696, "total_steps": 10853, "loss": 0.1881, "learning_rate": 4.847285895893931e-06, "epoch": 0.1562629566499286, "percentage": 15.63, "elapsed_time": "5:20:14", "remaining_time": "1 day, 4:49:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1697, "total_steps": 10853, "loss": 0.1628, "learning_rate": 4.847023618672472e-06, "epoch": 0.1563550928271986, "percentage": 15.64, "elapsed_time": "5:20:24", "remaining_time": "1 day, 4:48:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1698, "total_steps": 10853, "loss": 0.1644, "learning_rate": 4.846761123529618e-06, "epoch": 0.1564472290044686, "percentage": 15.65, "elapsed_time": "5:20:34", "remaining_time": "1 day, 4:48:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1699, "total_steps": 10853, "loss": 0.1682, "learning_rate": 4.846498410489741e-06, "epoch": 0.1565393651817386, "percentage": 15.65, "elapsed_time": "5:20:45", "remaining_time": "1 day, 4:48:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1700, "total_steps": 10853, "loss": 0.1853, "learning_rate": 4.846235479577234e-06, "epoch": 0.1566315013590086, "percentage": 15.66, "elapsed_time": "5:20:56", "remaining_time": "1 day, 4:47:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1701, "total_steps": 10853, "loss": 0.1927, "learning_rate": 4.845972330816511e-06, "epoch": 0.15672363753627863, "percentage": 15.67, "elapsed_time": "5:21:07", "remaining_time": "1 day, 4:47:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1702, "total_steps": 10853, "loss": 0.1904, "learning_rate": 4.845708964232003e-06, "epoch": 0.15681577371354863, "percentage": 15.68, "elapsed_time": "5:21:18", "remaining_time": "1 day, 4:47:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1703, "total_steps": 10853, "loss": 0.1812, "learning_rate": 4.845445379848167e-06, "epoch": 0.15690790989081863, "percentage": 15.69, "elapsed_time": "5:21:28", "remaining_time": "1 day, 4:47:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1704, "total_steps": 10853, "loss": 0.1826, "learning_rate": 4.845181577689474e-06, "epoch": 0.15700004606808862, "percentage": 15.7, "elapsed_time": "5:21:38", "remaining_time": "1 day, 4:46:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1705, "total_steps": 10853, "loss": 0.1794, "learning_rate": 4.844917557780419e-06, "epoch": 0.15709218224535865, "percentage": 15.71, "elapsed_time": "5:21:49", "remaining_time": "1 day, 4:46:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1706, "total_steps": 10853, "loss": 0.2025, "learning_rate": 4.844653320145517e-06, "epoch": 0.15718431842262864, "percentage": 15.72, "elapsed_time": "5:22:01", "remaining_time": "1 day, 4:46:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1707, "total_steps": 10853, "loss": 0.1754, "learning_rate": 4.844388864809302e-06, "epoch": 0.15727645459989864, "percentage": 15.73, "elapsed_time": "5:22:12", "remaining_time": "1 day, 4:46:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1708, "total_steps": 10853, "loss": 0.1871, "learning_rate": 4.844124191796328e-06, "epoch": 0.15736859077716867, "percentage": 15.74, "elapsed_time": "5:22:22", "remaining_time": "1 day, 4:46:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1709, "total_steps": 10853, "loss": 0.2118, "learning_rate": 4.843859301131171e-06, "epoch": 0.15746072695443866, "percentage": 15.75, "elapsed_time": "5:22:33", "remaining_time": "1 day, 4:45:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1710, "total_steps": 10853, "loss": 0.1991, "learning_rate": 4.843594192838425e-06, "epoch": 0.15755286313170866, "percentage": 15.76, "elapsed_time": "5:22:44", "remaining_time": "1 day, 4:45:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1711, "total_steps": 10853, "loss": 0.1673, "learning_rate": 4.8433288669427055e-06, "epoch": 0.15764499930897868, "percentage": 15.77, "elapsed_time": "5:22:57", "remaining_time": "1 day, 4:45:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1712, "total_steps": 10853, "loss": 0.1813, "learning_rate": 4.84306332346865e-06, "epoch": 0.15773713548624868, "percentage": 15.77, "elapsed_time": "5:23:07", "remaining_time": "1 day, 4:45:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1713, "total_steps": 10853, "loss": 0.1716, "learning_rate": 4.842797562440913e-06, "epoch": 0.15782927166351868, "percentage": 15.78, "elapsed_time": "5:23:18", "remaining_time": "1 day, 4:45:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1714, "total_steps": 10853, "loss": 0.1797, "learning_rate": 4.842531583884168e-06, "epoch": 0.15792140784078867, "percentage": 15.79, "elapsed_time": "5:23:29", "remaining_time": "1 day, 4:44:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1715, "total_steps": 10853, "loss": 0.1949, "learning_rate": 4.842265387823115e-06, "epoch": 0.1580135440180587, "percentage": 15.8, "elapsed_time": "5:23:39", "remaining_time": "1 day, 4:44:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1716, "total_steps": 10853, "loss": 0.1687, "learning_rate": 4.841998974282469e-06, "epoch": 0.1581056801953287, "percentage": 15.81, "elapsed_time": "5:23:49", "remaining_time": "1 day, 4:44:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1717, "total_steps": 10853, "loss": 0.1737, "learning_rate": 4.841732343286965e-06, "epoch": 0.1581978163725987, "percentage": 15.82, "elapsed_time": "5:24:01", "remaining_time": "1 day, 4:44:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1718, "total_steps": 10853, "loss": 0.1811, "learning_rate": 4.841465494861362e-06, "epoch": 0.15828995254986872, "percentage": 15.83, "elapsed_time": "5:24:10", "remaining_time": "1 day, 4:43:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1719, "total_steps": 10853, "loss": 0.1739, "learning_rate": 4.841198429030435e-06, "epoch": 0.15838208872713871, "percentage": 15.84, "elapsed_time": "5:24:21", "remaining_time": "1 day, 4:43:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1720, "total_steps": 10853, "loss": 0.1632, "learning_rate": 4.840931145818982e-06, "epoch": 0.1584742249044087, "percentage": 15.85, "elapsed_time": "5:24:31", "remaining_time": "1 day, 4:43:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1721, "total_steps": 10853, "loss": 0.1721, "learning_rate": 4.84066364525182e-06, "epoch": 0.1585663610816787, "percentage": 15.86, "elapsed_time": "5:24:42", "remaining_time": "1 day, 4:42:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1722, "total_steps": 10853, "loss": 0.1739, "learning_rate": 4.8403959273537875e-06, "epoch": 0.15865849725894873, "percentage": 15.87, "elapsed_time": "5:24:53", "remaining_time": "1 day, 4:42:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1723, "total_steps": 10853, "loss": 0.1902, "learning_rate": 4.8401279921497405e-06, "epoch": 0.15875063343621873, "percentage": 15.88, "elapsed_time": "5:25:03", "remaining_time": "1 day, 4:42:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1724, "total_steps": 10853, "loss": 0.198, "learning_rate": 4.839859839664557e-06, "epoch": 0.15884276961348873, "percentage": 15.89, "elapsed_time": "5:25:13", "remaining_time": "1 day, 4:42:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1725, "total_steps": 10853, "loss": 0.1676, "learning_rate": 4.839591469923137e-06, "epoch": 0.15893490579075875, "percentage": 15.89, "elapsed_time": "5:25:24", "remaining_time": "1 day, 4:41:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1726, "total_steps": 10853, "loss": 0.1838, "learning_rate": 4.8393228829503966e-06, "epoch": 0.15902704196802875, "percentage": 15.9, "elapsed_time": "5:25:35", "remaining_time": "1 day, 4:41:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1727, "total_steps": 10853, "loss": 0.1838, "learning_rate": 4.839054078771275e-06, "epoch": 0.15911917814529875, "percentage": 15.91, "elapsed_time": "5:25:45", "remaining_time": "1 day, 4:41:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1728, "total_steps": 10853, "loss": 0.1835, "learning_rate": 4.83878505741073e-06, "epoch": 0.15921131432256877, "percentage": 15.92, "elapsed_time": "5:25:56", "remaining_time": "1 day, 4:41:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1729, "total_steps": 10853, "loss": 0.172, "learning_rate": 4.838515818893741e-06, "epoch": 0.15930345049983877, "percentage": 15.93, "elapsed_time": "5:26:05", "remaining_time": "1 day, 4:40:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1730, "total_steps": 10853, "loss": 0.1641, "learning_rate": 4.838246363245306e-06, "epoch": 0.15939558667710876, "percentage": 15.94, "elapsed_time": "5:26:16", "remaining_time": "1 day, 4:40:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1731, "total_steps": 10853, "loss": 0.1905, "learning_rate": 4.837976690490445e-06, "epoch": 0.15948772285437876, "percentage": 15.95, "elapsed_time": "5:26:28", "remaining_time": "1 day, 4:40:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1732, "total_steps": 10853, "loss": 0.1769, "learning_rate": 4.837706800654197e-06, "epoch": 0.15957985903164879, "percentage": 15.96, "elapsed_time": "5:26:40", "remaining_time": "1 day, 4:40:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1733, "total_steps": 10853, "loss": 0.1803, "learning_rate": 4.83743669376162e-06, "epoch": 0.15967199520891878, "percentage": 15.97, "elapsed_time": "5:26:50", "remaining_time": "1 day, 4:40:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1734, "total_steps": 10853, "loss": 0.1683, "learning_rate": 4.8371663698377955e-06, "epoch": 0.15976413138618878, "percentage": 15.98, "elapsed_time": "5:27:01", "remaining_time": "1 day, 4:39:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1735, "total_steps": 10853, "loss": 0.1851, "learning_rate": 4.836895828907822e-06, "epoch": 0.1598562675634588, "percentage": 15.99, "elapsed_time": "5:27:12", "remaining_time": "1 day, 4:39:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1736, "total_steps": 10853, "loss": 0.188, "learning_rate": 4.836625070996818e-06, "epoch": 0.1599484037407288, "percentage": 16.0, "elapsed_time": "5:27:21", "remaining_time": "1 day, 4:39:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1737, "total_steps": 10853, "loss": 0.1659, "learning_rate": 4.836354096129926e-06, "epoch": 0.1600405399179988, "percentage": 16.0, "elapsed_time": "5:27:32", "remaining_time": "1 day, 4:38:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1738, "total_steps": 10853, "loss": 0.1832, "learning_rate": 4.8360829043323046e-06, "epoch": 0.1601326760952688, "percentage": 16.01, "elapsed_time": "5:27:43", "remaining_time": "1 day, 4:38:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1739, "total_steps": 10853, "loss": 0.175, "learning_rate": 4.835811495629134e-06, "epoch": 0.16022481227253882, "percentage": 16.02, "elapsed_time": "5:27:53", "remaining_time": "1 day, 4:38:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1740, "total_steps": 10853, "loss": 0.1992, "learning_rate": 4.835539870045613e-06, "epoch": 0.16031694844980882, "percentage": 16.03, "elapsed_time": "5:28:03", "remaining_time": "1 day, 4:38:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1741, "total_steps": 10853, "loss": 0.1653, "learning_rate": 4.8352680276069654e-06, "epoch": 0.1604090846270788, "percentage": 16.04, "elapsed_time": "5:28:14", "remaining_time": "1 day, 4:37:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1742, "total_steps": 10853, "loss": 0.1795, "learning_rate": 4.83499596833843e-06, "epoch": 0.16050122080434884, "percentage": 16.05, "elapsed_time": "5:28:25", "remaining_time": "1 day, 4:37:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1743, "total_steps": 10853, "loss": 0.1817, "learning_rate": 4.834723692265268e-06, "epoch": 0.16059335698161883, "percentage": 16.06, "elapsed_time": "5:28:36", "remaining_time": "1 day, 4:37:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1744, "total_steps": 10853, "loss": 0.1781, "learning_rate": 4.834451199412759e-06, "epoch": 0.16068549315888883, "percentage": 16.07, "elapsed_time": "5:28:47", "remaining_time": "1 day, 4:37:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1745, "total_steps": 10853, "loss": 0.1819, "learning_rate": 4.8341784898062056e-06, "epoch": 0.16077762933615886, "percentage": 16.08, "elapsed_time": "5:28:57", "remaining_time": "1 day, 4:37:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1746, "total_steps": 10853, "loss": 0.1706, "learning_rate": 4.833905563470928e-06, "epoch": 0.16086976551342885, "percentage": 16.09, "elapsed_time": "5:29:07", "remaining_time": "1 day, 4:36:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1747, "total_steps": 10853, "loss": 0.1831, "learning_rate": 4.833632420432267e-06, "epoch": 0.16096190169069885, "percentage": 16.1, "elapsed_time": "5:29:18", "remaining_time": "1 day, 4:36:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1748, "total_steps": 10853, "loss": 0.19, "learning_rate": 4.833359060715586e-06, "epoch": 0.16105403786796885, "percentage": 16.11, "elapsed_time": "5:29:29", "remaining_time": "1 day, 4:36:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1749, "total_steps": 10853, "loss": 0.1804, "learning_rate": 4.8330854843462635e-06, "epoch": 0.16114617404523887, "percentage": 16.12, "elapsed_time": "5:29:40", "remaining_time": "1 day, 4:36:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1750, "total_steps": 10853, "loss": 0.1804, "learning_rate": 4.832811691349703e-06, "epoch": 0.16123831022250887, "percentage": 16.12, "elapsed_time": "5:29:51", "remaining_time": "1 day, 4:35:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1751, "total_steps": 10853, "loss": 0.1827, "learning_rate": 4.832537681751327e-06, "epoch": 0.16133044639977887, "percentage": 16.13, "elapsed_time": "5:30:03", "remaining_time": "1 day, 4:35:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1752, "total_steps": 10853, "loss": 0.1972, "learning_rate": 4.832263455576576e-06, "epoch": 0.1614225825770489, "percentage": 16.14, "elapsed_time": "5:30:14", "remaining_time": "1 day, 4:35:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1753, "total_steps": 10853, "loss": 0.1822, "learning_rate": 4.8319890128509115e-06, "epoch": 0.1615147187543189, "percentage": 16.15, "elapsed_time": "5:30:25", "remaining_time": "1 day, 4:35:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1754, "total_steps": 10853, "loss": 0.1886, "learning_rate": 4.831714353599817e-06, "epoch": 0.16160685493158888, "percentage": 16.16, "elapsed_time": "5:30:35", "remaining_time": "1 day, 4:34:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1755, "total_steps": 10853, "loss": 0.1725, "learning_rate": 4.831439477848793e-06, "epoch": 0.16169899110885888, "percentage": 16.17, "elapsed_time": "5:30:45", "remaining_time": "1 day, 4:34:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1756, "total_steps": 10853, "loss": 0.1589, "learning_rate": 4.831164385623362e-06, "epoch": 0.1617911272861289, "percentage": 16.18, "elapsed_time": "5:30:54", "remaining_time": "1 day, 4:34:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1757, "total_steps": 10853, "loss": 0.1746, "learning_rate": 4.830889076949069e-06, "epoch": 0.1618832634633989, "percentage": 16.19, "elapsed_time": "5:31:06", "remaining_time": "1 day, 4:34:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1758, "total_steps": 10853, "loss": 0.1681, "learning_rate": 4.830613551851473e-06, "epoch": 0.1619753996406689, "percentage": 16.2, "elapsed_time": "5:31:17", "remaining_time": "1 day, 4:33:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1759, "total_steps": 10853, "loss": 0.1776, "learning_rate": 4.830337810356157e-06, "epoch": 0.16206753581793892, "percentage": 16.21, "elapsed_time": "5:31:26", "remaining_time": "1 day, 4:33:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1760, "total_steps": 10853, "loss": 0.1828, "learning_rate": 4.830061852488726e-06, "epoch": 0.16215967199520892, "percentage": 16.22, "elapsed_time": "5:31:38", "remaining_time": "1 day, 4:33:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1761, "total_steps": 10853, "loss": 0.1839, "learning_rate": 4.829785678274801e-06, "epoch": 0.16225180817247892, "percentage": 16.23, "elapsed_time": "5:31:48", "remaining_time": "1 day, 4:33:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1762, "total_steps": 10853, "loss": 0.1788, "learning_rate": 4.829509287740024e-06, "epoch": 0.16234394434974894, "percentage": 16.24, "elapsed_time": "5:32:00", "remaining_time": "1 day, 4:32:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1763, "total_steps": 10853, "loss": 0.188, "learning_rate": 4.82923268091006e-06, "epoch": 0.16243608052701894, "percentage": 16.24, "elapsed_time": "5:32:11", "remaining_time": "1 day, 4:32:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1764, "total_steps": 10853, "loss": 0.191, "learning_rate": 4.828955857810591e-06, "epoch": 0.16252821670428894, "percentage": 16.25, "elapsed_time": "5:32:20", "remaining_time": "1 day, 4:32:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1765, "total_steps": 10853, "loss": 0.1763, "learning_rate": 4.828678818467319e-06, "epoch": 0.16262035288155893, "percentage": 16.26, "elapsed_time": "5:32:32", "remaining_time": "1 day, 4:32:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1766, "total_steps": 10853, "loss": 0.2075, "learning_rate": 4.828401562905969e-06, "epoch": 0.16271248905882896, "percentage": 16.27, "elapsed_time": "5:32:44", "remaining_time": "1 day, 4:32:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1767, "total_steps": 10853, "loss": 0.1737, "learning_rate": 4.828124091152283e-06, "epoch": 0.16280462523609895, "percentage": 16.28, "elapsed_time": "5:32:54", "remaining_time": "1 day, 4:31:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1768, "total_steps": 10853, "loss": 0.1928, "learning_rate": 4.827846403232024e-06, "epoch": 0.16289676141336895, "percentage": 16.29, "elapsed_time": "5:33:05", "remaining_time": "1 day, 4:31:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1769, "total_steps": 10853, "loss": 0.1722, "learning_rate": 4.827568499170977e-06, "epoch": 0.16298889759063898, "percentage": 16.3, "elapsed_time": "5:33:16", "remaining_time": "1 day, 4:31:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1770, "total_steps": 10853, "loss": 0.1732, "learning_rate": 4.8272903789949435e-06, "epoch": 0.16308103376790897, "percentage": 16.31, "elapsed_time": "5:33:26", "remaining_time": "1 day, 4:31:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1771, "total_steps": 10853, "loss": 0.1892, "learning_rate": 4.8270120427297485e-06, "epoch": 0.16317316994517897, "percentage": 16.32, "elapsed_time": "5:33:37", "remaining_time": "1 day, 4:30:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1772, "total_steps": 10853, "loss": 0.1798, "learning_rate": 4.8267334904012345e-06, "epoch": 0.16326530612244897, "percentage": 16.33, "elapsed_time": "5:33:47", "remaining_time": "1 day, 4:30:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1773, "total_steps": 10853, "loss": 0.1862, "learning_rate": 4.8264547220352655e-06, "epoch": 0.163357442299719, "percentage": 16.34, "elapsed_time": "5:33:58", "remaining_time": "1 day, 4:30:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1774, "total_steps": 10853, "loss": 0.1913, "learning_rate": 4.826175737657725e-06, "epoch": 0.163449578476989, "percentage": 16.35, "elapsed_time": "5:34:08", "remaining_time": "1 day, 4:30:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1775, "total_steps": 10853, "loss": 0.1854, "learning_rate": 4.825896537294518e-06, "epoch": 0.16354171465425899, "percentage": 16.35, "elapsed_time": "5:34:21", "remaining_time": "1 day, 4:29:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1776, "total_steps": 10853, "loss": 0.1747, "learning_rate": 4.825617120971566e-06, "epoch": 0.163633850831529, "percentage": 16.36, "elapsed_time": "5:34:31", "remaining_time": "1 day, 4:29:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1777, "total_steps": 10853, "loss": 0.185, "learning_rate": 4.825337488714814e-06, "epoch": 0.163725987008799, "percentage": 16.37, "elapsed_time": "5:34:42", "remaining_time": "1 day, 4:29:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1778, "total_steps": 10853, "loss": 0.1875, "learning_rate": 4.825057640550226e-06, "epoch": 0.163818123186069, "percentage": 16.38, "elapsed_time": "5:34:52", "remaining_time": "1 day, 4:29:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1779, "total_steps": 10853, "loss": 0.1832, "learning_rate": 4.824777576503786e-06, "epoch": 0.16391025936333903, "percentage": 16.39, "elapsed_time": "5:35:02", "remaining_time": "1 day, 4:28:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1780, "total_steps": 10853, "loss": 0.1743, "learning_rate": 4.824497296601499e-06, "epoch": 0.16400239554060903, "percentage": 16.4, "elapsed_time": "5:35:13", "remaining_time": "1 day, 4:28:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1781, "total_steps": 10853, "loss": 0.1688, "learning_rate": 4.8242168008693864e-06, "epoch": 0.16409453171787902, "percentage": 16.41, "elapsed_time": "5:35:22", "remaining_time": "1 day, 4:28:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1782, "total_steps": 10853, "loss": 0.1679, "learning_rate": 4.823936089333494e-06, "epoch": 0.16418666789514902, "percentage": 16.42, "elapsed_time": "5:35:32", "remaining_time": "1 day, 4:27:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1783, "total_steps": 10853, "loss": 0.1616, "learning_rate": 4.823655162019886e-06, "epoch": 0.16427880407241904, "percentage": 16.43, "elapsed_time": "5:35:43", "remaining_time": "1 day, 4:27:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1784, "total_steps": 10853, "loss": 0.1665, "learning_rate": 4.823374018954646e-06, "epoch": 0.16437094024968904, "percentage": 16.44, "elapsed_time": "5:35:54", "remaining_time": "1 day, 4:27:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1785, "total_steps": 10853, "loss": 0.1528, "learning_rate": 4.823092660163878e-06, "epoch": 0.16446307642695904, "percentage": 16.45, "elapsed_time": "5:36:04", "remaining_time": "1 day, 4:27:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1786, "total_steps": 10853, "loss": 0.1691, "learning_rate": 4.822811085673706e-06, "epoch": 0.16455521260422906, "percentage": 16.46, "elapsed_time": "5:36:14", "remaining_time": "1 day, 4:27:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1787, "total_steps": 10853, "loss": 0.1568, "learning_rate": 4.822529295510276e-06, "epoch": 0.16464734878149906, "percentage": 16.47, "elapsed_time": "5:36:24", "remaining_time": "1 day, 4:26:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1788, "total_steps": 10853, "loss": 0.1783, "learning_rate": 4.82224728969975e-06, "epoch": 0.16473948495876906, "percentage": 16.47, "elapsed_time": "5:36:35", "remaining_time": "1 day, 4:26:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1789, "total_steps": 10853, "loss": 0.1727, "learning_rate": 4.821965068268314e-06, "epoch": 0.16483162113603905, "percentage": 16.48, "elapsed_time": "5:36:46", "remaining_time": "1 day, 4:26:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1790, "total_steps": 10853, "loss": 0.1741, "learning_rate": 4.82168263124217e-06, "epoch": 0.16492375731330908, "percentage": 16.49, "elapsed_time": "5:36:56", "remaining_time": "1 day, 4:25:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1791, "total_steps": 10853, "loss": 0.186, "learning_rate": 4.8213999786475455e-06, "epoch": 0.16501589349057907, "percentage": 16.5, "elapsed_time": "5:37:08", "remaining_time": "1 day, 4:25:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1792, "total_steps": 10853, "loss": 0.1634, "learning_rate": 4.821117110510683e-06, "epoch": 0.16510802966784907, "percentage": 16.51, "elapsed_time": "5:37:20", "remaining_time": "1 day, 4:25:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1793, "total_steps": 10853, "loss": 0.1793, "learning_rate": 4.820834026857846e-06, "epoch": 0.1652001658451191, "percentage": 16.52, "elapsed_time": "5:37:30", "remaining_time": "1 day, 4:25:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1794, "total_steps": 10853, "loss": 0.1889, "learning_rate": 4.820550727715321e-06, "epoch": 0.1652923020223891, "percentage": 16.53, "elapsed_time": "5:37:41", "remaining_time": "1 day, 4:25:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1795, "total_steps": 10853, "loss": 0.1724, "learning_rate": 4.820267213109409e-06, "epoch": 0.1653844381996591, "percentage": 16.54, "elapsed_time": "5:37:52", "remaining_time": "1 day, 4:24:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1796, "total_steps": 10853, "loss": 0.1777, "learning_rate": 4.8199834830664395e-06, "epoch": 0.16547657437692911, "percentage": 16.55, "elapsed_time": "5:38:04", "remaining_time": "1 day, 4:24:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1797, "total_steps": 10853, "loss": 0.1615, "learning_rate": 4.819699537612752e-06, "epoch": 0.1655687105541991, "percentage": 16.56, "elapsed_time": "5:38:14", "remaining_time": "1 day, 4:24:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1798, "total_steps": 10853, "loss": 0.1827, "learning_rate": 4.819415376774714e-06, "epoch": 0.1656608467314691, "percentage": 16.57, "elapsed_time": "5:38:26", "remaining_time": "1 day, 4:24:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1799, "total_steps": 10853, "loss": 0.1843, "learning_rate": 4.819131000578707e-06, "epoch": 0.1657529829087391, "percentage": 16.58, "elapsed_time": "5:38:36", "remaining_time": "1 day, 4:24:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1800, "total_steps": 10853, "loss": 0.1813, "learning_rate": 4.818846409051139e-06, "epoch": 0.16584511908600913, "percentage": 16.59, "elapsed_time": "5:38:46", "remaining_time": "1 day, 4:23:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1801, "total_steps": 10853, "loss": 0.1838, "learning_rate": 4.818561602218431e-06, "epoch": 0.16593725526327913, "percentage": 16.59, "elapsed_time": "5:38:58", "remaining_time": "1 day, 4:23:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1802, "total_steps": 10853, "loss": 0.1702, "learning_rate": 4.818276580107029e-06, "epoch": 0.16602939144054912, "percentage": 16.6, "elapsed_time": "5:39:08", "remaining_time": "1 day, 4:23:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1803, "total_steps": 10853, "loss": 0.1735, "learning_rate": 4.817991342743396e-06, "epoch": 0.16612152761781915, "percentage": 16.61, "elapsed_time": "5:39:18", "remaining_time": "1 day, 4:23:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1804, "total_steps": 10853, "loss": 0.1796, "learning_rate": 4.81770589015402e-06, "epoch": 0.16621366379508914, "percentage": 16.62, "elapsed_time": "5:39:28", "remaining_time": "1 day, 4:22:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1805, "total_steps": 10853, "loss": 0.1843, "learning_rate": 4.8174202223654e-06, "epoch": 0.16630579997235914, "percentage": 16.63, "elapsed_time": "5:39:38", "remaining_time": "1 day, 4:22:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1806, "total_steps": 10853, "loss": 0.1745, "learning_rate": 4.8171343394040645e-06, "epoch": 0.16639793614962914, "percentage": 16.64, "elapsed_time": "5:39:48", "remaining_time": "1 day, 4:22:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1807, "total_steps": 10853, "loss": 0.1695, "learning_rate": 4.816848241296556e-06, "epoch": 0.16649007232689916, "percentage": 16.65, "elapsed_time": "5:39:59", "remaining_time": "1 day, 4:22:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1808, "total_steps": 10853, "loss": 0.1825, "learning_rate": 4.816561928069439e-06, "epoch": 0.16658220850416916, "percentage": 16.66, "elapsed_time": "5:40:10", "remaining_time": "1 day, 4:21:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1809, "total_steps": 10853, "loss": 0.1758, "learning_rate": 4.8162753997492965e-06, "epoch": 0.16667434468143916, "percentage": 16.67, "elapsed_time": "5:40:21", "remaining_time": "1 day, 4:21:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1810, "total_steps": 10853, "loss": 0.1908, "learning_rate": 4.815988656362735e-06, "epoch": 0.16676648085870918, "percentage": 16.68, "elapsed_time": "5:40:32", "remaining_time": "1 day, 4:21:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1811, "total_steps": 10853, "loss": 0.1817, "learning_rate": 4.815701697936377e-06, "epoch": 0.16685861703597918, "percentage": 16.69, "elapsed_time": "5:40:43", "remaining_time": "1 day, 4:21:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1812, "total_steps": 10853, "loss": 0.1689, "learning_rate": 4.815414524496867e-06, "epoch": 0.16695075321324918, "percentage": 16.7, "elapsed_time": "5:40:53", "remaining_time": "1 day, 4:20:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1813, "total_steps": 10853, "loss": 0.1817, "learning_rate": 4.8151271360708704e-06, "epoch": 0.1670428893905192, "percentage": 16.71, "elapsed_time": "5:41:04", "remaining_time": "1 day, 4:20:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1814, "total_steps": 10853, "loss": 0.1794, "learning_rate": 4.814839532685069e-06, "epoch": 0.1671350255677892, "percentage": 16.71, "elapsed_time": "5:41:15", "remaining_time": "1 day, 4:20:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1815, "total_steps": 10853, "loss": 0.1775, "learning_rate": 4.814551714366168e-06, "epoch": 0.1672271617450592, "percentage": 16.72, "elapsed_time": "5:41:25", "remaining_time": "1 day, 4:20:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1816, "total_steps": 10853, "loss": 0.1789, "learning_rate": 4.814263681140892e-06, "epoch": 0.1673192979223292, "percentage": 16.73, "elapsed_time": "5:41:34", "remaining_time": "1 day, 4:19:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1817, "total_steps": 10853, "loss": 0.18, "learning_rate": 4.813975433035984e-06, "epoch": 0.16741143409959922, "percentage": 16.74, "elapsed_time": "5:41:44", "remaining_time": "1 day, 4:19:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1818, "total_steps": 10853, "loss": 0.1861, "learning_rate": 4.813686970078207e-06, "epoch": 0.1675035702768692, "percentage": 16.75, "elapsed_time": "5:41:53", "remaining_time": "1 day, 4:19:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1819, "total_steps": 10853, "loss": 0.1782, "learning_rate": 4.813398292294345e-06, "epoch": 0.1675957064541392, "percentage": 16.76, "elapsed_time": "5:42:04", "remaining_time": "1 day, 4:18:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1820, "total_steps": 10853, "loss": 0.1605, "learning_rate": 4.813109399711204e-06, "epoch": 0.16768784263140923, "percentage": 16.77, "elapsed_time": "5:42:15", "remaining_time": "1 day, 4:18:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1821, "total_steps": 10853, "loss": 0.1768, "learning_rate": 4.812820292355607e-06, "epoch": 0.16777997880867923, "percentage": 16.78, "elapsed_time": "5:42:26", "remaining_time": "1 day, 4:18:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1822, "total_steps": 10853, "loss": 0.1768, "learning_rate": 4.812530970254396e-06, "epoch": 0.16787211498594923, "percentage": 16.79, "elapsed_time": "5:42:37", "remaining_time": "1 day, 4:18:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1823, "total_steps": 10853, "loss": 0.188, "learning_rate": 4.812241433434436e-06, "epoch": 0.16796425116321922, "percentage": 16.8, "elapsed_time": "5:42:48", "remaining_time": "1 day, 4:18:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1824, "total_steps": 10853, "loss": 0.1749, "learning_rate": 4.81195168192261e-06, "epoch": 0.16805638734048925, "percentage": 16.81, "elapsed_time": "5:42:59", "remaining_time": "1 day, 4:17:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1825, "total_steps": 10853, "loss": 0.1782, "learning_rate": 4.81166171574582e-06, "epoch": 0.16814852351775925, "percentage": 16.82, "elapsed_time": "5:43:11", "remaining_time": "1 day, 4:17:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1826, "total_steps": 10853, "loss": 0.1805, "learning_rate": 4.811371534930993e-06, "epoch": 0.16824065969502924, "percentage": 16.82, "elapsed_time": "5:43:21", "remaining_time": "1 day, 4:17:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1827, "total_steps": 10853, "loss": 0.1696, "learning_rate": 4.8110811395050695e-06, "epoch": 0.16833279587229927, "percentage": 16.83, "elapsed_time": "5:43:32", "remaining_time": "1 day, 4:17:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1828, "total_steps": 10853, "loss": 0.1791, "learning_rate": 4.810790529495013e-06, "epoch": 0.16842493204956926, "percentage": 16.84, "elapsed_time": "5:43:42", "remaining_time": "1 day, 4:16:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1829, "total_steps": 10853, "loss": 0.1723, "learning_rate": 4.810499704927808e-06, "epoch": 0.16851706822683926, "percentage": 16.85, "elapsed_time": "5:43:53", "remaining_time": "1 day, 4:16:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1830, "total_steps": 10853, "loss": 0.1907, "learning_rate": 4.810208665830456e-06, "epoch": 0.1686092044041093, "percentage": 16.86, "elapsed_time": "5:44:03", "remaining_time": "1 day, 4:16:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1831, "total_steps": 10853, "loss": 0.1788, "learning_rate": 4.809917412229981e-06, "epoch": 0.16870134058137928, "percentage": 16.87, "elapsed_time": "5:44:14", "remaining_time": "1 day, 4:16:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1832, "total_steps": 10853, "loss": 0.1617, "learning_rate": 4.809625944153425e-06, "epoch": 0.16879347675864928, "percentage": 16.88, "elapsed_time": "5:44:25", "remaining_time": "1 day, 4:15:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1833, "total_steps": 10853, "loss": 0.1809, "learning_rate": 4.8093342616278525e-06, "epoch": 0.16888561293591928, "percentage": 16.89, "elapsed_time": "5:44:36", "remaining_time": "1 day, 4:15:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1834, "total_steps": 10853, "loss": 0.1634, "learning_rate": 4.809042364680345e-06, "epoch": 0.1689777491131893, "percentage": 16.9, "elapsed_time": "5:44:47", "remaining_time": "1 day, 4:15:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1835, "total_steps": 10853, "loss": 0.1871, "learning_rate": 4.808750253338006e-06, "epoch": 0.1690698852904593, "percentage": 16.91, "elapsed_time": "5:44:57", "remaining_time": "1 day, 4:15:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1836, "total_steps": 10853, "loss": 0.176, "learning_rate": 4.8084579276279565e-06, "epoch": 0.1691620214677293, "percentage": 16.92, "elapsed_time": "5:45:09", "remaining_time": "1 day, 4:15:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1837, "total_steps": 10853, "loss": 0.1954, "learning_rate": 4.80816538757734e-06, "epoch": 0.16925415764499932, "percentage": 16.93, "elapsed_time": "5:45:20", "remaining_time": "1 day, 4:14:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1838, "total_steps": 10853, "loss": 0.1638, "learning_rate": 4.80787263321332e-06, "epoch": 0.16934629382226932, "percentage": 16.94, "elapsed_time": "5:45:30", "remaining_time": "1 day, 4:14:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1839, "total_steps": 10853, "loss": 0.1839, "learning_rate": 4.8075796645630764e-06, "epoch": 0.16943842999953931, "percentage": 16.94, "elapsed_time": "5:45:39", "remaining_time": "1 day, 4:14:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1840, "total_steps": 10853, "loss": 0.1719, "learning_rate": 4.807286481653813e-06, "epoch": 0.1695305661768093, "percentage": 16.95, "elapsed_time": "5:45:50", "remaining_time": "1 day, 4:14:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1841, "total_steps": 10853, "loss": 0.1786, "learning_rate": 4.806993084512752e-06, "epoch": 0.16962270235407934, "percentage": 16.96, "elapsed_time": "5:46:01", "remaining_time": "1 day, 4:13:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1842, "total_steps": 10853, "loss": 0.1916, "learning_rate": 4.806699473167134e-06, "epoch": 0.16971483853134933, "percentage": 16.97, "elapsed_time": "5:46:11", "remaining_time": "1 day, 4:13:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1843, "total_steps": 10853, "loss": 0.1826, "learning_rate": 4.806405647644222e-06, "epoch": 0.16980697470861933, "percentage": 16.98, "elapsed_time": "5:46:23", "remaining_time": "1 day, 4:13:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1844, "total_steps": 10853, "loss": 0.1751, "learning_rate": 4.806111607971298e-06, "epoch": 0.16989911088588935, "percentage": 16.99, "elapsed_time": "5:46:33", "remaining_time": "1 day, 4:13:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1845, "total_steps": 10853, "loss": 0.1715, "learning_rate": 4.805817354175663e-06, "epoch": 0.16999124706315935, "percentage": 17.0, "elapsed_time": "5:46:43", "remaining_time": "1 day, 4:12:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1846, "total_steps": 10853, "loss": 0.1731, "learning_rate": 4.805522886284637e-06, "epoch": 0.17008338324042935, "percentage": 17.01, "elapsed_time": "5:46:55", "remaining_time": "1 day, 4:12:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1847, "total_steps": 10853, "loss": 0.1777, "learning_rate": 4.8052282043255635e-06, "epoch": 0.17017551941769937, "percentage": 17.02, "elapsed_time": "5:47:07", "remaining_time": "1 day, 4:12:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1848, "total_steps": 10853, "loss": 0.1694, "learning_rate": 4.804933308325804e-06, "epoch": 0.17026765559496937, "percentage": 17.03, "elapsed_time": "5:47:17", "remaining_time": "1 day, 4:12:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1849, "total_steps": 10853, "loss": 0.2018, "learning_rate": 4.8046381983127385e-06, "epoch": 0.17035979177223937, "percentage": 17.04, "elapsed_time": "5:47:26", "remaining_time": "1 day, 4:11:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1850, "total_steps": 10853, "loss": 0.1867, "learning_rate": 4.8043428743137675e-06, "epoch": 0.17045192794950936, "percentage": 17.05, "elapsed_time": "5:47:38", "remaining_time": "1 day, 4:11:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1851, "total_steps": 10853, "loss": 0.1637, "learning_rate": 4.8040473363563136e-06, "epoch": 0.1705440641267794, "percentage": 17.06, "elapsed_time": "5:47:47", "remaining_time": "1 day, 4:11:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1852, "total_steps": 10853, "loss": 0.1866, "learning_rate": 4.8037515844678165e-06, "epoch": 0.17063620030404938, "percentage": 17.06, "elapsed_time": "5:47:59", "remaining_time": "1 day, 4:11:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1853, "total_steps": 10853, "loss": 0.1784, "learning_rate": 4.803455618675736e-06, "epoch": 0.17072833648131938, "percentage": 17.07, "elapsed_time": "5:48:09", "remaining_time": "1 day, 4:11:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1854, "total_steps": 10853, "loss": 0.1678, "learning_rate": 4.803159439007554e-06, "epoch": 0.1708204726585894, "percentage": 17.08, "elapsed_time": "5:48:20", "remaining_time": "1 day, 4:10:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1855, "total_steps": 10853, "loss": 0.1844, "learning_rate": 4.80286304549077e-06, "epoch": 0.1709126088358594, "percentage": 17.09, "elapsed_time": "5:48:31", "remaining_time": "1 day, 4:10:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1856, "total_steps": 10853, "loss": 0.1707, "learning_rate": 4.802566438152904e-06, "epoch": 0.1710047450131294, "percentage": 17.1, "elapsed_time": "5:48:43", "remaining_time": "1 day, 4:10:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1857, "total_steps": 10853, "loss": 0.1965, "learning_rate": 4.802269617021497e-06, "epoch": 0.1710968811903994, "percentage": 17.11, "elapsed_time": "5:48:55", "remaining_time": "1 day, 4:10:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1858, "total_steps": 10853, "loss": 0.1855, "learning_rate": 4.801972582124108e-06, "epoch": 0.17118901736766942, "percentage": 17.12, "elapsed_time": "5:49:04", "remaining_time": "1 day, 4:09:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1859, "total_steps": 10853, "loss": 0.1846, "learning_rate": 4.801675333488317e-06, "epoch": 0.17128115354493942, "percentage": 17.13, "elapsed_time": "5:49:14", "remaining_time": "1 day, 4:09:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1860, "total_steps": 10853, "loss": 0.1818, "learning_rate": 4.801377871141723e-06, "epoch": 0.17137328972220942, "percentage": 17.14, "elapsed_time": "5:49:25", "remaining_time": "1 day, 4:09:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1861, "total_steps": 10853, "loss": 0.1728, "learning_rate": 4.801080195111948e-06, "epoch": 0.17146542589947944, "percentage": 17.15, "elapsed_time": "5:49:37", "remaining_time": "1 day, 4:09:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1862, "total_steps": 10853, "loss": 0.1736, "learning_rate": 4.800782305426628e-06, "epoch": 0.17155756207674944, "percentage": 17.16, "elapsed_time": "5:49:49", "remaining_time": "1 day, 4:09:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1863, "total_steps": 10853, "loss": 0.1725, "learning_rate": 4.800484202113423e-06, "epoch": 0.17164969825401943, "percentage": 17.17, "elapsed_time": "5:50:00", "remaining_time": "1 day, 4:08:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1864, "total_steps": 10853, "loss": 0.1723, "learning_rate": 4.800185885200013e-06, "epoch": 0.17174183443128946, "percentage": 17.17, "elapsed_time": "5:50:12", "remaining_time": "1 day, 4:08:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1865, "total_steps": 10853, "loss": 0.1721, "learning_rate": 4.7998873547140954e-06, "epoch": 0.17183397060855946, "percentage": 17.18, "elapsed_time": "5:50:23", "remaining_time": "1 day, 4:08:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1866, "total_steps": 10853, "loss": 0.1845, "learning_rate": 4.799588610683389e-06, "epoch": 0.17192610678582945, "percentage": 17.19, "elapsed_time": "5:50:35", "remaining_time": "1 day, 4:08:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1867, "total_steps": 10853, "loss": 0.1756, "learning_rate": 4.799289653135633e-06, "epoch": 0.17201824296309945, "percentage": 17.2, "elapsed_time": "5:50:45", "remaining_time": "1 day, 4:08:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1868, "total_steps": 10853, "loss": 0.1747, "learning_rate": 4.7989904820985854e-06, "epoch": 0.17211037914036947, "percentage": 17.21, "elapsed_time": "5:50:56", "remaining_time": "1 day, 4:07:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1869, "total_steps": 10853, "loss": 0.1783, "learning_rate": 4.798691097600024e-06, "epoch": 0.17220251531763947, "percentage": 17.22, "elapsed_time": "5:51:08", "remaining_time": "1 day, 4:07:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1870, "total_steps": 10853, "loss": 0.1806, "learning_rate": 4.798391499667747e-06, "epoch": 0.17229465149490947, "percentage": 17.23, "elapsed_time": "5:51:19", "remaining_time": "1 day, 4:07:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1871, "total_steps": 10853, "loss": 0.1792, "learning_rate": 4.798091688329572e-06, "epoch": 0.1723867876721795, "percentage": 17.24, "elapsed_time": "5:51:30", "remaining_time": "1 day, 4:07:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1872, "total_steps": 10853, "loss": 0.166, "learning_rate": 4.7977916636133365e-06, "epoch": 0.1724789238494495, "percentage": 17.25, "elapsed_time": "5:51:41", "remaining_time": "1 day, 4:07:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1873, "total_steps": 10853, "loss": 0.1624, "learning_rate": 4.797491425546898e-06, "epoch": 0.17257106002671949, "percentage": 17.26, "elapsed_time": "5:51:50", "remaining_time": "1 day, 4:06:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1874, "total_steps": 10853, "loss": 0.1804, "learning_rate": 4.797190974158133e-06, "epoch": 0.17266319620398948, "percentage": 17.27, "elapsed_time": "5:52:01", "remaining_time": "1 day, 4:06:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1875, "total_steps": 10853, "loss": 0.1924, "learning_rate": 4.796890309474938e-06, "epoch": 0.1727553323812595, "percentage": 17.28, "elapsed_time": "5:52:12", "remaining_time": "1 day, 4:06:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1876, "total_steps": 10853, "loss": 0.1717, "learning_rate": 4.796589431525232e-06, "epoch": 0.1728474685585295, "percentage": 17.29, "elapsed_time": "5:52:24", "remaining_time": "1 day, 4:06:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1877, "total_steps": 10853, "loss": 0.1824, "learning_rate": 4.796288340336949e-06, "epoch": 0.1729396047357995, "percentage": 17.29, "elapsed_time": "5:52:34", "remaining_time": "1 day, 4:06:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1878, "total_steps": 10853, "loss": 0.1598, "learning_rate": 4.795987035938047e-06, "epoch": 0.17303174091306953, "percentage": 17.3, "elapsed_time": "5:52:44", "remaining_time": "1 day, 4:05:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1879, "total_steps": 10853, "loss": 0.176, "learning_rate": 4.795685518356501e-06, "epoch": 0.17312387709033952, "percentage": 17.31, "elapsed_time": "5:52:53", "remaining_time": "1 day, 4:05:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1880, "total_steps": 10853, "loss": 0.1622, "learning_rate": 4.795383787620308e-06, "epoch": 0.17321601326760952, "percentage": 17.32, "elapsed_time": "5:53:03", "remaining_time": "1 day, 4:05:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1881, "total_steps": 10853, "loss": 0.1579, "learning_rate": 4.795081843757483e-06, "epoch": 0.17330814944487954, "percentage": 17.33, "elapsed_time": "5:53:13", "remaining_time": "1 day, 4:04:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1882, "total_steps": 10853, "loss": 0.166, "learning_rate": 4.794779686796062e-06, "epoch": 0.17340028562214954, "percentage": 17.34, "elapsed_time": "5:53:24", "remaining_time": "1 day, 4:04:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1883, "total_steps": 10853, "loss": 0.1842, "learning_rate": 4.794477316764101e-06, "epoch": 0.17349242179941954, "percentage": 17.35, "elapsed_time": "5:53:35", "remaining_time": "1 day, 4:04:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1884, "total_steps": 10853, "loss": 0.1672, "learning_rate": 4.794174733689672e-06, "epoch": 0.17358455797668954, "percentage": 17.36, "elapsed_time": "5:53:45", "remaining_time": "1 day, 4:04:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1885, "total_steps": 10853, "loss": 0.1689, "learning_rate": 4.793871937600874e-06, "epoch": 0.17367669415395956, "percentage": 17.37, "elapsed_time": "5:53:57", "remaining_time": "1 day, 4:03:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1886, "total_steps": 10853, "loss": 0.1695, "learning_rate": 4.7935689285258195e-06, "epoch": 0.17376883033122956, "percentage": 17.38, "elapsed_time": "5:54:08", "remaining_time": "1 day, 4:03:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1887, "total_steps": 10853, "loss": 0.175, "learning_rate": 4.793265706492643e-06, "epoch": 0.17386096650849955, "percentage": 17.39, "elapsed_time": "5:54:19", "remaining_time": "1 day, 4:03:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1888, "total_steps": 10853, "loss": 0.1694, "learning_rate": 4.792962271529499e-06, "epoch": 0.17395310268576958, "percentage": 17.4, "elapsed_time": "5:54:31", "remaining_time": "1 day, 4:03:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1889, "total_steps": 10853, "loss": 0.1788, "learning_rate": 4.792658623664561e-06, "epoch": 0.17404523886303958, "percentage": 17.41, "elapsed_time": "5:54:40", "remaining_time": "1 day, 4:03:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1890, "total_steps": 10853, "loss": 0.1604, "learning_rate": 4.792354762926023e-06, "epoch": 0.17413737504030957, "percentage": 17.41, "elapsed_time": "5:54:51", "remaining_time": "1 day, 4:02:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1891, "total_steps": 10853, "loss": 0.1882, "learning_rate": 4.792050689342098e-06, "epoch": 0.17422951121757957, "percentage": 17.42, "elapsed_time": "5:55:03", "remaining_time": "1 day, 4:02:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1892, "total_steps": 10853, "loss": 0.1583, "learning_rate": 4.791746402941021e-06, "epoch": 0.1743216473948496, "percentage": 17.43, "elapsed_time": "5:55:14", "remaining_time": "1 day, 4:02:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1893, "total_steps": 10853, "loss": 0.1835, "learning_rate": 4.791441903751043e-06, "epoch": 0.1744137835721196, "percentage": 17.44, "elapsed_time": "5:55:25", "remaining_time": "1 day, 4:02:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1894, "total_steps": 10853, "loss": 0.1817, "learning_rate": 4.791137191800438e-06, "epoch": 0.1745059197493896, "percentage": 17.45, "elapsed_time": "5:55:37", "remaining_time": "1 day, 4:02:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1895, "total_steps": 10853, "loss": 0.1633, "learning_rate": 4.790832267117498e-06, "epoch": 0.1745980559266596, "percentage": 17.46, "elapsed_time": "5:55:48", "remaining_time": "1 day, 4:01:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1896, "total_steps": 10853, "loss": 0.1825, "learning_rate": 4.790527129730536e-06, "epoch": 0.1746901921039296, "percentage": 17.47, "elapsed_time": "5:55:59", "remaining_time": "1 day, 4:01:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1897, "total_steps": 10853, "loss": 0.1834, "learning_rate": 4.790221779667883e-06, "epoch": 0.1747823282811996, "percentage": 17.48, "elapsed_time": "5:56:10", "remaining_time": "1 day, 4:01:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1898, "total_steps": 10853, "loss": 0.1793, "learning_rate": 4.789916216957892e-06, "epoch": 0.17487446445846963, "percentage": 17.49, "elapsed_time": "5:56:19", "remaining_time": "1 day, 4:01:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1899, "total_steps": 10853, "loss": 0.1805, "learning_rate": 4.789610441628932e-06, "epoch": 0.17496660063573963, "percentage": 17.5, "elapsed_time": "5:56:30", "remaining_time": "1 day, 4:00:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1900, "total_steps": 10853, "loss": 0.1692, "learning_rate": 4.789304453709398e-06, "epoch": 0.17505873681300962, "percentage": 17.51, "elapsed_time": "5:56:41", "remaining_time": "1 day, 4:00:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1901, "total_steps": 10853, "loss": 0.1774, "learning_rate": 4.788998253227698e-06, "epoch": 0.17515087299027962, "percentage": 17.52, "elapsed_time": "5:56:53", "remaining_time": "1 day, 4:00:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1902, "total_steps": 10853, "loss": 0.1696, "learning_rate": 4.788691840212264e-06, "epoch": 0.17524300916754965, "percentage": 17.53, "elapsed_time": "5:57:04", "remaining_time": "1 day, 4:00:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1903, "total_steps": 10853, "loss": 0.1758, "learning_rate": 4.788385214691546e-06, "epoch": 0.17533514534481964, "percentage": 17.53, "elapsed_time": "5:57:15", "remaining_time": "1 day, 4:00:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1904, "total_steps": 10853, "loss": 0.18, "learning_rate": 4.788078376694017e-06, "epoch": 0.17542728152208964, "percentage": 17.54, "elapsed_time": "5:57:26", "remaining_time": "1 day, 4:00:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1905, "total_steps": 10853, "loss": 0.1738, "learning_rate": 4.787771326248162e-06, "epoch": 0.17551941769935966, "percentage": 17.55, "elapsed_time": "5:57:38", "remaining_time": "1 day, 3:59:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1906, "total_steps": 10853, "loss": 0.157, "learning_rate": 4.787464063382493e-06, "epoch": 0.17561155387662966, "percentage": 17.56, "elapsed_time": "5:57:47", "remaining_time": "1 day, 3:59:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1907, "total_steps": 10853, "loss": 0.1738, "learning_rate": 4.787156588125541e-06, "epoch": 0.17570369005389966, "percentage": 17.57, "elapsed_time": "5:57:57", "remaining_time": "1 day, 3:59:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1908, "total_steps": 10853, "loss": 0.197, "learning_rate": 4.786848900505852e-06, "epoch": 0.17579582623116966, "percentage": 17.58, "elapsed_time": "5:58:08", "remaining_time": "1 day, 3:58:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1909, "total_steps": 10853, "loss": 0.1709, "learning_rate": 4.786541000551997e-06, "epoch": 0.17588796240843968, "percentage": 17.59, "elapsed_time": "5:58:19", "remaining_time": "1 day, 3:58:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1910, "total_steps": 10853, "loss": 0.1696, "learning_rate": 4.786232888292564e-06, "epoch": 0.17598009858570968, "percentage": 17.6, "elapsed_time": "5:58:28", "remaining_time": "1 day, 3:58:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1911, "total_steps": 10853, "loss": 0.1778, "learning_rate": 4.785924563756162e-06, "epoch": 0.17607223476297967, "percentage": 17.61, "elapsed_time": "5:58:38", "remaining_time": "1 day, 3:58:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1912, "total_steps": 10853, "loss": 0.1802, "learning_rate": 4.785616026971418e-06, "epoch": 0.1761643709402497, "percentage": 17.62, "elapsed_time": "5:58:50", "remaining_time": "1 day, 3:58:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1913, "total_steps": 10853, "loss": 0.1735, "learning_rate": 4.78530727796698e-06, "epoch": 0.1762565071175197, "percentage": 17.63, "elapsed_time": "5:59:00", "remaining_time": "1 day, 3:57:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1914, "total_steps": 10853, "loss": 0.1739, "learning_rate": 4.784998316771515e-06, "epoch": 0.1763486432947897, "percentage": 17.64, "elapsed_time": "5:59:10", "remaining_time": "1 day, 3:57:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1915, "total_steps": 10853, "loss": 0.1829, "learning_rate": 4.784689143413711e-06, "epoch": 0.17644077947205972, "percentage": 17.64, "elapsed_time": "5:59:21", "remaining_time": "1 day, 3:57:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1916, "total_steps": 10853, "loss": 0.1647, "learning_rate": 4.784379757922273e-06, "epoch": 0.1765329156493297, "percentage": 17.65, "elapsed_time": "5:59:31", "remaining_time": "1 day, 3:56:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1917, "total_steps": 10853, "loss": 0.183, "learning_rate": 4.78407016032593e-06, "epoch": 0.1766250518265997, "percentage": 17.66, "elapsed_time": "5:59:41", "remaining_time": "1 day, 3:56:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1918, "total_steps": 10853, "loss": 0.1575, "learning_rate": 4.783760350653426e-06, "epoch": 0.1767171880038697, "percentage": 17.67, "elapsed_time": "5:59:52", "remaining_time": "1 day, 3:56:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1919, "total_steps": 10853, "loss": 0.1746, "learning_rate": 4.783450328933527e-06, "epoch": 0.17680932418113973, "percentage": 17.68, "elapsed_time": "6:00:03", "remaining_time": "1 day, 3:56:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1920, "total_steps": 10853, "loss": 0.1945, "learning_rate": 4.78314009519502e-06, "epoch": 0.17690146035840973, "percentage": 17.69, "elapsed_time": "6:00:14", "remaining_time": "1 day, 3:56:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1921, "total_steps": 10853, "loss": 0.1613, "learning_rate": 4.782829649466709e-06, "epoch": 0.17699359653567973, "percentage": 17.7, "elapsed_time": "6:00:25", "remaining_time": "1 day, 3:55:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1922, "total_steps": 10853, "loss": 0.1661, "learning_rate": 4.78251899177742e-06, "epoch": 0.17708573271294975, "percentage": 17.71, "elapsed_time": "6:00:36", "remaining_time": "1 day, 3:55:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1923, "total_steps": 10853, "loss": 0.1866, "learning_rate": 4.7822081221559965e-06, "epoch": 0.17717786889021975, "percentage": 17.72, "elapsed_time": "6:00:47", "remaining_time": "1 day, 3:55:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1924, "total_steps": 10853, "loss": 0.1652, "learning_rate": 4.781897040631304e-06, "epoch": 0.17727000506748974, "percentage": 17.73, "elapsed_time": "6:00:59", "remaining_time": "1 day, 3:55:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1925, "total_steps": 10853, "loss": 0.1963, "learning_rate": 4.781585747232224e-06, "epoch": 0.17736214124475974, "percentage": 17.74, "elapsed_time": "6:01:09", "remaining_time": "1 day, 3:55:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1926, "total_steps": 10853, "loss": 0.1687, "learning_rate": 4.781274241987664e-06, "epoch": 0.17745427742202977, "percentage": 17.75, "elapsed_time": "6:01:20", "remaining_time": "1 day, 3:54:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1927, "total_steps": 10853, "loss": 0.1633, "learning_rate": 4.7809625249265436e-06, "epoch": 0.17754641359929976, "percentage": 17.76, "elapsed_time": "6:01:30", "remaining_time": "1 day, 3:54:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1928, "total_steps": 10853, "loss": 0.1839, "learning_rate": 4.780650596077808e-06, "epoch": 0.17763854977656976, "percentage": 17.76, "elapsed_time": "6:01:42", "remaining_time": "1 day, 3:54:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1929, "total_steps": 10853, "loss": 0.1784, "learning_rate": 4.780338455470419e-06, "epoch": 0.17773068595383978, "percentage": 17.77, "elapsed_time": "6:01:52", "remaining_time": "1 day, 3:54:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1930, "total_steps": 10853, "loss": 0.1671, "learning_rate": 4.780026103133358e-06, "epoch": 0.17782282213110978, "percentage": 17.78, "elapsed_time": "6:02:03", "remaining_time": "1 day, 3:53:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1931, "total_steps": 10853, "loss": 0.1667, "learning_rate": 4.7797135390956294e-06, "epoch": 0.17791495830837978, "percentage": 17.79, "elapsed_time": "6:02:13", "remaining_time": "1 day, 3:53:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1932, "total_steps": 10853, "loss": 0.1912, "learning_rate": 4.779400763386253e-06, "epoch": 0.1780070944856498, "percentage": 17.8, "elapsed_time": "6:02:24", "remaining_time": "1 day, 3:53:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1933, "total_steps": 10853, "loss": 0.1753, "learning_rate": 4.77908777603427e-06, "epoch": 0.1780992306629198, "percentage": 17.81, "elapsed_time": "6:02:35", "remaining_time": "1 day, 3:53:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1934, "total_steps": 10853, "loss": 0.1856, "learning_rate": 4.778774577068741e-06, "epoch": 0.1781913668401898, "percentage": 17.82, "elapsed_time": "6:02:45", "remaining_time": "1 day, 3:52:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1935, "total_steps": 10853, "loss": 0.162, "learning_rate": 4.778461166518748e-06, "epoch": 0.1782835030174598, "percentage": 17.83, "elapsed_time": "6:02:55", "remaining_time": "1 day, 3:52:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1936, "total_steps": 10853, "loss": 0.1728, "learning_rate": 4.778147544413392e-06, "epoch": 0.17837563919472982, "percentage": 17.84, "elapsed_time": "6:03:06", "remaining_time": "1 day, 3:52:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1937, "total_steps": 10853, "loss": 0.1957, "learning_rate": 4.777833710781789e-06, "epoch": 0.17846777537199982, "percentage": 17.85, "elapsed_time": "6:03:17", "remaining_time": "1 day, 3:52:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1938, "total_steps": 10853, "loss": 0.1878, "learning_rate": 4.777519665653082e-06, "epoch": 0.1785599115492698, "percentage": 17.86, "elapsed_time": "6:03:28", "remaining_time": "1 day, 3:52:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1939, "total_steps": 10853, "loss": 0.1779, "learning_rate": 4.777205409056429e-06, "epoch": 0.17865204772653984, "percentage": 17.87, "elapsed_time": "6:03:39", "remaining_time": "1 day, 3:51:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1940, "total_steps": 10853, "loss": 0.2017, "learning_rate": 4.776890941021008e-06, "epoch": 0.17874418390380983, "percentage": 17.88, "elapsed_time": "6:03:49", "remaining_time": "1 day, 3:51:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1941, "total_steps": 10853, "loss": 0.1722, "learning_rate": 4.776576261576018e-06, "epoch": 0.17883632008107983, "percentage": 17.88, "elapsed_time": "6:04:00", "remaining_time": "1 day, 3:51:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1942, "total_steps": 10853, "loss": 0.1706, "learning_rate": 4.776261370750678e-06, "epoch": 0.17892845625834983, "percentage": 17.89, "elapsed_time": "6:04:10", "remaining_time": "1 day, 3:51:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1943, "total_steps": 10853, "loss": 0.1763, "learning_rate": 4.775946268574224e-06, "epoch": 0.17902059243561985, "percentage": 17.9, "elapsed_time": "6:04:22", "remaining_time": "1 day, 3:50:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1944, "total_steps": 10853, "loss": 0.1992, "learning_rate": 4.775630955075915e-06, "epoch": 0.17911272861288985, "percentage": 17.91, "elapsed_time": "6:04:34", "remaining_time": "1 day, 3:50:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1945, "total_steps": 10853, "loss": 0.1981, "learning_rate": 4.775315430285026e-06, "epoch": 0.17920486479015985, "percentage": 17.92, "elapsed_time": "6:04:44", "remaining_time": "1 day, 3:50:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1946, "total_steps": 10853, "loss": 0.1888, "learning_rate": 4.7749996942308546e-06, "epoch": 0.17929700096742987, "percentage": 17.93, "elapsed_time": "6:04:54", "remaining_time": "1 day, 3:50:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1947, "total_steps": 10853, "loss": 0.1842, "learning_rate": 4.774683746942717e-06, "epoch": 0.17938913714469987, "percentage": 17.94, "elapsed_time": "6:05:07", "remaining_time": "1 day, 3:50:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1948, "total_steps": 10853, "loss": 0.1578, "learning_rate": 4.774367588449948e-06, "epoch": 0.17948127332196986, "percentage": 17.95, "elapsed_time": "6:05:19", "remaining_time": "1 day, 3:50:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1949, "total_steps": 10853, "loss": 0.1632, "learning_rate": 4.774051218781904e-06, "epoch": 0.1795734094992399, "percentage": 17.96, "elapsed_time": "6:05:29", "remaining_time": "1 day, 3:49:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1950, "total_steps": 10853, "loss": 0.1786, "learning_rate": 4.77373463796796e-06, "epoch": 0.17966554567650989, "percentage": 17.97, "elapsed_time": "6:05:40", "remaining_time": "1 day, 3:49:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1951, "total_steps": 10853, "loss": 0.1657, "learning_rate": 4.7734178460375105e-06, "epoch": 0.17975768185377988, "percentage": 17.98, "elapsed_time": "6:05:50", "remaining_time": "1 day, 3:49:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1952, "total_steps": 10853, "loss": 0.1662, "learning_rate": 4.773100843019969e-06, "epoch": 0.17984981803104988, "percentage": 17.99, "elapsed_time": "6:06:00", "remaining_time": "1 day, 3:48:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1953, "total_steps": 10853, "loss": 0.1815, "learning_rate": 4.7727836289447685e-06, "epoch": 0.1799419542083199, "percentage": 18.0, "elapsed_time": "6:06:12", "remaining_time": "1 day, 3:48:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1954, "total_steps": 10853, "loss": 0.1805, "learning_rate": 4.7724662038413646e-06, "epoch": 0.1800340903855899, "percentage": 18.0, "elapsed_time": "6:06:22", "remaining_time": "1 day, 3:48:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1955, "total_steps": 10853, "loss": 0.172, "learning_rate": 4.772148567739229e-06, "epoch": 0.1801262265628599, "percentage": 18.01, "elapsed_time": "6:06:33", "remaining_time": "1 day, 3:48:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1956, "total_steps": 10853, "loss": 0.1828, "learning_rate": 4.7718307206678535e-06, "epoch": 0.18021836274012992, "percentage": 18.02, "elapsed_time": "6:06:43", "remaining_time": "1 day, 3:48:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1957, "total_steps": 10853, "loss": 0.1541, "learning_rate": 4.7715126626567525e-06, "epoch": 0.18031049891739992, "percentage": 18.03, "elapsed_time": "6:06:53", "remaining_time": "1 day, 3:47:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1958, "total_steps": 10853, "loss": 0.1751, "learning_rate": 4.7711943937354555e-06, "epoch": 0.18040263509466992, "percentage": 18.04, "elapsed_time": "6:07:04", "remaining_time": "1 day, 3:47:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1959, "total_steps": 10853, "loss": 0.1851, "learning_rate": 4.770875913933515e-06, "epoch": 0.18049477127193994, "percentage": 18.05, "elapsed_time": "6:07:15", "remaining_time": "1 day, 3:47:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1960, "total_steps": 10853, "loss": 0.1919, "learning_rate": 4.770557223280501e-06, "epoch": 0.18058690744920994, "percentage": 18.06, "elapsed_time": "6:07:28", "remaining_time": "1 day, 3:47:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1961, "total_steps": 10853, "loss": 0.1772, "learning_rate": 4.7702383218060044e-06, "epoch": 0.18067904362647993, "percentage": 18.07, "elapsed_time": "6:07:40", "remaining_time": "1 day, 3:47:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1962, "total_steps": 10853, "loss": 0.2, "learning_rate": 4.769919209539635e-06, "epoch": 0.18077117980374993, "percentage": 18.08, "elapsed_time": "6:07:51", "remaining_time": "1 day, 3:47:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1963, "total_steps": 10853, "loss": 0.1847, "learning_rate": 4.769599886511024e-06, "epoch": 0.18086331598101996, "percentage": 18.09, "elapsed_time": "6:08:02", "remaining_time": "1 day, 3:46:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1964, "total_steps": 10853, "loss": 0.1636, "learning_rate": 4.769280352749817e-06, "epoch": 0.18095545215828995, "percentage": 18.1, "elapsed_time": "6:08:13", "remaining_time": "1 day, 3:46:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1965, "total_steps": 10853, "loss": 0.1729, "learning_rate": 4.768960608285688e-06, "epoch": 0.18104758833555995, "percentage": 18.11, "elapsed_time": "6:08:23", "remaining_time": "1 day, 3:46:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1966, "total_steps": 10853, "loss": 0.1748, "learning_rate": 4.76864065314832e-06, "epoch": 0.18113972451282997, "percentage": 18.11, "elapsed_time": "6:08:34", "remaining_time": "1 day, 3:46:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1967, "total_steps": 10853, "loss": 0.1683, "learning_rate": 4.768320487367424e-06, "epoch": 0.18123186069009997, "percentage": 18.12, "elapsed_time": "6:08:44", "remaining_time": "1 day, 3:45:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1968, "total_steps": 10853, "loss": 0.1689, "learning_rate": 4.768000110972727e-06, "epoch": 0.18132399686736997, "percentage": 18.13, "elapsed_time": "6:08:54", "remaining_time": "1 day, 3:45:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1969, "total_steps": 10853, "loss": 0.1883, "learning_rate": 4.767679523993976e-06, "epoch": 0.18141613304463997, "percentage": 18.14, "elapsed_time": "6:09:05", "remaining_time": "1 day, 3:45:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1970, "total_steps": 10853, "loss": 0.1605, "learning_rate": 4.767358726460936e-06, "epoch": 0.18150826922191, "percentage": 18.15, "elapsed_time": "6:09:15", "remaining_time": "1 day, 3:45:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1971, "total_steps": 10853, "loss": 0.1687, "learning_rate": 4.7670377184033944e-06, "epoch": 0.18160040539918, "percentage": 18.16, "elapsed_time": "6:09:27", "remaining_time": "1 day, 3:44:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1972, "total_steps": 10853, "loss": 0.1911, "learning_rate": 4.7667164998511574e-06, "epoch": 0.18169254157644998, "percentage": 18.17, "elapsed_time": "6:09:39", "remaining_time": "1 day, 3:44:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1973, "total_steps": 10853, "loss": 0.1783, "learning_rate": 4.766395070834049e-06, "epoch": 0.18178467775372, "percentage": 18.18, "elapsed_time": "6:09:49", "remaining_time": "1 day, 3:44:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1974, "total_steps": 10853, "loss": 0.1666, "learning_rate": 4.7660734313819135e-06, "epoch": 0.18187681393099, "percentage": 18.19, "elapsed_time": "6:10:01", "remaining_time": "1 day, 3:44:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1975, "total_steps": 10853, "loss": 0.1551, "learning_rate": 4.765751581524617e-06, "epoch": 0.18196895010826, "percentage": 18.2, "elapsed_time": "6:10:10", "remaining_time": "1 day, 3:44:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1976, "total_steps": 10853, "loss": 0.1812, "learning_rate": 4.765429521292042e-06, "epoch": 0.18206108628553003, "percentage": 18.21, "elapsed_time": "6:10:22", "remaining_time": "1 day, 3:43:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1977, "total_steps": 10853, "loss": 0.17, "learning_rate": 4.765107250714093e-06, "epoch": 0.18215322246280002, "percentage": 18.22, "elapsed_time": "6:10:33", "remaining_time": "1 day, 3:43:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1978, "total_steps": 10853, "loss": 0.1843, "learning_rate": 4.764784769820691e-06, "epoch": 0.18224535864007002, "percentage": 18.23, "elapsed_time": "6:10:44", "remaining_time": "1 day, 3:43:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1979, "total_steps": 10853, "loss": 0.1797, "learning_rate": 4.76446207864178e-06, "epoch": 0.18233749481734002, "percentage": 18.23, "elapsed_time": "6:10:55", "remaining_time": "1 day, 3:43:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1980, "total_steps": 10853, "loss": 0.187, "learning_rate": 4.764139177207321e-06, "epoch": 0.18242963099461004, "percentage": 18.24, "elapsed_time": "6:11:06", "remaining_time": "1 day, 3:43:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1981, "total_steps": 10853, "loss": 0.1686, "learning_rate": 4.763816065547295e-06, "epoch": 0.18252176717188004, "percentage": 18.25, "elapsed_time": "6:11:17", "remaining_time": "1 day, 3:42:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1982, "total_steps": 10853, "loss": 0.1591, "learning_rate": 4.763492743691705e-06, "epoch": 0.18261390334915004, "percentage": 18.26, "elapsed_time": "6:11:28", "remaining_time": "1 day, 3:42:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1983, "total_steps": 10853, "loss": 0.176, "learning_rate": 4.7631692116705695e-06, "epoch": 0.18270603952642006, "percentage": 18.27, "elapsed_time": "6:11:39", "remaining_time": "1 day, 3:42:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1984, "total_steps": 10853, "loss": 0.1638, "learning_rate": 4.76284546951393e-06, "epoch": 0.18279817570369006, "percentage": 18.28, "elapsed_time": "6:11:49", "remaining_time": "1 day, 3:42:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1985, "total_steps": 10853, "loss": 0.1889, "learning_rate": 4.762521517251844e-06, "epoch": 0.18289031188096005, "percentage": 18.29, "elapsed_time": "6:12:00", "remaining_time": "1 day, 3:41:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1986, "total_steps": 10853, "loss": 0.1789, "learning_rate": 4.762197354914391e-06, "epoch": 0.18298244805823005, "percentage": 18.3, "elapsed_time": "6:12:12", "remaining_time": "1 day, 3:41:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1987, "total_steps": 10853, "loss": 0.188, "learning_rate": 4.761872982531671e-06, "epoch": 0.18307458423550008, "percentage": 18.31, "elapsed_time": "6:12:23", "remaining_time": "1 day, 3:41:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1988, "total_steps": 10853, "loss": 0.1727, "learning_rate": 4.761548400133801e-06, "epoch": 0.18316672041277007, "percentage": 18.32, "elapsed_time": "6:12:33", "remaining_time": "1 day, 3:41:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1989, "total_steps": 10853, "loss": 0.1821, "learning_rate": 4.761223607750919e-06, "epoch": 0.18325885659004007, "percentage": 18.33, "elapsed_time": "6:12:43", "remaining_time": "1 day, 3:41:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1990, "total_steps": 10853, "loss": 0.1953, "learning_rate": 4.760898605413182e-06, "epoch": 0.1833509927673101, "percentage": 18.34, "elapsed_time": "6:12:54", "remaining_time": "1 day, 3:40:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1991, "total_steps": 10853, "loss": 0.1682, "learning_rate": 4.760573393150766e-06, "epoch": 0.1834431289445801, "percentage": 18.35, "elapsed_time": "6:13:05", "remaining_time": "1 day, 3:40:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1992, "total_steps": 10853, "loss": 0.187, "learning_rate": 4.760247970993867e-06, "epoch": 0.1835352651218501, "percentage": 18.35, "elapsed_time": "6:13:14", "remaining_time": "1 day, 3:40:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1993, "total_steps": 10853, "loss": 0.166, "learning_rate": 4.7599223389727e-06, "epoch": 0.1836274012991201, "percentage": 18.36, "elapsed_time": "6:13:24", "remaining_time": "1 day, 3:40:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1994, "total_steps": 10853, "loss": 0.1621, "learning_rate": 4.759596497117501e-06, "epoch": 0.1837195374763901, "percentage": 18.37, "elapsed_time": "6:13:33", "remaining_time": "1 day, 3:39:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1995, "total_steps": 10853, "loss": 0.186, "learning_rate": 4.759270445458524e-06, "epoch": 0.1838116736536601, "percentage": 18.38, "elapsed_time": "6:13:44", "remaining_time": "1 day, 3:39:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1996, "total_steps": 10853, "loss": 0.1755, "learning_rate": 4.758944184026043e-06, "epoch": 0.1839038098309301, "percentage": 18.39, "elapsed_time": "6:13:54", "remaining_time": "1 day, 3:39:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1997, "total_steps": 10853, "loss": 0.1656, "learning_rate": 4.758617712850352e-06, "epoch": 0.18399594600820013, "percentage": 18.4, "elapsed_time": "6:14:05", "remaining_time": "1 day, 3:38:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1998, "total_steps": 10853, "loss": 0.1774, "learning_rate": 4.758291031961763e-06, "epoch": 0.18408808218547013, "percentage": 18.41, "elapsed_time": "6:14:16", "remaining_time": "1 day, 3:38:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1999, "total_steps": 10853, "loss": 0.1779, "learning_rate": 4.757964141390609e-06, "epoch": 0.18418021836274012, "percentage": 18.42, "elapsed_time": "6:14:27", "remaining_time": "1 day, 3:38:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2000, "total_steps": 10853, "loss": 0.1701, "learning_rate": 4.75763704116724e-06, "epoch": 0.18427235454001015, "percentage": 18.43, "elapsed_time": "6:14:38", "remaining_time": "1 day, 3:38:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2000, "total_steps": 10853, "eval_loss": 0.1747845858335495, "epoch": 0.18427235454001015, "percentage": 18.43, "elapsed_time": "6:19:37", "remaining_time": "1 day, 4:00:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2001, "total_steps": 10853, "loss": 0.1766, "learning_rate": 4.757309731322029e-06, "epoch": 0.18436449071728014, "percentage": 18.44, "elapsed_time": "6:19:48", "remaining_time": "1 day, 4:00:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2002, "total_steps": 10853, "loss": 0.185, "learning_rate": 4.756982211885368e-06, "epoch": 0.18445662689455014, "percentage": 18.45, "elapsed_time": "6:19:59", "remaining_time": "1 day, 3:59:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2003, "total_steps": 10853, "loss": 0.1629, "learning_rate": 4.756654482887665e-06, "epoch": 0.18454876307182014, "percentage": 18.46, "elapsed_time": "6:20:09", "remaining_time": "1 day, 3:59:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2004, "total_steps": 10853, "loss": 0.1677, "learning_rate": 4.756326544359351e-06, "epoch": 0.18464089924909016, "percentage": 18.46, "elapsed_time": "6:20:20", "remaining_time": "1 day, 3:59:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2005, "total_steps": 10853, "loss": 0.159, "learning_rate": 4.7559983963308735e-06, "epoch": 0.18473303542636016, "percentage": 18.47, "elapsed_time": "6:20:32", "remaining_time": "1 day, 3:59:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2006, "total_steps": 10853, "loss": 0.1657, "learning_rate": 4.755670038832703e-06, "epoch": 0.18482517160363016, "percentage": 18.48, "elapsed_time": "6:20:40", "remaining_time": "1 day, 3:58:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2007, "total_steps": 10853, "loss": 0.1813, "learning_rate": 4.755341471895325e-06, "epoch": 0.18491730778090018, "percentage": 18.49, "elapsed_time": "6:20:51", "remaining_time": "1 day, 3:58:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2008, "total_steps": 10853, "loss": 0.1655, "learning_rate": 4.75501269554925e-06, "epoch": 0.18500944395817018, "percentage": 18.5, "elapsed_time": "6:21:01", "remaining_time": "1 day, 3:58:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2009, "total_steps": 10853, "loss": 0.1762, "learning_rate": 4.754683709825003e-06, "epoch": 0.18510158013544017, "percentage": 18.51, "elapsed_time": "6:21:12", "remaining_time": "1 day, 3:58:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2010, "total_steps": 10853, "loss": 0.1677, "learning_rate": 4.7543545147531314e-06, "epoch": 0.1851937163127102, "percentage": 18.52, "elapsed_time": "6:21:23", "remaining_time": "1 day, 3:57:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2011, "total_steps": 10853, "loss": 0.1648, "learning_rate": 4.754025110364201e-06, "epoch": 0.1852858524899802, "percentage": 18.53, "elapsed_time": "6:21:32", "remaining_time": "1 day, 3:57:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2012, "total_steps": 10853, "loss": 0.1641, "learning_rate": 4.753695496688795e-06, "epoch": 0.1853779886672502, "percentage": 18.54, "elapsed_time": "6:21:44", "remaining_time": "1 day, 3:57:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2013, "total_steps": 10853, "loss": 0.1783, "learning_rate": 4.753365673757521e-06, "epoch": 0.1854701248445202, "percentage": 18.55, "elapsed_time": "6:21:55", "remaining_time": "1 day, 3:57:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2014, "total_steps": 10853, "loss": 0.1584, "learning_rate": 4.7530356416010004e-06, "epoch": 0.18556226102179021, "percentage": 18.56, "elapsed_time": "6:22:05", "remaining_time": "1 day, 3:56:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2015, "total_steps": 10853, "loss": 0.1692, "learning_rate": 4.7527054002498785e-06, "epoch": 0.1856543971990602, "percentage": 18.57, "elapsed_time": "6:22:17", "remaining_time": "1 day, 3:56:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2016, "total_steps": 10853, "loss": 0.1764, "learning_rate": 4.752374949734818e-06, "epoch": 0.1857465333763302, "percentage": 18.58, "elapsed_time": "6:22:28", "remaining_time": "1 day, 3:56:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2017, "total_steps": 10853, "loss": 0.174, "learning_rate": 4.752044290086501e-06, "epoch": 0.18583866955360023, "percentage": 18.58, "elapsed_time": "6:22:38", "remaining_time": "1 day, 3:56:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2018, "total_steps": 10853, "loss": 0.1584, "learning_rate": 4.75171342133563e-06, "epoch": 0.18593080573087023, "percentage": 18.59, "elapsed_time": "6:22:48", "remaining_time": "1 day, 3:55:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2019, "total_steps": 10853, "loss": 0.1765, "learning_rate": 4.751382343512924e-06, "epoch": 0.18602294190814023, "percentage": 18.6, "elapsed_time": "6:23:00", "remaining_time": "1 day, 3:55:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2020, "total_steps": 10853, "loss": 0.1754, "learning_rate": 4.751051056649126e-06, "epoch": 0.18611507808541022, "percentage": 18.61, "elapsed_time": "6:23:11", "remaining_time": "1 day, 3:55:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2021, "total_steps": 10853, "loss": 0.1713, "learning_rate": 4.750719560774994e-06, "epoch": 0.18620721426268025, "percentage": 18.62, "elapsed_time": "6:23:21", "remaining_time": "1 day, 3:55:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2022, "total_steps": 10853, "loss": 0.1624, "learning_rate": 4.75038785592131e-06, "epoch": 0.18629935043995025, "percentage": 18.63, "elapsed_time": "6:23:32", "remaining_time": "1 day, 3:55:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2023, "total_steps": 10853, "loss": 0.1772, "learning_rate": 4.750055942118871e-06, "epoch": 0.18639148661722024, "percentage": 18.64, "elapsed_time": "6:23:42", "remaining_time": "1 day, 3:54:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2024, "total_steps": 10853, "loss": 0.1693, "learning_rate": 4.749723819398496e-06, "epoch": 0.18648362279449027, "percentage": 18.65, "elapsed_time": "6:23:53", "remaining_time": "1 day, 3:54:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2025, "total_steps": 10853, "loss": 0.167, "learning_rate": 4.749391487791021e-06, "epoch": 0.18657575897176026, "percentage": 18.66, "elapsed_time": "6:24:05", "remaining_time": "1 day, 3:54:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2026, "total_steps": 10853, "loss": 0.1675, "learning_rate": 4.749058947327306e-06, "epoch": 0.18666789514903026, "percentage": 18.67, "elapsed_time": "6:24:16", "remaining_time": "1 day, 3:54:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2027, "total_steps": 10853, "loss": 0.1686, "learning_rate": 4.7487261980382235e-06, "epoch": 0.18676003132630029, "percentage": 18.68, "elapsed_time": "6:24:27", "remaining_time": "1 day, 3:54:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2028, "total_steps": 10853, "loss": 0.1811, "learning_rate": 4.748393239954674e-06, "epoch": 0.18685216750357028, "percentage": 18.69, "elapsed_time": "6:24:39", "remaining_time": "1 day, 3:53:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2029, "total_steps": 10853, "loss": 0.1852, "learning_rate": 4.748060073107568e-06, "epoch": 0.18694430368084028, "percentage": 18.7, "elapsed_time": "6:24:49", "remaining_time": "1 day, 3:53:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2030, "total_steps": 10853, "loss": 0.1744, "learning_rate": 4.747726697527844e-06, "epoch": 0.18703643985811028, "percentage": 18.7, "elapsed_time": "6:24:58", "remaining_time": "1 day, 3:53:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2031, "total_steps": 10853, "loss": 0.1643, "learning_rate": 4.747393113246453e-06, "epoch": 0.1871285760353803, "percentage": 18.71, "elapsed_time": "6:25:09", "remaining_time": "1 day, 3:53:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2032, "total_steps": 10853, "loss": 0.1742, "learning_rate": 4.74705932029437e-06, "epoch": 0.1872207122126503, "percentage": 18.72, "elapsed_time": "6:25:20", "remaining_time": "1 day, 3:52:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2033, "total_steps": 10853, "loss": 0.166, "learning_rate": 4.746725318702587e-06, "epoch": 0.1873128483899203, "percentage": 18.73, "elapsed_time": "6:25:30", "remaining_time": "1 day, 3:52:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2034, "total_steps": 10853, "loss": 0.1829, "learning_rate": 4.746391108502116e-06, "epoch": 0.18740498456719032, "percentage": 18.74, "elapsed_time": "6:25:42", "remaining_time": "1 day, 3:52:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2035, "total_steps": 10853, "loss": 0.1662, "learning_rate": 4.7460566897239905e-06, "epoch": 0.18749712074446032, "percentage": 18.75, "elapsed_time": "6:25:54", "remaining_time": "1 day, 3:52:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2036, "total_steps": 10853, "loss": 0.1904, "learning_rate": 4.745722062399258e-06, "epoch": 0.1875892569217303, "percentage": 18.76, "elapsed_time": "6:26:05", "remaining_time": "1 day, 3:51:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2037, "total_steps": 10853, "loss": 0.1578, "learning_rate": 4.745387226558991e-06, "epoch": 0.1876813930990003, "percentage": 18.77, "elapsed_time": "6:26:15", "remaining_time": "1 day, 3:51:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2038, "total_steps": 10853, "loss": 0.1845, "learning_rate": 4.745052182234278e-06, "epoch": 0.18777352927627033, "percentage": 18.78, "elapsed_time": "6:26:27", "remaining_time": "1 day, 3:51:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2039, "total_steps": 10853, "loss": 0.1648, "learning_rate": 4.744716929456229e-06, "epoch": 0.18786566545354033, "percentage": 18.79, "elapsed_time": "6:26:38", "remaining_time": "1 day, 3:51:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2040, "total_steps": 10853, "loss": 0.1719, "learning_rate": 4.744381468255971e-06, "epoch": 0.18795780163081033, "percentage": 18.8, "elapsed_time": "6:26:50", "remaining_time": "1 day, 3:51:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2041, "total_steps": 10853, "loss": 0.1741, "learning_rate": 4.7440457986646525e-06, "epoch": 0.18804993780808035, "percentage": 18.81, "elapsed_time": "6:27:00", "remaining_time": "1 day, 3:50:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2042, "total_steps": 10853, "loss": 0.1623, "learning_rate": 4.743709920713439e-06, "epoch": 0.18814207398535035, "percentage": 18.82, "elapsed_time": "6:27:09", "remaining_time": "1 day, 3:50:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2043, "total_steps": 10853, "loss": 0.1722, "learning_rate": 4.743373834433519e-06, "epoch": 0.18823421016262035, "percentage": 18.82, "elapsed_time": "6:27:20", "remaining_time": "1 day, 3:50:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2044, "total_steps": 10853, "loss": 0.1874, "learning_rate": 4.743037539856097e-06, "epoch": 0.18832634633989037, "percentage": 18.83, "elapsed_time": "6:27:32", "remaining_time": "1 day, 3:50:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2045, "total_steps": 10853, "loss": 0.1707, "learning_rate": 4.742701037012397e-06, "epoch": 0.18841848251716037, "percentage": 18.84, "elapsed_time": "6:27:42", "remaining_time": "1 day, 3:49:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2046, "total_steps": 10853, "loss": 0.1754, "learning_rate": 4.7423643259336656e-06, "epoch": 0.18851061869443037, "percentage": 18.85, "elapsed_time": "6:27:54", "remaining_time": "1 day, 3:49:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2047, "total_steps": 10853, "loss": 0.1647, "learning_rate": 4.742027406651164e-06, "epoch": 0.18860275487170036, "percentage": 18.86, "elapsed_time": "6:28:03", "remaining_time": "1 day, 3:49:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2048, "total_steps": 10853, "loss": 0.1866, "learning_rate": 4.741690279196178e-06, "epoch": 0.1886948910489704, "percentage": 18.87, "elapsed_time": "6:28:14", "remaining_time": "1 day, 3:49:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2049, "total_steps": 10853, "loss": 0.1817, "learning_rate": 4.741352943600007e-06, "epoch": 0.18878702722624038, "percentage": 18.88, "elapsed_time": "6:28:25", "remaining_time": "1 day, 3:48:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2050, "total_steps": 10853, "loss": 0.176, "learning_rate": 4.741015399893974e-06, "epoch": 0.18887916340351038, "percentage": 18.89, "elapsed_time": "6:28:34", "remaining_time": "1 day, 3:48:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2051, "total_steps": 10853, "loss": 0.1825, "learning_rate": 4.740677648109421e-06, "epoch": 0.1889712995807804, "percentage": 18.9, "elapsed_time": "6:28:45", "remaining_time": "1 day, 3:48:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2052, "total_steps": 10853, "loss": 0.1708, "learning_rate": 4.740339688277707e-06, "epoch": 0.1890634357580504, "percentage": 18.91, "elapsed_time": "6:28:55", "remaining_time": "1 day, 3:48:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2053, "total_steps": 10853, "loss": 0.1527, "learning_rate": 4.7400015204302105e-06, "epoch": 0.1891555719353204, "percentage": 18.92, "elapsed_time": "6:29:04", "remaining_time": "1 day, 3:47:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2054, "total_steps": 10853, "loss": 0.1734, "learning_rate": 4.739663144598333e-06, "epoch": 0.1892477081125904, "percentage": 18.93, "elapsed_time": "6:29:14", "remaining_time": "1 day, 3:47:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2055, "total_steps": 10853, "loss": 0.1641, "learning_rate": 4.739324560813491e-06, "epoch": 0.18933984428986042, "percentage": 18.93, "elapsed_time": "6:29:26", "remaining_time": "1 day, 3:47:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2056, "total_steps": 10853, "loss": 0.2055, "learning_rate": 4.738985769107123e-06, "epoch": 0.18943198046713042, "percentage": 18.94, "elapsed_time": "6:29:37", "remaining_time": "1 day, 3:47:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2057, "total_steps": 10853, "loss": 0.1707, "learning_rate": 4.738646769510685e-06, "epoch": 0.18952411664440041, "percentage": 18.95, "elapsed_time": "6:29:49", "remaining_time": "1 day, 3:46:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2058, "total_steps": 10853, "loss": 0.1777, "learning_rate": 4.738307562055653e-06, "epoch": 0.18961625282167044, "percentage": 18.96, "elapsed_time": "6:29:58", "remaining_time": "1 day, 3:46:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2059, "total_steps": 10853, "loss": 0.1703, "learning_rate": 4.737968146773524e-06, "epoch": 0.18970838899894044, "percentage": 18.97, "elapsed_time": "6:30:10", "remaining_time": "1 day, 3:46:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2060, "total_steps": 10853, "loss": 0.1727, "learning_rate": 4.737628523695811e-06, "epoch": 0.18980052517621043, "percentage": 18.98, "elapsed_time": "6:30:21", "remaining_time": "1 day, 3:46:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2061, "total_steps": 10853, "loss": 0.1813, "learning_rate": 4.737288692854049e-06, "epoch": 0.18989266135348046, "percentage": 18.99, "elapsed_time": "6:30:32", "remaining_time": "1 day, 3:45:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2062, "total_steps": 10853, "loss": 0.1772, "learning_rate": 4.736948654279791e-06, "epoch": 0.18998479753075045, "percentage": 19.0, "elapsed_time": "6:30:44", "remaining_time": "1 day, 3:45:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2063, "total_steps": 10853, "loss": 0.1589, "learning_rate": 4.73660840800461e-06, "epoch": 0.19007693370802045, "percentage": 19.01, "elapsed_time": "6:30:54", "remaining_time": "1 day, 3:45:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2064, "total_steps": 10853, "loss": 0.1712, "learning_rate": 4.736267954060097e-06, "epoch": 0.19016906988529045, "percentage": 19.02, "elapsed_time": "6:31:06", "remaining_time": "1 day, 3:45:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2065, "total_steps": 10853, "loss": 0.1814, "learning_rate": 4.735927292477864e-06, "epoch": 0.19026120606256047, "percentage": 19.03, "elapsed_time": "6:31:18", "remaining_time": "1 day, 3:45:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2066, "total_steps": 10853, "loss": 0.168, "learning_rate": 4.735586423289542e-06, "epoch": 0.19035334223983047, "percentage": 19.04, "elapsed_time": "6:31:29", "remaining_time": "1 day, 3:45:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2067, "total_steps": 10853, "loss": 0.1755, "learning_rate": 4.735245346526779e-06, "epoch": 0.19044547841710047, "percentage": 19.05, "elapsed_time": "6:31:39", "remaining_time": "1 day, 3:44:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2068, "total_steps": 10853, "loss": 0.1798, "learning_rate": 4.734904062221246e-06, "epoch": 0.1905376145943705, "percentage": 19.05, "elapsed_time": "6:31:50", "remaining_time": "1 day, 3:44:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2069, "total_steps": 10853, "loss": 0.1725, "learning_rate": 4.734562570404629e-06, "epoch": 0.1906297507716405, "percentage": 19.06, "elapsed_time": "6:32:00", "remaining_time": "1 day, 3:44:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2070, "total_steps": 10853, "loss": 0.1639, "learning_rate": 4.734220871108638e-06, "epoch": 0.19072188694891049, "percentage": 19.07, "elapsed_time": "6:32:12", "remaining_time": "1 day, 3:44:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2071, "total_steps": 10853, "loss": 0.1762, "learning_rate": 4.733878964364998e-06, "epoch": 0.19081402312618048, "percentage": 19.08, "elapsed_time": "6:32:23", "remaining_time": "1 day, 3:43:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2072, "total_steps": 10853, "loss": 0.1787, "learning_rate": 4.7335368502054564e-06, "epoch": 0.1909061593034505, "percentage": 19.09, "elapsed_time": "6:32:35", "remaining_time": "1 day, 3:43:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2073, "total_steps": 10853, "loss": 0.1751, "learning_rate": 4.733194528661778e-06, "epoch": 0.1909982954807205, "percentage": 19.1, "elapsed_time": "6:32:46", "remaining_time": "1 day, 3:43:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2074, "total_steps": 10853, "loss": 0.1684, "learning_rate": 4.732851999765747e-06, "epoch": 0.1910904316579905, "percentage": 19.11, "elapsed_time": "6:32:56", "remaining_time": "1 day, 3:43:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2075, "total_steps": 10853, "loss": 0.1713, "learning_rate": 4.732509263549167e-06, "epoch": 0.19118256783526053, "percentage": 19.12, "elapsed_time": "6:33:07", "remaining_time": "1 day, 3:43:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2076, "total_steps": 10853, "loss": 0.1595, "learning_rate": 4.732166320043862e-06, "epoch": 0.19127470401253052, "percentage": 19.13, "elapsed_time": "6:33:18", "remaining_time": "1 day, 3:42:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2077, "total_steps": 10853, "loss": 0.1726, "learning_rate": 4.731823169281674e-06, "epoch": 0.19136684018980052, "percentage": 19.14, "elapsed_time": "6:33:29", "remaining_time": "1 day, 3:42:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2078, "total_steps": 10853, "loss": 0.1802, "learning_rate": 4.731479811294464e-06, "epoch": 0.19145897636707054, "percentage": 19.15, "elapsed_time": "6:33:40", "remaining_time": "1 day, 3:42:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2079, "total_steps": 10853, "loss": 0.1786, "learning_rate": 4.731136246114114e-06, "epoch": 0.19155111254434054, "percentage": 19.16, "elapsed_time": "6:33:50", "remaining_time": "1 day, 3:42:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2080, "total_steps": 10853, "loss": 0.17, "learning_rate": 4.730792473772523e-06, "epoch": 0.19164324872161054, "percentage": 19.17, "elapsed_time": "6:34:01", "remaining_time": "1 day, 3:41:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2081, "total_steps": 10853, "loss": 0.174, "learning_rate": 4.730448494301612e-06, "epoch": 0.19173538489888053, "percentage": 19.17, "elapsed_time": "6:34:12", "remaining_time": "1 day, 3:41:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2082, "total_steps": 10853, "loss": 0.1805, "learning_rate": 4.7301043077333165e-06, "epoch": 0.19182752107615056, "percentage": 19.18, "elapsed_time": "6:34:22", "remaining_time": "1 day, 3:41:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2083, "total_steps": 10853, "loss": 0.1636, "learning_rate": 4.729759914099597e-06, "epoch": 0.19191965725342056, "percentage": 19.19, "elapsed_time": "6:34:32", "remaining_time": "1 day, 3:41:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2084, "total_steps": 10853, "loss": 0.17, "learning_rate": 4.729415313432429e-06, "epoch": 0.19201179343069055, "percentage": 19.2, "elapsed_time": "6:34:43", "remaining_time": "1 day, 3:40:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2085, "total_steps": 10853, "loss": 0.1798, "learning_rate": 4.729070505763809e-06, "epoch": 0.19210392960796058, "percentage": 19.21, "elapsed_time": "6:34:54", "remaining_time": "1 day, 3:40:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2086, "total_steps": 10853, "loss": 0.1726, "learning_rate": 4.728725491125753e-06, "epoch": 0.19219606578523057, "percentage": 19.22, "elapsed_time": "6:35:05", "remaining_time": "1 day, 3:40:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2087, "total_steps": 10853, "loss": 0.1876, "learning_rate": 4.728380269550296e-06, "epoch": 0.19228820196250057, "percentage": 19.23, "elapsed_time": "6:35:16", "remaining_time": "1 day, 3:40:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2088, "total_steps": 10853, "loss": 0.1865, "learning_rate": 4.7280348410694905e-06, "epoch": 0.19238033813977057, "percentage": 19.24, "elapsed_time": "6:35:28", "remaining_time": "1 day, 3:40:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2089, "total_steps": 10853, "loss": 0.1876, "learning_rate": 4.72768920571541e-06, "epoch": 0.1924724743170406, "percentage": 19.25, "elapsed_time": "6:35:37", "remaining_time": "1 day, 3:39:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2090, "total_steps": 10853, "loss": 0.1715, "learning_rate": 4.727343363520147e-06, "epoch": 0.1925646104943106, "percentage": 19.26, "elapsed_time": "6:35:48", "remaining_time": "1 day, 3:39:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2091, "total_steps": 10853, "loss": 0.168, "learning_rate": 4.7269973145158134e-06, "epoch": 0.1926567466715806, "percentage": 19.27, "elapsed_time": "6:35:59", "remaining_time": "1 day, 3:39:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2092, "total_steps": 10853, "loss": 0.1712, "learning_rate": 4.7266510587345395e-06, "epoch": 0.1927488828488506, "percentage": 19.28, "elapsed_time": "6:36:11", "remaining_time": "1 day, 3:39:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2093, "total_steps": 10853, "loss": 0.1624, "learning_rate": 4.726304596208475e-06, "epoch": 0.1928410190261206, "percentage": 19.28, "elapsed_time": "6:36:22", "remaining_time": "1 day, 3:38:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2094, "total_steps": 10853, "loss": 0.1564, "learning_rate": 4.725957926969789e-06, "epoch": 0.1929331552033906, "percentage": 19.29, "elapsed_time": "6:36:32", "remaining_time": "1 day, 3:38:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2095, "total_steps": 10853, "loss": 0.169, "learning_rate": 4.72561105105067e-06, "epoch": 0.19302529138066063, "percentage": 19.3, "elapsed_time": "6:36:43", "remaining_time": "1 day, 3:38:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2096, "total_steps": 10853, "loss": 0.1687, "learning_rate": 4.7252639684833255e-06, "epoch": 0.19311742755793063, "percentage": 19.31, "elapsed_time": "6:36:54", "remaining_time": "1 day, 3:38:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2097, "total_steps": 10853, "loss": 0.1664, "learning_rate": 4.724916679299982e-06, "epoch": 0.19320956373520062, "percentage": 19.32, "elapsed_time": "6:37:04", "remaining_time": "1 day, 3:37:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2098, "total_steps": 10853, "loss": 0.1676, "learning_rate": 4.7245691835328855e-06, "epoch": 0.19330169991247062, "percentage": 19.33, "elapsed_time": "6:37:15", "remaining_time": "1 day, 3:37:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2099, "total_steps": 10853, "loss": 0.1673, "learning_rate": 4.724221481214301e-06, "epoch": 0.19339383608974064, "percentage": 19.34, "elapsed_time": "6:37:26", "remaining_time": "1 day, 3:37:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2100, "total_steps": 10853, "loss": 0.185, "learning_rate": 4.723873572376512e-06, "epoch": 0.19348597226701064, "percentage": 19.35, "elapsed_time": "6:37:36", "remaining_time": "1 day, 3:37:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2101, "total_steps": 10853, "loss": 0.1795, "learning_rate": 4.723525457051823e-06, "epoch": 0.19357810844428064, "percentage": 19.36, "elapsed_time": "6:37:46", "remaining_time": "1 day, 3:37:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2102, "total_steps": 10853, "loss": 0.1752, "learning_rate": 4.723177135272556e-06, "epoch": 0.19367024462155066, "percentage": 19.37, "elapsed_time": "6:37:58", "remaining_time": "1 day, 3:36:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2103, "total_steps": 10853, "loss": 0.1726, "learning_rate": 4.7228286070710525e-06, "epoch": 0.19376238079882066, "percentage": 19.38, "elapsed_time": "6:38:08", "remaining_time": "1 day, 3:36:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2104, "total_steps": 10853, "loss": 0.1588, "learning_rate": 4.722479872479674e-06, "epoch": 0.19385451697609066, "percentage": 19.39, "elapsed_time": "6:38:18", "remaining_time": "1 day, 3:36:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2105, "total_steps": 10853, "loss": 0.1765, "learning_rate": 4.7221309315308e-06, "epoch": 0.19394665315336065, "percentage": 19.4, "elapsed_time": "6:38:29", "remaining_time": "1 day, 3:36:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2106, "total_steps": 10853, "loss": 0.1535, "learning_rate": 4.721781784256829e-06, "epoch": 0.19403878933063068, "percentage": 19.4, "elapsed_time": "6:38:41", "remaining_time": "1 day, 3:35:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2107, "total_steps": 10853, "loss": 0.18, "learning_rate": 4.721432430690181e-06, "epoch": 0.19413092550790068, "percentage": 19.41, "elapsed_time": "6:38:52", "remaining_time": "1 day, 3:35:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2108, "total_steps": 10853, "loss": 0.1744, "learning_rate": 4.721082870863293e-06, "epoch": 0.19422306168517067, "percentage": 19.42, "elapsed_time": "6:39:02", "remaining_time": "1 day, 3:35:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2109, "total_steps": 10853, "loss": 0.1563, "learning_rate": 4.720733104808621e-06, "epoch": 0.1943151978624407, "percentage": 19.43, "elapsed_time": "6:39:13", "remaining_time": "1 day, 3:35:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2110, "total_steps": 10853, "loss": 0.174, "learning_rate": 4.720383132558641e-06, "epoch": 0.1944073340397107, "percentage": 19.44, "elapsed_time": "6:39:22", "remaining_time": "1 day, 3:34:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2111, "total_steps": 10853, "loss": 0.1774, "learning_rate": 4.720032954145849e-06, "epoch": 0.1944994702169807, "percentage": 19.45, "elapsed_time": "6:39:34", "remaining_time": "1 day, 3:34:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2112, "total_steps": 10853, "loss": 0.1692, "learning_rate": 4.719682569602757e-06, "epoch": 0.19459160639425072, "percentage": 19.46, "elapsed_time": "6:39:45", "remaining_time": "1 day, 3:34:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2113, "total_steps": 10853, "loss": 0.1729, "learning_rate": 4.7193319789619e-06, "epoch": 0.1946837425715207, "percentage": 19.47, "elapsed_time": "6:39:55", "remaining_time": "1 day, 3:34:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2114, "total_steps": 10853, "loss": 0.167, "learning_rate": 4.718981182255831e-06, "epoch": 0.1947758787487907, "percentage": 19.48, "elapsed_time": "6:40:04", "remaining_time": "1 day, 3:33:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2115, "total_steps": 10853, "loss": 0.1851, "learning_rate": 4.71863017951712e-06, "epoch": 0.1948680149260607, "percentage": 19.49, "elapsed_time": "6:40:16", "remaining_time": "1 day, 3:33:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2116, "total_steps": 10853, "loss": 0.1704, "learning_rate": 4.718278970778357e-06, "epoch": 0.19496015110333073, "percentage": 19.5, "elapsed_time": "6:40:26", "remaining_time": "1 day, 3:33:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2117, "total_steps": 10853, "loss": 0.175, "learning_rate": 4.717927556072153e-06, "epoch": 0.19505228728060073, "percentage": 19.51, "elapsed_time": "6:40:37", "remaining_time": "1 day, 3:33:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2118, "total_steps": 10853, "loss": 0.1741, "learning_rate": 4.717575935431138e-06, "epoch": 0.19514442345787072, "percentage": 19.52, "elapsed_time": "6:40:49", "remaining_time": "1 day, 3:33:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2119, "total_steps": 10853, "loss": 0.1854, "learning_rate": 4.7172241088879575e-06, "epoch": 0.19523655963514075, "percentage": 19.52, "elapsed_time": "6:41:00", "remaining_time": "1 day, 3:32:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2120, "total_steps": 10853, "loss": 0.1786, "learning_rate": 4.716872076475281e-06, "epoch": 0.19532869581241075, "percentage": 19.53, "elapsed_time": "6:41:10", "remaining_time": "1 day, 3:32:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2121, "total_steps": 10853, "loss": 0.1691, "learning_rate": 4.7165198382257926e-06, "epoch": 0.19542083198968074, "percentage": 19.54, "elapsed_time": "6:41:21", "remaining_time": "1 day, 3:32:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2122, "total_steps": 10853, "loss": 0.1747, "learning_rate": 4.716167394172198e-06, "epoch": 0.19551296816695074, "percentage": 19.55, "elapsed_time": "6:41:33", "remaining_time": "1 day, 3:32:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2123, "total_steps": 10853, "loss": 0.1699, "learning_rate": 4.715814744347224e-06, "epoch": 0.19560510434422076, "percentage": 19.56, "elapsed_time": "6:41:43", "remaining_time": "1 day, 3:31:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2124, "total_steps": 10853, "loss": 0.1581, "learning_rate": 4.715461888783612e-06, "epoch": 0.19569724052149076, "percentage": 19.57, "elapsed_time": "6:41:53", "remaining_time": "1 day, 3:31:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2125, "total_steps": 10853, "loss": 0.1852, "learning_rate": 4.715108827514125e-06, "epoch": 0.19578937669876076, "percentage": 19.58, "elapsed_time": "6:42:05", "remaining_time": "1 day, 3:31:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2126, "total_steps": 10853, "loss": 0.1806, "learning_rate": 4.714755560571545e-06, "epoch": 0.19588151287603078, "percentage": 19.59, "elapsed_time": "6:42:16", "remaining_time": "1 day, 3:31:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2127, "total_steps": 10853, "loss": 0.1678, "learning_rate": 4.7144020879886736e-06, "epoch": 0.19597364905330078, "percentage": 19.6, "elapsed_time": "6:42:27", "remaining_time": "1 day, 3:31:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2128, "total_steps": 10853, "loss": 0.1588, "learning_rate": 4.714048409798328e-06, "epoch": 0.19606578523057078, "percentage": 19.61, "elapsed_time": "6:42:37", "remaining_time": "1 day, 3:30:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2129, "total_steps": 10853, "loss": 0.1696, "learning_rate": 4.713694526033351e-06, "epoch": 0.1961579214078408, "percentage": 19.62, "elapsed_time": "6:42:47", "remaining_time": "1 day, 3:30:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2130, "total_steps": 10853, "loss": 0.1876, "learning_rate": 4.713340436726599e-06, "epoch": 0.1962500575851108, "percentage": 19.63, "elapsed_time": "6:42:59", "remaining_time": "1 day, 3:30:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2131, "total_steps": 10853, "loss": 0.1833, "learning_rate": 4.712986141910948e-06, "epoch": 0.1963421937623808, "percentage": 19.64, "elapsed_time": "6:43:11", "remaining_time": "1 day, 3:30:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2132, "total_steps": 10853, "loss": 0.1813, "learning_rate": 4.712631641619297e-06, "epoch": 0.1964343299396508, "percentage": 19.64, "elapsed_time": "6:43:23", "remaining_time": "1 day, 3:30:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2133, "total_steps": 10853, "loss": 0.1834, "learning_rate": 4.7122769358845595e-06, "epoch": 0.19652646611692082, "percentage": 19.65, "elapsed_time": "6:43:34", "remaining_time": "1 day, 3:29:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2134, "total_steps": 10853, "loss": 0.1883, "learning_rate": 4.71192202473967e-06, "epoch": 0.19661860229419081, "percentage": 19.66, "elapsed_time": "6:43:45", "remaining_time": "1 day, 3:29:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2135, "total_steps": 10853, "loss": 0.1733, "learning_rate": 4.711566908217583e-06, "epoch": 0.1967107384714608, "percentage": 19.67, "elapsed_time": "6:43:56", "remaining_time": "1 day, 3:29:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2136, "total_steps": 10853, "loss": 0.1693, "learning_rate": 4.71121158635127e-06, "epoch": 0.19680287464873084, "percentage": 19.68, "elapsed_time": "6:44:08", "remaining_time": "1 day, 3:29:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2137, "total_steps": 10853, "loss": 0.1597, "learning_rate": 4.710856059173723e-06, "epoch": 0.19689501082600083, "percentage": 19.69, "elapsed_time": "6:44:19", "remaining_time": "1 day, 3:29:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2138, "total_steps": 10853, "loss": 0.1789, "learning_rate": 4.710500326717954e-06, "epoch": 0.19698714700327083, "percentage": 19.7, "elapsed_time": "6:44:29", "remaining_time": "1 day, 3:28:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2139, "total_steps": 10853, "loss": 0.1681, "learning_rate": 4.7101443890169915e-06, "epoch": 0.19707928318054083, "percentage": 19.71, "elapsed_time": "6:44:40", "remaining_time": "1 day, 3:28:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2140, "total_steps": 10853, "loss": 0.1725, "learning_rate": 4.7097882461038845e-06, "epoch": 0.19717141935781085, "percentage": 19.72, "elapsed_time": "6:44:50", "remaining_time": "1 day, 3:28:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2141, "total_steps": 10853, "loss": 0.1759, "learning_rate": 4.7094318980117005e-06, "epoch": 0.19726355553508085, "percentage": 19.73, "elapsed_time": "6:45:01", "remaining_time": "1 day, 3:28:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2142, "total_steps": 10853, "loss": 0.179, "learning_rate": 4.709075344773527e-06, "epoch": 0.19735569171235084, "percentage": 19.74, "elapsed_time": "6:45:12", "remaining_time": "1 day, 3:27:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2143, "total_steps": 10853, "loss": 0.1669, "learning_rate": 4.70871858642247e-06, "epoch": 0.19744782788962087, "percentage": 19.75, "elapsed_time": "6:45:23", "remaining_time": "1 day, 3:27:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2144, "total_steps": 10853, "loss": 0.164, "learning_rate": 4.708361622991656e-06, "epoch": 0.19753996406689087, "percentage": 19.75, "elapsed_time": "6:45:32", "remaining_time": "1 day, 3:27:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2145, "total_steps": 10853, "loss": 0.183, "learning_rate": 4.708004454514226e-06, "epoch": 0.19763210024416086, "percentage": 19.76, "elapsed_time": "6:45:44", "remaining_time": "1 day, 3:27:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2146, "total_steps": 10853, "loss": 0.1715, "learning_rate": 4.7076470810233455e-06, "epoch": 0.1977242364214309, "percentage": 19.77, "elapsed_time": "6:45:54", "remaining_time": "1 day, 3:26:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2147, "total_steps": 10853, "loss": 0.1791, "learning_rate": 4.707289502552196e-06, "epoch": 0.19781637259870088, "percentage": 19.78, "elapsed_time": "6:46:04", "remaining_time": "1 day, 3:26:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2148, "total_steps": 10853, "loss": 0.1655, "learning_rate": 4.706931719133978e-06, "epoch": 0.19790850877597088, "percentage": 19.79, "elapsed_time": "6:46:15", "remaining_time": "1 day, 3:26:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2149, "total_steps": 10853, "loss": 0.189, "learning_rate": 4.706573730801913e-06, "epoch": 0.19800064495324088, "percentage": 19.8, "elapsed_time": "6:46:25", "remaining_time": "1 day, 3:26:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2150, "total_steps": 10853, "loss": 0.1758, "learning_rate": 4.706215537589239e-06, "epoch": 0.1980927811305109, "percentage": 19.81, "elapsed_time": "6:46:36", "remaining_time": "1 day, 3:25:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2151, "total_steps": 10853, "loss": 0.1497, "learning_rate": 4.705857139529215e-06, "epoch": 0.1981849173077809, "percentage": 19.82, "elapsed_time": "6:46:46", "remaining_time": "1 day, 3:25:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2152, "total_steps": 10853, "loss": 0.1821, "learning_rate": 4.705498536655119e-06, "epoch": 0.1982770534850509, "percentage": 19.83, "elapsed_time": "6:46:57", "remaining_time": "1 day, 3:25:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2153, "total_steps": 10853, "loss": 0.1692, "learning_rate": 4.705139729000246e-06, "epoch": 0.19836918966232092, "percentage": 19.84, "elapsed_time": "6:47:08", "remaining_time": "1 day, 3:25:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2154, "total_steps": 10853, "loss": 0.177, "learning_rate": 4.704780716597912e-06, "epoch": 0.19846132583959092, "percentage": 19.85, "elapsed_time": "6:47:18", "remaining_time": "1 day, 3:24:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2155, "total_steps": 10853, "loss": 0.1872, "learning_rate": 4.7044214994814505e-06, "epoch": 0.19855346201686092, "percentage": 19.86, "elapsed_time": "6:47:30", "remaining_time": "1 day, 3:24:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2156, "total_steps": 10853, "loss": 0.1692, "learning_rate": 4.704062077684216e-06, "epoch": 0.1986455981941309, "percentage": 19.87, "elapsed_time": "6:47:40", "remaining_time": "1 day, 3:24:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2157, "total_steps": 10853, "loss": 0.1711, "learning_rate": 4.703702451239582e-06, "epoch": 0.19873773437140094, "percentage": 19.87, "elapsed_time": "6:47:51", "remaining_time": "1 day, 3:24:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2158, "total_steps": 10853, "loss": 0.1891, "learning_rate": 4.703342620180936e-06, "epoch": 0.19882987054867093, "percentage": 19.88, "elapsed_time": "6:48:04", "remaining_time": "1 day, 3:24:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2159, "total_steps": 10853, "loss": 0.1695, "learning_rate": 4.702982584541691e-06, "epoch": 0.19892200672594093, "percentage": 19.89, "elapsed_time": "6:48:15", "remaining_time": "1 day, 3:23:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2160, "total_steps": 10853, "loss": 0.1771, "learning_rate": 4.702622344355276e-06, "epoch": 0.19901414290321096, "percentage": 19.9, "elapsed_time": "6:48:26", "remaining_time": "1 day, 3:23:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2161, "total_steps": 10853, "loss": 0.177, "learning_rate": 4.702261899655139e-06, "epoch": 0.19910627908048095, "percentage": 19.91, "elapsed_time": "6:48:36", "remaining_time": "1 day, 3:23:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2162, "total_steps": 10853, "loss": 0.1827, "learning_rate": 4.701901250474748e-06, "epoch": 0.19919841525775095, "percentage": 19.92, "elapsed_time": "6:48:46", "remaining_time": "1 day, 3:23:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2163, "total_steps": 10853, "loss": 0.1706, "learning_rate": 4.70154039684759e-06, "epoch": 0.19929055143502097, "percentage": 19.93, "elapsed_time": "6:48:57", "remaining_time": "1 day, 3:23:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2164, "total_steps": 10853, "loss": 0.1866, "learning_rate": 4.701179338807168e-06, "epoch": 0.19938268761229097, "percentage": 19.94, "elapsed_time": "6:49:09", "remaining_time": "1 day, 3:22:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2165, "total_steps": 10853, "loss": 0.1569, "learning_rate": 4.7008180763870075e-06, "epoch": 0.19947482378956097, "percentage": 19.95, "elapsed_time": "6:49:19", "remaining_time": "1 day, 3:22:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2166, "total_steps": 10853, "loss": 0.1687, "learning_rate": 4.700456609620652e-06, "epoch": 0.19956695996683096, "percentage": 19.96, "elapsed_time": "6:49:30", "remaining_time": "1 day, 3:22:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2167, "total_steps": 10853, "loss": 0.169, "learning_rate": 4.700094938541664e-06, "epoch": 0.199659096144101, "percentage": 19.97, "elapsed_time": "6:49:42", "remaining_time": "1 day, 3:22:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2168, "total_steps": 10853, "loss": 0.1736, "learning_rate": 4.6997330631836235e-06, "epoch": 0.199751232321371, "percentage": 19.98, "elapsed_time": "6:49:54", "remaining_time": "1 day, 3:22:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2169, "total_steps": 10853, "loss": 0.1676, "learning_rate": 4.699370983580132e-06, "epoch": 0.19984336849864098, "percentage": 19.99, "elapsed_time": "6:50:05", "remaining_time": "1 day, 3:21:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2170, "total_steps": 10853, "loss": 0.1622, "learning_rate": 4.699008699764807e-06, "epoch": 0.199935504675911, "percentage": 19.99, "elapsed_time": "6:50:14", "remaining_time": "1 day, 3:21:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2171, "total_steps": 10853, "loss": 0.1778, "learning_rate": 4.698646211771287e-06, "epoch": 0.200027640853181, "percentage": 20.0, "elapsed_time": "6:50:26", "remaining_time": "1 day, 3:21:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2172, "total_steps": 10853, "loss": 0.173, "learning_rate": 4.698283519633231e-06, "epoch": 0.200119777030451, "percentage": 20.01, "elapsed_time": "6:50:35", "remaining_time": "1 day, 3:21:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2173, "total_steps": 10853, "loss": 0.1763, "learning_rate": 4.6979206233843136e-06, "epoch": 0.200211913207721, "percentage": 20.02, "elapsed_time": "6:50:46", "remaining_time": "1 day, 3:20:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2174, "total_steps": 10853, "loss": 0.1612, "learning_rate": 4.697557523058229e-06, "epoch": 0.20030404938499102, "percentage": 20.03, "elapsed_time": "6:50:57", "remaining_time": "1 day, 3:20:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2175, "total_steps": 10853, "loss": 0.1657, "learning_rate": 4.6971942186886925e-06, "epoch": 0.20039618556226102, "percentage": 20.04, "elapsed_time": "6:51:09", "remaining_time": "1 day, 3:20:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2176, "total_steps": 10853, "loss": 0.1669, "learning_rate": 4.696830710309437e-06, "epoch": 0.20048832173953102, "percentage": 20.05, "elapsed_time": "6:51:19", "remaining_time": "1 day, 3:20:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2177, "total_steps": 10853, "loss": 0.1746, "learning_rate": 4.696466997954212e-06, "epoch": 0.20058045791680104, "percentage": 20.06, "elapsed_time": "6:51:30", "remaining_time": "1 day, 3:19:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2178, "total_steps": 10853, "loss": 0.1701, "learning_rate": 4.696103081656791e-06, "epoch": 0.20067259409407104, "percentage": 20.07, "elapsed_time": "6:51:40", "remaining_time": "1 day, 3:19:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2179, "total_steps": 10853, "loss": 0.1588, "learning_rate": 4.695738961450962e-06, "epoch": 0.20076473027134104, "percentage": 20.08, "elapsed_time": "6:51:52", "remaining_time": "1 day, 3:19:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2180, "total_steps": 10853, "loss": 0.173, "learning_rate": 4.695374637370534e-06, "epoch": 0.20085686644861106, "percentage": 20.09, "elapsed_time": "6:52:02", "remaining_time": "1 day, 3:19:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2181, "total_steps": 10853, "loss": 0.174, "learning_rate": 4.695010109449335e-06, "epoch": 0.20094900262588106, "percentage": 20.1, "elapsed_time": "6:52:13", "remaining_time": "1 day, 3:19:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2182, "total_steps": 10853, "loss": 0.1824, "learning_rate": 4.694645377721211e-06, "epoch": 0.20104113880315105, "percentage": 20.11, "elapsed_time": "6:52:22", "remaining_time": "1 day, 3:18:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2183, "total_steps": 10853, "loss": 0.1606, "learning_rate": 4.694280442220027e-06, "epoch": 0.20113327498042105, "percentage": 20.11, "elapsed_time": "6:52:32", "remaining_time": "1 day, 3:18:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2184, "total_steps": 10853, "loss": 0.1865, "learning_rate": 4.693915302979669e-06, "epoch": 0.20122541115769108, "percentage": 20.12, "elapsed_time": "6:52:44", "remaining_time": "1 day, 3:18:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2185, "total_steps": 10853, "loss": 0.1758, "learning_rate": 4.693549960034038e-06, "epoch": 0.20131754733496107, "percentage": 20.13, "elapsed_time": "6:52:56", "remaining_time": "1 day, 3:18:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2186, "total_steps": 10853, "loss": 0.1652, "learning_rate": 4.693184413417058e-06, "epoch": 0.20140968351223107, "percentage": 20.14, "elapsed_time": "6:53:06", "remaining_time": "1 day, 3:17:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2187, "total_steps": 10853, "loss": 0.1668, "learning_rate": 4.692818663162668e-06, "epoch": 0.2015018196895011, "percentage": 20.15, "elapsed_time": "6:53:16", "remaining_time": "1 day, 3:17:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2188, "total_steps": 10853, "loss": 0.1626, "learning_rate": 4.69245270930483e-06, "epoch": 0.2015939558667711, "percentage": 20.16, "elapsed_time": "6:53:27", "remaining_time": "1 day, 3:17:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2189, "total_steps": 10853, "loss": 0.161, "learning_rate": 4.6920865518775214e-06, "epoch": 0.2016860920440411, "percentage": 20.17, "elapsed_time": "6:53:38", "remaining_time": "1 day, 3:17:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2190, "total_steps": 10853, "loss": 0.1838, "learning_rate": 4.6917201909147415e-06, "epoch": 0.20177822822131108, "percentage": 20.18, "elapsed_time": "6:53:48", "remaining_time": "1 day, 3:16:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2191, "total_steps": 10853, "loss": 0.1726, "learning_rate": 4.691353626450505e-06, "epoch": 0.2018703643985811, "percentage": 20.19, "elapsed_time": "6:53:59", "remaining_time": "1 day, 3:16:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2192, "total_steps": 10853, "loss": 0.1822, "learning_rate": 4.690986858518849e-06, "epoch": 0.2019625005758511, "percentage": 20.2, "elapsed_time": "6:54:09", "remaining_time": "1 day, 3:16:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2193, "total_steps": 10853, "loss": 0.1639, "learning_rate": 4.6906198871538265e-06, "epoch": 0.2020546367531211, "percentage": 20.21, "elapsed_time": "6:54:20", "remaining_time": "1 day, 3:16:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2194, "total_steps": 10853, "loss": 0.1855, "learning_rate": 4.690252712389513e-06, "epoch": 0.20214677293039113, "percentage": 20.22, "elapsed_time": "6:54:31", "remaining_time": "1 day, 3:15:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2195, "total_steps": 10853, "loss": 0.1567, "learning_rate": 4.6898853342599994e-06, "epoch": 0.20223890910766112, "percentage": 20.22, "elapsed_time": "6:54:43", "remaining_time": "1 day, 3:15:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2196, "total_steps": 10853, "loss": 0.1904, "learning_rate": 4.689517752799396e-06, "epoch": 0.20233104528493112, "percentage": 20.23, "elapsed_time": "6:54:54", "remaining_time": "1 day, 3:15:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2197, "total_steps": 10853, "loss": 0.1844, "learning_rate": 4.689149968041834e-06, "epoch": 0.20242318146220115, "percentage": 20.24, "elapsed_time": "6:55:04", "remaining_time": "1 day, 3:15:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2198, "total_steps": 10853, "loss": 0.1743, "learning_rate": 4.6887819800214615e-06, "epoch": 0.20251531763947114, "percentage": 20.25, "elapsed_time": "6:55:14", "remaining_time": "1 day, 3:15:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2199, "total_steps": 10853, "loss": 0.1788, "learning_rate": 4.688413788772447e-06, "epoch": 0.20260745381674114, "percentage": 20.26, "elapsed_time": "6:55:26", "remaining_time": "1 day, 3:14:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2200, "total_steps": 10853, "loss": 0.1737, "learning_rate": 4.688045394328976e-06, "epoch": 0.20269958999401114, "percentage": 20.27, "elapsed_time": "6:55:37", "remaining_time": "1 day, 3:14:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2201, "total_steps": 10853, "loss": 0.1634, "learning_rate": 4.687676796725256e-06, "epoch": 0.20279172617128116, "percentage": 20.28, "elapsed_time": "6:55:47", "remaining_time": "1 day, 3:14:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2202, "total_steps": 10853, "loss": 0.1661, "learning_rate": 4.687307995995509e-06, "epoch": 0.20288386234855116, "percentage": 20.29, "elapsed_time": "6:55:58", "remaining_time": "1 day, 3:14:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2203, "total_steps": 10853, "loss": 0.1687, "learning_rate": 4.68693899217398e-06, "epoch": 0.20297599852582116, "percentage": 20.3, "elapsed_time": "6:56:10", "remaining_time": "1 day, 3:14:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2204, "total_steps": 10853, "loss": 0.1661, "learning_rate": 4.6865697852949285e-06, "epoch": 0.20306813470309118, "percentage": 20.31, "elapsed_time": "6:56:21", "remaining_time": "1 day, 3:13:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2205, "total_steps": 10853, "loss": 0.182, "learning_rate": 4.686200375392639e-06, "epoch": 0.20316027088036118, "percentage": 20.32, "elapsed_time": "6:56:31", "remaining_time": "1 day, 3:13:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2206, "total_steps": 10853, "loss": 0.1579, "learning_rate": 4.6858307625014084e-06, "epoch": 0.20325240705763117, "percentage": 20.33, "elapsed_time": "6:56:41", "remaining_time": "1 day, 3:13:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2207, "total_steps": 10853, "loss": 0.1784, "learning_rate": 4.685460946655556e-06, "epoch": 0.20334454323490117, "percentage": 20.34, "elapsed_time": "6:56:52", "remaining_time": "1 day, 3:13:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2208, "total_steps": 10853, "loss": 0.1754, "learning_rate": 4.68509092788942e-06, "epoch": 0.2034366794121712, "percentage": 20.34, "elapsed_time": "6:57:02", "remaining_time": "1 day, 3:12:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2209, "total_steps": 10853, "loss": 0.1666, "learning_rate": 4.684720706237356e-06, "epoch": 0.2035288155894412, "percentage": 20.35, "elapsed_time": "6:57:13", "remaining_time": "1 day, 3:12:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2210, "total_steps": 10853, "loss": 0.1643, "learning_rate": 4.68435028173374e-06, "epoch": 0.2036209517667112, "percentage": 20.36, "elapsed_time": "6:57:23", "remaining_time": "1 day, 3:12:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2211, "total_steps": 10853, "loss": 0.1965, "learning_rate": 4.683979654412965e-06, "epoch": 0.2037130879439812, "percentage": 20.37, "elapsed_time": "6:57:34", "remaining_time": "1 day, 3:12:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2212, "total_steps": 10853, "loss": 0.1751, "learning_rate": 4.683608824309443e-06, "epoch": 0.2038052241212512, "percentage": 20.38, "elapsed_time": "6:57:45", "remaining_time": "1 day, 3:11:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2213, "total_steps": 10853, "loss": 0.1772, "learning_rate": 4.683237791457608e-06, "epoch": 0.2038973602985212, "percentage": 20.39, "elapsed_time": "6:57:56", "remaining_time": "1 day, 3:11:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2214, "total_steps": 10853, "loss": 0.1808, "learning_rate": 4.682866555891908e-06, "epoch": 0.20398949647579123, "percentage": 20.4, "elapsed_time": "6:58:08", "remaining_time": "1 day, 3:11:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2215, "total_steps": 10853, "loss": 0.1652, "learning_rate": 4.6824951176468134e-06, "epoch": 0.20408163265306123, "percentage": 20.41, "elapsed_time": "6:58:18", "remaining_time": "1 day, 3:11:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2216, "total_steps": 10853, "loss": 0.1685, "learning_rate": 4.682123476756813e-06, "epoch": 0.20417376883033123, "percentage": 20.42, "elapsed_time": "6:58:28", "remaining_time": "1 day, 3:11:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2217, "total_steps": 10853, "loss": 0.1668, "learning_rate": 4.681751633256413e-06, "epoch": 0.20426590500760122, "percentage": 20.43, "elapsed_time": "6:58:39", "remaining_time": "1 day, 3:10:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2218, "total_steps": 10853, "loss": 0.175, "learning_rate": 4.681379587180138e-06, "epoch": 0.20435804118487125, "percentage": 20.44, "elapsed_time": "6:58:50", "remaining_time": "1 day, 3:10:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2219, "total_steps": 10853, "loss": 0.1796, "learning_rate": 4.681007338562535e-06, "epoch": 0.20445017736214124, "percentage": 20.45, "elapsed_time": "6:59:01", "remaining_time": "1 day, 3:10:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2220, "total_steps": 10853, "loss": 0.1733, "learning_rate": 4.680634887438165e-06, "epoch": 0.20454231353941124, "percentage": 20.46, "elapsed_time": "6:59:12", "remaining_time": "1 day, 3:10:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2221, "total_steps": 10853, "loss": 0.161, "learning_rate": 4.6802622338416115e-06, "epoch": 0.20463444971668127, "percentage": 20.46, "elapsed_time": "6:59:23", "remaining_time": "1 day, 3:09:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2222, "total_steps": 10853, "loss": 0.1514, "learning_rate": 4.679889377807475e-06, "epoch": 0.20472658589395126, "percentage": 20.47, "elapsed_time": "6:59:33", "remaining_time": "1 day, 3:09:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2223, "total_steps": 10853, "loss": 0.1527, "learning_rate": 4.679516319370374e-06, "epoch": 0.20481872207122126, "percentage": 20.48, "elapsed_time": "6:59:44", "remaining_time": "1 day, 3:09:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2224, "total_steps": 10853, "loss": 0.1844, "learning_rate": 4.679143058564949e-06, "epoch": 0.20491085824849126, "percentage": 20.49, "elapsed_time": "6:59:55", "remaining_time": "1 day, 3:09:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2225, "total_steps": 10853, "loss": 0.1941, "learning_rate": 4.678769595425856e-06, "epoch": 0.20500299442576128, "percentage": 20.5, "elapsed_time": "7:00:07", "remaining_time": "1 day, 3:09:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2226, "total_steps": 10853, "loss": 0.1606, "learning_rate": 4.6783959299877725e-06, "epoch": 0.20509513060303128, "percentage": 20.51, "elapsed_time": "7:00:18", "remaining_time": "1 day, 3:08:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2227, "total_steps": 10853, "loss": 0.1753, "learning_rate": 4.678022062285392e-06, "epoch": 0.20518726678030128, "percentage": 20.52, "elapsed_time": "7:00:30", "remaining_time": "1 day, 3:08:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2228, "total_steps": 10853, "loss": 0.1654, "learning_rate": 4.677647992353428e-06, "epoch": 0.2052794029575713, "percentage": 20.53, "elapsed_time": "7:00:41", "remaining_time": "1 day, 3:08:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2229, "total_steps": 10853, "loss": 0.1701, "learning_rate": 4.677273720226615e-06, "epoch": 0.2053715391348413, "percentage": 20.54, "elapsed_time": "7:00:53", "remaining_time": "1 day, 3:08:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2230, "total_steps": 10853, "loss": 0.1505, "learning_rate": 4.6768992459397015e-06, "epoch": 0.2054636753121113, "percentage": 20.55, "elapsed_time": "7:01:03", "remaining_time": "1 day, 3:08:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2231, "total_steps": 10853, "loss": 0.1564, "learning_rate": 4.67652456952746e-06, "epoch": 0.20555581148938132, "percentage": 20.56, "elapsed_time": "7:01:14", "remaining_time": "1 day, 3:07:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2232, "total_steps": 10853, "loss": 0.1708, "learning_rate": 4.6761496910246766e-06, "epoch": 0.20564794766665132, "percentage": 20.57, "elapsed_time": "7:01:23", "remaining_time": "1 day, 3:07:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2233, "total_steps": 10853, "loss": 0.159, "learning_rate": 4.6757746104661606e-06, "epoch": 0.2057400838439213, "percentage": 20.57, "elapsed_time": "7:01:34", "remaining_time": "1 day, 3:07:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2234, "total_steps": 10853, "loss": 0.1598, "learning_rate": 4.675399327886738e-06, "epoch": 0.2058322200211913, "percentage": 20.58, "elapsed_time": "7:01:44", "remaining_time": "1 day, 3:07:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2235, "total_steps": 10853, "loss": 0.1645, "learning_rate": 4.675023843321254e-06, "epoch": 0.20592435619846133, "percentage": 20.59, "elapsed_time": "7:01:55", "remaining_time": "1 day, 3:06:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2236, "total_steps": 10853, "loss": 0.1508, "learning_rate": 4.674648156804571e-06, "epoch": 0.20601649237573133, "percentage": 20.6, "elapsed_time": "7:02:05", "remaining_time": "1 day, 3:06:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2237, "total_steps": 10853, "loss": 0.177, "learning_rate": 4.674272268371574e-06, "epoch": 0.20610862855300133, "percentage": 20.61, "elapsed_time": "7:02:14", "remaining_time": "1 day, 3:06:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2238, "total_steps": 10853, "loss": 0.1725, "learning_rate": 4.673896178057162e-06, "epoch": 0.20620076473027135, "percentage": 20.62, "elapsed_time": "7:02:25", "remaining_time": "1 day, 3:06:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2239, "total_steps": 10853, "loss": 0.182, "learning_rate": 4.673519885896256e-06, "epoch": 0.20629290090754135, "percentage": 20.63, "elapsed_time": "7:02:35", "remaining_time": "1 day, 3:05:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2240, "total_steps": 10853, "loss": 0.1788, "learning_rate": 4.673143391923794e-06, "epoch": 0.20638503708481135, "percentage": 20.64, "elapsed_time": "7:02:46", "remaining_time": "1 day, 3:05:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2241, "total_steps": 10853, "loss": 0.1664, "learning_rate": 4.672766696174736e-06, "epoch": 0.20647717326208134, "percentage": 20.65, "elapsed_time": "7:02:56", "remaining_time": "1 day, 3:05:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2242, "total_steps": 10853, "loss": 0.173, "learning_rate": 4.672389798684055e-06, "epoch": 0.20656930943935137, "percentage": 20.66, "elapsed_time": "7:03:07", "remaining_time": "1 day, 3:05:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2243, "total_steps": 10853, "loss": 0.1722, "learning_rate": 4.672012699486748e-06, "epoch": 0.20666144561662136, "percentage": 20.67, "elapsed_time": "7:03:18", "remaining_time": "1 day, 3:04:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2244, "total_steps": 10853, "loss": 0.1616, "learning_rate": 4.671635398617828e-06, "epoch": 0.20675358179389136, "percentage": 20.68, "elapsed_time": "7:03:29", "remaining_time": "1 day, 3:04:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2245, "total_steps": 10853, "loss": 0.1604, "learning_rate": 4.671257896112327e-06, "epoch": 0.20684571797116139, "percentage": 20.69, "elapsed_time": "7:03:40", "remaining_time": "1 day, 3:04:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2246, "total_steps": 10853, "loss": 0.165, "learning_rate": 4.670880192005298e-06, "epoch": 0.20693785414843138, "percentage": 20.69, "elapsed_time": "7:03:50", "remaining_time": "1 day, 3:04:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2247, "total_steps": 10853, "loss": 0.1805, "learning_rate": 4.670502286331809e-06, "epoch": 0.20702999032570138, "percentage": 20.7, "elapsed_time": "7:04:00", "remaining_time": "1 day, 3:03:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2248, "total_steps": 10853, "loss": 0.1761, "learning_rate": 4.670124179126948e-06, "epoch": 0.2071221265029714, "percentage": 20.71, "elapsed_time": "7:04:11", "remaining_time": "1 day, 3:03:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2249, "total_steps": 10853, "loss": 0.172, "learning_rate": 4.669745870425824e-06, "epoch": 0.2072142626802414, "percentage": 20.72, "elapsed_time": "7:04:21", "remaining_time": "1 day, 3:03:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2250, "total_steps": 10853, "loss": 0.1517, "learning_rate": 4.669367360263563e-06, "epoch": 0.2073063988575114, "percentage": 20.73, "elapsed_time": "7:04:32", "remaining_time": "1 day, 3:03:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2251, "total_steps": 10853, "loss": 0.164, "learning_rate": 4.668988648675309e-06, "epoch": 0.2073985350347814, "percentage": 20.74, "elapsed_time": "7:04:44", "remaining_time": "1 day, 3:03:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2252, "total_steps": 10853, "loss": 0.1628, "learning_rate": 4.668609735696225e-06, "epoch": 0.20749067121205142, "percentage": 20.75, "elapsed_time": "7:04:55", "remaining_time": "1 day, 3:02:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2253, "total_steps": 10853, "loss": 0.1642, "learning_rate": 4.668230621361494e-06, "epoch": 0.20758280738932142, "percentage": 20.76, "elapsed_time": "7:05:07", "remaining_time": "1 day, 3:02:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2254, "total_steps": 10853, "loss": 0.1875, "learning_rate": 4.667851305706316e-06, "epoch": 0.2076749435665914, "percentage": 20.77, "elapsed_time": "7:05:18", "remaining_time": "1 day, 3:02:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2255, "total_steps": 10853, "loss": 0.169, "learning_rate": 4.667471788765911e-06, "epoch": 0.20776707974386144, "percentage": 20.78, "elapsed_time": "7:05:28", "remaining_time": "1 day, 3:02:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2256, "total_steps": 10853, "loss": 0.1769, "learning_rate": 4.667092070575518e-06, "epoch": 0.20785921592113143, "percentage": 20.79, "elapsed_time": "7:05:39", "remaining_time": "1 day, 3:02:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2257, "total_steps": 10853, "loss": 0.151, "learning_rate": 4.666712151170392e-06, "epoch": 0.20795135209840143, "percentage": 20.8, "elapsed_time": "7:05:51", "remaining_time": "1 day, 3:01:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2258, "total_steps": 10853, "loss": 0.1674, "learning_rate": 4.6663320305858106e-06, "epoch": 0.20804348827567143, "percentage": 20.81, "elapsed_time": "7:06:01", "remaining_time": "1 day, 3:01:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2259, "total_steps": 10853, "loss": 0.1701, "learning_rate": 4.665951708857066e-06, "epoch": 0.20813562445294145, "percentage": 20.81, "elapsed_time": "7:06:11", "remaining_time": "1 day, 3:01:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2260, "total_steps": 10853, "loss": 0.159, "learning_rate": 4.665571186019473e-06, "epoch": 0.20822776063021145, "percentage": 20.82, "elapsed_time": "7:06:22", "remaining_time": "1 day, 3:01:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2261, "total_steps": 10853, "loss": 0.1625, "learning_rate": 4.665190462108362e-06, "epoch": 0.20831989680748145, "percentage": 20.83, "elapsed_time": "7:06:32", "remaining_time": "1 day, 3:00:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2262, "total_steps": 10853, "loss": 0.179, "learning_rate": 4.664809537159084e-06, "epoch": 0.20841203298475147, "percentage": 20.84, "elapsed_time": "7:06:43", "remaining_time": "1 day, 3:00:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2263, "total_steps": 10853, "loss": 0.1548, "learning_rate": 4.664428411207007e-06, "epoch": 0.20850416916202147, "percentage": 20.85, "elapsed_time": "7:06:52", "remaining_time": "1 day, 3:00:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2264, "total_steps": 10853, "loss": 0.171, "learning_rate": 4.664047084287518e-06, "epoch": 0.20859630533929147, "percentage": 20.86, "elapsed_time": "7:07:03", "remaining_time": "1 day, 3:00:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2265, "total_steps": 10853, "loss": 0.1658, "learning_rate": 4.663665556436025e-06, "epoch": 0.2086884415165615, "percentage": 20.87, "elapsed_time": "7:07:14", "remaining_time": "1 day, 2:59:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2266, "total_steps": 10853, "loss": 0.1773, "learning_rate": 4.663283827687953e-06, "epoch": 0.2087805776938315, "percentage": 20.88, "elapsed_time": "7:07:25", "remaining_time": "1 day, 2:59:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2267, "total_steps": 10853, "loss": 0.1737, "learning_rate": 4.662901898078746e-06, "epoch": 0.20887271387110148, "percentage": 20.89, "elapsed_time": "7:07:36", "remaining_time": "1 day, 2:59:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2268, "total_steps": 10853, "loss": 0.1678, "learning_rate": 4.662519767643863e-06, "epoch": 0.20896485004837148, "percentage": 20.9, "elapsed_time": "7:07:48", "remaining_time": "1 day, 2:59:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2269, "total_steps": 10853, "loss": 0.1804, "learning_rate": 4.662137436418786e-06, "epoch": 0.2090569862256415, "percentage": 20.91, "elapsed_time": "7:07:59", "remaining_time": "1 day, 2:59:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2270, "total_steps": 10853, "loss": 0.177, "learning_rate": 4.661754904439018e-06, "epoch": 0.2091491224029115, "percentage": 20.92, "elapsed_time": "7:08:10", "remaining_time": "1 day, 2:58:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2271, "total_steps": 10853, "loss": 0.1702, "learning_rate": 4.661372171740073e-06, "epoch": 0.2092412585801815, "percentage": 20.93, "elapsed_time": "7:08:19", "remaining_time": "1 day, 2:58:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2272, "total_steps": 10853, "loss": 0.1725, "learning_rate": 4.660989238357489e-06, "epoch": 0.20933339475745152, "percentage": 20.93, "elapsed_time": "7:08:30", "remaining_time": "1 day, 2:58:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2273, "total_steps": 10853, "loss": 0.1676, "learning_rate": 4.660606104326822e-06, "epoch": 0.20942553093472152, "percentage": 20.94, "elapsed_time": "7:08:41", "remaining_time": "1 day, 2:58:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2274, "total_steps": 10853, "loss": 0.1689, "learning_rate": 4.660222769683645e-06, "epoch": 0.20951766711199152, "percentage": 20.95, "elapsed_time": "7:08:53", "remaining_time": "1 day, 2:58:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2275, "total_steps": 10853, "loss": 0.1666, "learning_rate": 4.659839234463552e-06, "epoch": 0.20960980328926151, "percentage": 20.96, "elapsed_time": "7:09:04", "remaining_time": "1 day, 2:57:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2276, "total_steps": 10853, "loss": 0.1676, "learning_rate": 4.659455498702154e-06, "epoch": 0.20970193946653154, "percentage": 20.97, "elapsed_time": "7:09:15", "remaining_time": "1 day, 2:57:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2277, "total_steps": 10853, "loss": 0.1778, "learning_rate": 4.65907156243508e-06, "epoch": 0.20979407564380154, "percentage": 20.98, "elapsed_time": "7:09:26", "remaining_time": "1 day, 2:57:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2278, "total_steps": 10853, "loss": 0.1672, "learning_rate": 4.65868742569798e-06, "epoch": 0.20988621182107153, "percentage": 20.99, "elapsed_time": "7:09:36", "remaining_time": "1 day, 2:57:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2279, "total_steps": 10853, "loss": 0.184, "learning_rate": 4.658303088526519e-06, "epoch": 0.20997834799834156, "percentage": 21.0, "elapsed_time": "7:09:46", "remaining_time": "1 day, 2:56:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2280, "total_steps": 10853, "loss": 0.1697, "learning_rate": 4.657918550956384e-06, "epoch": 0.21007048417561155, "percentage": 21.01, "elapsed_time": "7:09:57", "remaining_time": "1 day, 2:56:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2281, "total_steps": 10853, "loss": 0.1737, "learning_rate": 4.65753381302328e-06, "epoch": 0.21016262035288155, "percentage": 21.02, "elapsed_time": "7:10:08", "remaining_time": "1 day, 2:56:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2282, "total_steps": 10853, "loss": 0.1501, "learning_rate": 4.657148874762929e-06, "epoch": 0.21025475653015158, "percentage": 21.03, "elapsed_time": "7:10:18", "remaining_time": "1 day, 2:56:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2283, "total_steps": 10853, "loss": 0.17, "learning_rate": 4.656763736211073e-06, "epoch": 0.21034689270742157, "percentage": 21.04, "elapsed_time": "7:10:29", "remaining_time": "1 day, 2:56:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2284, "total_steps": 10853, "loss": 0.1628, "learning_rate": 4.656378397403472e-06, "epoch": 0.21043902888469157, "percentage": 21.04, "elapsed_time": "7:10:40", "remaining_time": "1 day, 2:55:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2285, "total_steps": 10853, "loss": 0.17, "learning_rate": 4.655992858375904e-06, "epoch": 0.21053116506196157, "percentage": 21.05, "elapsed_time": "7:10:49", "remaining_time": "1 day, 2:55:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2286, "total_steps": 10853, "loss": 0.1624, "learning_rate": 4.655607119164168e-06, "epoch": 0.2106233012392316, "percentage": 21.06, "elapsed_time": "7:11:00", "remaining_time": "1 day, 2:55:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2287, "total_steps": 10853, "loss": 0.1729, "learning_rate": 4.655221179804078e-06, "epoch": 0.2107154374165016, "percentage": 21.07, "elapsed_time": "7:11:11", "remaining_time": "1 day, 2:55:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2288, "total_steps": 10853, "loss": 0.1709, "learning_rate": 4.65483504033147e-06, "epoch": 0.21080757359377159, "percentage": 21.08, "elapsed_time": "7:11:22", "remaining_time": "1 day, 2:54:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2289, "total_steps": 10853, "loss": 0.173, "learning_rate": 4.654448700782197e-06, "epoch": 0.2108997097710416, "percentage": 21.09, "elapsed_time": "7:11:33", "remaining_time": "1 day, 2:54:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2290, "total_steps": 10853, "loss": 0.1816, "learning_rate": 4.65406216119213e-06, "epoch": 0.2109918459483116, "percentage": 21.1, "elapsed_time": "7:11:45", "remaining_time": "1 day, 2:54:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2291, "total_steps": 10853, "loss": 0.1666, "learning_rate": 4.653675421597159e-06, "epoch": 0.2110839821255816, "percentage": 21.11, "elapsed_time": "7:11:55", "remaining_time": "1 day, 2:54:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2292, "total_steps": 10853, "loss": 0.1725, "learning_rate": 4.653288482033194e-06, "epoch": 0.2111761183028516, "percentage": 21.12, "elapsed_time": "7:12:06", "remaining_time": "1 day, 2:53:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2293, "total_steps": 10853, "loss": 0.1893, "learning_rate": 4.652901342536162e-06, "epoch": 0.21126825448012163, "percentage": 21.13, "elapsed_time": "7:12:17", "remaining_time": "1 day, 2:53:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2294, "total_steps": 10853, "loss": 0.1593, "learning_rate": 4.652514003142008e-06, "epoch": 0.21136039065739162, "percentage": 21.14, "elapsed_time": "7:12:28", "remaining_time": "1 day, 2:53:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2295, "total_steps": 10853, "loss": 0.1876, "learning_rate": 4.652126463886697e-06, "epoch": 0.21145252683466162, "percentage": 21.15, "elapsed_time": "7:12:40", "remaining_time": "1 day, 2:53:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2296, "total_steps": 10853, "loss": 0.1547, "learning_rate": 4.651738724806213e-06, "epoch": 0.21154466301193164, "percentage": 21.16, "elapsed_time": "7:12:50", "remaining_time": "1 day, 2:53:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2297, "total_steps": 10853, "loss": 0.1456, "learning_rate": 4.651350785936556e-06, "epoch": 0.21163679918920164, "percentage": 21.16, "elapsed_time": "7:13:00", "remaining_time": "1 day, 2:52:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2298, "total_steps": 10853, "loss": 0.1737, "learning_rate": 4.650962647313747e-06, "epoch": 0.21172893536647164, "percentage": 21.17, "elapsed_time": "7:13:11", "remaining_time": "1 day, 2:52:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2299, "total_steps": 10853, "loss": 0.1832, "learning_rate": 4.650574308973826e-06, "epoch": 0.21182107154374166, "percentage": 21.18, "elapsed_time": "7:13:21", "remaining_time": "1 day, 2:52:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2300, "total_steps": 10853, "loss": 0.1904, "learning_rate": 4.6501857709528475e-06, "epoch": 0.21191320772101166, "percentage": 21.19, "elapsed_time": "7:13:32", "remaining_time": "1 day, 2:52:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2301, "total_steps": 10853, "loss": 0.1821, "learning_rate": 4.649797033286889e-06, "epoch": 0.21200534389828166, "percentage": 21.2, "elapsed_time": "7:13:43", "remaining_time": "1 day, 2:52:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2302, "total_steps": 10853, "loss": 0.1708, "learning_rate": 4.6494080960120444e-06, "epoch": 0.21209748007555165, "percentage": 21.21, "elapsed_time": "7:13:54", "remaining_time": "1 day, 2:51:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2303, "total_steps": 10853, "loss": 0.1596, "learning_rate": 4.6490189591644274e-06, "epoch": 0.21218961625282168, "percentage": 21.22, "elapsed_time": "7:14:04", "remaining_time": "1 day, 2:51:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2304, "total_steps": 10853, "loss": 0.1742, "learning_rate": 4.648629622780169e-06, "epoch": 0.21228175243009167, "percentage": 21.23, "elapsed_time": "7:14:15", "remaining_time": "1 day, 2:51:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2305, "total_steps": 10853, "loss": 0.1585, "learning_rate": 4.648240086895418e-06, "epoch": 0.21237388860736167, "percentage": 21.24, "elapsed_time": "7:14:27", "remaining_time": "1 day, 2:51:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2306, "total_steps": 10853, "loss": 0.1628, "learning_rate": 4.647850351546345e-06, "epoch": 0.2124660247846317, "percentage": 21.25, "elapsed_time": "7:14:37", "remaining_time": "1 day, 2:50:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2307, "total_steps": 10853, "loss": 0.1639, "learning_rate": 4.647460416769134e-06, "epoch": 0.2125581609619017, "percentage": 21.26, "elapsed_time": "7:14:50", "remaining_time": "1 day, 2:50:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2308, "total_steps": 10853, "loss": 0.171, "learning_rate": 4.647070282599994e-06, "epoch": 0.2126502971391717, "percentage": 21.27, "elapsed_time": "7:14:59", "remaining_time": "1 day, 2:50:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2309, "total_steps": 10853, "loss": 0.1932, "learning_rate": 4.646679949075146e-06, "epoch": 0.2127424333164417, "percentage": 21.28, "elapsed_time": "7:15:10", "remaining_time": "1 day, 2:50:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2310, "total_steps": 10853, "loss": 0.1694, "learning_rate": 4.646289416230834e-06, "epoch": 0.2128345694937117, "percentage": 21.28, "elapsed_time": "7:15:21", "remaining_time": "1 day, 2:50:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2311, "total_steps": 10853, "loss": 0.1771, "learning_rate": 4.645898684103318e-06, "epoch": 0.2129267056709817, "percentage": 21.29, "elapsed_time": "7:15:32", "remaining_time": "1 day, 2:49:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2312, "total_steps": 10853, "loss": 0.18, "learning_rate": 4.6455077527288795e-06, "epoch": 0.2130188418482517, "percentage": 21.3, "elapsed_time": "7:15:43", "remaining_time": "1 day, 2:49:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2313, "total_steps": 10853, "loss": 0.1657, "learning_rate": 4.6451166221438145e-06, "epoch": 0.21311097802552173, "percentage": 21.31, "elapsed_time": "7:15:54", "remaining_time": "1 day, 2:49:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2314, "total_steps": 10853, "loss": 0.1681, "learning_rate": 4.644725292384441e-06, "epoch": 0.21320311420279173, "percentage": 21.32, "elapsed_time": "7:16:04", "remaining_time": "1 day, 2:49:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2315, "total_steps": 10853, "loss": 0.1597, "learning_rate": 4.6443337634870926e-06, "epoch": 0.21329525038006172, "percentage": 21.33, "elapsed_time": "7:16:15", "remaining_time": "1 day, 2:49:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2316, "total_steps": 10853, "loss": 0.1665, "learning_rate": 4.643942035488123e-06, "epoch": 0.21338738655733175, "percentage": 21.34, "elapsed_time": "7:16:26", "remaining_time": "1 day, 2:48:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2317, "total_steps": 10853, "loss": 0.1609, "learning_rate": 4.643550108423905e-06, "epoch": 0.21347952273460175, "percentage": 21.35, "elapsed_time": "7:16:37", "remaining_time": "1 day, 2:48:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2318, "total_steps": 10853, "loss": 0.1724, "learning_rate": 4.64315798233083e-06, "epoch": 0.21357165891187174, "percentage": 21.36, "elapsed_time": "7:16:48", "remaining_time": "1 day, 2:48:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2319, "total_steps": 10853, "loss": 0.1703, "learning_rate": 4.642765657245304e-06, "epoch": 0.21366379508914174, "percentage": 21.37, "elapsed_time": "7:17:00", "remaining_time": "1 day, 2:48:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2320, "total_steps": 10853, "loss": 0.1597, "learning_rate": 4.642373133203757e-06, "epoch": 0.21375593126641176, "percentage": 21.38, "elapsed_time": "7:17:10", "remaining_time": "1 day, 2:47:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2321, "total_steps": 10853, "loss": 0.1678, "learning_rate": 4.641980410242634e-06, "epoch": 0.21384806744368176, "percentage": 21.39, "elapsed_time": "7:17:21", "remaining_time": "1 day, 2:47:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2322, "total_steps": 10853, "loss": 0.1672, "learning_rate": 4.6415874883983995e-06, "epoch": 0.21394020362095176, "percentage": 21.4, "elapsed_time": "7:17:33", "remaining_time": "1 day, 2:47:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2323, "total_steps": 10853, "loss": 0.1636, "learning_rate": 4.641194367707535e-06, "epoch": 0.21403233979822178, "percentage": 21.4, "elapsed_time": "7:17:43", "remaining_time": "1 day, 2:47:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2324, "total_steps": 10853, "loss": 0.1702, "learning_rate": 4.640801048206545e-06, "epoch": 0.21412447597549178, "percentage": 21.41, "elapsed_time": "7:17:55", "remaining_time": "1 day, 2:47:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2325, "total_steps": 10853, "loss": 0.1651, "learning_rate": 4.6404075299319465e-06, "epoch": 0.21421661215276178, "percentage": 21.42, "elapsed_time": "7:18:06", "remaining_time": "1 day, 2:46:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2326, "total_steps": 10853, "loss": 0.1584, "learning_rate": 4.640013812920278e-06, "epoch": 0.2143087483300318, "percentage": 21.43, "elapsed_time": "7:18:18", "remaining_time": "1 day, 2:46:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2327, "total_steps": 10853, "loss": 0.1542, "learning_rate": 4.639619897208097e-06, "epoch": 0.2144008845073018, "percentage": 21.44, "elapsed_time": "7:18:28", "remaining_time": "1 day, 2:46:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2328, "total_steps": 10853, "loss": 0.1679, "learning_rate": 4.639225782831978e-06, "epoch": 0.2144930206845718, "percentage": 21.45, "elapsed_time": "7:18:39", "remaining_time": "1 day, 2:46:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2329, "total_steps": 10853, "loss": 0.1701, "learning_rate": 4.638831469828515e-06, "epoch": 0.2145851568618418, "percentage": 21.46, "elapsed_time": "7:18:50", "remaining_time": "1 day, 2:46:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2330, "total_steps": 10853, "loss": 0.1851, "learning_rate": 4.638436958234321e-06, "epoch": 0.21467729303911182, "percentage": 21.47, "elapsed_time": "7:19:01", "remaining_time": "1 day, 2:45:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2331, "total_steps": 10853, "loss": 0.1676, "learning_rate": 4.638042248086023e-06, "epoch": 0.2147694292163818, "percentage": 21.48, "elapsed_time": "7:19:12", "remaining_time": "1 day, 2:45:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2332, "total_steps": 10853, "loss": 0.172, "learning_rate": 4.637647339420273e-06, "epoch": 0.2148615653936518, "percentage": 21.49, "elapsed_time": "7:19:23", "remaining_time": "1 day, 2:45:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2333, "total_steps": 10853, "loss": 0.1764, "learning_rate": 4.637252232273738e-06, "epoch": 0.21495370157092183, "percentage": 21.5, "elapsed_time": "7:19:34", "remaining_time": "1 day, 2:45:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2334, "total_steps": 10853, "loss": 0.1557, "learning_rate": 4.6368569266831035e-06, "epoch": 0.21504583774819183, "percentage": 21.51, "elapsed_time": "7:19:44", "remaining_time": "1 day, 2:45:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2335, "total_steps": 10853, "loss": 0.1745, "learning_rate": 4.636461422685072e-06, "epoch": 0.21513797392546183, "percentage": 21.51, "elapsed_time": "7:19:55", "remaining_time": "1 day, 2:44:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2336, "total_steps": 10853, "loss": 0.1649, "learning_rate": 4.63606572031637e-06, "epoch": 0.21523011010273183, "percentage": 21.52, "elapsed_time": "7:20:05", "remaining_time": "1 day, 2:44:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2337, "total_steps": 10853, "loss": 0.1642, "learning_rate": 4.635669819613734e-06, "epoch": 0.21532224628000185, "percentage": 21.53, "elapsed_time": "7:20:17", "remaining_time": "1 day, 2:44:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2338, "total_steps": 10853, "loss": 0.1712, "learning_rate": 4.635273720613925e-06, "epoch": 0.21541438245727185, "percentage": 21.54, "elapsed_time": "7:20:28", "remaining_time": "1 day, 2:44:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2339, "total_steps": 10853, "loss": 0.1721, "learning_rate": 4.634877423353723e-06, "epoch": 0.21550651863454184, "percentage": 21.55, "elapsed_time": "7:20:39", "remaining_time": "1 day, 2:44:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2340, "total_steps": 10853, "loss": 0.1668, "learning_rate": 4.634480927869921e-06, "epoch": 0.21559865481181187, "percentage": 21.56, "elapsed_time": "7:20:50", "remaining_time": "1 day, 2:43:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2341, "total_steps": 10853, "loss": 0.1369, "learning_rate": 4.634084234199335e-06, "epoch": 0.21569079098908187, "percentage": 21.57, "elapsed_time": "7:21:01", "remaining_time": "1 day, 2:43:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2342, "total_steps": 10853, "loss": 0.1698, "learning_rate": 4.633687342378799e-06, "epoch": 0.21578292716635186, "percentage": 21.58, "elapsed_time": "7:21:12", "remaining_time": "1 day, 2:43:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2343, "total_steps": 10853, "loss": 0.1878, "learning_rate": 4.633290252445164e-06, "epoch": 0.2158750633436219, "percentage": 21.59, "elapsed_time": "7:21:24", "remaining_time": "1 day, 2:43:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2344, "total_steps": 10853, "loss": 0.1805, "learning_rate": 4.632892964435299e-06, "epoch": 0.21596719952089188, "percentage": 21.6, "elapsed_time": "7:21:36", "remaining_time": "1 day, 2:43:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2345, "total_steps": 10853, "loss": 0.1634, "learning_rate": 4.632495478386092e-06, "epoch": 0.21605933569816188, "percentage": 21.61, "elapsed_time": "7:21:46", "remaining_time": "1 day, 2:42:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2346, "total_steps": 10853, "loss": 0.172, "learning_rate": 4.632097794334451e-06, "epoch": 0.21615147187543188, "percentage": 21.62, "elapsed_time": "7:21:56", "remaining_time": "1 day, 2:42:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2347, "total_steps": 10853, "loss": 0.1656, "learning_rate": 4.631699912317301e-06, "epoch": 0.2162436080527019, "percentage": 21.63, "elapsed_time": "7:22:09", "remaining_time": "1 day, 2:42:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2348, "total_steps": 10853, "loss": 0.1759, "learning_rate": 4.631301832371584e-06, "epoch": 0.2163357442299719, "percentage": 21.63, "elapsed_time": "7:22:20", "remaining_time": "1 day, 2:42:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2349, "total_steps": 10853, "loss": 0.1685, "learning_rate": 4.630903554534262e-06, "epoch": 0.2164278804072419, "percentage": 21.64, "elapsed_time": "7:22:31", "remaining_time": "1 day, 2:42:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2350, "total_steps": 10853, "loss": 0.1823, "learning_rate": 4.630505078842317e-06, "epoch": 0.21652001658451192, "percentage": 21.65, "elapsed_time": "7:22:41", "remaining_time": "1 day, 2:41:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2351, "total_steps": 10853, "loss": 0.1827, "learning_rate": 4.630106405332745e-06, "epoch": 0.21661215276178192, "percentage": 21.66, "elapsed_time": "7:22:52", "remaining_time": "1 day, 2:41:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2352, "total_steps": 10853, "loss": 0.1639, "learning_rate": 4.629707534042564e-06, "epoch": 0.21670428893905191, "percentage": 21.67, "elapsed_time": "7:23:03", "remaining_time": "1 day, 2:41:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2353, "total_steps": 10853, "loss": 0.1795, "learning_rate": 4.6293084650088095e-06, "epoch": 0.2167964251163219, "percentage": 21.68, "elapsed_time": "7:23:14", "remaining_time": "1 day, 2:41:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2354, "total_steps": 10853, "loss": 0.169, "learning_rate": 4.628909198268534e-06, "epoch": 0.21688856129359194, "percentage": 21.69, "elapsed_time": "7:23:25", "remaining_time": "1 day, 2:40:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2355, "total_steps": 10853, "loss": 0.1679, "learning_rate": 4.628509733858813e-06, "epoch": 0.21698069747086193, "percentage": 21.7, "elapsed_time": "7:23:36", "remaining_time": "1 day, 2:40:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2356, "total_steps": 10853, "loss": 0.1624, "learning_rate": 4.628110071816732e-06, "epoch": 0.21707283364813193, "percentage": 21.71, "elapsed_time": "7:23:46", "remaining_time": "1 day, 2:40:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2357, "total_steps": 10853, "loss": 0.1751, "learning_rate": 4.6277102121794015e-06, "epoch": 0.21716496982540195, "percentage": 21.72, "elapsed_time": "7:23:58", "remaining_time": "1 day, 2:40:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2358, "total_steps": 10853, "loss": 0.1738, "learning_rate": 4.62731015498395e-06, "epoch": 0.21725710600267195, "percentage": 21.73, "elapsed_time": "7:24:08", "remaining_time": "1 day, 2:40:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2359, "total_steps": 10853, "loss": 0.1743, "learning_rate": 4.626909900267521e-06, "epoch": 0.21734924217994195, "percentage": 21.74, "elapsed_time": "7:24:18", "remaining_time": "1 day, 2:39:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2360, "total_steps": 10853, "loss": 0.1655, "learning_rate": 4.626509448067279e-06, "epoch": 0.21744137835721197, "percentage": 21.75, "elapsed_time": "7:24:29", "remaining_time": "1 day, 2:39:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2361, "total_steps": 10853, "loss": 0.1574, "learning_rate": 4.626108798420406e-06, "epoch": 0.21753351453448197, "percentage": 21.75, "elapsed_time": "7:24:38", "remaining_time": "1 day, 2:39:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2362, "total_steps": 10853, "loss": 0.1781, "learning_rate": 4.625707951364102e-06, "epoch": 0.21762565071175197, "percentage": 21.76, "elapsed_time": "7:24:50", "remaining_time": "1 day, 2:39:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2363, "total_steps": 10853, "loss": 0.1743, "learning_rate": 4.625306906935586e-06, "epoch": 0.21771778688902196, "percentage": 21.77, "elapsed_time": "7:25:02", "remaining_time": "1 day, 2:38:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2364, "total_steps": 10853, "loss": 0.1642, "learning_rate": 4.624905665172095e-06, "epoch": 0.217809923066292, "percentage": 21.78, "elapsed_time": "7:25:14", "remaining_time": "1 day, 2:38:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2365, "total_steps": 10853, "loss": 0.1668, "learning_rate": 4.6245042261108845e-06, "epoch": 0.21790205924356199, "percentage": 21.79, "elapsed_time": "7:25:24", "remaining_time": "1 day, 2:38:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2366, "total_steps": 10853, "loss": 0.1842, "learning_rate": 4.6241025897892275e-06, "epoch": 0.21799419542083198, "percentage": 21.8, "elapsed_time": "7:25:34", "remaining_time": "1 day, 2:38:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2367, "total_steps": 10853, "loss": 0.1859, "learning_rate": 4.623700756244417e-06, "epoch": 0.218086331598102, "percentage": 21.81, "elapsed_time": "7:25:45", "remaining_time": "1 day, 2:38:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2368, "total_steps": 10853, "loss": 0.1515, "learning_rate": 4.6232987255137625e-06, "epoch": 0.218178467775372, "percentage": 21.82, "elapsed_time": "7:25:56", "remaining_time": "1 day, 2:37:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2369, "total_steps": 10853, "loss": 0.1483, "learning_rate": 4.622896497634593e-06, "epoch": 0.218270603952642, "percentage": 21.83, "elapsed_time": "7:26:05", "remaining_time": "1 day, 2:37:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2370, "total_steps": 10853, "loss": 0.1735, "learning_rate": 4.622494072644255e-06, "epoch": 0.218362740129912, "percentage": 21.84, "elapsed_time": "7:26:15", "remaining_time": "1 day, 2:37:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2371, "total_steps": 10853, "loss": 0.1656, "learning_rate": 4.622091450580114e-06, "epoch": 0.21845487630718202, "percentage": 21.85, "elapsed_time": "7:26:24", "remaining_time": "1 day, 2:37:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2372, "total_steps": 10853, "loss": 0.1653, "learning_rate": 4.621688631479554e-06, "epoch": 0.21854701248445202, "percentage": 21.86, "elapsed_time": "7:26:35", "remaining_time": "1 day, 2:36:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2373, "total_steps": 10853, "loss": 0.1743, "learning_rate": 4.621285615379976e-06, "epoch": 0.21863914866172202, "percentage": 21.86, "elapsed_time": "7:26:46", "remaining_time": "1 day, 2:36:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2374, "total_steps": 10853, "loss": 0.1736, "learning_rate": 4.620882402318799e-06, "epoch": 0.21873128483899204, "percentage": 21.87, "elapsed_time": "7:26:58", "remaining_time": "1 day, 2:36:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2375, "total_steps": 10853, "loss": 0.1618, "learning_rate": 4.620478992333463e-06, "epoch": 0.21882342101626204, "percentage": 21.88, "elapsed_time": "7:27:09", "remaining_time": "1 day, 2:36:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2376, "total_steps": 10853, "loss": 0.1608, "learning_rate": 4.620075385461426e-06, "epoch": 0.21891555719353203, "percentage": 21.89, "elapsed_time": "7:27:20", "remaining_time": "1 day, 2:35:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2377, "total_steps": 10853, "loss": 0.1508, "learning_rate": 4.61967158174016e-06, "epoch": 0.21900769337080206, "percentage": 21.9, "elapsed_time": "7:27:29", "remaining_time": "1 day, 2:35:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2378, "total_steps": 10853, "loss": 0.1579, "learning_rate": 4.61926758120716e-06, "epoch": 0.21909982954807206, "percentage": 21.91, "elapsed_time": "7:27:40", "remaining_time": "1 day, 2:35:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2379, "total_steps": 10853, "loss": 0.1696, "learning_rate": 4.618863383899937e-06, "epoch": 0.21919196572534205, "percentage": 21.92, "elapsed_time": "7:27:51", "remaining_time": "1 day, 2:35:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2380, "total_steps": 10853, "loss": 0.1765, "learning_rate": 4.618458989856021e-06, "epoch": 0.21928410190261205, "percentage": 21.93, "elapsed_time": "7:28:02", "remaining_time": "1 day, 2:35:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2381, "total_steps": 10853, "loss": 0.1675, "learning_rate": 4.618054399112959e-06, "epoch": 0.21937623807988207, "percentage": 21.94, "elapsed_time": "7:28:11", "remaining_time": "1 day, 2:34:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2382, "total_steps": 10853, "loss": 0.1711, "learning_rate": 4.617649611708318e-06, "epoch": 0.21946837425715207, "percentage": 21.95, "elapsed_time": "7:28:22", "remaining_time": "1 day, 2:34:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2383, "total_steps": 10853, "loss": 0.1829, "learning_rate": 4.617244627679684e-06, "epoch": 0.21956051043442207, "percentage": 21.96, "elapsed_time": "7:28:34", "remaining_time": "1 day, 2:34:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2384, "total_steps": 10853, "loss": 0.1639, "learning_rate": 4.6168394470646575e-06, "epoch": 0.2196526466116921, "percentage": 21.97, "elapsed_time": "7:28:44", "remaining_time": "1 day, 2:34:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2385, "total_steps": 10853, "loss": 0.1714, "learning_rate": 4.61643406990086e-06, "epoch": 0.2197447827889621, "percentage": 21.98, "elapsed_time": "7:28:54", "remaining_time": "1 day, 2:33:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2386, "total_steps": 10853, "loss": 0.165, "learning_rate": 4.616028496225933e-06, "epoch": 0.2198369189662321, "percentage": 21.98, "elapsed_time": "7:29:04", "remaining_time": "1 day, 2:33:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2387, "total_steps": 10853, "loss": 0.1637, "learning_rate": 4.6156227260775314e-06, "epoch": 0.21992905514350208, "percentage": 21.99, "elapsed_time": "7:29:14", "remaining_time": "1 day, 2:33:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2388, "total_steps": 10853, "loss": 0.1835, "learning_rate": 4.615216759493332e-06, "epoch": 0.2200211913207721, "percentage": 22.0, "elapsed_time": "7:29:26", "remaining_time": "1 day, 2:33:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2389, "total_steps": 10853, "loss": 0.1571, "learning_rate": 4.614810596511028e-06, "epoch": 0.2201133274980421, "percentage": 22.01, "elapsed_time": "7:29:37", "remaining_time": "1 day, 2:32:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2390, "total_steps": 10853, "loss": 0.1606, "learning_rate": 4.614404237168334e-06, "epoch": 0.2202054636753121, "percentage": 22.02, "elapsed_time": "7:29:49", "remaining_time": "1 day, 2:32:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2391, "total_steps": 10853, "loss": 0.1523, "learning_rate": 4.613997681502977e-06, "epoch": 0.22029759985258213, "percentage": 22.03, "elapsed_time": "7:29:58", "remaining_time": "1 day, 2:32:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2392, "total_steps": 10853, "loss": 0.1544, "learning_rate": 4.61359092955271e-06, "epoch": 0.22038973602985212, "percentage": 22.04, "elapsed_time": "7:30:09", "remaining_time": "1 day, 2:32:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2393, "total_steps": 10853, "loss": 0.1606, "learning_rate": 4.613183981355297e-06, "epoch": 0.22048187220712212, "percentage": 22.05, "elapsed_time": "7:30:20", "remaining_time": "1 day, 2:32:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2394, "total_steps": 10853, "loss": 0.1543, "learning_rate": 4.612776836948524e-06, "epoch": 0.22057400838439215, "percentage": 22.06, "elapsed_time": "7:30:30", "remaining_time": "1 day, 2:31:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2395, "total_steps": 10853, "loss": 0.1574, "learning_rate": 4.612369496370194e-06, "epoch": 0.22066614456166214, "percentage": 22.07, "elapsed_time": "7:30:40", "remaining_time": "1 day, 2:31:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2396, "total_steps": 10853, "loss": 0.1568, "learning_rate": 4.611961959658129e-06, "epoch": 0.22075828073893214, "percentage": 22.08, "elapsed_time": "7:30:51", "remaining_time": "1 day, 2:31:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2397, "total_steps": 10853, "loss": 0.1821, "learning_rate": 4.611554226850168e-06, "epoch": 0.22085041691620214, "percentage": 22.09, "elapsed_time": "7:31:03", "remaining_time": "1 day, 2:31:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2398, "total_steps": 10853, "loss": 0.1621, "learning_rate": 4.6111462979841704e-06, "epoch": 0.22094255309347216, "percentage": 22.1, "elapsed_time": "7:31:12", "remaining_time": "1 day, 2:30:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2399, "total_steps": 10853, "loss": 0.1711, "learning_rate": 4.610738173098012e-06, "epoch": 0.22103468927074216, "percentage": 22.1, "elapsed_time": "7:31:23", "remaining_time": "1 day, 2:30:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2400, "total_steps": 10853, "loss": 0.1566, "learning_rate": 4.610329852229587e-06, "epoch": 0.22112682544801215, "percentage": 22.11, "elapsed_time": "7:31:34", "remaining_time": "1 day, 2:30:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2401, "total_steps": 10853, "loss": 0.1735, "learning_rate": 4.6099213354168085e-06, "epoch": 0.22121896162528218, "percentage": 22.12, "elapsed_time": "7:31:46", "remaining_time": "1 day, 2:30:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2402, "total_steps": 10853, "loss": 0.1564, "learning_rate": 4.609512622697606e-06, "epoch": 0.22131109780255218, "percentage": 22.13, "elapsed_time": "7:31:55", "remaining_time": "1 day, 2:30:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2403, "total_steps": 10853, "loss": 0.1583, "learning_rate": 4.609103714109931e-06, "epoch": 0.22140323397982217, "percentage": 22.14, "elapsed_time": "7:32:06", "remaining_time": "1 day, 2:29:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2404, "total_steps": 10853, "loss": 0.1728, "learning_rate": 4.608694609691747e-06, "epoch": 0.22149537015709217, "percentage": 22.15, "elapsed_time": "7:32:17", "remaining_time": "1 day, 2:29:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2405, "total_steps": 10853, "loss": 0.1636, "learning_rate": 4.608285309481043e-06, "epoch": 0.2215875063343622, "percentage": 22.16, "elapsed_time": "7:32:28", "remaining_time": "1 day, 2:29:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2406, "total_steps": 10853, "loss": 0.1707, "learning_rate": 4.607875813515821e-06, "epoch": 0.2216796425116322, "percentage": 22.17, "elapsed_time": "7:32:39", "remaining_time": "1 day, 2:29:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2407, "total_steps": 10853, "loss": 0.1579, "learning_rate": 4.607466121834103e-06, "epoch": 0.2217717786889022, "percentage": 22.18, "elapsed_time": "7:32:50", "remaining_time": "1 day, 2:28:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2408, "total_steps": 10853, "loss": 0.1578, "learning_rate": 4.607056234473928e-06, "epoch": 0.2218639148661722, "percentage": 22.19, "elapsed_time": "7:32:59", "remaining_time": "1 day, 2:28:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2409, "total_steps": 10853, "loss": 0.1675, "learning_rate": 4.606646151473355e-06, "epoch": 0.2219560510434422, "percentage": 22.2, "elapsed_time": "7:33:10", "remaining_time": "1 day, 2:28:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2410, "total_steps": 10853, "loss": 0.1773, "learning_rate": 4.606235872870461e-06, "epoch": 0.2220481872207122, "percentage": 22.21, "elapsed_time": "7:33:22", "remaining_time": "1 day, 2:28:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2411, "total_steps": 10853, "loss": 0.1751, "learning_rate": 4.605825398703339e-06, "epoch": 0.22214032339798223, "percentage": 22.22, "elapsed_time": "7:33:31", "remaining_time": "1 day, 2:27:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2412, "total_steps": 10853, "loss": 0.1808, "learning_rate": 4.605414729010102e-06, "epoch": 0.22223245957525223, "percentage": 22.22, "elapsed_time": "7:33:43", "remaining_time": "1 day, 2:27:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2413, "total_steps": 10853, "loss": 0.1609, "learning_rate": 4.605003863828881e-06, "epoch": 0.22232459575252222, "percentage": 22.23, "elapsed_time": "7:33:53", "remaining_time": "1 day, 2:27:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2414, "total_steps": 10853, "loss": 0.1822, "learning_rate": 4.604592803197825e-06, "epoch": 0.22241673192979222, "percentage": 22.24, "elapsed_time": "7:34:04", "remaining_time": "1 day, 2:27:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2415, "total_steps": 10853, "loss": 0.1579, "learning_rate": 4.6041815471551e-06, "epoch": 0.22250886810706225, "percentage": 22.25, "elapsed_time": "7:34:13", "remaining_time": "1 day, 2:27:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2416, "total_steps": 10853, "loss": 0.1781, "learning_rate": 4.603770095738892e-06, "epoch": 0.22260100428433224, "percentage": 22.26, "elapsed_time": "7:34:24", "remaining_time": "1 day, 2:26:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2417, "total_steps": 10853, "loss": 0.1673, "learning_rate": 4.603358448987405e-06, "epoch": 0.22269314046160224, "percentage": 22.27, "elapsed_time": "7:34:34", "remaining_time": "1 day, 2:26:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2418, "total_steps": 10853, "loss": 0.1729, "learning_rate": 4.602946606938858e-06, "epoch": 0.22278527663887226, "percentage": 22.28, "elapsed_time": "7:34:46", "remaining_time": "1 day, 2:26:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2419, "total_steps": 10853, "loss": 0.1637, "learning_rate": 4.6025345696314935e-06, "epoch": 0.22287741281614226, "percentage": 22.29, "elapsed_time": "7:34:56", "remaining_time": "1 day, 2:26:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2420, "total_steps": 10853, "loss": 0.1861, "learning_rate": 4.602122337103568e-06, "epoch": 0.22296954899341226, "percentage": 22.3, "elapsed_time": "7:35:06", "remaining_time": "1 day, 2:25:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2421, "total_steps": 10853, "loss": 0.1789, "learning_rate": 4.601709909393357e-06, "epoch": 0.22306168517068226, "percentage": 22.31, "elapsed_time": "7:35:18", "remaining_time": "1 day, 2:25:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2422, "total_steps": 10853, "loss": 0.1844, "learning_rate": 4.601297286539155e-06, "epoch": 0.22315382134795228, "percentage": 22.32, "elapsed_time": "7:35:29", "remaining_time": "1 day, 2:25:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2423, "total_steps": 10853, "loss": 0.1718, "learning_rate": 4.600884468579273e-06, "epoch": 0.22324595752522228, "percentage": 22.33, "elapsed_time": "7:35:41", "remaining_time": "1 day, 2:25:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2424, "total_steps": 10853, "loss": 0.1545, "learning_rate": 4.600471455552043e-06, "epoch": 0.22333809370249227, "percentage": 22.33, "elapsed_time": "7:35:52", "remaining_time": "1 day, 2:25:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2425, "total_steps": 10853, "loss": 0.168, "learning_rate": 4.600058247495812e-06, "epoch": 0.2234302298797623, "percentage": 22.34, "elapsed_time": "7:36:03", "remaining_time": "1 day, 2:24:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2426, "total_steps": 10853, "loss": 0.175, "learning_rate": 4.599644844448946e-06, "epoch": 0.2235223660570323, "percentage": 22.35, "elapsed_time": "7:36:14", "remaining_time": "1 day, 2:24:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2427, "total_steps": 10853, "loss": 0.1705, "learning_rate": 4.599231246449831e-06, "epoch": 0.2236145022343023, "percentage": 22.36, "elapsed_time": "7:36:24", "remaining_time": "1 day, 2:24:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2428, "total_steps": 10853, "loss": 0.1568, "learning_rate": 4.5988174535368686e-06, "epoch": 0.22370663841157232, "percentage": 22.37, "elapsed_time": "7:36:35", "remaining_time": "1 day, 2:24:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2429, "total_steps": 10853, "loss": 0.1809, "learning_rate": 4.59840346574848e-06, "epoch": 0.22379877458884231, "percentage": 22.38, "elapsed_time": "7:36:47", "remaining_time": "1 day, 2:24:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2430, "total_steps": 10853, "loss": 0.1843, "learning_rate": 4.597989283123104e-06, "epoch": 0.2238909107661123, "percentage": 22.39, "elapsed_time": "7:36:57", "remaining_time": "1 day, 2:23:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2431, "total_steps": 10853, "loss": 0.1685, "learning_rate": 4.597574905699196e-06, "epoch": 0.2239830469433823, "percentage": 22.4, "elapsed_time": "7:37:08", "remaining_time": "1 day, 2:23:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2432, "total_steps": 10853, "loss": 0.1767, "learning_rate": 4.597160333515233e-06, "epoch": 0.22407518312065233, "percentage": 22.41, "elapsed_time": "7:37:19", "remaining_time": "1 day, 2:23:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2433, "total_steps": 10853, "loss": 0.1598, "learning_rate": 4.596745566609707e-06, "epoch": 0.22416731929792233, "percentage": 22.42, "elapsed_time": "7:37:30", "remaining_time": "1 day, 2:23:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2434, "total_steps": 10853, "loss": 0.1649, "learning_rate": 4.5963306050211296e-06, "epoch": 0.22425945547519233, "percentage": 22.43, "elapsed_time": "7:37:40", "remaining_time": "1 day, 2:23:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2435, "total_steps": 10853, "loss": 0.1818, "learning_rate": 4.595915448788031e-06, "epoch": 0.22435159165246235, "percentage": 22.44, "elapsed_time": "7:37:51", "remaining_time": "1 day, 2:22:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2436, "total_steps": 10853, "loss": 0.1766, "learning_rate": 4.5955000979489565e-06, "epoch": 0.22444372782973235, "percentage": 22.45, "elapsed_time": "7:38:01", "remaining_time": "1 day, 2:22:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2437, "total_steps": 10853, "loss": 0.1728, "learning_rate": 4.595084552542472e-06, "epoch": 0.22453586400700234, "percentage": 22.45, "elapsed_time": "7:38:11", "remaining_time": "1 day, 2:22:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2438, "total_steps": 10853, "loss": 0.1667, "learning_rate": 4.594668812607162e-06, "epoch": 0.22462800018427234, "percentage": 22.46, "elapsed_time": "7:38:21", "remaining_time": "1 day, 2:22:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2439, "total_steps": 10853, "loss": 0.163, "learning_rate": 4.594252878181627e-06, "epoch": 0.22472013636154237, "percentage": 22.47, "elapsed_time": "7:38:33", "remaining_time": "1 day, 2:21:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2440, "total_steps": 10853, "loss": 0.1511, "learning_rate": 4.593836749304487e-06, "epoch": 0.22481227253881236, "percentage": 22.48, "elapsed_time": "7:38:43", "remaining_time": "1 day, 2:21:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2441, "total_steps": 10853, "loss": 0.1839, "learning_rate": 4.59342042601438e-06, "epoch": 0.22490440871608236, "percentage": 22.49, "elapsed_time": "7:38:53", "remaining_time": "1 day, 2:21:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2442, "total_steps": 10853, "loss": 0.178, "learning_rate": 4.59300390834996e-06, "epoch": 0.22499654489335238, "percentage": 22.5, "elapsed_time": "7:39:04", "remaining_time": "1 day, 2:21:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2443, "total_steps": 10853, "loss": 0.1798, "learning_rate": 4.592587196349902e-06, "epoch": 0.22508868107062238, "percentage": 22.51, "elapsed_time": "7:39:15", "remaining_time": "1 day, 2:20:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2444, "total_steps": 10853, "loss": 0.1654, "learning_rate": 4.592170290052898e-06, "epoch": 0.22518081724789238, "percentage": 22.52, "elapsed_time": "7:39:24", "remaining_time": "1 day, 2:20:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2445, "total_steps": 10853, "loss": 0.1544, "learning_rate": 4.591753189497658e-06, "epoch": 0.2252729534251624, "percentage": 22.53, "elapsed_time": "7:39:34", "remaining_time": "1 day, 2:20:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2446, "total_steps": 10853, "loss": 0.1937, "learning_rate": 4.591335894722909e-06, "epoch": 0.2253650896024324, "percentage": 22.54, "elapsed_time": "7:39:45", "remaining_time": "1 day, 2:20:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2447, "total_steps": 10853, "loss": 0.1604, "learning_rate": 4.5909184057673976e-06, "epoch": 0.2254572257797024, "percentage": 22.55, "elapsed_time": "7:39:55", "remaining_time": "1 day, 2:19:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2448, "total_steps": 10853, "loss": 0.1697, "learning_rate": 4.590500722669886e-06, "epoch": 0.2255493619569724, "percentage": 22.56, "elapsed_time": "7:40:06", "remaining_time": "1 day, 2:19:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2449, "total_steps": 10853, "loss": 0.1507, "learning_rate": 4.590082845469158e-06, "epoch": 0.22564149813424242, "percentage": 22.57, "elapsed_time": "7:40:16", "remaining_time": "1 day, 2:19:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2450, "total_steps": 10853, "loss": 0.1696, "learning_rate": 4.589664774204013e-06, "epoch": 0.22573363431151242, "percentage": 22.57, "elapsed_time": "7:40:27", "remaining_time": "1 day, 2:19:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2451, "total_steps": 10853, "loss": 0.1774, "learning_rate": 4.589246508913267e-06, "epoch": 0.2258257704887824, "percentage": 22.58, "elapsed_time": "7:40:38", "remaining_time": "1 day, 2:19:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2452, "total_steps": 10853, "loss": 0.1676, "learning_rate": 4.58882804963576e-06, "epoch": 0.22591790666605244, "percentage": 22.59, "elapsed_time": "7:40:48", "remaining_time": "1 day, 2:18:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2453, "total_steps": 10853, "loss": 0.1784, "learning_rate": 4.588409396410342e-06, "epoch": 0.22601004284332243, "percentage": 22.6, "elapsed_time": "7:40:59", "remaining_time": "1 day, 2:18:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2454, "total_steps": 10853, "loss": 0.1647, "learning_rate": 4.587990549275889e-06, "epoch": 0.22610217902059243, "percentage": 22.61, "elapsed_time": "7:41:11", "remaining_time": "1 day, 2:18:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2455, "total_steps": 10853, "loss": 0.1643, "learning_rate": 4.587571508271288e-06, "epoch": 0.22619431519786243, "percentage": 22.62, "elapsed_time": "7:41:22", "remaining_time": "1 day, 2:18:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2456, "total_steps": 10853, "loss": 0.166, "learning_rate": 4.587152273435447e-06, "epoch": 0.22628645137513245, "percentage": 22.63, "elapsed_time": "7:41:32", "remaining_time": "1 day, 2:18:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2457, "total_steps": 10853, "loss": 0.1695, "learning_rate": 4.586732844807293e-06, "epoch": 0.22637858755240245, "percentage": 22.64, "elapsed_time": "7:41:42", "remaining_time": "1 day, 2:17:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2458, "total_steps": 10853, "loss": 0.1672, "learning_rate": 4.58631322242577e-06, "epoch": 0.22647072372967245, "percentage": 22.65, "elapsed_time": "7:41:53", "remaining_time": "1 day, 2:17:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2459, "total_steps": 10853, "loss": 0.1704, "learning_rate": 4.58589340632984e-06, "epoch": 0.22656285990694247, "percentage": 22.66, "elapsed_time": "7:42:03", "remaining_time": "1 day, 2:17:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2460, "total_steps": 10853, "loss": 0.1896, "learning_rate": 4.585473396558482e-06, "epoch": 0.22665499608421247, "percentage": 22.67, "elapsed_time": "7:42:14", "remaining_time": "1 day, 2:17:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2461, "total_steps": 10853, "loss": 0.148, "learning_rate": 4.585053193150695e-06, "epoch": 0.22674713226148246, "percentage": 22.68, "elapsed_time": "7:42:24", "remaining_time": "1 day, 2:16:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2462, "total_steps": 10853, "loss": 0.1617, "learning_rate": 4.584632796145495e-06, "epoch": 0.2268392684387525, "percentage": 22.68, "elapsed_time": "7:42:34", "remaining_time": "1 day, 2:16:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2463, "total_steps": 10853, "loss": 0.1736, "learning_rate": 4.584212205581915e-06, "epoch": 0.2269314046160225, "percentage": 22.69, "elapsed_time": "7:42:45", "remaining_time": "1 day, 2:16:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2464, "total_steps": 10853, "loss": 0.1685, "learning_rate": 4.5837914214990085e-06, "epoch": 0.22702354079329248, "percentage": 22.7, "elapsed_time": "7:42:56", "remaining_time": "1 day, 2:16:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2465, "total_steps": 10853, "loss": 0.1574, "learning_rate": 4.583370443935843e-06, "epoch": 0.22711567697056248, "percentage": 22.71, "elapsed_time": "7:43:06", "remaining_time": "1 day, 2:15:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2466, "total_steps": 10853, "loss": 0.1708, "learning_rate": 4.582949272931508e-06, "epoch": 0.2272078131478325, "percentage": 22.72, "elapsed_time": "7:43:17", "remaining_time": "1 day, 2:15:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2467, "total_steps": 10853, "loss": 0.1701, "learning_rate": 4.582527908525109e-06, "epoch": 0.2272999493251025, "percentage": 22.73, "elapsed_time": "7:43:29", "remaining_time": "1 day, 2:15:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2468, "total_steps": 10853, "loss": 0.1771, "learning_rate": 4.5821063507557695e-06, "epoch": 0.2273920855023725, "percentage": 22.74, "elapsed_time": "7:43:38", "remaining_time": "1 day, 2:15:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2469, "total_steps": 10853, "loss": 0.1706, "learning_rate": 4.581684599662632e-06, "epoch": 0.22748422167964252, "percentage": 22.75, "elapsed_time": "7:43:49", "remaining_time": "1 day, 2:14:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2470, "total_steps": 10853, "loss": 0.1661, "learning_rate": 4.581262655284854e-06, "epoch": 0.22757635785691252, "percentage": 22.76, "elapsed_time": "7:43:59", "remaining_time": "1 day, 2:14:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2471, "total_steps": 10853, "loss": 0.1513, "learning_rate": 4.580840517661615e-06, "epoch": 0.22766849403418252, "percentage": 22.77, "elapsed_time": "7:44:10", "remaining_time": "1 day, 2:14:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2472, "total_steps": 10853, "loss": 0.1607, "learning_rate": 4.58041818683211e-06, "epoch": 0.2277606302114525, "percentage": 22.78, "elapsed_time": "7:44:21", "remaining_time": "1 day, 2:14:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2473, "total_steps": 10853, "loss": 0.1693, "learning_rate": 4.579995662835552e-06, "epoch": 0.22785276638872254, "percentage": 22.79, "elapsed_time": "7:44:31", "remaining_time": "1 day, 2:14:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2474, "total_steps": 10853, "loss": 0.1548, "learning_rate": 4.579572945711174e-06, "epoch": 0.22794490256599254, "percentage": 22.8, "elapsed_time": "7:44:42", "remaining_time": "1 day, 2:13:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2475, "total_steps": 10853, "loss": 0.1702, "learning_rate": 4.579150035498223e-06, "epoch": 0.22803703874326253, "percentage": 22.8, "elapsed_time": "7:44:52", "remaining_time": "1 day, 2:13:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2476, "total_steps": 10853, "loss": 0.1638, "learning_rate": 4.578726932235969e-06, "epoch": 0.22812917492053256, "percentage": 22.81, "elapsed_time": "7:45:02", "remaining_time": "1 day, 2:13:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2477, "total_steps": 10853, "loss": 0.1677, "learning_rate": 4.5783036359636935e-06, "epoch": 0.22822131109780255, "percentage": 22.82, "elapsed_time": "7:45:14", "remaining_time": "1 day, 2:13:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2478, "total_steps": 10853, "loss": 0.1699, "learning_rate": 4.5778801467207035e-06, "epoch": 0.22831344727507255, "percentage": 22.83, "elapsed_time": "7:45:26", "remaining_time": "1 day, 2:13:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2479, "total_steps": 10853, "loss": 0.1745, "learning_rate": 4.577456464546317e-06, "epoch": 0.22840558345234258, "percentage": 22.84, "elapsed_time": "7:45:35", "remaining_time": "1 day, 2:12:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2480, "total_steps": 10853, "loss": 0.1701, "learning_rate": 4.5770325894798754e-06, "epoch": 0.22849771962961257, "percentage": 22.85, "elapsed_time": "7:45:45", "remaining_time": "1 day, 2:12:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2481, "total_steps": 10853, "loss": 0.1704, "learning_rate": 4.5766085215607335e-06, "epoch": 0.22858985580688257, "percentage": 22.86, "elapsed_time": "7:45:54", "remaining_time": "1 day, 2:12:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2482, "total_steps": 10853, "loss": 0.1603, "learning_rate": 4.576184260828267e-06, "epoch": 0.22868199198415257, "percentage": 22.87, "elapsed_time": "7:46:04", "remaining_time": "1 day, 2:11:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2483, "total_steps": 10853, "loss": 0.179, "learning_rate": 4.575759807321869e-06, "epoch": 0.2287741281614226, "percentage": 22.88, "elapsed_time": "7:46:14", "remaining_time": "1 day, 2:11:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2484, "total_steps": 10853, "loss": 0.1595, "learning_rate": 4.575335161080948e-06, "epoch": 0.2288662643386926, "percentage": 22.89, "elapsed_time": "7:46:24", "remaining_time": "1 day, 2:11:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2485, "total_steps": 10853, "loss": 0.1785, "learning_rate": 4.574910322144935e-06, "epoch": 0.22895840051596258, "percentage": 22.9, "elapsed_time": "7:46:36", "remaining_time": "1 day, 2:11:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2486, "total_steps": 10853, "loss": 0.1671, "learning_rate": 4.574485290553276e-06, "epoch": 0.2290505366932326, "percentage": 22.91, "elapsed_time": "7:46:46", "remaining_time": "1 day, 2:11:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2487, "total_steps": 10853, "loss": 0.1794, "learning_rate": 4.574060066345434e-06, "epoch": 0.2291426728705026, "percentage": 22.92, "elapsed_time": "7:46:58", "remaining_time": "1 day, 2:10:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2488, "total_steps": 10853, "loss": 0.1651, "learning_rate": 4.573634649560891e-06, "epoch": 0.2292348090477726, "percentage": 22.92, "elapsed_time": "7:47:09", "remaining_time": "1 day, 2:10:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2489, "total_steps": 10853, "loss": 0.172, "learning_rate": 4.573209040239148e-06, "epoch": 0.2293269452250426, "percentage": 22.93, "elapsed_time": "7:47:21", "remaining_time": "1 day, 2:10:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2490, "total_steps": 10853, "loss": 0.165, "learning_rate": 4.572783238419723e-06, "epoch": 0.22941908140231262, "percentage": 22.94, "elapsed_time": "7:47:31", "remaining_time": "1 day, 2:10:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2491, "total_steps": 10853, "loss": 0.1687, "learning_rate": 4.572357244142151e-06, "epoch": 0.22951121757958262, "percentage": 22.95, "elapsed_time": "7:47:44", "remaining_time": "1 day, 2:10:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2492, "total_steps": 10853, "loss": 0.1661, "learning_rate": 4.5719310574459846e-06, "epoch": 0.22960335375685262, "percentage": 22.96, "elapsed_time": "7:47:55", "remaining_time": "1 day, 2:09:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2493, "total_steps": 10853, "loss": 0.161, "learning_rate": 4.5715046783707976e-06, "epoch": 0.22969548993412264, "percentage": 22.97, "elapsed_time": "7:48:05", "remaining_time": "1 day, 2:09:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2494, "total_steps": 10853, "loss": 0.1588, "learning_rate": 4.571078106956178e-06, "epoch": 0.22978762611139264, "percentage": 22.98, "elapsed_time": "7:48:17", "remaining_time": "1 day, 2:09:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2495, "total_steps": 10853, "loss": 0.1731, "learning_rate": 4.570651343241733e-06, "epoch": 0.22987976228866264, "percentage": 22.99, "elapsed_time": "7:48:28", "remaining_time": "1 day, 2:09:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2496, "total_steps": 10853, "loss": 0.179, "learning_rate": 4.570224387267089e-06, "epoch": 0.22997189846593266, "percentage": 23.0, "elapsed_time": "7:48:38", "remaining_time": "1 day, 2:09:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2497, "total_steps": 10853, "loss": 0.1831, "learning_rate": 4.569797239071887e-06, "epoch": 0.23006403464320266, "percentage": 23.01, "elapsed_time": "7:48:49", "remaining_time": "1 day, 2:08:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2498, "total_steps": 10853, "loss": 0.1741, "learning_rate": 4.569369898695789e-06, "epoch": 0.23015617082047266, "percentage": 23.02, "elapsed_time": "7:48:59", "remaining_time": "1 day, 2:08:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2499, "total_steps": 10853, "loss": 0.1623, "learning_rate": 4.568942366178473e-06, "epoch": 0.23024830699774265, "percentage": 23.03, "elapsed_time": "7:49:10", "remaining_time": "1 day, 2:08:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2500, "total_steps": 10853, "loss": 0.1647, "learning_rate": 4.568514641559636e-06, "epoch": 0.23034044317501268, "percentage": 23.04, "elapsed_time": "7:49:20", "remaining_time": "1 day, 2:08:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2500, "total_steps": 10853, "eval_loss": 0.16871164739131927, "epoch": 0.23034044317501268, "percentage": 23.04, "elapsed_time": "7:54:20", "remaining_time": "1 day, 2:24:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2501, "total_steps": 10853, "loss": 0.1741, "learning_rate": 4.5680867248789916e-06, "epoch": 0.23043257935228267, "percentage": 23.04, "elapsed_time": "7:54:32", "remaining_time": "1 day, 2:24:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2502, "total_steps": 10853, "loss": 0.1708, "learning_rate": 4.567658616176273e-06, "epoch": 0.23052471552955267, "percentage": 23.05, "elapsed_time": "7:54:44", "remaining_time": "1 day, 2:24:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2503, "total_steps": 10853, "loss": 0.1682, "learning_rate": 4.5672303154912275e-06, "epoch": 0.2306168517068227, "percentage": 23.06, "elapsed_time": "7:54:52", "remaining_time": "1 day, 2:24:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2504, "total_steps": 10853, "loss": 0.1666, "learning_rate": 4.566801822863626e-06, "epoch": 0.2307089878840927, "percentage": 23.07, "elapsed_time": "7:55:03", "remaining_time": "1 day, 2:23:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2505, "total_steps": 10853, "loss": 0.1619, "learning_rate": 4.566373138333253e-06, "epoch": 0.2308011240613627, "percentage": 23.08, "elapsed_time": "7:55:15", "remaining_time": "1 day, 2:23:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2506, "total_steps": 10853, "loss": 0.163, "learning_rate": 4.565944261939911e-06, "epoch": 0.23089326023863269, "percentage": 23.09, "elapsed_time": "7:55:26", "remaining_time": "1 day, 2:23:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2507, "total_steps": 10853, "loss": 0.1756, "learning_rate": 4.565515193723423e-06, "epoch": 0.2309853964159027, "percentage": 23.1, "elapsed_time": "7:55:36", "remaining_time": "1 day, 2:23:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2508, "total_steps": 10853, "loss": 0.1614, "learning_rate": 4.5650859337236256e-06, "epoch": 0.2310775325931727, "percentage": 23.11, "elapsed_time": "7:55:46", "remaining_time": "1 day, 2:23:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2509, "total_steps": 10853, "loss": 0.1733, "learning_rate": 4.564656481980378e-06, "epoch": 0.2311696687704427, "percentage": 23.12, "elapsed_time": "7:55:57", "remaining_time": "1 day, 2:22:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2510, "total_steps": 10853, "loss": 0.1586, "learning_rate": 4.564226838533553e-06, "epoch": 0.23126180494771273, "percentage": 23.13, "elapsed_time": "7:56:09", "remaining_time": "1 day, 2:22:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2511, "total_steps": 10853, "loss": 0.1673, "learning_rate": 4.563797003423045e-06, "epoch": 0.23135394112498273, "percentage": 23.14, "elapsed_time": "7:56:19", "remaining_time": "1 day, 2:22:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2512, "total_steps": 10853, "loss": 0.1761, "learning_rate": 4.563366976688762e-06, "epoch": 0.23144607730225272, "percentage": 23.15, "elapsed_time": "7:56:29", "remaining_time": "1 day, 2:22:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2513, "total_steps": 10853, "loss": 0.1637, "learning_rate": 4.562936758370634e-06, "epoch": 0.23153821347952275, "percentage": 23.15, "elapsed_time": "7:56:40", "remaining_time": "1 day, 2:21:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2514, "total_steps": 10853, "loss": 0.1925, "learning_rate": 4.5625063485086065e-06, "epoch": 0.23163034965679274, "percentage": 23.16, "elapsed_time": "7:56:51", "remaining_time": "1 day, 2:21:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2515, "total_steps": 10853, "loss": 0.1921, "learning_rate": 4.562075747142641e-06, "epoch": 0.23172248583406274, "percentage": 23.17, "elapsed_time": "7:57:03", "remaining_time": "1 day, 2:21:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2516, "total_steps": 10853, "loss": 0.1609, "learning_rate": 4.561644954312721e-06, "epoch": 0.23181462201133274, "percentage": 23.18, "elapsed_time": "7:57:14", "remaining_time": "1 day, 2:21:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2517, "total_steps": 10853, "loss": 0.1568, "learning_rate": 4.561213970058845e-06, "epoch": 0.23190675818860276, "percentage": 23.19, "elapsed_time": "7:57:24", "remaining_time": "1 day, 2:21:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2518, "total_steps": 10853, "loss": 0.1733, "learning_rate": 4.560782794421031e-06, "epoch": 0.23199889436587276, "percentage": 23.2, "elapsed_time": "7:57:35", "remaining_time": "1 day, 2:20:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2519, "total_steps": 10853, "loss": 0.1688, "learning_rate": 4.5603514274393125e-06, "epoch": 0.23209103054314276, "percentage": 23.21, "elapsed_time": "7:57:45", "remaining_time": "1 day, 2:20:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2520, "total_steps": 10853, "loss": 0.1526, "learning_rate": 4.559919869153742e-06, "epoch": 0.23218316672041278, "percentage": 23.22, "elapsed_time": "7:57:56", "remaining_time": "1 day, 2:20:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2521, "total_steps": 10853, "loss": 0.1625, "learning_rate": 4.559488119604389e-06, "epoch": 0.23227530289768278, "percentage": 23.23, "elapsed_time": "7:58:06", "remaining_time": "1 day, 2:20:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2522, "total_steps": 10853, "loss": 0.1769, "learning_rate": 4.5590561788313435e-06, "epoch": 0.23236743907495278, "percentage": 23.24, "elapsed_time": "7:58:18", "remaining_time": "1 day, 2:20:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2523, "total_steps": 10853, "loss": 0.1768, "learning_rate": 4.55862404687471e-06, "epoch": 0.23245957525222277, "percentage": 23.25, "elapsed_time": "7:58:30", "remaining_time": "1 day, 2:19:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2524, "total_steps": 10853, "loss": 0.1662, "learning_rate": 4.558191723774612e-06, "epoch": 0.2325517114294928, "percentage": 23.26, "elapsed_time": "7:58:42", "remaining_time": "1 day, 2:19:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2525, "total_steps": 10853, "loss": 0.1649, "learning_rate": 4.557759209571191e-06, "epoch": 0.2326438476067628, "percentage": 23.27, "elapsed_time": "7:58:53", "remaining_time": "1 day, 2:19:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2526, "total_steps": 10853, "loss": 0.1669, "learning_rate": 4.557326504304606e-06, "epoch": 0.2327359837840328, "percentage": 23.27, "elapsed_time": "7:59:04", "remaining_time": "1 day, 2:19:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2527, "total_steps": 10853, "loss": 0.1695, "learning_rate": 4.556893608015034e-06, "epoch": 0.23282811996130282, "percentage": 23.28, "elapsed_time": "7:59:16", "remaining_time": "1 day, 2:19:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2528, "total_steps": 10853, "loss": 0.1571, "learning_rate": 4.556460520742669e-06, "epoch": 0.2329202561385728, "percentage": 23.29, "elapsed_time": "7:59:25", "remaining_time": "1 day, 2:18:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2529, "total_steps": 10853, "loss": 0.1743, "learning_rate": 4.556027242527723e-06, "epoch": 0.2330123923158428, "percentage": 23.3, "elapsed_time": "7:59:36", "remaining_time": "1 day, 2:18:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2530, "total_steps": 10853, "loss": 0.1702, "learning_rate": 4.555593773410426e-06, "epoch": 0.23310452849311283, "percentage": 23.31, "elapsed_time": "7:59:46", "remaining_time": "1 day, 2:18:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2531, "total_steps": 10853, "loss": 0.1653, "learning_rate": 4.555160113431027e-06, "epoch": 0.23319666467038283, "percentage": 23.32, "elapsed_time": "7:59:55", "remaining_time": "1 day, 2:18:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2532, "total_steps": 10853, "loss": 0.1752, "learning_rate": 4.554726262629789e-06, "epoch": 0.23328880084765283, "percentage": 23.33, "elapsed_time": "8:00:06", "remaining_time": "1 day, 2:17:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2533, "total_steps": 10853, "loss": 0.1535, "learning_rate": 4.554292221046997e-06, "epoch": 0.23338093702492282, "percentage": 23.34, "elapsed_time": "8:00:15", "remaining_time": "1 day, 2:17:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2534, "total_steps": 10853, "loss": 0.1611, "learning_rate": 4.553857988722951e-06, "epoch": 0.23347307320219285, "percentage": 23.35, "elapsed_time": "8:00:27", "remaining_time": "1 day, 2:17:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2535, "total_steps": 10853, "loss": 0.1683, "learning_rate": 4.55342356569797e-06, "epoch": 0.23356520937946285, "percentage": 23.36, "elapsed_time": "8:00:37", "remaining_time": "1 day, 2:17:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2536, "total_steps": 10853, "loss": 0.17, "learning_rate": 4.5529889520123896e-06, "epoch": 0.23365734555673284, "percentage": 23.37, "elapsed_time": "8:00:48", "remaining_time": "1 day, 2:16:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2537, "total_steps": 10853, "loss": 0.1746, "learning_rate": 4.5525541477065644e-06, "epoch": 0.23374948173400287, "percentage": 23.38, "elapsed_time": "8:01:00", "remaining_time": "1 day, 2:16:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2538, "total_steps": 10853, "loss": 0.1606, "learning_rate": 4.552119152820866e-06, "epoch": 0.23384161791127286, "percentage": 23.39, "elapsed_time": "8:01:11", "remaining_time": "1 day, 2:16:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2539, "total_steps": 10853, "loss": 0.1692, "learning_rate": 4.551683967395683e-06, "epoch": 0.23393375408854286, "percentage": 23.39, "elapsed_time": "8:01:22", "remaining_time": "1 day, 2:16:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2540, "total_steps": 10853, "loss": 0.1649, "learning_rate": 4.5512485914714225e-06, "epoch": 0.23402589026581286, "percentage": 23.4, "elapsed_time": "8:01:33", "remaining_time": "1 day, 2:16:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2541, "total_steps": 10853, "loss": 0.165, "learning_rate": 4.55081302508851e-06, "epoch": 0.23411802644308288, "percentage": 23.41, "elapsed_time": "8:01:44", "remaining_time": "1 day, 2:15:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2542, "total_steps": 10853, "loss": 0.1698, "learning_rate": 4.550377268287387e-06, "epoch": 0.23421016262035288, "percentage": 23.42, "elapsed_time": "8:01:54", "remaining_time": "1 day, 2:15:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2543, "total_steps": 10853, "loss": 0.1714, "learning_rate": 4.549941321108514e-06, "epoch": 0.23430229879762288, "percentage": 23.43, "elapsed_time": "8:02:05", "remaining_time": "1 day, 2:15:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2544, "total_steps": 10853, "loss": 0.1849, "learning_rate": 4.549505183592368e-06, "epoch": 0.2343944349748929, "percentage": 23.44, "elapsed_time": "8:02:16", "remaining_time": "1 day, 2:15:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2545, "total_steps": 10853, "loss": 0.1526, "learning_rate": 4.549068855779447e-06, "epoch": 0.2344865711521629, "percentage": 23.45, "elapsed_time": "8:02:26", "remaining_time": "1 day, 2:14:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2546, "total_steps": 10853, "loss": 0.1765, "learning_rate": 4.5486323377102615e-06, "epoch": 0.2345787073294329, "percentage": 23.46, "elapsed_time": "8:02:37", "remaining_time": "1 day, 2:14:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2547, "total_steps": 10853, "loss": 0.1394, "learning_rate": 4.548195629425343e-06, "epoch": 0.23467084350670292, "percentage": 23.47, "elapsed_time": "8:02:48", "remaining_time": "1 day, 2:14:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2548, "total_steps": 10853, "loss": 0.1598, "learning_rate": 4.547758730965239e-06, "epoch": 0.23476297968397292, "percentage": 23.48, "elapsed_time": "8:02:59", "remaining_time": "1 day, 2:14:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2549, "total_steps": 10853, "loss": 0.1826, "learning_rate": 4.547321642370517e-06, "epoch": 0.2348551158612429, "percentage": 23.49, "elapsed_time": "8:03:09", "remaining_time": "1 day, 2:14:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2550, "total_steps": 10853, "loss": 0.1576, "learning_rate": 4.5468843636817605e-06, "epoch": 0.2349472520385129, "percentage": 23.5, "elapsed_time": "8:03:19", "remaining_time": "1 day, 2:13:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2551, "total_steps": 10853, "loss": 0.1722, "learning_rate": 4.54644689493957e-06, "epoch": 0.23503938821578294, "percentage": 23.51, "elapsed_time": "8:03:31", "remaining_time": "1 day, 2:13:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2552, "total_steps": 10853, "loss": 0.1463, "learning_rate": 4.546009236184565e-06, "epoch": 0.23513152439305293, "percentage": 23.51, "elapsed_time": "8:03:40", "remaining_time": "1 day, 2:13:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2553, "total_steps": 10853, "loss": 0.1688, "learning_rate": 4.545571387457382e-06, "epoch": 0.23522366057032293, "percentage": 23.52, "elapsed_time": "8:03:50", "remaining_time": "1 day, 2:13:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2554, "total_steps": 10853, "loss": 0.1758, "learning_rate": 4.545133348798677e-06, "epoch": 0.23531579674759295, "percentage": 23.53, "elapsed_time": "8:04:00", "remaining_time": "1 day, 2:12:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2555, "total_steps": 10853, "loss": 0.1713, "learning_rate": 4.54469512024912e-06, "epoch": 0.23540793292486295, "percentage": 23.54, "elapsed_time": "8:04:11", "remaining_time": "1 day, 2:12:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2556, "total_steps": 10853, "loss": 0.1625, "learning_rate": 4.5442567018494e-06, "epoch": 0.23550006910213295, "percentage": 23.55, "elapsed_time": "8:04:21", "remaining_time": "1 day, 2:12:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2557, "total_steps": 10853, "loss": 0.174, "learning_rate": 4.543818093640226e-06, "epoch": 0.23559220527940294, "percentage": 23.56, "elapsed_time": "8:04:32", "remaining_time": "1 day, 2:12:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2558, "total_steps": 10853, "loss": 0.1713, "learning_rate": 4.543379295662322e-06, "epoch": 0.23568434145667297, "percentage": 23.57, "elapsed_time": "8:04:44", "remaining_time": "1 day, 2:11:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2559, "total_steps": 10853, "loss": 0.1573, "learning_rate": 4.54294030795643e-06, "epoch": 0.23577647763394297, "percentage": 23.58, "elapsed_time": "8:04:55", "remaining_time": "1 day, 2:11:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2560, "total_steps": 10853, "loss": 0.1792, "learning_rate": 4.5425011305633106e-06, "epoch": 0.23586861381121296, "percentage": 23.59, "elapsed_time": "8:05:07", "remaining_time": "1 day, 2:11:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2561, "total_steps": 10853, "loss": 0.1756, "learning_rate": 4.542061763523742e-06, "epoch": 0.235960749988483, "percentage": 23.6, "elapsed_time": "8:05:18", "remaining_time": "1 day, 2:11:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2562, "total_steps": 10853, "loss": 0.1614, "learning_rate": 4.541622206878519e-06, "epoch": 0.23605288616575298, "percentage": 23.61, "elapsed_time": "8:05:28", "remaining_time": "1 day, 2:11:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2563, "total_steps": 10853, "loss": 0.1735, "learning_rate": 4.541182460668453e-06, "epoch": 0.23614502234302298, "percentage": 23.62, "elapsed_time": "8:05:40", "remaining_time": "1 day, 2:10:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2564, "total_steps": 10853, "loss": 0.1728, "learning_rate": 4.540742524934377e-06, "epoch": 0.236237158520293, "percentage": 23.62, "elapsed_time": "8:05:50", "remaining_time": "1 day, 2:10:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2565, "total_steps": 10853, "loss": 0.1706, "learning_rate": 4.540302399717138e-06, "epoch": 0.236329294697563, "percentage": 23.63, "elapsed_time": "8:06:00", "remaining_time": "1 day, 2:10:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2566, "total_steps": 10853, "loss": 0.162, "learning_rate": 4.5398620850576016e-06, "epoch": 0.236421430874833, "percentage": 23.64, "elapsed_time": "8:06:11", "remaining_time": "1 day, 2:10:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2567, "total_steps": 10853, "loss": 0.1562, "learning_rate": 4.53942158099665e-06, "epoch": 0.236513567052103, "percentage": 23.65, "elapsed_time": "8:06:22", "remaining_time": "1 day, 2:09:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2568, "total_steps": 10853, "loss": 0.1598, "learning_rate": 4.538980887575187e-06, "epoch": 0.23660570322937302, "percentage": 23.66, "elapsed_time": "8:06:32", "remaining_time": "1 day, 2:09:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2569, "total_steps": 10853, "loss": 0.155, "learning_rate": 4.538540004834128e-06, "epoch": 0.23669783940664302, "percentage": 23.67, "elapsed_time": "8:06:42", "remaining_time": "1 day, 2:09:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2570, "total_steps": 10853, "loss": 0.1525, "learning_rate": 4.53809893281441e-06, "epoch": 0.23678997558391301, "percentage": 23.68, "elapsed_time": "8:06:52", "remaining_time": "1 day, 2:09:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2571, "total_steps": 10853, "loss": 0.1646, "learning_rate": 4.537657671556987e-06, "epoch": 0.23688211176118304, "percentage": 23.69, "elapsed_time": "8:07:02", "remaining_time": "1 day, 2:08:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2572, "total_steps": 10853, "loss": 0.1807, "learning_rate": 4.5372162211028305e-06, "epoch": 0.23697424793845304, "percentage": 23.7, "elapsed_time": "8:07:11", "remaining_time": "1 day, 2:08:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2573, "total_steps": 10853, "loss": 0.1494, "learning_rate": 4.536774581492928e-06, "epoch": 0.23706638411572303, "percentage": 23.71, "elapsed_time": "8:07:23", "remaining_time": "1 day, 2:08:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2574, "total_steps": 10853, "loss": 0.1593, "learning_rate": 4.5363327527682855e-06, "epoch": 0.23715852029299303, "percentage": 23.72, "elapsed_time": "8:07:34", "remaining_time": "1 day, 2:08:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2575, "total_steps": 10853, "loss": 0.1704, "learning_rate": 4.535890734969929e-06, "epoch": 0.23725065647026305, "percentage": 23.73, "elapsed_time": "8:07:44", "remaining_time": "1 day, 2:07:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2576, "total_steps": 10853, "loss": 0.176, "learning_rate": 4.535448528138899e-06, "epoch": 0.23734279264753305, "percentage": 23.74, "elapsed_time": "8:07:56", "remaining_time": "1 day, 2:07:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2577, "total_steps": 10853, "loss": 0.1911, "learning_rate": 4.535006132316253e-06, "epoch": 0.23743492882480305, "percentage": 23.74, "elapsed_time": "8:08:08", "remaining_time": "1 day, 2:07:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2578, "total_steps": 10853, "loss": 0.1606, "learning_rate": 4.534563547543069e-06, "epoch": 0.23752706500207307, "percentage": 23.75, "elapsed_time": "8:08:19", "remaining_time": "1 day, 2:07:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2579, "total_steps": 10853, "loss": 0.1817, "learning_rate": 4.53412077386044e-06, "epoch": 0.23761920117934307, "percentage": 23.76, "elapsed_time": "8:08:29", "remaining_time": "1 day, 2:07:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2580, "total_steps": 10853, "loss": 0.1672, "learning_rate": 4.533677811309479e-06, "epoch": 0.23771133735661307, "percentage": 23.77, "elapsed_time": "8:08:40", "remaining_time": "1 day, 2:06:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2581, "total_steps": 10853, "loss": 0.1845, "learning_rate": 4.533234659931315e-06, "epoch": 0.2378034735338831, "percentage": 23.78, "elapsed_time": "8:08:49", "remaining_time": "1 day, 2:06:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2582, "total_steps": 10853, "loss": 0.1434, "learning_rate": 4.532791319767093e-06, "epoch": 0.2378956097111531, "percentage": 23.79, "elapsed_time": "8:09:00", "remaining_time": "1 day, 2:06:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2583, "total_steps": 10853, "loss": 0.1808, "learning_rate": 4.532347790857978e-06, "epoch": 0.23798774588842309, "percentage": 23.8, "elapsed_time": "8:09:11", "remaining_time": "1 day, 2:06:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2584, "total_steps": 10853, "loss": 0.1701, "learning_rate": 4.531904073245152e-06, "epoch": 0.23807988206569308, "percentage": 23.81, "elapsed_time": "8:09:21", "remaining_time": "1 day, 2:05:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2585, "total_steps": 10853, "loss": 0.1668, "learning_rate": 4.531460166969816e-06, "epoch": 0.2381720182429631, "percentage": 23.82, "elapsed_time": "8:09:31", "remaining_time": "1 day, 2:05:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2586, "total_steps": 10853, "loss": 0.1697, "learning_rate": 4.531016072073182e-06, "epoch": 0.2382641544202331, "percentage": 23.83, "elapsed_time": "8:09:42", "remaining_time": "1 day, 2:05:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2587, "total_steps": 10853, "loss": 0.166, "learning_rate": 4.530571788596489e-06, "epoch": 0.2383562905975031, "percentage": 23.84, "elapsed_time": "8:09:53", "remaining_time": "1 day, 2:05:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2588, "total_steps": 10853, "loss": 0.1775, "learning_rate": 4.530127316580986e-06, "epoch": 0.23844842677477313, "percentage": 23.85, "elapsed_time": "8:10:04", "remaining_time": "1 day, 2:05:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2589, "total_steps": 10853, "loss": 0.1493, "learning_rate": 4.5296826560679445e-06, "epoch": 0.23854056295204312, "percentage": 23.86, "elapsed_time": "8:10:14", "remaining_time": "1 day, 2:04:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2590, "total_steps": 10853, "loss": 0.1625, "learning_rate": 4.529237807098649e-06, "epoch": 0.23863269912931312, "percentage": 23.86, "elapsed_time": "8:10:26", "remaining_time": "1 day, 2:04:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2591, "total_steps": 10853, "loss": 0.1758, "learning_rate": 4.528792769714404e-06, "epoch": 0.23872483530658312, "percentage": 23.87, "elapsed_time": "8:10:37", "remaining_time": "1 day, 2:04:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2592, "total_steps": 10853, "loss": 0.1596, "learning_rate": 4.528347543956533e-06, "epoch": 0.23881697148385314, "percentage": 23.88, "elapsed_time": "8:10:48", "remaining_time": "1 day, 2:04:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2593, "total_steps": 10853, "loss": 0.1732, "learning_rate": 4.527902129866374e-06, "epoch": 0.23890910766112314, "percentage": 23.89, "elapsed_time": "8:10:59", "remaining_time": "1 day, 2:04:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2594, "total_steps": 10853, "loss": 0.1683, "learning_rate": 4.527456527485284e-06, "epoch": 0.23900124383839313, "percentage": 23.9, "elapsed_time": "8:11:11", "remaining_time": "1 day, 2:03:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2595, "total_steps": 10853, "loss": 0.1601, "learning_rate": 4.527010736854637e-06, "epoch": 0.23909338001566316, "percentage": 23.91, "elapsed_time": "8:11:22", "remaining_time": "1 day, 2:03:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2596, "total_steps": 10853, "loss": 0.1597, "learning_rate": 4.526564758015825e-06, "epoch": 0.23918551619293316, "percentage": 23.92, "elapsed_time": "8:11:33", "remaining_time": "1 day, 2:03:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2597, "total_steps": 10853, "loss": 0.1749, "learning_rate": 4.5261185910102575e-06, "epoch": 0.23927765237020315, "percentage": 23.93, "elapsed_time": "8:11:43", "remaining_time": "1 day, 2:03:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2598, "total_steps": 10853, "loss": 0.1757, "learning_rate": 4.525672235879361e-06, "epoch": 0.23936978854747318, "percentage": 23.94, "elapsed_time": "8:11:53", "remaining_time": "1 day, 2:02:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2599, "total_steps": 10853, "loss": 0.1733, "learning_rate": 4.5252256926645786e-06, "epoch": 0.23946192472474317, "percentage": 23.95, "elapsed_time": "8:12:05", "remaining_time": "1 day, 2:02:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2600, "total_steps": 10853, "loss": 0.1518, "learning_rate": 4.5247789614073725e-06, "epoch": 0.23955406090201317, "percentage": 23.96, "elapsed_time": "8:12:16", "remaining_time": "1 day, 2:02:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2601, "total_steps": 10853, "loss": 0.1598, "learning_rate": 4.524332042149223e-06, "epoch": 0.23964619707928317, "percentage": 23.97, "elapsed_time": "8:12:27", "remaining_time": "1 day, 2:02:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2602, "total_steps": 10853, "loss": 0.1536, "learning_rate": 4.523884934931624e-06, "epoch": 0.2397383332565532, "percentage": 23.97, "elapsed_time": "8:12:38", "remaining_time": "1 day, 2:02:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2603, "total_steps": 10853, "loss": 0.1558, "learning_rate": 4.523437639796092e-06, "epoch": 0.2398304694338232, "percentage": 23.98, "elapsed_time": "8:12:48", "remaining_time": "1 day, 2:01:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2604, "total_steps": 10853, "loss": 0.1696, "learning_rate": 4.522990156784157e-06, "epoch": 0.2399226056110932, "percentage": 23.99, "elapsed_time": "8:13:00", "remaining_time": "1 day, 2:01:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2605, "total_steps": 10853, "loss": 0.165, "learning_rate": 4.522542485937369e-06, "epoch": 0.2400147417883632, "percentage": 24.0, "elapsed_time": "8:13:11", "remaining_time": "1 day, 2:01:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2606, "total_steps": 10853, "loss": 0.1518, "learning_rate": 4.522094627297293e-06, "epoch": 0.2401068779656332, "percentage": 24.01, "elapsed_time": "8:13:22", "remaining_time": "1 day, 2:01:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2607, "total_steps": 10853, "loss": 0.1663, "learning_rate": 4.521646580905513e-06, "epoch": 0.2401990141429032, "percentage": 24.02, "elapsed_time": "8:13:32", "remaining_time": "1 day, 2:01:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2608, "total_steps": 10853, "loss": 0.156, "learning_rate": 4.521198346803631e-06, "epoch": 0.2402911503201732, "percentage": 24.03, "elapsed_time": "8:13:43", "remaining_time": "1 day, 2:00:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2609, "total_steps": 10853, "loss": 0.1607, "learning_rate": 4.520749925033264e-06, "epoch": 0.24038328649744323, "percentage": 24.04, "elapsed_time": "8:13:53", "remaining_time": "1 day, 2:00:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2610, "total_steps": 10853, "loss": 0.1725, "learning_rate": 4.52030131563605e-06, "epoch": 0.24047542267471322, "percentage": 24.05, "elapsed_time": "8:14:02", "remaining_time": "1 day, 2:00:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2611, "total_steps": 10853, "loss": 0.167, "learning_rate": 4.519852518653641e-06, "epoch": 0.24056755885198322, "percentage": 24.06, "elapsed_time": "8:14:13", "remaining_time": "1 day, 2:00:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2612, "total_steps": 10853, "loss": 0.1651, "learning_rate": 4.519403534127709e-06, "epoch": 0.24065969502925325, "percentage": 24.07, "elapsed_time": "8:14:24", "remaining_time": "1 day, 1:59:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2613, "total_steps": 10853, "loss": 0.1682, "learning_rate": 4.51895436209994e-06, "epoch": 0.24075183120652324, "percentage": 24.08, "elapsed_time": "8:14:36", "remaining_time": "1 day, 1:59:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2614, "total_steps": 10853, "loss": 0.1581, "learning_rate": 4.5185050026120425e-06, "epoch": 0.24084396738379324, "percentage": 24.09, "elapsed_time": "8:14:47", "remaining_time": "1 day, 1:59:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2615, "total_steps": 10853, "loss": 0.1607, "learning_rate": 4.5180554557057376e-06, "epoch": 0.24093610356106326, "percentage": 24.09, "elapsed_time": "8:14:59", "remaining_time": "1 day, 1:59:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2616, "total_steps": 10853, "loss": 0.1557, "learning_rate": 4.5176057214227665e-06, "epoch": 0.24102823973833326, "percentage": 24.1, "elapsed_time": "8:15:09", "remaining_time": "1 day, 1:59:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2617, "total_steps": 10853, "loss": 0.1594, "learning_rate": 4.517155799804888e-06, "epoch": 0.24112037591560326, "percentage": 24.11, "elapsed_time": "8:15:19", "remaining_time": "1 day, 1:58:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2618, "total_steps": 10853, "loss": 0.1746, "learning_rate": 4.516705690893874e-06, "epoch": 0.24121251209287325, "percentage": 24.12, "elapsed_time": "8:15:31", "remaining_time": "1 day, 1:58:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2619, "total_steps": 10853, "loss": 0.1655, "learning_rate": 4.516255394731522e-06, "epoch": 0.24130464827014328, "percentage": 24.13, "elapsed_time": "8:15:42", "remaining_time": "1 day, 1:58:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2620, "total_steps": 10853, "loss": 0.1604, "learning_rate": 4.515804911359639e-06, "epoch": 0.24139678444741328, "percentage": 24.14, "elapsed_time": "8:15:53", "remaining_time": "1 day, 1:58:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2621, "total_steps": 10853, "loss": 0.1666, "learning_rate": 4.5153542408200524e-06, "epoch": 0.24148892062468327, "percentage": 24.15, "elapsed_time": "8:16:03", "remaining_time": "1 day, 1:57:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2622, "total_steps": 10853, "loss": 0.1715, "learning_rate": 4.514903383154608e-06, "epoch": 0.2415810568019533, "percentage": 24.16, "elapsed_time": "8:16:14", "remaining_time": "1 day, 1:57:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2623, "total_steps": 10853, "loss": 0.1704, "learning_rate": 4.5144523384051675e-06, "epoch": 0.2416731929792233, "percentage": 24.17, "elapsed_time": "8:16:25", "remaining_time": "1 day, 1:57:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2624, "total_steps": 10853, "loss": 0.1673, "learning_rate": 4.514001106613611e-06, "epoch": 0.2417653291564933, "percentage": 24.18, "elapsed_time": "8:16:36", "remaining_time": "1 day, 1:57:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2625, "total_steps": 10853, "loss": 0.1598, "learning_rate": 4.513549687821834e-06, "epoch": 0.2418574653337633, "percentage": 24.19, "elapsed_time": "8:16:46", "remaining_time": "1 day, 1:57:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2626, "total_steps": 10853, "loss": 0.1796, "learning_rate": 4.513098082071753e-06, "epoch": 0.2419496015110333, "percentage": 24.2, "elapsed_time": "8:16:57", "remaining_time": "1 day, 1:56:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2627, "total_steps": 10853, "loss": 0.1737, "learning_rate": 4.512646289405298e-06, "epoch": 0.2420417376883033, "percentage": 24.21, "elapsed_time": "8:17:08", "remaining_time": "1 day, 1:56:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2628, "total_steps": 10853, "loss": 0.1727, "learning_rate": 4.5121943098644185e-06, "epoch": 0.2421338738655733, "percentage": 24.21, "elapsed_time": "8:17:18", "remaining_time": "1 day, 1:56:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2629, "total_steps": 10853, "loss": 0.1563, "learning_rate": 4.5117421434910805e-06, "epoch": 0.24222601004284333, "percentage": 24.22, "elapsed_time": "8:17:28", "remaining_time": "1 day, 1:56:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2630, "total_steps": 10853, "loss": 0.1795, "learning_rate": 4.511289790327268e-06, "epoch": 0.24231814622011333, "percentage": 24.23, "elapsed_time": "8:17:40", "remaining_time": "1 day, 1:56:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2631, "total_steps": 10853, "loss": 0.1802, "learning_rate": 4.510837250414982e-06, "epoch": 0.24241028239738333, "percentage": 24.24, "elapsed_time": "8:17:50", "remaining_time": "1 day, 1:55:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2632, "total_steps": 10853, "loss": 0.1824, "learning_rate": 4.5103845237962405e-06, "epoch": 0.24250241857465335, "percentage": 24.25, "elapsed_time": "8:18:00", "remaining_time": "1 day, 1:55:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2633, "total_steps": 10853, "loss": 0.1535, "learning_rate": 4.509931610513081e-06, "epoch": 0.24259455475192335, "percentage": 24.26, "elapsed_time": "8:18:10", "remaining_time": "1 day, 1:55:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2634, "total_steps": 10853, "loss": 0.162, "learning_rate": 4.509478510607553e-06, "epoch": 0.24268669092919334, "percentage": 24.27, "elapsed_time": "8:18:21", "remaining_time": "1 day, 1:55:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2635, "total_steps": 10853, "loss": 0.1488, "learning_rate": 4.509025224121732e-06, "epoch": 0.24277882710646334, "percentage": 24.28, "elapsed_time": "8:18:32", "remaining_time": "1 day, 1:54:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2636, "total_steps": 10853, "loss": 0.1832, "learning_rate": 4.5085717510977e-06, "epoch": 0.24287096328373337, "percentage": 24.29, "elapsed_time": "8:18:43", "remaining_time": "1 day, 1:54:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2637, "total_steps": 10853, "loss": 0.1578, "learning_rate": 4.508118091577566e-06, "epoch": 0.24296309946100336, "percentage": 24.3, "elapsed_time": "8:18:55", "remaining_time": "1 day, 1:54:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2638, "total_steps": 10853, "loss": 0.1661, "learning_rate": 4.507664245603451e-06, "epoch": 0.24305523563827336, "percentage": 24.31, "elapsed_time": "8:19:05", "remaining_time": "1 day, 1:54:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2639, "total_steps": 10853, "loss": 0.1695, "learning_rate": 4.507210213217495e-06, "epoch": 0.24314737181554338, "percentage": 24.32, "elapsed_time": "8:19:15", "remaining_time": "1 day, 1:53:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2640, "total_steps": 10853, "loss": 0.1803, "learning_rate": 4.506755994461853e-06, "epoch": 0.24323950799281338, "percentage": 24.33, "elapsed_time": "8:19:27", "remaining_time": "1 day, 1:53:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2641, "total_steps": 10853, "loss": 0.1754, "learning_rate": 4.506301589378703e-06, "epoch": 0.24333164417008338, "percentage": 24.33, "elapsed_time": "8:19:38", "remaining_time": "1 day, 1:53:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2642, "total_steps": 10853, "loss": 0.1608, "learning_rate": 4.5058469980102336e-06, "epoch": 0.24342378034735337, "percentage": 24.34, "elapsed_time": "8:19:49", "remaining_time": "1 day, 1:53:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2643, "total_steps": 10853, "loss": 0.1743, "learning_rate": 4.505392220398655e-06, "epoch": 0.2435159165246234, "percentage": 24.35, "elapsed_time": "8:20:01", "remaining_time": "1 day, 1:53:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2644, "total_steps": 10853, "loss": 0.1614, "learning_rate": 4.504937256586192e-06, "epoch": 0.2436080527018934, "percentage": 24.36, "elapsed_time": "8:20:12", "remaining_time": "1 day, 1:53:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2645, "total_steps": 10853, "loss": 0.18, "learning_rate": 4.50448210661509e-06, "epoch": 0.2437001888791634, "percentage": 24.37, "elapsed_time": "8:20:23", "remaining_time": "1 day, 1:52:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2646, "total_steps": 10853, "loss": 0.1625, "learning_rate": 4.504026770527607e-06, "epoch": 0.24379232505643342, "percentage": 24.38, "elapsed_time": "8:20:35", "remaining_time": "1 day, 1:52:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2647, "total_steps": 10853, "loss": 0.1644, "learning_rate": 4.503571248366024e-06, "epoch": 0.24388446123370341, "percentage": 24.39, "elapsed_time": "8:20:45", "remaining_time": "1 day, 1:52:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2648, "total_steps": 10853, "loss": 0.1766, "learning_rate": 4.503115540172636e-06, "epoch": 0.2439765974109734, "percentage": 24.4, "elapsed_time": "8:20:55", "remaining_time": "1 day, 1:52:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2649, "total_steps": 10853, "loss": 0.1517, "learning_rate": 4.502659645989753e-06, "epoch": 0.24406873358824344, "percentage": 24.41, "elapsed_time": "8:21:04", "remaining_time": "1 day, 1:51:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2650, "total_steps": 10853, "loss": 0.1548, "learning_rate": 4.502203565859706e-06, "epoch": 0.24416086976551343, "percentage": 24.42, "elapsed_time": "8:21:16", "remaining_time": "1 day, 1:51:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2651, "total_steps": 10853, "loss": 0.1769, "learning_rate": 4.501747299824843e-06, "epoch": 0.24425300594278343, "percentage": 24.43, "elapsed_time": "8:21:27", "remaining_time": "1 day, 1:51:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2652, "total_steps": 10853, "loss": 0.158, "learning_rate": 4.501290847927529e-06, "epoch": 0.24434514212005343, "percentage": 24.44, "elapsed_time": "8:21:38", "remaining_time": "1 day, 1:51:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2653, "total_steps": 10853, "loss": 0.1536, "learning_rate": 4.500834210210143e-06, "epoch": 0.24443727829732345, "percentage": 24.44, "elapsed_time": "8:21:47", "remaining_time": "1 day, 1:50:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2654, "total_steps": 10853, "loss": 0.1561, "learning_rate": 4.500377386715086e-06, "epoch": 0.24452941447459345, "percentage": 24.45, "elapsed_time": "8:21:59", "remaining_time": "1 day, 1:50:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2655, "total_steps": 10853, "loss": 0.1561, "learning_rate": 4.499920377484772e-06, "epoch": 0.24462155065186345, "percentage": 24.46, "elapsed_time": "8:22:11", "remaining_time": "1 day, 1:50:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2656, "total_steps": 10853, "loss": 0.1781, "learning_rate": 4.499463182561637e-06, "epoch": 0.24471368682913347, "percentage": 24.47, "elapsed_time": "8:22:22", "remaining_time": "1 day, 1:50:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2657, "total_steps": 10853, "loss": 0.163, "learning_rate": 4.49900580198813e-06, "epoch": 0.24480582300640347, "percentage": 24.48, "elapsed_time": "8:22:33", "remaining_time": "1 day, 1:50:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2658, "total_steps": 10853, "loss": 0.1552, "learning_rate": 4.498548235806719e-06, "epoch": 0.24489795918367346, "percentage": 24.49, "elapsed_time": "8:22:43", "remaining_time": "1 day, 1:49:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2659, "total_steps": 10853, "loss": 0.1552, "learning_rate": 4.4980904840598894e-06, "epoch": 0.24499009536094346, "percentage": 24.5, "elapsed_time": "8:22:53", "remaining_time": "1 day, 1:49:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2660, "total_steps": 10853, "loss": 0.1512, "learning_rate": 4.497632546790143e-06, "epoch": 0.24508223153821349, "percentage": 24.51, "elapsed_time": "8:23:03", "remaining_time": "1 day, 1:49:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2661, "total_steps": 10853, "loss": 0.1595, "learning_rate": 4.49717442404e-06, "epoch": 0.24517436771548348, "percentage": 24.52, "elapsed_time": "8:23:13", "remaining_time": "1 day, 1:49:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2662, "total_steps": 10853, "loss": 0.1717, "learning_rate": 4.496716115851996e-06, "epoch": 0.24526650389275348, "percentage": 24.53, "elapsed_time": "8:23:24", "remaining_time": "1 day, 1:48:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2663, "total_steps": 10853, "loss": 0.1615, "learning_rate": 4.496257622268687e-06, "epoch": 0.2453586400700235, "percentage": 24.54, "elapsed_time": "8:23:34", "remaining_time": "1 day, 1:48:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2664, "total_steps": 10853, "loss": 0.1579, "learning_rate": 4.495798943332642e-06, "epoch": 0.2454507762472935, "percentage": 24.55, "elapsed_time": "8:23:44", "remaining_time": "1 day, 1:48:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2665, "total_steps": 10853, "loss": 0.169, "learning_rate": 4.495340079086451e-06, "epoch": 0.2455429124245635, "percentage": 24.56, "elapsed_time": "8:23:55", "remaining_time": "1 day, 1:48:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2666, "total_steps": 10853, "loss": 0.1704, "learning_rate": 4.494881029572718e-06, "epoch": 0.24563504860183352, "percentage": 24.56, "elapsed_time": "8:24:06", "remaining_time": "1 day, 1:48:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2667, "total_steps": 10853, "loss": 0.1605, "learning_rate": 4.494421794834068e-06, "epoch": 0.24572718477910352, "percentage": 24.57, "elapsed_time": "8:24:17", "remaining_time": "1 day, 1:47:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2668, "total_steps": 10853, "loss": 0.1787, "learning_rate": 4.4939623749131385e-06, "epoch": 0.24581932095637352, "percentage": 24.58, "elapsed_time": "8:24:29", "remaining_time": "1 day, 1:47:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2669, "total_steps": 10853, "loss": 0.1645, "learning_rate": 4.493502769852589e-06, "epoch": 0.2459114571336435, "percentage": 24.59, "elapsed_time": "8:24:39", "remaining_time": "1 day, 1:47:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2670, "total_steps": 10853, "loss": 0.1706, "learning_rate": 4.493042979695092e-06, "epoch": 0.24600359331091354, "percentage": 24.6, "elapsed_time": "8:24:48", "remaining_time": "1 day, 1:47:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2671, "total_steps": 10853, "loss": 0.1632, "learning_rate": 4.4925830044833405e-06, "epoch": 0.24609572948818353, "percentage": 24.61, "elapsed_time": "8:24:59", "remaining_time": "1 day, 1:46:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2672, "total_steps": 10853, "loss": 0.1645, "learning_rate": 4.492122844260042e-06, "epoch": 0.24618786566545353, "percentage": 24.62, "elapsed_time": "8:25:09", "remaining_time": "1 day, 1:46:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2673, "total_steps": 10853, "loss": 0.1684, "learning_rate": 4.491662499067923e-06, "epoch": 0.24628000184272356, "percentage": 24.63, "elapsed_time": "8:25:19", "remaining_time": "1 day, 1:46:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2674, "total_steps": 10853, "loss": 0.1425, "learning_rate": 4.491201968949726e-06, "epoch": 0.24637213801999355, "percentage": 24.64, "elapsed_time": "8:25:29", "remaining_time": "1 day, 1:46:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2675, "total_steps": 10853, "loss": 0.1617, "learning_rate": 4.490741253948213e-06, "epoch": 0.24646427419726355, "percentage": 24.65, "elapsed_time": "8:25:40", "remaining_time": "1 day, 1:45:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2676, "total_steps": 10853, "loss": 0.161, "learning_rate": 4.49028035410616e-06, "epoch": 0.24655641037453357, "percentage": 24.66, "elapsed_time": "8:25:51", "remaining_time": "1 day, 1:45:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2677, "total_steps": 10853, "loss": 0.1646, "learning_rate": 4.489819269466362e-06, "epoch": 0.24664854655180357, "percentage": 24.67, "elapsed_time": "8:26:01", "remaining_time": "1 day, 1:45:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2678, "total_steps": 10853, "loss": 0.1591, "learning_rate": 4.489358000071631e-06, "epoch": 0.24674068272907357, "percentage": 24.68, "elapsed_time": "8:26:12", "remaining_time": "1 day, 1:45:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2679, "total_steps": 10853, "loss": 0.1642, "learning_rate": 4.488896545964795e-06, "epoch": 0.24683281890634357, "percentage": 24.68, "elapsed_time": "8:26:22", "remaining_time": "1 day, 1:45:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2680, "total_steps": 10853, "loss": 0.1506, "learning_rate": 4.4884349071887e-06, "epoch": 0.2469249550836136, "percentage": 24.69, "elapsed_time": "8:26:33", "remaining_time": "1 day, 1:44:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2681, "total_steps": 10853, "loss": 0.1668, "learning_rate": 4.487973083786211e-06, "epoch": 0.2470170912608836, "percentage": 24.7, "elapsed_time": "8:26:42", "remaining_time": "1 day, 1:44:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2682, "total_steps": 10853, "loss": 0.1731, "learning_rate": 4.4875110758002076e-06, "epoch": 0.24710922743815358, "percentage": 24.71, "elapsed_time": "8:26:52", "remaining_time": "1 day, 1:44:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2683, "total_steps": 10853, "loss": 0.162, "learning_rate": 4.487048883273586e-06, "epoch": 0.2472013636154236, "percentage": 24.72, "elapsed_time": "8:27:03", "remaining_time": "1 day, 1:44:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2684, "total_steps": 10853, "loss": 0.1656, "learning_rate": 4.486586506249262e-06, "epoch": 0.2472934997926936, "percentage": 24.73, "elapsed_time": "8:27:14", "remaining_time": "1 day, 1:43:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2685, "total_steps": 10853, "loss": 0.1649, "learning_rate": 4.486123944770166e-06, "epoch": 0.2473856359699636, "percentage": 24.74, "elapsed_time": "8:27:24", "remaining_time": "1 day, 1:43:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2686, "total_steps": 10853, "loss": 0.1773, "learning_rate": 4.48566119887925e-06, "epoch": 0.2474777721472336, "percentage": 24.75, "elapsed_time": "8:27:34", "remaining_time": "1 day, 1:43:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2687, "total_steps": 10853, "loss": 0.1567, "learning_rate": 4.4851982686194775e-06, "epoch": 0.24756990832450362, "percentage": 24.76, "elapsed_time": "8:27:45", "remaining_time": "1 day, 1:43:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2688, "total_steps": 10853, "loss": 0.1593, "learning_rate": 4.484735154033831e-06, "epoch": 0.24766204450177362, "percentage": 24.77, "elapsed_time": "8:27:55", "remaining_time": "1 day, 1:42:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2689, "total_steps": 10853, "loss": 0.1694, "learning_rate": 4.484271855165312e-06, "epoch": 0.24775418067904362, "percentage": 24.78, "elapsed_time": "8:28:07", "remaining_time": "1 day, 1:42:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2690, "total_steps": 10853, "loss": 0.1714, "learning_rate": 4.483808372056939e-06, "epoch": 0.24784631685631364, "percentage": 24.79, "elapsed_time": "8:28:19", "remaining_time": "1 day, 1:42:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2691, "total_steps": 10853, "loss": 0.1791, "learning_rate": 4.483344704751745e-06, "epoch": 0.24793845303358364, "percentage": 24.79, "elapsed_time": "8:28:30", "remaining_time": "1 day, 1:42:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2692, "total_steps": 10853, "loss": 0.1642, "learning_rate": 4.48288085329278e-06, "epoch": 0.24803058921085364, "percentage": 24.8, "elapsed_time": "8:28:41", "remaining_time": "1 day, 1:42:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2693, "total_steps": 10853, "loss": 0.1619, "learning_rate": 4.482416817723115e-06, "epoch": 0.24812272538812366, "percentage": 24.81, "elapsed_time": "8:28:52", "remaining_time": "1 day, 1:41:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2694, "total_steps": 10853, "loss": 0.1816, "learning_rate": 4.481952598085836e-06, "epoch": 0.24821486156539366, "percentage": 24.82, "elapsed_time": "8:29:03", "remaining_time": "1 day, 1:41:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2695, "total_steps": 10853, "loss": 0.1502, "learning_rate": 4.481488194424044e-06, "epoch": 0.24830699774266365, "percentage": 24.83, "elapsed_time": "8:29:14", "remaining_time": "1 day, 1:41:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2696, "total_steps": 10853, "loss": 0.1681, "learning_rate": 4.481023606780861e-06, "epoch": 0.24839913391993365, "percentage": 24.84, "elapsed_time": "8:29:25", "remaining_time": "1 day, 1:41:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2697, "total_steps": 10853, "loss": 0.1611, "learning_rate": 4.480558835199422e-06, "epoch": 0.24849127009720368, "percentage": 24.85, "elapsed_time": "8:29:37", "remaining_time": "1 day, 1:41:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2698, "total_steps": 10853, "loss": 0.1508, "learning_rate": 4.4800938797228825e-06, "epoch": 0.24858340627447367, "percentage": 24.86, "elapsed_time": "8:29:46", "remaining_time": "1 day, 1:40:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2699, "total_steps": 10853, "loss": 0.1424, "learning_rate": 4.479628740394412e-06, "epoch": 0.24867554245174367, "percentage": 24.87, "elapsed_time": "8:29:57", "remaining_time": "1 day, 1:40:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2700, "total_steps": 10853, "loss": 0.1557, "learning_rate": 4.4791634172572015e-06, "epoch": 0.2487676786290137, "percentage": 24.88, "elapsed_time": "8:30:07", "remaining_time": "1 day, 1:40:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2701, "total_steps": 10853, "loss": 0.1647, "learning_rate": 4.478697910354455e-06, "epoch": 0.2488598148062837, "percentage": 24.89, "elapsed_time": "8:30:18", "remaining_time": "1 day, 1:40:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2702, "total_steps": 10853, "loss": 0.1508, "learning_rate": 4.4782322197293935e-06, "epoch": 0.2489519509835537, "percentage": 24.9, "elapsed_time": "8:30:29", "remaining_time": "1 day, 1:39:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2703, "total_steps": 10853, "loss": 0.1669, "learning_rate": 4.477766345425257e-06, "epoch": 0.24904408716082369, "percentage": 24.91, "elapsed_time": "8:30:39", "remaining_time": "1 day, 1:39:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2704, "total_steps": 10853, "loss": 0.166, "learning_rate": 4.4773002874853035e-06, "epoch": 0.2491362233380937, "percentage": 24.91, "elapsed_time": "8:30:51", "remaining_time": "1 day, 1:39:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2705, "total_steps": 10853, "loss": 0.1692, "learning_rate": 4.476834045952805e-06, "epoch": 0.2492283595153637, "percentage": 24.92, "elapsed_time": "8:31:02", "remaining_time": "1 day, 1:39:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2706, "total_steps": 10853, "loss": 0.1678, "learning_rate": 4.476367620871053e-06, "epoch": 0.2493204956926337, "percentage": 24.93, "elapsed_time": "8:31:14", "remaining_time": "1 day, 1:39:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2707, "total_steps": 10853, "loss": 0.1719, "learning_rate": 4.475901012283354e-06, "epoch": 0.24941263186990373, "percentage": 24.94, "elapsed_time": "8:31:25", "remaining_time": "1 day, 1:38:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2708, "total_steps": 10853, "loss": 0.171, "learning_rate": 4.475434220233034e-06, "epoch": 0.24950476804717373, "percentage": 24.95, "elapsed_time": "8:31:35", "remaining_time": "1 day, 1:38:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2709, "total_steps": 10853, "loss": 0.1524, "learning_rate": 4.474967244763434e-06, "epoch": 0.24959690422444372, "percentage": 24.96, "elapsed_time": "8:31:46", "remaining_time": "1 day, 1:38:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2710, "total_steps": 10853, "loss": 0.1626, "learning_rate": 4.474500085917912e-06, "epoch": 0.24968904040171375, "percentage": 24.97, "elapsed_time": "8:31:57", "remaining_time": "1 day, 1:38:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2711, "total_steps": 10853, "loss": 0.1681, "learning_rate": 4.474032743739846e-06, "epoch": 0.24978117657898374, "percentage": 24.98, "elapsed_time": "8:32:08", "remaining_time": "1 day, 1:38:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2712, "total_steps": 10853, "loss": 0.1534, "learning_rate": 4.4735652182726265e-06, "epoch": 0.24987331275625374, "percentage": 24.99, "elapsed_time": "8:32:18", "remaining_time": "1 day, 1:37:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2713, "total_steps": 10853, "loss": 0.1629, "learning_rate": 4.473097509559664e-06, "epoch": 0.24996544893352374, "percentage": 25.0, "elapsed_time": "8:32:28", "remaining_time": "1 day, 1:37:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2714, "total_steps": 10853, "loss": 0.1634, "learning_rate": 4.472629617644385e-06, "epoch": 0.25005758511079373, "percentage": 25.01, "elapsed_time": "8:32:38", "remaining_time": "1 day, 1:37:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2715, "total_steps": 10853, "loss": 0.1465, "learning_rate": 4.472161542570234e-06, "epoch": 0.25014972128806373, "percentage": 25.02, "elapsed_time": "8:32:49", "remaining_time": "1 day, 1:37:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2716, "total_steps": 10853, "loss": 0.1885, "learning_rate": 4.4716932843806715e-06, "epoch": 0.2502418574653338, "percentage": 25.03, "elapsed_time": "8:33:01", "remaining_time": "1 day, 1:36:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2717, "total_steps": 10853, "loss": 0.1622, "learning_rate": 4.471224843119176e-06, "epoch": 0.2503339936426038, "percentage": 25.03, "elapsed_time": "8:33:11", "remaining_time": "1 day, 1:36:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2718, "total_steps": 10853, "loss": 0.1806, "learning_rate": 4.470756218829241e-06, "epoch": 0.2504261298198738, "percentage": 25.04, "elapsed_time": "8:33:21", "remaining_time": "1 day, 1:36:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2719, "total_steps": 10853, "loss": 0.1517, "learning_rate": 4.470287411554379e-06, "epoch": 0.2505182659971438, "percentage": 25.05, "elapsed_time": "8:33:31", "remaining_time": "1 day, 1:36:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2720, "total_steps": 10853, "loss": 0.1562, "learning_rate": 4.469818421338119e-06, "epoch": 0.25061040217441377, "percentage": 25.06, "elapsed_time": "8:33:44", "remaining_time": "1 day, 1:36:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2721, "total_steps": 10853, "loss": 0.1943, "learning_rate": 4.469349248224007e-06, "epoch": 0.25070253835168377, "percentage": 25.07, "elapsed_time": "8:33:56", "remaining_time": "1 day, 1:35:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2722, "total_steps": 10853, "loss": 0.155, "learning_rate": 4.468879892255604e-06, "epoch": 0.2507946745289538, "percentage": 25.08, "elapsed_time": "8:34:05", "remaining_time": "1 day, 1:35:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2723, "total_steps": 10853, "loss": 0.1684, "learning_rate": 4.4684103534764925e-06, "epoch": 0.2508868107062238, "percentage": 25.09, "elapsed_time": "8:34:16", "remaining_time": "1 day, 1:35:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2724, "total_steps": 10853, "loss": 0.1643, "learning_rate": 4.467940631930267e-06, "epoch": 0.2509789468834938, "percentage": 25.1, "elapsed_time": "8:34:26", "remaining_time": "1 day, 1:35:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2725, "total_steps": 10853, "loss": 0.161, "learning_rate": 4.467470727660543e-06, "epoch": 0.2510710830607638, "percentage": 25.11, "elapsed_time": "8:34:37", "remaining_time": "1 day, 1:35:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2726, "total_steps": 10853, "loss": 0.1657, "learning_rate": 4.467000640710949e-06, "epoch": 0.2511632192380338, "percentage": 25.12, "elapsed_time": "8:34:49", "remaining_time": "1 day, 1:34:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2727, "total_steps": 10853, "loss": 0.1627, "learning_rate": 4.466530371125135e-06, "epoch": 0.2512553554153038, "percentage": 25.13, "elapsed_time": "8:34:59", "remaining_time": "1 day, 1:34:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2728, "total_steps": 10853, "loss": 0.1748, "learning_rate": 4.4660599189467634e-06, "epoch": 0.2513474915925738, "percentage": 25.14, "elapsed_time": "8:35:10", "remaining_time": "1 day, 1:34:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2729, "total_steps": 10853, "loss": 0.1823, "learning_rate": 4.465589284219517e-06, "epoch": 0.25143962776984385, "percentage": 25.15, "elapsed_time": "8:35:21", "remaining_time": "1 day, 1:34:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2730, "total_steps": 10853, "loss": 0.1749, "learning_rate": 4.465118466987094e-06, "epoch": 0.25153176394711385, "percentage": 25.15, "elapsed_time": "8:35:33", "remaining_time": "1 day, 1:34:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2731, "total_steps": 10853, "loss": 0.1688, "learning_rate": 4.4646474672932105e-06, "epoch": 0.25162390012438385, "percentage": 25.16, "elapsed_time": "8:35:44", "remaining_time": "1 day, 1:33:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2732, "total_steps": 10853, "loss": 0.1707, "learning_rate": 4.464176285181597e-06, "epoch": 0.25171603630165384, "percentage": 25.17, "elapsed_time": "8:35:55", "remaining_time": "1 day, 1:33:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2733, "total_steps": 10853, "loss": 0.1664, "learning_rate": 4.4637049206960055e-06, "epoch": 0.25180817247892384, "percentage": 25.18, "elapsed_time": "8:36:06", "remaining_time": "1 day, 1:33:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2734, "total_steps": 10853, "loss": 0.1636, "learning_rate": 4.4632333738802e-06, "epoch": 0.25190030865619384, "percentage": 25.19, "elapsed_time": "8:36:17", "remaining_time": "1 day, 1:33:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2735, "total_steps": 10853, "loss": 0.1619, "learning_rate": 4.462761644777964e-06, "epoch": 0.25199244483346384, "percentage": 25.2, "elapsed_time": "8:36:27", "remaining_time": "1 day, 1:32:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2736, "total_steps": 10853, "loss": 0.1643, "learning_rate": 4.4622897334330985e-06, "epoch": 0.2520845810107339, "percentage": 25.21, "elapsed_time": "8:36:39", "remaining_time": "1 day, 1:32:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2737, "total_steps": 10853, "loss": 0.1621, "learning_rate": 4.4618176398894205e-06, "epoch": 0.2521767171880039, "percentage": 25.22, "elapsed_time": "8:36:51", "remaining_time": "1 day, 1:32:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2738, "total_steps": 10853, "loss": 0.169, "learning_rate": 4.4613453641907634e-06, "epoch": 0.2522688533652739, "percentage": 25.23, "elapsed_time": "8:37:02", "remaining_time": "1 day, 1:32:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2739, "total_steps": 10853, "loss": 0.1667, "learning_rate": 4.460872906380977e-06, "epoch": 0.2523609895425439, "percentage": 25.24, "elapsed_time": "8:37:11", "remaining_time": "1 day, 1:32:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2740, "total_steps": 10853, "loss": 0.1788, "learning_rate": 4.460400266503932e-06, "epoch": 0.2524531257198139, "percentage": 25.25, "elapsed_time": "8:37:21", "remaining_time": "1 day, 1:31:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2741, "total_steps": 10853, "loss": 0.1634, "learning_rate": 4.4599274446035104e-06, "epoch": 0.2525452618970839, "percentage": 25.26, "elapsed_time": "8:37:33", "remaining_time": "1 day, 1:31:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2742, "total_steps": 10853, "loss": 0.1674, "learning_rate": 4.459454440723614e-06, "epoch": 0.25263739807435387, "percentage": 25.26, "elapsed_time": "8:37:45", "remaining_time": "1 day, 1:31:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2743, "total_steps": 10853, "loss": 0.1754, "learning_rate": 4.4589812549081624e-06, "epoch": 0.2527295342516239, "percentage": 25.27, "elapsed_time": "8:37:55", "remaining_time": "1 day, 1:31:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2744, "total_steps": 10853, "loss": 0.1622, "learning_rate": 4.458507887201091e-06, "epoch": 0.2528216704288939, "percentage": 25.28, "elapsed_time": "8:38:06", "remaining_time": "1 day, 1:31:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2745, "total_steps": 10853, "loss": 0.1717, "learning_rate": 4.458034337646351e-06, "epoch": 0.2529138066061639, "percentage": 25.29, "elapsed_time": "8:38:17", "remaining_time": "1 day, 1:30:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2746, "total_steps": 10853, "loss": 0.1591, "learning_rate": 4.4575606062879115e-06, "epoch": 0.2530059427834339, "percentage": 25.3, "elapsed_time": "8:38:26", "remaining_time": "1 day, 1:30:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2747, "total_steps": 10853, "loss": 0.167, "learning_rate": 4.45708669316976e-06, "epoch": 0.2530980789607039, "percentage": 25.31, "elapsed_time": "8:38:36", "remaining_time": "1 day, 1:30:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2748, "total_steps": 10853, "loss": 0.1684, "learning_rate": 4.456612598335898e-06, "epoch": 0.2531902151379739, "percentage": 25.32, "elapsed_time": "8:38:48", "remaining_time": "1 day, 1:30:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2749, "total_steps": 10853, "loss": 0.1448, "learning_rate": 4.4561383218303455e-06, "epoch": 0.2532823513152439, "percentage": 25.33, "elapsed_time": "8:38:59", "remaining_time": "1 day, 1:29:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2750, "total_steps": 10853, "loss": 0.1796, "learning_rate": 4.45566386369714e-06, "epoch": 0.25337448749251396, "percentage": 25.34, "elapsed_time": "8:39:09", "remaining_time": "1 day, 1:29:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2751, "total_steps": 10853, "loss": 0.1666, "learning_rate": 4.455189223980333e-06, "epoch": 0.25346662366978395, "percentage": 25.35, "elapsed_time": "8:39:21", "remaining_time": "1 day, 1:29:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2752, "total_steps": 10853, "loss": 0.1672, "learning_rate": 4.454714402723997e-06, "epoch": 0.25355875984705395, "percentage": 25.36, "elapsed_time": "8:39:31", "remaining_time": "1 day, 1:29:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2753, "total_steps": 10853, "loss": 0.1749, "learning_rate": 4.4542393999722184e-06, "epoch": 0.25365089602432395, "percentage": 25.37, "elapsed_time": "8:39:44", "remaining_time": "1 day, 1:29:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2754, "total_steps": 10853, "loss": 0.1617, "learning_rate": 4.453764215769101e-06, "epoch": 0.25374303220159394, "percentage": 25.38, "elapsed_time": "8:39:56", "remaining_time": "1 day, 1:29:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2755, "total_steps": 10853, "loss": 0.1691, "learning_rate": 4.4532888501587655e-06, "epoch": 0.25383516837886394, "percentage": 25.38, "elapsed_time": "8:40:07", "remaining_time": "1 day, 1:28:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2756, "total_steps": 10853, "loss": 0.1628, "learning_rate": 4.452813303185351e-06, "epoch": 0.253927304556134, "percentage": 25.39, "elapsed_time": "8:40:15", "remaining_time": "1 day, 1:28:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2757, "total_steps": 10853, "loss": 0.1602, "learning_rate": 4.452337574893011e-06, "epoch": 0.254019440733404, "percentage": 25.4, "elapsed_time": "8:40:25", "remaining_time": "1 day, 1:28:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2758, "total_steps": 10853, "loss": 0.1473, "learning_rate": 4.451861665325916e-06, "epoch": 0.254111576910674, "percentage": 25.41, "elapsed_time": "8:40:34", "remaining_time": "1 day, 1:27:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2759, "total_steps": 10853, "loss": 0.1511, "learning_rate": 4.451385574528256e-06, "epoch": 0.254203713087944, "percentage": 25.42, "elapsed_time": "8:40:46", "remaining_time": "1 day, 1:27:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2760, "total_steps": 10853, "loss": 0.1645, "learning_rate": 4.450909302544235e-06, "epoch": 0.254295849265214, "percentage": 25.43, "elapsed_time": "8:40:57", "remaining_time": "1 day, 1:27:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2761, "total_steps": 10853, "loss": 0.1698, "learning_rate": 4.450432849418076e-06, "epoch": 0.254387985442484, "percentage": 25.44, "elapsed_time": "8:41:08", "remaining_time": "1 day, 1:27:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2762, "total_steps": 10853, "loss": 0.1733, "learning_rate": 4.449956215194017e-06, "epoch": 0.254480121619754, "percentage": 25.45, "elapsed_time": "8:41:18", "remaining_time": "1 day, 1:27:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2763, "total_steps": 10853, "loss": 0.1485, "learning_rate": 4.4494793999163125e-06, "epoch": 0.254572257797024, "percentage": 25.46, "elapsed_time": "8:41:29", "remaining_time": "1 day, 1:26:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2764, "total_steps": 10853, "loss": 0.1715, "learning_rate": 4.449002403629237e-06, "epoch": 0.254664393974294, "percentage": 25.47, "elapsed_time": "8:41:42", "remaining_time": "1 day, 1:26:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2765, "total_steps": 10853, "loss": 0.1599, "learning_rate": 4.448525226377078e-06, "epoch": 0.254756530151564, "percentage": 25.48, "elapsed_time": "8:41:52", "remaining_time": "1 day, 1:26:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2766, "total_steps": 10853, "loss": 0.1663, "learning_rate": 4.448047868204143e-06, "epoch": 0.254848666328834, "percentage": 25.49, "elapsed_time": "8:42:03", "remaining_time": "1 day, 1:26:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2767, "total_steps": 10853, "loss": 0.159, "learning_rate": 4.447570329154752e-06, "epoch": 0.254940802506104, "percentage": 25.5, "elapsed_time": "8:42:13", "remaining_time": "1 day, 1:26:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2768, "total_steps": 10853, "loss": 0.1672, "learning_rate": 4.447092609273248e-06, "epoch": 0.255032938683374, "percentage": 25.5, "elapsed_time": "8:42:25", "remaining_time": "1 day, 1:25:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2769, "total_steps": 10853, "loss": 0.175, "learning_rate": 4.446614708603985e-06, "epoch": 0.255125074860644, "percentage": 25.51, "elapsed_time": "8:42:36", "remaining_time": "1 day, 1:25:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2770, "total_steps": 10853, "loss": 0.1688, "learning_rate": 4.446136627191337e-06, "epoch": 0.25521721103791406, "percentage": 25.52, "elapsed_time": "8:42:45", "remaining_time": "1 day, 1:25:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2771, "total_steps": 10853, "loss": 0.1548, "learning_rate": 4.445658365079693e-06, "epoch": 0.25530934721518406, "percentage": 25.53, "elapsed_time": "8:42:56", "remaining_time": "1 day, 1:25:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2772, "total_steps": 10853, "loss": 0.1588, "learning_rate": 4.4451799223134615e-06, "epoch": 0.25540148339245405, "percentage": 25.54, "elapsed_time": "8:43:06", "remaining_time": "1 day, 1:24:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2773, "total_steps": 10853, "loss": 0.1647, "learning_rate": 4.444701298937064e-06, "epoch": 0.25549361956972405, "percentage": 25.55, "elapsed_time": "8:43:17", "remaining_time": "1 day, 1:24:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2774, "total_steps": 10853, "loss": 0.1607, "learning_rate": 4.444222494994942e-06, "epoch": 0.25558575574699405, "percentage": 25.56, "elapsed_time": "8:43:28", "remaining_time": "1 day, 1:24:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2775, "total_steps": 10853, "loss": 0.1581, "learning_rate": 4.443743510531552e-06, "epoch": 0.25567789192426404, "percentage": 25.57, "elapsed_time": "8:43:38", "remaining_time": "1 day, 1:24:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2776, "total_steps": 10853, "loss": 0.1602, "learning_rate": 4.443264345591368e-06, "epoch": 0.25577002810153404, "percentage": 25.58, "elapsed_time": "8:43:49", "remaining_time": "1 day, 1:24:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2777, "total_steps": 10853, "loss": 0.1669, "learning_rate": 4.442785000218881e-06, "epoch": 0.2558621642788041, "percentage": 25.59, "elapsed_time": "8:44:01", "remaining_time": "1 day, 1:23:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2778, "total_steps": 10853, "loss": 0.1598, "learning_rate": 4.442305474458596e-06, "epoch": 0.2559543004560741, "percentage": 25.6, "elapsed_time": "8:44:10", "remaining_time": "1 day, 1:23:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2779, "total_steps": 10853, "loss": 0.1537, "learning_rate": 4.4418257683550405e-06, "epoch": 0.2560464366333441, "percentage": 25.61, "elapsed_time": "8:44:23", "remaining_time": "1 day, 1:23:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2780, "total_steps": 10853, "loss": 0.169, "learning_rate": 4.441345881952752e-06, "epoch": 0.2561385728106141, "percentage": 25.62, "elapsed_time": "8:44:34", "remaining_time": "1 day, 1:23:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2781, "total_steps": 10853, "loss": 0.1769, "learning_rate": 4.44086581529629e-06, "epoch": 0.2562307089878841, "percentage": 25.62, "elapsed_time": "8:44:44", "remaining_time": "1 day, 1:23:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2782, "total_steps": 10853, "loss": 0.1544, "learning_rate": 4.440385568430228e-06, "epoch": 0.2563228451651541, "percentage": 25.63, "elapsed_time": "8:44:54", "remaining_time": "1 day, 1:22:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2783, "total_steps": 10853, "loss": 0.1797, "learning_rate": 4.439905141399157e-06, "epoch": 0.2564149813424241, "percentage": 25.64, "elapsed_time": "8:45:04", "remaining_time": "1 day, 1:22:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2784, "total_steps": 10853, "loss": 0.162, "learning_rate": 4.439424534247686e-06, "epoch": 0.25650711751969413, "percentage": 25.65, "elapsed_time": "8:45:14", "remaining_time": "1 day, 1:22:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2785, "total_steps": 10853, "loss": 0.1606, "learning_rate": 4.438943747020437e-06, "epoch": 0.2565992536969641, "percentage": 25.66, "elapsed_time": "8:45:25", "remaining_time": "1 day, 1:22:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2786, "total_steps": 10853, "loss": 0.1589, "learning_rate": 4.438462779762052e-06, "epoch": 0.2566913898742341, "percentage": 25.67, "elapsed_time": "8:45:34", "remaining_time": "1 day, 1:21:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2787, "total_steps": 10853, "loss": 0.1691, "learning_rate": 4.437981632517191e-06, "epoch": 0.2567835260515041, "percentage": 25.68, "elapsed_time": "8:45:45", "remaining_time": "1 day, 1:21:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2788, "total_steps": 10853, "loss": 0.1627, "learning_rate": 4.437500305330526e-06, "epoch": 0.2568756622287741, "percentage": 25.69, "elapsed_time": "8:45:55", "remaining_time": "1 day, 1:21:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2789, "total_steps": 10853, "loss": 0.1533, "learning_rate": 4.437018798246749e-06, "epoch": 0.2569677984060441, "percentage": 25.7, "elapsed_time": "8:46:05", "remaining_time": "1 day, 1:21:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2790, "total_steps": 10853, "loss": 0.1806, "learning_rate": 4.436537111310568e-06, "epoch": 0.25705993458331416, "percentage": 25.71, "elapsed_time": "8:46:17", "remaining_time": "1 day, 1:20:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2791, "total_steps": 10853, "loss": 0.1585, "learning_rate": 4.436055244566708e-06, "epoch": 0.25715207076058416, "percentage": 25.72, "elapsed_time": "8:46:27", "remaining_time": "1 day, 1:20:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2792, "total_steps": 10853, "loss": 0.1579, "learning_rate": 4.4355731980599105e-06, "epoch": 0.25724420693785416, "percentage": 25.73, "elapsed_time": "8:46:38", "remaining_time": "1 day, 1:20:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2793, "total_steps": 10853, "loss": 0.1709, "learning_rate": 4.435090971834933e-06, "epoch": 0.25733634311512416, "percentage": 25.73, "elapsed_time": "8:46:48", "remaining_time": "1 day, 1:20:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2794, "total_steps": 10853, "loss": 0.1718, "learning_rate": 4.43460856593655e-06, "epoch": 0.25742847929239415, "percentage": 25.74, "elapsed_time": "8:46:59", "remaining_time": "1 day, 1:20:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2795, "total_steps": 10853, "loss": 0.1562, "learning_rate": 4.434125980409553e-06, "epoch": 0.25752061546966415, "percentage": 25.75, "elapsed_time": "8:47:09", "remaining_time": "1 day, 1:19:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2796, "total_steps": 10853, "loss": 0.1577, "learning_rate": 4.433643215298753e-06, "epoch": 0.25761275164693415, "percentage": 25.76, "elapsed_time": "8:47:20", "remaining_time": "1 day, 1:19:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2797, "total_steps": 10853, "loss": 0.1613, "learning_rate": 4.433160270648971e-06, "epoch": 0.2577048878242042, "percentage": 25.77, "elapsed_time": "8:47:31", "remaining_time": "1 day, 1:19:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2798, "total_steps": 10853, "loss": 0.1643, "learning_rate": 4.432677146505049e-06, "epoch": 0.2577970240014742, "percentage": 25.78, "elapsed_time": "8:47:42", "remaining_time": "1 day, 1:19:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2799, "total_steps": 10853, "loss": 0.1807, "learning_rate": 4.432193842911846e-06, "epoch": 0.2578891601787442, "percentage": 25.79, "elapsed_time": "8:47:52", "remaining_time": "1 day, 1:18:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2800, "total_steps": 10853, "loss": 0.1653, "learning_rate": 4.431710359914238e-06, "epoch": 0.2579812963560142, "percentage": 25.8, "elapsed_time": "8:48:03", "remaining_time": "1 day, 1:18:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2801, "total_steps": 10853, "loss": 0.1608, "learning_rate": 4.4312266975571145e-06, "epoch": 0.2580734325332842, "percentage": 25.81, "elapsed_time": "8:48:14", "remaining_time": "1 day, 1:18:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2802, "total_steps": 10853, "loss": 0.1595, "learning_rate": 4.430742855885384e-06, "epoch": 0.2581655687105542, "percentage": 25.82, "elapsed_time": "8:48:24", "remaining_time": "1 day, 1:18:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2803, "total_steps": 10853, "loss": 0.1435, "learning_rate": 4.430258834943973e-06, "epoch": 0.2582577048878242, "percentage": 25.83, "elapsed_time": "8:48:35", "remaining_time": "1 day, 1:18:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2804, "total_steps": 10853, "loss": 0.1708, "learning_rate": 4.429774634777819e-06, "epoch": 0.25834984106509423, "percentage": 25.84, "elapsed_time": "8:48:47", "remaining_time": "1 day, 1:17:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2805, "total_steps": 10853, "loss": 0.1548, "learning_rate": 4.429290255431884e-06, "epoch": 0.25844197724236423, "percentage": 25.85, "elapsed_time": "8:48:59", "remaining_time": "1 day, 1:17:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2806, "total_steps": 10853, "loss": 0.1691, "learning_rate": 4.428805696951141e-06, "epoch": 0.2585341134196342, "percentage": 25.85, "elapsed_time": "8:49:13", "remaining_time": "1 day, 1:17:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2807, "total_steps": 10853, "loss": 0.1684, "learning_rate": 4.428320959380581e-06, "epoch": 0.2586262495969042, "percentage": 25.86, "elapsed_time": "8:49:23", "remaining_time": "1 day, 1:17:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2808, "total_steps": 10853, "loss": 0.1448, "learning_rate": 4.427836042765213e-06, "epoch": 0.2587183857741742, "percentage": 25.87, "elapsed_time": "8:49:33", "remaining_time": "1 day, 1:17:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2809, "total_steps": 10853, "loss": 0.148, "learning_rate": 4.4273509471500606e-06, "epoch": 0.2588105219514442, "percentage": 25.88, "elapsed_time": "8:49:45", "remaining_time": "1 day, 1:17:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2810, "total_steps": 10853, "loss": 0.1506, "learning_rate": 4.426865672580166e-06, "epoch": 0.2589026581287142, "percentage": 25.89, "elapsed_time": "8:49:55", "remaining_time": "1 day, 1:16:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2811, "total_steps": 10853, "loss": 0.1531, "learning_rate": 4.426380219100585e-06, "epoch": 0.25899479430598427, "percentage": 25.9, "elapsed_time": "8:50:06", "remaining_time": "1 day, 1:16:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2812, "total_steps": 10853, "loss": 0.196, "learning_rate": 4.425894586756394e-06, "epoch": 0.25908693048325426, "percentage": 25.91, "elapsed_time": "8:50:18", "remaining_time": "1 day, 1:16:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2813, "total_steps": 10853, "loss": 0.1574, "learning_rate": 4.425408775592684e-06, "epoch": 0.25917906666052426, "percentage": 25.92, "elapsed_time": "8:50:29", "remaining_time": "1 day, 1:16:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2814, "total_steps": 10853, "loss": 0.1557, "learning_rate": 4.424922785654561e-06, "epoch": 0.25927120283779426, "percentage": 25.93, "elapsed_time": "8:50:40", "remaining_time": "1 day, 1:16:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2815, "total_steps": 10853, "loss": 0.1534, "learning_rate": 4.424436616987151e-06, "epoch": 0.25936333901506425, "percentage": 25.94, "elapsed_time": "8:50:51", "remaining_time": "1 day, 1:15:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2816, "total_steps": 10853, "loss": 0.1722, "learning_rate": 4.423950269635594e-06, "epoch": 0.25945547519233425, "percentage": 25.95, "elapsed_time": "8:51:01", "remaining_time": "1 day, 1:15:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2817, "total_steps": 10853, "loss": 0.1667, "learning_rate": 4.4234637436450465e-06, "epoch": 0.25954761136960425, "percentage": 25.96, "elapsed_time": "8:51:12", "remaining_time": "1 day, 1:15:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2818, "total_steps": 10853, "loss": 0.1551, "learning_rate": 4.422977039060684e-06, "epoch": 0.2596397475468743, "percentage": 25.97, "elapsed_time": "8:51:23", "remaining_time": "1 day, 1:15:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2819, "total_steps": 10853, "loss": 0.1547, "learning_rate": 4.422490155927696e-06, "epoch": 0.2597318837241443, "percentage": 25.97, "elapsed_time": "8:51:34", "remaining_time": "1 day, 1:14:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2820, "total_steps": 10853, "loss": 0.1553, "learning_rate": 4.422003094291291e-06, "epoch": 0.2598240199014143, "percentage": 25.98, "elapsed_time": "8:51:45", "remaining_time": "1 day, 1:14:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2821, "total_steps": 10853, "loss": 0.1421, "learning_rate": 4.421515854196692e-06, "epoch": 0.2599161560786843, "percentage": 25.99, "elapsed_time": "8:51:55", "remaining_time": "1 day, 1:14:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2822, "total_steps": 10853, "loss": 0.1739, "learning_rate": 4.421028435689138e-06, "epoch": 0.2600082922559543, "percentage": 26.0, "elapsed_time": "8:52:05", "remaining_time": "1 day, 1:14:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2823, "total_steps": 10853, "loss": 0.1726, "learning_rate": 4.420540838813887e-06, "epoch": 0.2601004284332243, "percentage": 26.01, "elapsed_time": "8:52:16", "remaining_time": "1 day, 1:14:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2824, "total_steps": 10853, "loss": 0.1597, "learning_rate": 4.420053063616214e-06, "epoch": 0.26019256461049434, "percentage": 26.02, "elapsed_time": "8:52:26", "remaining_time": "1 day, 1:13:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2825, "total_steps": 10853, "loss": 0.1669, "learning_rate": 4.419565110141406e-06, "epoch": 0.26028470078776433, "percentage": 26.03, "elapsed_time": "8:52:38", "remaining_time": "1 day, 1:13:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2826, "total_steps": 10853, "loss": 0.1587, "learning_rate": 4.419076978434771e-06, "epoch": 0.26037683696503433, "percentage": 26.04, "elapsed_time": "8:52:49", "remaining_time": "1 day, 1:13:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2827, "total_steps": 10853, "loss": 0.1496, "learning_rate": 4.418588668541632e-06, "epoch": 0.2604689731423043, "percentage": 26.05, "elapsed_time": "8:53:00", "remaining_time": "1 day, 1:13:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2828, "total_steps": 10853, "loss": 0.1612, "learning_rate": 4.41810018050733e-06, "epoch": 0.2605611093195743, "percentage": 26.06, "elapsed_time": "8:53:10", "remaining_time": "1 day, 1:13:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2829, "total_steps": 10853, "loss": 0.1541, "learning_rate": 4.417611514377218e-06, "epoch": 0.2606532454968443, "percentage": 26.07, "elapsed_time": "8:53:21", "remaining_time": "1 day, 1:12:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2830, "total_steps": 10853, "loss": 0.1662, "learning_rate": 4.417122670196672e-06, "epoch": 0.2607453816741143, "percentage": 26.08, "elapsed_time": "8:53:32", "remaining_time": "1 day, 1:12:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2831, "total_steps": 10853, "loss": 0.1719, "learning_rate": 4.416633648011079e-06, "epoch": 0.26083751785138437, "percentage": 26.08, "elapsed_time": "8:53:43", "remaining_time": "1 day, 1:12:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2832, "total_steps": 10853, "loss": 0.1594, "learning_rate": 4.416144447865845e-06, "epoch": 0.26092965402865437, "percentage": 26.09, "elapsed_time": "8:53:55", "remaining_time": "1 day, 1:12:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2833, "total_steps": 10853, "loss": 0.1503, "learning_rate": 4.4156550698063935e-06, "epoch": 0.26102179020592436, "percentage": 26.1, "elapsed_time": "8:54:07", "remaining_time": "1 day, 1:12:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2834, "total_steps": 10853, "loss": 0.1477, "learning_rate": 4.4151655138781625e-06, "epoch": 0.26111392638319436, "percentage": 26.11, "elapsed_time": "8:54:18", "remaining_time": "1 day, 1:11:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2835, "total_steps": 10853, "loss": 0.1655, "learning_rate": 4.414675780126607e-06, "epoch": 0.26120606256046436, "percentage": 26.12, "elapsed_time": "8:54:29", "remaining_time": "1 day, 1:11:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2836, "total_steps": 10853, "loss": 0.1709, "learning_rate": 4.4141858685972e-06, "epoch": 0.26129819873773436, "percentage": 26.13, "elapsed_time": "8:54:42", "remaining_time": "1 day, 1:11:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2837, "total_steps": 10853, "loss": 0.1604, "learning_rate": 4.413695779335428e-06, "epoch": 0.26139033491500435, "percentage": 26.14, "elapsed_time": "8:54:53", "remaining_time": "1 day, 1:11:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2838, "total_steps": 10853, "loss": 0.1683, "learning_rate": 4.413205512386798e-06, "epoch": 0.2614824710922744, "percentage": 26.15, "elapsed_time": "8:55:04", "remaining_time": "1 day, 1:11:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2839, "total_steps": 10853, "loss": 0.1781, "learning_rate": 4.41271506779683e-06, "epoch": 0.2615746072695444, "percentage": 26.16, "elapsed_time": "8:55:16", "remaining_time": "1 day, 1:10:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2840, "total_steps": 10853, "loss": 0.1636, "learning_rate": 4.412224445611062e-06, "epoch": 0.2616667434468144, "percentage": 26.17, "elapsed_time": "8:55:27", "remaining_time": "1 day, 1:10:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2841, "total_steps": 10853, "loss": 0.1586, "learning_rate": 4.411733645875048e-06, "epoch": 0.2617588796240844, "percentage": 26.18, "elapsed_time": "8:55:38", "remaining_time": "1 day, 1:10:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2842, "total_steps": 10853, "loss": 0.1666, "learning_rate": 4.41124266863436e-06, "epoch": 0.2618510158013544, "percentage": 26.19, "elapsed_time": "8:55:49", "remaining_time": "1 day, 1:10:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2843, "total_steps": 10853, "loss": 0.1725, "learning_rate": 4.410751513934585e-06, "epoch": 0.2619431519786244, "percentage": 26.2, "elapsed_time": "8:55:59", "remaining_time": "1 day, 1:10:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2844, "total_steps": 10853, "loss": 0.1763, "learning_rate": 4.410260181821325e-06, "epoch": 0.2620352881558944, "percentage": 26.2, "elapsed_time": "8:56:09", "remaining_time": "1 day, 1:09:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2845, "total_steps": 10853, "loss": 0.1463, "learning_rate": 4.409768672340202e-06, "epoch": 0.26212742433316444, "percentage": 26.21, "elapsed_time": "8:56:19", "remaining_time": "1 day, 1:09:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2846, "total_steps": 10853, "loss": 0.173, "learning_rate": 4.409276985536852e-06, "epoch": 0.26221956051043444, "percentage": 26.22, "elapsed_time": "8:56:31", "remaining_time": "1 day, 1:09:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2847, "total_steps": 10853, "loss": 0.1613, "learning_rate": 4.408785121456929e-06, "epoch": 0.26231169668770443, "percentage": 26.23, "elapsed_time": "8:56:42", "remaining_time": "1 day, 1:09:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2848, "total_steps": 10853, "loss": 0.1474, "learning_rate": 4.408293080146101e-06, "epoch": 0.26240383286497443, "percentage": 26.24, "elapsed_time": "8:56:53", "remaining_time": "1 day, 1:09:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2849, "total_steps": 10853, "loss": 0.1586, "learning_rate": 4.407800861650056e-06, "epoch": 0.2624959690422444, "percentage": 26.25, "elapsed_time": "8:57:04", "remaining_time": "1 day, 1:08:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2850, "total_steps": 10853, "loss": 0.1486, "learning_rate": 4.407308466014496e-06, "epoch": 0.2625881052195144, "percentage": 26.26, "elapsed_time": "8:57:15", "remaining_time": "1 day, 1:08:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2851, "total_steps": 10853, "loss": 0.1653, "learning_rate": 4.406815893285139e-06, "epoch": 0.2626802413967845, "percentage": 26.27, "elapsed_time": "8:57:26", "remaining_time": "1 day, 1:08:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2852, "total_steps": 10853, "loss": 0.1612, "learning_rate": 4.406323143507721e-06, "epoch": 0.26277237757405447, "percentage": 26.28, "elapsed_time": "8:57:35", "remaining_time": "1 day, 1:08:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2853, "total_steps": 10853, "loss": 0.1501, "learning_rate": 4.405830216727995e-06, "epoch": 0.26286451375132447, "percentage": 26.29, "elapsed_time": "8:57:45", "remaining_time": "1 day, 1:07:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2854, "total_steps": 10853, "loss": 0.1483, "learning_rate": 4.405337112991728e-06, "epoch": 0.26295664992859447, "percentage": 26.3, "elapsed_time": "8:57:55", "remaining_time": "1 day, 1:07:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2855, "total_steps": 10853, "loss": 0.1653, "learning_rate": 4.404843832344704e-06, "epoch": 0.26304878610586446, "percentage": 26.31, "elapsed_time": "8:58:05", "remaining_time": "1 day, 1:07:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2856, "total_steps": 10853, "loss": 0.1611, "learning_rate": 4.404350374832725e-06, "epoch": 0.26314092228313446, "percentage": 26.32, "elapsed_time": "8:58:16", "remaining_time": "1 day, 1:07:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2857, "total_steps": 10853, "loss": 0.1537, "learning_rate": 4.40385674050161e-06, "epoch": 0.26323305846040446, "percentage": 26.32, "elapsed_time": "8:58:27", "remaining_time": "1 day, 1:06:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2858, "total_steps": 10853, "loss": 0.1559, "learning_rate": 4.403362929397191e-06, "epoch": 0.2633251946376745, "percentage": 26.33, "elapsed_time": "8:58:38", "remaining_time": "1 day, 1:06:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2859, "total_steps": 10853, "loss": 0.1531, "learning_rate": 4.40286894156532e-06, "epoch": 0.2634173308149445, "percentage": 26.34, "elapsed_time": "8:58:50", "remaining_time": "1 day, 1:06:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2860, "total_steps": 10853, "loss": 0.1676, "learning_rate": 4.402374777051862e-06, "epoch": 0.2635094669922145, "percentage": 26.35, "elapsed_time": "8:59:00", "remaining_time": "1 day, 1:06:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2861, "total_steps": 10853, "loss": 0.1676, "learning_rate": 4.401880435902701e-06, "epoch": 0.2636016031694845, "percentage": 26.36, "elapsed_time": "8:59:10", "remaining_time": "1 day, 1:06:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2862, "total_steps": 10853, "loss": 0.1859, "learning_rate": 4.401385918163737e-06, "epoch": 0.2636937393467545, "percentage": 26.37, "elapsed_time": "8:59:22", "remaining_time": "1 day, 1:05:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2863, "total_steps": 10853, "loss": 0.1488, "learning_rate": 4.400891223880888e-06, "epoch": 0.2637858755240245, "percentage": 26.38, "elapsed_time": "8:59:31", "remaining_time": "1 day, 1:05:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2864, "total_steps": 10853, "loss": 0.1599, "learning_rate": 4.400396353100081e-06, "epoch": 0.2638780117012945, "percentage": 26.39, "elapsed_time": "8:59:42", "remaining_time": "1 day, 1:05:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2865, "total_steps": 10853, "loss": 0.1597, "learning_rate": 4.39990130586727e-06, "epoch": 0.26397014787856454, "percentage": 26.4, "elapsed_time": "8:59:54", "remaining_time": "1 day, 1:05:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2866, "total_steps": 10853, "loss": 0.1533, "learning_rate": 4.399406082228418e-06, "epoch": 0.26406228405583454, "percentage": 26.41, "elapsed_time": "9:00:04", "remaining_time": "1 day, 1:05:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2867, "total_steps": 10853, "loss": 0.1718, "learning_rate": 4.398910682229507e-06, "epoch": 0.26415442023310454, "percentage": 26.42, "elapsed_time": "9:00:14", "remaining_time": "1 day, 1:04:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2868, "total_steps": 10853, "loss": 0.1646, "learning_rate": 4.398415105916535e-06, "epoch": 0.26424655641037453, "percentage": 26.43, "elapsed_time": "9:00:27", "remaining_time": "1 day, 1:04:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2869, "total_steps": 10853, "loss": 0.1513, "learning_rate": 4.397919353335516e-06, "epoch": 0.26433869258764453, "percentage": 26.44, "elapsed_time": "9:00:36", "remaining_time": "1 day, 1:04:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2870, "total_steps": 10853, "loss": 0.1705, "learning_rate": 4.3974234245324795e-06, "epoch": 0.2644308287649145, "percentage": 26.44, "elapsed_time": "9:00:49", "remaining_time": "1 day, 1:04:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2871, "total_steps": 10853, "loss": 0.1718, "learning_rate": 4.396927319553476e-06, "epoch": 0.2645229649421845, "percentage": 26.45, "elapsed_time": "9:00:59", "remaining_time": "1 day, 1:04:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2872, "total_steps": 10853, "loss": 0.1576, "learning_rate": 4.396431038444565e-06, "epoch": 0.2646151011194546, "percentage": 26.46, "elapsed_time": "9:01:11", "remaining_time": "1 day, 1:03:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2873, "total_steps": 10853, "loss": 0.1666, "learning_rate": 4.3959345812518285e-06, "epoch": 0.2647072372967246, "percentage": 26.47, "elapsed_time": "9:01:21", "remaining_time": "1 day, 1:03:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2874, "total_steps": 10853, "loss": 0.1623, "learning_rate": 4.395437948021362e-06, "epoch": 0.26479937347399457, "percentage": 26.48, "elapsed_time": "9:01:33", "remaining_time": "1 day, 1:03:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2875, "total_steps": 10853, "loss": 0.1654, "learning_rate": 4.394941138799278e-06, "epoch": 0.26489150965126457, "percentage": 26.49, "elapsed_time": "9:01:45", "remaining_time": "1 day, 1:03:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2876, "total_steps": 10853, "loss": 0.1425, "learning_rate": 4.3944441536317055e-06, "epoch": 0.26498364582853456, "percentage": 26.5, "elapsed_time": "9:01:55", "remaining_time": "1 day, 1:03:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2877, "total_steps": 10853, "loss": 0.1705, "learning_rate": 4.3939469925647895e-06, "epoch": 0.26507578200580456, "percentage": 26.51, "elapsed_time": "9:02:05", "remaining_time": "1 day, 1:02:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2878, "total_steps": 10853, "loss": 0.1475, "learning_rate": 4.3934496556446916e-06, "epoch": 0.26516791818307456, "percentage": 26.52, "elapsed_time": "9:02:15", "remaining_time": "1 day, 1:02:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2879, "total_steps": 10853, "loss": 0.1523, "learning_rate": 4.3929521429175895e-06, "epoch": 0.2652600543603446, "percentage": 26.53, "elapsed_time": "9:02:26", "remaining_time": "1 day, 1:02:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2880, "total_steps": 10853, "loss": 0.1703, "learning_rate": 4.392454454429676e-06, "epoch": 0.2653521905376146, "percentage": 26.54, "elapsed_time": "9:02:36", "remaining_time": "1 day, 1:02:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2881, "total_steps": 10853, "loss": 0.1603, "learning_rate": 4.391956590227164e-06, "epoch": 0.2654443267148846, "percentage": 26.55, "elapsed_time": "9:02:47", "remaining_time": "1 day, 1:01:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2882, "total_steps": 10853, "loss": 0.1619, "learning_rate": 4.391458550356278e-06, "epoch": 0.2655364628921546, "percentage": 26.55, "elapsed_time": "9:02:58", "remaining_time": "1 day, 1:01:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2883, "total_steps": 10853, "loss": 0.1533, "learning_rate": 4.390960334863263e-06, "epoch": 0.2656285990694246, "percentage": 26.56, "elapsed_time": "9:03:09", "remaining_time": "1 day, 1:01:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2884, "total_steps": 10853, "loss": 0.1775, "learning_rate": 4.390461943794377e-06, "epoch": 0.2657207352466946, "percentage": 26.57, "elapsed_time": "9:03:20", "remaining_time": "1 day, 1:01:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2885, "total_steps": 10853, "loss": 0.162, "learning_rate": 4.389963377195896e-06, "epoch": 0.26581287142396465, "percentage": 26.58, "elapsed_time": "9:03:31", "remaining_time": "1 day, 1:01:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2886, "total_steps": 10853, "loss": 0.1563, "learning_rate": 4.389464635114112e-06, "epoch": 0.26590500760123464, "percentage": 26.59, "elapsed_time": "9:03:41", "remaining_time": "1 day, 1:00:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2887, "total_steps": 10853, "loss": 0.1867, "learning_rate": 4.388965717595334e-06, "epoch": 0.26599714377850464, "percentage": 26.6, "elapsed_time": "9:03:53", "remaining_time": "1 day, 1:00:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2888, "total_steps": 10853, "loss": 0.1565, "learning_rate": 4.3884666246858846e-06, "epoch": 0.26608927995577464, "percentage": 26.61, "elapsed_time": "9:04:03", "remaining_time": "1 day, 1:00:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2889, "total_steps": 10853, "loss": 0.17, "learning_rate": 4.387967356432107e-06, "epoch": 0.26618141613304463, "percentage": 26.62, "elapsed_time": "9:04:14", "remaining_time": "1 day, 1:00:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2890, "total_steps": 10853, "loss": 0.1535, "learning_rate": 4.3874679128803565e-06, "epoch": 0.26627355231031463, "percentage": 26.63, "elapsed_time": "9:04:23", "remaining_time": "1 day, 1:00:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2891, "total_steps": 10853, "loss": 0.1599, "learning_rate": 4.386968294077007e-06, "epoch": 0.26636568848758463, "percentage": 26.64, "elapsed_time": "9:04:34", "remaining_time": "1 day, 0:59:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2892, "total_steps": 10853, "loss": 0.1663, "learning_rate": 4.386468500068449e-06, "epoch": 0.2664578246648547, "percentage": 26.65, "elapsed_time": "9:04:44", "remaining_time": "1 day, 0:59:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2893, "total_steps": 10853, "loss": 0.1737, "learning_rate": 4.385968530901087e-06, "epoch": 0.2665499608421247, "percentage": 26.66, "elapsed_time": "9:04:56", "remaining_time": "1 day, 0:59:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2894, "total_steps": 10853, "loss": 0.1613, "learning_rate": 4.3854683866213445e-06, "epoch": 0.2666420970193947, "percentage": 26.67, "elapsed_time": "9:05:07", "remaining_time": "1 day, 0:59:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2895, "total_steps": 10853, "loss": 0.1749, "learning_rate": 4.384968067275659e-06, "epoch": 0.26673423319666467, "percentage": 26.67, "elapsed_time": "9:05:17", "remaining_time": "1 day, 0:58:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2896, "total_steps": 10853, "loss": 0.1744, "learning_rate": 4.384467572910486e-06, "epoch": 0.26682636937393467, "percentage": 26.68, "elapsed_time": "9:05:28", "remaining_time": "1 day, 0:58:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2897, "total_steps": 10853, "loss": 0.1669, "learning_rate": 4.383966903572295e-06, "epoch": 0.26691850555120467, "percentage": 26.69, "elapsed_time": "9:05:39", "remaining_time": "1 day, 0:58:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2898, "total_steps": 10853, "loss": 0.1529, "learning_rate": 4.383466059307576e-06, "epoch": 0.26701064172847466, "percentage": 26.7, "elapsed_time": "9:05:50", "remaining_time": "1 day, 0:58:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2899, "total_steps": 10853, "loss": 0.1678, "learning_rate": 4.382965040162829e-06, "epoch": 0.2671027779057447, "percentage": 26.71, "elapsed_time": "9:06:01", "remaining_time": "1 day, 0:58:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2900, "total_steps": 10853, "loss": 0.1624, "learning_rate": 4.3824638461845764e-06, "epoch": 0.2671949140830147, "percentage": 26.72, "elapsed_time": "9:06:12", "remaining_time": "1 day, 0:57:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2901, "total_steps": 10853, "loss": 0.1621, "learning_rate": 4.381962477419352e-06, "epoch": 0.2672870502602847, "percentage": 26.73, "elapsed_time": "9:06:23", "remaining_time": "1 day, 0:57:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2902, "total_steps": 10853, "loss": 0.1697, "learning_rate": 4.3814609339137105e-06, "epoch": 0.2673791864375547, "percentage": 26.74, "elapsed_time": "9:06:35", "remaining_time": "1 day, 0:57:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2903, "total_steps": 10853, "loss": 0.1625, "learning_rate": 4.380959215714218e-06, "epoch": 0.2674713226148247, "percentage": 26.75, "elapsed_time": "9:06:46", "remaining_time": "1 day, 0:57:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2904, "total_steps": 10853, "loss": 0.1615, "learning_rate": 4.380457322867461e-06, "epoch": 0.2675634587920947, "percentage": 26.76, "elapsed_time": "9:06:55", "remaining_time": "1 day, 0:57:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2905, "total_steps": 10853, "loss": 0.1636, "learning_rate": 4.379955255420037e-06, "epoch": 0.2676555949693647, "percentage": 26.77, "elapsed_time": "9:07:06", "remaining_time": "1 day, 0:56:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2906, "total_steps": 10853, "loss": 0.1722, "learning_rate": 4.379453013418567e-06, "epoch": 0.26774773114663475, "percentage": 26.78, "elapsed_time": "9:07:17", "remaining_time": "1 day, 0:56:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2907, "total_steps": 10853, "loss": 0.1661, "learning_rate": 4.378950596909683e-06, "epoch": 0.26783986732390475, "percentage": 26.79, "elapsed_time": "9:07:28", "remaining_time": "1 day, 0:56:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2908, "total_steps": 10853, "loss": 0.1661, "learning_rate": 4.378448005940031e-06, "epoch": 0.26793200350117474, "percentage": 26.79, "elapsed_time": "9:07:39", "remaining_time": "1 day, 0:56:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2909, "total_steps": 10853, "loss": 0.1779, "learning_rate": 4.377945240556282e-06, "epoch": 0.26802413967844474, "percentage": 26.8, "elapsed_time": "9:07:51", "remaining_time": "1 day, 0:56:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2910, "total_steps": 10853, "loss": 0.1634, "learning_rate": 4.3774423008051145e-06, "epoch": 0.26811627585571474, "percentage": 26.81, "elapsed_time": "9:08:02", "remaining_time": "1 day, 0:55:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2911, "total_steps": 10853, "loss": 0.1516, "learning_rate": 4.376939186733227e-06, "epoch": 0.26820841203298473, "percentage": 26.82, "elapsed_time": "9:08:13", "remaining_time": "1 day, 0:55:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2912, "total_steps": 10853, "loss": 0.1632, "learning_rate": 4.376435898387334e-06, "epoch": 0.26830054821025473, "percentage": 26.83, "elapsed_time": "9:08:24", "remaining_time": "1 day, 0:55:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2913, "total_steps": 10853, "loss": 0.1846, "learning_rate": 4.375932435814167e-06, "epoch": 0.2683926843875248, "percentage": 26.84, "elapsed_time": "9:08:35", "remaining_time": "1 day, 0:55:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2914, "total_steps": 10853, "loss": 0.1675, "learning_rate": 4.37542879906047e-06, "epoch": 0.2684848205647948, "percentage": 26.85, "elapsed_time": "9:08:48", "remaining_time": "1 day, 0:55:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2915, "total_steps": 10853, "loss": 0.1608, "learning_rate": 4.374924988173008e-06, "epoch": 0.2685769567420648, "percentage": 26.86, "elapsed_time": "9:08:59", "remaining_time": "1 day, 0:54:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2916, "total_steps": 10853, "loss": 0.1575, "learning_rate": 4.374421003198559e-06, "epoch": 0.2686690929193348, "percentage": 26.87, "elapsed_time": "9:09:09", "remaining_time": "1 day, 0:54:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2917, "total_steps": 10853, "loss": 0.1587, "learning_rate": 4.373916844183918e-06, "epoch": 0.26876122909660477, "percentage": 26.88, "elapsed_time": "9:09:19", "remaining_time": "1 day, 0:54:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2918, "total_steps": 10853, "loss": 0.1575, "learning_rate": 4.373412511175897e-06, "epoch": 0.26885336527387477, "percentage": 26.89, "elapsed_time": "9:09:30", "remaining_time": "1 day, 0:54:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2919, "total_steps": 10853, "loss": 0.1687, "learning_rate": 4.372908004221322e-06, "epoch": 0.2689455014511448, "percentage": 26.9, "elapsed_time": "9:09:40", "remaining_time": "1 day, 0:54:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2920, "total_steps": 10853, "loss": 0.1538, "learning_rate": 4.372403323367037e-06, "epoch": 0.2690376376284148, "percentage": 26.91, "elapsed_time": "9:09:51", "remaining_time": "1 day, 0:53:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2921, "total_steps": 10853, "loss": 0.1701, "learning_rate": 4.371898468659903e-06, "epoch": 0.2691297738056848, "percentage": 26.91, "elapsed_time": "9:10:02", "remaining_time": "1 day, 0:53:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2922, "total_steps": 10853, "loss": 0.1654, "learning_rate": 4.371393440146794e-06, "epoch": 0.2692219099829548, "percentage": 26.92, "elapsed_time": "9:10:13", "remaining_time": "1 day, 0:53:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2923, "total_steps": 10853, "loss": 0.1494, "learning_rate": 4.370888237874602e-06, "epoch": 0.2693140461602248, "percentage": 26.93, "elapsed_time": "9:10:23", "remaining_time": "1 day, 0:53:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2924, "total_steps": 10853, "loss": 0.1459, "learning_rate": 4.370382861890237e-06, "epoch": 0.2694061823374948, "percentage": 26.94, "elapsed_time": "9:10:33", "remaining_time": "1 day, 0:52:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2925, "total_steps": 10853, "loss": 0.17, "learning_rate": 4.369877312240621e-06, "epoch": 0.2694983185147648, "percentage": 26.95, "elapsed_time": "9:10:44", "remaining_time": "1 day, 0:52:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2926, "total_steps": 10853, "loss": 0.1581, "learning_rate": 4.369371588972696e-06, "epoch": 0.26959045469203485, "percentage": 26.96, "elapsed_time": "9:10:55", "remaining_time": "1 day, 0:52:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2927, "total_steps": 10853, "loss": 0.1628, "learning_rate": 4.368865692133417e-06, "epoch": 0.26968259086930485, "percentage": 26.97, "elapsed_time": "9:11:06", "remaining_time": "1 day, 0:52:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2928, "total_steps": 10853, "loss": 0.1578, "learning_rate": 4.3683596217697585e-06, "epoch": 0.26977472704657485, "percentage": 26.98, "elapsed_time": "9:11:17", "remaining_time": "1 day, 0:52:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2929, "total_steps": 10853, "loss": 0.1777, "learning_rate": 4.367853377928707e-06, "epoch": 0.26986686322384484, "percentage": 26.99, "elapsed_time": "9:11:27", "remaining_time": "1 day, 0:51:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2930, "total_steps": 10853, "loss": 0.1523, "learning_rate": 4.367346960657269e-06, "epoch": 0.26995899940111484, "percentage": 27.0, "elapsed_time": "9:11:38", "remaining_time": "1 day, 0:51:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2931, "total_steps": 10853, "loss": 0.1602, "learning_rate": 4.366840370002465e-06, "epoch": 0.27005113557838484, "percentage": 27.01, "elapsed_time": "9:11:49", "remaining_time": "1 day, 0:51:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2932, "total_steps": 10853, "loss": 0.1674, "learning_rate": 4.366333606011331e-06, "epoch": 0.27014327175565483, "percentage": 27.02, "elapsed_time": "9:12:00", "remaining_time": "1 day, 0:51:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2933, "total_steps": 10853, "loss": 0.1662, "learning_rate": 4.365826668730921e-06, "epoch": 0.2702354079329249, "percentage": 27.02, "elapsed_time": "9:12:11", "remaining_time": "1 day, 0:51:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2934, "total_steps": 10853, "loss": 0.1656, "learning_rate": 4.365319558208304e-06, "epoch": 0.2703275441101949, "percentage": 27.03, "elapsed_time": "9:12:22", "remaining_time": "1 day, 0:50:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2935, "total_steps": 10853, "loss": 0.1918, "learning_rate": 4.3648122744905654e-06, "epoch": 0.2704196802874649, "percentage": 27.04, "elapsed_time": "9:12:34", "remaining_time": "1 day, 0:50:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2936, "total_steps": 10853, "loss": 0.1629, "learning_rate": 4.364304817624806e-06, "epoch": 0.2705118164647349, "percentage": 27.05, "elapsed_time": "9:12:44", "remaining_time": "1 day, 0:50:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2937, "total_steps": 10853, "loss": 0.1524, "learning_rate": 4.363797187658144e-06, "epoch": 0.2706039526420049, "percentage": 27.06, "elapsed_time": "9:12:54", "remaining_time": "1 day, 0:50:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2938, "total_steps": 10853, "loss": 0.1677, "learning_rate": 4.363289384637713e-06, "epoch": 0.27069608881927487, "percentage": 27.07, "elapsed_time": "9:13:05", "remaining_time": "1 day, 0:50:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2939, "total_steps": 10853, "loss": 0.1596, "learning_rate": 4.362781408610662e-06, "epoch": 0.27078822499654487, "percentage": 27.08, "elapsed_time": "9:13:16", "remaining_time": "1 day, 0:49:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2940, "total_steps": 10853, "loss": 0.1587, "learning_rate": 4.362273259624156e-06, "epoch": 0.2708803611738149, "percentage": 27.09, "elapsed_time": "9:13:24", "remaining_time": "1 day, 0:49:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2941, "total_steps": 10853, "loss": 0.1713, "learning_rate": 4.3617649377253775e-06, "epoch": 0.2709724973510849, "percentage": 27.1, "elapsed_time": "9:13:36", "remaining_time": "1 day, 0:49:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2942, "total_steps": 10853, "loss": 0.1703, "learning_rate": 4.361256442961524e-06, "epoch": 0.2710646335283549, "percentage": 27.11, "elapsed_time": "9:13:47", "remaining_time": "1 day, 0:49:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2943, "total_steps": 10853, "loss": 0.1704, "learning_rate": 4.360747775379811e-06, "epoch": 0.2711567697056249, "percentage": 27.12, "elapsed_time": "9:14:00", "remaining_time": "1 day, 0:49:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2944, "total_steps": 10853, "loss": 0.1591, "learning_rate": 4.3602389350274656e-06, "epoch": 0.2712489058828949, "percentage": 27.13, "elapsed_time": "9:14:11", "remaining_time": "1 day, 0:48:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2945, "total_steps": 10853, "loss": 0.1668, "learning_rate": 4.359729921951735e-06, "epoch": 0.2713410420601649, "percentage": 27.14, "elapsed_time": "9:14:22", "remaining_time": "1 day, 0:48:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2946, "total_steps": 10853, "loss": 0.1692, "learning_rate": 4.3592207361998815e-06, "epoch": 0.2714331782374349, "percentage": 27.14, "elapsed_time": "9:14:32", "remaining_time": "1 day, 0:48:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2947, "total_steps": 10853, "loss": 0.1562, "learning_rate": 4.358711377819181e-06, "epoch": 0.27152531441470495, "percentage": 27.15, "elapsed_time": "9:14:43", "remaining_time": "1 day, 0:48:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2948, "total_steps": 10853, "loss": 0.1578, "learning_rate": 4.358201846856931e-06, "epoch": 0.27161745059197495, "percentage": 27.16, "elapsed_time": "9:14:55", "remaining_time": "1 day, 0:48:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2949, "total_steps": 10853, "loss": 0.1602, "learning_rate": 4.357692143360438e-06, "epoch": 0.27170958676924495, "percentage": 27.17, "elapsed_time": "9:15:07", "remaining_time": "1 day, 0:47:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2950, "total_steps": 10853, "loss": 0.1607, "learning_rate": 4.35718226737703e-06, "epoch": 0.27180172294651495, "percentage": 27.18, "elapsed_time": "9:15:18", "remaining_time": "1 day, 0:47:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2951, "total_steps": 10853, "loss": 0.1724, "learning_rate": 4.35667221895405e-06, "epoch": 0.27189385912378494, "percentage": 27.19, "elapsed_time": "9:15:30", "remaining_time": "1 day, 0:47:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2952, "total_steps": 10853, "loss": 0.1724, "learning_rate": 4.356161998138853e-06, "epoch": 0.27198599530105494, "percentage": 27.2, "elapsed_time": "9:15:41", "remaining_time": "1 day, 0:47:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2953, "total_steps": 10853, "loss": 0.1597, "learning_rate": 4.355651604978815e-06, "epoch": 0.272078131478325, "percentage": 27.21, "elapsed_time": "9:15:52", "remaining_time": "1 day, 0:47:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2954, "total_steps": 10853, "loss": 0.16, "learning_rate": 4.355141039521325e-06, "epoch": 0.272170267655595, "percentage": 27.22, "elapsed_time": "9:16:04", "remaining_time": "1 day, 0:46:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2955, "total_steps": 10853, "loss": 0.1512, "learning_rate": 4.3546303018137915e-06, "epoch": 0.272262403832865, "percentage": 27.23, "elapsed_time": "9:16:14", "remaining_time": "1 day, 0:46:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2956, "total_steps": 10853, "loss": 0.1654, "learning_rate": 4.354119391903634e-06, "epoch": 0.272354540010135, "percentage": 27.24, "elapsed_time": "9:16:23", "remaining_time": "1 day, 0:46:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2957, "total_steps": 10853, "loss": 0.1403, "learning_rate": 4.353608309838292e-06, "epoch": 0.272446676187405, "percentage": 27.25, "elapsed_time": "9:16:34", "remaining_time": "1 day, 0:46:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2958, "total_steps": 10853, "loss": 0.1566, "learning_rate": 4.353097055665219e-06, "epoch": 0.272538812364675, "percentage": 27.26, "elapsed_time": "9:16:44", "remaining_time": "1 day, 0:45:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2959, "total_steps": 10853, "loss": 0.165, "learning_rate": 4.352585629431883e-06, "epoch": 0.272630948541945, "percentage": 27.26, "elapsed_time": "9:16:56", "remaining_time": "1 day, 0:45:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2960, "total_steps": 10853, "loss": 0.1573, "learning_rate": 4.352074031185774e-06, "epoch": 0.272723084719215, "percentage": 27.27, "elapsed_time": "9:17:07", "remaining_time": "1 day, 0:45:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2961, "total_steps": 10853, "loss": 0.1749, "learning_rate": 4.351562260974391e-06, "epoch": 0.272815220896485, "percentage": 27.28, "elapsed_time": "9:17:18", "remaining_time": "1 day, 0:45:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2962, "total_steps": 10853, "loss": 0.1693, "learning_rate": 4.3510503188452535e-06, "epoch": 0.272907357073755, "percentage": 27.29, "elapsed_time": "9:17:28", "remaining_time": "1 day, 0:45:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2963, "total_steps": 10853, "loss": 0.1641, "learning_rate": 4.350538204845895e-06, "epoch": 0.272999493251025, "percentage": 27.3, "elapsed_time": "9:17:39", "remaining_time": "1 day, 0:44:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2964, "total_steps": 10853, "loss": 0.1714, "learning_rate": 4.350025919023864e-06, "epoch": 0.273091629428295, "percentage": 27.31, "elapsed_time": "9:17:50", "remaining_time": "1 day, 0:44:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2965, "total_steps": 10853, "loss": 0.1777, "learning_rate": 4.349513461426728e-06, "epoch": 0.273183765605565, "percentage": 27.32, "elapsed_time": "9:18:00", "remaining_time": "1 day, 0:44:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2966, "total_steps": 10853, "loss": 0.1606, "learning_rate": 4.349000832102067e-06, "epoch": 0.273275901782835, "percentage": 27.33, "elapsed_time": "9:18:11", "remaining_time": "1 day, 0:44:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2967, "total_steps": 10853, "loss": 0.1603, "learning_rate": 4.348488031097481e-06, "epoch": 0.27336803796010506, "percentage": 27.34, "elapsed_time": "9:18:20", "remaining_time": "1 day, 0:44:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2968, "total_steps": 10853, "loss": 0.16, "learning_rate": 4.3479750584605814e-06, "epoch": 0.27346017413737506, "percentage": 27.35, "elapsed_time": "9:18:30", "remaining_time": "1 day, 0:43:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2969, "total_steps": 10853, "loss": 0.1662, "learning_rate": 4.347461914238999e-06, "epoch": 0.27355231031464505, "percentage": 27.36, "elapsed_time": "9:18:41", "remaining_time": "1 day, 0:43:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2970, "total_steps": 10853, "loss": 0.162, "learning_rate": 4.34694859848038e-06, "epoch": 0.27364444649191505, "percentage": 27.37, "elapsed_time": "9:18:51", "remaining_time": "1 day, 0:43:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2971, "total_steps": 10853, "loss": 0.1673, "learning_rate": 4.346435111232383e-06, "epoch": 0.27373658266918505, "percentage": 27.37, "elapsed_time": "9:19:01", "remaining_time": "1 day, 0:43:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2972, "total_steps": 10853, "loss": 0.1578, "learning_rate": 4.345921452542689e-06, "epoch": 0.27382871884645504, "percentage": 27.38, "elapsed_time": "9:19:13", "remaining_time": "1 day, 0:42:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2973, "total_steps": 10853, "loss": 0.1673, "learning_rate": 4.345407622458988e-06, "epoch": 0.27392085502372504, "percentage": 27.39, "elapsed_time": "9:19:22", "remaining_time": "1 day, 0:42:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2974, "total_steps": 10853, "loss": 0.1457, "learning_rate": 4.3448936210289916e-06, "epoch": 0.2740129912009951, "percentage": 27.4, "elapsed_time": "9:19:33", "remaining_time": "1 day, 0:42:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2975, "total_steps": 10853, "loss": 0.1704, "learning_rate": 4.344379448300423e-06, "epoch": 0.2741051273782651, "percentage": 27.41, "elapsed_time": "9:19:44", "remaining_time": "1 day, 0:42:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2976, "total_steps": 10853, "loss": 0.1546, "learning_rate": 4.343865104321026e-06, "epoch": 0.2741972635555351, "percentage": 27.42, "elapsed_time": "9:19:53", "remaining_time": "1 day, 0:41:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2977, "total_steps": 10853, "loss": 0.1668, "learning_rate": 4.3433505891385534e-06, "epoch": 0.2742893997328051, "percentage": 27.43, "elapsed_time": "9:20:04", "remaining_time": "1 day, 0:41:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2978, "total_steps": 10853, "loss": 0.1692, "learning_rate": 4.342835902800782e-06, "epoch": 0.2743815359100751, "percentage": 27.44, "elapsed_time": "9:20:15", "remaining_time": "1 day, 0:41:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2979, "total_steps": 10853, "loss": 0.1679, "learning_rate": 4.342321045355498e-06, "epoch": 0.2744736720873451, "percentage": 27.45, "elapsed_time": "9:20:26", "remaining_time": "1 day, 0:41:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2980, "total_steps": 10853, "loss": 0.1564, "learning_rate": 4.341806016850506e-06, "epoch": 0.2745658082646151, "percentage": 27.46, "elapsed_time": "9:20:38", "remaining_time": "1 day, 0:41:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2981, "total_steps": 10853, "loss": 0.173, "learning_rate": 4.341290817333628e-06, "epoch": 0.2746579444418851, "percentage": 27.47, "elapsed_time": "9:20:48", "remaining_time": "1 day, 0:40:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2982, "total_steps": 10853, "loss": 0.1559, "learning_rate": 4.340775446852699e-06, "epoch": 0.2747500806191551, "percentage": 27.48, "elapsed_time": "9:21:01", "remaining_time": "1 day, 0:40:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2983, "total_steps": 10853, "loss": 0.1516, "learning_rate": 4.340259905455572e-06, "epoch": 0.2748422167964251, "percentage": 27.49, "elapsed_time": "9:21:13", "remaining_time": "1 day, 0:40:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2984, "total_steps": 10853, "loss": 0.1713, "learning_rate": 4.339744193190114e-06, "epoch": 0.2749343529736951, "percentage": 27.49, "elapsed_time": "9:21:24", "remaining_time": "1 day, 0:40:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2985, "total_steps": 10853, "loss": 0.1827, "learning_rate": 4.339228310104211e-06, "epoch": 0.2750264891509651, "percentage": 27.5, "elapsed_time": "9:21:34", "remaining_time": "1 day, 0:40:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2986, "total_steps": 10853, "loss": 0.1586, "learning_rate": 4.338712256245761e-06, "epoch": 0.2751186253282351, "percentage": 27.51, "elapsed_time": "9:21:44", "remaining_time": "1 day, 0:39:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2987, "total_steps": 10853, "loss": 0.1591, "learning_rate": 4.3381960316626795e-06, "epoch": 0.27521076150550516, "percentage": 27.52, "elapsed_time": "9:21:55", "remaining_time": "1 day, 0:39:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2988, "total_steps": 10853, "loss": 0.1595, "learning_rate": 4.337679636402898e-06, "epoch": 0.27530289768277516, "percentage": 27.53, "elapsed_time": "9:22:06", "remaining_time": "1 day, 0:39:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2989, "total_steps": 10853, "loss": 0.155, "learning_rate": 4.3371630705143665e-06, "epoch": 0.27539503386004516, "percentage": 27.54, "elapsed_time": "9:22:16", "remaining_time": "1 day, 0:39:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2990, "total_steps": 10853, "loss": 0.1565, "learning_rate": 4.336646334045045e-06, "epoch": 0.27548717003731515, "percentage": 27.55, "elapsed_time": "9:22:27", "remaining_time": "1 day, 0:39:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2991, "total_steps": 10853, "loss": 0.1486, "learning_rate": 4.336129427042913e-06, "epoch": 0.27557930621458515, "percentage": 27.56, "elapsed_time": "9:22:37", "remaining_time": "1 day, 0:38:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2992, "total_steps": 10853, "loss": 0.1706, "learning_rate": 4.335612349555967e-06, "epoch": 0.27567144239185515, "percentage": 27.57, "elapsed_time": "9:22:49", "remaining_time": "1 day, 0:38:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2993, "total_steps": 10853, "loss": 0.1703, "learning_rate": 4.335095101632217e-06, "epoch": 0.27576357856912515, "percentage": 27.58, "elapsed_time": "9:22:59", "remaining_time": "1 day, 0:38:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2994, "total_steps": 10853, "loss": 0.1515, "learning_rate": 4.334577683319689e-06, "epoch": 0.2758557147463952, "percentage": 27.59, "elapsed_time": "9:23:09", "remaining_time": "1 day, 0:38:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2995, "total_steps": 10853, "loss": 0.1623, "learning_rate": 4.334060094666426e-06, "epoch": 0.2759478509236652, "percentage": 27.6, "elapsed_time": "9:23:21", "remaining_time": "1 day, 0:38:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2996, "total_steps": 10853, "loss": 0.1736, "learning_rate": 4.333542335720485e-06, "epoch": 0.2760399871009352, "percentage": 27.61, "elapsed_time": "9:23:32", "remaining_time": "1 day, 0:37:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2997, "total_steps": 10853, "loss": 0.1663, "learning_rate": 4.3330244065299424e-06, "epoch": 0.2761321232782052, "percentage": 27.61, "elapsed_time": "9:23:43", "remaining_time": "1 day, 0:37:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2998, "total_steps": 10853, "loss": 0.1557, "learning_rate": 4.332506307142885e-06, "epoch": 0.2762242594554752, "percentage": 27.62, "elapsed_time": "9:23:55", "remaining_time": "1 day, 0:37:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2999, "total_steps": 10853, "loss": 0.1623, "learning_rate": 4.33198803760742e-06, "epoch": 0.2763163956327452, "percentage": 27.63, "elapsed_time": "9:24:05", "remaining_time": "1 day, 0:37:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3000, "total_steps": 10853, "loss": 0.1507, "learning_rate": 4.3314695979716684e-06, "epoch": 0.2764085318100152, "percentage": 27.64, "elapsed_time": "9:24:16", "remaining_time": "1 day, 0:37:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3000, "total_steps": 10853, "eval_loss": 0.1629796177148819, "epoch": 0.2764085318100152, "percentage": 27.64, "elapsed_time": "9:29:16", "remaining_time": "1 day, 0:50:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3001, "total_steps": 10853, "loss": 0.1647, "learning_rate": 4.330950988283767e-06, "epoch": 0.27650066798728523, "percentage": 27.65, "elapsed_time": "9:29:26", "remaining_time": "1 day, 0:49:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3002, "total_steps": 10853, "loss": 0.1517, "learning_rate": 4.330432208591871e-06, "epoch": 0.27659280416455523, "percentage": 27.66, "elapsed_time": "9:29:38", "remaining_time": "1 day, 0:49:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3003, "total_steps": 10853, "loss": 0.1629, "learning_rate": 4.329913258944146e-06, "epoch": 0.2766849403418252, "percentage": 27.67, "elapsed_time": "9:29:49", "remaining_time": "1 day, 0:49:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3004, "total_steps": 10853, "loss": 0.1547, "learning_rate": 4.329394139388779e-06, "epoch": 0.2767770765190952, "percentage": 27.68, "elapsed_time": "9:30:00", "remaining_time": "1 day, 0:49:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3005, "total_steps": 10853, "loss": 0.166, "learning_rate": 4.328874849973968e-06, "epoch": 0.2768692126963652, "percentage": 27.69, "elapsed_time": "9:30:12", "remaining_time": "1 day, 0:49:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3006, "total_steps": 10853, "loss": 0.1685, "learning_rate": 4.328355390747931e-06, "epoch": 0.2769613488736352, "percentage": 27.7, "elapsed_time": "9:30:23", "remaining_time": "1 day, 0:48:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3007, "total_steps": 10853, "loss": 0.1578, "learning_rate": 4.3278357617589e-06, "epoch": 0.2770534850509052, "percentage": 27.71, "elapsed_time": "9:30:32", "remaining_time": "1 day, 0:48:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3008, "total_steps": 10853, "loss": 0.1584, "learning_rate": 4.327315963055121e-06, "epoch": 0.27714562122817527, "percentage": 27.72, "elapsed_time": "9:30:44", "remaining_time": "1 day, 0:48:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3009, "total_steps": 10853, "loss": 0.1629, "learning_rate": 4.326795994684858e-06, "epoch": 0.27723775740544526, "percentage": 27.73, "elapsed_time": "9:30:54", "remaining_time": "1 day, 0:48:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3010, "total_steps": 10853, "loss": 0.1462, "learning_rate": 4.326275856696391e-06, "epoch": 0.27732989358271526, "percentage": 27.73, "elapsed_time": "9:31:04", "remaining_time": "1 day, 0:48:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3011, "total_steps": 10853, "loss": 0.1626, "learning_rate": 4.325755549138014e-06, "epoch": 0.27742202975998526, "percentage": 27.74, "elapsed_time": "9:31:14", "remaining_time": "1 day, 0:47:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3012, "total_steps": 10853, "loss": 0.1682, "learning_rate": 4.325235072058037e-06, "epoch": 0.27751416593725525, "percentage": 27.75, "elapsed_time": "9:31:25", "remaining_time": "1 day, 0:47:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3013, "total_steps": 10853, "loss": 0.1681, "learning_rate": 4.324714425504788e-06, "epoch": 0.27760630211452525, "percentage": 27.76, "elapsed_time": "9:31:35", "remaining_time": "1 day, 0:47:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3014, "total_steps": 10853, "loss": 0.1493, "learning_rate": 4.324193609526607e-06, "epoch": 0.27769843829179525, "percentage": 27.77, "elapsed_time": "9:31:45", "remaining_time": "1 day, 0:47:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3015, "total_steps": 10853, "loss": 0.1716, "learning_rate": 4.323672624171854e-06, "epoch": 0.2777905744690653, "percentage": 27.78, "elapsed_time": "9:31:56", "remaining_time": "1 day, 0:46:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3016, "total_steps": 10853, "loss": 0.1596, "learning_rate": 4.323151469488902e-06, "epoch": 0.2778827106463353, "percentage": 27.79, "elapsed_time": "9:32:07", "remaining_time": "1 day, 0:46:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3017, "total_steps": 10853, "loss": 0.1603, "learning_rate": 4.322630145526139e-06, "epoch": 0.2779748468236053, "percentage": 27.8, "elapsed_time": "9:32:17", "remaining_time": "1 day, 0:46:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3018, "total_steps": 10853, "loss": 0.147, "learning_rate": 4.322108652331971e-06, "epoch": 0.2780669830008753, "percentage": 27.81, "elapsed_time": "9:32:29", "remaining_time": "1 day, 0:46:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3019, "total_steps": 10853, "loss": 0.152, "learning_rate": 4.321586989954819e-06, "epoch": 0.2781591191781453, "percentage": 27.82, "elapsed_time": "9:32:38", "remaining_time": "1 day, 0:45:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3020, "total_steps": 10853, "loss": 0.1708, "learning_rate": 4.3210651584431186e-06, "epoch": 0.2782512553554153, "percentage": 27.83, "elapsed_time": "9:32:50", "remaining_time": "1 day, 0:45:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3021, "total_steps": 10853, "loss": 0.1664, "learning_rate": 4.320543157845321e-06, "epoch": 0.27834339153268534, "percentage": 27.84, "elapsed_time": "9:33:02", "remaining_time": "1 day, 0:45:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3022, "total_steps": 10853, "loss": 0.1524, "learning_rate": 4.320020988209898e-06, "epoch": 0.27843552770995533, "percentage": 27.84, "elapsed_time": "9:33:12", "remaining_time": "1 day, 0:45:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3023, "total_steps": 10853, "loss": 0.1837, "learning_rate": 4.319498649585329e-06, "epoch": 0.27852766388722533, "percentage": 27.85, "elapsed_time": "9:33:24", "remaining_time": "1 day, 0:45:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3024, "total_steps": 10853, "loss": 0.1815, "learning_rate": 4.318976142020113e-06, "epoch": 0.2786198000644953, "percentage": 27.86, "elapsed_time": "9:33:35", "remaining_time": "1 day, 0:44:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3025, "total_steps": 10853, "loss": 0.1648, "learning_rate": 4.318453465562768e-06, "epoch": 0.2787119362417653, "percentage": 27.87, "elapsed_time": "9:33:47", "remaining_time": "1 day, 0:44:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3026, "total_steps": 10853, "loss": 0.1541, "learning_rate": 4.317930620261823e-06, "epoch": 0.2788040724190353, "percentage": 27.88, "elapsed_time": "9:33:58", "remaining_time": "1 day, 0:44:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3027, "total_steps": 10853, "loss": 0.1693, "learning_rate": 4.317407606165825e-06, "epoch": 0.2788962085963053, "percentage": 27.89, "elapsed_time": "9:34:09", "remaining_time": "1 day, 0:44:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3028, "total_steps": 10853, "loss": 0.1672, "learning_rate": 4.3168844233233345e-06, "epoch": 0.27898834477357537, "percentage": 27.9, "elapsed_time": "9:34:20", "remaining_time": "1 day, 0:44:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3029, "total_steps": 10853, "loss": 0.1674, "learning_rate": 4.316361071782929e-06, "epoch": 0.27908048095084537, "percentage": 27.91, "elapsed_time": "9:34:31", "remaining_time": "1 day, 0:43:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3030, "total_steps": 10853, "loss": 0.1566, "learning_rate": 4.315837551593203e-06, "epoch": 0.27917261712811536, "percentage": 27.92, "elapsed_time": "9:34:41", "remaining_time": "1 day, 0:43:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3031, "total_steps": 10853, "loss": 0.156, "learning_rate": 4.315313862802766e-06, "epoch": 0.27926475330538536, "percentage": 27.93, "elapsed_time": "9:34:51", "remaining_time": "1 day, 0:43:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3032, "total_steps": 10853, "loss": 0.1767, "learning_rate": 4.31479000546024e-06, "epoch": 0.27935688948265536, "percentage": 27.94, "elapsed_time": "9:35:02", "remaining_time": "1 day, 0:43:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3033, "total_steps": 10853, "loss": 0.1708, "learning_rate": 4.314265979614267e-06, "epoch": 0.27944902565992535, "percentage": 27.95, "elapsed_time": "9:35:14", "remaining_time": "1 day, 0:43:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3034, "total_steps": 10853, "loss": 0.1554, "learning_rate": 4.313741785313503e-06, "epoch": 0.27954116183719535, "percentage": 27.96, "elapsed_time": "9:35:25", "remaining_time": "1 day, 0:42:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3035, "total_steps": 10853, "loss": 0.1569, "learning_rate": 4.313217422606618e-06, "epoch": 0.2796332980144654, "percentage": 27.96, "elapsed_time": "9:35:36", "remaining_time": "1 day, 0:42:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3036, "total_steps": 10853, "loss": 0.1661, "learning_rate": 4.312692891542302e-06, "epoch": 0.2797254341917354, "percentage": 27.97, "elapsed_time": "9:35:46", "remaining_time": "1 day, 0:42:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3037, "total_steps": 10853, "loss": 0.1603, "learning_rate": 4.312168192169254e-06, "epoch": 0.2798175703690054, "percentage": 27.98, "elapsed_time": "9:35:57", "remaining_time": "1 day, 0:42:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3038, "total_steps": 10853, "loss": 0.1624, "learning_rate": 4.311643324536195e-06, "epoch": 0.2799097065462754, "percentage": 27.99, "elapsed_time": "9:36:08", "remaining_time": "1 day, 0:42:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3039, "total_steps": 10853, "loss": 0.1684, "learning_rate": 4.311118288691859e-06, "epoch": 0.2800018427235454, "percentage": 28.0, "elapsed_time": "9:36:19", "remaining_time": "1 day, 0:41:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3040, "total_steps": 10853, "loss": 0.1714, "learning_rate": 4.3105930846849945e-06, "epoch": 0.2800939789008154, "percentage": 28.01, "elapsed_time": "9:36:30", "remaining_time": "1 day, 0:41:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3041, "total_steps": 10853, "loss": 0.1448, "learning_rate": 4.310067712564367e-06, "epoch": 0.2801861150780854, "percentage": 28.02, "elapsed_time": "9:36:40", "remaining_time": "1 day, 0:41:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3042, "total_steps": 10853, "loss": 0.1672, "learning_rate": 4.3095421723787585e-06, "epoch": 0.28027825125535544, "percentage": 28.03, "elapsed_time": "9:36:52", "remaining_time": "1 day, 0:41:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3043, "total_steps": 10853, "loss": 0.1653, "learning_rate": 4.309016464176964e-06, "epoch": 0.28037038743262543, "percentage": 28.04, "elapsed_time": "9:37:03", "remaining_time": "1 day, 0:41:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3044, "total_steps": 10853, "loss": 0.1634, "learning_rate": 4.308490588007796e-06, "epoch": 0.28046252360989543, "percentage": 28.05, "elapsed_time": "9:37:15", "remaining_time": "1 day, 0:40:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3045, "total_steps": 10853, "loss": 0.1662, "learning_rate": 4.307964543920083e-06, "epoch": 0.28055465978716543, "percentage": 28.06, "elapsed_time": "9:37:26", "remaining_time": "1 day, 0:40:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3046, "total_steps": 10853, "loss": 0.1594, "learning_rate": 4.3074383319626655e-06, "epoch": 0.2806467959644354, "percentage": 28.07, "elapsed_time": "9:37:35", "remaining_time": "1 day, 0:40:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3047, "total_steps": 10853, "loss": 0.1487, "learning_rate": 4.306911952184406e-06, "epoch": 0.2807389321417054, "percentage": 28.08, "elapsed_time": "9:37:46", "remaining_time": "1 day, 0:40:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3048, "total_steps": 10853, "loss": 0.1786, "learning_rate": 4.306385404634177e-06, "epoch": 0.2808310683189754, "percentage": 28.08, "elapsed_time": "9:37:56", "remaining_time": "1 day, 0:39:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3049, "total_steps": 10853, "loss": 0.1492, "learning_rate": 4.305858689360869e-06, "epoch": 0.28092320449624547, "percentage": 28.09, "elapsed_time": "9:38:06", "remaining_time": "1 day, 0:39:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3050, "total_steps": 10853, "loss": 0.1637, "learning_rate": 4.3053318064133864e-06, "epoch": 0.28101534067351547, "percentage": 28.1, "elapsed_time": "9:38:16", "remaining_time": "1 day, 0:39:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3051, "total_steps": 10853, "loss": 0.159, "learning_rate": 4.3048047558406525e-06, "epoch": 0.28110747685078546, "percentage": 28.11, "elapsed_time": "9:38:26", "remaining_time": "1 day, 0:39:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3052, "total_steps": 10853, "loss": 0.1589, "learning_rate": 4.304277537691602e-06, "epoch": 0.28119961302805546, "percentage": 28.12, "elapsed_time": "9:38:37", "remaining_time": "1 day, 0:38:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3053, "total_steps": 10853, "loss": 0.1675, "learning_rate": 4.303750152015188e-06, "epoch": 0.28129174920532546, "percentage": 28.13, "elapsed_time": "9:38:49", "remaining_time": "1 day, 0:38:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3054, "total_steps": 10853, "loss": 0.1537, "learning_rate": 4.3032225988603786e-06, "epoch": 0.28138388538259546, "percentage": 28.14, "elapsed_time": "9:39:00", "remaining_time": "1 day, 0:38:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3055, "total_steps": 10853, "loss": 0.1679, "learning_rate": 4.302694878276157e-06, "epoch": 0.2814760215598655, "percentage": 28.15, "elapsed_time": "9:39:11", "remaining_time": "1 day, 0:38:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3056, "total_steps": 10853, "loss": 0.1825, "learning_rate": 4.302166990311522e-06, "epoch": 0.2815681577371355, "percentage": 28.16, "elapsed_time": "9:39:23", "remaining_time": "1 day, 0:38:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3057, "total_steps": 10853, "loss": 0.1456, "learning_rate": 4.301638935015487e-06, "epoch": 0.2816602939144055, "percentage": 28.17, "elapsed_time": "9:39:34", "remaining_time": "1 day, 0:38:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3058, "total_steps": 10853, "loss": 0.1498, "learning_rate": 4.3011107124370835e-06, "epoch": 0.2817524300916755, "percentage": 28.18, "elapsed_time": "9:39:44", "remaining_time": "1 day, 0:37:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3059, "total_steps": 10853, "loss": 0.1524, "learning_rate": 4.300582322625356e-06, "epoch": 0.2818445662689455, "percentage": 28.19, "elapsed_time": "9:39:55", "remaining_time": "1 day, 0:37:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3060, "total_steps": 10853, "loss": 0.1708, "learning_rate": 4.300053765629367e-06, "epoch": 0.2819367024462155, "percentage": 28.19, "elapsed_time": "9:40:07", "remaining_time": "1 day, 0:37:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3061, "total_steps": 10853, "loss": 0.149, "learning_rate": 4.299525041498192e-06, "epoch": 0.2820288386234855, "percentage": 28.2, "elapsed_time": "9:40:17", "remaining_time": "1 day, 0:37:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3062, "total_steps": 10853, "loss": 0.1581, "learning_rate": 4.298996150280923e-06, "epoch": 0.28212097480075554, "percentage": 28.21, "elapsed_time": "9:40:30", "remaining_time": "1 day, 0:37:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3063, "total_steps": 10853, "loss": 0.1677, "learning_rate": 4.298467092026668e-06, "epoch": 0.28221311097802554, "percentage": 28.22, "elapsed_time": "9:40:41", "remaining_time": "1 day, 0:36:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3064, "total_steps": 10853, "loss": 0.1517, "learning_rate": 4.29793786678455e-06, "epoch": 0.28230524715529554, "percentage": 28.23, "elapsed_time": "9:40:52", "remaining_time": "1 day, 0:36:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3065, "total_steps": 10853, "loss": 0.1738, "learning_rate": 4.297408474603707e-06, "epoch": 0.28239738333256553, "percentage": 28.24, "elapsed_time": "9:41:02", "remaining_time": "1 day, 0:36:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3066, "total_steps": 10853, "loss": 0.1703, "learning_rate": 4.296878915533294e-06, "epoch": 0.28248951950983553, "percentage": 28.25, "elapsed_time": "9:41:13", "remaining_time": "1 day, 0:36:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3067, "total_steps": 10853, "loss": 0.1541, "learning_rate": 4.2963491896224806e-06, "epoch": 0.2825816556871055, "percentage": 28.26, "elapsed_time": "9:41:24", "remaining_time": "1 day, 0:35:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3068, "total_steps": 10853, "loss": 0.1602, "learning_rate": 4.295819296920451e-06, "epoch": 0.2826737918643755, "percentage": 28.27, "elapsed_time": "9:41:34", "remaining_time": "1 day, 0:35:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3069, "total_steps": 10853, "loss": 0.1623, "learning_rate": 4.295289237476407e-06, "epoch": 0.2827659280416456, "percentage": 28.28, "elapsed_time": "9:41:43", "remaining_time": "1 day, 0:35:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3070, "total_steps": 10853, "loss": 0.1574, "learning_rate": 4.294759011339564e-06, "epoch": 0.2828580642189156, "percentage": 28.29, "elapsed_time": "9:41:53", "remaining_time": "1 day, 0:35:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3071, "total_steps": 10853, "loss": 0.178, "learning_rate": 4.294228618559153e-06, "epoch": 0.28295020039618557, "percentage": 28.3, "elapsed_time": "9:42:03", "remaining_time": "1 day, 0:34:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3072, "total_steps": 10853, "loss": 0.1549, "learning_rate": 4.293698059184423e-06, "epoch": 0.28304233657345557, "percentage": 28.31, "elapsed_time": "9:42:14", "remaining_time": "1 day, 0:34:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3073, "total_steps": 10853, "loss": 0.1516, "learning_rate": 4.293167333264634e-06, "epoch": 0.28313447275072556, "percentage": 28.31, "elapsed_time": "9:42:25", "remaining_time": "1 day, 0:34:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3074, "total_steps": 10853, "loss": 0.1559, "learning_rate": 4.292636440849065e-06, "epoch": 0.28322660892799556, "percentage": 28.32, "elapsed_time": "9:42:34", "remaining_time": "1 day, 0:34:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3075, "total_steps": 10853, "loss": 0.1531, "learning_rate": 4.292105381987011e-06, "epoch": 0.28331874510526556, "percentage": 28.33, "elapsed_time": "9:42:46", "remaining_time": "1 day, 0:34:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3076, "total_steps": 10853, "loss": 0.1823, "learning_rate": 4.291574156727778e-06, "epoch": 0.2834108812825356, "percentage": 28.34, "elapsed_time": "9:42:57", "remaining_time": "1 day, 0:33:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3077, "total_steps": 10853, "loss": 0.1551, "learning_rate": 4.291042765120693e-06, "epoch": 0.2835030174598056, "percentage": 28.35, "elapsed_time": "9:43:10", "remaining_time": "1 day, 0:33:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3078, "total_steps": 10853, "loss": 0.1562, "learning_rate": 4.290511207215093e-06, "epoch": 0.2835951536370756, "percentage": 28.36, "elapsed_time": "9:43:20", "remaining_time": "1 day, 0:33:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3079, "total_steps": 10853, "loss": 0.1643, "learning_rate": 4.289979483060336e-06, "epoch": 0.2836872898143456, "percentage": 28.37, "elapsed_time": "9:43:29", "remaining_time": "1 day, 0:33:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3080, "total_steps": 10853, "loss": 0.151, "learning_rate": 4.289447592705791e-06, "epoch": 0.2837794259916156, "percentage": 28.38, "elapsed_time": "9:43:40", "remaining_time": "1 day, 0:33:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3081, "total_steps": 10853, "loss": 0.1724, "learning_rate": 4.2889155362008435e-06, "epoch": 0.2838715621688856, "percentage": 28.39, "elapsed_time": "9:43:51", "remaining_time": "1 day, 0:32:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3082, "total_steps": 10853, "loss": 0.1571, "learning_rate": 4.288383313594897e-06, "epoch": 0.2839636983461556, "percentage": 28.4, "elapsed_time": "9:44:01", "remaining_time": "1 day, 0:32:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3083, "total_steps": 10853, "loss": 0.1625, "learning_rate": 4.287850924937367e-06, "epoch": 0.28405583452342564, "percentage": 28.41, "elapsed_time": "9:44:12", "remaining_time": "1 day, 0:32:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3084, "total_steps": 10853, "loss": 0.1598, "learning_rate": 4.287318370277686e-06, "epoch": 0.28414797070069564, "percentage": 28.42, "elapsed_time": "9:44:23", "remaining_time": "1 day, 0:32:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3085, "total_steps": 10853, "loss": 0.1428, "learning_rate": 4.286785649665302e-06, "epoch": 0.28424010687796564, "percentage": 28.43, "elapsed_time": "9:44:33", "remaining_time": "1 day, 0:31:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3086, "total_steps": 10853, "loss": 0.1726, "learning_rate": 4.286252763149679e-06, "epoch": 0.28433224305523563, "percentage": 28.43, "elapsed_time": "9:44:43", "remaining_time": "1 day, 0:31:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3087, "total_steps": 10853, "loss": 0.1628, "learning_rate": 4.2857197107802936e-06, "epoch": 0.28442437923250563, "percentage": 28.44, "elapsed_time": "9:44:53", "remaining_time": "1 day, 0:31:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3088, "total_steps": 10853, "loss": 0.1553, "learning_rate": 4.285186492606641e-06, "epoch": 0.2845165154097756, "percentage": 28.45, "elapsed_time": "9:45:04", "remaining_time": "1 day, 0:31:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3089, "total_steps": 10853, "loss": 0.1475, "learning_rate": 4.2846531086782315e-06, "epoch": 0.2846086515870457, "percentage": 28.46, "elapsed_time": "9:45:16", "remaining_time": "1 day, 0:31:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3090, "total_steps": 10853, "loss": 0.1622, "learning_rate": 4.2841195590445875e-06, "epoch": 0.2847007877643157, "percentage": 28.47, "elapsed_time": "9:45:26", "remaining_time": "1 day, 0:30:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3091, "total_steps": 10853, "loss": 0.1593, "learning_rate": 4.283585843755251e-06, "epoch": 0.2847929239415857, "percentage": 28.48, "elapsed_time": "9:45:37", "remaining_time": "1 day, 0:30:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3092, "total_steps": 10853, "loss": 0.1587, "learning_rate": 4.283051962859776e-06, "epoch": 0.28488506011885567, "percentage": 28.49, "elapsed_time": "9:45:47", "remaining_time": "1 day, 0:30:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3093, "total_steps": 10853, "loss": 0.1807, "learning_rate": 4.2825179164077365e-06, "epoch": 0.28497719629612567, "percentage": 28.5, "elapsed_time": "9:45:59", "remaining_time": "1 day, 0:30:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3094, "total_steps": 10853, "loss": 0.1543, "learning_rate": 4.281983704448715e-06, "epoch": 0.28506933247339566, "percentage": 28.51, "elapsed_time": "9:46:08", "remaining_time": "1 day, 0:29:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3095, "total_steps": 10853, "loss": 0.1634, "learning_rate": 4.281449327032315e-06, "epoch": 0.28516146865066566, "percentage": 28.52, "elapsed_time": "9:46:19", "remaining_time": "1 day, 0:29:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3096, "total_steps": 10853, "loss": 0.1497, "learning_rate": 4.2809147842081535e-06, "epoch": 0.2852536048279357, "percentage": 28.53, "elapsed_time": "9:46:29", "remaining_time": "1 day, 0:29:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3097, "total_steps": 10853, "loss": 0.1553, "learning_rate": 4.280380076025863e-06, "epoch": 0.2853457410052057, "percentage": 28.54, "elapsed_time": "9:46:40", "remaining_time": "1 day, 0:29:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3098, "total_steps": 10853, "loss": 0.1746, "learning_rate": 4.27984520253509e-06, "epoch": 0.2854378771824757, "percentage": 28.55, "elapsed_time": "9:46:52", "remaining_time": "1 day, 0:29:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3099, "total_steps": 10853, "loss": 0.1672, "learning_rate": 4.279310163785499e-06, "epoch": 0.2855300133597457, "percentage": 28.55, "elapsed_time": "9:47:03", "remaining_time": "1 day, 0:28:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3100, "total_steps": 10853, "loss": 0.154, "learning_rate": 4.278774959826768e-06, "epoch": 0.2856221495370157, "percentage": 28.56, "elapsed_time": "9:47:14", "remaining_time": "1 day, 0:28:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3101, "total_steps": 10853, "loss": 0.1978, "learning_rate": 4.2782395907085894e-06, "epoch": 0.2857142857142857, "percentage": 28.57, "elapsed_time": "9:47:26", "remaining_time": "1 day, 0:28:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3102, "total_steps": 10853, "loss": 0.1711, "learning_rate": 4.277704056480674e-06, "epoch": 0.2858064218915557, "percentage": 28.58, "elapsed_time": "9:47:38", "remaining_time": "1 day, 0:28:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3103, "total_steps": 10853, "loss": 0.1785, "learning_rate": 4.2771683571927455e-06, "epoch": 0.28589855806882575, "percentage": 28.59, "elapsed_time": "9:47:49", "remaining_time": "1 day, 0:28:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3104, "total_steps": 10853, "loss": 0.1484, "learning_rate": 4.276632492894544e-06, "epoch": 0.28599069424609574, "percentage": 28.6, "elapsed_time": "9:48:00", "remaining_time": "1 day, 0:27:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3105, "total_steps": 10853, "loss": 0.1653, "learning_rate": 4.276096463635825e-06, "epoch": 0.28608283042336574, "percentage": 28.61, "elapsed_time": "9:48:12", "remaining_time": "1 day, 0:27:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3106, "total_steps": 10853, "loss": 0.1673, "learning_rate": 4.275560269466358e-06, "epoch": 0.28617496660063574, "percentage": 28.62, "elapsed_time": "9:48:22", "remaining_time": "1 day, 0:27:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3107, "total_steps": 10853, "loss": 0.1537, "learning_rate": 4.275023910435928e-06, "epoch": 0.28626710277790574, "percentage": 28.63, "elapsed_time": "9:48:32", "remaining_time": "1 day, 0:27:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3108, "total_steps": 10853, "loss": 0.1538, "learning_rate": 4.274487386594338e-06, "epoch": 0.28635923895517573, "percentage": 28.64, "elapsed_time": "9:48:42", "remaining_time": "1 day, 0:27:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3109, "total_steps": 10853, "loss": 0.162, "learning_rate": 4.273950697991402e-06, "epoch": 0.28645137513244573, "percentage": 28.65, "elapsed_time": "9:48:53", "remaining_time": "1 day, 0:26:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3110, "total_steps": 10853, "loss": 0.1519, "learning_rate": 4.273413844676953e-06, "epoch": 0.2865435113097158, "percentage": 28.66, "elapsed_time": "9:49:02", "remaining_time": "1 day, 0:26:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3111, "total_steps": 10853, "loss": 0.1581, "learning_rate": 4.272876826700838e-06, "epoch": 0.2866356474869858, "percentage": 28.66, "elapsed_time": "9:49:14", "remaining_time": "1 day, 0:26:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3112, "total_steps": 10853, "loss": 0.1677, "learning_rate": 4.27233964411292e-06, "epoch": 0.2867277836642558, "percentage": 28.67, "elapsed_time": "9:49:24", "remaining_time": "1 day, 0:26:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3113, "total_steps": 10853, "loss": 0.1476, "learning_rate": 4.271802296963073e-06, "epoch": 0.28681991984152577, "percentage": 28.68, "elapsed_time": "9:49:35", "remaining_time": "1 day, 0:25:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3114, "total_steps": 10853, "loss": 0.1564, "learning_rate": 4.271264785301194e-06, "epoch": 0.28691205601879577, "percentage": 28.69, "elapsed_time": "9:49:47", "remaining_time": "1 day, 0:25:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3115, "total_steps": 10853, "loss": 0.17, "learning_rate": 4.270727109177188e-06, "epoch": 0.28700419219606577, "percentage": 28.7, "elapsed_time": "9:49:59", "remaining_time": "1 day, 0:25:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3116, "total_steps": 10853, "loss": 0.1626, "learning_rate": 4.270189268640979e-06, "epoch": 0.28709632837333576, "percentage": 28.71, "elapsed_time": "9:50:10", "remaining_time": "1 day, 0:25:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3117, "total_steps": 10853, "loss": 0.1634, "learning_rate": 4.269651263742507e-06, "epoch": 0.2871884645506058, "percentage": 28.72, "elapsed_time": "9:50:23", "remaining_time": "1 day, 0:25:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3118, "total_steps": 10853, "loss": 0.1679, "learning_rate": 4.269113094531724e-06, "epoch": 0.2872806007278758, "percentage": 28.73, "elapsed_time": "9:50:33", "remaining_time": "1 day, 0:25:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3119, "total_steps": 10853, "loss": 0.1763, "learning_rate": 4.268574761058601e-06, "epoch": 0.2873727369051458, "percentage": 28.74, "elapsed_time": "9:50:44", "remaining_time": "1 day, 0:24:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3120, "total_steps": 10853, "loss": 0.1546, "learning_rate": 4.26803626337312e-06, "epoch": 0.2874648730824158, "percentage": 28.75, "elapsed_time": "9:50:54", "remaining_time": "1 day, 0:24:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3121, "total_steps": 10853, "loss": 0.1687, "learning_rate": 4.267497601525281e-06, "epoch": 0.2875570092596858, "percentage": 28.76, "elapsed_time": "9:51:05", "remaining_time": "1 day, 0:24:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3122, "total_steps": 10853, "loss": 0.1401, "learning_rate": 4.266958775565101e-06, "epoch": 0.2876491454369558, "percentage": 28.77, "elapsed_time": "9:51:16", "remaining_time": "1 day, 0:24:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3123, "total_steps": 10853, "loss": 0.1626, "learning_rate": 4.266419785542607e-06, "epoch": 0.28774128161422585, "percentage": 28.78, "elapsed_time": "9:51:27", "remaining_time": "1 day, 0:23:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3124, "total_steps": 10853, "loss": 0.162, "learning_rate": 4.265880631507847e-06, "epoch": 0.28783341779149585, "percentage": 28.78, "elapsed_time": "9:51:38", "remaining_time": "1 day, 0:23:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3125, "total_steps": 10853, "loss": 0.163, "learning_rate": 4.265341313510879e-06, "epoch": 0.28792555396876585, "percentage": 28.79, "elapsed_time": "9:51:48", "remaining_time": "1 day, 0:23:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3126, "total_steps": 10853, "loss": 0.17, "learning_rate": 4.264801831601781e-06, "epoch": 0.28801769014603584, "percentage": 28.8, "elapsed_time": "9:51:59", "remaining_time": "1 day, 0:23:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3127, "total_steps": 10853, "loss": 0.1498, "learning_rate": 4.264262185830643e-06, "epoch": 0.28810982632330584, "percentage": 28.81, "elapsed_time": "9:52:10", "remaining_time": "1 day, 0:23:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3128, "total_steps": 10853, "loss": 0.1683, "learning_rate": 4.263722376247571e-06, "epoch": 0.28820196250057584, "percentage": 28.82, "elapsed_time": "9:52:21", "remaining_time": "1 day, 0:22:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3129, "total_steps": 10853, "loss": 0.154, "learning_rate": 4.263182402902687e-06, "epoch": 0.28829409867784583, "percentage": 28.83, "elapsed_time": "9:52:32", "remaining_time": "1 day, 0:22:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3130, "total_steps": 10853, "loss": 0.1479, "learning_rate": 4.262642265846127e-06, "epoch": 0.2883862348551159, "percentage": 28.84, "elapsed_time": "9:52:42", "remaining_time": "1 day, 0:22:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3131, "total_steps": 10853, "loss": 0.159, "learning_rate": 4.262101965128042e-06, "epoch": 0.2884783710323859, "percentage": 28.85, "elapsed_time": "9:52:53", "remaining_time": "1 day, 0:22:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3132, "total_steps": 10853, "loss": 0.1612, "learning_rate": 4.261561500798601e-06, "epoch": 0.2885705072096559, "percentage": 28.86, "elapsed_time": "9:53:04", "remaining_time": "1 day, 0:22:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3133, "total_steps": 10853, "loss": 0.1582, "learning_rate": 4.261020872907985e-06, "epoch": 0.2886626433869259, "percentage": 28.87, "elapsed_time": "9:53:15", "remaining_time": "1 day, 0:21:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3134, "total_steps": 10853, "loss": 0.164, "learning_rate": 4.26048008150639e-06, "epoch": 0.2887547795641959, "percentage": 28.88, "elapsed_time": "9:53:25", "remaining_time": "1 day, 0:21:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3135, "total_steps": 10853, "loss": 0.1679, "learning_rate": 4.259939126644032e-06, "epoch": 0.28884691574146587, "percentage": 28.89, "elapsed_time": "9:53:36", "remaining_time": "1 day, 0:21:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3136, "total_steps": 10853, "loss": 0.1676, "learning_rate": 4.259398008371136e-06, "epoch": 0.28893905191873587, "percentage": 28.9, "elapsed_time": "9:53:48", "remaining_time": "1 day, 0:21:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3137, "total_steps": 10853, "loss": 0.1492, "learning_rate": 4.258856726737945e-06, "epoch": 0.2890311880960059, "percentage": 28.9, "elapsed_time": "9:53:59", "remaining_time": "1 day, 0:21:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3138, "total_steps": 10853, "loss": 0.1631, "learning_rate": 4.258315281794718e-06, "epoch": 0.2891233242732759, "percentage": 28.91, "elapsed_time": "9:54:09", "remaining_time": "1 day, 0:20:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3139, "total_steps": 10853, "loss": 0.1498, "learning_rate": 4.257773673591728e-06, "epoch": 0.2892154604505459, "percentage": 28.92, "elapsed_time": "9:54:22", "remaining_time": "1 day, 0:20:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3140, "total_steps": 10853, "loss": 0.1504, "learning_rate": 4.257231902179263e-06, "epoch": 0.2893075966278159, "percentage": 28.93, "elapsed_time": "9:54:30", "remaining_time": "1 day, 0:20:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3141, "total_steps": 10853, "loss": 0.1725, "learning_rate": 4.256689967607627e-06, "epoch": 0.2893997328050859, "percentage": 28.94, "elapsed_time": "9:54:41", "remaining_time": "1 day, 0:20:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3142, "total_steps": 10853, "loss": 0.1581, "learning_rate": 4.256147869927137e-06, "epoch": 0.2894918689823559, "percentage": 28.95, "elapsed_time": "9:54:52", "remaining_time": "1 day, 0:19:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3143, "total_steps": 10853, "loss": 0.1602, "learning_rate": 4.25560560918813e-06, "epoch": 0.2895840051596259, "percentage": 28.96, "elapsed_time": "9:55:05", "remaining_time": "1 day, 0:19:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3144, "total_steps": 10853, "loss": 0.1654, "learning_rate": 4.255063185440953e-06, "epoch": 0.28967614133689595, "percentage": 28.97, "elapsed_time": "9:55:15", "remaining_time": "1 day, 0:19:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3145, "total_steps": 10853, "loss": 0.1824, "learning_rate": 4.254520598735971e-06, "epoch": 0.28976827751416595, "percentage": 28.98, "elapsed_time": "9:55:25", "remaining_time": "1 day, 0:19:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3146, "total_steps": 10853, "loss": 0.1612, "learning_rate": 4.253977849123561e-06, "epoch": 0.28986041369143595, "percentage": 28.99, "elapsed_time": "9:55:35", "remaining_time": "1 day, 0:19:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3147, "total_steps": 10853, "loss": 0.15, "learning_rate": 4.25343493665412e-06, "epoch": 0.28995254986870594, "percentage": 29.0, "elapsed_time": "9:55:46", "remaining_time": "1 day, 0:18:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3148, "total_steps": 10853, "loss": 0.1682, "learning_rate": 4.252891861378056e-06, "epoch": 0.29004468604597594, "percentage": 29.01, "elapsed_time": "9:55:57", "remaining_time": "1 day, 0:18:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3149, "total_steps": 10853, "loss": 0.1724, "learning_rate": 4.252348623345794e-06, "epoch": 0.29013682222324594, "percentage": 29.02, "elapsed_time": "9:56:08", "remaining_time": "1 day, 0:18:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3150, "total_steps": 10853, "loss": 0.1471, "learning_rate": 4.2518052226077734e-06, "epoch": 0.29022895840051594, "percentage": 29.02, "elapsed_time": "9:56:18", "remaining_time": "1 day, 0:18:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3151, "total_steps": 10853, "loss": 0.1586, "learning_rate": 4.25126165921445e-06, "epoch": 0.290321094577786, "percentage": 29.03, "elapsed_time": "9:56:30", "remaining_time": "1 day, 0:18:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3152, "total_steps": 10853, "loss": 0.1485, "learning_rate": 4.250717933216293e-06, "epoch": 0.290413230755056, "percentage": 29.04, "elapsed_time": "9:56:42", "remaining_time": "1 day, 0:17:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3153, "total_steps": 10853, "loss": 0.1641, "learning_rate": 4.250174044663787e-06, "epoch": 0.290505366932326, "percentage": 29.05, "elapsed_time": "9:56:52", "remaining_time": "1 day, 0:17:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3154, "total_steps": 10853, "loss": 0.1602, "learning_rate": 4.249629993607433e-06, "epoch": 0.290597503109596, "percentage": 29.06, "elapsed_time": "9:57:02", "remaining_time": "1 day, 0:17:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3155, "total_steps": 10853, "loss": 0.1506, "learning_rate": 4.249085780097746e-06, "epoch": 0.290689639286866, "percentage": 29.07, "elapsed_time": "9:57:13", "remaining_time": "1 day, 0:17:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3156, "total_steps": 10853, "loss": 0.1575, "learning_rate": 4.248541404185255e-06, "epoch": 0.29078177546413597, "percentage": 29.08, "elapsed_time": "9:57:23", "remaining_time": "1 day, 0:16:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3157, "total_steps": 10853, "loss": 0.1676, "learning_rate": 4.247996865920509e-06, "epoch": 0.290873911641406, "percentage": 29.09, "elapsed_time": "9:57:34", "remaining_time": "1 day, 0:16:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3158, "total_steps": 10853, "loss": 0.1757, "learning_rate": 4.247452165354064e-06, "epoch": 0.290966047818676, "percentage": 29.1, "elapsed_time": "9:57:44", "remaining_time": "1 day, 0:16:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3159, "total_steps": 10853, "loss": 0.1503, "learning_rate": 4.246907302536497e-06, "epoch": 0.291058183995946, "percentage": 29.11, "elapsed_time": "9:57:55", "remaining_time": "1 day, 0:16:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3160, "total_steps": 10853, "loss": 0.1633, "learning_rate": 4.246362277518399e-06, "epoch": 0.291150320173216, "percentage": 29.12, "elapsed_time": "9:58:06", "remaining_time": "1 day, 0:16:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3161, "total_steps": 10853, "loss": 0.1507, "learning_rate": 4.245817090350377e-06, "epoch": 0.291242456350486, "percentage": 29.13, "elapsed_time": "9:58:17", "remaining_time": "1 day, 0:15:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3162, "total_steps": 10853, "loss": 0.1669, "learning_rate": 4.245271741083049e-06, "epoch": 0.291334592527756, "percentage": 29.13, "elapsed_time": "9:58:29", "remaining_time": "1 day, 0:15:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3163, "total_steps": 10853, "loss": 0.1826, "learning_rate": 4.244726229767052e-06, "epoch": 0.291426728705026, "percentage": 29.14, "elapsed_time": "9:58:40", "remaining_time": "1 day, 0:15:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3164, "total_steps": 10853, "loss": 0.1501, "learning_rate": 4.2441805564530366e-06, "epoch": 0.29151886488229606, "percentage": 29.15, "elapsed_time": "9:58:49", "remaining_time": "1 day, 0:15:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3165, "total_steps": 10853, "loss": 0.1639, "learning_rate": 4.2436347211916695e-06, "epoch": 0.29161100105956606, "percentage": 29.16, "elapsed_time": "9:59:01", "remaining_time": "1 day, 0:15:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3166, "total_steps": 10853, "loss": 0.1586, "learning_rate": 4.243088724033632e-06, "epoch": 0.29170313723683605, "percentage": 29.17, "elapsed_time": "9:59:11", "remaining_time": "1 day, 0:14:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3167, "total_steps": 10853, "loss": 0.1676, "learning_rate": 4.242542565029617e-06, "epoch": 0.29179527341410605, "percentage": 29.18, "elapsed_time": "9:59:21", "remaining_time": "1 day, 0:14:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3168, "total_steps": 10853, "loss": 0.1572, "learning_rate": 4.241996244230338e-06, "epoch": 0.29188740959137605, "percentage": 29.19, "elapsed_time": "9:59:32", "remaining_time": "1 day, 0:14:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3169, "total_steps": 10853, "loss": 0.1552, "learning_rate": 4.24144976168652e-06, "epoch": 0.29197954576864604, "percentage": 29.2, "elapsed_time": "9:59:42", "remaining_time": "1 day, 0:14:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3170, "total_steps": 10853, "loss": 0.1608, "learning_rate": 4.240903117448904e-06, "epoch": 0.29207168194591604, "percentage": 29.21, "elapsed_time": "9:59:54", "remaining_time": "1 day, 0:13:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3171, "total_steps": 10853, "loss": 0.1454, "learning_rate": 4.240356311568247e-06, "epoch": 0.2921638181231861, "percentage": 29.22, "elapsed_time": "10:00:06", "remaining_time": "1 day, 0:13:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3172, "total_steps": 10853, "loss": 0.1645, "learning_rate": 4.239809344095319e-06, "epoch": 0.2922559543004561, "percentage": 29.23, "elapsed_time": "10:00:18", "remaining_time": "1 day, 0:13:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3173, "total_steps": 10853, "loss": 0.1584, "learning_rate": 4.239262215080906e-06, "epoch": 0.2923480904777261, "percentage": 29.24, "elapsed_time": "10:00:29", "remaining_time": "1 day, 0:13:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3174, "total_steps": 10853, "loss": 0.185, "learning_rate": 4.238714924575809e-06, "epoch": 0.2924402266549961, "percentage": 29.25, "elapsed_time": "10:00:41", "remaining_time": "1 day, 0:13:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3175, "total_steps": 10853, "loss": 0.1475, "learning_rate": 4.238167472630844e-06, "epoch": 0.2925323628322661, "percentage": 29.25, "elapsed_time": "10:00:51", "remaining_time": "1 day, 0:13:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3176, "total_steps": 10853, "loss": 0.1615, "learning_rate": 4.237619859296842e-06, "epoch": 0.2926244990095361, "percentage": 29.26, "elapsed_time": "10:01:01", "remaining_time": "1 day, 0:12:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3177, "total_steps": 10853, "loss": 0.141, "learning_rate": 4.237072084624649e-06, "epoch": 0.2927166351868061, "percentage": 29.27, "elapsed_time": "10:01:11", "remaining_time": "1 day, 0:12:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3178, "total_steps": 10853, "loss": 0.1543, "learning_rate": 4.2365241486651275e-06, "epoch": 0.2928087713640761, "percentage": 29.28, "elapsed_time": "10:01:21", "remaining_time": "1 day, 0:12:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3179, "total_steps": 10853, "loss": 0.1626, "learning_rate": 4.235976051469151e-06, "epoch": 0.2929009075413461, "percentage": 29.29, "elapsed_time": "10:01:33", "remaining_time": "1 day, 0:12:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3180, "total_steps": 10853, "loss": 0.1429, "learning_rate": 4.23542779308761e-06, "epoch": 0.2929930437186161, "percentage": 29.3, "elapsed_time": "10:01:42", "remaining_time": "1 day, 0:11:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3181, "total_steps": 10853, "loss": 0.162, "learning_rate": 4.234879373571413e-06, "epoch": 0.2930851798958861, "percentage": 29.31, "elapsed_time": "10:01:53", "remaining_time": "1 day, 0:11:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3182, "total_steps": 10853, "loss": 0.1632, "learning_rate": 4.234330792971479e-06, "epoch": 0.2931773160731561, "percentage": 29.32, "elapsed_time": "10:02:04", "remaining_time": "1 day, 0:11:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3183, "total_steps": 10853, "loss": 0.1617, "learning_rate": 4.233782051338745e-06, "epoch": 0.2932694522504261, "percentage": 29.33, "elapsed_time": "10:02:16", "remaining_time": "1 day, 0:11:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3184, "total_steps": 10853, "loss": 0.1533, "learning_rate": 4.23323314872416e-06, "epoch": 0.2933615884276961, "percentage": 29.34, "elapsed_time": "10:02:26", "remaining_time": "1 day, 0:11:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3185, "total_steps": 10853, "loss": 0.1649, "learning_rate": 4.232684085178691e-06, "epoch": 0.29345372460496616, "percentage": 29.35, "elapsed_time": "10:02:37", "remaining_time": "1 day, 0:10:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3186, "total_steps": 10853, "loss": 0.1673, "learning_rate": 4.232134860753318e-06, "epoch": 0.29354586078223616, "percentage": 29.36, "elapsed_time": "10:02:49", "remaining_time": "1 day, 0:10:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3187, "total_steps": 10853, "loss": 0.1448, "learning_rate": 4.231585475499037e-06, "epoch": 0.29363799695950615, "percentage": 29.37, "elapsed_time": "10:02:59", "remaining_time": "1 day, 0:10:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3188, "total_steps": 10853, "loss": 0.1595, "learning_rate": 4.231035929466858e-06, "epoch": 0.29373013313677615, "percentage": 29.37, "elapsed_time": "10:03:10", "remaining_time": "1 day, 0:10:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3189, "total_steps": 10853, "loss": 0.1527, "learning_rate": 4.230486222707807e-06, "epoch": 0.29382226931404615, "percentage": 29.38, "elapsed_time": "10:03:22", "remaining_time": "1 day, 0:10:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3190, "total_steps": 10853, "loss": 0.1617, "learning_rate": 4.229936355272924e-06, "epoch": 0.29391440549131614, "percentage": 29.39, "elapsed_time": "10:03:34", "remaining_time": "1 day, 0:09:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3191, "total_steps": 10853, "loss": 0.1611, "learning_rate": 4.229386327213264e-06, "epoch": 0.2940065416685862, "percentage": 29.4, "elapsed_time": "10:03:45", "remaining_time": "1 day, 0:09:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3192, "total_steps": 10853, "loss": 0.1729, "learning_rate": 4.228836138579897e-06, "epoch": 0.2940986778458562, "percentage": 29.41, "elapsed_time": "10:03:57", "remaining_time": "1 day, 0:09:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3193, "total_steps": 10853, "loss": 0.1687, "learning_rate": 4.2282857894239085e-06, "epoch": 0.2941908140231262, "percentage": 29.42, "elapsed_time": "10:04:08", "remaining_time": "1 day, 0:09:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3194, "total_steps": 10853, "loss": 0.1628, "learning_rate": 4.227735279796399e-06, "epoch": 0.2942829502003962, "percentage": 29.43, "elapsed_time": "10:04:21", "remaining_time": "1 day, 0:09:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3195, "total_steps": 10853, "loss": 0.1693, "learning_rate": 4.227184609748483e-06, "epoch": 0.2943750863776662, "percentage": 29.44, "elapsed_time": "10:04:32", "remaining_time": "1 day, 0:08:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3196, "total_steps": 10853, "loss": 0.1508, "learning_rate": 4.226633779331289e-06, "epoch": 0.2944672225549362, "percentage": 29.45, "elapsed_time": "10:04:42", "remaining_time": "1 day, 0:08:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3197, "total_steps": 10853, "loss": 0.1453, "learning_rate": 4.226082788595965e-06, "epoch": 0.2945593587322062, "percentage": 29.46, "elapsed_time": "10:04:52", "remaining_time": "1 day, 0:08:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3198, "total_steps": 10853, "loss": 0.1563, "learning_rate": 4.225531637593666e-06, "epoch": 0.29465149490947623, "percentage": 29.47, "elapsed_time": "10:05:04", "remaining_time": "1 day, 0:08:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3199, "total_steps": 10853, "loss": 0.1743, "learning_rate": 4.2249803263755695e-06, "epoch": 0.2947436310867462, "percentage": 29.48, "elapsed_time": "10:05:16", "remaining_time": "1 day, 0:08:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3200, "total_steps": 10853, "loss": 0.1516, "learning_rate": 4.2244288549928645e-06, "epoch": 0.2948357672640162, "percentage": 29.48, "elapsed_time": "10:05:27", "remaining_time": "1 day, 0:07:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3201, "total_steps": 10853, "loss": 0.1663, "learning_rate": 4.223877223496754e-06, "epoch": 0.2949279034412862, "percentage": 29.49, "elapsed_time": "10:05:38", "remaining_time": "1 day, 0:07:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3202, "total_steps": 10853, "loss": 0.1564, "learning_rate": 4.223325431938459e-06, "epoch": 0.2950200396185562, "percentage": 29.5, "elapsed_time": "10:05:49", "remaining_time": "1 day, 0:07:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3203, "total_steps": 10853, "loss": 0.1555, "learning_rate": 4.2227734803692115e-06, "epoch": 0.2951121757958262, "percentage": 29.51, "elapsed_time": "10:05:59", "remaining_time": "1 day, 0:07:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3204, "total_steps": 10853, "loss": 0.1386, "learning_rate": 4.2222213688402605e-06, "epoch": 0.2952043119730962, "percentage": 29.52, "elapsed_time": "10:06:09", "remaining_time": "1 day, 0:07:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3205, "total_steps": 10853, "loss": 0.144, "learning_rate": 4.22166909740287e-06, "epoch": 0.29529644815036626, "percentage": 29.53, "elapsed_time": "10:06:20", "remaining_time": "1 day, 0:06:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3206, "total_steps": 10853, "loss": 0.171, "learning_rate": 4.221116666108319e-06, "epoch": 0.29538858432763626, "percentage": 29.54, "elapsed_time": "10:06:31", "remaining_time": "1 day, 0:06:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3207, "total_steps": 10853, "loss": 0.1585, "learning_rate": 4.2205640750079e-06, "epoch": 0.29548072050490626, "percentage": 29.55, "elapsed_time": "10:06:42", "remaining_time": "1 day, 0:06:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3208, "total_steps": 10853, "loss": 0.1694, "learning_rate": 4.220011324152922e-06, "epoch": 0.29557285668217625, "percentage": 29.56, "elapsed_time": "10:06:53", "remaining_time": "1 day, 0:06:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3209, "total_steps": 10853, "loss": 0.1661, "learning_rate": 4.219458413594707e-06, "epoch": 0.29566499285944625, "percentage": 29.57, "elapsed_time": "10:07:03", "remaining_time": "1 day, 0:06:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3210, "total_steps": 10853, "loss": 0.1648, "learning_rate": 4.218905343384593e-06, "epoch": 0.29575712903671625, "percentage": 29.58, "elapsed_time": "10:07:15", "remaining_time": "1 day, 0:05:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3211, "total_steps": 10853, "loss": 0.161, "learning_rate": 4.218352113573933e-06, "epoch": 0.29584926521398625, "percentage": 29.59, "elapsed_time": "10:07:25", "remaining_time": "1 day, 0:05:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3212, "total_steps": 10853, "loss": 0.176, "learning_rate": 4.217798724214094e-06, "epoch": 0.2959414013912563, "percentage": 29.6, "elapsed_time": "10:07:36", "remaining_time": "1 day, 0:05:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3213, "total_steps": 10853, "loss": 0.161, "learning_rate": 4.21724517535646e-06, "epoch": 0.2960335375685263, "percentage": 29.6, "elapsed_time": "10:07:47", "remaining_time": "1 day, 0:05:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3214, "total_steps": 10853, "loss": 0.1501, "learning_rate": 4.216691467052426e-06, "epoch": 0.2961256737457963, "percentage": 29.61, "elapsed_time": "10:07:58", "remaining_time": "1 day, 0:05:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3215, "total_steps": 10853, "loss": 0.149, "learning_rate": 4.216137599353404e-06, "epoch": 0.2962178099230663, "percentage": 29.62, "elapsed_time": "10:08:09", "remaining_time": "1 day, 0:04:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3216, "total_steps": 10853, "loss": 0.1522, "learning_rate": 4.215583572310821e-06, "epoch": 0.2963099461003363, "percentage": 29.63, "elapsed_time": "10:08:20", "remaining_time": "1 day, 0:04:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3217, "total_steps": 10853, "loss": 0.1575, "learning_rate": 4.2150293859761196e-06, "epoch": 0.2964020822776063, "percentage": 29.64, "elapsed_time": "10:08:31", "remaining_time": "1 day, 0:04:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3218, "total_steps": 10853, "loss": 0.1693, "learning_rate": 4.214475040400755e-06, "epoch": 0.29649421845487633, "percentage": 29.65, "elapsed_time": "10:08:42", "remaining_time": "1 day, 0:04:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3219, "total_steps": 10853, "loss": 0.1555, "learning_rate": 4.213920535636198e-06, "epoch": 0.29658635463214633, "percentage": 29.66, "elapsed_time": "10:08:53", "remaining_time": "1 day, 0:04:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3220, "total_steps": 10853, "loss": 0.1589, "learning_rate": 4.213365871733934e-06, "epoch": 0.29667849080941633, "percentage": 29.67, "elapsed_time": "10:09:04", "remaining_time": "1 day, 0:03:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3221, "total_steps": 10853, "loss": 0.1625, "learning_rate": 4.212811048745467e-06, "epoch": 0.2967706269866863, "percentage": 29.68, "elapsed_time": "10:09:15", "remaining_time": "1 day, 0:03:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3222, "total_steps": 10853, "loss": 0.1648, "learning_rate": 4.212256066722307e-06, "epoch": 0.2968627631639563, "percentage": 29.69, "elapsed_time": "10:09:27", "remaining_time": "1 day, 0:03:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3223, "total_steps": 10853, "loss": 0.1434, "learning_rate": 4.211700925715988e-06, "epoch": 0.2969548993412263, "percentage": 29.7, "elapsed_time": "10:09:38", "remaining_time": "1 day, 0:03:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3224, "total_steps": 10853, "loss": 0.1718, "learning_rate": 4.211145625778054e-06, "epoch": 0.2970470355184963, "percentage": 29.71, "elapsed_time": "10:09:50", "remaining_time": "1 day, 0:03:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3225, "total_steps": 10853, "loss": 0.1493, "learning_rate": 4.2105901669600645e-06, "epoch": 0.29713917169576637, "percentage": 29.72, "elapsed_time": "10:10:00", "remaining_time": "1 day, 0:02:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3226, "total_steps": 10853, "loss": 0.1537, "learning_rate": 4.210034549313594e-06, "epoch": 0.29723130787303637, "percentage": 29.72, "elapsed_time": "10:10:10", "remaining_time": "1 day, 0:02:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3227, "total_steps": 10853, "loss": 0.154, "learning_rate": 4.2094787728902305e-06, "epoch": 0.29732344405030636, "percentage": 29.73, "elapsed_time": "10:10:21", "remaining_time": "1 day, 0:02:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3228, "total_steps": 10853, "loss": 0.1653, "learning_rate": 4.20892283774158e-06, "epoch": 0.29741558022757636, "percentage": 29.74, "elapsed_time": "10:10:32", "remaining_time": "1 day, 0:02:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3229, "total_steps": 10853, "loss": 0.1628, "learning_rate": 4.20836674391926e-06, "epoch": 0.29750771640484636, "percentage": 29.75, "elapsed_time": "10:10:44", "remaining_time": "1 day, 0:02:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3230, "total_steps": 10853, "loss": 0.1741, "learning_rate": 4.207810491474904e-06, "epoch": 0.29759985258211635, "percentage": 29.76, "elapsed_time": "10:10:55", "remaining_time": "1 day, 0:01:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3231, "total_steps": 10853, "loss": 0.1759, "learning_rate": 4.207254080460161e-06, "epoch": 0.29769198875938635, "percentage": 29.77, "elapsed_time": "10:11:08", "remaining_time": "1 day, 0:01:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3232, "total_steps": 10853, "loss": 0.1538, "learning_rate": 4.206697510926691e-06, "epoch": 0.2977841249366564, "percentage": 29.78, "elapsed_time": "10:11:19", "remaining_time": "1 day, 0:01:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3233, "total_steps": 10853, "loss": 0.1721, "learning_rate": 4.206140782926174e-06, "epoch": 0.2978762611139264, "percentage": 29.79, "elapsed_time": "10:11:29", "remaining_time": "1 day, 0:01:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3234, "total_steps": 10853, "loss": 0.1595, "learning_rate": 4.205583896510303e-06, "epoch": 0.2979683972911964, "percentage": 29.8, "elapsed_time": "10:11:40", "remaining_time": "1 day, 0:01:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3235, "total_steps": 10853, "loss": 0.1639, "learning_rate": 4.2050268517307816e-06, "epoch": 0.2980605334684664, "percentage": 29.81, "elapsed_time": "10:11:51", "remaining_time": "1 day, 0:00:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3236, "total_steps": 10853, "loss": 0.1715, "learning_rate": 4.204469648639335e-06, "epoch": 0.2981526696457364, "percentage": 29.82, "elapsed_time": "10:12:03", "remaining_time": "1 day, 0:00:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3237, "total_steps": 10853, "loss": 0.1604, "learning_rate": 4.203912287287697e-06, "epoch": 0.2982448058230064, "percentage": 29.83, "elapsed_time": "10:12:15", "remaining_time": "1 day, 0:00:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3238, "total_steps": 10853, "loss": 0.1658, "learning_rate": 4.203354767727621e-06, "epoch": 0.2983369420002764, "percentage": 29.84, "elapsed_time": "10:12:27", "remaining_time": "1 day, 0:00:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3239, "total_steps": 10853, "loss": 0.1692, "learning_rate": 4.202797090010871e-06, "epoch": 0.29842907817754644, "percentage": 29.84, "elapsed_time": "10:12:38", "remaining_time": "1 day, 0:00:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3240, "total_steps": 10853, "loss": 0.1527, "learning_rate": 4.202239254189228e-06, "epoch": 0.29852121435481643, "percentage": 29.85, "elapsed_time": "10:12:49", "remaining_time": "23:59:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3241, "total_steps": 10853, "loss": 0.1768, "learning_rate": 4.2016812603144865e-06, "epoch": 0.29861335053208643, "percentage": 29.86, "elapsed_time": "10:13:00", "remaining_time": "23:59:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3242, "total_steps": 10853, "loss": 0.1609, "learning_rate": 4.201123108438457e-06, "epoch": 0.2987054867093564, "percentage": 29.87, "elapsed_time": "10:13:12", "remaining_time": "23:59:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3243, "total_steps": 10853, "loss": 0.163, "learning_rate": 4.2005647986129635e-06, "epoch": 0.2987976228866264, "percentage": 29.88, "elapsed_time": "10:13:23", "remaining_time": "23:59:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3244, "total_steps": 10853, "loss": 0.154, "learning_rate": 4.2000063308898466e-06, "epoch": 0.2988897590638964, "percentage": 29.89, "elapsed_time": "10:13:34", "remaining_time": "23:59:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3245, "total_steps": 10853, "loss": 0.159, "learning_rate": 4.199447705320958e-06, "epoch": 0.2989818952411664, "percentage": 29.9, "elapsed_time": "10:13:45", "remaining_time": "23:58:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3246, "total_steps": 10853, "loss": 0.1809, "learning_rate": 4.1988889219581676e-06, "epoch": 0.29907403141843647, "percentage": 29.91, "elapsed_time": "10:13:56", "remaining_time": "23:58:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3247, "total_steps": 10853, "loss": 0.1386, "learning_rate": 4.198329980853357e-06, "epoch": 0.29916616759570647, "percentage": 29.92, "elapsed_time": "10:14:08", "remaining_time": "23:58:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3248, "total_steps": 10853, "loss": 0.1609, "learning_rate": 4.1977708820584265e-06, "epoch": 0.29925830377297646, "percentage": 29.93, "elapsed_time": "10:14:19", "remaining_time": "23:58:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3249, "total_steps": 10853, "loss": 0.1614, "learning_rate": 4.197211625625285e-06, "epoch": 0.29935043995024646, "percentage": 29.94, "elapsed_time": "10:14:30", "remaining_time": "23:58:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3250, "total_steps": 10853, "loss": 0.1753, "learning_rate": 4.196652211605863e-06, "epoch": 0.29944257612751646, "percentage": 29.95, "elapsed_time": "10:14:41", "remaining_time": "23:57:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3251, "total_steps": 10853, "loss": 0.1743, "learning_rate": 4.196092640052099e-06, "epoch": 0.29953471230478645, "percentage": 29.95, "elapsed_time": "10:14:50", "remaining_time": "23:57:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3252, "total_steps": 10853, "loss": 0.149, "learning_rate": 4.195532911015952e-06, "epoch": 0.2996268484820565, "percentage": 29.96, "elapsed_time": "10:15:01", "remaining_time": "23:57:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3253, "total_steps": 10853, "loss": 0.166, "learning_rate": 4.1949730245493915e-06, "epoch": 0.2997189846593265, "percentage": 29.97, "elapsed_time": "10:15:12", "remaining_time": "23:57:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3254, "total_steps": 10853, "loss": 0.1683, "learning_rate": 4.194412980704403e-06, "epoch": 0.2998111208365965, "percentage": 29.98, "elapsed_time": "10:15:24", "remaining_time": "23:57:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3255, "total_steps": 10853, "loss": 0.1695, "learning_rate": 4.1938527795329875e-06, "epoch": 0.2999032570138665, "percentage": 29.99, "elapsed_time": "10:15:35", "remaining_time": "23:56:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3256, "total_steps": 10853, "loss": 0.1584, "learning_rate": 4.1932924210871585e-06, "epoch": 0.2999953931911365, "percentage": 30.0, "elapsed_time": "10:15:46", "remaining_time": "23:56:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3257, "total_steps": 10853, "loss": 0.1612, "learning_rate": 4.192731905418947e-06, "epoch": 0.3000875293684065, "percentage": 30.01, "elapsed_time": "10:15:56", "remaining_time": "23:56:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3258, "total_steps": 10853, "loss": 0.1613, "learning_rate": 4.192171232580395e-06, "epoch": 0.3001796655456765, "percentage": 30.02, "elapsed_time": "10:16:07", "remaining_time": "23:56:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3259, "total_steps": 10853, "loss": 0.1501, "learning_rate": 4.191610402623561e-06, "epoch": 0.30027180172294654, "percentage": 30.03, "elapsed_time": "10:16:18", "remaining_time": "23:56:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3260, "total_steps": 10853, "loss": 0.1732, "learning_rate": 4.191049415600521e-06, "epoch": 0.30036393790021654, "percentage": 30.04, "elapsed_time": "10:16:29", "remaining_time": "23:55:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3261, "total_steps": 10853, "loss": 0.1695, "learning_rate": 4.19048827156336e-06, "epoch": 0.30045607407748653, "percentage": 30.05, "elapsed_time": "10:16:40", "remaining_time": "23:55:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3262, "total_steps": 10853, "loss": 0.1404, "learning_rate": 4.189926970564181e-06, "epoch": 0.30054821025475653, "percentage": 30.06, "elapsed_time": "10:16:49", "remaining_time": "23:55:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3263, "total_steps": 10853, "loss": 0.1605, "learning_rate": 4.189365512655101e-06, "epoch": 0.30064034643202653, "percentage": 30.07, "elapsed_time": "10:17:00", "remaining_time": "23:55:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3264, "total_steps": 10853, "loss": 0.1489, "learning_rate": 4.188803897888251e-06, "epoch": 0.3007324826092965, "percentage": 30.07, "elapsed_time": "10:17:11", "remaining_time": "23:55:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3265, "total_steps": 10853, "loss": 0.1636, "learning_rate": 4.188242126315778e-06, "epoch": 0.3008246187865665, "percentage": 30.08, "elapsed_time": "10:17:22", "remaining_time": "23:54:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3266, "total_steps": 10853, "loss": 0.1693, "learning_rate": 4.187680197989841e-06, "epoch": 0.3009167549638366, "percentage": 30.09, "elapsed_time": "10:17:32", "remaining_time": "23:54:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3267, "total_steps": 10853, "loss": 0.1471, "learning_rate": 4.187118112962616e-06, "epoch": 0.30100889114110657, "percentage": 30.1, "elapsed_time": "10:17:42", "remaining_time": "23:54:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3268, "total_steps": 10853, "loss": 0.1405, "learning_rate": 4.186555871286293e-06, "epoch": 0.30110102731837657, "percentage": 30.11, "elapsed_time": "10:17:51", "remaining_time": "23:54:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3269, "total_steps": 10853, "loss": 0.1494, "learning_rate": 4.185993473013076e-06, "epoch": 0.30119316349564657, "percentage": 30.12, "elapsed_time": "10:18:03", "remaining_time": "23:53:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3270, "total_steps": 10853, "loss": 0.1538, "learning_rate": 4.185430918195184e-06, "epoch": 0.30128529967291656, "percentage": 30.13, "elapsed_time": "10:18:15", "remaining_time": "23:53:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3271, "total_steps": 10853, "loss": 0.1485, "learning_rate": 4.184868206884849e-06, "epoch": 0.30137743585018656, "percentage": 30.14, "elapsed_time": "10:18:25", "remaining_time": "23:53:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3272, "total_steps": 10853, "loss": 0.1771, "learning_rate": 4.18430533913432e-06, "epoch": 0.30146957202745656, "percentage": 30.15, "elapsed_time": "10:18:37", "remaining_time": "23:53:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3273, "total_steps": 10853, "loss": 0.1618, "learning_rate": 4.183742314995859e-06, "epoch": 0.3015617082047266, "percentage": 30.16, "elapsed_time": "10:18:48", "remaining_time": "23:53:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3274, "total_steps": 10853, "loss": 0.1513, "learning_rate": 4.183179134521743e-06, "epoch": 0.3016538443819966, "percentage": 30.17, "elapsed_time": "10:18:59", "remaining_time": "23:52:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3275, "total_steps": 10853, "loss": 0.1484, "learning_rate": 4.1826157977642634e-06, "epoch": 0.3017459805592666, "percentage": 30.18, "elapsed_time": "10:19:10", "remaining_time": "23:52:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3276, "total_steps": 10853, "loss": 0.1656, "learning_rate": 4.1820523047757246e-06, "epoch": 0.3018381167365366, "percentage": 30.19, "elapsed_time": "10:19:20", "remaining_time": "23:52:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3277, "total_steps": 10853, "loss": 0.1626, "learning_rate": 4.18148865560845e-06, "epoch": 0.3019302529138066, "percentage": 30.19, "elapsed_time": "10:19:32", "remaining_time": "23:52:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3278, "total_steps": 10853, "loss": 0.1575, "learning_rate": 4.180924850314771e-06, "epoch": 0.3020223890910766, "percentage": 30.2, "elapsed_time": "10:19:43", "remaining_time": "23:52:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3279, "total_steps": 10853, "loss": 0.1703, "learning_rate": 4.180360888947041e-06, "epoch": 0.3021145252683466, "percentage": 30.21, "elapsed_time": "10:19:54", "remaining_time": "23:51:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3280, "total_steps": 10853, "loss": 0.1669, "learning_rate": 4.179796771557619e-06, "epoch": 0.30220666144561664, "percentage": 30.22, "elapsed_time": "10:20:06", "remaining_time": "23:51:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3281, "total_steps": 10853, "loss": 0.1503, "learning_rate": 4.179232498198888e-06, "epoch": 0.30229879762288664, "percentage": 30.23, "elapsed_time": "10:20:16", "remaining_time": "23:51:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3282, "total_steps": 10853, "loss": 0.1578, "learning_rate": 4.178668068923238e-06, "epoch": 0.30239093380015664, "percentage": 30.24, "elapsed_time": "10:20:27", "remaining_time": "23:51:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3283, "total_steps": 10853, "loss": 0.1525, "learning_rate": 4.178103483783077e-06, "epoch": 0.30248306997742663, "percentage": 30.25, "elapsed_time": "10:20:38", "remaining_time": "23:51:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3284, "total_steps": 10853, "loss": 0.1547, "learning_rate": 4.177538742830828e-06, "epoch": 0.30257520615469663, "percentage": 30.26, "elapsed_time": "10:20:49", "remaining_time": "23:50:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3285, "total_steps": 10853, "loss": 0.1653, "learning_rate": 4.1769738461189245e-06, "epoch": 0.3026673423319666, "percentage": 30.27, "elapsed_time": "10:21:00", "remaining_time": "23:50:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3286, "total_steps": 10853, "loss": 0.1528, "learning_rate": 4.176408793699821e-06, "epoch": 0.3027594785092367, "percentage": 30.28, "elapsed_time": "10:21:11", "remaining_time": "23:50:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3287, "total_steps": 10853, "loss": 0.1642, "learning_rate": 4.1758435856259784e-06, "epoch": 0.3028516146865067, "percentage": 30.29, "elapsed_time": "10:21:23", "remaining_time": "23:50:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3288, "total_steps": 10853, "loss": 0.1532, "learning_rate": 4.17527822194988e-06, "epoch": 0.3029437508637767, "percentage": 30.3, "elapsed_time": "10:21:32", "remaining_time": "23:50:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3289, "total_steps": 10853, "loss": 0.1638, "learning_rate": 4.174712702724017e-06, "epoch": 0.30303588704104667, "percentage": 30.3, "elapsed_time": "10:21:43", "remaining_time": "23:49:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3290, "total_steps": 10853, "loss": 0.1538, "learning_rate": 4.174147028000901e-06, "epoch": 0.30312802321831667, "percentage": 30.31, "elapsed_time": "10:21:53", "remaining_time": "23:49:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3291, "total_steps": 10853, "loss": 0.1482, "learning_rate": 4.173581197833052e-06, "epoch": 0.30322015939558666, "percentage": 30.32, "elapsed_time": "10:22:05", "remaining_time": "23:49:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3292, "total_steps": 10853, "loss": 0.1509, "learning_rate": 4.173015212273009e-06, "epoch": 0.30331229557285666, "percentage": 30.33, "elapsed_time": "10:22:16", "remaining_time": "23:49:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3293, "total_steps": 10853, "loss": 0.1514, "learning_rate": 4.1724490713733246e-06, "epoch": 0.3034044317501267, "percentage": 30.34, "elapsed_time": "10:22:27", "remaining_time": "23:49:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3294, "total_steps": 10853, "loss": 0.1619, "learning_rate": 4.171882775186563e-06, "epoch": 0.3034965679273967, "percentage": 30.35, "elapsed_time": "10:22:38", "remaining_time": "23:48:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3295, "total_steps": 10853, "loss": 0.1582, "learning_rate": 4.1713163237653055e-06, "epoch": 0.3035887041046667, "percentage": 30.36, "elapsed_time": "10:22:50", "remaining_time": "23:48:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3296, "total_steps": 10853, "loss": 0.1632, "learning_rate": 4.170749717162148e-06, "epoch": 0.3036808402819367, "percentage": 30.37, "elapsed_time": "10:23:01", "remaining_time": "23:48:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3297, "total_steps": 10853, "loss": 0.1616, "learning_rate": 4.170182955429699e-06, "epoch": 0.3037729764592067, "percentage": 30.38, "elapsed_time": "10:23:13", "remaining_time": "23:48:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3298, "total_steps": 10853, "loss": 0.1456, "learning_rate": 4.169616038620583e-06, "epoch": 0.3038651126364767, "percentage": 30.39, "elapsed_time": "10:23:24", "remaining_time": "23:48:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3299, "total_steps": 10853, "loss": 0.1478, "learning_rate": 4.169048966787438e-06, "epoch": 0.3039572488137467, "percentage": 30.4, "elapsed_time": "10:23:35", "remaining_time": "23:47:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3300, "total_steps": 10853, "loss": 0.1636, "learning_rate": 4.168481739982917e-06, "epoch": 0.30404938499101675, "percentage": 30.41, "elapsed_time": "10:23:46", "remaining_time": "23:47:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3301, "total_steps": 10853, "loss": 0.1548, "learning_rate": 4.167914358259687e-06, "epoch": 0.30414152116828674, "percentage": 30.42, "elapsed_time": "10:23:58", "remaining_time": "23:47:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3302, "total_steps": 10853, "loss": 0.1751, "learning_rate": 4.167346821670429e-06, "epoch": 0.30423365734555674, "percentage": 30.42, "elapsed_time": "10:24:10", "remaining_time": "23:47:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3303, "total_steps": 10853, "loss": 0.1665, "learning_rate": 4.166779130267839e-06, "epoch": 0.30432579352282674, "percentage": 30.43, "elapsed_time": "10:24:21", "remaining_time": "23:47:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3304, "total_steps": 10853, "loss": 0.1572, "learning_rate": 4.166211284104629e-06, "epoch": 0.30441792970009673, "percentage": 30.44, "elapsed_time": "10:24:31", "remaining_time": "23:46:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3305, "total_steps": 10853, "loss": 0.1698, "learning_rate": 4.16564328323352e-06, "epoch": 0.30451006587736673, "percentage": 30.45, "elapsed_time": "10:24:42", "remaining_time": "23:46:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3306, "total_steps": 10853, "loss": 0.1603, "learning_rate": 4.165075127707254e-06, "epoch": 0.30460220205463673, "percentage": 30.46, "elapsed_time": "10:24:53", "remaining_time": "23:46:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3307, "total_steps": 10853, "loss": 0.1536, "learning_rate": 4.164506817578582e-06, "epoch": 0.3046943382319068, "percentage": 30.47, "elapsed_time": "10:25:04", "remaining_time": "23:46:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3308, "total_steps": 10853, "loss": 0.1631, "learning_rate": 4.163938352900274e-06, "epoch": 0.3047864744091768, "percentage": 30.48, "elapsed_time": "10:25:14", "remaining_time": "23:46:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3309, "total_steps": 10853, "loss": 0.1707, "learning_rate": 4.16336973372511e-06, "epoch": 0.3048786105864468, "percentage": 30.49, "elapsed_time": "10:25:24", "remaining_time": "23:45:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3310, "total_steps": 10853, "loss": 0.1453, "learning_rate": 4.162800960105889e-06, "epoch": 0.30497074676371677, "percentage": 30.5, "elapsed_time": "10:25:35", "remaining_time": "23:45:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3311, "total_steps": 10853, "loss": 0.1639, "learning_rate": 4.162232032095418e-06, "epoch": 0.30506288294098677, "percentage": 30.51, "elapsed_time": "10:25:46", "remaining_time": "23:45:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3312, "total_steps": 10853, "loss": 0.1542, "learning_rate": 4.1616629497465245e-06, "epoch": 0.30515501911825677, "percentage": 30.52, "elapsed_time": "10:25:57", "remaining_time": "23:45:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3313, "total_steps": 10853, "loss": 0.1788, "learning_rate": 4.1610937131120474e-06, "epoch": 0.30524715529552676, "percentage": 30.53, "elapsed_time": "10:26:09", "remaining_time": "23:45:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3314, "total_steps": 10853, "loss": 0.1577, "learning_rate": 4.16052432224484e-06, "epoch": 0.3053392914727968, "percentage": 30.54, "elapsed_time": "10:26:20", "remaining_time": "23:44:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3315, "total_steps": 10853, "loss": 0.1574, "learning_rate": 4.159954777197771e-06, "epoch": 0.3054314276500668, "percentage": 30.54, "elapsed_time": "10:26:31", "remaining_time": "23:44:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3316, "total_steps": 10853, "loss": 0.1664, "learning_rate": 4.159385078023722e-06, "epoch": 0.3055235638273368, "percentage": 30.55, "elapsed_time": "10:26:42", "remaining_time": "23:44:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3317, "total_steps": 10853, "loss": 0.1581, "learning_rate": 4.15881522477559e-06, "epoch": 0.3056157000046068, "percentage": 30.56, "elapsed_time": "10:26:53", "remaining_time": "23:44:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3318, "total_steps": 10853, "loss": 0.1766, "learning_rate": 4.1582452175062854e-06, "epoch": 0.3057078361818768, "percentage": 30.57, "elapsed_time": "10:27:04", "remaining_time": "23:44:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3319, "total_steps": 10853, "loss": 0.1581, "learning_rate": 4.157675056268735e-06, "epoch": 0.3057999723591468, "percentage": 30.58, "elapsed_time": "10:27:15", "remaining_time": "23:43:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3320, "total_steps": 10853, "loss": 0.1542, "learning_rate": 4.157104741115876e-06, "epoch": 0.30589210853641685, "percentage": 30.59, "elapsed_time": "10:27:26", "remaining_time": "23:43:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3321, "total_steps": 10853, "loss": 0.1827, "learning_rate": 4.156534272100664e-06, "epoch": 0.30598424471368685, "percentage": 30.6, "elapsed_time": "10:27:37", "remaining_time": "23:43:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3322, "total_steps": 10853, "loss": 0.1593, "learning_rate": 4.155963649276066e-06, "epoch": 0.30607638089095685, "percentage": 30.61, "elapsed_time": "10:27:48", "remaining_time": "23:43:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3323, "total_steps": 10853, "loss": 0.1578, "learning_rate": 4.155392872695066e-06, "epoch": 0.30616851706822684, "percentage": 30.62, "elapsed_time": "10:27:58", "remaining_time": "23:43:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3324, "total_steps": 10853, "loss": 0.1528, "learning_rate": 4.154821942410659e-06, "epoch": 0.30626065324549684, "percentage": 30.63, "elapsed_time": "10:28:09", "remaining_time": "23:42:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3325, "total_steps": 10853, "loss": 0.1653, "learning_rate": 4.154250858475857e-06, "epoch": 0.30635278942276684, "percentage": 30.64, "elapsed_time": "10:28:19", "remaining_time": "23:42:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3326, "total_steps": 10853, "loss": 0.1659, "learning_rate": 4.1536796209436835e-06, "epoch": 0.30644492560003683, "percentage": 30.65, "elapsed_time": "10:28:29", "remaining_time": "23:42:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3327, "total_steps": 10853, "loss": 0.1665, "learning_rate": 4.153108229867181e-06, "epoch": 0.3065370617773069, "percentage": 30.66, "elapsed_time": "10:28:42", "remaining_time": "23:42:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3328, "total_steps": 10853, "loss": 0.1554, "learning_rate": 4.1525366852994e-06, "epoch": 0.3066291979545769, "percentage": 30.66, "elapsed_time": "10:28:53", "remaining_time": "23:42:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3329, "total_steps": 10853, "loss": 0.143, "learning_rate": 4.151964987293411e-06, "epoch": 0.3067213341318469, "percentage": 30.67, "elapsed_time": "10:29:04", "remaining_time": "23:41:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3330, "total_steps": 10853, "loss": 0.1583, "learning_rate": 4.151393135902294e-06, "epoch": 0.3068134703091169, "percentage": 30.68, "elapsed_time": "10:29:16", "remaining_time": "23:41:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3331, "total_steps": 10853, "loss": 0.1645, "learning_rate": 4.150821131179148e-06, "epoch": 0.3069056064863869, "percentage": 30.69, "elapsed_time": "10:29:27", "remaining_time": "23:41:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3332, "total_steps": 10853, "loss": 0.1507, "learning_rate": 4.150248973177081e-06, "epoch": 0.30699774266365687, "percentage": 30.7, "elapsed_time": "10:29:38", "remaining_time": "23:41:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3333, "total_steps": 10853, "loss": 0.1578, "learning_rate": 4.14967666194922e-06, "epoch": 0.30708987884092687, "percentage": 30.71, "elapsed_time": "10:29:51", "remaining_time": "23:41:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3334, "total_steps": 10853, "loss": 0.1517, "learning_rate": 4.149104197548703e-06, "epoch": 0.3071820150181969, "percentage": 30.72, "elapsed_time": "10:30:01", "remaining_time": "23:40:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3335, "total_steps": 10853, "loss": 0.1527, "learning_rate": 4.148531580028685e-06, "epoch": 0.3072741511954669, "percentage": 30.73, "elapsed_time": "10:30:13", "remaining_time": "23:40:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3336, "total_steps": 10853, "loss": 0.1379, "learning_rate": 4.147958809442331e-06, "epoch": 0.3073662873727369, "percentage": 30.74, "elapsed_time": "10:30:23", "remaining_time": "23:40:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3337, "total_steps": 10853, "loss": 0.1536, "learning_rate": 4.147385885842824e-06, "epoch": 0.3074584235500069, "percentage": 30.75, "elapsed_time": "10:30:33", "remaining_time": "23:40:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3338, "total_steps": 10853, "loss": 0.1663, "learning_rate": 4.146812809283361e-06, "epoch": 0.3075505597272769, "percentage": 30.76, "elapsed_time": "10:30:44", "remaining_time": "23:40:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3339, "total_steps": 10853, "loss": 0.1547, "learning_rate": 4.14623957981715e-06, "epoch": 0.3076426959045469, "percentage": 30.77, "elapsed_time": "10:30:54", "remaining_time": "23:39:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3340, "total_steps": 10853, "loss": 0.1385, "learning_rate": 4.1456661974974185e-06, "epoch": 0.3077348320818169, "percentage": 30.77, "elapsed_time": "10:31:04", "remaining_time": "23:39:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3341, "total_steps": 10853, "loss": 0.1641, "learning_rate": 4.145092662377403e-06, "epoch": 0.30782696825908695, "percentage": 30.78, "elapsed_time": "10:31:15", "remaining_time": "23:39:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3342, "total_steps": 10853, "loss": 0.17, "learning_rate": 4.144518974510358e-06, "epoch": 0.30791910443635695, "percentage": 30.79, "elapsed_time": "10:31:27", "remaining_time": "23:39:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3343, "total_steps": 10853, "loss": 0.1479, "learning_rate": 4.143945133949547e-06, "epoch": 0.30801124061362695, "percentage": 30.8, "elapsed_time": "10:31:37", "remaining_time": "23:38:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3344, "total_steps": 10853, "loss": 0.1731, "learning_rate": 4.1433711407482544e-06, "epoch": 0.30810337679089694, "percentage": 30.81, "elapsed_time": "10:31:49", "remaining_time": "23:38:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3345, "total_steps": 10853, "loss": 0.1857, "learning_rate": 4.142796994959775e-06, "epoch": 0.30819551296816694, "percentage": 30.82, "elapsed_time": "10:32:00", "remaining_time": "23:38:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3346, "total_steps": 10853, "loss": 0.1653, "learning_rate": 4.142222696637417e-06, "epoch": 0.30828764914543694, "percentage": 30.83, "elapsed_time": "10:32:11", "remaining_time": "23:38:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3347, "total_steps": 10853, "loss": 0.1557, "learning_rate": 4.141648245834505e-06, "epoch": 0.30837978532270693, "percentage": 30.84, "elapsed_time": "10:32:22", "remaining_time": "23:38:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3348, "total_steps": 10853, "loss": 0.1507, "learning_rate": 4.141073642604377e-06, "epoch": 0.308471921499977, "percentage": 30.85, "elapsed_time": "10:32:32", "remaining_time": "23:37:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3349, "total_steps": 10853, "loss": 0.1612, "learning_rate": 4.140498887000385e-06, "epoch": 0.308564057677247, "percentage": 30.86, "elapsed_time": "10:32:43", "remaining_time": "23:37:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3350, "total_steps": 10853, "loss": 0.1537, "learning_rate": 4.139923979075894e-06, "epoch": 0.308656193854517, "percentage": 30.87, "elapsed_time": "10:32:54", "remaining_time": "23:37:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3351, "total_steps": 10853, "loss": 0.1655, "learning_rate": 4.139348918884285e-06, "epoch": 0.308748330031787, "percentage": 30.88, "elapsed_time": "10:33:04", "remaining_time": "23:37:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3352, "total_steps": 10853, "loss": 0.151, "learning_rate": 4.138773706478953e-06, "epoch": 0.308840466209057, "percentage": 30.89, "elapsed_time": "10:33:14", "remaining_time": "23:37:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3353, "total_steps": 10853, "loss": 0.1493, "learning_rate": 4.138198341913305e-06, "epoch": 0.30893260238632697, "percentage": 30.89, "elapsed_time": "10:33:24", "remaining_time": "23:36:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3354, "total_steps": 10853, "loss": 0.1574, "learning_rate": 4.137622825240767e-06, "epoch": 0.309024738563597, "percentage": 30.9, "elapsed_time": "10:33:37", "remaining_time": "23:36:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3355, "total_steps": 10853, "loss": 0.1575, "learning_rate": 4.1370471565147715e-06, "epoch": 0.309116874740867, "percentage": 30.91, "elapsed_time": "10:33:49", "remaining_time": "23:36:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3356, "total_steps": 10853, "loss": 0.1543, "learning_rate": 4.1364713357887715e-06, "epoch": 0.309209010918137, "percentage": 30.92, "elapsed_time": "10:33:59", "remaining_time": "23:36:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3357, "total_steps": 10853, "loss": 0.1598, "learning_rate": 4.1358953631162314e-06, "epoch": 0.309301147095407, "percentage": 30.93, "elapsed_time": "10:34:10", "remaining_time": "23:36:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3358, "total_steps": 10853, "loss": 0.1559, "learning_rate": 4.135319238550632e-06, "epoch": 0.309393283272677, "percentage": 30.94, "elapsed_time": "10:34:20", "remaining_time": "23:35:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3359, "total_steps": 10853, "loss": 0.1491, "learning_rate": 4.1347429621454645e-06, "epoch": 0.309485419449947, "percentage": 30.95, "elapsed_time": "10:34:30", "remaining_time": "23:35:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3360, "total_steps": 10853, "loss": 0.1677, "learning_rate": 4.134166533954238e-06, "epoch": 0.309577555627217, "percentage": 30.96, "elapsed_time": "10:34:42", "remaining_time": "23:35:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3361, "total_steps": 10853, "loss": 0.1648, "learning_rate": 4.1335899540304715e-06, "epoch": 0.30966969180448706, "percentage": 30.97, "elapsed_time": "10:34:53", "remaining_time": "23:35:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3362, "total_steps": 10853, "loss": 0.1663, "learning_rate": 4.133013222427703e-06, "epoch": 0.30976182798175705, "percentage": 30.98, "elapsed_time": "10:35:02", "remaining_time": "23:34:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3363, "total_steps": 10853, "loss": 0.1527, "learning_rate": 4.132436339199481e-06, "epoch": 0.30985396415902705, "percentage": 30.99, "elapsed_time": "10:35:13", "remaining_time": "23:34:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3364, "total_steps": 10853, "loss": 0.1645, "learning_rate": 4.131859304399368e-06, "epoch": 0.30994610033629705, "percentage": 31.0, "elapsed_time": "10:35:25", "remaining_time": "23:34:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3365, "total_steps": 10853, "loss": 0.1672, "learning_rate": 4.1312821180809445e-06, "epoch": 0.31003823651356704, "percentage": 31.01, "elapsed_time": "10:35:36", "remaining_time": "23:34:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3366, "total_steps": 10853, "loss": 0.1498, "learning_rate": 4.130704780297801e-06, "epoch": 0.31013037269083704, "percentage": 31.01, "elapsed_time": "10:35:48", "remaining_time": "23:34:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3367, "total_steps": 10853, "loss": 0.1644, "learning_rate": 4.130127291103542e-06, "epoch": 0.31022250886810704, "percentage": 31.02, "elapsed_time": "10:35:59", "remaining_time": "23:34:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3368, "total_steps": 10853, "loss": 0.1453, "learning_rate": 4.129549650551788e-06, "epoch": 0.3103146450453771, "percentage": 31.03, "elapsed_time": "10:36:09", "remaining_time": "23:33:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3369, "total_steps": 10853, "loss": 0.1627, "learning_rate": 4.1289718586961755e-06, "epoch": 0.3104067812226471, "percentage": 31.04, "elapsed_time": "10:36:19", "remaining_time": "23:33:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3370, "total_steps": 10853, "loss": 0.1573, "learning_rate": 4.12839391559035e-06, "epoch": 0.3104989173999171, "percentage": 31.05, "elapsed_time": "10:36:30", "remaining_time": "23:33:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3371, "total_steps": 10853, "loss": 0.1691, "learning_rate": 4.127815821287973e-06, "epoch": 0.3105910535771871, "percentage": 31.06, "elapsed_time": "10:36:42", "remaining_time": "23:33:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3372, "total_steps": 10853, "loss": 0.1727, "learning_rate": 4.127237575842723e-06, "epoch": 0.3106831897544571, "percentage": 31.07, "elapsed_time": "10:36:54", "remaining_time": "23:33:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3373, "total_steps": 10853, "loss": 0.167, "learning_rate": 4.126659179308289e-06, "epoch": 0.3107753259317271, "percentage": 31.08, "elapsed_time": "10:37:04", "remaining_time": "23:32:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3374, "total_steps": 10853, "loss": 0.1577, "learning_rate": 4.126080631738374e-06, "epoch": 0.3108674621089971, "percentage": 31.09, "elapsed_time": "10:37:16", "remaining_time": "23:32:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3375, "total_steps": 10853, "loss": 0.152, "learning_rate": 4.125501933186699e-06, "epoch": 0.3109595982862671, "percentage": 31.1, "elapsed_time": "10:37:27", "remaining_time": "23:32:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3376, "total_steps": 10853, "loss": 0.169, "learning_rate": 4.124923083706993e-06, "epoch": 0.3110517344635371, "percentage": 31.11, "elapsed_time": "10:37:39", "remaining_time": "23:32:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3377, "total_steps": 10853, "loss": 0.1604, "learning_rate": 4.124344083353005e-06, "epoch": 0.3111438706408071, "percentage": 31.12, "elapsed_time": "10:37:51", "remaining_time": "23:32:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3378, "total_steps": 10853, "loss": 0.1537, "learning_rate": 4.123764932178492e-06, "epoch": 0.3112360068180771, "percentage": 31.13, "elapsed_time": "10:38:02", "remaining_time": "23:31:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3379, "total_steps": 10853, "loss": 0.1631, "learning_rate": 4.123185630237233e-06, "epoch": 0.3113281429953471, "percentage": 31.13, "elapsed_time": "10:38:13", "remaining_time": "23:31:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3380, "total_steps": 10853, "loss": 0.1571, "learning_rate": 4.122606177583012e-06, "epoch": 0.3114202791726171, "percentage": 31.14, "elapsed_time": "10:38:23", "remaining_time": "23:31:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3381, "total_steps": 10853, "loss": 0.1623, "learning_rate": 4.122026574269633e-06, "epoch": 0.3115124153498871, "percentage": 31.15, "elapsed_time": "10:38:35", "remaining_time": "23:31:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3382, "total_steps": 10853, "loss": 0.153, "learning_rate": 4.121446820350911e-06, "epoch": 0.31160455152715716, "percentage": 31.16, "elapsed_time": "10:38:45", "remaining_time": "23:31:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3383, "total_steps": 10853, "loss": 0.1565, "learning_rate": 4.12086691588068e-06, "epoch": 0.31169668770442716, "percentage": 31.17, "elapsed_time": "10:38:55", "remaining_time": "23:30:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3384, "total_steps": 10853, "loss": 0.1477, "learning_rate": 4.120286860912779e-06, "epoch": 0.31178882388169715, "percentage": 31.18, "elapsed_time": "10:39:06", "remaining_time": "23:30:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3385, "total_steps": 10853, "loss": 0.1599, "learning_rate": 4.11970665550107e-06, "epoch": 0.31188096005896715, "percentage": 31.19, "elapsed_time": "10:39:17", "remaining_time": "23:30:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3386, "total_steps": 10853, "loss": 0.1695, "learning_rate": 4.119126299699422e-06, "epoch": 0.31197309623623715, "percentage": 31.2, "elapsed_time": "10:39:27", "remaining_time": "23:30:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3387, "total_steps": 10853, "loss": 0.1473, "learning_rate": 4.118545793561724e-06, "epoch": 0.31206523241350714, "percentage": 31.21, "elapsed_time": "10:39:38", "remaining_time": "23:29:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3388, "total_steps": 10853, "loss": 0.1586, "learning_rate": 4.117965137141875e-06, "epoch": 0.3121573685907772, "percentage": 31.22, "elapsed_time": "10:39:50", "remaining_time": "23:29:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3389, "total_steps": 10853, "loss": 0.143, "learning_rate": 4.117384330493789e-06, "epoch": 0.3122495047680472, "percentage": 31.23, "elapsed_time": "10:40:02", "remaining_time": "23:29:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3390, "total_steps": 10853, "loss": 0.1657, "learning_rate": 4.1168033736713934e-06, "epoch": 0.3123416409453172, "percentage": 31.24, "elapsed_time": "10:40:13", "remaining_time": "23:29:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3391, "total_steps": 10853, "loss": 0.1646, "learning_rate": 4.116222266728631e-06, "epoch": 0.3124337771225872, "percentage": 31.24, "elapsed_time": "10:40:23", "remaining_time": "23:29:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3392, "total_steps": 10853, "loss": 0.1468, "learning_rate": 4.115641009719456e-06, "epoch": 0.3125259132998572, "percentage": 31.25, "elapsed_time": "10:40:36", "remaining_time": "23:29:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3393, "total_steps": 10853, "loss": 0.1555, "learning_rate": 4.11505960269784e-06, "epoch": 0.3126180494771272, "percentage": 31.26, "elapsed_time": "10:40:47", "remaining_time": "23:28:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3394, "total_steps": 10853, "loss": 0.1644, "learning_rate": 4.114478045717767e-06, "epoch": 0.3127101856543972, "percentage": 31.27, "elapsed_time": "10:40:59", "remaining_time": "23:28:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3395, "total_steps": 10853, "loss": 0.1553, "learning_rate": 4.113896338833233e-06, "epoch": 0.31280232183166723, "percentage": 31.28, "elapsed_time": "10:41:09", "remaining_time": "23:28:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3396, "total_steps": 10853, "loss": 0.1795, "learning_rate": 4.11331448209825e-06, "epoch": 0.3128944580089372, "percentage": 31.29, "elapsed_time": "10:41:20", "remaining_time": "23:28:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3397, "total_steps": 10853, "loss": 0.1525, "learning_rate": 4.112732475566844e-06, "epoch": 0.3129865941862072, "percentage": 31.3, "elapsed_time": "10:41:31", "remaining_time": "23:28:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3398, "total_steps": 10853, "loss": 0.1616, "learning_rate": 4.112150319293055e-06, "epoch": 0.3130787303634772, "percentage": 31.31, "elapsed_time": "10:41:42", "remaining_time": "23:27:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3399, "total_steps": 10853, "loss": 0.1549, "learning_rate": 4.111568013330933e-06, "epoch": 0.3131708665407472, "percentage": 31.32, "elapsed_time": "10:41:53", "remaining_time": "23:27:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3400, "total_steps": 10853, "loss": 0.1411, "learning_rate": 4.110985557734549e-06, "epoch": 0.3132630027180172, "percentage": 31.33, "elapsed_time": "10:42:02", "remaining_time": "23:27:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3401, "total_steps": 10853, "loss": 0.1589, "learning_rate": 4.110402952557982e-06, "epoch": 0.3133551388952872, "percentage": 31.34, "elapsed_time": "10:42:12", "remaining_time": "23:27:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3402, "total_steps": 10853, "loss": 0.1565, "learning_rate": 4.109820197855329e-06, "epoch": 0.31344727507255726, "percentage": 31.35, "elapsed_time": "10:42:23", "remaining_time": "23:26:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3403, "total_steps": 10853, "loss": 0.1578, "learning_rate": 4.109237293680697e-06, "epoch": 0.31353941124982726, "percentage": 31.36, "elapsed_time": "10:42:34", "remaining_time": "23:26:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3404, "total_steps": 10853, "loss": 0.1331, "learning_rate": 4.108654240088208e-06, "epoch": 0.31363154742709726, "percentage": 31.36, "elapsed_time": "10:42:43", "remaining_time": "23:26:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3405, "total_steps": 10853, "loss": 0.1516, "learning_rate": 4.1080710371319995e-06, "epoch": 0.31372368360436725, "percentage": 31.37, "elapsed_time": "10:42:54", "remaining_time": "23:26:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3406, "total_steps": 10853, "loss": 0.1681, "learning_rate": 4.107487684866224e-06, "epoch": 0.31381581978163725, "percentage": 31.38, "elapsed_time": "10:43:05", "remaining_time": "23:26:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3407, "total_steps": 10853, "loss": 0.1454, "learning_rate": 4.106904183345042e-06, "epoch": 0.31390795595890725, "percentage": 31.39, "elapsed_time": "10:43:13", "remaining_time": "23:25:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3408, "total_steps": 10853, "loss": 0.1789, "learning_rate": 4.106320532622635e-06, "epoch": 0.31400009213617724, "percentage": 31.4, "elapsed_time": "10:43:24", "remaining_time": "23:25:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3409, "total_steps": 10853, "loss": 0.176, "learning_rate": 4.105736732753193e-06, "epoch": 0.3140922283134473, "percentage": 31.41, "elapsed_time": "10:43:35", "remaining_time": "23:25:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3410, "total_steps": 10853, "loss": 0.1372, "learning_rate": 4.1051527837909225e-06, "epoch": 0.3141843644907173, "percentage": 31.42, "elapsed_time": "10:43:46", "remaining_time": "23:25:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3411, "total_steps": 10853, "loss": 0.1487, "learning_rate": 4.104568685790043e-06, "epoch": 0.3142765006679873, "percentage": 31.43, "elapsed_time": "10:43:57", "remaining_time": "23:24:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3412, "total_steps": 10853, "loss": 0.1538, "learning_rate": 4.103984438804789e-06, "epoch": 0.3143686368452573, "percentage": 31.44, "elapsed_time": "10:44:08", "remaining_time": "23:24:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3413, "total_steps": 10853, "loss": 0.1637, "learning_rate": 4.103400042889407e-06, "epoch": 0.3144607730225273, "percentage": 31.45, "elapsed_time": "10:44:19", "remaining_time": "23:24:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3414, "total_steps": 10853, "loss": 0.1578, "learning_rate": 4.102815498098159e-06, "epoch": 0.3145529091997973, "percentage": 31.46, "elapsed_time": "10:44:29", "remaining_time": "23:24:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3415, "total_steps": 10853, "loss": 0.1495, "learning_rate": 4.102230804485318e-06, "epoch": 0.3146450453770673, "percentage": 31.47, "elapsed_time": "10:44:41", "remaining_time": "23:24:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3416, "total_steps": 10853, "loss": 0.163, "learning_rate": 4.101645962105176e-06, "epoch": 0.31473718155433733, "percentage": 31.48, "elapsed_time": "10:44:51", "remaining_time": "23:23:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3417, "total_steps": 10853, "loss": 0.1591, "learning_rate": 4.101060971012033e-06, "epoch": 0.3148293177316073, "percentage": 31.48, "elapsed_time": "10:45:01", "remaining_time": "23:23:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3418, "total_steps": 10853, "loss": 0.1444, "learning_rate": 4.100475831260208e-06, "epoch": 0.3149214539088773, "percentage": 31.49, "elapsed_time": "10:45:12", "remaining_time": "23:23:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3419, "total_steps": 10853, "loss": 0.1576, "learning_rate": 4.099890542904028e-06, "epoch": 0.3150135900861473, "percentage": 31.5, "elapsed_time": "10:45:22", "remaining_time": "23:23:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3420, "total_steps": 10853, "loss": 0.1549, "learning_rate": 4.0993051059978405e-06, "epoch": 0.3151057262634173, "percentage": 31.51, "elapsed_time": "10:45:33", "remaining_time": "23:23:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3421, "total_steps": 10853, "loss": 0.1417, "learning_rate": 4.098719520596e-06, "epoch": 0.3151978624406873, "percentage": 31.52, "elapsed_time": "10:45:43", "remaining_time": "23:22:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3422, "total_steps": 10853, "loss": 0.1456, "learning_rate": 4.098133786752881e-06, "epoch": 0.31528999861795737, "percentage": 31.53, "elapsed_time": "10:45:53", "remaining_time": "23:22:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3423, "total_steps": 10853, "loss": 0.1505, "learning_rate": 4.097547904522869e-06, "epoch": 0.31538213479522736, "percentage": 31.54, "elapsed_time": "10:46:03", "remaining_time": "23:22:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3424, "total_steps": 10853, "loss": 0.1493, "learning_rate": 4.09696187396036e-06, "epoch": 0.31547427097249736, "percentage": 31.55, "elapsed_time": "10:46:16", "remaining_time": "23:22:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3425, "total_steps": 10853, "loss": 0.1606, "learning_rate": 4.0963756951197695e-06, "epoch": 0.31556640714976736, "percentage": 31.56, "elapsed_time": "10:46:25", "remaining_time": "23:21:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3426, "total_steps": 10853, "loss": 0.1664, "learning_rate": 4.095789368055525e-06, "epoch": 0.31565854332703736, "percentage": 31.57, "elapsed_time": "10:46:37", "remaining_time": "23:21:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3427, "total_steps": 10853, "loss": 0.1499, "learning_rate": 4.095202892822066e-06, "epoch": 0.31575067950430735, "percentage": 31.58, "elapsed_time": "10:46:48", "remaining_time": "23:21:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3428, "total_steps": 10853, "loss": 0.1698, "learning_rate": 4.094616269473846e-06, "epoch": 0.31584281568157735, "percentage": 31.59, "elapsed_time": "10:46:59", "remaining_time": "23:21:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3429, "total_steps": 10853, "loss": 0.1596, "learning_rate": 4.0940294980653335e-06, "epoch": 0.3159349518588474, "percentage": 31.59, "elapsed_time": "10:47:09", "remaining_time": "23:21:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3430, "total_steps": 10853, "loss": 0.151, "learning_rate": 4.093442578651011e-06, "epoch": 0.3160270880361174, "percentage": 31.6, "elapsed_time": "10:47:20", "remaining_time": "23:20:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3431, "total_steps": 10853, "loss": 0.1416, "learning_rate": 4.092855511285373e-06, "epoch": 0.3161192242133874, "percentage": 31.61, "elapsed_time": "10:47:30", "remaining_time": "23:20:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3432, "total_steps": 10853, "loss": 0.1493, "learning_rate": 4.09226829602293e-06, "epoch": 0.3162113603906574, "percentage": 31.62, "elapsed_time": "10:47:40", "remaining_time": "23:20:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3433, "total_steps": 10853, "loss": 0.1633, "learning_rate": 4.091680932918205e-06, "epoch": 0.3163034965679274, "percentage": 31.63, "elapsed_time": "10:47:52", "remaining_time": "23:20:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3434, "total_steps": 10853, "loss": 0.1687, "learning_rate": 4.091093422025733e-06, "epoch": 0.3163956327451974, "percentage": 31.64, "elapsed_time": "10:48:03", "remaining_time": "23:20:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3435, "total_steps": 10853, "loss": 0.1624, "learning_rate": 4.090505763400065e-06, "epoch": 0.3164877689224674, "percentage": 31.65, "elapsed_time": "10:48:14", "remaining_time": "23:19:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3436, "total_steps": 10853, "loss": 0.1473, "learning_rate": 4.089917957095767e-06, "epoch": 0.31657990509973744, "percentage": 31.66, "elapsed_time": "10:48:24", "remaining_time": "23:19:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3437, "total_steps": 10853, "loss": 0.1532, "learning_rate": 4.089330003167416e-06, "epoch": 0.31667204127700743, "percentage": 31.67, "elapsed_time": "10:48:35", "remaining_time": "23:19:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3438, "total_steps": 10853, "loss": 0.1418, "learning_rate": 4.088741901669601e-06, "epoch": 0.31676417745427743, "percentage": 31.68, "elapsed_time": "10:48:45", "remaining_time": "23:19:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3439, "total_steps": 10853, "loss": 0.1606, "learning_rate": 4.088153652656932e-06, "epoch": 0.3168563136315474, "percentage": 31.69, "elapsed_time": "10:48:56", "remaining_time": "23:19:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3440, "total_steps": 10853, "loss": 0.1566, "learning_rate": 4.087565256184024e-06, "epoch": 0.3169484498088174, "percentage": 31.7, "elapsed_time": "10:49:08", "remaining_time": "23:18:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3441, "total_steps": 10853, "loss": 0.1799, "learning_rate": 4.086976712305511e-06, "epoch": 0.3170405859860874, "percentage": 31.71, "elapsed_time": "10:49:18", "remaining_time": "23:18:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3442, "total_steps": 10853, "loss": 0.1616, "learning_rate": 4.08638802107604e-06, "epoch": 0.3171327221633574, "percentage": 31.71, "elapsed_time": "10:49:29", "remaining_time": "23:18:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3443, "total_steps": 10853, "loss": 0.1676, "learning_rate": 4.0857991825502696e-06, "epoch": 0.31722485834062747, "percentage": 31.72, "elapsed_time": "10:49:41", "remaining_time": "23:18:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3444, "total_steps": 10853, "loss": 0.1604, "learning_rate": 4.085210196782875e-06, "epoch": 0.31731699451789747, "percentage": 31.73, "elapsed_time": "10:49:51", "remaining_time": "23:18:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3445, "total_steps": 10853, "loss": 0.1738, "learning_rate": 4.084621063828544e-06, "epoch": 0.31740913069516746, "percentage": 31.74, "elapsed_time": "10:50:03", "remaining_time": "23:17:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3446, "total_steps": 10853, "loss": 0.1716, "learning_rate": 4.0840317837419754e-06, "epoch": 0.31750126687243746, "percentage": 31.75, "elapsed_time": "10:50:13", "remaining_time": "23:17:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3447, "total_steps": 10853, "loss": 0.1568, "learning_rate": 4.083442356577886e-06, "epoch": 0.31759340304970746, "percentage": 31.76, "elapsed_time": "10:50:23", "remaining_time": "23:17:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3448, "total_steps": 10853, "loss": 0.1646, "learning_rate": 4.082852782391003e-06, "epoch": 0.31768553922697745, "percentage": 31.77, "elapsed_time": "10:50:33", "remaining_time": "23:17:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3449, "total_steps": 10853, "loss": 0.159, "learning_rate": 4.0822630612360685e-06, "epoch": 0.31777767540424745, "percentage": 31.78, "elapsed_time": "10:50:45", "remaining_time": "23:16:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3450, "total_steps": 10853, "loss": 0.1522, "learning_rate": 4.081673193167839e-06, "epoch": 0.3178698115815175, "percentage": 31.79, "elapsed_time": "10:50:56", "remaining_time": "23:16:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3451, "total_steps": 10853, "loss": 0.1493, "learning_rate": 4.081083178241083e-06, "epoch": 0.3179619477587875, "percentage": 31.8, "elapsed_time": "10:51:08", "remaining_time": "23:16:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3452, "total_steps": 10853, "loss": 0.1639, "learning_rate": 4.080493016510583e-06, "epoch": 0.3180540839360575, "percentage": 31.81, "elapsed_time": "10:51:18", "remaining_time": "23:16:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3453, "total_steps": 10853, "loss": 0.1601, "learning_rate": 4.079902708031137e-06, "epoch": 0.3181462201133275, "percentage": 31.82, "elapsed_time": "10:51:31", "remaining_time": "23:16:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3454, "total_steps": 10853, "loss": 0.1541, "learning_rate": 4.079312252857556e-06, "epoch": 0.3182383562905975, "percentage": 31.83, "elapsed_time": "10:51:41", "remaining_time": "23:16:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3455, "total_steps": 10853, "loss": 0.1623, "learning_rate": 4.07872165104466e-06, "epoch": 0.3183304924678675, "percentage": 31.83, "elapsed_time": "10:51:52", "remaining_time": "23:15:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3456, "total_steps": 10853, "loss": 0.1597, "learning_rate": 4.07813090264729e-06, "epoch": 0.31842262864513754, "percentage": 31.84, "elapsed_time": "10:52:03", "remaining_time": "23:15:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3457, "total_steps": 10853, "loss": 0.1722, "learning_rate": 4.077540007720295e-06, "epoch": 0.31851476482240754, "percentage": 31.85, "elapsed_time": "10:52:15", "remaining_time": "23:15:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3458, "total_steps": 10853, "loss": 0.1491, "learning_rate": 4.076948966318542e-06, "epoch": 0.31860690099967753, "percentage": 31.86, "elapsed_time": "10:52:25", "remaining_time": "23:15:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3459, "total_steps": 10853, "loss": 0.1519, "learning_rate": 4.076357778496906e-06, "epoch": 0.31869903717694753, "percentage": 31.87, "elapsed_time": "10:52:35", "remaining_time": "23:14:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3460, "total_steps": 10853, "loss": 0.1484, "learning_rate": 4.075766444310282e-06, "epoch": 0.3187911733542175, "percentage": 31.88, "elapsed_time": "10:52:46", "remaining_time": "23:14:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3461, "total_steps": 10853, "loss": 0.1551, "learning_rate": 4.075174963813574e-06, "epoch": 0.3188833095314875, "percentage": 31.89, "elapsed_time": "10:52:57", "remaining_time": "23:14:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3462, "total_steps": 10853, "loss": 0.1598, "learning_rate": 4.0745833370617e-06, "epoch": 0.3189754457087575, "percentage": 31.9, "elapsed_time": "10:53:08", "remaining_time": "23:14:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3463, "total_steps": 10853, "loss": 0.1535, "learning_rate": 4.073991564109595e-06, "epoch": 0.3190675818860276, "percentage": 31.91, "elapsed_time": "10:53:20", "remaining_time": "23:14:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3464, "total_steps": 10853, "loss": 0.1534, "learning_rate": 4.073399645012203e-06, "epoch": 0.31915971806329757, "percentage": 31.92, "elapsed_time": "10:53:30", "remaining_time": "23:13:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3465, "total_steps": 10853, "loss": 0.1729, "learning_rate": 4.072807579824485e-06, "epoch": 0.31925185424056757, "percentage": 31.93, "elapsed_time": "10:53:40", "remaining_time": "23:13:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3466, "total_steps": 10853, "loss": 0.1619, "learning_rate": 4.072215368601414e-06, "epoch": 0.31934399041783756, "percentage": 31.94, "elapsed_time": "10:53:51", "remaining_time": "23:13:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3467, "total_steps": 10853, "loss": 0.1502, "learning_rate": 4.0716230113979766e-06, "epoch": 0.31943612659510756, "percentage": 31.95, "elapsed_time": "10:54:03", "remaining_time": "23:13:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3468, "total_steps": 10853, "loss": 0.1699, "learning_rate": 4.071030508269173e-06, "epoch": 0.31952826277237756, "percentage": 31.95, "elapsed_time": "10:54:13", "remaining_time": "23:13:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3469, "total_steps": 10853, "loss": 0.1637, "learning_rate": 4.070437859270019e-06, "epoch": 0.31962039894964756, "percentage": 31.96, "elapsed_time": "10:54:24", "remaining_time": "23:12:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3470, "total_steps": 10853, "loss": 0.1581, "learning_rate": 4.06984506445554e-06, "epoch": 0.3197125351269176, "percentage": 31.97, "elapsed_time": "10:54:35", "remaining_time": "23:12:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3471, "total_steps": 10853, "loss": 0.1619, "learning_rate": 4.069252123880777e-06, "epoch": 0.3198046713041876, "percentage": 31.98, "elapsed_time": "10:54:46", "remaining_time": "23:12:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3472, "total_steps": 10853, "loss": 0.1542, "learning_rate": 4.068659037600786e-06, "epoch": 0.3198968074814576, "percentage": 31.99, "elapsed_time": "10:54:56", "remaining_time": "23:12:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3473, "total_steps": 10853, "loss": 0.1417, "learning_rate": 4.068065805670635e-06, "epoch": 0.3199889436587276, "percentage": 32.0, "elapsed_time": "10:55:06", "remaining_time": "23:12:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3474, "total_steps": 10853, "loss": 0.1494, "learning_rate": 4.067472428145405e-06, "epoch": 0.3200810798359976, "percentage": 32.01, "elapsed_time": "10:55:17", "remaining_time": "23:11:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3475, "total_steps": 10853, "loss": 0.1396, "learning_rate": 4.066878905080191e-06, "epoch": 0.3201732160132676, "percentage": 32.02, "elapsed_time": "10:55:28", "remaining_time": "23:11:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3476, "total_steps": 10853, "loss": 0.1597, "learning_rate": 4.066285236530103e-06, "epoch": 0.3202653521905376, "percentage": 32.03, "elapsed_time": "10:55:38", "remaining_time": "23:11:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3477, "total_steps": 10853, "loss": 0.1512, "learning_rate": 4.065691422550261e-06, "epoch": 0.32035748836780764, "percentage": 32.04, "elapsed_time": "10:55:49", "remaining_time": "23:11:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3478, "total_steps": 10853, "loss": 0.1592, "learning_rate": 4.065097463195803e-06, "epoch": 0.32044962454507764, "percentage": 32.05, "elapsed_time": "10:56:01", "remaining_time": "23:11:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3479, "total_steps": 10853, "loss": 0.1459, "learning_rate": 4.064503358521876e-06, "epoch": 0.32054176072234764, "percentage": 32.06, "elapsed_time": "10:56:11", "remaining_time": "23:10:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3480, "total_steps": 10853, "loss": 0.1553, "learning_rate": 4.063909108583644e-06, "epoch": 0.32063389689961763, "percentage": 32.06, "elapsed_time": "10:56:21", "remaining_time": "23:10:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3481, "total_steps": 10853, "loss": 0.1656, "learning_rate": 4.063314713436283e-06, "epoch": 0.32072603307688763, "percentage": 32.07, "elapsed_time": "10:56:31", "remaining_time": "23:10:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3482, "total_steps": 10853, "loss": 0.1709, "learning_rate": 4.062720173134983e-06, "epoch": 0.3208181692541576, "percentage": 32.08, "elapsed_time": "10:56:42", "remaining_time": "23:10:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3483, "total_steps": 10853, "loss": 0.151, "learning_rate": 4.062125487734947e-06, "epoch": 0.3209103054314276, "percentage": 32.09, "elapsed_time": "10:56:52", "remaining_time": "23:09:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3484, "total_steps": 10853, "loss": 0.1477, "learning_rate": 4.06153065729139e-06, "epoch": 0.3210024416086977, "percentage": 32.1, "elapsed_time": "10:57:02", "remaining_time": "23:09:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3485, "total_steps": 10853, "loss": 0.1509, "learning_rate": 4.060935681859545e-06, "epoch": 0.32109457778596767, "percentage": 32.11, "elapsed_time": "10:57:13", "remaining_time": "23:09:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3486, "total_steps": 10853, "loss": 0.1606, "learning_rate": 4.060340561494654e-06, "epoch": 0.32118671396323767, "percentage": 32.12, "elapsed_time": "10:57:23", "remaining_time": "23:09:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3487, "total_steps": 10853, "loss": 0.1612, "learning_rate": 4.059745296251972e-06, "epoch": 0.32127885014050767, "percentage": 32.13, "elapsed_time": "10:57:35", "remaining_time": "23:09:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3488, "total_steps": 10853, "loss": 0.1586, "learning_rate": 4.059149886186773e-06, "epoch": 0.32137098631777766, "percentage": 32.14, "elapsed_time": "10:57:45", "remaining_time": "23:08:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3489, "total_steps": 10853, "loss": 0.1608, "learning_rate": 4.058554331354339e-06, "epoch": 0.32146312249504766, "percentage": 32.15, "elapsed_time": "10:57:55", "remaining_time": "23:08:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3490, "total_steps": 10853, "loss": 0.1549, "learning_rate": 4.057958631809967e-06, "epoch": 0.3215552586723177, "percentage": 32.16, "elapsed_time": "10:58:06", "remaining_time": "23:08:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3491, "total_steps": 10853, "loss": 0.1546, "learning_rate": 4.057362787608969e-06, "epoch": 0.3216473948495877, "percentage": 32.17, "elapsed_time": "10:58:16", "remaining_time": "23:08:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3492, "total_steps": 10853, "loss": 0.1484, "learning_rate": 4.056766798806668e-06, "epoch": 0.3217395310268577, "percentage": 32.18, "elapsed_time": "10:58:27", "remaining_time": "23:08:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3493, "total_steps": 10853, "loss": 0.1511, "learning_rate": 4.056170665458403e-06, "epoch": 0.3218316672041277, "percentage": 32.18, "elapsed_time": "10:58:37", "remaining_time": "23:07:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3494, "total_steps": 10853, "loss": 0.1733, "learning_rate": 4.055574387619524e-06, "epoch": 0.3219238033813977, "percentage": 32.19, "elapsed_time": "10:58:48", "remaining_time": "23:07:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3495, "total_steps": 10853, "loss": 0.1658, "learning_rate": 4.054977965345396e-06, "epoch": 0.3220159395586677, "percentage": 32.2, "elapsed_time": "10:58:59", "remaining_time": "23:07:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3496, "total_steps": 10853, "loss": 0.1651, "learning_rate": 4.054381398691396e-06, "epoch": 0.3221080757359377, "percentage": 32.21, "elapsed_time": "10:59:10", "remaining_time": "23:07:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3497, "total_steps": 10853, "loss": 0.1521, "learning_rate": 4.053784687712916e-06, "epoch": 0.32220021191320775, "percentage": 32.22, "elapsed_time": "10:59:22", "remaining_time": "23:07:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3498, "total_steps": 10853, "loss": 0.1452, "learning_rate": 4.05318783246536e-06, "epoch": 0.32229234809047774, "percentage": 32.23, "elapsed_time": "10:59:32", "remaining_time": "23:06:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3499, "total_steps": 10853, "loss": 0.1554, "learning_rate": 4.052590833004147e-06, "epoch": 0.32238448426774774, "percentage": 32.24, "elapsed_time": "10:59:43", "remaining_time": "23:06:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3500, "total_steps": 10853, "loss": 0.1421, "learning_rate": 4.051993689384709e-06, "epoch": 0.32247662044501774, "percentage": 32.25, "elapsed_time": "10:59:55", "remaining_time": "23:06:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3500, "total_steps": 10853, "eval_loss": 0.15785863995552063, "epoch": 0.32247662044501774, "percentage": 32.25, "elapsed_time": "11:04:55", "remaining_time": "23:16:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3501, "total_steps": 10853, "loss": 0.1431, "learning_rate": 4.051396401662489e-06, "epoch": 0.32256875662228773, "percentage": 32.26, "elapsed_time": "11:05:06", "remaining_time": "23:16:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3502, "total_steps": 10853, "loss": 0.1672, "learning_rate": 4.050798969892946e-06, "epoch": 0.32266089279955773, "percentage": 32.27, "elapsed_time": "11:05:17", "remaining_time": "23:16:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3503, "total_steps": 10853, "loss": 0.1409, "learning_rate": 4.050201394131551e-06, "epoch": 0.3227530289768277, "percentage": 32.28, "elapsed_time": "11:05:28", "remaining_time": "23:16:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3504, "total_steps": 10853, "loss": 0.168, "learning_rate": 4.049603674433791e-06, "epoch": 0.3228451651540978, "percentage": 32.29, "elapsed_time": "11:05:40", "remaining_time": "23:16:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3505, "total_steps": 10853, "loss": 0.1679, "learning_rate": 4.049005810855163e-06, "epoch": 0.3229373013313678, "percentage": 32.3, "elapsed_time": "11:05:52", "remaining_time": "23:15:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3506, "total_steps": 10853, "loss": 0.1591, "learning_rate": 4.048407803451178e-06, "epoch": 0.3230294375086378, "percentage": 32.3, "elapsed_time": "11:06:01", "remaining_time": "23:15:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3507, "total_steps": 10853, "loss": 0.1505, "learning_rate": 4.047809652277362e-06, "epoch": 0.32312157368590777, "percentage": 32.31, "elapsed_time": "11:06:12", "remaining_time": "23:15:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3508, "total_steps": 10853, "loss": 0.1685, "learning_rate": 4.047211357389254e-06, "epoch": 0.32321370986317777, "percentage": 32.32, "elapsed_time": "11:06:23", "remaining_time": "23:15:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3509, "total_steps": 10853, "loss": 0.1543, "learning_rate": 4.046612918842405e-06, "epoch": 0.32330584604044776, "percentage": 32.33, "elapsed_time": "11:06:34", "remaining_time": "23:15:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3510, "total_steps": 10853, "loss": 0.1578, "learning_rate": 4.0460143366923785e-06, "epoch": 0.32339798221771776, "percentage": 32.34, "elapsed_time": "11:06:45", "remaining_time": "23:14:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3511, "total_steps": 10853, "loss": 0.157, "learning_rate": 4.045415610994755e-06, "epoch": 0.3234901183949878, "percentage": 32.35, "elapsed_time": "11:06:56", "remaining_time": "23:14:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3512, "total_steps": 10853, "loss": 0.1471, "learning_rate": 4.044816741805127e-06, "epoch": 0.3235822545722578, "percentage": 32.36, "elapsed_time": "11:07:07", "remaining_time": "23:14:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3513, "total_steps": 10853, "loss": 0.1583, "learning_rate": 4.044217729179097e-06, "epoch": 0.3236743907495278, "percentage": 32.37, "elapsed_time": "11:07:18", "remaining_time": "23:14:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3514, "total_steps": 10853, "loss": 0.1645, "learning_rate": 4.043618573172286e-06, "epoch": 0.3237665269267978, "percentage": 32.38, "elapsed_time": "11:07:29", "remaining_time": "23:14:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3515, "total_steps": 10853, "loss": 0.1599, "learning_rate": 4.043019273840323e-06, "epoch": 0.3238586631040678, "percentage": 32.39, "elapsed_time": "11:07:41", "remaining_time": "23:13:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3516, "total_steps": 10853, "loss": 0.1671, "learning_rate": 4.042419831238855e-06, "epoch": 0.3239507992813378, "percentage": 32.4, "elapsed_time": "11:07:52", "remaining_time": "23:13:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3517, "total_steps": 10853, "loss": 0.1489, "learning_rate": 4.041820245423539e-06, "epoch": 0.3240429354586078, "percentage": 32.41, "elapsed_time": "11:08:01", "remaining_time": "23:13:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3518, "total_steps": 10853, "loss": 0.1429, "learning_rate": 4.041220516450048e-06, "epoch": 0.32413507163587785, "percentage": 32.42, "elapsed_time": "11:08:11", "remaining_time": "23:13:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3519, "total_steps": 10853, "loss": 0.1714, "learning_rate": 4.040620644374066e-06, "epoch": 0.32422720781314784, "percentage": 32.42, "elapsed_time": "11:08:21", "remaining_time": "23:12:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3520, "total_steps": 10853, "loss": 0.1358, "learning_rate": 4.0400206292512914e-06, "epoch": 0.32431934399041784, "percentage": 32.43, "elapsed_time": "11:08:30", "remaining_time": "23:12:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3521, "total_steps": 10853, "loss": 0.1687, "learning_rate": 4.039420471137435e-06, "epoch": 0.32441148016768784, "percentage": 32.44, "elapsed_time": "11:08:40", "remaining_time": "23:12:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3522, "total_steps": 10853, "loss": 0.162, "learning_rate": 4.038820170088223e-06, "epoch": 0.32450361634495783, "percentage": 32.45, "elapsed_time": "11:08:51", "remaining_time": "23:12:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3523, "total_steps": 10853, "loss": 0.1672, "learning_rate": 4.0382197261593925e-06, "epoch": 0.32459575252222783, "percentage": 32.46, "elapsed_time": "11:09:03", "remaining_time": "23:12:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3524, "total_steps": 10853, "loss": 0.1676, "learning_rate": 4.037619139406695e-06, "epoch": 0.3246878886994979, "percentage": 32.47, "elapsed_time": "11:09:13", "remaining_time": "23:11:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3525, "total_steps": 10853, "loss": 0.1641, "learning_rate": 4.037018409885894e-06, "epoch": 0.3247800248767679, "percentage": 32.48, "elapsed_time": "11:09:23", "remaining_time": "23:11:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3526, "total_steps": 10853, "loss": 0.1431, "learning_rate": 4.036417537652769e-06, "epoch": 0.3248721610540379, "percentage": 32.49, "elapsed_time": "11:09:33", "remaining_time": "23:11:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3527, "total_steps": 10853, "loss": 0.1563, "learning_rate": 4.03581652276311e-06, "epoch": 0.3249642972313079, "percentage": 32.5, "elapsed_time": "11:09:44", "remaining_time": "23:11:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3528, "total_steps": 10853, "loss": 0.1403, "learning_rate": 4.035215365272722e-06, "epoch": 0.32505643340857787, "percentage": 32.51, "elapsed_time": "11:09:54", "remaining_time": "23:10:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3529, "total_steps": 10853, "loss": 0.1717, "learning_rate": 4.034614065237421e-06, "epoch": 0.32514856958584787, "percentage": 32.52, "elapsed_time": "11:10:05", "remaining_time": "23:10:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3530, "total_steps": 10853, "loss": 0.1323, "learning_rate": 4.034012622713041e-06, "epoch": 0.32524070576311787, "percentage": 32.53, "elapsed_time": "11:10:17", "remaining_time": "23:10:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3531, "total_steps": 10853, "loss": 0.163, "learning_rate": 4.033411037755422e-06, "epoch": 0.3253328419403879, "percentage": 32.53, "elapsed_time": "11:10:28", "remaining_time": "23:10:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3532, "total_steps": 10853, "loss": 0.1638, "learning_rate": 4.032809310420424e-06, "epoch": 0.3254249781176579, "percentage": 32.54, "elapsed_time": "11:10:39", "remaining_time": "23:10:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3533, "total_steps": 10853, "loss": 0.1482, "learning_rate": 4.032207440763915e-06, "epoch": 0.3255171142949279, "percentage": 32.55, "elapsed_time": "11:10:50", "remaining_time": "23:09:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3534, "total_steps": 10853, "loss": 0.1626, "learning_rate": 4.0316054288417825e-06, "epoch": 0.3256092504721979, "percentage": 32.56, "elapsed_time": "11:11:00", "remaining_time": "23:09:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3535, "total_steps": 10853, "loss": 0.1565, "learning_rate": 4.031003274709919e-06, "epoch": 0.3257013866494679, "percentage": 32.57, "elapsed_time": "11:11:11", "remaining_time": "23:09:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3536, "total_steps": 10853, "loss": 0.1767, "learning_rate": 4.0304009784242385e-06, "epoch": 0.3257935228267379, "percentage": 32.58, "elapsed_time": "11:11:21", "remaining_time": "23:09:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3537, "total_steps": 10853, "loss": 0.1393, "learning_rate": 4.029798540040661e-06, "epoch": 0.3258856590040079, "percentage": 32.59, "elapsed_time": "11:11:32", "remaining_time": "23:09:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3538, "total_steps": 10853, "loss": 0.1465, "learning_rate": 4.029195959615125e-06, "epoch": 0.32597779518127795, "percentage": 32.6, "elapsed_time": "11:11:44", "remaining_time": "23:08:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3539, "total_steps": 10853, "loss": 0.1587, "learning_rate": 4.02859323720358e-06, "epoch": 0.32606993135854795, "percentage": 32.61, "elapsed_time": "11:11:56", "remaining_time": "23:08:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3540, "total_steps": 10853, "loss": 0.1569, "learning_rate": 4.027990372861989e-06, "epoch": 0.32616206753581795, "percentage": 32.62, "elapsed_time": "11:12:05", "remaining_time": "23:08:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3541, "total_steps": 10853, "loss": 0.1594, "learning_rate": 4.027387366646326e-06, "epoch": 0.32625420371308794, "percentage": 32.63, "elapsed_time": "11:12:16", "remaining_time": "23:08:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3542, "total_steps": 10853, "loss": 0.1675, "learning_rate": 4.026784218612581e-06, "epoch": 0.32634633989035794, "percentage": 32.64, "elapsed_time": "11:12:26", "remaining_time": "23:07:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3543, "total_steps": 10853, "loss": 0.1609, "learning_rate": 4.026180928816759e-06, "epoch": 0.32643847606762794, "percentage": 32.65, "elapsed_time": "11:12:37", "remaining_time": "23:07:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3544, "total_steps": 10853, "loss": 0.1638, "learning_rate": 4.0255774973148735e-06, "epoch": 0.32653061224489793, "percentage": 32.65, "elapsed_time": "11:12:48", "remaining_time": "23:07:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3545, "total_steps": 10853, "loss": 0.1462, "learning_rate": 4.024973924162952e-06, "epoch": 0.326622748422168, "percentage": 32.66, "elapsed_time": "11:12:58", "remaining_time": "23:07:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3546, "total_steps": 10853, "loss": 0.1593, "learning_rate": 4.024370209417037e-06, "epoch": 0.326714884599438, "percentage": 32.67, "elapsed_time": "11:13:10", "remaining_time": "23:07:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3547, "total_steps": 10853, "loss": 0.1598, "learning_rate": 4.0237663531331855e-06, "epoch": 0.326807020776708, "percentage": 32.68, "elapsed_time": "11:13:22", "remaining_time": "23:06:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3548, "total_steps": 10853, "loss": 0.1483, "learning_rate": 4.023162355367464e-06, "epoch": 0.326899156953978, "percentage": 32.69, "elapsed_time": "11:13:33", "remaining_time": "23:06:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3549, "total_steps": 10853, "loss": 0.1507, "learning_rate": 4.022558216175953e-06, "epoch": 0.326991293131248, "percentage": 32.7, "elapsed_time": "11:13:45", "remaining_time": "23:06:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3550, "total_steps": 10853, "loss": 0.1442, "learning_rate": 4.021953935614748e-06, "epoch": 0.32708342930851797, "percentage": 32.71, "elapsed_time": "11:13:55", "remaining_time": "23:06:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3551, "total_steps": 10853, "loss": 0.1755, "learning_rate": 4.021349513739956e-06, "epoch": 0.32717556548578797, "percentage": 32.72, "elapsed_time": "11:14:07", "remaining_time": "23:06:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3552, "total_steps": 10853, "loss": 0.1573, "learning_rate": 4.020744950607699e-06, "epoch": 0.327267701663058, "percentage": 32.73, "elapsed_time": "11:14:18", "remaining_time": "23:05:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3553, "total_steps": 10853, "loss": 0.1599, "learning_rate": 4.020140246274109e-06, "epoch": 0.327359837840328, "percentage": 32.74, "elapsed_time": "11:14:28", "remaining_time": "23:05:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3554, "total_steps": 10853, "loss": 0.1746, "learning_rate": 4.019535400795333e-06, "epoch": 0.327451974017598, "percentage": 32.75, "elapsed_time": "11:14:40", "remaining_time": "23:05:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3555, "total_steps": 10853, "loss": 0.1558, "learning_rate": 4.018930414227533e-06, "epoch": 0.327544110194868, "percentage": 32.76, "elapsed_time": "11:14:51", "remaining_time": "23:05:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3556, "total_steps": 10853, "loss": 0.1592, "learning_rate": 4.018325286626879e-06, "epoch": 0.327636246372138, "percentage": 32.77, "elapsed_time": "11:15:03", "remaining_time": "23:05:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3557, "total_steps": 10853, "loss": 0.1532, "learning_rate": 4.017720018049559e-06, "epoch": 0.327728382549408, "percentage": 32.77, "elapsed_time": "11:15:14", "remaining_time": "23:05:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3558, "total_steps": 10853, "loss": 0.1601, "learning_rate": 4.017114608551772e-06, "epoch": 0.32782051872667806, "percentage": 32.78, "elapsed_time": "11:15:23", "remaining_time": "23:04:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3559, "total_steps": 10853, "loss": 0.1505, "learning_rate": 4.016509058189731e-06, "epoch": 0.32791265490394805, "percentage": 32.79, "elapsed_time": "11:15:34", "remaining_time": "23:04:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3560, "total_steps": 10853, "loss": 0.1629, "learning_rate": 4.0159033670196605e-06, "epoch": 0.32800479108121805, "percentage": 32.8, "elapsed_time": "11:15:44", "remaining_time": "23:04:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3561, "total_steps": 10853, "loss": 0.1588, "learning_rate": 4.0152975350978e-06, "epoch": 0.32809692725848805, "percentage": 32.81, "elapsed_time": "11:15:56", "remaining_time": "23:04:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3562, "total_steps": 10853, "loss": 0.1556, "learning_rate": 4.0146915624803985e-06, "epoch": 0.32818906343575804, "percentage": 32.82, "elapsed_time": "11:16:06", "remaining_time": "23:03:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3563, "total_steps": 10853, "loss": 0.1581, "learning_rate": 4.014085449223724e-06, "epoch": 0.32828119961302804, "percentage": 32.83, "elapsed_time": "11:16:17", "remaining_time": "23:03:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3564, "total_steps": 10853, "loss": 0.1686, "learning_rate": 4.013479195384051e-06, "epoch": 0.32837333579029804, "percentage": 32.84, "elapsed_time": "11:16:28", "remaining_time": "23:03:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3565, "total_steps": 10853, "loss": 0.156, "learning_rate": 4.012872801017673e-06, "epoch": 0.3284654719675681, "percentage": 32.85, "elapsed_time": "11:16:40", "remaining_time": "23:03:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3566, "total_steps": 10853, "loss": 0.1477, "learning_rate": 4.012266266180892e-06, "epoch": 0.3285576081448381, "percentage": 32.86, "elapsed_time": "11:16:51", "remaining_time": "23:03:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3567, "total_steps": 10853, "loss": 0.1515, "learning_rate": 4.011659590930026e-06, "epoch": 0.3286497443221081, "percentage": 32.87, "elapsed_time": "11:17:01", "remaining_time": "23:02:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3568, "total_steps": 10853, "loss": 0.1422, "learning_rate": 4.011052775321405e-06, "epoch": 0.3287418804993781, "percentage": 32.88, "elapsed_time": "11:17:11", "remaining_time": "23:02:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3569, "total_steps": 10853, "loss": 0.1684, "learning_rate": 4.010445819411369e-06, "epoch": 0.3288340166766481, "percentage": 32.88, "elapsed_time": "11:17:21", "remaining_time": "23:02:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3570, "total_steps": 10853, "loss": 0.1522, "learning_rate": 4.009838723256278e-06, "epoch": 0.3289261528539181, "percentage": 32.89, "elapsed_time": "11:17:32", "remaining_time": "23:02:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3571, "total_steps": 10853, "loss": 0.1656, "learning_rate": 4.009231486912498e-06, "epoch": 0.32901828903118807, "percentage": 32.9, "elapsed_time": "11:17:42", "remaining_time": "23:02:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3572, "total_steps": 10853, "loss": 0.1527, "learning_rate": 4.008624110436413e-06, "epoch": 0.3291104252084581, "percentage": 32.91, "elapsed_time": "11:17:53", "remaining_time": "23:01:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3573, "total_steps": 10853, "loss": 0.1546, "learning_rate": 4.008016593884416e-06, "epoch": 0.3292025613857281, "percentage": 32.92, "elapsed_time": "11:18:05", "remaining_time": "23:01:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3574, "total_steps": 10853, "loss": 0.1522, "learning_rate": 4.0074089373129165e-06, "epoch": 0.3292946975629981, "percentage": 32.93, "elapsed_time": "11:18:15", "remaining_time": "23:01:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3575, "total_steps": 10853, "loss": 0.1472, "learning_rate": 4.006801140778335e-06, "epoch": 0.3293868337402681, "percentage": 32.94, "elapsed_time": "11:18:25", "remaining_time": "23:01:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3576, "total_steps": 10853, "loss": 0.1604, "learning_rate": 4.006193204337106e-06, "epoch": 0.3294789699175381, "percentage": 32.95, "elapsed_time": "11:18:37", "remaining_time": "23:00:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3577, "total_steps": 10853, "loss": 0.1431, "learning_rate": 4.005585128045675e-06, "epoch": 0.3295711060948081, "percentage": 32.96, "elapsed_time": "11:18:48", "remaining_time": "23:00:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3578, "total_steps": 10853, "loss": 0.1629, "learning_rate": 4.004976911960503e-06, "epoch": 0.3296632422720781, "percentage": 32.97, "elapsed_time": "11:18:58", "remaining_time": "23:00:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3579, "total_steps": 10853, "loss": 0.1551, "learning_rate": 4.004368556138062e-06, "epoch": 0.32975537844934816, "percentage": 32.98, "elapsed_time": "11:19:09", "remaining_time": "23:00:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3580, "total_steps": 10853, "loss": 0.1552, "learning_rate": 4.003760060634839e-06, "epoch": 0.32984751462661815, "percentage": 32.99, "elapsed_time": "11:19:21", "remaining_time": "23:00:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3581, "total_steps": 10853, "loss": 0.1515, "learning_rate": 4.003151425507333e-06, "epoch": 0.32993965080388815, "percentage": 33.0, "elapsed_time": "11:19:32", "remaining_time": "22:59:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3582, "total_steps": 10853, "loss": 0.1705, "learning_rate": 4.002542650812056e-06, "epoch": 0.33003178698115815, "percentage": 33.0, "elapsed_time": "11:19:43", "remaining_time": "22:59:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3583, "total_steps": 10853, "loss": 0.1577, "learning_rate": 4.001933736605531e-06, "epoch": 0.33012392315842815, "percentage": 33.01, "elapsed_time": "11:19:53", "remaining_time": "22:59:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3584, "total_steps": 10853, "loss": 0.1623, "learning_rate": 4.001324682944297e-06, "epoch": 0.33021605933569814, "percentage": 33.02, "elapsed_time": "11:20:04", "remaining_time": "22:59:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3585, "total_steps": 10853, "loss": 0.1561, "learning_rate": 4.000715489884906e-06, "epoch": 0.3303081955129682, "percentage": 33.03, "elapsed_time": "11:20:16", "remaining_time": "22:59:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3586, "total_steps": 10853, "loss": 0.1475, "learning_rate": 4.000106157483919e-06, "epoch": 0.3304003316902382, "percentage": 33.04, "elapsed_time": "11:20:28", "remaining_time": "22:58:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3587, "total_steps": 10853, "loss": 0.1643, "learning_rate": 3.999496685797914e-06, "epoch": 0.3304924678675082, "percentage": 33.05, "elapsed_time": "11:20:39", "remaining_time": "22:58:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3588, "total_steps": 10853, "loss": 0.16, "learning_rate": 3.998887074883481e-06, "epoch": 0.3305846040447782, "percentage": 33.06, "elapsed_time": "11:20:49", "remaining_time": "22:58:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3589, "total_steps": 10853, "loss": 0.1718, "learning_rate": 3.9982773247972204e-06, "epoch": 0.3306767402220482, "percentage": 33.07, "elapsed_time": "11:21:01", "remaining_time": "22:58:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3590, "total_steps": 10853, "loss": 0.1617, "learning_rate": 3.99766743559575e-06, "epoch": 0.3307688763993182, "percentage": 33.08, "elapsed_time": "11:21:12", "remaining_time": "22:58:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3591, "total_steps": 10853, "loss": 0.1537, "learning_rate": 3.997057407335697e-06, "epoch": 0.3308610125765882, "percentage": 33.09, "elapsed_time": "11:21:23", "remaining_time": "22:57:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3592, "total_steps": 10853, "loss": 0.1617, "learning_rate": 3.996447240073702e-06, "epoch": 0.33095314875385823, "percentage": 33.1, "elapsed_time": "11:21:34", "remaining_time": "22:57:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3593, "total_steps": 10853, "loss": 0.1493, "learning_rate": 3.995836933866421e-06, "epoch": 0.3310452849311282, "percentage": 33.11, "elapsed_time": "11:21:44", "remaining_time": "22:57:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3594, "total_steps": 10853, "loss": 0.1603, "learning_rate": 3.995226488770519e-06, "epoch": 0.3311374211083982, "percentage": 33.12, "elapsed_time": "11:21:55", "remaining_time": "22:57:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3595, "total_steps": 10853, "loss": 0.1612, "learning_rate": 3.994615904842676e-06, "epoch": 0.3312295572856682, "percentage": 33.12, "elapsed_time": "11:22:05", "remaining_time": "22:57:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3596, "total_steps": 10853, "loss": 0.1813, "learning_rate": 3.994005182139586e-06, "epoch": 0.3313216934629382, "percentage": 33.13, "elapsed_time": "11:22:17", "remaining_time": "22:56:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3597, "total_steps": 10853, "loss": 0.1597, "learning_rate": 3.993394320717952e-06, "epoch": 0.3314138296402082, "percentage": 33.14, "elapsed_time": "11:22:27", "remaining_time": "22:56:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3598, "total_steps": 10853, "loss": 0.1464, "learning_rate": 3.992783320634498e-06, "epoch": 0.3315059658174782, "percentage": 33.15, "elapsed_time": "11:22:38", "remaining_time": "22:56:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3599, "total_steps": 10853, "loss": 0.1658, "learning_rate": 3.992172181945951e-06, "epoch": 0.33159810199474826, "percentage": 33.16, "elapsed_time": "11:22:47", "remaining_time": "22:56:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3600, "total_steps": 10853, "loss": 0.166, "learning_rate": 3.991560904709055e-06, "epoch": 0.33169023817201826, "percentage": 33.17, "elapsed_time": "11:22:59", "remaining_time": "22:56:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3601, "total_steps": 10853, "loss": 0.161, "learning_rate": 3.990949488980569e-06, "epoch": 0.33178237434928826, "percentage": 33.18, "elapsed_time": "11:23:09", "remaining_time": "22:55:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3602, "total_steps": 10853, "loss": 0.1685, "learning_rate": 3.990337934817263e-06, "epoch": 0.33187451052655825, "percentage": 33.19, "elapsed_time": "11:23:21", "remaining_time": "22:55:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3603, "total_steps": 10853, "loss": 0.1489, "learning_rate": 3.989726242275919e-06, "epoch": 0.33196664670382825, "percentage": 33.2, "elapsed_time": "11:23:33", "remaining_time": "22:55:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3604, "total_steps": 10853, "loss": 0.1636, "learning_rate": 3.989114411413333e-06, "epoch": 0.33205878288109825, "percentage": 33.21, "elapsed_time": "11:23:44", "remaining_time": "22:55:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3605, "total_steps": 10853, "loss": 0.1496, "learning_rate": 3.988502442286314e-06, "epoch": 0.33215091905836824, "percentage": 33.22, "elapsed_time": "11:23:55", "remaining_time": "22:55:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3606, "total_steps": 10853, "loss": 0.1521, "learning_rate": 3.987890334951683e-06, "epoch": 0.3322430552356383, "percentage": 33.23, "elapsed_time": "11:24:06", "remaining_time": "22:54:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3607, "total_steps": 10853, "loss": 0.1754, "learning_rate": 3.987278089466274e-06, "epoch": 0.3323351914129083, "percentage": 33.24, "elapsed_time": "11:24:16", "remaining_time": "22:54:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3608, "total_steps": 10853, "loss": 0.1557, "learning_rate": 3.986665705886934e-06, "epoch": 0.3324273275901783, "percentage": 33.24, "elapsed_time": "11:24:27", "remaining_time": "22:54:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3609, "total_steps": 10853, "loss": 0.1541, "learning_rate": 3.986053184270524e-06, "epoch": 0.3325194637674483, "percentage": 33.25, "elapsed_time": "11:24:39", "remaining_time": "22:54:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3610, "total_steps": 10853, "loss": 0.1632, "learning_rate": 3.9854405246739155e-06, "epoch": 0.3326115999447183, "percentage": 33.26, "elapsed_time": "11:24:50", "remaining_time": "22:54:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3611, "total_steps": 10853, "loss": 0.1606, "learning_rate": 3.984827727153995e-06, "epoch": 0.3327037361219883, "percentage": 33.27, "elapsed_time": "11:25:01", "remaining_time": "22:53:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3612, "total_steps": 10853, "loss": 0.1548, "learning_rate": 3.984214791767659e-06, "epoch": 0.3327958722992583, "percentage": 33.28, "elapsed_time": "11:25:11", "remaining_time": "22:53:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3613, "total_steps": 10853, "loss": 0.1577, "learning_rate": 3.983601718571821e-06, "epoch": 0.33288800847652833, "percentage": 33.29, "elapsed_time": "11:25:22", "remaining_time": "22:53:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3614, "total_steps": 10853, "loss": 0.1532, "learning_rate": 3.982988507623403e-06, "epoch": 0.3329801446537983, "percentage": 33.3, "elapsed_time": "11:25:32", "remaining_time": "22:53:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3615, "total_steps": 10853, "loss": 0.1573, "learning_rate": 3.982375158979344e-06, "epoch": 0.3330722808310683, "percentage": 33.31, "elapsed_time": "11:25:42", "remaining_time": "22:52:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3616, "total_steps": 10853, "loss": 0.1479, "learning_rate": 3.98176167269659e-06, "epoch": 0.3331644170083383, "percentage": 33.32, "elapsed_time": "11:25:53", "remaining_time": "22:52:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3617, "total_steps": 10853, "loss": 0.1608, "learning_rate": 3.981148048832106e-06, "epoch": 0.3332565531856083, "percentage": 33.33, "elapsed_time": "11:26:03", "remaining_time": "22:52:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3618, "total_steps": 10853, "loss": 0.1521, "learning_rate": 3.980534287442866e-06, "epoch": 0.3333486893628783, "percentage": 33.34, "elapsed_time": "11:26:15", "remaining_time": "22:52:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3619, "total_steps": 10853, "loss": 0.1519, "learning_rate": 3.9799203885858584e-06, "epoch": 0.33344082554014837, "percentage": 33.35, "elapsed_time": "11:26:26", "remaining_time": "22:52:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3620, "total_steps": 10853, "loss": 0.1425, "learning_rate": 3.979306352318083e-06, "epoch": 0.33353296171741836, "percentage": 33.35, "elapsed_time": "11:26:36", "remaining_time": "22:51:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3621, "total_steps": 10853, "loss": 0.1494, "learning_rate": 3.978692178696555e-06, "epoch": 0.33362509789468836, "percentage": 33.36, "elapsed_time": "11:26:47", "remaining_time": "22:51:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3622, "total_steps": 10853, "loss": 0.1709, "learning_rate": 3.9780778677782974e-06, "epoch": 0.33371723407195836, "percentage": 33.37, "elapsed_time": "11:26:58", "remaining_time": "22:51:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3623, "total_steps": 10853, "loss": 0.1779, "learning_rate": 3.977463419620352e-06, "epoch": 0.33380937024922835, "percentage": 33.38, "elapsed_time": "11:27:09", "remaining_time": "22:51:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3624, "total_steps": 10853, "loss": 0.1615, "learning_rate": 3.976848834279767e-06, "epoch": 0.33390150642649835, "percentage": 33.39, "elapsed_time": "11:27:20", "remaining_time": "22:51:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3625, "total_steps": 10853, "loss": 0.1568, "learning_rate": 3.976234111813611e-06, "epoch": 0.33399364260376835, "percentage": 33.4, "elapsed_time": "11:27:31", "remaining_time": "22:50:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3626, "total_steps": 10853, "loss": 0.1648, "learning_rate": 3.975619252278958e-06, "epoch": 0.3340857787810384, "percentage": 33.41, "elapsed_time": "11:27:43", "remaining_time": "22:50:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3627, "total_steps": 10853, "loss": 0.1494, "learning_rate": 3.9750042557328986e-06, "epoch": 0.3341779149583084, "percentage": 33.42, "elapsed_time": "11:27:54", "remaining_time": "22:50:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3628, "total_steps": 10853, "loss": 0.1505, "learning_rate": 3.974389122232536e-06, "epoch": 0.3342700511355784, "percentage": 33.43, "elapsed_time": "11:28:05", "remaining_time": "22:50:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3629, "total_steps": 10853, "loss": 0.1441, "learning_rate": 3.973773851834983e-06, "epoch": 0.3343621873128484, "percentage": 33.44, "elapsed_time": "11:28:16", "remaining_time": "22:50:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3630, "total_steps": 10853, "loss": 0.1566, "learning_rate": 3.973158444597371e-06, "epoch": 0.3344543234901184, "percentage": 33.45, "elapsed_time": "11:28:27", "remaining_time": "22:49:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3631, "total_steps": 10853, "loss": 0.1642, "learning_rate": 3.972542900576838e-06, "epoch": 0.3345464596673884, "percentage": 33.46, "elapsed_time": "11:28:37", "remaining_time": "22:49:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3632, "total_steps": 10853, "loss": 0.1546, "learning_rate": 3.9719272198305385e-06, "epoch": 0.3346385958446584, "percentage": 33.47, "elapsed_time": "11:28:47", "remaining_time": "22:49:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3633, "total_steps": 10853, "loss": 0.154, "learning_rate": 3.971311402415638e-06, "epoch": 0.33473073202192843, "percentage": 33.47, "elapsed_time": "11:28:58", "remaining_time": "22:49:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3634, "total_steps": 10853, "loss": 0.1566, "learning_rate": 3.970695448389315e-06, "epoch": 0.33482286819919843, "percentage": 33.48, "elapsed_time": "11:29:09", "remaining_time": "22:49:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3635, "total_steps": 10853, "loss": 0.1522, "learning_rate": 3.970079357808763e-06, "epoch": 0.33491500437646843, "percentage": 33.49, "elapsed_time": "11:29:20", "remaining_time": "22:48:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3636, "total_steps": 10853, "loss": 0.1658, "learning_rate": 3.969463130731183e-06, "epoch": 0.3350071405537384, "percentage": 33.5, "elapsed_time": "11:29:31", "remaining_time": "22:48:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3637, "total_steps": 10853, "loss": 0.1638, "learning_rate": 3.968846767213794e-06, "epoch": 0.3350992767310084, "percentage": 33.51, "elapsed_time": "11:29:42", "remaining_time": "22:48:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3638, "total_steps": 10853, "loss": 0.1607, "learning_rate": 3.968230267313824e-06, "epoch": 0.3351914129082784, "percentage": 33.52, "elapsed_time": "11:29:52", "remaining_time": "22:48:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3639, "total_steps": 10853, "loss": 0.1602, "learning_rate": 3.967613631088516e-06, "epoch": 0.3352835490855484, "percentage": 33.53, "elapsed_time": "11:30:03", "remaining_time": "22:47:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3640, "total_steps": 10853, "loss": 0.1621, "learning_rate": 3.966996858595123e-06, "epoch": 0.33537568526281847, "percentage": 33.54, "elapsed_time": "11:30:13", "remaining_time": "22:47:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3641, "total_steps": 10853, "loss": 0.1479, "learning_rate": 3.966379949890916e-06, "epoch": 0.33546782144008847, "percentage": 33.55, "elapsed_time": "11:30:24", "remaining_time": "22:47:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3642, "total_steps": 10853, "loss": 0.1442, "learning_rate": 3.965762905033171e-06, "epoch": 0.33555995761735846, "percentage": 33.56, "elapsed_time": "11:30:35", "remaining_time": "22:47:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3643, "total_steps": 10853, "loss": 0.1727, "learning_rate": 3.965145724079184e-06, "epoch": 0.33565209379462846, "percentage": 33.57, "elapsed_time": "11:30:46", "remaining_time": "22:47:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3644, "total_steps": 10853, "loss": 0.1582, "learning_rate": 3.964528407086259e-06, "epoch": 0.33574422997189846, "percentage": 33.58, "elapsed_time": "11:30:58", "remaining_time": "22:46:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3645, "total_steps": 10853, "loss": 0.1427, "learning_rate": 3.963910954111712e-06, "epoch": 0.33583636614916845, "percentage": 33.59, "elapsed_time": "11:31:10", "remaining_time": "22:46:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3646, "total_steps": 10853, "loss": 0.1634, "learning_rate": 3.9632933652128765e-06, "epoch": 0.33592850232643845, "percentage": 33.59, "elapsed_time": "11:31:20", "remaining_time": "22:46:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3647, "total_steps": 10853, "loss": 0.1768, "learning_rate": 3.962675640447094e-06, "epoch": 0.3360206385037085, "percentage": 33.6, "elapsed_time": "11:31:32", "remaining_time": "22:46:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3648, "total_steps": 10853, "loss": 0.169, "learning_rate": 3.962057779871722e-06, "epoch": 0.3361127746809785, "percentage": 33.61, "elapsed_time": "11:31:43", "remaining_time": "22:46:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3649, "total_steps": 10853, "loss": 0.1548, "learning_rate": 3.961439783544126e-06, "epoch": 0.3362049108582485, "percentage": 33.62, "elapsed_time": "11:31:54", "remaining_time": "22:45:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3650, "total_steps": 10853, "loss": 0.1531, "learning_rate": 3.960821651521691e-06, "epoch": 0.3362970470355185, "percentage": 33.63, "elapsed_time": "11:32:05", "remaining_time": "22:45:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3651, "total_steps": 10853, "loss": 0.1662, "learning_rate": 3.960203383861807e-06, "epoch": 0.3363891832127885, "percentage": 33.64, "elapsed_time": "11:32:16", "remaining_time": "22:45:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3652, "total_steps": 10853, "loss": 0.1519, "learning_rate": 3.959584980621883e-06, "epoch": 0.3364813193900585, "percentage": 33.65, "elapsed_time": "11:32:26", "remaining_time": "22:45:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3653, "total_steps": 10853, "loss": 0.161, "learning_rate": 3.958966441859335e-06, "epoch": 0.33657345556732854, "percentage": 33.66, "elapsed_time": "11:32:37", "remaining_time": "22:45:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3654, "total_steps": 10853, "loss": 0.1478, "learning_rate": 3.958347767631595e-06, "epoch": 0.33666559174459854, "percentage": 33.67, "elapsed_time": "11:32:47", "remaining_time": "22:44:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3655, "total_steps": 10853, "loss": 0.1577, "learning_rate": 3.95772895799611e-06, "epoch": 0.33675772792186853, "percentage": 33.68, "elapsed_time": "11:32:58", "remaining_time": "22:44:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3656, "total_steps": 10853, "loss": 0.1574, "learning_rate": 3.957110013010333e-06, "epoch": 0.33684986409913853, "percentage": 33.69, "elapsed_time": "11:33:09", "remaining_time": "22:44:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3657, "total_steps": 10853, "loss": 0.1531, "learning_rate": 3.9564909327317355e-06, "epoch": 0.3369420002764085, "percentage": 33.7, "elapsed_time": "11:33:21", "remaining_time": "22:44:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3658, "total_steps": 10853, "loss": 0.1433, "learning_rate": 3.955871717217797e-06, "epoch": 0.3370341364536785, "percentage": 33.7, "elapsed_time": "11:33:31", "remaining_time": "22:44:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3659, "total_steps": 10853, "loss": 0.1626, "learning_rate": 3.955252366526014e-06, "epoch": 0.3371262726309485, "percentage": 33.71, "elapsed_time": "11:33:41", "remaining_time": "22:43:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3660, "total_steps": 10853, "loss": 0.1569, "learning_rate": 3.954632880713891e-06, "epoch": 0.3372184088082186, "percentage": 33.72, "elapsed_time": "11:33:52", "remaining_time": "22:43:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3661, "total_steps": 10853, "loss": 0.1612, "learning_rate": 3.954013259838949e-06, "epoch": 0.33731054498548857, "percentage": 33.73, "elapsed_time": "11:34:02", "remaining_time": "22:43:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3662, "total_steps": 10853, "loss": 0.1407, "learning_rate": 3.95339350395872e-06, "epoch": 0.33740268116275857, "percentage": 33.74, "elapsed_time": "11:34:13", "remaining_time": "22:43:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3663, "total_steps": 10853, "loss": 0.177, "learning_rate": 3.952773613130747e-06, "epoch": 0.33749481734002856, "percentage": 33.75, "elapsed_time": "11:34:23", "remaining_time": "22:43:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3664, "total_steps": 10853, "loss": 0.1529, "learning_rate": 3.9521535874125875e-06, "epoch": 0.33758695351729856, "percentage": 33.76, "elapsed_time": "11:34:35", "remaining_time": "22:42:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3665, "total_steps": 10853, "loss": 0.1519, "learning_rate": 3.951533426861812e-06, "epoch": 0.33767908969456856, "percentage": 33.77, "elapsed_time": "11:34:46", "remaining_time": "22:42:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3666, "total_steps": 10853, "loss": 0.1431, "learning_rate": 3.950913131536001e-06, "epoch": 0.33777122587183855, "percentage": 33.78, "elapsed_time": "11:34:57", "remaining_time": "22:42:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3667, "total_steps": 10853, "loss": 0.1693, "learning_rate": 3.950292701492749e-06, "epoch": 0.3378633620491086, "percentage": 33.79, "elapsed_time": "11:35:09", "remaining_time": "22:42:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3668, "total_steps": 10853, "loss": 0.138, "learning_rate": 3.949672136789665e-06, "epoch": 0.3379554982263786, "percentage": 33.8, "elapsed_time": "11:35:17", "remaining_time": "22:41:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3669, "total_steps": 10853, "loss": 0.1486, "learning_rate": 3.949051437484367e-06, "epoch": 0.3380476344036486, "percentage": 33.81, "elapsed_time": "11:35:27", "remaining_time": "22:41:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3670, "total_steps": 10853, "loss": 0.1483, "learning_rate": 3.948430603634486e-06, "epoch": 0.3381397705809186, "percentage": 33.82, "elapsed_time": "11:35:37", "remaining_time": "22:41:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3671, "total_steps": 10853, "loss": 0.1517, "learning_rate": 3.947809635297668e-06, "epoch": 0.3382319067581886, "percentage": 33.82, "elapsed_time": "11:35:48", "remaining_time": "22:41:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3672, "total_steps": 10853, "loss": 0.1727, "learning_rate": 3.9471885325315695e-06, "epoch": 0.3383240429354586, "percentage": 33.83, "elapsed_time": "11:36:00", "remaining_time": "22:41:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3673, "total_steps": 10853, "loss": 0.1555, "learning_rate": 3.94656729539386e-06, "epoch": 0.3384161791127286, "percentage": 33.84, "elapsed_time": "11:36:10", "remaining_time": "22:40:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3674, "total_steps": 10853, "loss": 0.1635, "learning_rate": 3.945945923942221e-06, "epoch": 0.33850831528999864, "percentage": 33.85, "elapsed_time": "11:36:20", "remaining_time": "22:40:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3675, "total_steps": 10853, "loss": 0.1637, "learning_rate": 3.945324418234349e-06, "epoch": 0.33860045146726864, "percentage": 33.86, "elapsed_time": "11:36:31", "remaining_time": "22:40:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3676, "total_steps": 10853, "loss": 0.1479, "learning_rate": 3.944702778327948e-06, "epoch": 0.33869258764453863, "percentage": 33.87, "elapsed_time": "11:36:42", "remaining_time": "22:40:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3677, "total_steps": 10853, "loss": 0.1577, "learning_rate": 3.944081004280738e-06, "epoch": 0.33878472382180863, "percentage": 33.88, "elapsed_time": "11:36:53", "remaining_time": "22:40:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3678, "total_steps": 10853, "loss": 0.1505, "learning_rate": 3.943459096150452e-06, "epoch": 0.33887685999907863, "percentage": 33.89, "elapsed_time": "11:37:04", "remaining_time": "22:39:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3679, "total_steps": 10853, "loss": 0.1561, "learning_rate": 3.942837053994834e-06, "epoch": 0.3389689961763486, "percentage": 33.9, "elapsed_time": "11:37:15", "remaining_time": "22:39:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3680, "total_steps": 10853, "loss": 0.1631, "learning_rate": 3.942214877871639e-06, "epoch": 0.3390611323536186, "percentage": 33.91, "elapsed_time": "11:37:26", "remaining_time": "22:39:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3681, "total_steps": 10853, "loss": 0.1599, "learning_rate": 3.941592567838638e-06, "epoch": 0.3391532685308887, "percentage": 33.92, "elapsed_time": "11:37:37", "remaining_time": "22:39:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3682, "total_steps": 10853, "loss": 0.1481, "learning_rate": 3.940970123953613e-06, "epoch": 0.33924540470815867, "percentage": 33.93, "elapsed_time": "11:37:47", "remaining_time": "22:39:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3683, "total_steps": 10853, "loss": 0.156, "learning_rate": 3.940347546274355e-06, "epoch": 0.33933754088542867, "percentage": 33.94, "elapsed_time": "11:38:00", "remaining_time": "22:38:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3684, "total_steps": 10853, "loss": 0.1548, "learning_rate": 3.9397248348586735e-06, "epoch": 0.33942967706269866, "percentage": 33.94, "elapsed_time": "11:38:10", "remaining_time": "22:38:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3685, "total_steps": 10853, "loss": 0.1437, "learning_rate": 3.939101989764386e-06, "epoch": 0.33952181323996866, "percentage": 33.95, "elapsed_time": "11:38:21", "remaining_time": "22:38:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3686, "total_steps": 10853, "loss": 0.1368, "learning_rate": 3.938479011049324e-06, "epoch": 0.33961394941723866, "percentage": 33.96, "elapsed_time": "11:38:34", "remaining_time": "22:38:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3687, "total_steps": 10853, "loss": 0.1525, "learning_rate": 3.937855898771331e-06, "epoch": 0.3397060855945087, "percentage": 33.97, "elapsed_time": "11:38:44", "remaining_time": "22:38:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3688, "total_steps": 10853, "loss": 0.172, "learning_rate": 3.9372326529882635e-06, "epoch": 0.3397982217717787, "percentage": 33.98, "elapsed_time": "11:38:53", "remaining_time": "22:37:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3689, "total_steps": 10853, "loss": 0.1527, "learning_rate": 3.936609273757988e-06, "epoch": 0.3398903579490487, "percentage": 33.99, "elapsed_time": "11:39:03", "remaining_time": "22:37:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3690, "total_steps": 10853, "loss": 0.1564, "learning_rate": 3.935985761138388e-06, "epoch": 0.3399824941263187, "percentage": 34.0, "elapsed_time": "11:39:13", "remaining_time": "22:37:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3691, "total_steps": 10853, "loss": 0.1446, "learning_rate": 3.935362115187356e-06, "epoch": 0.3400746303035887, "percentage": 34.01, "elapsed_time": "11:39:24", "remaining_time": "22:37:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3692, "total_steps": 10853, "loss": 0.1689, "learning_rate": 3.934738335962796e-06, "epoch": 0.3401667664808587, "percentage": 34.02, "elapsed_time": "11:39:36", "remaining_time": "22:36:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3693, "total_steps": 10853, "loss": 0.1464, "learning_rate": 3.934114423522627e-06, "epoch": 0.3402589026581287, "percentage": 34.03, "elapsed_time": "11:39:47", "remaining_time": "22:36:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3694, "total_steps": 10853, "loss": 0.1603, "learning_rate": 3.93349037792478e-06, "epoch": 0.34035103883539874, "percentage": 34.04, "elapsed_time": "11:39:58", "remaining_time": "22:36:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3695, "total_steps": 10853, "loss": 0.1527, "learning_rate": 3.932866199227196e-06, "epoch": 0.34044317501266874, "percentage": 34.05, "elapsed_time": "11:40:09", "remaining_time": "22:36:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3696, "total_steps": 10853, "loss": 0.1608, "learning_rate": 3.932241887487834e-06, "epoch": 0.34053531118993874, "percentage": 34.06, "elapsed_time": "11:40:21", "remaining_time": "22:36:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3697, "total_steps": 10853, "loss": 0.1627, "learning_rate": 3.931617442764656e-06, "epoch": 0.34062744736720874, "percentage": 34.06, "elapsed_time": "11:40:32", "remaining_time": "22:35:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3698, "total_steps": 10853, "loss": 0.1604, "learning_rate": 3.930992865115645e-06, "epoch": 0.34071958354447873, "percentage": 34.07, "elapsed_time": "11:40:44", "remaining_time": "22:35:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3699, "total_steps": 10853, "loss": 0.1572, "learning_rate": 3.930368154598793e-06, "epoch": 0.34081171972174873, "percentage": 34.08, "elapsed_time": "11:40:55", "remaining_time": "22:35:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3700, "total_steps": 10853, "loss": 0.1598, "learning_rate": 3.929743311272104e-06, "epoch": 0.3409038558990187, "percentage": 34.09, "elapsed_time": "11:41:06", "remaining_time": "22:35:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3701, "total_steps": 10853, "loss": 0.1538, "learning_rate": 3.929118335193594e-06, "epoch": 0.3409959920762888, "percentage": 34.1, "elapsed_time": "11:41:17", "remaining_time": "22:35:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3702, "total_steps": 10853, "loss": 0.1595, "learning_rate": 3.9284932264212925e-06, "epoch": 0.3410881282535588, "percentage": 34.11, "elapsed_time": "11:41:27", "remaining_time": "22:34:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3703, "total_steps": 10853, "loss": 0.1596, "learning_rate": 3.927867985013242e-06, "epoch": 0.3411802644308288, "percentage": 34.12, "elapsed_time": "11:41:39", "remaining_time": "22:34:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3704, "total_steps": 10853, "loss": 0.1655, "learning_rate": 3.9272426110274955e-06, "epoch": 0.34127240060809877, "percentage": 34.13, "elapsed_time": "11:41:51", "remaining_time": "22:34:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3705, "total_steps": 10853, "loss": 0.1766, "learning_rate": 3.926617104522118e-06, "epoch": 0.34136453678536877, "percentage": 34.14, "elapsed_time": "11:42:03", "remaining_time": "22:34:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3706, "total_steps": 10853, "loss": 0.1627, "learning_rate": 3.92599146555519e-06, "epoch": 0.34145667296263876, "percentage": 34.15, "elapsed_time": "11:42:14", "remaining_time": "22:34:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3707, "total_steps": 10853, "loss": 0.1639, "learning_rate": 3.9253656941848e-06, "epoch": 0.34154880913990876, "percentage": 34.16, "elapsed_time": "11:42:26", "remaining_time": "22:34:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3708, "total_steps": 10853, "loss": 0.1669, "learning_rate": 3.9247397904690526e-06, "epoch": 0.3416409453171788, "percentage": 34.17, "elapsed_time": "11:42:37", "remaining_time": "22:33:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3709, "total_steps": 10853, "loss": 0.1528, "learning_rate": 3.924113754466062e-06, "epoch": 0.3417330814944488, "percentage": 34.17, "elapsed_time": "11:42:48", "remaining_time": "22:33:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3710, "total_steps": 10853, "loss": 0.153, "learning_rate": 3.923487586233956e-06, "epoch": 0.3418252176717188, "percentage": 34.18, "elapsed_time": "11:42:59", "remaining_time": "22:33:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3711, "total_steps": 10853, "loss": 0.1599, "learning_rate": 3.922861285830874e-06, "epoch": 0.3419173538489888, "percentage": 34.19, "elapsed_time": "11:43:11", "remaining_time": "22:33:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3712, "total_steps": 10853, "loss": 0.1563, "learning_rate": 3.922234853314969e-06, "epoch": 0.3420094900262588, "percentage": 34.2, "elapsed_time": "11:43:23", "remaining_time": "22:33:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3713, "total_steps": 10853, "loss": 0.1571, "learning_rate": 3.921608288744405e-06, "epoch": 0.3421016262035288, "percentage": 34.21, "elapsed_time": "11:43:34", "remaining_time": "22:32:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3714, "total_steps": 10853, "loss": 0.1327, "learning_rate": 3.920981592177358e-06, "epoch": 0.3421937623807988, "percentage": 34.22, "elapsed_time": "11:43:44", "remaining_time": "22:32:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3715, "total_steps": 10853, "loss": 0.1589, "learning_rate": 3.920354763672017e-06, "epoch": 0.34228589855806885, "percentage": 34.23, "elapsed_time": "11:43:56", "remaining_time": "22:32:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3716, "total_steps": 10853, "loss": 0.146, "learning_rate": 3.9197278032865835e-06, "epoch": 0.34237803473533884, "percentage": 34.24, "elapsed_time": "11:44:09", "remaining_time": "22:32:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3717, "total_steps": 10853, "loss": 0.1544, "learning_rate": 3.919100711079271e-06, "epoch": 0.34247017091260884, "percentage": 34.25, "elapsed_time": "11:44:19", "remaining_time": "22:32:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3718, "total_steps": 10853, "loss": 0.1521, "learning_rate": 3.918473487108305e-06, "epoch": 0.34256230708987884, "percentage": 34.26, "elapsed_time": "11:44:31", "remaining_time": "22:32:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3719, "total_steps": 10853, "loss": 0.1532, "learning_rate": 3.917846131431923e-06, "epoch": 0.34265444326714883, "percentage": 34.27, "elapsed_time": "11:44:42", "remaining_time": "22:31:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3720, "total_steps": 10853, "loss": 0.1548, "learning_rate": 3.917218644108375e-06, "epoch": 0.34274657944441883, "percentage": 34.28, "elapsed_time": "11:44:53", "remaining_time": "22:31:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3721, "total_steps": 10853, "loss": 0.1618, "learning_rate": 3.916591025195923e-06, "epoch": 0.3428387156216889, "percentage": 34.29, "elapsed_time": "11:45:03", "remaining_time": "22:31:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3722, "total_steps": 10853, "loss": 0.1598, "learning_rate": 3.915963274752842e-06, "epoch": 0.3429308517989589, "percentage": 34.29, "elapsed_time": "11:45:13", "remaining_time": "22:31:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3723, "total_steps": 10853, "loss": 0.1608, "learning_rate": 3.915335392837418e-06, "epoch": 0.3430229879762289, "percentage": 34.3, "elapsed_time": "11:45:24", "remaining_time": "22:30:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3724, "total_steps": 10853, "loss": 0.1429, "learning_rate": 3.914707379507952e-06, "epoch": 0.3431151241534989, "percentage": 34.31, "elapsed_time": "11:45:34", "remaining_time": "22:30:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3725, "total_steps": 10853, "loss": 0.1562, "learning_rate": 3.914079234822752e-06, "epoch": 0.34320726033076887, "percentage": 34.32, "elapsed_time": "11:45:45", "remaining_time": "22:30:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3726, "total_steps": 10853, "loss": 0.1487, "learning_rate": 3.913450958840144e-06, "epoch": 0.34329939650803887, "percentage": 34.33, "elapsed_time": "11:45:57", "remaining_time": "22:30:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3727, "total_steps": 10853, "loss": 0.1618, "learning_rate": 3.912822551618461e-06, "epoch": 0.34339153268530886, "percentage": 34.34, "elapsed_time": "11:46:08", "remaining_time": "22:30:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3728, "total_steps": 10853, "loss": 0.1582, "learning_rate": 3.912194013216053e-06, "epoch": 0.3434836688625789, "percentage": 34.35, "elapsed_time": "11:46:20", "remaining_time": "22:29:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3729, "total_steps": 10853, "loss": 0.1441, "learning_rate": 3.911565343691279e-06, "epoch": 0.3435758050398489, "percentage": 34.36, "elapsed_time": "11:46:30", "remaining_time": "22:29:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3730, "total_steps": 10853, "loss": 0.1624, "learning_rate": 3.910936543102511e-06, "epoch": 0.3436679412171189, "percentage": 34.37, "elapsed_time": "11:46:40", "remaining_time": "22:29:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3731, "total_steps": 10853, "loss": 0.1491, "learning_rate": 3.910307611508133e-06, "epoch": 0.3437600773943889, "percentage": 34.38, "elapsed_time": "11:46:51", "remaining_time": "22:29:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3732, "total_steps": 10853, "loss": 0.146, "learning_rate": 3.9096785489665405e-06, "epoch": 0.3438522135716589, "percentage": 34.39, "elapsed_time": "11:47:03", "remaining_time": "22:29:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3733, "total_steps": 10853, "loss": 0.1623, "learning_rate": 3.9090493555361445e-06, "epoch": 0.3439443497489289, "percentage": 34.4, "elapsed_time": "11:47:14", "remaining_time": "22:28:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3734, "total_steps": 10853, "loss": 0.1448, "learning_rate": 3.908420031275363e-06, "epoch": 0.3440364859261989, "percentage": 34.41, "elapsed_time": "11:47:24", "remaining_time": "22:28:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3735, "total_steps": 10853, "loss": 0.159, "learning_rate": 3.907790576242631e-06, "epoch": 0.34412862210346895, "percentage": 34.41, "elapsed_time": "11:47:35", "remaining_time": "22:28:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3736, "total_steps": 10853, "loss": 0.1518, "learning_rate": 3.907160990496392e-06, "epoch": 0.34422075828073895, "percentage": 34.42, "elapsed_time": "11:47:47", "remaining_time": "22:28:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3737, "total_steps": 10853, "loss": 0.1551, "learning_rate": 3.9065312740951035e-06, "epoch": 0.34431289445800894, "percentage": 34.43, "elapsed_time": "11:47:58", "remaining_time": "22:28:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3738, "total_steps": 10853, "loss": 0.1389, "learning_rate": 3.905901427097235e-06, "epoch": 0.34440503063527894, "percentage": 34.44, "elapsed_time": "11:48:08", "remaining_time": "22:27:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3739, "total_steps": 10853, "loss": 0.1479, "learning_rate": 3.9052714495612675e-06, "epoch": 0.34449716681254894, "percentage": 34.45, "elapsed_time": "11:48:18", "remaining_time": "22:27:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3740, "total_steps": 10853, "loss": 0.143, "learning_rate": 3.904641341545694e-06, "epoch": 0.34458930298981894, "percentage": 34.46, "elapsed_time": "11:48:30", "remaining_time": "22:27:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3741, "total_steps": 10853, "loss": 0.1571, "learning_rate": 3.904011103109022e-06, "epoch": 0.34468143916708893, "percentage": 34.47, "elapsed_time": "11:48:42", "remaining_time": "22:27:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3742, "total_steps": 10853, "loss": 0.1667, "learning_rate": 3.903380734309767e-06, "epoch": 0.344773575344359, "percentage": 34.48, "elapsed_time": "11:48:54", "remaining_time": "22:27:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3743, "total_steps": 10853, "loss": 0.1539, "learning_rate": 3.90275023520646e-06, "epoch": 0.344865711521629, "percentage": 34.49, "elapsed_time": "11:49:04", "remaining_time": "22:26:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3744, "total_steps": 10853, "loss": 0.1546, "learning_rate": 3.902119605857644e-06, "epoch": 0.344957847698899, "percentage": 34.5, "elapsed_time": "11:49:15", "remaining_time": "22:26:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3745, "total_steps": 10853, "loss": 0.135, "learning_rate": 3.90148884632187e-06, "epoch": 0.345049983876169, "percentage": 34.51, "elapsed_time": "11:49:25", "remaining_time": "22:26:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3746, "total_steps": 10853, "loss": 0.1506, "learning_rate": 3.900857956657707e-06, "epoch": 0.34514212005343897, "percentage": 34.52, "elapsed_time": "11:49:35", "remaining_time": "22:26:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3747, "total_steps": 10853, "loss": 0.1406, "learning_rate": 3.900226936923731e-06, "epoch": 0.34523425623070897, "percentage": 34.53, "elapsed_time": "11:49:45", "remaining_time": "22:26:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3748, "total_steps": 10853, "loss": 0.1551, "learning_rate": 3.899595787178534e-06, "epoch": 0.34532639240797897, "percentage": 34.53, "elapsed_time": "11:49:57", "remaining_time": "22:25:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3749, "total_steps": 10853, "loss": 0.147, "learning_rate": 3.898964507480717e-06, "epoch": 0.345418528585249, "percentage": 34.54, "elapsed_time": "11:50:06", "remaining_time": "22:25:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3750, "total_steps": 10853, "loss": 0.1523, "learning_rate": 3.8983330978888955e-06, "epoch": 0.345510664762519, "percentage": 34.55, "elapsed_time": "11:50:17", "remaining_time": "22:25:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3751, "total_steps": 10853, "loss": 0.1709, "learning_rate": 3.897701558461695e-06, "epoch": 0.345602800939789, "percentage": 34.56, "elapsed_time": "11:50:26", "remaining_time": "22:25:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3752, "total_steps": 10853, "loss": 0.1615, "learning_rate": 3.897069889257754e-06, "epoch": 0.345694937117059, "percentage": 34.57, "elapsed_time": "11:50:38", "remaining_time": "22:24:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3753, "total_steps": 10853, "loss": 0.1491, "learning_rate": 3.8964380903357244e-06, "epoch": 0.345787073294329, "percentage": 34.58, "elapsed_time": "11:50:48", "remaining_time": "22:24:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3754, "total_steps": 10853, "loss": 0.1555, "learning_rate": 3.895806161754267e-06, "epoch": 0.345879209471599, "percentage": 34.59, "elapsed_time": "11:50:59", "remaining_time": "22:24:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3755, "total_steps": 10853, "loss": 0.1739, "learning_rate": 3.895174103572057e-06, "epoch": 0.34597134564886906, "percentage": 34.6, "elapsed_time": "11:51:10", "remaining_time": "22:24:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3756, "total_steps": 10853, "loss": 0.1661, "learning_rate": 3.894541915847783e-06, "epoch": 0.34606348182613905, "percentage": 34.61, "elapsed_time": "11:51:23", "remaining_time": "22:24:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3757, "total_steps": 10853, "loss": 0.159, "learning_rate": 3.89390959864014e-06, "epoch": 0.34615561800340905, "percentage": 34.62, "elapsed_time": "11:51:33", "remaining_time": "22:23:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3758, "total_steps": 10853, "loss": 0.1549, "learning_rate": 3.893277152007842e-06, "epoch": 0.34624775418067905, "percentage": 34.63, "elapsed_time": "11:51:45", "remaining_time": "22:23:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3759, "total_steps": 10853, "loss": 0.1441, "learning_rate": 3.89264457600961e-06, "epoch": 0.34633989035794904, "percentage": 34.64, "elapsed_time": "11:51:56", "remaining_time": "22:23:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3760, "total_steps": 10853, "loss": 0.1581, "learning_rate": 3.892011870704179e-06, "epoch": 0.34643202653521904, "percentage": 34.64, "elapsed_time": "11:52:08", "remaining_time": "22:23:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3761, "total_steps": 10853, "loss": 0.1408, "learning_rate": 3.891379036150297e-06, "epoch": 0.34652416271248904, "percentage": 34.65, "elapsed_time": "11:52:20", "remaining_time": "22:23:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3762, "total_steps": 10853, "loss": 0.1503, "learning_rate": 3.89074607240672e-06, "epoch": 0.3466162988897591, "percentage": 34.66, "elapsed_time": "11:52:31", "remaining_time": "22:23:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3763, "total_steps": 10853, "loss": 0.1541, "learning_rate": 3.890112979532222e-06, "epoch": 0.3467084350670291, "percentage": 34.67, "elapsed_time": "11:52:41", "remaining_time": "22:22:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3764, "total_steps": 10853, "loss": 0.1665, "learning_rate": 3.889479757585584e-06, "epoch": 0.3468005712442991, "percentage": 34.68, "elapsed_time": "11:52:50", "remaining_time": "22:22:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3765, "total_steps": 10853, "loss": 0.1454, "learning_rate": 3.888846406625601e-06, "epoch": 0.3468927074215691, "percentage": 34.69, "elapsed_time": "11:53:01", "remaining_time": "22:22:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3766, "total_steps": 10853, "loss": 0.1573, "learning_rate": 3.888212926711079e-06, "epoch": 0.3469848435988391, "percentage": 34.7, "elapsed_time": "11:53:11", "remaining_time": "22:22:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3767, "total_steps": 10853, "loss": 0.1512, "learning_rate": 3.887579317900838e-06, "epoch": 0.3470769797761091, "percentage": 34.71, "elapsed_time": "11:53:21", "remaining_time": "22:21:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3768, "total_steps": 10853, "loss": 0.1507, "learning_rate": 3.886945580253708e-06, "epoch": 0.34716911595337907, "percentage": 34.72, "elapsed_time": "11:53:32", "remaining_time": "22:21:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3769, "total_steps": 10853, "loss": 0.134, "learning_rate": 3.886311713828531e-06, "epoch": 0.3472612521306491, "percentage": 34.73, "elapsed_time": "11:53:43", "remaining_time": "22:21:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3770, "total_steps": 10853, "loss": 0.1652, "learning_rate": 3.885677718684163e-06, "epoch": 0.3473533883079191, "percentage": 34.74, "elapsed_time": "11:53:54", "remaining_time": "22:21:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3771, "total_steps": 10853, "loss": 0.1515, "learning_rate": 3.885043594879469e-06, "epoch": 0.3474455244851891, "percentage": 34.75, "elapsed_time": "11:54:05", "remaining_time": "22:21:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3772, "total_steps": 10853, "loss": 0.1722, "learning_rate": 3.884409342473329e-06, "epoch": 0.3475376606624591, "percentage": 34.76, "elapsed_time": "11:54:16", "remaining_time": "22:20:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3773, "total_steps": 10853, "loss": 0.1591, "learning_rate": 3.883774961524632e-06, "epoch": 0.3476297968397291, "percentage": 34.76, "elapsed_time": "11:54:26", "remaining_time": "22:20:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3774, "total_steps": 10853, "loss": 0.1586, "learning_rate": 3.88314045209228e-06, "epoch": 0.3477219330169991, "percentage": 34.77, "elapsed_time": "11:54:35", "remaining_time": "22:20:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3775, "total_steps": 10853, "loss": 0.1474, "learning_rate": 3.8825058142351895e-06, "epoch": 0.3478140691942691, "percentage": 34.78, "elapsed_time": "11:54:47", "remaining_time": "22:20:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3776, "total_steps": 10853, "loss": 0.1534, "learning_rate": 3.881871048012285e-06, "epoch": 0.34790620537153916, "percentage": 34.79, "elapsed_time": "11:54:59", "remaining_time": "22:20:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3777, "total_steps": 10853, "loss": 0.1684, "learning_rate": 3.881236153482505e-06, "epoch": 0.34799834154880915, "percentage": 34.8, "elapsed_time": "11:55:09", "remaining_time": "22:19:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3778, "total_steps": 10853, "loss": 0.1594, "learning_rate": 3.880601130704799e-06, "epoch": 0.34809047772607915, "percentage": 34.81, "elapsed_time": "11:55:21", "remaining_time": "22:19:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3779, "total_steps": 10853, "loss": 0.1494, "learning_rate": 3.87996597973813e-06, "epoch": 0.34818261390334915, "percentage": 34.82, "elapsed_time": "11:55:33", "remaining_time": "22:19:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3780, "total_steps": 10853, "loss": 0.1516, "learning_rate": 3.879330700641471e-06, "epoch": 0.34827475008061914, "percentage": 34.83, "elapsed_time": "11:55:43", "remaining_time": "22:19:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3781, "total_steps": 10853, "loss": 0.1786, "learning_rate": 3.878695293473809e-06, "epoch": 0.34836688625788914, "percentage": 34.84, "elapsed_time": "11:55:54", "remaining_time": "22:19:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3782, "total_steps": 10853, "loss": 0.1566, "learning_rate": 3.878059758294139e-06, "epoch": 0.34845902243515914, "percentage": 34.85, "elapsed_time": "11:56:04", "remaining_time": "22:18:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3783, "total_steps": 10853, "loss": 0.1643, "learning_rate": 3.877424095161473e-06, "epoch": 0.3485511586124292, "percentage": 34.86, "elapsed_time": "11:56:16", "remaining_time": "22:18:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3784, "total_steps": 10853, "loss": 0.1524, "learning_rate": 3.8767883041348305e-06, "epoch": 0.3486432947896992, "percentage": 34.87, "elapsed_time": "11:56:27", "remaining_time": "22:18:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3785, "total_steps": 10853, "loss": 0.1486, "learning_rate": 3.8761523852732475e-06, "epoch": 0.3487354309669692, "percentage": 34.88, "elapsed_time": "11:56:38", "remaining_time": "22:18:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3786, "total_steps": 10853, "loss": 0.1456, "learning_rate": 3.875516338635766e-06, "epoch": 0.3488275671442392, "percentage": 34.88, "elapsed_time": "11:56:48", "remaining_time": "22:18:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3787, "total_steps": 10853, "loss": 0.1403, "learning_rate": 3.874880164281446e-06, "epoch": 0.3489197033215092, "percentage": 34.89, "elapsed_time": "11:56:59", "remaining_time": "22:17:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3788, "total_steps": 10853, "loss": 0.1505, "learning_rate": 3.874243862269353e-06, "epoch": 0.3490118394987792, "percentage": 34.9, "elapsed_time": "11:57:10", "remaining_time": "22:17:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3789, "total_steps": 10853, "loss": 0.1628, "learning_rate": 3.87360743265857e-06, "epoch": 0.3491039756760492, "percentage": 34.91, "elapsed_time": "11:57:20", "remaining_time": "22:17:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3790, "total_steps": 10853, "loss": 0.1624, "learning_rate": 3.87297087550819e-06, "epoch": 0.3491961118533192, "percentage": 34.92, "elapsed_time": "11:57:31", "remaining_time": "22:17:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3791, "total_steps": 10853, "loss": 0.1459, "learning_rate": 3.872334190877316e-06, "epoch": 0.3492882480305892, "percentage": 34.93, "elapsed_time": "11:57:42", "remaining_time": "22:16:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3792, "total_steps": 10853, "loss": 0.1444, "learning_rate": 3.8716973788250645e-06, "epoch": 0.3493803842078592, "percentage": 34.94, "elapsed_time": "11:57:53", "remaining_time": "22:16:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3793, "total_steps": 10853, "loss": 0.1463, "learning_rate": 3.871060439410563e-06, "epoch": 0.3494725203851292, "percentage": 34.95, "elapsed_time": "11:58:03", "remaining_time": "22:16:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3794, "total_steps": 10853, "loss": 0.147, "learning_rate": 3.870423372692953e-06, "epoch": 0.3495646565623992, "percentage": 34.96, "elapsed_time": "11:58:15", "remaining_time": "22:16:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3795, "total_steps": 10853, "loss": 0.1471, "learning_rate": 3.869786178731386e-06, "epoch": 0.3496567927396692, "percentage": 34.97, "elapsed_time": "11:58:27", "remaining_time": "22:16:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3796, "total_steps": 10853, "loss": 0.1567, "learning_rate": 3.869148857585024e-06, "epoch": 0.34974892891693926, "percentage": 34.98, "elapsed_time": "11:58:38", "remaining_time": "22:16:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3797, "total_steps": 10853, "loss": 0.1605, "learning_rate": 3.8685114093130436e-06, "epoch": 0.34984106509420926, "percentage": 34.99, "elapsed_time": "11:58:49", "remaining_time": "22:15:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3798, "total_steps": 10853, "loss": 0.1628, "learning_rate": 3.867873833974631e-06, "epoch": 0.34993320127147926, "percentage": 34.99, "elapsed_time": "11:59:00", "remaining_time": "22:15:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3799, "total_steps": 10853, "loss": 0.147, "learning_rate": 3.867236131628985e-06, "epoch": 0.35002533744874925, "percentage": 35.0, "elapsed_time": "11:59:09", "remaining_time": "22:15:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3800, "total_steps": 10853, "loss": 0.1613, "learning_rate": 3.8665983023353195e-06, "epoch": 0.35011747362601925, "percentage": 35.01, "elapsed_time": "11:59:20", "remaining_time": "22:15:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3801, "total_steps": 10853, "loss": 0.1575, "learning_rate": 3.865960346152853e-06, "epoch": 0.35020960980328925, "percentage": 35.02, "elapsed_time": "11:59:31", "remaining_time": "22:14:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3802, "total_steps": 10853, "loss": 0.1603, "learning_rate": 3.865322263140821e-06, "epoch": 0.35030174598055924, "percentage": 35.03, "elapsed_time": "11:59:40", "remaining_time": "22:14:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3803, "total_steps": 10853, "loss": 0.1593, "learning_rate": 3.86468405335847e-06, "epoch": 0.3503938821578293, "percentage": 35.04, "elapsed_time": "11:59:49", "remaining_time": "22:14:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3804, "total_steps": 10853, "loss": 0.1564, "learning_rate": 3.864045716865059e-06, "epoch": 0.3504860183350993, "percentage": 35.05, "elapsed_time": "12:00:01", "remaining_time": "22:14:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3805, "total_steps": 10853, "loss": 0.1658, "learning_rate": 3.863407253719855e-06, "epoch": 0.3505781545123693, "percentage": 35.06, "elapsed_time": "12:00:13", "remaining_time": "22:14:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3806, "total_steps": 10853, "loss": 0.1524, "learning_rate": 3.8627686639821415e-06, "epoch": 0.3506702906896393, "percentage": 35.07, "elapsed_time": "12:00:24", "remaining_time": "22:13:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3807, "total_steps": 10853, "loss": 0.1594, "learning_rate": 3.8621299477112105e-06, "epoch": 0.3507624268669093, "percentage": 35.08, "elapsed_time": "12:00:34", "remaining_time": "22:13:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3808, "total_steps": 10853, "loss": 0.143, "learning_rate": 3.861491104966368e-06, "epoch": 0.3508545630441793, "percentage": 35.09, "elapsed_time": "12:00:44", "remaining_time": "22:13:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3809, "total_steps": 10853, "loss": 0.1612, "learning_rate": 3.860852135806929e-06, "epoch": 0.3509466992214493, "percentage": 35.1, "elapsed_time": "12:00:55", "remaining_time": "22:13:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3810, "total_steps": 10853, "loss": 0.1516, "learning_rate": 3.860213040292224e-06, "epoch": 0.35103883539871933, "percentage": 35.11, "elapsed_time": "12:01:06", "remaining_time": "22:13:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3811, "total_steps": 10853, "loss": 0.1462, "learning_rate": 3.85957381848159e-06, "epoch": 0.3511309715759893, "percentage": 35.11, "elapsed_time": "12:01:17", "remaining_time": "22:12:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3812, "total_steps": 10853, "loss": 0.1489, "learning_rate": 3.858934470434381e-06, "epoch": 0.3512231077532593, "percentage": 35.12, "elapsed_time": "12:01:28", "remaining_time": "22:12:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3813, "total_steps": 10853, "loss": 0.1563, "learning_rate": 3.858294996209961e-06, "epoch": 0.3513152439305293, "percentage": 35.13, "elapsed_time": "12:01:38", "remaining_time": "22:12:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3814, "total_steps": 10853, "loss": 0.1571, "learning_rate": 3.857655395867704e-06, "epoch": 0.3514073801077993, "percentage": 35.14, "elapsed_time": "12:01:49", "remaining_time": "22:12:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3815, "total_steps": 10853, "loss": 0.157, "learning_rate": 3.857015669466998e-06, "epoch": 0.3514995162850693, "percentage": 35.15, "elapsed_time": "12:01:59", "remaining_time": "22:11:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3816, "total_steps": 10853, "loss": 0.1627, "learning_rate": 3.856375817067241e-06, "epoch": 0.3515916524623393, "percentage": 35.16, "elapsed_time": "12:02:10", "remaining_time": "22:11:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3817, "total_steps": 10853, "loss": 0.1417, "learning_rate": 3.855735838727842e-06, "epoch": 0.35168378863960936, "percentage": 35.17, "elapsed_time": "12:02:20", "remaining_time": "22:11:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3818, "total_steps": 10853, "loss": 0.1379, "learning_rate": 3.855095734508225e-06, "epoch": 0.35177592481687936, "percentage": 35.18, "elapsed_time": "12:02:31", "remaining_time": "22:11:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3819, "total_steps": 10853, "loss": 0.1494, "learning_rate": 3.854455504467824e-06, "epoch": 0.35186806099414936, "percentage": 35.19, "elapsed_time": "12:02:43", "remaining_time": "22:11:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3820, "total_steps": 10853, "loss": 0.1392, "learning_rate": 3.853815148666084e-06, "epoch": 0.35196019717141935, "percentage": 35.2, "elapsed_time": "12:02:52", "remaining_time": "22:10:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3821, "total_steps": 10853, "loss": 0.1459, "learning_rate": 3.85317466716246e-06, "epoch": 0.35205233334868935, "percentage": 35.21, "elapsed_time": "12:03:03", "remaining_time": "22:10:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3822, "total_steps": 10853, "loss": 0.1514, "learning_rate": 3.852534060016424e-06, "epoch": 0.35214446952595935, "percentage": 35.22, "elapsed_time": "12:03:13", "remaining_time": "22:10:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3823, "total_steps": 10853, "loss": 0.1556, "learning_rate": 3.8518933272874546e-06, "epoch": 0.3522366057032294, "percentage": 35.23, "elapsed_time": "12:03:23", "remaining_time": "22:10:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3824, "total_steps": 10853, "loss": 0.1647, "learning_rate": 3.851252469035044e-06, "epoch": 0.3523287418804994, "percentage": 35.23, "elapsed_time": "12:03:34", "remaining_time": "22:10:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3825, "total_steps": 10853, "loss": 0.1526, "learning_rate": 3.850611485318696e-06, "epoch": 0.3524208780577694, "percentage": 35.24, "elapsed_time": "12:03:44", "remaining_time": "22:09:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3826, "total_steps": 10853, "loss": 0.1504, "learning_rate": 3.8499703761979276e-06, "epoch": 0.3525130142350394, "percentage": 35.25, "elapsed_time": "12:03:54", "remaining_time": "22:09:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3827, "total_steps": 10853, "loss": 0.1539, "learning_rate": 3.849329141732263e-06, "epoch": 0.3526051504123094, "percentage": 35.26, "elapsed_time": "12:04:04", "remaining_time": "22:09:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3828, "total_steps": 10853, "loss": 0.1552, "learning_rate": 3.848687781981243e-06, "epoch": 0.3526972865895794, "percentage": 35.27, "elapsed_time": "12:04:16", "remaining_time": "22:09:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3829, "total_steps": 10853, "loss": 0.1447, "learning_rate": 3.848046297004417e-06, "epoch": 0.3527894227668494, "percentage": 35.28, "elapsed_time": "12:04:26", "remaining_time": "22:08:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3830, "total_steps": 10853, "loss": 0.1439, "learning_rate": 3.847404686861348e-06, "epoch": 0.35288155894411943, "percentage": 35.29, "elapsed_time": "12:04:37", "remaining_time": "22:08:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3831, "total_steps": 10853, "loss": 0.1552, "learning_rate": 3.846762951611608e-06, "epoch": 0.35297369512138943, "percentage": 35.3, "elapsed_time": "12:04:47", "remaining_time": "22:08:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3832, "total_steps": 10853, "loss": 0.1545, "learning_rate": 3.846121091314783e-06, "epoch": 0.3530658312986594, "percentage": 35.31, "elapsed_time": "12:04:58", "remaining_time": "22:08:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3833, "total_steps": 10853, "loss": 0.1405, "learning_rate": 3.84547910603047e-06, "epoch": 0.3531579674759294, "percentage": 35.32, "elapsed_time": "12:05:09", "remaining_time": "22:08:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3834, "total_steps": 10853, "loss": 0.1757, "learning_rate": 3.8448369958182775e-06, "epoch": 0.3532501036531994, "percentage": 35.33, "elapsed_time": "12:05:20", "remaining_time": "22:07:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3835, "total_steps": 10853, "loss": 0.163, "learning_rate": 3.844194760737825e-06, "epoch": 0.3533422398304694, "percentage": 35.34, "elapsed_time": "12:05:31", "remaining_time": "22:07:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3836, "total_steps": 10853, "loss": 0.1492, "learning_rate": 3.843552400848744e-06, "epoch": 0.3534343760077394, "percentage": 35.35, "elapsed_time": "12:05:43", "remaining_time": "22:07:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3837, "total_steps": 10853, "loss": 0.143, "learning_rate": 3.842909916210678e-06, "epoch": 0.35352651218500947, "percentage": 35.35, "elapsed_time": "12:05:52", "remaining_time": "22:07:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3838, "total_steps": 10853, "loss": 0.1589, "learning_rate": 3.842267306883283e-06, "epoch": 0.35361864836227946, "percentage": 35.36, "elapsed_time": "12:06:03", "remaining_time": "22:07:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3839, "total_steps": 10853, "loss": 0.1415, "learning_rate": 3.8416245729262225e-06, "epoch": 0.35371078453954946, "percentage": 35.37, "elapsed_time": "12:06:13", "remaining_time": "22:06:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3840, "total_steps": 10853, "loss": 0.1517, "learning_rate": 3.840981714399177e-06, "epoch": 0.35380292071681946, "percentage": 35.38, "elapsed_time": "12:06:23", "remaining_time": "22:06:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3841, "total_steps": 10853, "loss": 0.1494, "learning_rate": 3.840338731361834e-06, "epoch": 0.35389505689408945, "percentage": 35.39, "elapsed_time": "12:06:33", "remaining_time": "22:06:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3842, "total_steps": 10853, "loss": 0.1558, "learning_rate": 3.839695623873896e-06, "epoch": 0.35398719307135945, "percentage": 35.4, "elapsed_time": "12:06:44", "remaining_time": "22:06:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3843, "total_steps": 10853, "loss": 0.1542, "learning_rate": 3.839052391995076e-06, "epoch": 0.35407932924862945, "percentage": 35.41, "elapsed_time": "12:06:54", "remaining_time": "22:05:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3844, "total_steps": 10853, "loss": 0.1544, "learning_rate": 3.8384090357850964e-06, "epoch": 0.3541714654258995, "percentage": 35.42, "elapsed_time": "12:07:05", "remaining_time": "22:05:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3845, "total_steps": 10853, "loss": 0.1538, "learning_rate": 3.837765555303694e-06, "epoch": 0.3542636016031695, "percentage": 35.43, "elapsed_time": "12:07:16", "remaining_time": "22:05:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3846, "total_steps": 10853, "loss": 0.1479, "learning_rate": 3.837121950610616e-06, "epoch": 0.3543557377804395, "percentage": 35.44, "elapsed_time": "12:07:26", "remaining_time": "22:05:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3847, "total_steps": 10853, "loss": 0.1324, "learning_rate": 3.8364782217656205e-06, "epoch": 0.3544478739577095, "percentage": 35.45, "elapsed_time": "12:07:37", "remaining_time": "22:05:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3848, "total_steps": 10853, "loss": 0.1557, "learning_rate": 3.835834368828479e-06, "epoch": 0.3545400101349795, "percentage": 35.46, "elapsed_time": "12:07:48", "remaining_time": "22:04:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3849, "total_steps": 10853, "loss": 0.1607, "learning_rate": 3.835190391858972e-06, "epoch": 0.3546321463122495, "percentage": 35.46, "elapsed_time": "12:08:00", "remaining_time": "22:04:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3850, "total_steps": 10853, "loss": 0.1565, "learning_rate": 3.834546290916893e-06, "epoch": 0.3547242824895195, "percentage": 35.47, "elapsed_time": "12:08:11", "remaining_time": "22:04:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3851, "total_steps": 10853, "loss": 0.14, "learning_rate": 3.833902066062049e-06, "epoch": 0.35481641866678953, "percentage": 35.48, "elapsed_time": "12:08:22", "remaining_time": "22:04:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3852, "total_steps": 10853, "loss": 0.162, "learning_rate": 3.833257717354253e-06, "epoch": 0.35490855484405953, "percentage": 35.49, "elapsed_time": "12:08:33", "remaining_time": "22:04:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3853, "total_steps": 10853, "loss": 0.1549, "learning_rate": 3.832613244853335e-06, "epoch": 0.35500069102132953, "percentage": 35.5, "elapsed_time": "12:08:43", "remaining_time": "22:03:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3854, "total_steps": 10853, "loss": 0.1643, "learning_rate": 3.831968648619133e-06, "epoch": 0.3550928271985995, "percentage": 35.51, "elapsed_time": "12:08:55", "remaining_time": "22:03:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3855, "total_steps": 10853, "loss": 0.148, "learning_rate": 3.8313239287115e-06, "epoch": 0.3551849633758695, "percentage": 35.52, "elapsed_time": "12:09:05", "remaining_time": "22:03:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3856, "total_steps": 10853, "loss": 0.1585, "learning_rate": 3.830679085190296e-06, "epoch": 0.3552770995531395, "percentage": 35.53, "elapsed_time": "12:09:17", "remaining_time": "22:03:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3857, "total_steps": 10853, "loss": 0.1582, "learning_rate": 3.830034118115396e-06, "epoch": 0.35536923573040957, "percentage": 35.54, "elapsed_time": "12:09:27", "remaining_time": "22:03:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3858, "total_steps": 10853, "loss": 0.1437, "learning_rate": 3.829389027546685e-06, "epoch": 0.35546137190767957, "percentage": 35.55, "elapsed_time": "12:09:37", "remaining_time": "22:02:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3859, "total_steps": 10853, "loss": 0.1432, "learning_rate": 3.828743813544059e-06, "epoch": 0.35555350808494957, "percentage": 35.56, "elapsed_time": "12:09:47", "remaining_time": "22:02:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3860, "total_steps": 10853, "loss": 0.1554, "learning_rate": 3.8280984761674286e-06, "epoch": 0.35564564426221956, "percentage": 35.57, "elapsed_time": "12:09:57", "remaining_time": "22:02:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3861, "total_steps": 10853, "loss": 0.1604, "learning_rate": 3.82745301547671e-06, "epoch": 0.35573778043948956, "percentage": 35.58, "elapsed_time": "12:10:08", "remaining_time": "22:02:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3862, "total_steps": 10853, "loss": 0.1585, "learning_rate": 3.8268074315318375e-06, "epoch": 0.35582991661675956, "percentage": 35.58, "elapsed_time": "12:10:19", "remaining_time": "22:02:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3863, "total_steps": 10853, "loss": 0.142, "learning_rate": 3.826161724392751e-06, "epoch": 0.35592205279402955, "percentage": 35.59, "elapsed_time": "12:10:30", "remaining_time": "22:01:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3864, "total_steps": 10853, "loss": 0.1413, "learning_rate": 3.8255158941194066e-06, "epoch": 0.3560141889712996, "percentage": 35.6, "elapsed_time": "12:10:39", "remaining_time": "22:01:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3865, "total_steps": 10853, "loss": 0.1448, "learning_rate": 3.824869940771768e-06, "epoch": 0.3561063251485696, "percentage": 35.61, "elapsed_time": "12:10:49", "remaining_time": "22:01:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3866, "total_steps": 10853, "loss": 0.1508, "learning_rate": 3.824223864409813e-06, "epoch": 0.3561984613258396, "percentage": 35.62, "elapsed_time": "12:10:59", "remaining_time": "22:01:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3867, "total_steps": 10853, "loss": 0.1583, "learning_rate": 3.823577665093529e-06, "epoch": 0.3562905975031096, "percentage": 35.63, "elapsed_time": "12:11:10", "remaining_time": "22:00:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3868, "total_steps": 10853, "loss": 0.154, "learning_rate": 3.822931342882918e-06, "epoch": 0.3563827336803796, "percentage": 35.64, "elapsed_time": "12:11:20", "remaining_time": "22:00:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3869, "total_steps": 10853, "loss": 0.1574, "learning_rate": 3.822284897837989e-06, "epoch": 0.3564748698576496, "percentage": 35.65, "elapsed_time": "12:11:30", "remaining_time": "22:00:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3870, "total_steps": 10853, "loss": 0.1613, "learning_rate": 3.821638330018764e-06, "epoch": 0.3565670060349196, "percentage": 35.66, "elapsed_time": "12:11:41", "remaining_time": "22:00:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3871, "total_steps": 10853, "loss": 0.15, "learning_rate": 3.820991639485279e-06, "epoch": 0.35665914221218964, "percentage": 35.67, "elapsed_time": "12:11:53", "remaining_time": "22:00:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3872, "total_steps": 10853, "loss": 0.1482, "learning_rate": 3.820344826297577e-06, "epoch": 0.35675127838945964, "percentage": 35.68, "elapsed_time": "12:12:03", "remaining_time": "21:59:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3873, "total_steps": 10853, "loss": 0.1741, "learning_rate": 3.819697890515717e-06, "epoch": 0.35684341456672963, "percentage": 35.69, "elapsed_time": "12:12:14", "remaining_time": "21:59:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3874, "total_steps": 10853, "loss": 0.1534, "learning_rate": 3.819050832199766e-06, "epoch": 0.35693555074399963, "percentage": 35.7, "elapsed_time": "12:12:25", "remaining_time": "21:59:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3875, "total_steps": 10853, "loss": 0.166, "learning_rate": 3.818403651409801e-06, "epoch": 0.3570276869212696, "percentage": 35.7, "elapsed_time": "12:12:36", "remaining_time": "21:59:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3876, "total_steps": 10853, "loss": 0.1534, "learning_rate": 3.817756348205917e-06, "epoch": 0.3571198230985396, "percentage": 35.71, "elapsed_time": "12:12:46", "remaining_time": "21:59:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3877, "total_steps": 10853, "loss": 0.1479, "learning_rate": 3.817108922648214e-06, "epoch": 0.3572119592758096, "percentage": 35.72, "elapsed_time": "12:12:56", "remaining_time": "21:58:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3878, "total_steps": 10853, "loss": 0.1581, "learning_rate": 3.816461374796805e-06, "epoch": 0.3573040954530797, "percentage": 35.73, "elapsed_time": "12:13:08", "remaining_time": "21:58:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3879, "total_steps": 10853, "loss": 0.1535, "learning_rate": 3.815813704711816e-06, "epoch": 0.35739623163034967, "percentage": 35.74, "elapsed_time": "12:13:19", "remaining_time": "21:58:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3880, "total_steps": 10853, "loss": 0.1377, "learning_rate": 3.815165912453383e-06, "epoch": 0.35748836780761967, "percentage": 35.75, "elapsed_time": "12:13:29", "remaining_time": "21:58:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3881, "total_steps": 10853, "loss": 0.1672, "learning_rate": 3.814517998081654e-06, "epoch": 0.35758050398488966, "percentage": 35.76, "elapsed_time": "12:13:39", "remaining_time": "21:57:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3882, "total_steps": 10853, "loss": 0.1619, "learning_rate": 3.8138699616567875e-06, "epoch": 0.35767264016215966, "percentage": 35.77, "elapsed_time": "12:13:52", "remaining_time": "21:57:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3883, "total_steps": 10853, "loss": 0.1438, "learning_rate": 3.8132218032389524e-06, "epoch": 0.35776477633942966, "percentage": 35.78, "elapsed_time": "12:14:03", "remaining_time": "21:57:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3884, "total_steps": 10853, "loss": 0.1516, "learning_rate": 3.812573522888332e-06, "epoch": 0.35785691251669965, "percentage": 35.79, "elapsed_time": "12:14:12", "remaining_time": "21:57:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3885, "total_steps": 10853, "loss": 0.1721, "learning_rate": 3.81192512066512e-06, "epoch": 0.3579490486939697, "percentage": 35.8, "elapsed_time": "12:14:24", "remaining_time": "21:57:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3886, "total_steps": 10853, "loss": 0.1502, "learning_rate": 3.811276596629518e-06, "epoch": 0.3580411848712397, "percentage": 35.81, "elapsed_time": "12:14:35", "remaining_time": "21:57:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3887, "total_steps": 10853, "loss": 0.1586, "learning_rate": 3.810627950841743e-06, "epoch": 0.3581333210485097, "percentage": 35.81, "elapsed_time": "12:14:45", "remaining_time": "21:56:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3888, "total_steps": 10853, "loss": 0.1533, "learning_rate": 3.8099791833620214e-06, "epoch": 0.3582254572257797, "percentage": 35.82, "elapsed_time": "12:14:55", "remaining_time": "21:56:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3889, "total_steps": 10853, "loss": 0.1585, "learning_rate": 3.8093302942505935e-06, "epoch": 0.3583175934030497, "percentage": 35.83, "elapsed_time": "12:15:05", "remaining_time": "21:56:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3890, "total_steps": 10853, "loss": 0.1624, "learning_rate": 3.8086812835677044e-06, "epoch": 0.3584097295803197, "percentage": 35.84, "elapsed_time": "12:15:17", "remaining_time": "21:56:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3891, "total_steps": 10853, "loss": 0.1618, "learning_rate": 3.808032151373619e-06, "epoch": 0.35850186575758974, "percentage": 35.85, "elapsed_time": "12:15:28", "remaining_time": "21:55:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3892, "total_steps": 10853, "loss": 0.1444, "learning_rate": 3.807382897728607e-06, "epoch": 0.35859400193485974, "percentage": 35.86, "elapsed_time": "12:15:39", "remaining_time": "21:55:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3893, "total_steps": 10853, "loss": 0.1554, "learning_rate": 3.8067335226929523e-06, "epoch": 0.35868613811212974, "percentage": 35.87, "elapsed_time": "12:15:49", "remaining_time": "21:55:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3894, "total_steps": 10853, "loss": 0.1553, "learning_rate": 3.8060840263269494e-06, "epoch": 0.35877827428939973, "percentage": 35.88, "elapsed_time": "12:16:01", "remaining_time": "21:55:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3895, "total_steps": 10853, "loss": 0.1539, "learning_rate": 3.8054344086909043e-06, "epoch": 0.35887041046666973, "percentage": 35.89, "elapsed_time": "12:16:12", "remaining_time": "21:55:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3896, "total_steps": 10853, "loss": 0.1438, "learning_rate": 3.804784669845133e-06, "epoch": 0.35896254664393973, "percentage": 35.9, "elapsed_time": "12:16:24", "remaining_time": "21:54:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3897, "total_steps": 10853, "loss": 0.1397, "learning_rate": 3.8041348098499655e-06, "epoch": 0.3590546828212097, "percentage": 35.91, "elapsed_time": "12:16:33", "remaining_time": "21:54:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3898, "total_steps": 10853, "loss": 0.153, "learning_rate": 3.8034848287657403e-06, "epoch": 0.3591468189984798, "percentage": 35.92, "elapsed_time": "12:16:44", "remaining_time": "21:54:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3899, "total_steps": 10853, "loss": 0.1583, "learning_rate": 3.802834726652809e-06, "epoch": 0.3592389551757498, "percentage": 35.93, "elapsed_time": "12:16:54", "remaining_time": "21:54:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3900, "total_steps": 10853, "loss": 0.1508, "learning_rate": 3.802184503571532e-06, "epoch": 0.35933109135301977, "percentage": 35.93, "elapsed_time": "12:17:06", "remaining_time": "21:54:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3901, "total_steps": 10853, "loss": 0.1728, "learning_rate": 3.801534159582285e-06, "epoch": 0.35942322753028977, "percentage": 35.94, "elapsed_time": "12:17:16", "remaining_time": "21:53:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3902, "total_steps": 10853, "loss": 0.1571, "learning_rate": 3.80088369474545e-06, "epoch": 0.35951536370755977, "percentage": 35.95, "elapsed_time": "12:17:27", "remaining_time": "21:53:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3903, "total_steps": 10853, "loss": 0.1395, "learning_rate": 3.800233109121425e-06, "epoch": 0.35960749988482976, "percentage": 35.96, "elapsed_time": "12:17:38", "remaining_time": "21:53:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3904, "total_steps": 10853, "loss": 0.1475, "learning_rate": 3.7995824027706152e-06, "epoch": 0.35969963606209976, "percentage": 35.97, "elapsed_time": "12:17:50", "remaining_time": "21:53:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3905, "total_steps": 10853, "loss": 0.1549, "learning_rate": 3.7989315757534397e-06, "epoch": 0.3597917722393698, "percentage": 35.98, "elapsed_time": "12:18:01", "remaining_time": "21:53:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3906, "total_steps": 10853, "loss": 0.1672, "learning_rate": 3.7982806281303276e-06, "epoch": 0.3598839084166398, "percentage": 35.99, "elapsed_time": "12:18:13", "remaining_time": "21:52:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3907, "total_steps": 10853, "loss": 0.1436, "learning_rate": 3.797629559961719e-06, "epoch": 0.3599760445939098, "percentage": 36.0, "elapsed_time": "12:18:24", "remaining_time": "21:52:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3908, "total_steps": 10853, "loss": 0.1595, "learning_rate": 3.7969783713080665e-06, "epoch": 0.3600681807711798, "percentage": 36.01, "elapsed_time": "12:18:34", "remaining_time": "21:52:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3909, "total_steps": 10853, "loss": 0.1572, "learning_rate": 3.796327062229833e-06, "epoch": 0.3601603169484498, "percentage": 36.02, "elapsed_time": "12:18:45", "remaining_time": "21:52:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3910, "total_steps": 10853, "loss": 0.1623, "learning_rate": 3.7956756327874912e-06, "epoch": 0.3602524531257198, "percentage": 36.03, "elapsed_time": "12:18:57", "remaining_time": "21:52:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3911, "total_steps": 10853, "loss": 0.1594, "learning_rate": 3.7950240830415286e-06, "epoch": 0.3603445893029898, "percentage": 36.04, "elapsed_time": "12:19:08", "remaining_time": "21:51:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3912, "total_steps": 10853, "loss": 0.157, "learning_rate": 3.79437241305244e-06, "epoch": 0.36043672548025985, "percentage": 36.05, "elapsed_time": "12:19:18", "remaining_time": "21:51:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3913, "total_steps": 10853, "loss": 0.1491, "learning_rate": 3.7937206228807333e-06, "epoch": 0.36052886165752984, "percentage": 36.05, "elapsed_time": "12:19:29", "remaining_time": "21:51:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3914, "total_steps": 10853, "loss": 0.1456, "learning_rate": 3.793068712586928e-06, "epoch": 0.36062099783479984, "percentage": 36.06, "elapsed_time": "12:19:40", "remaining_time": "21:51:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3915, "total_steps": 10853, "loss": 0.1605, "learning_rate": 3.7924166822315535e-06, "epoch": 0.36071313401206984, "percentage": 36.07, "elapsed_time": "12:19:51", "remaining_time": "21:51:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3916, "total_steps": 10853, "loss": 0.1638, "learning_rate": 3.791764531875151e-06, "epoch": 0.36080527018933983, "percentage": 36.08, "elapsed_time": "12:20:00", "remaining_time": "21:50:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3917, "total_steps": 10853, "loss": 0.1557, "learning_rate": 3.7911122615782727e-06, "epoch": 0.36089740636660983, "percentage": 36.09, "elapsed_time": "12:20:12", "remaining_time": "21:50:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3918, "total_steps": 10853, "loss": 0.1624, "learning_rate": 3.790459871401482e-06, "epoch": 0.3609895425438799, "percentage": 36.1, "elapsed_time": "12:20:23", "remaining_time": "21:50:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3919, "total_steps": 10853, "loss": 0.1455, "learning_rate": 3.7898073614053527e-06, "epoch": 0.3610816787211499, "percentage": 36.11, "elapsed_time": "12:20:34", "remaining_time": "21:50:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3920, "total_steps": 10853, "loss": 0.146, "learning_rate": 3.7891547316504716e-06, "epoch": 0.3611738148984199, "percentage": 36.12, "elapsed_time": "12:20:47", "remaining_time": "21:50:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3921, "total_steps": 10853, "loss": 0.1392, "learning_rate": 3.788501982197435e-06, "epoch": 0.3612659510756899, "percentage": 36.13, "elapsed_time": "12:20:58", "remaining_time": "21:49:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3922, "total_steps": 10853, "loss": 0.159, "learning_rate": 3.787849113106851e-06, "epoch": 0.36135808725295987, "percentage": 36.14, "elapsed_time": "12:21:09", "remaining_time": "21:49:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3923, "total_steps": 10853, "loss": 0.1694, "learning_rate": 3.787196124439337e-06, "epoch": 0.36145022343022987, "percentage": 36.15, "elapsed_time": "12:21:22", "remaining_time": "21:49:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3924, "total_steps": 10853, "loss": 0.1639, "learning_rate": 3.7865430162555255e-06, "epoch": 0.36154235960749986, "percentage": 36.16, "elapsed_time": "12:21:31", "remaining_time": "21:49:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3925, "total_steps": 10853, "loss": 0.1453, "learning_rate": 3.7858897886160562e-06, "epoch": 0.3616344957847699, "percentage": 36.17, "elapsed_time": "12:21:43", "remaining_time": "21:49:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3926, "total_steps": 10853, "loss": 0.1674, "learning_rate": 3.785236441581581e-06, "epoch": 0.3617266319620399, "percentage": 36.17, "elapsed_time": "12:21:54", "remaining_time": "21:49:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3927, "total_steps": 10853, "loss": 0.1456, "learning_rate": 3.784582975212765e-06, "epoch": 0.3618187681393099, "percentage": 36.18, "elapsed_time": "12:22:05", "remaining_time": "21:48:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3928, "total_steps": 10853, "loss": 0.1455, "learning_rate": 3.783929389570281e-06, "epoch": 0.3619109043165799, "percentage": 36.19, "elapsed_time": "12:22:14", "remaining_time": "21:48:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3929, "total_steps": 10853, "loss": 0.1616, "learning_rate": 3.7832756847148146e-06, "epoch": 0.3620030404938499, "percentage": 36.2, "elapsed_time": "12:22:25", "remaining_time": "21:48:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3930, "total_steps": 10853, "loss": 0.1725, "learning_rate": 3.782621860707063e-06, "epoch": 0.3620951766711199, "percentage": 36.21, "elapsed_time": "12:22:35", "remaining_time": "21:48:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3931, "total_steps": 10853, "loss": 0.1351, "learning_rate": 3.781967917607734e-06, "epoch": 0.3621873128483899, "percentage": 36.22, "elapsed_time": "12:22:46", "remaining_time": "21:47:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3932, "total_steps": 10853, "loss": 0.1477, "learning_rate": 3.7813138554775454e-06, "epoch": 0.36227944902565995, "percentage": 36.23, "elapsed_time": "12:22:56", "remaining_time": "21:47:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3933, "total_steps": 10853, "loss": 0.1596, "learning_rate": 3.780659674377227e-06, "epoch": 0.36237158520292995, "percentage": 36.24, "elapsed_time": "12:23:09", "remaining_time": "21:47:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3934, "total_steps": 10853, "loss": 0.1419, "learning_rate": 3.7800053743675213e-06, "epoch": 0.36246372138019994, "percentage": 36.25, "elapsed_time": "12:23:20", "remaining_time": "21:47:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3935, "total_steps": 10853, "loss": 0.1565, "learning_rate": 3.779350955509178e-06, "epoch": 0.36255585755746994, "percentage": 36.26, "elapsed_time": "12:23:30", "remaining_time": "21:47:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3936, "total_steps": 10853, "loss": 0.1398, "learning_rate": 3.7786964178629613e-06, "epoch": 0.36264799373473994, "percentage": 36.27, "elapsed_time": "12:23:41", "remaining_time": "21:46:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3937, "total_steps": 10853, "loss": 0.1573, "learning_rate": 3.7780417614896438e-06, "epoch": 0.36274012991200993, "percentage": 36.28, "elapsed_time": "12:23:52", "remaining_time": "21:46:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3938, "total_steps": 10853, "loss": 0.1549, "learning_rate": 3.777386986450012e-06, "epoch": 0.36283226608927993, "percentage": 36.28, "elapsed_time": "12:24:05", "remaining_time": "21:46:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3939, "total_steps": 10853, "loss": 0.1537, "learning_rate": 3.77673209280486e-06, "epoch": 0.36292440226655, "percentage": 36.29, "elapsed_time": "12:24:17", "remaining_time": "21:46:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3940, "total_steps": 10853, "loss": 0.14, "learning_rate": 3.776077080614997e-06, "epoch": 0.36301653844382, "percentage": 36.3, "elapsed_time": "12:24:27", "remaining_time": "21:46:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3941, "total_steps": 10853, "loss": 0.1416, "learning_rate": 3.7754219499412393e-06, "epoch": 0.36310867462109, "percentage": 36.31, "elapsed_time": "12:24:37", "remaining_time": "21:45:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3942, "total_steps": 10853, "loss": 0.1442, "learning_rate": 3.7747667008444154e-06, "epoch": 0.36320081079836, "percentage": 36.32, "elapsed_time": "12:24:48", "remaining_time": "21:45:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3943, "total_steps": 10853, "loss": 0.1625, "learning_rate": 3.7741113333853673e-06, "epoch": 0.36329294697562997, "percentage": 36.33, "elapsed_time": "12:25:00", "remaining_time": "21:45:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3944, "total_steps": 10853, "loss": 0.1602, "learning_rate": 3.773455847624944e-06, "epoch": 0.36338508315289997, "percentage": 36.34, "elapsed_time": "12:25:10", "remaining_time": "21:45:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3945, "total_steps": 10853, "loss": 0.1449, "learning_rate": 3.7728002436240086e-06, "epoch": 0.36347721933016996, "percentage": 36.35, "elapsed_time": "12:25:20", "remaining_time": "21:45:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3946, "total_steps": 10853, "loss": 0.1466, "learning_rate": 3.772144521443434e-06, "epoch": 0.36356935550744, "percentage": 36.36, "elapsed_time": "12:25:31", "remaining_time": "21:44:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3947, "total_steps": 10853, "loss": 0.1544, "learning_rate": 3.7714886811441033e-06, "epoch": 0.36366149168471, "percentage": 36.37, "elapsed_time": "12:25:41", "remaining_time": "21:44:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3948, "total_steps": 10853, "loss": 0.1619, "learning_rate": 3.7708327227869113e-06, "epoch": 0.36375362786198, "percentage": 36.38, "elapsed_time": "12:25:53", "remaining_time": "21:44:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3949, "total_steps": 10853, "loss": 0.1611, "learning_rate": 3.770176646432765e-06, "epoch": 0.36384576403925, "percentage": 36.39, "elapsed_time": "12:26:02", "remaining_time": "21:44:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3950, "total_steps": 10853, "loss": 0.1474, "learning_rate": 3.76952045214258e-06, "epoch": 0.36393790021652, "percentage": 36.4, "elapsed_time": "12:26:12", "remaining_time": "21:44:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3951, "total_steps": 10853, "loss": 0.1556, "learning_rate": 3.7688641399772842e-06, "epoch": 0.36403003639379, "percentage": 36.4, "elapsed_time": "12:26:24", "remaining_time": "21:43:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3952, "total_steps": 10853, "loss": 0.1646, "learning_rate": 3.7682077099978163e-06, "epoch": 0.36412217257106005, "percentage": 36.41, "elapsed_time": "12:26:35", "remaining_time": "21:43:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3953, "total_steps": 10853, "loss": 0.1535, "learning_rate": 3.767551162265126e-06, "epoch": 0.36421430874833005, "percentage": 36.42, "elapsed_time": "12:26:45", "remaining_time": "21:43:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3954, "total_steps": 10853, "loss": 0.1544, "learning_rate": 3.7668944968401743e-06, "epoch": 0.36430644492560005, "percentage": 36.43, "elapsed_time": "12:26:56", "remaining_time": "21:43:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3955, "total_steps": 10853, "loss": 0.1442, "learning_rate": 3.7662377137839323e-06, "epoch": 0.36439858110287005, "percentage": 36.44, "elapsed_time": "12:27:06", "remaining_time": "21:43:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3956, "total_steps": 10853, "loss": 0.1511, "learning_rate": 3.7655808131573823e-06, "epoch": 0.36449071728014004, "percentage": 36.45, "elapsed_time": "12:27:16", "remaining_time": "21:42:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3957, "total_steps": 10853, "loss": 0.1387, "learning_rate": 3.7649237950215178e-06, "epoch": 0.36458285345741004, "percentage": 36.46, "elapsed_time": "12:27:27", "remaining_time": "21:42:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3958, "total_steps": 10853, "loss": 0.1752, "learning_rate": 3.764266659437342e-06, "epoch": 0.36467498963468004, "percentage": 36.47, "elapsed_time": "12:27:38", "remaining_time": "21:42:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3959, "total_steps": 10853, "loss": 0.1442, "learning_rate": 3.763609406465872e-06, "epoch": 0.3647671258119501, "percentage": 36.48, "elapsed_time": "12:27:49", "remaining_time": "21:42:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3960, "total_steps": 10853, "loss": 0.1613, "learning_rate": 3.7629520361681317e-06, "epoch": 0.3648592619892201, "percentage": 36.49, "elapsed_time": "12:27:59", "remaining_time": "21:41:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3961, "total_steps": 10853, "loss": 0.1412, "learning_rate": 3.7622945486051585e-06, "epoch": 0.3649513981664901, "percentage": 36.5, "elapsed_time": "12:28:09", "remaining_time": "21:41:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3962, "total_steps": 10853, "loss": 0.1592, "learning_rate": 3.7616369438380014e-06, "epoch": 0.3650435343437601, "percentage": 36.51, "elapsed_time": "12:28:20", "remaining_time": "21:41:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3963, "total_steps": 10853, "loss": 0.1501, "learning_rate": 3.760979221927718e-06, "epoch": 0.3651356705210301, "percentage": 36.52, "elapsed_time": "12:28:29", "remaining_time": "21:41:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3964, "total_steps": 10853, "loss": 0.1633, "learning_rate": 3.760321382935378e-06, "epoch": 0.3652278066983001, "percentage": 36.52, "elapsed_time": "12:28:41", "remaining_time": "21:41:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3965, "total_steps": 10853, "loss": 0.1406, "learning_rate": 3.759663426922062e-06, "epoch": 0.36531994287557007, "percentage": 36.53, "elapsed_time": "12:28:51", "remaining_time": "21:40:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3966, "total_steps": 10853, "loss": 0.1573, "learning_rate": 3.7590053539488613e-06, "epoch": 0.3654120790528401, "percentage": 36.54, "elapsed_time": "12:29:02", "remaining_time": "21:40:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3967, "total_steps": 10853, "loss": 0.1561, "learning_rate": 3.758347164076879e-06, "epoch": 0.3655042152301101, "percentage": 36.55, "elapsed_time": "12:29:14", "remaining_time": "21:40:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3968, "total_steps": 10853, "loss": 0.1592, "learning_rate": 3.7576888573672254e-06, "epoch": 0.3655963514073801, "percentage": 36.56, "elapsed_time": "12:29:25", "remaining_time": "21:40:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3969, "total_steps": 10853, "loss": 0.1468, "learning_rate": 3.757030433881027e-06, "epoch": 0.3656884875846501, "percentage": 36.57, "elapsed_time": "12:29:36", "remaining_time": "21:40:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3970, "total_steps": 10853, "loss": 0.1567, "learning_rate": 3.7563718936794176e-06, "epoch": 0.3657806237619201, "percentage": 36.58, "elapsed_time": "12:29:47", "remaining_time": "21:39:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3971, "total_steps": 10853, "loss": 0.1589, "learning_rate": 3.755713236823542e-06, "epoch": 0.3658727599391901, "percentage": 36.59, "elapsed_time": "12:29:58", "remaining_time": "21:39:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3972, "total_steps": 10853, "loss": 0.1525, "learning_rate": 3.755054463374558e-06, "epoch": 0.3659648961164601, "percentage": 36.6, "elapsed_time": "12:30:09", "remaining_time": "21:39:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3973, "total_steps": 10853, "loss": 0.1728, "learning_rate": 3.754395573393631e-06, "epoch": 0.36605703229373016, "percentage": 36.61, "elapsed_time": "12:30:19", "remaining_time": "21:39:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3974, "total_steps": 10853, "loss": 0.1518, "learning_rate": 3.7537365669419413e-06, "epoch": 0.36614916847100015, "percentage": 36.62, "elapsed_time": "12:30:30", "remaining_time": "21:39:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3975, "total_steps": 10853, "loss": 0.1473, "learning_rate": 3.7530774440806757e-06, "epoch": 0.36624130464827015, "percentage": 36.63, "elapsed_time": "12:30:42", "remaining_time": "21:38:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3976, "total_steps": 10853, "loss": 0.1439, "learning_rate": 3.7524182048710343e-06, "epoch": 0.36633344082554015, "percentage": 36.64, "elapsed_time": "12:30:52", "remaining_time": "21:38:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3977, "total_steps": 10853, "loss": 0.1413, "learning_rate": 3.751758849374228e-06, "epoch": 0.36642557700281014, "percentage": 36.64, "elapsed_time": "12:31:02", "remaining_time": "21:38:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3978, "total_steps": 10853, "loss": 0.1513, "learning_rate": 3.7510993776514786e-06, "epoch": 0.36651771318008014, "percentage": 36.65, "elapsed_time": "12:31:14", "remaining_time": "21:38:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3979, "total_steps": 10853, "loss": 0.1499, "learning_rate": 3.7504397897640165e-06, "epoch": 0.36660984935735014, "percentage": 36.66, "elapsed_time": "12:31:25", "remaining_time": "21:38:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3980, "total_steps": 10853, "loss": 0.1526, "learning_rate": 3.7497800857730854e-06, "epoch": 0.3667019855346202, "percentage": 36.67, "elapsed_time": "12:31:36", "remaining_time": "21:37:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3981, "total_steps": 10853, "loss": 0.1416, "learning_rate": 3.749120265739939e-06, "epoch": 0.3667941217118902, "percentage": 36.68, "elapsed_time": "12:31:47", "remaining_time": "21:37:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3982, "total_steps": 10853, "loss": 0.1526, "learning_rate": 3.7484603297258413e-06, "epoch": 0.3668862578891602, "percentage": 36.69, "elapsed_time": "12:31:59", "remaining_time": "21:37:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3983, "total_steps": 10853, "loss": 0.1547, "learning_rate": 3.747800277792068e-06, "epoch": 0.3669783940664302, "percentage": 36.7, "elapsed_time": "12:32:09", "remaining_time": "21:37:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3984, "total_steps": 10853, "loss": 0.152, "learning_rate": 3.7471401099999044e-06, "epoch": 0.3670705302437002, "percentage": 36.71, "elapsed_time": "12:32:20", "remaining_time": "21:37:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3985, "total_steps": 10853, "loss": 0.1546, "learning_rate": 3.7464798264106474e-06, "epoch": 0.3671626664209702, "percentage": 36.72, "elapsed_time": "12:32:30", "remaining_time": "21:36:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3986, "total_steps": 10853, "loss": 0.1496, "learning_rate": 3.7458194270856046e-06, "epoch": 0.3672548025982402, "percentage": 36.73, "elapsed_time": "12:32:40", "remaining_time": "21:36:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3987, "total_steps": 10853, "loss": 0.166, "learning_rate": 3.745158912086093e-06, "epoch": 0.3673469387755102, "percentage": 36.74, "elapsed_time": "12:32:51", "remaining_time": "21:36:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3988, "total_steps": 10853, "loss": 0.1558, "learning_rate": 3.744498281473443e-06, "epoch": 0.3674390749527802, "percentage": 36.75, "elapsed_time": "12:33:01", "remaining_time": "21:36:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3989, "total_steps": 10853, "loss": 0.1401, "learning_rate": 3.743837535308994e-06, "epoch": 0.3675312111300502, "percentage": 36.75, "elapsed_time": "12:33:10", "remaining_time": "21:36:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3990, "total_steps": 10853, "loss": 0.1482, "learning_rate": 3.7431766736540958e-06, "epoch": 0.3676233473073202, "percentage": 36.76, "elapsed_time": "12:33:20", "remaining_time": "21:35:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3991, "total_steps": 10853, "loss": 0.1511, "learning_rate": 3.74251569657011e-06, "epoch": 0.3677154834845902, "percentage": 36.77, "elapsed_time": "12:33:30", "remaining_time": "21:35:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3992, "total_steps": 10853, "loss": 0.1467, "learning_rate": 3.7418546041184074e-06, "epoch": 0.3678076196618602, "percentage": 36.78, "elapsed_time": "12:33:40", "remaining_time": "21:35:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3993, "total_steps": 10853, "loss": 0.1655, "learning_rate": 3.7411933963603706e-06, "epoch": 0.36789975583913026, "percentage": 36.79, "elapsed_time": "12:33:52", "remaining_time": "21:35:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3994, "total_steps": 10853, "loss": 0.1433, "learning_rate": 3.7405320733573948e-06, "epoch": 0.36799189201640026, "percentage": 36.8, "elapsed_time": "12:34:01", "remaining_time": "21:34:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3995, "total_steps": 10853, "loss": 0.1674, "learning_rate": 3.739870635170881e-06, "epoch": 0.36808402819367025, "percentage": 36.81, "elapsed_time": "12:34:12", "remaining_time": "21:34:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3996, "total_steps": 10853, "loss": 0.1408, "learning_rate": 3.739209081862247e-06, "epoch": 0.36817616437094025, "percentage": 36.82, "elapsed_time": "12:34:24", "remaining_time": "21:34:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3997, "total_steps": 10853, "loss": 0.1445, "learning_rate": 3.738547413492916e-06, "epoch": 0.36826830054821025, "percentage": 36.83, "elapsed_time": "12:34:34", "remaining_time": "21:34:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3998, "total_steps": 10853, "loss": 0.1558, "learning_rate": 3.7378856301243233e-06, "epoch": 0.36836043672548024, "percentage": 36.84, "elapsed_time": "12:34:45", "remaining_time": "21:34:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3999, "total_steps": 10853, "loss": 0.1533, "learning_rate": 3.7372237318179172e-06, "epoch": 0.36845257290275024, "percentage": 36.85, "elapsed_time": "12:34:56", "remaining_time": "21:33:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4000, "total_steps": 10853, "loss": 0.1403, "learning_rate": 3.7365617186351538e-06, "epoch": 0.3685447090800203, "percentage": 36.86, "elapsed_time": "12:35:06", "remaining_time": "21:33:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4000, "total_steps": 10853, "eval_loss": 0.15275675058364868, "epoch": 0.3685447090800203, "percentage": 36.86, "elapsed_time": "12:40:06", "remaining_time": "21:42:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4001, "total_steps": 10853, "loss": 0.1374, "learning_rate": 3.735899590637503e-06, "epoch": 0.3686368452572903, "percentage": 36.87, "elapsed_time": "12:40:17", "remaining_time": "21:42:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4002, "total_steps": 10853, "loss": 0.141, "learning_rate": 3.735237347886441e-06, "epoch": 0.3687289814345603, "percentage": 36.87, "elapsed_time": "12:40:27", "remaining_time": "21:41:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4003, "total_steps": 10853, "loss": 0.1463, "learning_rate": 3.7345749904434593e-06, "epoch": 0.3688211176118303, "percentage": 36.88, "elapsed_time": "12:40:37", "remaining_time": "21:41:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4004, "total_steps": 10853, "loss": 0.1416, "learning_rate": 3.733912518370056e-06, "epoch": 0.3689132537891003, "percentage": 36.89, "elapsed_time": "12:40:48", "remaining_time": "21:41:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4005, "total_steps": 10853, "loss": 0.1514, "learning_rate": 3.7332499317277432e-06, "epoch": 0.3690053899663703, "percentage": 36.9, "elapsed_time": "12:40:58", "remaining_time": "21:41:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4006, "total_steps": 10853, "loss": 0.1498, "learning_rate": 3.732587230578041e-06, "epoch": 0.3690975261436403, "percentage": 36.91, "elapsed_time": "12:41:08", "remaining_time": "21:40:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4007, "total_steps": 10853, "loss": 0.1502, "learning_rate": 3.7319244149824825e-06, "epoch": 0.36918966232091033, "percentage": 36.92, "elapsed_time": "12:41:20", "remaining_time": "21:40:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4008, "total_steps": 10853, "loss": 0.1647, "learning_rate": 3.7312614850026086e-06, "epoch": 0.3692817984981803, "percentage": 36.93, "elapsed_time": "12:41:30", "remaining_time": "21:40:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4009, "total_steps": 10853, "loss": 0.1508, "learning_rate": 3.730598440699974e-06, "epoch": 0.3693739346754503, "percentage": 36.94, "elapsed_time": "12:41:40", "remaining_time": "21:40:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4010, "total_steps": 10853, "loss": 0.1527, "learning_rate": 3.729935282136142e-06, "epoch": 0.3694660708527203, "percentage": 36.95, "elapsed_time": "12:41:51", "remaining_time": "21:40:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4011, "total_steps": 10853, "loss": 0.1528, "learning_rate": 3.729272009372686e-06, "epoch": 0.3695582070299903, "percentage": 36.96, "elapsed_time": "12:42:03", "remaining_time": "21:39:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4012, "total_steps": 10853, "loss": 0.1455, "learning_rate": 3.7286086224711916e-06, "epoch": 0.3696503432072603, "percentage": 36.97, "elapsed_time": "12:42:14", "remaining_time": "21:39:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4013, "total_steps": 10853, "loss": 0.1496, "learning_rate": 3.727945121493255e-06, "epoch": 0.3697424793845303, "percentage": 36.98, "elapsed_time": "12:42:24", "remaining_time": "21:39:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4014, "total_steps": 10853, "loss": 0.1641, "learning_rate": 3.7272815065004808e-06, "epoch": 0.36983461556180036, "percentage": 36.99, "elapsed_time": "12:42:34", "remaining_time": "21:39:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4015, "total_steps": 10853, "loss": 0.1511, "learning_rate": 3.7266177775544877e-06, "epoch": 0.36992675173907036, "percentage": 36.99, "elapsed_time": "12:42:44", "remaining_time": "21:39:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4016, "total_steps": 10853, "loss": 0.1371, "learning_rate": 3.7259539347169015e-06, "epoch": 0.37001888791634036, "percentage": 37.0, "elapsed_time": "12:42:56", "remaining_time": "21:38:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4017, "total_steps": 10853, "loss": 0.1519, "learning_rate": 3.72528997804936e-06, "epoch": 0.37011102409361035, "percentage": 37.01, "elapsed_time": "12:43:07", "remaining_time": "21:38:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4018, "total_steps": 10853, "loss": 0.1565, "learning_rate": 3.724625907613513e-06, "epoch": 0.37020316027088035, "percentage": 37.02, "elapsed_time": "12:43:16", "remaining_time": "21:38:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4019, "total_steps": 10853, "loss": 0.1413, "learning_rate": 3.7239617234710185e-06, "epoch": 0.37029529644815035, "percentage": 37.03, "elapsed_time": "12:43:29", "remaining_time": "21:38:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4020, "total_steps": 10853, "loss": 0.1433, "learning_rate": 3.7232974256835457e-06, "epoch": 0.3703874326254204, "percentage": 37.04, "elapsed_time": "12:43:37", "remaining_time": "21:37:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4021, "total_steps": 10853, "loss": 0.1468, "learning_rate": 3.7226330143127765e-06, "epoch": 0.3704795688026904, "percentage": 37.05, "elapsed_time": "12:43:48", "remaining_time": "21:37:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4022, "total_steps": 10853, "loss": 0.1358, "learning_rate": 3.721968489420399e-06, "epoch": 0.3705717049799604, "percentage": 37.06, "elapsed_time": "12:43:58", "remaining_time": "21:37:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4023, "total_steps": 10853, "loss": 0.1602, "learning_rate": 3.721303851068116e-06, "epoch": 0.3706638411572304, "percentage": 37.07, "elapsed_time": "12:44:09", "remaining_time": "21:37:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4024, "total_steps": 10853, "loss": 0.1414, "learning_rate": 3.7206390993176395e-06, "epoch": 0.3707559773345004, "percentage": 37.08, "elapsed_time": "12:44:20", "remaining_time": "21:37:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4025, "total_steps": 10853, "loss": 0.1542, "learning_rate": 3.719974234230691e-06, "epoch": 0.3708481135117704, "percentage": 37.09, "elapsed_time": "12:44:30", "remaining_time": "21:36:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4026, "total_steps": 10853, "loss": 0.1479, "learning_rate": 3.7193092558690036e-06, "epoch": 0.3709402496890404, "percentage": 37.1, "elapsed_time": "12:44:40", "remaining_time": "21:36:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4027, "total_steps": 10853, "loss": 0.1483, "learning_rate": 3.7186441642943206e-06, "epoch": 0.37103238586631043, "percentage": 37.1, "elapsed_time": "12:44:51", "remaining_time": "21:36:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4028, "total_steps": 10853, "loss": 0.1474, "learning_rate": 3.7179789595683954e-06, "epoch": 0.37112452204358043, "percentage": 37.11, "elapsed_time": "12:45:00", "remaining_time": "21:36:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4029, "total_steps": 10853, "loss": 0.147, "learning_rate": 3.717313641752993e-06, "epoch": 0.3712166582208504, "percentage": 37.12, "elapsed_time": "12:45:11", "remaining_time": "21:36:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4030, "total_steps": 10853, "loss": 0.1558, "learning_rate": 3.7166482109098878e-06, "epoch": 0.3713087943981204, "percentage": 37.13, "elapsed_time": "12:45:22", "remaining_time": "21:35:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4031, "total_steps": 10853, "loss": 0.1637, "learning_rate": 3.715982667100866e-06, "epoch": 0.3714009305753904, "percentage": 37.14, "elapsed_time": "12:45:33", "remaining_time": "21:35:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4032, "total_steps": 10853, "loss": 0.1431, "learning_rate": 3.7153170103877216e-06, "epoch": 0.3714930667526604, "percentage": 37.15, "elapsed_time": "12:45:44", "remaining_time": "21:35:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4033, "total_steps": 10853, "loss": 0.1652, "learning_rate": 3.7146512408322623e-06, "epoch": 0.3715852029299304, "percentage": 37.16, "elapsed_time": "12:45:55", "remaining_time": "21:35:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4034, "total_steps": 10853, "loss": 0.1552, "learning_rate": 3.7139853584963054e-06, "epoch": 0.37167733910720047, "percentage": 37.17, "elapsed_time": "12:46:05", "remaining_time": "21:34:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4035, "total_steps": 10853, "loss": 0.148, "learning_rate": 3.7133193634416766e-06, "epoch": 0.37176947528447046, "percentage": 37.18, "elapsed_time": "12:46:15", "remaining_time": "21:34:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4036, "total_steps": 10853, "loss": 0.1667, "learning_rate": 3.7126532557302144e-06, "epoch": 0.37186161146174046, "percentage": 37.19, "elapsed_time": "12:46:27", "remaining_time": "21:34:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4037, "total_steps": 10853, "loss": 0.1566, "learning_rate": 3.711987035423767e-06, "epoch": 0.37195374763901046, "percentage": 37.2, "elapsed_time": "12:46:37", "remaining_time": "21:34:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4038, "total_steps": 10853, "loss": 0.154, "learning_rate": 3.711320702584193e-06, "epoch": 0.37204588381628045, "percentage": 37.21, "elapsed_time": "12:46:46", "remaining_time": "21:34:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4039, "total_steps": 10853, "loss": 0.1507, "learning_rate": 3.710654257273361e-06, "epoch": 0.37213801999355045, "percentage": 37.22, "elapsed_time": "12:46:57", "remaining_time": "21:33:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4040, "total_steps": 10853, "loss": 0.1568, "learning_rate": 3.7099876995531515e-06, "epoch": 0.37223015617082045, "percentage": 37.22, "elapsed_time": "12:47:07", "remaining_time": "21:33:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4041, "total_steps": 10853, "loss": 0.1596, "learning_rate": 3.709321029485453e-06, "epoch": 0.3723222923480905, "percentage": 37.23, "elapsed_time": "12:47:18", "remaining_time": "21:33:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4042, "total_steps": 10853, "loss": 0.1473, "learning_rate": 3.708654247132168e-06, "epoch": 0.3724144285253605, "percentage": 37.24, "elapsed_time": "12:47:29", "remaining_time": "21:33:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4043, "total_steps": 10853, "loss": 0.1471, "learning_rate": 3.7079873525552053e-06, "epoch": 0.3725065647026305, "percentage": 37.25, "elapsed_time": "12:47:40", "remaining_time": "21:33:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4044, "total_steps": 10853, "loss": 0.151, "learning_rate": 3.707320345816487e-06, "epoch": 0.3725987008799005, "percentage": 37.26, "elapsed_time": "12:47:51", "remaining_time": "21:32:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4045, "total_steps": 10853, "loss": 0.142, "learning_rate": 3.7066532269779444e-06, "epoch": 0.3726908370571705, "percentage": 37.27, "elapsed_time": "12:48:01", "remaining_time": "21:32:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4046, "total_steps": 10853, "loss": 0.1437, "learning_rate": 3.7059859961015205e-06, "epoch": 0.3727829732344405, "percentage": 37.28, "elapsed_time": "12:48:11", "remaining_time": "21:32:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4047, "total_steps": 10853, "loss": 0.1624, "learning_rate": 3.705318653249166e-06, "epoch": 0.3728751094117105, "percentage": 37.29, "elapsed_time": "12:48:22", "remaining_time": "21:32:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4048, "total_steps": 10853, "loss": 0.151, "learning_rate": 3.704651198482846e-06, "epoch": 0.37296724558898053, "percentage": 37.3, "elapsed_time": "12:48:33", "remaining_time": "21:32:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4049, "total_steps": 10853, "loss": 0.1651, "learning_rate": 3.703983631864532e-06, "epoch": 0.37305938176625053, "percentage": 37.31, "elapsed_time": "12:48:44", "remaining_time": "21:31:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4050, "total_steps": 10853, "loss": 0.1457, "learning_rate": 3.703315953456208e-06, "epoch": 0.3731515179435205, "percentage": 37.32, "elapsed_time": "12:48:56", "remaining_time": "21:31:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4051, "total_steps": 10853, "loss": 0.1631, "learning_rate": 3.7026481633198687e-06, "epoch": 0.3732436541207905, "percentage": 37.33, "elapsed_time": "12:49:06", "remaining_time": "21:31:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4052, "total_steps": 10853, "loss": 0.1661, "learning_rate": 3.701980261517518e-06, "epoch": 0.3733357902980605, "percentage": 37.34, "elapsed_time": "12:49:18", "remaining_time": "21:31:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4053, "total_steps": 10853, "loss": 0.1579, "learning_rate": 3.70131224811117e-06, "epoch": 0.3734279264753305, "percentage": 37.34, "elapsed_time": "12:49:29", "remaining_time": "21:31:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4054, "total_steps": 10853, "loss": 0.1474, "learning_rate": 3.7006441231628517e-06, "epoch": 0.37352006265260057, "percentage": 37.35, "elapsed_time": "12:49:38", "remaining_time": "21:30:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4055, "total_steps": 10853, "loss": 0.1638, "learning_rate": 3.699975886734596e-06, "epoch": 0.37361219882987057, "percentage": 37.36, "elapsed_time": "12:49:50", "remaining_time": "21:30:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4056, "total_steps": 10853, "loss": 0.1477, "learning_rate": 3.6993075388884507e-06, "epoch": 0.37370433500714056, "percentage": 37.37, "elapsed_time": "12:50:00", "remaining_time": "21:30:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4057, "total_steps": 10853, "loss": 0.1577, "learning_rate": 3.698639079686471e-06, "epoch": 0.37379647118441056, "percentage": 37.38, "elapsed_time": "12:50:11", "remaining_time": "21:30:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4058, "total_steps": 10853, "loss": 0.158, "learning_rate": 3.6979705091907244e-06, "epoch": 0.37388860736168056, "percentage": 37.39, "elapsed_time": "12:50:22", "remaining_time": "21:29:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4059, "total_steps": 10853, "loss": 0.1529, "learning_rate": 3.6973018274632865e-06, "epoch": 0.37398074353895056, "percentage": 37.4, "elapsed_time": "12:50:32", "remaining_time": "21:29:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4060, "total_steps": 10853, "loss": 0.157, "learning_rate": 3.696633034566245e-06, "epoch": 0.37407287971622055, "percentage": 37.41, "elapsed_time": "12:50:44", "remaining_time": "21:29:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4061, "total_steps": 10853, "loss": 0.1503, "learning_rate": 3.6959641305616984e-06, "epoch": 0.3741650158934906, "percentage": 37.42, "elapsed_time": "12:50:55", "remaining_time": "21:29:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4062, "total_steps": 10853, "loss": 0.1516, "learning_rate": 3.695295115511752e-06, "epoch": 0.3742571520707606, "percentage": 37.43, "elapsed_time": "12:51:04", "remaining_time": "21:29:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4063, "total_steps": 10853, "loss": 0.1631, "learning_rate": 3.694625989478527e-06, "epoch": 0.3743492882480306, "percentage": 37.44, "elapsed_time": "12:51:15", "remaining_time": "21:28:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4064, "total_steps": 10853, "loss": 0.1423, "learning_rate": 3.69395675252415e-06, "epoch": 0.3744414244253006, "percentage": 37.45, "elapsed_time": "12:51:26", "remaining_time": "21:28:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4065, "total_steps": 10853, "loss": 0.1411, "learning_rate": 3.6932874047107597e-06, "epoch": 0.3745335606025706, "percentage": 37.46, "elapsed_time": "12:51:37", "remaining_time": "21:28:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4066, "total_steps": 10853, "loss": 0.1569, "learning_rate": 3.6926179461005056e-06, "epoch": 0.3746256967798406, "percentage": 37.46, "elapsed_time": "12:51:48", "remaining_time": "21:28:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4067, "total_steps": 10853, "loss": 0.1572, "learning_rate": 3.691948376755547e-06, "epoch": 0.3747178329571106, "percentage": 37.47, "elapsed_time": "12:51:58", "remaining_time": "21:28:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4068, "total_steps": 10853, "loss": 0.1562, "learning_rate": 3.6912786967380528e-06, "epoch": 0.37480996913438064, "percentage": 37.48, "elapsed_time": "12:52:09", "remaining_time": "21:27:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4069, "total_steps": 10853, "loss": 0.1413, "learning_rate": 3.6906089061102043e-06, "epoch": 0.37490210531165064, "percentage": 37.49, "elapsed_time": "12:52:19", "remaining_time": "21:27:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4070, "total_steps": 10853, "loss": 0.1587, "learning_rate": 3.6899390049341893e-06, "epoch": 0.37499424148892063, "percentage": 37.5, "elapsed_time": "12:52:30", "remaining_time": "21:27:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4071, "total_steps": 10853, "loss": 0.1514, "learning_rate": 3.68926899327221e-06, "epoch": 0.37508637766619063, "percentage": 37.51, "elapsed_time": "12:52:40", "remaining_time": "21:27:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4072, "total_steps": 10853, "loss": 0.1583, "learning_rate": 3.6885988711864777e-06, "epoch": 0.3751785138434606, "percentage": 37.52, "elapsed_time": "12:52:51", "remaining_time": "21:27:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4073, "total_steps": 10853, "loss": 0.1512, "learning_rate": 3.6879286387392122e-06, "epoch": 0.3752706500207306, "percentage": 37.53, "elapsed_time": "12:53:04", "remaining_time": "21:26:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4074, "total_steps": 10853, "loss": 0.1334, "learning_rate": 3.687258295992644e-06, "epoch": 0.3753627861980006, "percentage": 37.54, "elapsed_time": "12:53:15", "remaining_time": "21:26:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4075, "total_steps": 10853, "loss": 0.1479, "learning_rate": 3.686587843009016e-06, "epoch": 0.37545492237527067, "percentage": 37.55, "elapsed_time": "12:53:26", "remaining_time": "21:26:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4076, "total_steps": 10853, "loss": 0.1606, "learning_rate": 3.685917279850578e-06, "epoch": 0.37554705855254067, "percentage": 37.56, "elapsed_time": "12:53:37", "remaining_time": "21:26:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4077, "total_steps": 10853, "loss": 0.1479, "learning_rate": 3.685246606579594e-06, "epoch": 0.37563919472981067, "percentage": 37.57, "elapsed_time": "12:53:47", "remaining_time": "21:26:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4078, "total_steps": 10853, "loss": 0.1553, "learning_rate": 3.684575823258334e-06, "epoch": 0.37573133090708066, "percentage": 37.57, "elapsed_time": "12:53:57", "remaining_time": "21:25:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4079, "total_steps": 10853, "loss": 0.1606, "learning_rate": 3.683904929949082e-06, "epoch": 0.37582346708435066, "percentage": 37.58, "elapsed_time": "12:54:09", "remaining_time": "21:25:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4080, "total_steps": 10853, "loss": 0.1512, "learning_rate": 3.68323392671413e-06, "epoch": 0.37591560326162066, "percentage": 37.59, "elapsed_time": "12:54:19", "remaining_time": "21:25:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4081, "total_steps": 10853, "loss": 0.1645, "learning_rate": 3.6825628136157805e-06, "epoch": 0.37600773943889065, "percentage": 37.6, "elapsed_time": "12:54:29", "remaining_time": "21:25:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4082, "total_steps": 10853, "loss": 0.1546, "learning_rate": 3.6818915907163456e-06, "epoch": 0.3760998756161607, "percentage": 37.61, "elapsed_time": "12:54:41", "remaining_time": "21:25:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4083, "total_steps": 10853, "loss": 0.1357, "learning_rate": 3.6812202580781507e-06, "epoch": 0.3761920117934307, "percentage": 37.62, "elapsed_time": "12:54:52", "remaining_time": "21:24:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4084, "total_steps": 10853, "loss": 0.1486, "learning_rate": 3.680548815763527e-06, "epoch": 0.3762841479707007, "percentage": 37.63, "elapsed_time": "12:55:05", "remaining_time": "21:24:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4085, "total_steps": 10853, "loss": 0.1452, "learning_rate": 3.6798772638348186e-06, "epoch": 0.3763762841479707, "percentage": 37.64, "elapsed_time": "12:55:16", "remaining_time": "21:24:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4086, "total_steps": 10853, "loss": 0.1593, "learning_rate": 3.679205602354379e-06, "epoch": 0.3764684203252407, "percentage": 37.65, "elapsed_time": "12:55:27", "remaining_time": "21:24:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4087, "total_steps": 10853, "loss": 0.17, "learning_rate": 3.6785338313845725e-06, "epoch": 0.3765605565025107, "percentage": 37.66, "elapsed_time": "12:55:38", "remaining_time": "21:24:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4088, "total_steps": 10853, "loss": 0.1476, "learning_rate": 3.677861950987773e-06, "epoch": 0.37665269267978074, "percentage": 37.67, "elapsed_time": "12:55:49", "remaining_time": "21:23:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4089, "total_steps": 10853, "loss": 0.1477, "learning_rate": 3.677189961226365e-06, "epoch": 0.37674482885705074, "percentage": 37.68, "elapsed_time": "12:56:00", "remaining_time": "21:23:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4090, "total_steps": 10853, "loss": 0.1616, "learning_rate": 3.6765178621627418e-06, "epoch": 0.37683696503432074, "percentage": 37.69, "elapsed_time": "12:56:11", "remaining_time": "21:23:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4091, "total_steps": 10853, "loss": 0.1403, "learning_rate": 3.675845653859309e-06, "epoch": 0.37692910121159073, "percentage": 37.69, "elapsed_time": "12:56:22", "remaining_time": "21:23:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4092, "total_steps": 10853, "loss": 0.1523, "learning_rate": 3.6751733363784804e-06, "epoch": 0.37702123738886073, "percentage": 37.7, "elapsed_time": "12:56:33", "remaining_time": "21:23:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4093, "total_steps": 10853, "loss": 0.1412, "learning_rate": 3.6745009097826813e-06, "epoch": 0.3771133735661307, "percentage": 37.71, "elapsed_time": "12:56:44", "remaining_time": "21:22:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4094, "total_steps": 10853, "loss": 0.1518, "learning_rate": 3.6738283741343463e-06, "epoch": 0.3772055097434007, "percentage": 37.72, "elapsed_time": "12:56:56", "remaining_time": "21:22:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4095, "total_steps": 10853, "loss": 0.156, "learning_rate": 3.6731557294959196e-06, "epoch": 0.3772976459206708, "percentage": 37.73, "elapsed_time": "12:57:09", "remaining_time": "21:22:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4096, "total_steps": 10853, "loss": 0.1567, "learning_rate": 3.6724829759298585e-06, "epoch": 0.3773897820979408, "percentage": 37.74, "elapsed_time": "12:57:20", "remaining_time": "21:22:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4097, "total_steps": 10853, "loss": 0.1514, "learning_rate": 3.671810113498626e-06, "epoch": 0.37748191827521077, "percentage": 37.75, "elapsed_time": "12:57:30", "remaining_time": "21:22:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4098, "total_steps": 10853, "loss": 0.1529, "learning_rate": 3.6711371422646984e-06, "epoch": 0.37757405445248077, "percentage": 37.76, "elapsed_time": "12:57:43", "remaining_time": "21:21:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4099, "total_steps": 10853, "loss": 0.1632, "learning_rate": 3.6704640622905617e-06, "epoch": 0.37766619062975076, "percentage": 37.77, "elapsed_time": "12:57:54", "remaining_time": "21:21:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4100, "total_steps": 10853, "loss": 0.1664, "learning_rate": 3.6697908736387105e-06, "epoch": 0.37775832680702076, "percentage": 37.78, "elapsed_time": "12:58:05", "remaining_time": "21:21:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4101, "total_steps": 10853, "loss": 0.1355, "learning_rate": 3.669117576371651e-06, "epoch": 0.37785046298429076, "percentage": 37.79, "elapsed_time": "12:58:16", "remaining_time": "21:21:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4102, "total_steps": 10853, "loss": 0.1607, "learning_rate": 3.668444170551898e-06, "epoch": 0.3779425991615608, "percentage": 37.8, "elapsed_time": "12:58:27", "remaining_time": "21:21:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4103, "total_steps": 10853, "loss": 0.1641, "learning_rate": 3.6677706562419784e-06, "epoch": 0.3780347353388308, "percentage": 37.81, "elapsed_time": "12:58:37", "remaining_time": "21:20:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4104, "total_steps": 10853, "loss": 0.1692, "learning_rate": 3.667097033504428e-06, "epoch": 0.3781268715161008, "percentage": 37.81, "elapsed_time": "12:58:48", "remaining_time": "21:20:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4105, "total_steps": 10853, "loss": 0.1667, "learning_rate": 3.666423302401792e-06, "epoch": 0.3782190076933708, "percentage": 37.82, "elapsed_time": "12:58:59", "remaining_time": "21:20:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4106, "total_steps": 10853, "loss": 0.144, "learning_rate": 3.6657494629966274e-06, "epoch": 0.3783111438706408, "percentage": 37.83, "elapsed_time": "12:59:09", "remaining_time": "21:20:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4107, "total_steps": 10853, "loss": 0.1451, "learning_rate": 3.6650755153514993e-06, "epoch": 0.3784032800479108, "percentage": 37.84, "elapsed_time": "12:59:21", "remaining_time": "21:20:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4108, "total_steps": 10853, "loss": 0.1522, "learning_rate": 3.664401459528984e-06, "epoch": 0.3784954162251808, "percentage": 37.85, "elapsed_time": "12:59:31", "remaining_time": "21:19:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4109, "total_steps": 10853, "loss": 0.1603, "learning_rate": 3.663727295591668e-06, "epoch": 0.37858755240245084, "percentage": 37.86, "elapsed_time": "12:59:42", "remaining_time": "21:19:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4110, "total_steps": 10853, "loss": 0.1527, "learning_rate": 3.6630530236021478e-06, "epoch": 0.37867968857972084, "percentage": 37.87, "elapsed_time": "12:59:53", "remaining_time": "21:19:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4111, "total_steps": 10853, "loss": 0.1487, "learning_rate": 3.6623786436230287e-06, "epoch": 0.37877182475699084, "percentage": 37.88, "elapsed_time": "13:00:03", "remaining_time": "21:19:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4112, "total_steps": 10853, "loss": 0.1429, "learning_rate": 3.6617041557169282e-06, "epoch": 0.37886396093426083, "percentage": 37.89, "elapsed_time": "13:00:14", "remaining_time": "21:19:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4113, "total_steps": 10853, "loss": 0.1474, "learning_rate": 3.6610295599464707e-06, "epoch": 0.37895609711153083, "percentage": 37.9, "elapsed_time": "13:00:25", "remaining_time": "21:18:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4114, "total_steps": 10853, "loss": 0.1462, "learning_rate": 3.660354856374294e-06, "epoch": 0.37904823328880083, "percentage": 37.91, "elapsed_time": "13:00:37", "remaining_time": "21:18:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4115, "total_steps": 10853, "loss": 0.1488, "learning_rate": 3.6596800450630445e-06, "epoch": 0.3791403694660708, "percentage": 37.92, "elapsed_time": "13:00:47", "remaining_time": "21:18:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4116, "total_steps": 10853, "loss": 0.1606, "learning_rate": 3.659005126075377e-06, "epoch": 0.3792325056433409, "percentage": 37.92, "elapsed_time": "13:00:58", "remaining_time": "21:18:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4117, "total_steps": 10853, "loss": 0.1618, "learning_rate": 3.65833009947396e-06, "epoch": 0.3793246418206109, "percentage": 37.93, "elapsed_time": "13:01:07", "remaining_time": "21:18:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4118, "total_steps": 10853, "loss": 0.151, "learning_rate": 3.657654965321468e-06, "epoch": 0.37941677799788087, "percentage": 37.94, "elapsed_time": "13:01:18", "remaining_time": "21:17:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4119, "total_steps": 10853, "loss": 0.1531, "learning_rate": 3.6569797236805877e-06, "epoch": 0.37950891417515087, "percentage": 37.95, "elapsed_time": "13:01:28", "remaining_time": "21:17:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4120, "total_steps": 10853, "loss": 0.1608, "learning_rate": 3.656304374614016e-06, "epoch": 0.37960105035242087, "percentage": 37.96, "elapsed_time": "13:01:39", "remaining_time": "21:17:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4121, "total_steps": 10853, "loss": 0.1614, "learning_rate": 3.6556289181844582e-06, "epoch": 0.37969318652969086, "percentage": 37.97, "elapsed_time": "13:01:51", "remaining_time": "21:17:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4122, "total_steps": 10853, "loss": 0.1658, "learning_rate": 3.654953354454631e-06, "epoch": 0.3797853227069609, "percentage": 37.98, "elapsed_time": "13:02:03", "remaining_time": "21:17:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4123, "total_steps": 10853, "loss": 0.1318, "learning_rate": 3.654277683487261e-06, "epoch": 0.3798774588842309, "percentage": 37.99, "elapsed_time": "13:02:14", "remaining_time": "21:16:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4124, "total_steps": 10853, "loss": 0.161, "learning_rate": 3.6536019053450834e-06, "epoch": 0.3799695950615009, "percentage": 38.0, "elapsed_time": "13:02:24", "remaining_time": "21:16:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4125, "total_steps": 10853, "loss": 0.1518, "learning_rate": 3.652926020090845e-06, "epoch": 0.3800617312387709, "percentage": 38.01, "elapsed_time": "13:02:33", "remaining_time": "21:16:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4126, "total_steps": 10853, "loss": 0.1413, "learning_rate": 3.6522500277873017e-06, "epoch": 0.3801538674160409, "percentage": 38.02, "elapsed_time": "13:02:43", "remaining_time": "21:16:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4127, "total_steps": 10853, "loss": 0.1545, "learning_rate": 3.651573928497219e-06, "epoch": 0.3802460035933109, "percentage": 38.03, "elapsed_time": "13:02:53", "remaining_time": "21:15:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4128, "total_steps": 10853, "loss": 0.1546, "learning_rate": 3.6508977222833737e-06, "epoch": 0.3803381397705809, "percentage": 38.04, "elapsed_time": "13:03:02", "remaining_time": "21:15:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4129, "total_steps": 10853, "loss": 0.1529, "learning_rate": 3.6502214092085504e-06, "epoch": 0.38043027594785095, "percentage": 38.04, "elapsed_time": "13:03:12", "remaining_time": "21:15:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4130, "total_steps": 10853, "loss": 0.1542, "learning_rate": 3.649544989335545e-06, "epoch": 0.38052241212512095, "percentage": 38.05, "elapsed_time": "13:03:23", "remaining_time": "21:15:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4131, "total_steps": 10853, "loss": 0.1575, "learning_rate": 3.648868462727165e-06, "epoch": 0.38061454830239094, "percentage": 38.06, "elapsed_time": "13:03:33", "remaining_time": "21:15:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4132, "total_steps": 10853, "loss": 0.1533, "learning_rate": 3.6481918294462237e-06, "epoch": 0.38070668447966094, "percentage": 38.07, "elapsed_time": "13:03:45", "remaining_time": "21:14:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4133, "total_steps": 10853, "loss": 0.1587, "learning_rate": 3.647515089555548e-06, "epoch": 0.38079882065693094, "percentage": 38.08, "elapsed_time": "13:03:56", "remaining_time": "21:14:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4134, "total_steps": 10853, "loss": 0.1435, "learning_rate": 3.6468382431179717e-06, "epoch": 0.38089095683420093, "percentage": 38.09, "elapsed_time": "13:04:08", "remaining_time": "21:14:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4135, "total_steps": 10853, "loss": 0.1529, "learning_rate": 3.646161290196342e-06, "epoch": 0.38098309301147093, "percentage": 38.1, "elapsed_time": "13:04:19", "remaining_time": "21:14:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4136, "total_steps": 10853, "loss": 0.1707, "learning_rate": 3.645484230853513e-06, "epoch": 0.381075229188741, "percentage": 38.11, "elapsed_time": "13:04:29", "remaining_time": "21:14:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4137, "total_steps": 10853, "loss": 0.1673, "learning_rate": 3.64480706515235e-06, "epoch": 0.381167365366011, "percentage": 38.12, "elapsed_time": "13:04:41", "remaining_time": "21:13:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4138, "total_steps": 10853, "loss": 0.1552, "learning_rate": 3.6441297931557274e-06, "epoch": 0.381259501543281, "percentage": 38.13, "elapsed_time": "13:04:51", "remaining_time": "21:13:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4139, "total_steps": 10853, "loss": 0.1594, "learning_rate": 3.643452414926531e-06, "epoch": 0.381351637720551, "percentage": 38.14, "elapsed_time": "13:05:02", "remaining_time": "21:13:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4140, "total_steps": 10853, "loss": 0.1415, "learning_rate": 3.6427749305276537e-06, "epoch": 0.38144377389782097, "percentage": 38.15, "elapsed_time": "13:05:12", "remaining_time": "21:13:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4141, "total_steps": 10853, "loss": 0.16, "learning_rate": 3.6420973400220016e-06, "epoch": 0.38153591007509097, "percentage": 38.16, "elapsed_time": "13:05:23", "remaining_time": "21:13:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4142, "total_steps": 10853, "loss": 0.1576, "learning_rate": 3.641419643472489e-06, "epoch": 0.38162804625236096, "percentage": 38.16, "elapsed_time": "13:05:34", "remaining_time": "21:12:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4143, "total_steps": 10853, "loss": 0.1504, "learning_rate": 3.640741840942039e-06, "epoch": 0.381720182429631, "percentage": 38.17, "elapsed_time": "13:05:45", "remaining_time": "21:12:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4144, "total_steps": 10853, "loss": 0.1525, "learning_rate": 3.640063932493588e-06, "epoch": 0.381812318606901, "percentage": 38.18, "elapsed_time": "13:05:56", "remaining_time": "21:12:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4145, "total_steps": 10853, "loss": 0.1527, "learning_rate": 3.639385918190076e-06, "epoch": 0.381904454784171, "percentage": 38.19, "elapsed_time": "13:06:07", "remaining_time": "21:12:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4146, "total_steps": 10853, "loss": 0.1621, "learning_rate": 3.6387077980944595e-06, "epoch": 0.381996590961441, "percentage": 38.2, "elapsed_time": "13:06:18", "remaining_time": "21:12:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4147, "total_steps": 10853, "loss": 0.1505, "learning_rate": 3.6380295722697023e-06, "epoch": 0.382088727138711, "percentage": 38.21, "elapsed_time": "13:06:28", "remaining_time": "21:11:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4148, "total_steps": 10853, "loss": 0.1354, "learning_rate": 3.637351240778776e-06, "epoch": 0.382180863315981, "percentage": 38.22, "elapsed_time": "13:06:39", "remaining_time": "21:11:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4149, "total_steps": 10853, "loss": 0.1546, "learning_rate": 3.6366728036846647e-06, "epoch": 0.382272999493251, "percentage": 38.23, "elapsed_time": "13:06:49", "remaining_time": "21:11:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4150, "total_steps": 10853, "loss": 0.1544, "learning_rate": 3.635994261050362e-06, "epoch": 0.38236513567052105, "percentage": 38.24, "elapsed_time": "13:06:59", "remaining_time": "21:11:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4151, "total_steps": 10853, "loss": 0.1522, "learning_rate": 3.6353156129388683e-06, "epoch": 0.38245727184779105, "percentage": 38.25, "elapsed_time": "13:07:10", "remaining_time": "21:10:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4152, "total_steps": 10853, "loss": 0.1393, "learning_rate": 3.634636859413199e-06, "epoch": 0.38254940802506104, "percentage": 38.26, "elapsed_time": "13:07:22", "remaining_time": "21:10:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4153, "total_steps": 10853, "loss": 0.1567, "learning_rate": 3.633958000536375e-06, "epoch": 0.38264154420233104, "percentage": 38.27, "elapsed_time": "13:07:32", "remaining_time": "21:10:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4154, "total_steps": 10853, "loss": 0.1542, "learning_rate": 3.633279036371429e-06, "epoch": 0.38273368037960104, "percentage": 38.28, "elapsed_time": "13:07:44", "remaining_time": "21:10:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4155, "total_steps": 10853, "loss": 0.1477, "learning_rate": 3.6325999669814014e-06, "epoch": 0.38282581655687103, "percentage": 38.28, "elapsed_time": "13:07:55", "remaining_time": "21:10:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4156, "total_steps": 10853, "loss": 0.1534, "learning_rate": 3.631920792429346e-06, "epoch": 0.3829179527341411, "percentage": 38.29, "elapsed_time": "13:08:05", "remaining_time": "21:09:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4157, "total_steps": 10853, "loss": 0.1436, "learning_rate": 3.6312415127783228e-06, "epoch": 0.3830100889114111, "percentage": 38.3, "elapsed_time": "13:08:16", "remaining_time": "21:09:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4158, "total_steps": 10853, "loss": 0.1546, "learning_rate": 3.630562128091403e-06, "epoch": 0.3831022250886811, "percentage": 38.31, "elapsed_time": "13:08:28", "remaining_time": "21:09:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4159, "total_steps": 10853, "loss": 0.1514, "learning_rate": 3.6298826384316684e-06, "epoch": 0.3831943612659511, "percentage": 38.32, "elapsed_time": "13:08:38", "remaining_time": "21:09:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4160, "total_steps": 10853, "loss": 0.1424, "learning_rate": 3.6292030438622093e-06, "epoch": 0.3832864974432211, "percentage": 38.33, "elapsed_time": "13:08:48", "remaining_time": "21:09:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4161, "total_steps": 10853, "loss": 0.1644, "learning_rate": 3.6285233444461255e-06, "epoch": 0.38337863362049107, "percentage": 38.34, "elapsed_time": "13:08:59", "remaining_time": "21:08:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4162, "total_steps": 10853, "loss": 0.1357, "learning_rate": 3.6278435402465283e-06, "epoch": 0.38347076979776107, "percentage": 38.35, "elapsed_time": "13:09:09", "remaining_time": "21:08:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4163, "total_steps": 10853, "loss": 0.1697, "learning_rate": 3.6271636313265368e-06, "epoch": 0.3835629059750311, "percentage": 38.36, "elapsed_time": "13:09:20", "remaining_time": "21:08:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4164, "total_steps": 10853, "loss": 0.1469, "learning_rate": 3.6264836177492812e-06, "epoch": 0.3836550421523011, "percentage": 38.37, "elapsed_time": "13:09:30", "remaining_time": "21:08:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4165, "total_steps": 10853, "loss": 0.1342, "learning_rate": 3.6258034995778994e-06, "epoch": 0.3837471783295711, "percentage": 38.38, "elapsed_time": "13:09:42", "remaining_time": "21:08:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4166, "total_steps": 10853, "loss": 0.154, "learning_rate": 3.6251232768755428e-06, "epoch": 0.3838393145068411, "percentage": 38.39, "elapsed_time": "13:09:53", "remaining_time": "21:07:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4167, "total_steps": 10853, "loss": 0.1507, "learning_rate": 3.6244429497053678e-06, "epoch": 0.3839314506841111, "percentage": 38.39, "elapsed_time": "13:10:03", "remaining_time": "21:07:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4168, "total_steps": 10853, "loss": 0.1474, "learning_rate": 3.623762518130545e-06, "epoch": 0.3840235868613811, "percentage": 38.4, "elapsed_time": "13:10:13", "remaining_time": "21:07:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4169, "total_steps": 10853, "loss": 0.1416, "learning_rate": 3.6230819822142504e-06, "epoch": 0.3841157230386511, "percentage": 38.41, "elapsed_time": "13:10:22", "remaining_time": "21:07:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4170, "total_steps": 10853, "loss": 0.1586, "learning_rate": 3.6224013420196734e-06, "epoch": 0.38420785921592115, "percentage": 38.42, "elapsed_time": "13:10:32", "remaining_time": "21:06:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4171, "total_steps": 10853, "loss": 0.1431, "learning_rate": 3.621720597610011e-06, "epoch": 0.38429999539319115, "percentage": 38.43, "elapsed_time": "13:10:42", "remaining_time": "21:06:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4172, "total_steps": 10853, "loss": 0.1383, "learning_rate": 3.62103974904847e-06, "epoch": 0.38439213157046115, "percentage": 38.44, "elapsed_time": "13:10:53", "remaining_time": "21:06:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4173, "total_steps": 10853, "loss": 0.1438, "learning_rate": 3.620358796398268e-06, "epoch": 0.38448426774773115, "percentage": 38.45, "elapsed_time": "13:11:04", "remaining_time": "21:06:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4174, "total_steps": 10853, "loss": 0.1439, "learning_rate": 3.6196777397226314e-06, "epoch": 0.38457640392500114, "percentage": 38.46, "elapsed_time": "13:11:15", "remaining_time": "21:06:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4175, "total_steps": 10853, "loss": 0.1706, "learning_rate": 3.618996579084796e-06, "epoch": 0.38466854010227114, "percentage": 38.47, "elapsed_time": "13:11:26", "remaining_time": "21:05:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4176, "total_steps": 10853, "loss": 0.1502, "learning_rate": 3.6183153145480075e-06, "epoch": 0.38476067627954114, "percentage": 38.48, "elapsed_time": "13:11:36", "remaining_time": "21:05:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4177, "total_steps": 10853, "loss": 0.1544, "learning_rate": 3.6176339461755217e-06, "epoch": 0.3848528124568112, "percentage": 38.49, "elapsed_time": "13:11:48", "remaining_time": "21:05:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4178, "total_steps": 10853, "loss": 0.1269, "learning_rate": 3.6169524740306038e-06, "epoch": 0.3849449486340812, "percentage": 38.5, "elapsed_time": "13:11:59", "remaining_time": "21:05:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4179, "total_steps": 10853, "loss": 0.1392, "learning_rate": 3.6162708981765294e-06, "epoch": 0.3850370848113512, "percentage": 38.51, "elapsed_time": "13:12:11", "remaining_time": "21:05:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4180, "total_steps": 10853, "loss": 0.1477, "learning_rate": 3.6155892186765805e-06, "epoch": 0.3851292209886212, "percentage": 38.51, "elapsed_time": "13:12:22", "remaining_time": "21:04:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4181, "total_steps": 10853, "loss": 0.1398, "learning_rate": 3.6149074355940533e-06, "epoch": 0.3852213571658912, "percentage": 38.52, "elapsed_time": "13:12:32", "remaining_time": "21:04:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4182, "total_steps": 10853, "loss": 0.1531, "learning_rate": 3.614225548992251e-06, "epoch": 0.3853134933431612, "percentage": 38.53, "elapsed_time": "13:12:45", "remaining_time": "21:04:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4183, "total_steps": 10853, "loss": 0.1451, "learning_rate": 3.6135435589344857e-06, "epoch": 0.38540562952043117, "percentage": 38.54, "elapsed_time": "13:12:57", "remaining_time": "21:04:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4184, "total_steps": 10853, "loss": 0.1572, "learning_rate": 3.612861465484082e-06, "epoch": 0.3854977656977012, "percentage": 38.55, "elapsed_time": "13:13:07", "remaining_time": "21:04:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4185, "total_steps": 10853, "loss": 0.1673, "learning_rate": 3.612179268704371e-06, "epoch": 0.3855899018749712, "percentage": 38.56, "elapsed_time": "13:13:18", "remaining_time": "21:03:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4186, "total_steps": 10853, "loss": 0.1397, "learning_rate": 3.611496968658695e-06, "epoch": 0.3856820380522412, "percentage": 38.57, "elapsed_time": "13:13:29", "remaining_time": "21:03:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4187, "total_steps": 10853, "loss": 0.1539, "learning_rate": 3.6108145654104065e-06, "epoch": 0.3857741742295112, "percentage": 38.58, "elapsed_time": "13:13:40", "remaining_time": "21:03:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4188, "total_steps": 10853, "loss": 0.151, "learning_rate": 3.610132059022865e-06, "epoch": 0.3858663104067812, "percentage": 38.59, "elapsed_time": "13:13:52", "remaining_time": "21:03:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4189, "total_steps": 10853, "loss": 0.1457, "learning_rate": 3.6094494495594435e-06, "epoch": 0.3859584465840512, "percentage": 38.6, "elapsed_time": "13:14:03", "remaining_time": "21:03:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4190, "total_steps": 10853, "loss": 0.1533, "learning_rate": 3.6087667370835213e-06, "epoch": 0.38605058276132126, "percentage": 38.61, "elapsed_time": "13:14:14", "remaining_time": "21:03:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4191, "total_steps": 10853, "loss": 0.1463, "learning_rate": 3.6080839216584875e-06, "epoch": 0.38614271893859126, "percentage": 38.62, "elapsed_time": "13:14:24", "remaining_time": "21:02:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4192, "total_steps": 10853, "loss": 0.1473, "learning_rate": 3.6074010033477425e-06, "epoch": 0.38623485511586125, "percentage": 38.63, "elapsed_time": "13:14:34", "remaining_time": "21:02:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4193, "total_steps": 10853, "loss": 0.1629, "learning_rate": 3.606717982214695e-06, "epoch": 0.38632699129313125, "percentage": 38.63, "elapsed_time": "13:14:44", "remaining_time": "21:02:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4194, "total_steps": 10853, "loss": 0.1282, "learning_rate": 3.6060348583227635e-06, "epoch": 0.38641912747040125, "percentage": 38.64, "elapsed_time": "13:14:55", "remaining_time": "21:02:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4195, "total_steps": 10853, "loss": 0.1499, "learning_rate": 3.6053516317353777e-06, "epoch": 0.38651126364767124, "percentage": 38.65, "elapsed_time": "13:15:05", "remaining_time": "21:01:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4196, "total_steps": 10853, "loss": 0.1315, "learning_rate": 3.6046683025159722e-06, "epoch": 0.38660339982494124, "percentage": 38.66, "elapsed_time": "13:15:16", "remaining_time": "21:01:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4197, "total_steps": 10853, "loss": 0.1675, "learning_rate": 3.6039848707279965e-06, "epoch": 0.3866955360022113, "percentage": 38.67, "elapsed_time": "13:15:27", "remaining_time": "21:01:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4198, "total_steps": 10853, "loss": 0.1433, "learning_rate": 3.6033013364349074e-06, "epoch": 0.3867876721794813, "percentage": 38.68, "elapsed_time": "13:15:38", "remaining_time": "21:01:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4199, "total_steps": 10853, "loss": 0.1602, "learning_rate": 3.60261769970017e-06, "epoch": 0.3868798083567513, "percentage": 38.69, "elapsed_time": "13:15:50", "remaining_time": "21:01:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4200, "total_steps": 10853, "loss": 0.1423, "learning_rate": 3.6019339605872604e-06, "epoch": 0.3869719445340213, "percentage": 38.7, "elapsed_time": "13:15:59", "remaining_time": "21:00:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4201, "total_steps": 10853, "loss": 0.129, "learning_rate": 3.6012501191596637e-06, "epoch": 0.3870640807112913, "percentage": 38.71, "elapsed_time": "13:16:10", "remaining_time": "21:00:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4202, "total_steps": 10853, "loss": 0.1306, "learning_rate": 3.6005661754808755e-06, "epoch": 0.3871562168885613, "percentage": 38.72, "elapsed_time": "13:16:21", "remaining_time": "21:00:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4203, "total_steps": 10853, "loss": 0.1647, "learning_rate": 3.5998821296143995e-06, "epoch": 0.3872483530658313, "percentage": 38.73, "elapsed_time": "13:16:30", "remaining_time": "21:00:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4204, "total_steps": 10853, "loss": 0.1398, "learning_rate": 3.5991979816237495e-06, "epoch": 0.3873404892431013, "percentage": 38.74, "elapsed_time": "13:16:41", "remaining_time": "21:00:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4205, "total_steps": 10853, "loss": 0.1467, "learning_rate": 3.5985137315724476e-06, "epoch": 0.3874326254203713, "percentage": 38.75, "elapsed_time": "13:16:50", "remaining_time": "20:59:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4206, "total_steps": 10853, "loss": 0.1527, "learning_rate": 3.597829379524029e-06, "epoch": 0.3875247615976413, "percentage": 38.75, "elapsed_time": "13:17:00", "remaining_time": "20:59:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4207, "total_steps": 10853, "loss": 0.1429, "learning_rate": 3.5971449255420334e-06, "epoch": 0.3876168977749113, "percentage": 38.76, "elapsed_time": "13:17:12", "remaining_time": "20:59:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4208, "total_steps": 10853, "loss": 0.1767, "learning_rate": 3.5964603696900137e-06, "epoch": 0.3877090339521813, "percentage": 38.77, "elapsed_time": "13:17:23", "remaining_time": "20:59:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4209, "total_steps": 10853, "loss": 0.1477, "learning_rate": 3.59577571203153e-06, "epoch": 0.3878011701294513, "percentage": 38.78, "elapsed_time": "13:17:35", "remaining_time": "20:59:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4210, "total_steps": 10853, "loss": 0.1435, "learning_rate": 3.5950909526301543e-06, "epoch": 0.3878933063067213, "percentage": 38.79, "elapsed_time": "13:17:45", "remaining_time": "20:58:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4211, "total_steps": 10853, "loss": 0.1496, "learning_rate": 3.5944060915494656e-06, "epoch": 0.38798544248399136, "percentage": 38.8, "elapsed_time": "13:17:55", "remaining_time": "20:58:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4212, "total_steps": 10853, "loss": 0.1414, "learning_rate": 3.5937211288530536e-06, "epoch": 0.38807757866126136, "percentage": 38.81, "elapsed_time": "13:18:06", "remaining_time": "20:58:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4213, "total_steps": 10853, "loss": 0.144, "learning_rate": 3.5930360646045165e-06, "epoch": 0.38816971483853135, "percentage": 38.82, "elapsed_time": "13:18:17", "remaining_time": "20:58:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4214, "total_steps": 10853, "loss": 0.1531, "learning_rate": 3.5923508988674643e-06, "epoch": 0.38826185101580135, "percentage": 38.83, "elapsed_time": "13:18:28", "remaining_time": "20:57:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4215, "total_steps": 10853, "loss": 0.1583, "learning_rate": 3.591665631705512e-06, "epoch": 0.38835398719307135, "percentage": 38.84, "elapsed_time": "13:18:39", "remaining_time": "20:57:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4216, "total_steps": 10853, "loss": 0.1392, "learning_rate": 3.59098026318229e-06, "epoch": 0.38844612337034135, "percentage": 38.85, "elapsed_time": "13:18:49", "remaining_time": "20:57:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4217, "total_steps": 10853, "loss": 0.1394, "learning_rate": 3.5902947933614317e-06, "epoch": 0.38853825954761134, "percentage": 38.86, "elapsed_time": "13:19:00", "remaining_time": "20:57:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4218, "total_steps": 10853, "loss": 0.1541, "learning_rate": 3.5896092223065854e-06, "epoch": 0.3886303957248814, "percentage": 38.86, "elapsed_time": "13:19:11", "remaining_time": "20:57:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4219, "total_steps": 10853, "loss": 0.1542, "learning_rate": 3.5889235500814055e-06, "epoch": 0.3887225319021514, "percentage": 38.87, "elapsed_time": "13:19:22", "remaining_time": "20:56:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4220, "total_steps": 10853, "loss": 0.1501, "learning_rate": 3.588237776749557e-06, "epoch": 0.3888146680794214, "percentage": 38.88, "elapsed_time": "13:19:33", "remaining_time": "20:56:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4221, "total_steps": 10853, "loss": 0.1453, "learning_rate": 3.5875519023747125e-06, "epoch": 0.3889068042566914, "percentage": 38.89, "elapsed_time": "13:19:43", "remaining_time": "20:56:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4222, "total_steps": 10853, "loss": 0.1493, "learning_rate": 3.5868659270205584e-06, "epoch": 0.3889989404339614, "percentage": 38.9, "elapsed_time": "13:19:52", "remaining_time": "20:56:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4223, "total_steps": 10853, "loss": 0.1544, "learning_rate": 3.586179850750785e-06, "epoch": 0.3890910766112314, "percentage": 38.91, "elapsed_time": "13:20:02", "remaining_time": "20:56:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4224, "total_steps": 10853, "loss": 0.1495, "learning_rate": 3.5854936736290956e-06, "epoch": 0.38918321278850143, "percentage": 38.92, "elapsed_time": "13:20:12", "remaining_time": "20:55:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4225, "total_steps": 10853, "loss": 0.1316, "learning_rate": 3.584807395719202e-06, "epoch": 0.38927534896577143, "percentage": 38.93, "elapsed_time": "13:20:22", "remaining_time": "20:55:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4226, "total_steps": 10853, "loss": 0.162, "learning_rate": 3.584121017084825e-06, "epoch": 0.3893674851430414, "percentage": 38.94, "elapsed_time": "13:20:33", "remaining_time": "20:55:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4227, "total_steps": 10853, "loss": 0.1534, "learning_rate": 3.5834345377896953e-06, "epoch": 0.3894596213203114, "percentage": 38.95, "elapsed_time": "13:20:44", "remaining_time": "20:55:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4228, "total_steps": 10853, "loss": 0.1485, "learning_rate": 3.5827479578975523e-06, "epoch": 0.3895517574975814, "percentage": 38.96, "elapsed_time": "13:20:57", "remaining_time": "20:55:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4229, "total_steps": 10853, "loss": 0.142, "learning_rate": 3.582061277472144e-06, "epoch": 0.3896438936748514, "percentage": 38.97, "elapsed_time": "13:21:08", "remaining_time": "20:54:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4230, "total_steps": 10853, "loss": 0.1496, "learning_rate": 3.5813744965772296e-06, "epoch": 0.3897360298521214, "percentage": 38.98, "elapsed_time": "13:21:19", "remaining_time": "20:54:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4231, "total_steps": 10853, "loss": 0.1349, "learning_rate": 3.580687615276577e-06, "epoch": 0.38982816602939147, "percentage": 38.98, "elapsed_time": "13:21:31", "remaining_time": "20:54:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4232, "total_steps": 10853, "loss": 0.1495, "learning_rate": 3.580000633633963e-06, "epoch": 0.38992030220666146, "percentage": 38.99, "elapsed_time": "13:21:40", "remaining_time": "20:54:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4233, "total_steps": 10853, "loss": 0.1616, "learning_rate": 3.579313551713175e-06, "epoch": 0.39001243838393146, "percentage": 39.0, "elapsed_time": "13:21:51", "remaining_time": "20:54:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4234, "total_steps": 10853, "loss": 0.145, "learning_rate": 3.578626369578006e-06, "epoch": 0.39010457456120146, "percentage": 39.01, "elapsed_time": "13:22:02", "remaining_time": "20:53:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4235, "total_steps": 10853, "loss": 0.1542, "learning_rate": 3.5779390872922637e-06, "epoch": 0.39019671073847145, "percentage": 39.02, "elapsed_time": "13:22:13", "remaining_time": "20:53:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4236, "total_steps": 10853, "loss": 0.1668, "learning_rate": 3.5772517049197602e-06, "epoch": 0.39028884691574145, "percentage": 39.03, "elapsed_time": "13:22:24", "remaining_time": "20:53:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4237, "total_steps": 10853, "loss": 0.1501, "learning_rate": 3.5765642225243204e-06, "epoch": 0.39038098309301145, "percentage": 39.04, "elapsed_time": "13:22:34", "remaining_time": "20:53:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4238, "total_steps": 10853, "loss": 0.1526, "learning_rate": 3.575876640169777e-06, "epoch": 0.3904731192702815, "percentage": 39.05, "elapsed_time": "13:22:45", "remaining_time": "20:52:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4239, "total_steps": 10853, "loss": 0.1519, "learning_rate": 3.5751889579199715e-06, "epoch": 0.3905652554475515, "percentage": 39.06, "elapsed_time": "13:22:56", "remaining_time": "20:52:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4240, "total_steps": 10853, "loss": 0.147, "learning_rate": 3.574501175838755e-06, "epoch": 0.3906573916248215, "percentage": 39.07, "elapsed_time": "13:23:07", "remaining_time": "20:52:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4241, "total_steps": 10853, "loss": 0.1593, "learning_rate": 3.5738132939899895e-06, "epoch": 0.3907495278020915, "percentage": 39.08, "elapsed_time": "13:23:19", "remaining_time": "20:52:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4242, "total_steps": 10853, "loss": 0.1571, "learning_rate": 3.573125312437544e-06, "epoch": 0.3908416639793615, "percentage": 39.09, "elapsed_time": "13:23:29", "remaining_time": "20:52:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4243, "total_steps": 10853, "loss": 0.1469, "learning_rate": 3.572437231245297e-06, "epoch": 0.3909338001566315, "percentage": 39.1, "elapsed_time": "13:23:40", "remaining_time": "20:52:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4244, "total_steps": 10853, "loss": 0.1549, "learning_rate": 3.5717490504771386e-06, "epoch": 0.3910259363339015, "percentage": 39.1, "elapsed_time": "13:23:51", "remaining_time": "20:51:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4245, "total_steps": 10853, "loss": 0.1426, "learning_rate": 3.571060770196965e-06, "epoch": 0.39111807251117153, "percentage": 39.11, "elapsed_time": "13:24:02", "remaining_time": "20:51:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4246, "total_steps": 10853, "loss": 0.1373, "learning_rate": 3.570372390468684e-06, "epoch": 0.39121020868844153, "percentage": 39.12, "elapsed_time": "13:24:12", "remaining_time": "20:51:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4247, "total_steps": 10853, "loss": 0.147, "learning_rate": 3.569683911356211e-06, "epoch": 0.3913023448657115, "percentage": 39.13, "elapsed_time": "13:24:22", "remaining_time": "20:51:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4248, "total_steps": 10853, "loss": 0.1557, "learning_rate": 3.568995332923472e-06, "epoch": 0.3913944810429815, "percentage": 39.14, "elapsed_time": "13:24:34", "remaining_time": "20:50:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4249, "total_steps": 10853, "loss": 0.1653, "learning_rate": 3.568306655234401e-06, "epoch": 0.3914866172202515, "percentage": 39.15, "elapsed_time": "13:24:46", "remaining_time": "20:50:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4250, "total_steps": 10853, "loss": 0.1434, "learning_rate": 3.567617878352942e-06, "epoch": 0.3915787533975215, "percentage": 39.16, "elapsed_time": "13:24:57", "remaining_time": "20:50:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4251, "total_steps": 10853, "loss": 0.145, "learning_rate": 3.566929002343048e-06, "epoch": 0.3916708895747915, "percentage": 39.17, "elapsed_time": "13:25:07", "remaining_time": "20:50:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4252, "total_steps": 10853, "loss": 0.1505, "learning_rate": 3.5662400272686813e-06, "epoch": 0.39176302575206157, "percentage": 39.18, "elapsed_time": "13:25:17", "remaining_time": "20:50:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4253, "total_steps": 10853, "loss": 0.1491, "learning_rate": 3.5655509531938143e-06, "epoch": 0.39185516192933156, "percentage": 39.19, "elapsed_time": "13:25:28", "remaining_time": "20:49:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4254, "total_steps": 10853, "loss": 0.1474, "learning_rate": 3.5648617801824257e-06, "epoch": 0.39194729810660156, "percentage": 39.2, "elapsed_time": "13:25:39", "remaining_time": "20:49:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4255, "total_steps": 10853, "loss": 0.1385, "learning_rate": 3.5641725082985066e-06, "epoch": 0.39203943428387156, "percentage": 39.21, "elapsed_time": "13:25:50", "remaining_time": "20:49:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4256, "total_steps": 10853, "loss": 0.1483, "learning_rate": 3.5634831376060554e-06, "epoch": 0.39213157046114155, "percentage": 39.21, "elapsed_time": "13:26:01", "remaining_time": "20:49:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4257, "total_steps": 10853, "loss": 0.1385, "learning_rate": 3.5627936681690804e-06, "epoch": 0.39222370663841155, "percentage": 39.22, "elapsed_time": "13:26:13", "remaining_time": "20:49:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4258, "total_steps": 10853, "loss": 0.1502, "learning_rate": 3.562104100051599e-06, "epoch": 0.3923158428156816, "percentage": 39.23, "elapsed_time": "13:26:25", "remaining_time": "20:49:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4259, "total_steps": 10853, "loss": 0.144, "learning_rate": 3.561414433317637e-06, "epoch": 0.3924079789929516, "percentage": 39.24, "elapsed_time": "13:26:34", "remaining_time": "20:48:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4260, "total_steps": 10853, "loss": 0.1535, "learning_rate": 3.560724668031231e-06, "epoch": 0.3925001151702216, "percentage": 39.25, "elapsed_time": "13:26:45", "remaining_time": "20:48:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4261, "total_steps": 10853, "loss": 0.1575, "learning_rate": 3.560034804256426e-06, "epoch": 0.3925922513474916, "percentage": 39.26, "elapsed_time": "13:26:55", "remaining_time": "20:48:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4262, "total_steps": 10853, "loss": 0.1352, "learning_rate": 3.5593448420572753e-06, "epoch": 0.3926843875247616, "percentage": 39.27, "elapsed_time": "13:27:06", "remaining_time": "20:48:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4263, "total_steps": 10853, "loss": 0.1351, "learning_rate": 3.558654781497841e-06, "epoch": 0.3927765237020316, "percentage": 39.28, "elapsed_time": "13:27:17", "remaining_time": "20:47:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4264, "total_steps": 10853, "loss": 0.1488, "learning_rate": 3.557964622642197e-06, "epoch": 0.3928686598793016, "percentage": 39.29, "elapsed_time": "13:27:28", "remaining_time": "20:47:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4265, "total_steps": 10853, "loss": 0.1651, "learning_rate": 3.557274365554424e-06, "epoch": 0.39296079605657164, "percentage": 39.3, "elapsed_time": "13:27:39", "remaining_time": "20:47:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4266, "total_steps": 10853, "loss": 0.1377, "learning_rate": 3.5565840102986128e-06, "epoch": 0.39305293223384163, "percentage": 39.31, "elapsed_time": "13:27:50", "remaining_time": "20:47:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4267, "total_steps": 10853, "loss": 0.1401, "learning_rate": 3.555893556938862e-06, "epoch": 0.39314506841111163, "percentage": 39.32, "elapsed_time": "13:28:01", "remaining_time": "20:47:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4268, "total_steps": 10853, "loss": 0.1333, "learning_rate": 3.5552030055392805e-06, "epoch": 0.39323720458838163, "percentage": 39.33, "elapsed_time": "13:28:11", "remaining_time": "20:46:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4269, "total_steps": 10853, "loss": 0.152, "learning_rate": 3.554512356163986e-06, "epoch": 0.3933293407656516, "percentage": 39.33, "elapsed_time": "13:28:21", "remaining_time": "20:46:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4270, "total_steps": 10853, "loss": 0.1355, "learning_rate": 3.553821608877107e-06, "epoch": 0.3934214769429216, "percentage": 39.34, "elapsed_time": "13:28:30", "remaining_time": "20:46:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4271, "total_steps": 10853, "loss": 0.1461, "learning_rate": 3.5531307637427774e-06, "epoch": 0.3935136131201916, "percentage": 39.35, "elapsed_time": "13:28:41", "remaining_time": "20:46:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4272, "total_steps": 10853, "loss": 0.1475, "learning_rate": 3.552439820825143e-06, "epoch": 0.39360574929746167, "percentage": 39.36, "elapsed_time": "13:28:53", "remaining_time": "20:46:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4273, "total_steps": 10853, "loss": 0.1617, "learning_rate": 3.5517487801883587e-06, "epoch": 0.39369788547473167, "percentage": 39.37, "elapsed_time": "13:29:03", "remaining_time": "20:45:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4274, "total_steps": 10853, "loss": 0.1383, "learning_rate": 3.5510576418965862e-06, "epoch": 0.39379002165200166, "percentage": 39.38, "elapsed_time": "13:29:13", "remaining_time": "20:45:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4275, "total_steps": 10853, "loss": 0.1514, "learning_rate": 3.5503664060139987e-06, "epoch": 0.39388215782927166, "percentage": 39.39, "elapsed_time": "13:29:26", "remaining_time": "20:45:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4276, "total_steps": 10853, "loss": 0.1327, "learning_rate": 3.549675072604778e-06, "epoch": 0.39397429400654166, "percentage": 39.4, "elapsed_time": "13:29:36", "remaining_time": "20:45:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4277, "total_steps": 10853, "loss": 0.1525, "learning_rate": 3.548983641733113e-06, "epoch": 0.39406643018381166, "percentage": 39.41, "elapsed_time": "13:29:46", "remaining_time": "20:45:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4278, "total_steps": 10853, "loss": 0.1509, "learning_rate": 3.5482921134632043e-06, "epoch": 0.39415856636108165, "percentage": 39.42, "elapsed_time": "13:29:57", "remaining_time": "20:44:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4279, "total_steps": 10853, "loss": 0.1454, "learning_rate": 3.54760048785926e-06, "epoch": 0.3942507025383517, "percentage": 39.43, "elapsed_time": "13:30:08", "remaining_time": "20:44:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4280, "total_steps": 10853, "loss": 0.1604, "learning_rate": 3.546908764985498e-06, "epoch": 0.3943428387156217, "percentage": 39.44, "elapsed_time": "13:30:20", "remaining_time": "20:44:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4281, "total_steps": 10853, "loss": 0.1433, "learning_rate": 3.5462169449061445e-06, "epoch": 0.3944349748928917, "percentage": 39.45, "elapsed_time": "13:30:30", "remaining_time": "20:44:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4282, "total_steps": 10853, "loss": 0.1445, "learning_rate": 3.5455250276854348e-06, "epoch": 0.3945271110701617, "percentage": 39.45, "elapsed_time": "13:30:41", "remaining_time": "20:44:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4283, "total_steps": 10853, "loss": 0.1269, "learning_rate": 3.544833013387613e-06, "epoch": 0.3946192472474317, "percentage": 39.46, "elapsed_time": "13:30:51", "remaining_time": "20:43:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4284, "total_steps": 10853, "loss": 0.1496, "learning_rate": 3.5441409020769347e-06, "epoch": 0.3947113834247017, "percentage": 39.47, "elapsed_time": "13:31:03", "remaining_time": "20:43:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4285, "total_steps": 10853, "loss": 0.1407, "learning_rate": 3.5434486938176606e-06, "epoch": 0.39480351960197174, "percentage": 39.48, "elapsed_time": "13:31:13", "remaining_time": "20:43:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4286, "total_steps": 10853, "loss": 0.1519, "learning_rate": 3.5427563886740633e-06, "epoch": 0.39489565577924174, "percentage": 39.49, "elapsed_time": "13:31:23", "remaining_time": "20:43:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4287, "total_steps": 10853, "loss": 0.1582, "learning_rate": 3.542063986710423e-06, "epoch": 0.39498779195651174, "percentage": 39.5, "elapsed_time": "13:31:36", "remaining_time": "20:43:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4288, "total_steps": 10853, "loss": 0.1435, "learning_rate": 3.5413714879910287e-06, "epoch": 0.39507992813378173, "percentage": 39.51, "elapsed_time": "13:31:47", "remaining_time": "20:42:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4289, "total_steps": 10853, "loss": 0.146, "learning_rate": 3.540678892580181e-06, "epoch": 0.39517206431105173, "percentage": 39.52, "elapsed_time": "13:31:56", "remaining_time": "20:42:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4290, "total_steps": 10853, "loss": 0.148, "learning_rate": 3.539986200542185e-06, "epoch": 0.3952642004883217, "percentage": 39.53, "elapsed_time": "13:32:06", "remaining_time": "20:42:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4291, "total_steps": 10853, "loss": 0.1486, "learning_rate": 3.539293411941359e-06, "epoch": 0.3953563366655917, "percentage": 39.54, "elapsed_time": "13:32:17", "remaining_time": "20:42:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4292, "total_steps": 10853, "loss": 0.1507, "learning_rate": 3.5386005268420277e-06, "epoch": 0.3954484728428618, "percentage": 39.55, "elapsed_time": "13:32:29", "remaining_time": "20:42:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4293, "total_steps": 10853, "loss": 0.1572, "learning_rate": 3.5379075453085256e-06, "epoch": 0.3955406090201318, "percentage": 39.56, "elapsed_time": "13:32:40", "remaining_time": "20:41:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4294, "total_steps": 10853, "loss": 0.1366, "learning_rate": 3.5372144674051963e-06, "epoch": 0.39563274519740177, "percentage": 39.57, "elapsed_time": "13:32:50", "remaining_time": "20:41:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4295, "total_steps": 10853, "loss": 0.1654, "learning_rate": 3.536521293196392e-06, "epoch": 0.39572488137467177, "percentage": 39.57, "elapsed_time": "13:33:00", "remaining_time": "20:41:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4296, "total_steps": 10853, "loss": 0.1624, "learning_rate": 3.5358280227464735e-06, "epoch": 0.39581701755194176, "percentage": 39.58, "elapsed_time": "13:33:12", "remaining_time": "20:41:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4297, "total_steps": 10853, "loss": 0.1367, "learning_rate": 3.535134656119813e-06, "epoch": 0.39590915372921176, "percentage": 39.59, "elapsed_time": "13:33:24", "remaining_time": "20:41:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4298, "total_steps": 10853, "loss": 0.142, "learning_rate": 3.534441193380787e-06, "epoch": 0.39600128990648176, "percentage": 39.6, "elapsed_time": "13:33:35", "remaining_time": "20:40:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4299, "total_steps": 10853, "loss": 0.1462, "learning_rate": 3.5337476345937853e-06, "epoch": 0.3960934260837518, "percentage": 39.61, "elapsed_time": "13:33:45", "remaining_time": "20:40:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4300, "total_steps": 10853, "loss": 0.1333, "learning_rate": 3.5330539798232044e-06, "epoch": 0.3961855622610218, "percentage": 39.62, "elapsed_time": "13:33:56", "remaining_time": "20:40:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4301, "total_steps": 10853, "loss": 0.1525, "learning_rate": 3.5323602291334508e-06, "epoch": 0.3962776984382918, "percentage": 39.63, "elapsed_time": "13:34:07", "remaining_time": "20:40:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4302, "total_steps": 10853, "loss": 0.1462, "learning_rate": 3.5316663825889384e-06, "epoch": 0.3963698346155618, "percentage": 39.64, "elapsed_time": "13:34:16", "remaining_time": "20:39:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4303, "total_steps": 10853, "loss": 0.1465, "learning_rate": 3.530972440254092e-06, "epoch": 0.3964619707928318, "percentage": 39.65, "elapsed_time": "13:34:27", "remaining_time": "20:39:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4304, "total_steps": 10853, "loss": 0.1501, "learning_rate": 3.530278402193342e-06, "epoch": 0.3965541069701018, "percentage": 39.66, "elapsed_time": "13:34:39", "remaining_time": "20:39:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4305, "total_steps": 10853, "loss": 0.1487, "learning_rate": 3.5295842684711334e-06, "epoch": 0.3966462431473718, "percentage": 39.67, "elapsed_time": "13:34:51", "remaining_time": "20:39:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4306, "total_steps": 10853, "loss": 0.1374, "learning_rate": 3.528890039151913e-06, "epoch": 0.39673837932464184, "percentage": 39.68, "elapsed_time": "13:35:01", "remaining_time": "20:39:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4307, "total_steps": 10853, "loss": 0.165, "learning_rate": 3.5281957143001426e-06, "epoch": 0.39683051550191184, "percentage": 39.68, "elapsed_time": "13:35:11", "remaining_time": "20:38:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4308, "total_steps": 10853, "loss": 0.1546, "learning_rate": 3.5275012939802895e-06, "epoch": 0.39692265167918184, "percentage": 39.69, "elapsed_time": "13:35:22", "remaining_time": "20:38:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4309, "total_steps": 10853, "loss": 0.1433, "learning_rate": 3.5268067782568306e-06, "epoch": 0.39701478785645183, "percentage": 39.7, "elapsed_time": "13:35:33", "remaining_time": "20:38:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4310, "total_steps": 10853, "loss": 0.1475, "learning_rate": 3.5261121671942515e-06, "epoch": 0.39710692403372183, "percentage": 39.71, "elapsed_time": "13:35:44", "remaining_time": "20:38:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4311, "total_steps": 10853, "loss": 0.1468, "learning_rate": 3.525417460857048e-06, "epoch": 0.39719906021099183, "percentage": 39.72, "elapsed_time": "13:35:54", "remaining_time": "20:38:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4312, "total_steps": 10853, "loss": 0.1642, "learning_rate": 3.524722659309722e-06, "epoch": 0.3972911963882618, "percentage": 39.73, "elapsed_time": "13:36:06", "remaining_time": "20:37:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4313, "total_steps": 10853, "loss": 0.1434, "learning_rate": 3.5240277626167875e-06, "epoch": 0.3973833325655319, "percentage": 39.74, "elapsed_time": "13:36:18", "remaining_time": "20:37:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4314, "total_steps": 10853, "loss": 0.1382, "learning_rate": 3.5233327708427638e-06, "epoch": 0.3974754687428019, "percentage": 39.75, "elapsed_time": "13:36:27", "remaining_time": "20:37:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4315, "total_steps": 10853, "loss": 0.1358, "learning_rate": 3.522637684052184e-06, "epoch": 0.39756760492007187, "percentage": 39.76, "elapsed_time": "13:36:38", "remaining_time": "20:37:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4316, "total_steps": 10853, "loss": 0.1547, "learning_rate": 3.5219425023095837e-06, "epoch": 0.39765974109734187, "percentage": 39.77, "elapsed_time": "13:36:50", "remaining_time": "20:37:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4317, "total_steps": 10853, "loss": 0.151, "learning_rate": 3.5212472256795122e-06, "epoch": 0.39775187727461186, "percentage": 39.78, "elapsed_time": "13:37:01", "remaining_time": "20:36:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4318, "total_steps": 10853, "loss": 0.1536, "learning_rate": 3.5205518542265265e-06, "epoch": 0.39784401345188186, "percentage": 39.79, "elapsed_time": "13:37:12", "remaining_time": "20:36:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4319, "total_steps": 10853, "loss": 0.1609, "learning_rate": 3.5198563880151913e-06, "epoch": 0.3979361496291519, "percentage": 39.8, "elapsed_time": "13:37:23", "remaining_time": "20:36:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4320, "total_steps": 10853, "loss": 0.1391, "learning_rate": 3.519160827110081e-06, "epoch": 0.3980282858064219, "percentage": 39.8, "elapsed_time": "13:37:34", "remaining_time": "20:36:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4321, "total_steps": 10853, "loss": 0.148, "learning_rate": 3.5184651715757772e-06, "epoch": 0.3981204219836919, "percentage": 39.81, "elapsed_time": "13:37:44", "remaining_time": "20:36:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4322, "total_steps": 10853, "loss": 0.1324, "learning_rate": 3.517769421476873e-06, "epoch": 0.3982125581609619, "percentage": 39.82, "elapsed_time": "13:37:54", "remaining_time": "20:35:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4323, "total_steps": 10853, "loss": 0.1576, "learning_rate": 3.5170735768779683e-06, "epoch": 0.3983046943382319, "percentage": 39.83, "elapsed_time": "13:38:04", "remaining_time": "20:35:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4324, "total_steps": 10853, "loss": 0.1509, "learning_rate": 3.5163776378436736e-06, "epoch": 0.3983968305155019, "percentage": 39.84, "elapsed_time": "13:38:15", "remaining_time": "20:35:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4325, "total_steps": 10853, "loss": 0.1584, "learning_rate": 3.515681604438605e-06, "epoch": 0.3984889666927719, "percentage": 39.85, "elapsed_time": "13:38:26", "remaining_time": "20:35:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4326, "total_steps": 10853, "loss": 0.163, "learning_rate": 3.5149854767273904e-06, "epoch": 0.39858110287004195, "percentage": 39.86, "elapsed_time": "13:38:35", "remaining_time": "20:35:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4327, "total_steps": 10853, "loss": 0.1507, "learning_rate": 3.5142892547746647e-06, "epoch": 0.39867323904731194, "percentage": 39.87, "elapsed_time": "13:38:46", "remaining_time": "20:34:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4328, "total_steps": 10853, "loss": 0.1598, "learning_rate": 3.513592938645073e-06, "epoch": 0.39876537522458194, "percentage": 39.88, "elapsed_time": "13:38:57", "remaining_time": "20:34:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4329, "total_steps": 10853, "loss": 0.1378, "learning_rate": 3.5128965284032677e-06, "epoch": 0.39885751140185194, "percentage": 39.89, "elapsed_time": "13:39:08", "remaining_time": "20:34:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4330, "total_steps": 10853, "loss": 0.1586, "learning_rate": 3.512200024113911e-06, "epoch": 0.39894964757912194, "percentage": 39.9, "elapsed_time": "13:39:19", "remaining_time": "20:34:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4331, "total_steps": 10853, "loss": 0.158, "learning_rate": 3.511503425841672e-06, "epoch": 0.39904178375639193, "percentage": 39.91, "elapsed_time": "13:39:29", "remaining_time": "20:34:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4332, "total_steps": 10853, "loss": 0.1327, "learning_rate": 3.5108067336512325e-06, "epoch": 0.39913391993366193, "percentage": 39.92, "elapsed_time": "13:39:42", "remaining_time": "20:33:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4333, "total_steps": 10853, "loss": 0.1561, "learning_rate": 3.5101099476072776e-06, "epoch": 0.399226056110932, "percentage": 39.92, "elapsed_time": "13:39:51", "remaining_time": "20:33:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4334, "total_steps": 10853, "loss": 0.1564, "learning_rate": 3.5094130677745065e-06, "epoch": 0.399318192288202, "percentage": 39.93, "elapsed_time": "13:40:02", "remaining_time": "20:33:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4335, "total_steps": 10853, "loss": 0.1551, "learning_rate": 3.5087160942176228e-06, "epoch": 0.399410328465472, "percentage": 39.94, "elapsed_time": "13:40:13", "remaining_time": "20:33:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4336, "total_steps": 10853, "loss": 0.149, "learning_rate": 3.5080190270013415e-06, "epoch": 0.399502464642742, "percentage": 39.95, "elapsed_time": "13:40:25", "remaining_time": "20:33:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4337, "total_steps": 10853, "loss": 0.1491, "learning_rate": 3.5073218661903852e-06, "epoch": 0.39959460082001197, "percentage": 39.96, "elapsed_time": "13:40:36", "remaining_time": "20:32:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4338, "total_steps": 10853, "loss": 0.1651, "learning_rate": 3.5066246118494847e-06, "epoch": 0.39968673699728197, "percentage": 39.97, "elapsed_time": "13:40:49", "remaining_time": "20:32:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4339, "total_steps": 10853, "loss": 0.1455, "learning_rate": 3.5059272640433808e-06, "epoch": 0.39977887317455196, "percentage": 39.98, "elapsed_time": "13:40:59", "remaining_time": "20:32:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4340, "total_steps": 10853, "loss": 0.1585, "learning_rate": 3.5052298228368227e-06, "epoch": 0.399871009351822, "percentage": 39.99, "elapsed_time": "13:41:10", "remaining_time": "20:32:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4341, "total_steps": 10853, "loss": 0.1511, "learning_rate": 3.5045322882945666e-06, "epoch": 0.399963145529092, "percentage": 40.0, "elapsed_time": "13:41:21", "remaining_time": "20:32:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4342, "total_steps": 10853, "loss": 0.1208, "learning_rate": 3.5038346604813796e-06, "epoch": 0.400055281706362, "percentage": 40.01, "elapsed_time": "13:41:30", "remaining_time": "20:31:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4343, "total_steps": 10853, "loss": 0.1461, "learning_rate": 3.5031369394620364e-06, "epoch": 0.400147417883632, "percentage": 40.02, "elapsed_time": "13:41:41", "remaining_time": "20:31:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4344, "total_steps": 10853, "loss": 0.1492, "learning_rate": 3.5024391253013206e-06, "epoch": 0.400239554060902, "percentage": 40.03, "elapsed_time": "13:41:53", "remaining_time": "20:31:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4345, "total_steps": 10853, "loss": 0.1521, "learning_rate": 3.5017412180640243e-06, "epoch": 0.400331690238172, "percentage": 40.04, "elapsed_time": "13:42:02", "remaining_time": "20:31:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4346, "total_steps": 10853, "loss": 0.1609, "learning_rate": 3.5010432178149473e-06, "epoch": 0.400423826415442, "percentage": 40.04, "elapsed_time": "13:42:14", "remaining_time": "20:31:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4347, "total_steps": 10853, "loss": 0.1482, "learning_rate": 3.5003451246189003e-06, "epoch": 0.40051596259271205, "percentage": 40.05, "elapsed_time": "13:42:25", "remaining_time": "20:30:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4348, "total_steps": 10853, "loss": 0.146, "learning_rate": 3.499646938540701e-06, "epoch": 0.40060809876998205, "percentage": 40.06, "elapsed_time": "13:42:37", "remaining_time": "20:30:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4349, "total_steps": 10853, "loss": 0.1484, "learning_rate": 3.498948659645176e-06, "epoch": 0.40070023494725204, "percentage": 40.07, "elapsed_time": "13:42:47", "remaining_time": "20:30:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4350, "total_steps": 10853, "loss": 0.1429, "learning_rate": 3.4982502879971596e-06, "epoch": 0.40079237112452204, "percentage": 40.08, "elapsed_time": "13:42:58", "remaining_time": "20:30:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4351, "total_steps": 10853, "loss": 0.1438, "learning_rate": 3.497551823661498e-06, "epoch": 0.40088450730179204, "percentage": 40.09, "elapsed_time": "13:43:07", "remaining_time": "20:30:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4352, "total_steps": 10853, "loss": 0.1684, "learning_rate": 3.4968532667030408e-06, "epoch": 0.40097664347906203, "percentage": 40.1, "elapsed_time": "13:43:17", "remaining_time": "20:29:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4353, "total_steps": 10853, "loss": 0.1452, "learning_rate": 3.496154617186651e-06, "epoch": 0.4010687796563321, "percentage": 40.11, "elapsed_time": "13:43:29", "remaining_time": "20:29:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4354, "total_steps": 10853, "loss": 0.1611, "learning_rate": 3.4954558751771976e-06, "epoch": 0.4011609158336021, "percentage": 40.12, "elapsed_time": "13:43:40", "remaining_time": "20:29:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4355, "total_steps": 10853, "loss": 0.1568, "learning_rate": 3.4947570407395593e-06, "epoch": 0.4012530520108721, "percentage": 40.13, "elapsed_time": "13:43:49", "remaining_time": "20:29:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4356, "total_steps": 10853, "loss": 0.1454, "learning_rate": 3.494058113938623e-06, "epoch": 0.4013451881881421, "percentage": 40.14, "elapsed_time": "13:44:00", "remaining_time": "20:29:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4357, "total_steps": 10853, "loss": 0.1454, "learning_rate": 3.493359094839284e-06, "epoch": 0.4014373243654121, "percentage": 40.15, "elapsed_time": "13:44:11", "remaining_time": "20:28:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4358, "total_steps": 10853, "loss": 0.1527, "learning_rate": 3.4926599835064446e-06, "epoch": 0.40152946054268207, "percentage": 40.15, "elapsed_time": "13:44:21", "remaining_time": "20:28:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4359, "total_steps": 10853, "loss": 0.1488, "learning_rate": 3.491960780005021e-06, "epoch": 0.40162159671995207, "percentage": 40.16, "elapsed_time": "13:44:31", "remaining_time": "20:28:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4360, "total_steps": 10853, "loss": 0.1519, "learning_rate": 3.4912614843999304e-06, "epoch": 0.4017137328972221, "percentage": 40.17, "elapsed_time": "13:44:41", "remaining_time": "20:28:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4361, "total_steps": 10853, "loss": 0.145, "learning_rate": 3.490562096756105e-06, "epoch": 0.4018058690744921, "percentage": 40.18, "elapsed_time": "13:44:50", "remaining_time": "20:27:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4362, "total_steps": 10853, "loss": 0.1319, "learning_rate": 3.4898626171384823e-06, "epoch": 0.4018980052517621, "percentage": 40.19, "elapsed_time": "13:45:01", "remaining_time": "20:27:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4363, "total_steps": 10853, "loss": 0.1478, "learning_rate": 3.4891630456120098e-06, "epoch": 0.4019901414290321, "percentage": 40.2, "elapsed_time": "13:45:14", "remaining_time": "20:27:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4364, "total_steps": 10853, "loss": 0.1411, "learning_rate": 3.4884633822416412e-06, "epoch": 0.4020822776063021, "percentage": 40.21, "elapsed_time": "13:45:26", "remaining_time": "20:27:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4365, "total_steps": 10853, "loss": 0.1557, "learning_rate": 3.4877636270923416e-06, "epoch": 0.4021744137835721, "percentage": 40.22, "elapsed_time": "13:45:36", "remaining_time": "20:27:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4366, "total_steps": 10853, "loss": 0.1528, "learning_rate": 3.4870637802290817e-06, "epoch": 0.4022665499608421, "percentage": 40.23, "elapsed_time": "13:45:47", "remaining_time": "20:26:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4367, "total_steps": 10853, "loss": 0.1406, "learning_rate": 3.4863638417168455e-06, "epoch": 0.40235868613811215, "percentage": 40.24, "elapsed_time": "13:45:59", "remaining_time": "20:26:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4368, "total_steps": 10853, "loss": 0.1522, "learning_rate": 3.4856638116206194e-06, "epoch": 0.40245082231538215, "percentage": 40.25, "elapsed_time": "13:46:11", "remaining_time": "20:26:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4369, "total_steps": 10853, "loss": 0.1414, "learning_rate": 3.4849636900054023e-06, "epoch": 0.40254295849265215, "percentage": 40.26, "elapsed_time": "13:46:21", "remaining_time": "20:26:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4370, "total_steps": 10853, "loss": 0.1527, "learning_rate": 3.484263476936201e-06, "epoch": 0.40263509466992214, "percentage": 40.27, "elapsed_time": "13:46:32", "remaining_time": "20:26:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4371, "total_steps": 10853, "loss": 0.1445, "learning_rate": 3.4835631724780296e-06, "epoch": 0.40272723084719214, "percentage": 40.27, "elapsed_time": "13:46:43", "remaining_time": "20:25:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4372, "total_steps": 10853, "loss": 0.1491, "learning_rate": 3.4828627766959123e-06, "epoch": 0.40281936702446214, "percentage": 40.28, "elapsed_time": "13:46:54", "remaining_time": "20:25:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4373, "total_steps": 10853, "loss": 0.1483, "learning_rate": 3.4821622896548795e-06, "epoch": 0.40291150320173214, "percentage": 40.29, "elapsed_time": "13:47:05", "remaining_time": "20:25:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4374, "total_steps": 10853, "loss": 0.1514, "learning_rate": 3.4814617114199722e-06, "epoch": 0.4030036393790022, "percentage": 40.3, "elapsed_time": "13:47:17", "remaining_time": "20:25:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4375, "total_steps": 10853, "loss": 0.1599, "learning_rate": 3.4807610420562406e-06, "epoch": 0.4030957755562722, "percentage": 40.31, "elapsed_time": "13:47:28", "remaining_time": "20:25:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4376, "total_steps": 10853, "loss": 0.1532, "learning_rate": 3.48006028162874e-06, "epoch": 0.4031879117335422, "percentage": 40.32, "elapsed_time": "13:47:39", "remaining_time": "20:25:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4377, "total_steps": 10853, "loss": 0.1465, "learning_rate": 3.4793594302025367e-06, "epoch": 0.4032800479108122, "percentage": 40.33, "elapsed_time": "13:47:51", "remaining_time": "20:24:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4378, "total_steps": 10853, "loss": 0.134, "learning_rate": 3.4786584878427056e-06, "epoch": 0.4033721840880822, "percentage": 40.34, "elapsed_time": "13:48:02", "remaining_time": "20:24:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4379, "total_steps": 10853, "loss": 0.1539, "learning_rate": 3.4779574546143276e-06, "epoch": 0.40346432026535217, "percentage": 40.35, "elapsed_time": "13:48:13", "remaining_time": "20:24:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4380, "total_steps": 10853, "loss": 0.1612, "learning_rate": 3.4772563305824956e-06, "epoch": 0.40355645644262217, "percentage": 40.36, "elapsed_time": "13:48:25", "remaining_time": "20:24:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4381, "total_steps": 10853, "loss": 0.1333, "learning_rate": 3.4765551158123074e-06, "epoch": 0.4036485926198922, "percentage": 40.37, "elapsed_time": "13:48:35", "remaining_time": "20:24:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4382, "total_steps": 10853, "loss": 0.1525, "learning_rate": 3.4758538103688723e-06, "epoch": 0.4037407287971622, "percentage": 40.38, "elapsed_time": "13:48:47", "remaining_time": "20:23:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4383, "total_steps": 10853, "loss": 0.1651, "learning_rate": 3.4751524143173055e-06, "epoch": 0.4038328649744322, "percentage": 40.39, "elapsed_time": "13:48:58", "remaining_time": "20:23:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4384, "total_steps": 10853, "loss": 0.1493, "learning_rate": 3.4744509277227316e-06, "epoch": 0.4039250011517022, "percentage": 40.39, "elapsed_time": "13:49:09", "remaining_time": "20:23:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4385, "total_steps": 10853, "loss": 0.1554, "learning_rate": 3.473749350650285e-06, "epoch": 0.4040171373289722, "percentage": 40.4, "elapsed_time": "13:49:19", "remaining_time": "20:23:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4386, "total_steps": 10853, "loss": 0.1552, "learning_rate": 3.473047683165106e-06, "epoch": 0.4041092735062422, "percentage": 40.41, "elapsed_time": "13:49:29", "remaining_time": "20:23:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4387, "total_steps": 10853, "loss": 0.156, "learning_rate": 3.472345925332344e-06, "epoch": 0.40420140968351226, "percentage": 40.42, "elapsed_time": "13:49:40", "remaining_time": "20:22:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4388, "total_steps": 10853, "loss": 0.1601, "learning_rate": 3.47164407721716e-06, "epoch": 0.40429354586078226, "percentage": 40.43, "elapsed_time": "13:49:51", "remaining_time": "20:22:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4389, "total_steps": 10853, "loss": 0.1442, "learning_rate": 3.4709421388847177e-06, "epoch": 0.40438568203805225, "percentage": 40.44, "elapsed_time": "13:50:01", "remaining_time": "20:22:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4390, "total_steps": 10853, "loss": 0.161, "learning_rate": 3.4702401104001937e-06, "epoch": 0.40447781821532225, "percentage": 40.45, "elapsed_time": "13:50:12", "remaining_time": "20:22:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4391, "total_steps": 10853, "loss": 0.147, "learning_rate": 3.4695379918287708e-06, "epoch": 0.40456995439259225, "percentage": 40.46, "elapsed_time": "13:50:23", "remaining_time": "20:22:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4392, "total_steps": 10853, "loss": 0.1664, "learning_rate": 3.468835783235641e-06, "epoch": 0.40466209056986224, "percentage": 40.47, "elapsed_time": "13:50:35", "remaining_time": "20:21:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4393, "total_steps": 10853, "loss": 0.1581, "learning_rate": 3.468133484686005e-06, "epoch": 0.40475422674713224, "percentage": 40.48, "elapsed_time": "13:50:46", "remaining_time": "20:21:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4394, "total_steps": 10853, "loss": 0.1458, "learning_rate": 3.467431096245071e-06, "epoch": 0.4048463629244023, "percentage": 40.49, "elapsed_time": "13:50:56", "remaining_time": "20:21:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4395, "total_steps": 10853, "loss": 0.1465, "learning_rate": 3.466728617978054e-06, "epoch": 0.4049384991016723, "percentage": 40.5, "elapsed_time": "13:51:07", "remaining_time": "20:21:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4396, "total_steps": 10853, "loss": 0.1533, "learning_rate": 3.466026049950182e-06, "epoch": 0.4050306352789423, "percentage": 40.5, "elapsed_time": "13:51:17", "remaining_time": "20:21:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4397, "total_steps": 10853, "loss": 0.1474, "learning_rate": 3.465323392226687e-06, "epoch": 0.4051227714562123, "percentage": 40.51, "elapsed_time": "13:51:28", "remaining_time": "20:20:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4398, "total_steps": 10853, "loss": 0.1471, "learning_rate": 3.4646206448728113e-06, "epoch": 0.4052149076334823, "percentage": 40.52, "elapsed_time": "13:51:37", "remaining_time": "20:20:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4399, "total_steps": 10853, "loss": 0.1514, "learning_rate": 3.463917807953805e-06, "epoch": 0.4053070438107523, "percentage": 40.53, "elapsed_time": "13:51:47", "remaining_time": "20:20:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4400, "total_steps": 10853, "loss": 0.1411, "learning_rate": 3.4632148815349265e-06, "epoch": 0.4053991799880223, "percentage": 40.54, "elapsed_time": "13:52:00", "remaining_time": "20:20:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4401, "total_steps": 10853, "loss": 0.1531, "learning_rate": 3.4625118656814414e-06, "epoch": 0.4054913161652923, "percentage": 40.55, "elapsed_time": "13:52:10", "remaining_time": "20:19:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4402, "total_steps": 10853, "loss": 0.1476, "learning_rate": 3.4618087604586277e-06, "epoch": 0.4055834523425623, "percentage": 40.56, "elapsed_time": "13:52:20", "remaining_time": "20:19:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4403, "total_steps": 10853, "loss": 0.1403, "learning_rate": 3.4611055659317663e-06, "epoch": 0.4056755885198323, "percentage": 40.57, "elapsed_time": "13:52:31", "remaining_time": "20:19:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4404, "total_steps": 10853, "loss": 0.1217, "learning_rate": 3.4604022821661493e-06, "epoch": 0.4057677246971023, "percentage": 40.58, "elapsed_time": "13:52:41", "remaining_time": "20:19:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4405, "total_steps": 10853, "loss": 0.15, "learning_rate": 3.459698909227078e-06, "epoch": 0.4058598608743723, "percentage": 40.59, "elapsed_time": "13:52:52", "remaining_time": "20:19:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4406, "total_steps": 10853, "loss": 0.1442, "learning_rate": 3.458995447179858e-06, "epoch": 0.4059519970516423, "percentage": 40.6, "elapsed_time": "13:53:03", "remaining_time": "20:18:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4407, "total_steps": 10853, "loss": 0.1556, "learning_rate": 3.4582918960898094e-06, "epoch": 0.4060441332289123, "percentage": 40.61, "elapsed_time": "13:53:13", "remaining_time": "20:18:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4408, "total_steps": 10853, "loss": 0.1425, "learning_rate": 3.457588256022254e-06, "epoch": 0.40613626940618236, "percentage": 40.62, "elapsed_time": "13:53:24", "remaining_time": "20:18:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4409, "total_steps": 10853, "loss": 0.1402, "learning_rate": 3.4568845270425268e-06, "epoch": 0.40622840558345236, "percentage": 40.62, "elapsed_time": "13:53:35", "remaining_time": "20:18:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4410, "total_steps": 10853, "loss": 0.1391, "learning_rate": 3.456180709215968e-06, "epoch": 0.40632054176072235, "percentage": 40.63, "elapsed_time": "13:53:45", "remaining_time": "20:18:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4411, "total_steps": 10853, "loss": 0.1455, "learning_rate": 3.455476802607927e-06, "epoch": 0.40641267793799235, "percentage": 40.64, "elapsed_time": "13:53:57", "remaining_time": "20:17:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4412, "total_steps": 10853, "loss": 0.1595, "learning_rate": 3.454772807283763e-06, "epoch": 0.40650481411526235, "percentage": 40.65, "elapsed_time": "13:54:07", "remaining_time": "20:17:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4413, "total_steps": 10853, "loss": 0.1451, "learning_rate": 3.45406872330884e-06, "epoch": 0.40659695029253234, "percentage": 40.66, "elapsed_time": "13:54:18", "remaining_time": "20:17:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4414, "total_steps": 10853, "loss": 0.1496, "learning_rate": 3.453364550748533e-06, "epoch": 0.40668908646980234, "percentage": 40.67, "elapsed_time": "13:54:29", "remaining_time": "20:17:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4415, "total_steps": 10853, "loss": 0.1435, "learning_rate": 3.4526602896682267e-06, "epoch": 0.4067812226470724, "percentage": 40.68, "elapsed_time": "13:54:39", "remaining_time": "20:17:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4416, "total_steps": 10853, "loss": 0.1436, "learning_rate": 3.451955940133308e-06, "epoch": 0.4068733588243424, "percentage": 40.69, "elapsed_time": "13:54:50", "remaining_time": "20:16:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4417, "total_steps": 10853, "loss": 0.1572, "learning_rate": 3.451251502209179e-06, "epoch": 0.4069654950016124, "percentage": 40.7, "elapsed_time": "13:55:00", "remaining_time": "20:16:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4418, "total_steps": 10853, "loss": 0.1454, "learning_rate": 3.4505469759612453e-06, "epoch": 0.4070576311788824, "percentage": 40.71, "elapsed_time": "13:55:11", "remaining_time": "20:16:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4419, "total_steps": 10853, "loss": 0.1437, "learning_rate": 3.4498423614549226e-06, "epoch": 0.4071497673561524, "percentage": 40.72, "elapsed_time": "13:55:22", "remaining_time": "20:16:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4420, "total_steps": 10853, "loss": 0.1558, "learning_rate": 3.449137658755635e-06, "epoch": 0.4072419035334224, "percentage": 40.73, "elapsed_time": "13:55:33", "remaining_time": "20:16:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4421, "total_steps": 10853, "loss": 0.1512, "learning_rate": 3.4484328679288133e-06, "epoch": 0.40733403971069243, "percentage": 40.74, "elapsed_time": "13:55:43", "remaining_time": "20:15:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4422, "total_steps": 10853, "loss": 0.1472, "learning_rate": 3.4477279890398968e-06, "epoch": 0.4074261758879624, "percentage": 40.74, "elapsed_time": "13:55:56", "remaining_time": "20:15:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4423, "total_steps": 10853, "loss": 0.1431, "learning_rate": 3.4470230221543362e-06, "epoch": 0.4075183120652324, "percentage": 40.75, "elapsed_time": "13:56:07", "remaining_time": "20:15:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4424, "total_steps": 10853, "loss": 0.1426, "learning_rate": 3.4463179673375846e-06, "epoch": 0.4076104482425024, "percentage": 40.76, "elapsed_time": "13:56:18", "remaining_time": "20:15:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4425, "total_steps": 10853, "loss": 0.1414, "learning_rate": 3.445612824655108e-06, "epoch": 0.4077025844197724, "percentage": 40.77, "elapsed_time": "13:56:29", "remaining_time": "20:15:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4426, "total_steps": 10853, "loss": 0.1427, "learning_rate": 3.4449075941723797e-06, "epoch": 0.4077947205970424, "percentage": 40.78, "elapsed_time": "13:56:40", "remaining_time": "20:14:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4427, "total_steps": 10853, "loss": 0.1412, "learning_rate": 3.444202275954879e-06, "epoch": 0.4078868567743124, "percentage": 40.79, "elapsed_time": "13:56:51", "remaining_time": "20:14:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4428, "total_steps": 10853, "loss": 0.1483, "learning_rate": 3.443496870068096e-06, "epoch": 0.40797899295158246, "percentage": 40.8, "elapsed_time": "13:57:02", "remaining_time": "20:14:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4429, "total_steps": 10853, "loss": 0.1372, "learning_rate": 3.442791376577527e-06, "epoch": 0.40807112912885246, "percentage": 40.81, "elapsed_time": "13:57:12", "remaining_time": "20:14:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4430, "total_steps": 10853, "loss": 0.1442, "learning_rate": 3.4420857955486756e-06, "epoch": 0.40816326530612246, "percentage": 40.82, "elapsed_time": "13:57:22", "remaining_time": "20:14:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4431, "total_steps": 10853, "loss": 0.1345, "learning_rate": 3.441380127047058e-06, "epoch": 0.40825540148339245, "percentage": 40.83, "elapsed_time": "13:57:34", "remaining_time": "20:13:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4432, "total_steps": 10853, "loss": 0.1435, "learning_rate": 3.4406743711381945e-06, "epoch": 0.40834753766066245, "percentage": 40.84, "elapsed_time": "13:57:45", "remaining_time": "20:13:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4433, "total_steps": 10853, "loss": 0.1462, "learning_rate": 3.439968527887614e-06, "epoch": 0.40843967383793245, "percentage": 40.85, "elapsed_time": "13:57:56", "remaining_time": "20:13:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4434, "total_steps": 10853, "loss": 0.152, "learning_rate": 3.439262597360855e-06, "epoch": 0.40853181001520245, "percentage": 40.86, "elapsed_time": "13:58:07", "remaining_time": "20:13:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4435, "total_steps": 10853, "loss": 0.1412, "learning_rate": 3.438556579623462e-06, "epoch": 0.4086239461924725, "percentage": 40.86, "elapsed_time": "13:58:16", "remaining_time": "20:13:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4436, "total_steps": 10853, "loss": 0.1574, "learning_rate": 3.43785047474099e-06, "epoch": 0.4087160823697425, "percentage": 40.87, "elapsed_time": "13:58:27", "remaining_time": "20:12:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4437, "total_steps": 10853, "loss": 0.1449, "learning_rate": 3.437144282779e-06, "epoch": 0.4088082185470125, "percentage": 40.88, "elapsed_time": "13:58:39", "remaining_time": "20:12:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4438, "total_steps": 10853, "loss": 0.1647, "learning_rate": 3.4364380038030636e-06, "epoch": 0.4089003547242825, "percentage": 40.89, "elapsed_time": "13:58:51", "remaining_time": "20:12:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4439, "total_steps": 10853, "loss": 0.146, "learning_rate": 3.435731637878757e-06, "epoch": 0.4089924909015525, "percentage": 40.9, "elapsed_time": "13:59:01", "remaining_time": "20:12:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4440, "total_steps": 10853, "loss": 0.1494, "learning_rate": 3.435025185071668e-06, "epoch": 0.4090846270788225, "percentage": 40.91, "elapsed_time": "13:59:14", "remaining_time": "20:12:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4441, "total_steps": 10853, "loss": 0.1344, "learning_rate": 3.434318645447388e-06, "epoch": 0.4091767632560925, "percentage": 40.92, "elapsed_time": "13:59:24", "remaining_time": "20:11:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4442, "total_steps": 10853, "loss": 0.1481, "learning_rate": 3.433612019071523e-06, "epoch": 0.40926889943336253, "percentage": 40.93, "elapsed_time": "13:59:34", "remaining_time": "20:11:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4443, "total_steps": 10853, "loss": 0.1564, "learning_rate": 3.4329053060096805e-06, "epoch": 0.40936103561063253, "percentage": 40.94, "elapsed_time": "13:59:44", "remaining_time": "20:11:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4444, "total_steps": 10853, "loss": 0.1566, "learning_rate": 3.4321985063274805e-06, "epoch": 0.4094531717879025, "percentage": 40.95, "elapsed_time": "13:59:55", "remaining_time": "20:11:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4445, "total_steps": 10853, "loss": 0.1529, "learning_rate": 3.431491620090549e-06, "epoch": 0.4095453079651725, "percentage": 40.96, "elapsed_time": "14:00:05", "remaining_time": "20:11:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4446, "total_steps": 10853, "loss": 0.1382, "learning_rate": 3.43078464736452e-06, "epoch": 0.4096374441424425, "percentage": 40.97, "elapsed_time": "14:00:16", "remaining_time": "20:10:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4447, "total_steps": 10853, "loss": 0.1642, "learning_rate": 3.4300775882150367e-06, "epoch": 0.4097295803197125, "percentage": 40.97, "elapsed_time": "14:00:26", "remaining_time": "20:10:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4448, "total_steps": 10853, "loss": 0.1474, "learning_rate": 3.429370442707749e-06, "epoch": 0.4098217164969825, "percentage": 40.98, "elapsed_time": "14:00:38", "remaining_time": "20:10:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4449, "total_steps": 10853, "loss": 0.1565, "learning_rate": 3.428663210908315e-06, "epoch": 0.40991385267425257, "percentage": 40.99, "elapsed_time": "14:00:50", "remaining_time": "20:10:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4450, "total_steps": 10853, "loss": 0.1561, "learning_rate": 3.427955892882403e-06, "epoch": 0.41000598885152256, "percentage": 41.0, "elapsed_time": "14:01:02", "remaining_time": "20:10:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4451, "total_steps": 10853, "loss": 0.1532, "learning_rate": 3.4272484886956856e-06, "epoch": 0.41009812502879256, "percentage": 41.01, "elapsed_time": "14:01:14", "remaining_time": "20:09:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4452, "total_steps": 10853, "loss": 0.1552, "learning_rate": 3.4265409984138463e-06, "epoch": 0.41019026120606256, "percentage": 41.02, "elapsed_time": "14:01:24", "remaining_time": "20:09:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4453, "total_steps": 10853, "loss": 0.1392, "learning_rate": 3.4258334221025763e-06, "epoch": 0.41028239738333255, "percentage": 41.03, "elapsed_time": "14:01:35", "remaining_time": "20:09:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4454, "total_steps": 10853, "loss": 0.1408, "learning_rate": 3.425125759827573e-06, "epoch": 0.41037453356060255, "percentage": 41.04, "elapsed_time": "14:01:46", "remaining_time": "20:09:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4455, "total_steps": 10853, "loss": 0.1493, "learning_rate": 3.4244180116545434e-06, "epoch": 0.4104666697378726, "percentage": 41.05, "elapsed_time": "14:01:58", "remaining_time": "20:09:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4456, "total_steps": 10853, "loss": 0.1469, "learning_rate": 3.423710177649202e-06, "epoch": 0.4105588059151426, "percentage": 41.06, "elapsed_time": "14:02:10", "remaining_time": "20:09:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4457, "total_steps": 10853, "loss": 0.1524, "learning_rate": 3.423002257877271e-06, "epoch": 0.4106509420924126, "percentage": 41.07, "elapsed_time": "14:02:20", "remaining_time": "20:08:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4458, "total_steps": 10853, "loss": 0.1635, "learning_rate": 3.4222942524044817e-06, "epoch": 0.4107430782696826, "percentage": 41.08, "elapsed_time": "14:02:32", "remaining_time": "20:08:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4459, "total_steps": 10853, "loss": 0.1364, "learning_rate": 3.4215861612965705e-06, "epoch": 0.4108352144469526, "percentage": 41.09, "elapsed_time": "14:02:43", "remaining_time": "20:08:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4460, "total_steps": 10853, "loss": 0.1471, "learning_rate": 3.4208779846192856e-06, "epoch": 0.4109273506242226, "percentage": 41.09, "elapsed_time": "14:02:55", "remaining_time": "20:08:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4461, "total_steps": 10853, "loss": 0.1481, "learning_rate": 3.420169722438381e-06, "epoch": 0.4110194868014926, "percentage": 41.1, "elapsed_time": "14:03:06", "remaining_time": "20:08:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4462, "total_steps": 10853, "loss": 0.153, "learning_rate": 3.419461374819618e-06, "epoch": 0.41111162297876264, "percentage": 41.11, "elapsed_time": "14:03:18", "remaining_time": "20:07:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4463, "total_steps": 10853, "loss": 0.1479, "learning_rate": 3.418752941828769e-06, "epoch": 0.41120375915603263, "percentage": 41.12, "elapsed_time": "14:03:29", "remaining_time": "20:07:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4464, "total_steps": 10853, "loss": 0.1493, "learning_rate": 3.418044423531609e-06, "epoch": 0.41129589533330263, "percentage": 41.13, "elapsed_time": "14:03:41", "remaining_time": "20:07:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4465, "total_steps": 10853, "loss": 0.1544, "learning_rate": 3.4173358199939253e-06, "epoch": 0.4113880315105726, "percentage": 41.14, "elapsed_time": "14:03:50", "remaining_time": "20:07:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4466, "total_steps": 10853, "loss": 0.1501, "learning_rate": 3.416627131281513e-06, "epoch": 0.4114801676878426, "percentage": 41.15, "elapsed_time": "14:04:00", "remaining_time": "20:07:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4467, "total_steps": 10853, "loss": 0.1529, "learning_rate": 3.415918357460173e-06, "epoch": 0.4115723038651126, "percentage": 41.16, "elapsed_time": "14:04:10", "remaining_time": "20:06:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4468, "total_steps": 10853, "loss": 0.1537, "learning_rate": 3.4152094985957135e-06, "epoch": 0.4116644400423826, "percentage": 41.17, "elapsed_time": "14:04:21", "remaining_time": "20:06:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4469, "total_steps": 10853, "loss": 0.1422, "learning_rate": 3.4145005547539552e-06, "epoch": 0.41175657621965267, "percentage": 41.18, "elapsed_time": "14:04:31", "remaining_time": "20:06:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4470, "total_steps": 10853, "loss": 0.137, "learning_rate": 3.413791526000721e-06, "epoch": 0.41184871239692267, "percentage": 41.19, "elapsed_time": "14:04:41", "remaining_time": "20:06:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4471, "total_steps": 10853, "loss": 0.1487, "learning_rate": 3.4130824124018453e-06, "epoch": 0.41194084857419266, "percentage": 41.2, "elapsed_time": "14:04:52", "remaining_time": "20:05:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4472, "total_steps": 10853, "loss": 0.1505, "learning_rate": 3.4123732140231695e-06, "epoch": 0.41203298475146266, "percentage": 41.21, "elapsed_time": "14:05:04", "remaining_time": "20:05:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4473, "total_steps": 10853, "loss": 0.1559, "learning_rate": 3.411663930930543e-06, "epoch": 0.41212512092873266, "percentage": 41.21, "elapsed_time": "14:05:15", "remaining_time": "20:05:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4474, "total_steps": 10853, "loss": 0.1559, "learning_rate": 3.4109545631898223e-06, "epoch": 0.41221725710600265, "percentage": 41.22, "elapsed_time": "14:05:25", "remaining_time": "20:05:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4475, "total_steps": 10853, "loss": 0.1598, "learning_rate": 3.410245110866872e-06, "epoch": 0.41230939328327265, "percentage": 41.23, "elapsed_time": "14:05:37", "remaining_time": "20:05:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4476, "total_steps": 10853, "loss": 0.1373, "learning_rate": 3.409535574027565e-06, "epoch": 0.4124015294605427, "percentage": 41.24, "elapsed_time": "14:05:48", "remaining_time": "20:05:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4477, "total_steps": 10853, "loss": 0.1453, "learning_rate": 3.4088259527377826e-06, "epoch": 0.4124936656378127, "percentage": 41.25, "elapsed_time": "14:05:58", "remaining_time": "20:04:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4478, "total_steps": 10853, "loss": 0.1624, "learning_rate": 3.408116247063412e-06, "epoch": 0.4125858018150827, "percentage": 41.26, "elapsed_time": "14:06:11", "remaining_time": "20:04:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4479, "total_steps": 10853, "loss": 0.1439, "learning_rate": 3.407406457070351e-06, "epoch": 0.4126779379923527, "percentage": 41.27, "elapsed_time": "14:06:20", "remaining_time": "20:04:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4480, "total_steps": 10853, "loss": 0.1495, "learning_rate": 3.4066965828245023e-06, "epoch": 0.4127700741696227, "percentage": 41.28, "elapsed_time": "14:06:31", "remaining_time": "20:04:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4481, "total_steps": 10853, "loss": 0.1587, "learning_rate": 3.4059866243917784e-06, "epoch": 0.4128622103468927, "percentage": 41.29, "elapsed_time": "14:06:42", "remaining_time": "20:04:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4482, "total_steps": 10853, "loss": 0.1528, "learning_rate": 3.4052765818380988e-06, "epoch": 0.4129543465241627, "percentage": 41.3, "elapsed_time": "14:06:54", "remaining_time": "20:03:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4483, "total_steps": 10853, "loss": 0.1439, "learning_rate": 3.4045664552293913e-06, "epoch": 0.41304648270143274, "percentage": 41.31, "elapsed_time": "14:07:05", "remaining_time": "20:03:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4484, "total_steps": 10853, "loss": 0.1621, "learning_rate": 3.4038562446315908e-06, "epoch": 0.41313861887870273, "percentage": 41.32, "elapsed_time": "14:07:18", "remaining_time": "20:03:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4485, "total_steps": 10853, "loss": 0.1402, "learning_rate": 3.4031459501106412e-06, "epoch": 0.41323075505597273, "percentage": 41.32, "elapsed_time": "14:07:29", "remaining_time": "20:03:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4486, "total_steps": 10853, "loss": 0.1599, "learning_rate": 3.4024355717324927e-06, "epoch": 0.41332289123324273, "percentage": 41.33, "elapsed_time": "14:07:40", "remaining_time": "20:03:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4487, "total_steps": 10853, "loss": 0.15, "learning_rate": 3.4017251095631044e-06, "epoch": 0.4134150274105127, "percentage": 41.34, "elapsed_time": "14:07:51", "remaining_time": "20:02:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4488, "total_steps": 10853, "loss": 0.1457, "learning_rate": 3.401014563668442e-06, "epoch": 0.4135071635877827, "percentage": 41.35, "elapsed_time": "14:08:02", "remaining_time": "20:02:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4489, "total_steps": 10853, "loss": 0.1381, "learning_rate": 3.4003039341144807e-06, "epoch": 0.4135992997650528, "percentage": 41.36, "elapsed_time": "14:08:14", "remaining_time": "20:02:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4490, "total_steps": 10853, "loss": 0.1457, "learning_rate": 3.3995932209672028e-06, "epoch": 0.41369143594232277, "percentage": 41.37, "elapsed_time": "14:08:26", "remaining_time": "20:02:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4491, "total_steps": 10853, "loss": 0.1516, "learning_rate": 3.3988824242925965e-06, "epoch": 0.41378357211959277, "percentage": 41.38, "elapsed_time": "14:08:35", "remaining_time": "20:02:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4492, "total_steps": 10853, "loss": 0.1294, "learning_rate": 3.398171544156661e-06, "epoch": 0.41387570829686277, "percentage": 41.39, "elapsed_time": "14:08:47", "remaining_time": "20:01:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4493, "total_steps": 10853, "loss": 0.1455, "learning_rate": 3.3974605806254015e-06, "epoch": 0.41396784447413276, "percentage": 41.4, "elapsed_time": "14:08:58", "remaining_time": "20:01:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4494, "total_steps": 10853, "loss": 0.1471, "learning_rate": 3.3967495337648297e-06, "epoch": 0.41405998065140276, "percentage": 41.41, "elapsed_time": "14:09:09", "remaining_time": "20:01:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4495, "total_steps": 10853, "loss": 0.1588, "learning_rate": 3.396038403640968e-06, "epoch": 0.41415211682867276, "percentage": 41.42, "elapsed_time": "14:09:17", "remaining_time": "20:01:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4496, "total_steps": 10853, "loss": 0.1556, "learning_rate": 3.395327190319843e-06, "epoch": 0.4142442530059428, "percentage": 41.43, "elapsed_time": "14:09:27", "remaining_time": "20:01:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4497, "total_steps": 10853, "loss": 0.1425, "learning_rate": 3.394615893867492e-06, "epoch": 0.4143363891832128, "percentage": 41.44, "elapsed_time": "14:09:39", "remaining_time": "20:00:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4498, "total_steps": 10853, "loss": 0.1392, "learning_rate": 3.3939045143499604e-06, "epoch": 0.4144285253604828, "percentage": 41.44, "elapsed_time": "14:09:47", "remaining_time": "20:00:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4499, "total_steps": 10853, "loss": 0.146, "learning_rate": 3.393193051833297e-06, "epoch": 0.4145206615377528, "percentage": 41.45, "elapsed_time": "14:09:58", "remaining_time": "20:00:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4500, "total_steps": 10853, "loss": 0.1557, "learning_rate": 3.392481506383563e-06, "epoch": 0.4146127977150228, "percentage": 41.46, "elapsed_time": "14:10:09", "remaining_time": "20:00:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4500, "total_steps": 10853, "eval_loss": 0.14849522709846497, "epoch": 0.4146127977150228, "percentage": 41.46, "elapsed_time": "14:15:09", "remaining_time": "20:07:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4501, "total_steps": 10853, "loss": 0.1554, "learning_rate": 3.391769878066825e-06, "epoch": 0.4147049338922928, "percentage": 41.47, "elapsed_time": "14:15:19", "remaining_time": "20:07:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4502, "total_steps": 10853, "loss": 0.1483, "learning_rate": 3.391058166949159e-06, "epoch": 0.4147970700695628, "percentage": 41.48, "elapsed_time": "14:15:29", "remaining_time": "20:06:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4503, "total_steps": 10853, "loss": 0.1622, "learning_rate": 3.390346373096645e-06, "epoch": 0.41488920624683284, "percentage": 41.49, "elapsed_time": "14:15:40", "remaining_time": "20:06:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4504, "total_steps": 10853, "loss": 0.1542, "learning_rate": 3.3896344965753746e-06, "epoch": 0.41498134242410284, "percentage": 41.5, "elapsed_time": "14:15:51", "remaining_time": "20:06:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4505, "total_steps": 10853, "loss": 0.1522, "learning_rate": 3.3889225374514455e-06, "epoch": 0.41507347860137284, "percentage": 41.51, "elapsed_time": "14:16:03", "remaining_time": "20:06:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4506, "total_steps": 10853, "loss": 0.1447, "learning_rate": 3.388210495790964e-06, "epoch": 0.41516561477864283, "percentage": 41.52, "elapsed_time": "14:16:14", "remaining_time": "20:06:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4507, "total_steps": 10853, "loss": 0.1459, "learning_rate": 3.3874983716600414e-06, "epoch": 0.41525775095591283, "percentage": 41.53, "elapsed_time": "14:16:26", "remaining_time": "20:05:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4508, "total_steps": 10853, "loss": 0.1605, "learning_rate": 3.3867861651247997e-06, "epoch": 0.4153498871331828, "percentage": 41.54, "elapsed_time": "14:16:37", "remaining_time": "20:05:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4509, "total_steps": 10853, "loss": 0.1539, "learning_rate": 3.3860738762513674e-06, "epoch": 0.4154420233104528, "percentage": 41.55, "elapsed_time": "14:16:49", "remaining_time": "20:05:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4510, "total_steps": 10853, "loss": 0.1476, "learning_rate": 3.3853615051058798e-06, "epoch": 0.4155341594877229, "percentage": 41.56, "elapsed_time": "14:17:00", "remaining_time": "20:05:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4511, "total_steps": 10853, "loss": 0.1453, "learning_rate": 3.384649051754481e-06, "epoch": 0.4156262956649929, "percentage": 41.56, "elapsed_time": "14:17:11", "remaining_time": "20:05:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4512, "total_steps": 10853, "loss": 0.1554, "learning_rate": 3.3839365162633237e-06, "epoch": 0.41571843184226287, "percentage": 41.57, "elapsed_time": "14:17:21", "remaining_time": "20:04:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4513, "total_steps": 10853, "loss": 0.1581, "learning_rate": 3.3832238986985643e-06, "epoch": 0.41581056801953287, "percentage": 41.58, "elapsed_time": "14:17:32", "remaining_time": "20:04:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4514, "total_steps": 10853, "loss": 0.1353, "learning_rate": 3.382511199126372e-06, "epoch": 0.41590270419680286, "percentage": 41.59, "elapsed_time": "14:17:43", "remaining_time": "20:04:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4515, "total_steps": 10853, "loss": 0.1456, "learning_rate": 3.3817984176129194e-06, "epoch": 0.41599484037407286, "percentage": 41.6, "elapsed_time": "14:17:54", "remaining_time": "20:04:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4516, "total_steps": 10853, "loss": 0.1417, "learning_rate": 3.3810855542243892e-06, "epoch": 0.41608697655134286, "percentage": 41.61, "elapsed_time": "14:18:05", "remaining_time": "20:04:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4517, "total_steps": 10853, "loss": 0.146, "learning_rate": 3.38037260902697e-06, "epoch": 0.4161791127286129, "percentage": 41.62, "elapsed_time": "14:18:19", "remaining_time": "20:03:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4518, "total_steps": 10853, "loss": 0.1403, "learning_rate": 3.3796595820868596e-06, "epoch": 0.4162712489058829, "percentage": 41.63, "elapsed_time": "14:18:28", "remaining_time": "20:03:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4519, "total_steps": 10853, "loss": 0.1535, "learning_rate": 3.378946473470262e-06, "epoch": 0.4163633850831529, "percentage": 41.64, "elapsed_time": "14:18:39", "remaining_time": "20:03:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4520, "total_steps": 10853, "loss": 0.1357, "learning_rate": 3.37823328324339e-06, "epoch": 0.4164555212604229, "percentage": 41.65, "elapsed_time": "14:18:48", "remaining_time": "20:03:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4521, "total_steps": 10853, "loss": 0.1479, "learning_rate": 3.3775200114724632e-06, "epoch": 0.4165476574376929, "percentage": 41.66, "elapsed_time": "14:19:00", "remaining_time": "20:03:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4522, "total_steps": 10853, "loss": 0.162, "learning_rate": 3.3768066582237084e-06, "epoch": 0.4166397936149629, "percentage": 41.67, "elapsed_time": "14:19:11", "remaining_time": "20:02:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4523, "total_steps": 10853, "loss": 0.1555, "learning_rate": 3.3760932235633614e-06, "epoch": 0.41673192979223295, "percentage": 41.68, "elapsed_time": "14:19:22", "remaining_time": "20:02:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4524, "total_steps": 10853, "loss": 0.1515, "learning_rate": 3.3753797075576646e-06, "epoch": 0.41682406596950294, "percentage": 41.68, "elapsed_time": "14:19:32", "remaining_time": "20:02:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4525, "total_steps": 10853, "loss": 0.137, "learning_rate": 3.374666110272868e-06, "epoch": 0.41691620214677294, "percentage": 41.69, "elapsed_time": "14:19:43", "remaining_time": "20:02:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4526, "total_steps": 10853, "loss": 0.1297, "learning_rate": 3.3739524317752276e-06, "epoch": 0.41700833832404294, "percentage": 41.7, "elapsed_time": "14:19:55", "remaining_time": "20:02:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4527, "total_steps": 10853, "loss": 0.1383, "learning_rate": 3.373238672131011e-06, "epoch": 0.41710047450131293, "percentage": 41.71, "elapsed_time": "14:20:05", "remaining_time": "20:01:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4528, "total_steps": 10853, "loss": 0.1405, "learning_rate": 3.372524831406489e-06, "epoch": 0.41719261067858293, "percentage": 41.72, "elapsed_time": "14:20:16", "remaining_time": "20:01:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4529, "total_steps": 10853, "loss": 0.1425, "learning_rate": 3.371810909667943e-06, "epoch": 0.41728474685585293, "percentage": 41.73, "elapsed_time": "14:20:26", "remaining_time": "20:01:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4530, "total_steps": 10853, "loss": 0.1298, "learning_rate": 3.37109690698166e-06, "epoch": 0.417376883033123, "percentage": 41.74, "elapsed_time": "14:20:37", "remaining_time": "20:01:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4531, "total_steps": 10853, "loss": 0.1335, "learning_rate": 3.3703828234139357e-06, "epoch": 0.417469019210393, "percentage": 41.75, "elapsed_time": "14:20:46", "remaining_time": "20:01:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4532, "total_steps": 10853, "loss": 0.1542, "learning_rate": 3.369668659031072e-06, "epoch": 0.417561155387663, "percentage": 41.76, "elapsed_time": "14:20:56", "remaining_time": "20:00:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4533, "total_steps": 10853, "loss": 0.1557, "learning_rate": 3.368954413899381e-06, "epoch": 0.41765329156493297, "percentage": 41.77, "elapsed_time": "14:21:07", "remaining_time": "20:00:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4534, "total_steps": 10853, "loss": 0.1361, "learning_rate": 3.368240088085177e-06, "epoch": 0.41774542774220297, "percentage": 41.78, "elapsed_time": "14:21:19", "remaining_time": "20:00:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4535, "total_steps": 10853, "loss": 0.1636, "learning_rate": 3.367525681654789e-06, "epoch": 0.41783756391947297, "percentage": 41.79, "elapsed_time": "14:21:31", "remaining_time": "20:00:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4536, "total_steps": 10853, "loss": 0.1275, "learning_rate": 3.366811194674548e-06, "epoch": 0.41792970009674296, "percentage": 41.79, "elapsed_time": "14:21:42", "remaining_time": "20:00:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4537, "total_steps": 10853, "loss": 0.1401, "learning_rate": 3.3660966272107943e-06, "epoch": 0.418021836274013, "percentage": 41.8, "elapsed_time": "14:21:54", "remaining_time": "19:59:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4538, "total_steps": 10853, "loss": 0.1425, "learning_rate": 3.365381979329875e-06, "epoch": 0.418113972451283, "percentage": 41.81, "elapsed_time": "14:22:04", "remaining_time": "19:59:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4539, "total_steps": 10853, "loss": 0.1518, "learning_rate": 3.3646672510981458e-06, "epoch": 0.418206108628553, "percentage": 41.82, "elapsed_time": "14:22:14", "remaining_time": "19:59:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4540, "total_steps": 10853, "loss": 0.1453, "learning_rate": 3.363952442581969e-06, "epoch": 0.418298244805823, "percentage": 41.83, "elapsed_time": "14:22:25", "remaining_time": "19:59:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4541, "total_steps": 10853, "loss": 0.1379, "learning_rate": 3.3632375538477165e-06, "epoch": 0.418390380983093, "percentage": 41.84, "elapsed_time": "14:22:36", "remaining_time": "19:59:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4542, "total_steps": 10853, "loss": 0.1578, "learning_rate": 3.3625225849617625e-06, "epoch": 0.418482517160363, "percentage": 41.85, "elapsed_time": "14:22:48", "remaining_time": "19:58:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4543, "total_steps": 10853, "loss": 0.1376, "learning_rate": 3.3618075359904946e-06, "epoch": 0.418574653337633, "percentage": 41.86, "elapsed_time": "14:23:01", "remaining_time": "19:58:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4544, "total_steps": 10853, "loss": 0.1585, "learning_rate": 3.361092407000304e-06, "epoch": 0.41866678951490305, "percentage": 41.87, "elapsed_time": "14:23:11", "remaining_time": "19:58:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4545, "total_steps": 10853, "loss": 0.1444, "learning_rate": 3.3603771980575907e-06, "epoch": 0.41875892569217305, "percentage": 41.88, "elapsed_time": "14:23:25", "remaining_time": "19:58:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4546, "total_steps": 10853, "loss": 0.159, "learning_rate": 3.359661909228762e-06, "epoch": 0.41885106186944304, "percentage": 41.89, "elapsed_time": "14:23:34", "remaining_time": "19:58:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4547, "total_steps": 10853, "loss": 0.1441, "learning_rate": 3.3589465405802324e-06, "epoch": 0.41894319804671304, "percentage": 41.9, "elapsed_time": "14:23:45", "remaining_time": "19:57:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4548, "total_steps": 10853, "loss": 0.1474, "learning_rate": 3.358231092178424e-06, "epoch": 0.41903533422398304, "percentage": 41.91, "elapsed_time": "14:23:57", "remaining_time": "19:57:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4549, "total_steps": 10853, "loss": 0.1414, "learning_rate": 3.3575155640897666e-06, "epoch": 0.41912747040125303, "percentage": 41.91, "elapsed_time": "14:24:07", "remaining_time": "19:57:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4550, "total_steps": 10853, "loss": 0.1402, "learning_rate": 3.356799956380697e-06, "epoch": 0.41921960657852303, "percentage": 41.92, "elapsed_time": "14:24:18", "remaining_time": "19:57:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4551, "total_steps": 10853, "loss": 0.1449, "learning_rate": 3.3560842691176583e-06, "epoch": 0.4193117427557931, "percentage": 41.93, "elapsed_time": "14:24:28", "remaining_time": "19:57:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4552, "total_steps": 10853, "loss": 0.1467, "learning_rate": 3.355368502367104e-06, "epoch": 0.4194038789330631, "percentage": 41.94, "elapsed_time": "14:24:39", "remaining_time": "19:56:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4553, "total_steps": 10853, "loss": 0.1522, "learning_rate": 3.354652656195492e-06, "epoch": 0.4194960151103331, "percentage": 41.95, "elapsed_time": "14:24:49", "remaining_time": "19:56:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4554, "total_steps": 10853, "loss": 0.1479, "learning_rate": 3.3539367306692884e-06, "epoch": 0.4195881512876031, "percentage": 41.96, "elapsed_time": "14:24:59", "remaining_time": "19:56:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4555, "total_steps": 10853, "loss": 0.1422, "learning_rate": 3.3532207258549676e-06, "epoch": 0.41968028746487307, "percentage": 41.97, "elapsed_time": "14:25:11", "remaining_time": "19:56:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4556, "total_steps": 10853, "loss": 0.1351, "learning_rate": 3.352504641819011e-06, "epoch": 0.41977242364214307, "percentage": 41.98, "elapsed_time": "14:25:22", "remaining_time": "19:56:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4557, "total_steps": 10853, "loss": 0.1455, "learning_rate": 3.3517884786279065e-06, "epoch": 0.4198645598194131, "percentage": 41.99, "elapsed_time": "14:25:33", "remaining_time": "19:55:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4558, "total_steps": 10853, "loss": 0.1318, "learning_rate": 3.3510722363481505e-06, "epoch": 0.4199566959966831, "percentage": 42.0, "elapsed_time": "14:25:44", "remaining_time": "19:55:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4559, "total_steps": 10853, "loss": 0.1579, "learning_rate": 3.350355915046245e-06, "epoch": 0.4200488321739531, "percentage": 42.01, "elapsed_time": "14:25:56", "remaining_time": "19:55:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4560, "total_steps": 10853, "loss": 0.1434, "learning_rate": 3.3496395147887017e-06, "epoch": 0.4201409683512231, "percentage": 42.02, "elapsed_time": "14:26:07", "remaining_time": "19:55:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4561, "total_steps": 10853, "loss": 0.1534, "learning_rate": 3.348923035642038e-06, "epoch": 0.4202331045284931, "percentage": 42.03, "elapsed_time": "14:26:18", "remaining_time": "19:55:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4562, "total_steps": 10853, "loss": 0.1621, "learning_rate": 3.3482064776727784e-06, "epoch": 0.4203252407057631, "percentage": 42.03, "elapsed_time": "14:26:29", "remaining_time": "19:54:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4563, "total_steps": 10853, "loss": 0.1429, "learning_rate": 3.3474898409474573e-06, "epoch": 0.4204173768830331, "percentage": 42.04, "elapsed_time": "14:26:39", "remaining_time": "19:54:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4564, "total_steps": 10853, "loss": 0.1698, "learning_rate": 3.3467731255326123e-06, "epoch": 0.42050951306030315, "percentage": 42.05, "elapsed_time": "14:26:50", "remaining_time": "19:54:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4565, "total_steps": 10853, "loss": 0.1444, "learning_rate": 3.346056331494792e-06, "epoch": 0.42060164923757315, "percentage": 42.06, "elapsed_time": "14:27:02", "remaining_time": "19:54:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4566, "total_steps": 10853, "loss": 0.1327, "learning_rate": 3.34533945890055e-06, "epoch": 0.42069378541484315, "percentage": 42.07, "elapsed_time": "14:27:14", "remaining_time": "19:54:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4567, "total_steps": 10853, "loss": 0.1254, "learning_rate": 3.344622507816448e-06, "epoch": 0.42078592159211314, "percentage": 42.08, "elapsed_time": "14:27:24", "remaining_time": "19:53:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4568, "total_steps": 10853, "loss": 0.1392, "learning_rate": 3.343905478309056e-06, "epoch": 0.42087805776938314, "percentage": 42.09, "elapsed_time": "14:27:35", "remaining_time": "19:53:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4569, "total_steps": 10853, "loss": 0.165, "learning_rate": 3.3431883704449485e-06, "epoch": 0.42097019394665314, "percentage": 42.1, "elapsed_time": "14:27:47", "remaining_time": "19:53:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4570, "total_steps": 10853, "loss": 0.1468, "learning_rate": 3.342471184290711e-06, "epoch": 0.42106233012392313, "percentage": 42.11, "elapsed_time": "14:27:57", "remaining_time": "19:53:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4571, "total_steps": 10853, "loss": 0.1755, "learning_rate": 3.3417539199129327e-06, "epoch": 0.4211544663011932, "percentage": 42.12, "elapsed_time": "14:28:09", "remaining_time": "19:53:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4572, "total_steps": 10853, "loss": 0.141, "learning_rate": 3.341036577378213e-06, "epoch": 0.4212466024784632, "percentage": 42.13, "elapsed_time": "14:28:19", "remaining_time": "19:52:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4573, "total_steps": 10853, "loss": 0.1612, "learning_rate": 3.3403191567531563e-06, "epoch": 0.4213387386557332, "percentage": 42.14, "elapsed_time": "14:28:30", "remaining_time": "19:52:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4574, "total_steps": 10853, "loss": 0.1416, "learning_rate": 3.3396016581043757e-06, "epoch": 0.4214308748330032, "percentage": 42.15, "elapsed_time": "14:28:41", "remaining_time": "19:52:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4575, "total_steps": 10853, "loss": 0.1674, "learning_rate": 3.3388840814984896e-06, "epoch": 0.4215230110102732, "percentage": 42.15, "elapsed_time": "14:28:52", "remaining_time": "19:52:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4576, "total_steps": 10853, "loss": 0.1526, "learning_rate": 3.3381664270021273e-06, "epoch": 0.42161514718754317, "percentage": 42.16, "elapsed_time": "14:29:03", "remaining_time": "19:52:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4577, "total_steps": 10853, "loss": 0.1466, "learning_rate": 3.337448694681922e-06, "epoch": 0.42170728336481317, "percentage": 42.17, "elapsed_time": "14:29:14", "remaining_time": "19:51:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4578, "total_steps": 10853, "loss": 0.1504, "learning_rate": 3.3367308846045155e-06, "epoch": 0.4217994195420832, "percentage": 42.18, "elapsed_time": "14:29:26", "remaining_time": "19:51:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4579, "total_steps": 10853, "loss": 0.1571, "learning_rate": 3.3360129968365556e-06, "epoch": 0.4218915557193532, "percentage": 42.19, "elapsed_time": "14:29:36", "remaining_time": "19:51:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4580, "total_steps": 10853, "loss": 0.1627, "learning_rate": 3.335295031444699e-06, "epoch": 0.4219836918966232, "percentage": 42.2, "elapsed_time": "14:29:48", "remaining_time": "19:51:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4581, "total_steps": 10853, "loss": 0.1592, "learning_rate": 3.3345769884956097e-06, "epoch": 0.4220758280738932, "percentage": 42.21, "elapsed_time": "14:29:59", "remaining_time": "19:51:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4582, "total_steps": 10853, "loss": 0.1362, "learning_rate": 3.3338588680559565e-06, "epoch": 0.4221679642511632, "percentage": 42.22, "elapsed_time": "14:30:10", "remaining_time": "19:50:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4583, "total_steps": 10853, "loss": 0.1412, "learning_rate": 3.3331406701924173e-06, "epoch": 0.4222601004284332, "percentage": 42.23, "elapsed_time": "14:30:20", "remaining_time": "19:50:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4584, "total_steps": 10853, "loss": 0.1658, "learning_rate": 3.3324223949716783e-06, "epoch": 0.4223522366057032, "percentage": 42.24, "elapsed_time": "14:30:32", "remaining_time": "19:50:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4585, "total_steps": 10853, "loss": 0.1389, "learning_rate": 3.3317040424604296e-06, "epoch": 0.42244437278297325, "percentage": 42.25, "elapsed_time": "14:30:44", "remaining_time": "19:50:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4586, "total_steps": 10853, "loss": 0.1301, "learning_rate": 3.330985612725371e-06, "epoch": 0.42253650896024325, "percentage": 42.26, "elapsed_time": "14:30:54", "remaining_time": "19:50:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4587, "total_steps": 10853, "loss": 0.156, "learning_rate": 3.330267105833209e-06, "epoch": 0.42262864513751325, "percentage": 42.26, "elapsed_time": "14:31:06", "remaining_time": "19:49:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4588, "total_steps": 10853, "loss": 0.1427, "learning_rate": 3.3295485218506568e-06, "epoch": 0.42272078131478324, "percentage": 42.27, "elapsed_time": "14:31:16", "remaining_time": "19:49:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4589, "total_steps": 10853, "loss": 0.1543, "learning_rate": 3.328829860844435e-06, "epoch": 0.42281291749205324, "percentage": 42.28, "elapsed_time": "14:31:26", "remaining_time": "19:49:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4590, "total_steps": 10853, "loss": 0.1499, "learning_rate": 3.328111122881272e-06, "epoch": 0.42290505366932324, "percentage": 42.29, "elapsed_time": "14:31:37", "remaining_time": "19:49:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4591, "total_steps": 10853, "loss": 0.1486, "learning_rate": 3.327392308027902e-06, "epoch": 0.4229971898465933, "percentage": 42.3, "elapsed_time": "14:31:47", "remaining_time": "19:49:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4592, "total_steps": 10853, "loss": 0.1423, "learning_rate": 3.3266734163510668e-06, "epoch": 0.4230893260238633, "percentage": 42.31, "elapsed_time": "14:31:59", "remaining_time": "19:48:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4593, "total_steps": 10853, "loss": 0.145, "learning_rate": 3.325954447917516e-06, "epoch": 0.4231814622011333, "percentage": 42.32, "elapsed_time": "14:32:09", "remaining_time": "19:48:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4594, "total_steps": 10853, "loss": 0.149, "learning_rate": 3.3252354027940055e-06, "epoch": 0.4232735983784033, "percentage": 42.33, "elapsed_time": "14:32:20", "remaining_time": "19:48:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4595, "total_steps": 10853, "loss": 0.155, "learning_rate": 3.3245162810472998e-06, "epoch": 0.4233657345556733, "percentage": 42.34, "elapsed_time": "14:32:29", "remaining_time": "19:48:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4596, "total_steps": 10853, "loss": 0.1412, "learning_rate": 3.323797082744168e-06, "epoch": 0.4234578707329433, "percentage": 42.35, "elapsed_time": "14:32:40", "remaining_time": "19:48:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4597, "total_steps": 10853, "loss": 0.1345, "learning_rate": 3.3230778079513883e-06, "epoch": 0.4235500069102133, "percentage": 42.36, "elapsed_time": "14:32:50", "remaining_time": "19:47:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4598, "total_steps": 10853, "loss": 0.1398, "learning_rate": 3.3223584567357458e-06, "epoch": 0.4236421430874833, "percentage": 42.37, "elapsed_time": "14:33:00", "remaining_time": "19:47:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4599, "total_steps": 10853, "loss": 0.1479, "learning_rate": 3.3216390291640327e-06, "epoch": 0.4237342792647533, "percentage": 42.38, "elapsed_time": "14:33:11", "remaining_time": "19:47:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4600, "total_steps": 10853, "loss": 0.1504, "learning_rate": 3.320919525303047e-06, "epoch": 0.4238264154420233, "percentage": 42.38, "elapsed_time": "14:33:22", "remaining_time": "19:47:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4601, "total_steps": 10853, "loss": 0.1497, "learning_rate": 3.3201999452195942e-06, "epoch": 0.4239185516192933, "percentage": 42.39, "elapsed_time": "14:33:33", "remaining_time": "19:47:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4602, "total_steps": 10853, "loss": 0.1511, "learning_rate": 3.3194802889804887e-06, "epoch": 0.4240106877965633, "percentage": 42.4, "elapsed_time": "14:33:43", "remaining_time": "19:46:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4603, "total_steps": 10853, "loss": 0.1413, "learning_rate": 3.318760556652551e-06, "epoch": 0.4241028239738333, "percentage": 42.41, "elapsed_time": "14:33:53", "remaining_time": "19:46:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4604, "total_steps": 10853, "loss": 0.1566, "learning_rate": 3.318040748302606e-06, "epoch": 0.4241949601511033, "percentage": 42.42, "elapsed_time": "14:34:05", "remaining_time": "19:46:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4605, "total_steps": 10853, "loss": 0.1383, "learning_rate": 3.317320863997491e-06, "epoch": 0.42428709632837336, "percentage": 42.43, "elapsed_time": "14:34:15", "remaining_time": "19:46:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4606, "total_steps": 10853, "loss": 0.1509, "learning_rate": 3.316600903804045e-06, "epoch": 0.42437923250564336, "percentage": 42.44, "elapsed_time": "14:34:26", "remaining_time": "19:45:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4607, "total_steps": 10853, "loss": 0.1571, "learning_rate": 3.3158808677891167e-06, "epoch": 0.42447136868291335, "percentage": 42.45, "elapsed_time": "14:34:37", "remaining_time": "19:45:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4608, "total_steps": 10853, "loss": 0.1448, "learning_rate": 3.315160756019563e-06, "epoch": 0.42456350486018335, "percentage": 42.46, "elapsed_time": "14:34:47", "remaining_time": "19:45:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4609, "total_steps": 10853, "loss": 0.149, "learning_rate": 3.314440568562245e-06, "epoch": 0.42465564103745335, "percentage": 42.47, "elapsed_time": "14:34:58", "remaining_time": "19:45:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4610, "total_steps": 10853, "loss": 0.1444, "learning_rate": 3.3137203054840323e-06, "epoch": 0.42474777721472334, "percentage": 42.48, "elapsed_time": "14:35:09", "remaining_time": "19:45:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4611, "total_steps": 10853, "loss": 0.1431, "learning_rate": 3.312999966851802e-06, "epoch": 0.42483991339199334, "percentage": 42.49, "elapsed_time": "14:35:20", "remaining_time": "19:44:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4612, "total_steps": 10853, "loss": 0.1436, "learning_rate": 3.3122795527324374e-06, "epoch": 0.4249320495692634, "percentage": 42.5, "elapsed_time": "14:35:30", "remaining_time": "19:44:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4613, "total_steps": 10853, "loss": 0.1478, "learning_rate": 3.3115590631928284e-06, "epoch": 0.4250241857465334, "percentage": 42.5, "elapsed_time": "14:35:39", "remaining_time": "19:44:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4614, "total_steps": 10853, "loss": 0.1534, "learning_rate": 3.3108384982998736e-06, "epoch": 0.4251163219238034, "percentage": 42.51, "elapsed_time": "14:35:51", "remaining_time": "19:44:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4615, "total_steps": 10853, "loss": 0.144, "learning_rate": 3.310117858120476e-06, "epoch": 0.4252084581010734, "percentage": 42.52, "elapsed_time": "14:36:03", "remaining_time": "19:44:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4616, "total_steps": 10853, "loss": 0.1514, "learning_rate": 3.3093971427215497e-06, "epoch": 0.4253005942783434, "percentage": 42.53, "elapsed_time": "14:36:13", "remaining_time": "19:43:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4617, "total_steps": 10853, "loss": 0.1418, "learning_rate": 3.3086763521700105e-06, "epoch": 0.4253927304556134, "percentage": 42.54, "elapsed_time": "14:36:23", "remaining_time": "19:43:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4618, "total_steps": 10853, "loss": 0.1511, "learning_rate": 3.307955486532785e-06, "epoch": 0.4254848666328834, "percentage": 42.55, "elapsed_time": "14:36:34", "remaining_time": "19:43:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4619, "total_steps": 10853, "loss": 0.1489, "learning_rate": 3.3072345458768063e-06, "epoch": 0.4255770028101534, "percentage": 42.56, "elapsed_time": "14:36:45", "remaining_time": "19:43:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4620, "total_steps": 10853, "loss": 0.1414, "learning_rate": 3.306513530269012e-06, "epoch": 0.4256691389874234, "percentage": 42.57, "elapsed_time": "14:36:56", "remaining_time": "19:43:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4621, "total_steps": 10853, "loss": 0.147, "learning_rate": 3.30579243977635e-06, "epoch": 0.4257612751646934, "percentage": 42.58, "elapsed_time": "14:37:07", "remaining_time": "19:42:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4622, "total_steps": 10853, "loss": 0.1409, "learning_rate": 3.305071274465774e-06, "epoch": 0.4258534113419634, "percentage": 42.59, "elapsed_time": "14:37:18", "remaining_time": "19:42:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4623, "total_steps": 10853, "loss": 0.146, "learning_rate": 3.304350034404243e-06, "epoch": 0.4259455475192334, "percentage": 42.6, "elapsed_time": "14:37:29", "remaining_time": "19:42:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4624, "total_steps": 10853, "loss": 0.1493, "learning_rate": 3.3036287196587245e-06, "epoch": 0.4260376836965034, "percentage": 42.61, "elapsed_time": "14:37:41", "remaining_time": "19:42:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4625, "total_steps": 10853, "loss": 0.1507, "learning_rate": 3.3029073302961933e-06, "epoch": 0.42612981987377346, "percentage": 42.61, "elapsed_time": "14:37:52", "remaining_time": "19:42:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4626, "total_steps": 10853, "loss": 0.1488, "learning_rate": 3.3021858663836302e-06, "epoch": 0.42622195605104346, "percentage": 42.62, "elapsed_time": "14:38:03", "remaining_time": "19:41:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4627, "total_steps": 10853, "loss": 0.1527, "learning_rate": 3.301464327988023e-06, "epoch": 0.42631409222831346, "percentage": 42.63, "elapsed_time": "14:38:14", "remaining_time": "19:41:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4628, "total_steps": 10853, "loss": 0.1607, "learning_rate": 3.300742715176366e-06, "epoch": 0.42640622840558345, "percentage": 42.64, "elapsed_time": "14:38:26", "remaining_time": "19:41:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4629, "total_steps": 10853, "loss": 0.163, "learning_rate": 3.300021028015662e-06, "epoch": 0.42649836458285345, "percentage": 42.65, "elapsed_time": "14:38:38", "remaining_time": "19:41:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4630, "total_steps": 10853, "loss": 0.1473, "learning_rate": 3.29929926657292e-06, "epoch": 0.42659050076012345, "percentage": 42.66, "elapsed_time": "14:38:50", "remaining_time": "19:41:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4631, "total_steps": 10853, "loss": 0.1457, "learning_rate": 3.298577430915155e-06, "epoch": 0.42668263693739344, "percentage": 42.67, "elapsed_time": "14:39:01", "remaining_time": "19:41:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4632, "total_steps": 10853, "loss": 0.1428, "learning_rate": 3.297855521109389e-06, "epoch": 0.4267747731146635, "percentage": 42.68, "elapsed_time": "14:39:12", "remaining_time": "19:40:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4633, "total_steps": 10853, "loss": 0.1494, "learning_rate": 3.297133537222652e-06, "epoch": 0.4268669092919335, "percentage": 42.69, "elapsed_time": "14:39:20", "remaining_time": "19:40:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4634, "total_steps": 10853, "loss": 0.1581, "learning_rate": 3.2964114793219802e-06, "epoch": 0.4269590454692035, "percentage": 42.7, "elapsed_time": "14:39:30", "remaining_time": "19:40:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4635, "total_steps": 10853, "loss": 0.1634, "learning_rate": 3.2956893474744177e-06, "epoch": 0.4270511816464735, "percentage": 42.71, "elapsed_time": "14:39:40", "remaining_time": "19:40:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4636, "total_steps": 10853, "loss": 0.157, "learning_rate": 3.294967141747013e-06, "epoch": 0.4271433178237435, "percentage": 42.72, "elapsed_time": "14:39:51", "remaining_time": "19:39:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4637, "total_steps": 10853, "loss": 0.147, "learning_rate": 3.294244862206824e-06, "epoch": 0.4272354540010135, "percentage": 42.73, "elapsed_time": "14:40:02", "remaining_time": "19:39:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4638, "total_steps": 10853, "loss": 0.15, "learning_rate": 3.293522508920914e-06, "epoch": 0.4273275901782835, "percentage": 42.73, "elapsed_time": "14:40:13", "remaining_time": "19:39:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4639, "total_steps": 10853, "loss": 0.1534, "learning_rate": 3.292800081956354e-06, "epoch": 0.42741972635555353, "percentage": 42.74, "elapsed_time": "14:40:23", "remaining_time": "19:39:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4640, "total_steps": 10853, "loss": 0.1683, "learning_rate": 3.29207758138022e-06, "epoch": 0.42751186253282353, "percentage": 42.75, "elapsed_time": "14:40:34", "remaining_time": "19:39:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4641, "total_steps": 10853, "loss": 0.152, "learning_rate": 3.2913550072595986e-06, "epoch": 0.4276039987100935, "percentage": 42.76, "elapsed_time": "14:40:45", "remaining_time": "19:38:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4642, "total_steps": 10853, "loss": 0.1514, "learning_rate": 3.290632359661578e-06, "epoch": 0.4276961348873635, "percentage": 42.77, "elapsed_time": "14:40:56", "remaining_time": "19:38:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4643, "total_steps": 10853, "loss": 0.155, "learning_rate": 3.289909638653259e-06, "epoch": 0.4277882710646335, "percentage": 42.78, "elapsed_time": "14:41:08", "remaining_time": "19:38:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4644, "total_steps": 10853, "loss": 0.1467, "learning_rate": 3.289186844301745e-06, "epoch": 0.4278804072419035, "percentage": 42.79, "elapsed_time": "14:41:18", "remaining_time": "19:38:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4645, "total_steps": 10853, "loss": 0.1503, "learning_rate": 3.2884639766741473e-06, "epoch": 0.4279725434191735, "percentage": 42.8, "elapsed_time": "14:41:28", "remaining_time": "19:38:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4646, "total_steps": 10853, "loss": 0.1484, "learning_rate": 3.2877410358375845e-06, "epoch": 0.42806467959644356, "percentage": 42.81, "elapsed_time": "14:41:39", "remaining_time": "19:37:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4647, "total_steps": 10853, "loss": 0.1379, "learning_rate": 3.287018021859182e-06, "epoch": 0.42815681577371356, "percentage": 42.82, "elapsed_time": "14:41:49", "remaining_time": "19:37:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4648, "total_steps": 10853, "loss": 0.1485, "learning_rate": 3.2862949348060707e-06, "epoch": 0.42824895195098356, "percentage": 42.83, "elapsed_time": "14:41:59", "remaining_time": "19:37:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4649, "total_steps": 10853, "loss": 0.145, "learning_rate": 3.285571774745391e-06, "epoch": 0.42834108812825356, "percentage": 42.84, "elapsed_time": "14:42:10", "remaining_time": "19:37:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4650, "total_steps": 10853, "loss": 0.143, "learning_rate": 3.2848485417442867e-06, "epoch": 0.42843322430552355, "percentage": 42.85, "elapsed_time": "14:42:20", "remaining_time": "19:37:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4651, "total_steps": 10853, "loss": 0.1428, "learning_rate": 3.2841252358699115e-06, "epoch": 0.42852536048279355, "percentage": 42.85, "elapsed_time": "14:42:31", "remaining_time": "19:36:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4652, "total_steps": 10853, "loss": 0.1447, "learning_rate": 3.2834018571894233e-06, "epoch": 0.4286174966600636, "percentage": 42.86, "elapsed_time": "14:42:41", "remaining_time": "19:36:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4653, "total_steps": 10853, "loss": 0.1542, "learning_rate": 3.282678405769988e-06, "epoch": 0.4287096328373336, "percentage": 42.87, "elapsed_time": "14:42:52", "remaining_time": "19:36:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4654, "total_steps": 10853, "loss": 0.1526, "learning_rate": 3.2819548816787794e-06, "epoch": 0.4288017690146036, "percentage": 42.88, "elapsed_time": "14:43:03", "remaining_time": "19:36:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4655, "total_steps": 10853, "loss": 0.1399, "learning_rate": 3.2812312849829754e-06, "epoch": 0.4288939051918736, "percentage": 42.89, "elapsed_time": "14:43:12", "remaining_time": "19:35:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4656, "total_steps": 10853, "loss": 0.1401, "learning_rate": 3.280507615749763e-06, "epoch": 0.4289860413691436, "percentage": 42.9, "elapsed_time": "14:43:24", "remaining_time": "19:35:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4657, "total_steps": 10853, "loss": 0.1516, "learning_rate": 3.279783874046334e-06, "epoch": 0.4290781775464136, "percentage": 42.91, "elapsed_time": "14:43:35", "remaining_time": "19:35:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4658, "total_steps": 10853, "loss": 0.1416, "learning_rate": 3.2790600599398882e-06, "epoch": 0.4291703137236836, "percentage": 42.92, "elapsed_time": "14:43:45", "remaining_time": "19:35:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4659, "total_steps": 10853, "loss": 0.1585, "learning_rate": 3.2783361734976325e-06, "epoch": 0.42926244990095364, "percentage": 42.93, "elapsed_time": "14:43:57", "remaining_time": "19:35:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4660, "total_steps": 10853, "loss": 0.1388, "learning_rate": 3.2776122147867782e-06, "epoch": 0.42935458607822363, "percentage": 42.94, "elapsed_time": "14:44:06", "remaining_time": "19:34:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4661, "total_steps": 10853, "loss": 0.1348, "learning_rate": 3.276888183874547e-06, "epoch": 0.42944672225549363, "percentage": 42.95, "elapsed_time": "14:44:16", "remaining_time": "19:34:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4662, "total_steps": 10853, "loss": 0.1405, "learning_rate": 3.2761640808281647e-06, "epoch": 0.4295388584327636, "percentage": 42.96, "elapsed_time": "14:44:26", "remaining_time": "19:34:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4663, "total_steps": 10853, "loss": 0.1478, "learning_rate": 3.275439905714863e-06, "epoch": 0.4296309946100336, "percentage": 42.97, "elapsed_time": "14:44:37", "remaining_time": "19:34:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4664, "total_steps": 10853, "loss": 0.1545, "learning_rate": 3.274715658601883e-06, "epoch": 0.4297231307873036, "percentage": 42.97, "elapsed_time": "14:44:49", "remaining_time": "19:34:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4665, "total_steps": 10853, "loss": 0.144, "learning_rate": 3.273991339556471e-06, "epoch": 0.4298152669645736, "percentage": 42.98, "elapsed_time": "14:45:00", "remaining_time": "19:33:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4666, "total_steps": 10853, "loss": 0.1617, "learning_rate": 3.2732669486458796e-06, "epoch": 0.42990740314184367, "percentage": 42.99, "elapsed_time": "14:45:11", "remaining_time": "19:33:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4667, "total_steps": 10853, "loss": 0.1321, "learning_rate": 3.272542485937369e-06, "epoch": 0.42999953931911367, "percentage": 43.0, "elapsed_time": "14:45:22", "remaining_time": "19:33:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4668, "total_steps": 10853, "loss": 0.1404, "learning_rate": 3.271817951498205e-06, "epoch": 0.43009167549638366, "percentage": 43.01, "elapsed_time": "14:45:32", "remaining_time": "19:33:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4669, "total_steps": 10853, "loss": 0.146, "learning_rate": 3.271093345395661e-06, "epoch": 0.43018381167365366, "percentage": 43.02, "elapsed_time": "14:45:42", "remaining_time": "19:33:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4670, "total_steps": 10853, "loss": 0.145, "learning_rate": 3.270368667697018e-06, "epoch": 0.43027594785092366, "percentage": 43.03, "elapsed_time": "14:45:53", "remaining_time": "19:32:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4671, "total_steps": 10853, "loss": 0.124, "learning_rate": 3.2696439184695606e-06, "epoch": 0.43036808402819365, "percentage": 43.04, "elapsed_time": "14:46:03", "remaining_time": "19:32:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4672, "total_steps": 10853, "loss": 0.1293, "learning_rate": 3.2689190977805822e-06, "epoch": 0.43046022020546365, "percentage": 43.05, "elapsed_time": "14:46:14", "remaining_time": "19:32:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4673, "total_steps": 10853, "loss": 0.141, "learning_rate": 3.2681942056973838e-06, "epoch": 0.4305523563827337, "percentage": 43.06, "elapsed_time": "14:46:25", "remaining_time": "19:32:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4674, "total_steps": 10853, "loss": 0.1574, "learning_rate": 3.26746924228727e-06, "epoch": 0.4306444925600037, "percentage": 43.07, "elapsed_time": "14:46:35", "remaining_time": "19:32:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4675, "total_steps": 10853, "loss": 0.1416, "learning_rate": 3.2667442076175543e-06, "epoch": 0.4307366287372737, "percentage": 43.08, "elapsed_time": "14:46:46", "remaining_time": "19:31:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4676, "total_steps": 10853, "loss": 0.1414, "learning_rate": 3.2660191017555567e-06, "epoch": 0.4308287649145437, "percentage": 43.08, "elapsed_time": "14:46:56", "remaining_time": "19:31:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4677, "total_steps": 10853, "loss": 0.1366, "learning_rate": 3.2652939247686027e-06, "epoch": 0.4309209010918137, "percentage": 43.09, "elapsed_time": "14:47:07", "remaining_time": "19:31:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4678, "total_steps": 10853, "loss": 0.1478, "learning_rate": 3.2645686767240263e-06, "epoch": 0.4310130372690837, "percentage": 43.1, "elapsed_time": "14:47:19", "remaining_time": "19:31:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4679, "total_steps": 10853, "loss": 0.1602, "learning_rate": 3.2638433576891647e-06, "epoch": 0.4311051734463537, "percentage": 43.11, "elapsed_time": "14:47:31", "remaining_time": "19:31:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4680, "total_steps": 10853, "loss": 0.1558, "learning_rate": 3.263117967731366e-06, "epoch": 0.43119730962362374, "percentage": 43.12, "elapsed_time": "14:47:41", "remaining_time": "19:30:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4681, "total_steps": 10853, "loss": 0.1335, "learning_rate": 3.2623925069179817e-06, "epoch": 0.43128944580089373, "percentage": 43.13, "elapsed_time": "14:47:52", "remaining_time": "19:30:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4682, "total_steps": 10853, "loss": 0.1554, "learning_rate": 3.2616669753163717e-06, "epoch": 0.43138158197816373, "percentage": 43.14, "elapsed_time": "14:48:03", "remaining_time": "19:30:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4683, "total_steps": 10853, "loss": 0.1444, "learning_rate": 3.2609413729939005e-06, "epoch": 0.4314737181554337, "percentage": 43.15, "elapsed_time": "14:48:14", "remaining_time": "19:30:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4684, "total_steps": 10853, "loss": 0.1378, "learning_rate": 3.260215700017941e-06, "epoch": 0.4315658543327037, "percentage": 43.16, "elapsed_time": "14:48:25", "remaining_time": "19:30:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4685, "total_steps": 10853, "loss": 0.1585, "learning_rate": 3.2594899564558713e-06, "epoch": 0.4316579905099737, "percentage": 43.17, "elapsed_time": "14:48:36", "remaining_time": "19:29:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4686, "total_steps": 10853, "loss": 0.1431, "learning_rate": 3.2587641423750782e-06, "epoch": 0.4317501266872438, "percentage": 43.18, "elapsed_time": "14:48:48", "remaining_time": "19:29:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4687, "total_steps": 10853, "loss": 0.1384, "learning_rate": 3.2580382578429525e-06, "epoch": 0.43184226286451377, "percentage": 43.19, "elapsed_time": "14:48:58", "remaining_time": "19:29:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4688, "total_steps": 10853, "loss": 0.1468, "learning_rate": 3.2573123029268926e-06, "epoch": 0.43193439904178377, "percentage": 43.2, "elapsed_time": "14:49:09", "remaining_time": "19:29:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4689, "total_steps": 10853, "loss": 0.1407, "learning_rate": 3.256586277694305e-06, "epoch": 0.43202653521905376, "percentage": 43.2, "elapsed_time": "14:49:19", "remaining_time": "19:29:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4690, "total_steps": 10853, "loss": 0.159, "learning_rate": 3.255860182212599e-06, "epoch": 0.43211867139632376, "percentage": 43.21, "elapsed_time": "14:49:30", "remaining_time": "19:28:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4691, "total_steps": 10853, "loss": 0.148, "learning_rate": 3.2551340165491947e-06, "epoch": 0.43221080757359376, "percentage": 43.22, "elapsed_time": "14:49:41", "remaining_time": "19:28:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4692, "total_steps": 10853, "loss": 0.1446, "learning_rate": 3.254407780771515e-06, "epoch": 0.43230294375086376, "percentage": 43.23, "elapsed_time": "14:49:51", "remaining_time": "19:28:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4693, "total_steps": 10853, "loss": 0.1287, "learning_rate": 3.2536814749469915e-06, "epoch": 0.4323950799281338, "percentage": 43.24, "elapsed_time": "14:50:02", "remaining_time": "19:28:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4694, "total_steps": 10853, "loss": 0.1402, "learning_rate": 3.252955099143062e-06, "epoch": 0.4324872161054038, "percentage": 43.25, "elapsed_time": "14:50:13", "remaining_time": "19:28:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4695, "total_steps": 10853, "loss": 0.1403, "learning_rate": 3.2522286534271706e-06, "epoch": 0.4325793522826738, "percentage": 43.26, "elapsed_time": "14:50:23", "remaining_time": "19:27:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4696, "total_steps": 10853, "loss": 0.1456, "learning_rate": 3.2515021378667677e-06, "epoch": 0.4326714884599438, "percentage": 43.27, "elapsed_time": "14:50:34", "remaining_time": "19:27:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4697, "total_steps": 10853, "loss": 0.1304, "learning_rate": 3.250775552529312e-06, "epoch": 0.4327636246372138, "percentage": 43.28, "elapsed_time": "14:50:43", "remaining_time": "19:27:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4698, "total_steps": 10853, "loss": 0.1527, "learning_rate": 3.250048897482263e-06, "epoch": 0.4328557608144838, "percentage": 43.29, "elapsed_time": "14:50:53", "remaining_time": "19:27:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4699, "total_steps": 10853, "loss": 0.1568, "learning_rate": 3.2493221727930947e-06, "epoch": 0.4329478969917538, "percentage": 43.3, "elapsed_time": "14:51:04", "remaining_time": "19:26:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4700, "total_steps": 10853, "loss": 0.1467, "learning_rate": 3.2485953785292813e-06, "epoch": 0.43304003316902384, "percentage": 43.31, "elapsed_time": "14:51:15", "remaining_time": "19:26:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4701, "total_steps": 10853, "loss": 0.1507, "learning_rate": 3.247868514758307e-06, "epoch": 0.43313216934629384, "percentage": 43.32, "elapsed_time": "14:51:25", "remaining_time": "19:26:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4702, "total_steps": 10853, "loss": 0.1526, "learning_rate": 3.2471415815476603e-06, "epoch": 0.43322430552356384, "percentage": 43.32, "elapsed_time": "14:51:37", "remaining_time": "19:26:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4703, "total_steps": 10853, "loss": 0.1372, "learning_rate": 3.246414578964837e-06, "epoch": 0.43331644170083383, "percentage": 43.33, "elapsed_time": "14:51:47", "remaining_time": "19:26:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4704, "total_steps": 10853, "loss": 0.1518, "learning_rate": 3.24568750707734e-06, "epoch": 0.43340857787810383, "percentage": 43.34, "elapsed_time": "14:51:57", "remaining_time": "19:25:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4705, "total_steps": 10853, "loss": 0.1414, "learning_rate": 3.2449603659526787e-06, "epoch": 0.4335007140553738, "percentage": 43.35, "elapsed_time": "14:52:09", "remaining_time": "19:25:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4706, "total_steps": 10853, "loss": 0.1561, "learning_rate": 3.244233155658365e-06, "epoch": 0.4335928502326438, "percentage": 43.36, "elapsed_time": "14:52:20", "remaining_time": "19:25:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4707, "total_steps": 10853, "loss": 0.1459, "learning_rate": 3.2435058762619243e-06, "epoch": 0.4336849864099139, "percentage": 43.37, "elapsed_time": "14:52:31", "remaining_time": "19:25:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4708, "total_steps": 10853, "loss": 0.1374, "learning_rate": 3.2427785278308832e-06, "epoch": 0.43377712258718387, "percentage": 43.38, "elapsed_time": "14:52:41", "remaining_time": "19:25:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4709, "total_steps": 10853, "loss": 0.1493, "learning_rate": 3.242051110432775e-06, "epoch": 0.43386925876445387, "percentage": 43.39, "elapsed_time": "14:52:52", "remaining_time": "19:24:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4710, "total_steps": 10853, "loss": 0.1448, "learning_rate": 3.241323624135142e-06, "epoch": 0.43396139494172387, "percentage": 43.4, "elapsed_time": "14:53:03", "remaining_time": "19:24:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4711, "total_steps": 10853, "loss": 0.137, "learning_rate": 3.2405960690055307e-06, "epoch": 0.43405353111899386, "percentage": 43.41, "elapsed_time": "14:53:14", "remaining_time": "19:24:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4712, "total_steps": 10853, "loss": 0.1367, "learning_rate": 3.2398684451114936e-06, "epoch": 0.43414566729626386, "percentage": 43.42, "elapsed_time": "14:53:26", "remaining_time": "19:24:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4713, "total_steps": 10853, "loss": 0.1479, "learning_rate": 3.2391407525205933e-06, "epoch": 0.43423780347353386, "percentage": 43.43, "elapsed_time": "14:53:37", "remaining_time": "19:24:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4714, "total_steps": 10853, "loss": 0.1499, "learning_rate": 3.2384129913003935e-06, "epoch": 0.4343299396508039, "percentage": 43.43, "elapsed_time": "14:53:48", "remaining_time": "19:23:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4715, "total_steps": 10853, "loss": 0.1513, "learning_rate": 3.237685161518468e-06, "epoch": 0.4344220758280739, "percentage": 43.44, "elapsed_time": "14:53:59", "remaining_time": "19:23:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4716, "total_steps": 10853, "loss": 0.1439, "learning_rate": 3.236957263242396e-06, "epoch": 0.4345142120053439, "percentage": 43.45, "elapsed_time": "14:54:11", "remaining_time": "19:23:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4717, "total_steps": 10853, "loss": 0.1528, "learning_rate": 3.2362292965397633e-06, "epoch": 0.4346063481826139, "percentage": 43.46, "elapsed_time": "14:54:22", "remaining_time": "19:23:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4718, "total_steps": 10853, "loss": 0.146, "learning_rate": 3.235501261478161e-06, "epoch": 0.4346984843598839, "percentage": 43.47, "elapsed_time": "14:54:34", "remaining_time": "19:23:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4719, "total_steps": 10853, "loss": 0.1393, "learning_rate": 3.2347731581251866e-06, "epoch": 0.4347906205371539, "percentage": 43.48, "elapsed_time": "14:54:43", "remaining_time": "19:23:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4720, "total_steps": 10853, "loss": 0.1412, "learning_rate": 3.2340449865484464e-06, "epoch": 0.43488275671442395, "percentage": 43.49, "elapsed_time": "14:54:53", "remaining_time": "19:22:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4721, "total_steps": 10853, "loss": 0.127, "learning_rate": 3.23331674681555e-06, "epoch": 0.43497489289169394, "percentage": 43.5, "elapsed_time": "14:55:04", "remaining_time": "19:22:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4722, "total_steps": 10853, "loss": 0.1388, "learning_rate": 3.2325884389941147e-06, "epoch": 0.43506702906896394, "percentage": 43.51, "elapsed_time": "14:55:14", "remaining_time": "19:22:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4723, "total_steps": 10853, "loss": 0.1438, "learning_rate": 3.2318600631517637e-06, "epoch": 0.43515916524623394, "percentage": 43.52, "elapsed_time": "14:55:25", "remaining_time": "19:22:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4724, "total_steps": 10853, "loss": 0.155, "learning_rate": 3.2311316193561277e-06, "epoch": 0.43525130142350393, "percentage": 43.53, "elapsed_time": "14:55:36", "remaining_time": "19:21:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4725, "total_steps": 10853, "loss": 0.1511, "learning_rate": 3.230403107674841e-06, "epoch": 0.43534343760077393, "percentage": 43.54, "elapsed_time": "14:55:47", "remaining_time": "19:21:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4726, "total_steps": 10853, "loss": 0.146, "learning_rate": 3.2296745281755485e-06, "epoch": 0.4354355737780439, "percentage": 43.55, "elapsed_time": "14:55:58", "remaining_time": "19:21:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4727, "total_steps": 10853, "loss": 0.1552, "learning_rate": 3.2289458809258965e-06, "epoch": 0.435527709955314, "percentage": 43.55, "elapsed_time": "14:56:09", "remaining_time": "19:21:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4728, "total_steps": 10853, "loss": 0.1388, "learning_rate": 3.2282171659935415e-06, "epoch": 0.435619846132584, "percentage": 43.56, "elapsed_time": "14:56:19", "remaining_time": "19:21:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4729, "total_steps": 10853, "loss": 0.1344, "learning_rate": 3.2274883834461444e-06, "epoch": 0.435711982309854, "percentage": 43.57, "elapsed_time": "14:56:29", "remaining_time": "19:20:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4730, "total_steps": 10853, "loss": 0.1592, "learning_rate": 3.2267595333513724e-06, "epoch": 0.43580411848712397, "percentage": 43.58, "elapsed_time": "14:56:42", "remaining_time": "19:20:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4731, "total_steps": 10853, "loss": 0.148, "learning_rate": 3.2260306157768994e-06, "epoch": 0.43589625466439397, "percentage": 43.59, "elapsed_time": "14:56:52", "remaining_time": "19:20:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4732, "total_steps": 10853, "loss": 0.1385, "learning_rate": 3.2253016307904063e-06, "epoch": 0.43598839084166396, "percentage": 43.6, "elapsed_time": "14:57:04", "remaining_time": "19:20:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4733, "total_steps": 10853, "loss": 0.1278, "learning_rate": 3.224572578459577e-06, "epoch": 0.43608052701893396, "percentage": 43.61, "elapsed_time": "14:57:15", "remaining_time": "19:20:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4734, "total_steps": 10853, "loss": 0.1501, "learning_rate": 3.2238434588521078e-06, "epoch": 0.436172663196204, "percentage": 43.62, "elapsed_time": "14:57:25", "remaining_time": "19:19:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4735, "total_steps": 10853, "loss": 0.1528, "learning_rate": 3.2231142720356946e-06, "epoch": 0.436264799373474, "percentage": 43.63, "elapsed_time": "14:57:37", "remaining_time": "19:19:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4736, "total_steps": 10853, "loss": 0.1368, "learning_rate": 3.222385018078043e-06, "epoch": 0.436356935550744, "percentage": 43.64, "elapsed_time": "14:57:46", "remaining_time": "19:19:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4737, "total_steps": 10853, "loss": 0.1562, "learning_rate": 3.2216556970468656e-06, "epoch": 0.436449071728014, "percentage": 43.65, "elapsed_time": "14:57:58", "remaining_time": "19:19:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4738, "total_steps": 10853, "loss": 0.1526, "learning_rate": 3.2209263090098785e-06, "epoch": 0.436541207905284, "percentage": 43.66, "elapsed_time": "14:58:09", "remaining_time": "19:19:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4739, "total_steps": 10853, "loss": 0.138, "learning_rate": 3.220196854034806e-06, "epoch": 0.436633344082554, "percentage": 43.67, "elapsed_time": "14:58:20", "remaining_time": "19:18:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4740, "total_steps": 10853, "loss": 0.1288, "learning_rate": 3.2194673321893787e-06, "epoch": 0.436725480259824, "percentage": 43.67, "elapsed_time": "14:58:31", "remaining_time": "19:18:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4741, "total_steps": 10853, "loss": 0.1487, "learning_rate": 3.2187377435413316e-06, "epoch": 0.43681761643709405, "percentage": 43.68, "elapsed_time": "14:58:42", "remaining_time": "19:18:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4742, "total_steps": 10853, "loss": 0.1572, "learning_rate": 3.2180080881584075e-06, "epoch": 0.43690975261436404, "percentage": 43.69, "elapsed_time": "14:58:54", "remaining_time": "19:18:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4743, "total_steps": 10853, "loss": 0.1514, "learning_rate": 3.2172783661083556e-06, "epoch": 0.43700188879163404, "percentage": 43.7, "elapsed_time": "14:59:06", "remaining_time": "19:18:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4744, "total_steps": 10853, "loss": 0.1507, "learning_rate": 3.21654857745893e-06, "epoch": 0.43709402496890404, "percentage": 43.71, "elapsed_time": "14:59:17", "remaining_time": "19:18:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4745, "total_steps": 10853, "loss": 0.1548, "learning_rate": 3.2158187222778926e-06, "epoch": 0.43718616114617403, "percentage": 43.72, "elapsed_time": "14:59:28", "remaining_time": "19:17:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4746, "total_steps": 10853, "loss": 0.1368, "learning_rate": 3.215088800633009e-06, "epoch": 0.43727829732344403, "percentage": 43.73, "elapsed_time": "14:59:39", "remaining_time": "19:17:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4747, "total_steps": 10853, "loss": 0.135, "learning_rate": 3.214358812592053e-06, "epoch": 0.43737043350071403, "percentage": 43.74, "elapsed_time": "14:59:49", "remaining_time": "19:17:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4748, "total_steps": 10853, "loss": 0.1328, "learning_rate": 3.2136287582228048e-06, "epoch": 0.4374625696779841, "percentage": 43.75, "elapsed_time": "15:00:00", "remaining_time": "19:17:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4749, "total_steps": 10853, "loss": 0.1437, "learning_rate": 3.2128986375930495e-06, "epoch": 0.4375547058552541, "percentage": 43.76, "elapsed_time": "15:00:11", "remaining_time": "19:17:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4750, "total_steps": 10853, "loss": 0.1378, "learning_rate": 3.212168450770579e-06, "epoch": 0.4376468420325241, "percentage": 43.77, "elapsed_time": "15:00:21", "remaining_time": "19:16:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4751, "total_steps": 10853, "loss": 0.1443, "learning_rate": 3.2114381978231918e-06, "epoch": 0.43773897820979407, "percentage": 43.78, "elapsed_time": "15:00:31", "remaining_time": "19:16:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4752, "total_steps": 10853, "loss": 0.1488, "learning_rate": 3.21070787881869e-06, "epoch": 0.43783111438706407, "percentage": 43.79, "elapsed_time": "15:00:41", "remaining_time": "19:16:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4753, "total_steps": 10853, "loss": 0.1349, "learning_rate": 3.2099774938248866e-06, "epoch": 0.43792325056433407, "percentage": 43.79, "elapsed_time": "15:00:51", "remaining_time": "19:16:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4754, "total_steps": 10853, "loss": 0.1519, "learning_rate": 3.2092470429095955e-06, "epoch": 0.4380153867416041, "percentage": 43.8, "elapsed_time": "15:01:02", "remaining_time": "19:15:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4755, "total_steps": 10853, "loss": 0.14, "learning_rate": 3.208516526140641e-06, "epoch": 0.4381075229188741, "percentage": 43.81, "elapsed_time": "15:01:12", "remaining_time": "19:15:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4756, "total_steps": 10853, "loss": 0.1601, "learning_rate": 3.2077859435858503e-06, "epoch": 0.4381996590961441, "percentage": 43.82, "elapsed_time": "15:01:23", "remaining_time": "19:15:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4757, "total_steps": 10853, "loss": 0.1589, "learning_rate": 3.2070552953130586e-06, "epoch": 0.4382917952734141, "percentage": 43.83, "elapsed_time": "15:01:33", "remaining_time": "19:15:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4758, "total_steps": 10853, "loss": 0.1582, "learning_rate": 3.2063245813901068e-06, "epoch": 0.4383839314506841, "percentage": 43.84, "elapsed_time": "15:01:46", "remaining_time": "19:15:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4759, "total_steps": 10853, "loss": 0.154, "learning_rate": 3.2055938018848417e-06, "epoch": 0.4384760676279541, "percentage": 43.85, "elapsed_time": "15:01:58", "remaining_time": "19:14:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4760, "total_steps": 10853, "loss": 0.1539, "learning_rate": 3.2048629568651153e-06, "epoch": 0.4385682038052241, "percentage": 43.86, "elapsed_time": "15:02:08", "remaining_time": "19:14:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4761, "total_steps": 10853, "loss": 0.1444, "learning_rate": 3.2041320463987886e-06, "epoch": 0.43866033998249415, "percentage": 43.87, "elapsed_time": "15:02:19", "remaining_time": "19:14:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4762, "total_steps": 10853, "loss": 0.1415, "learning_rate": 3.2034010705537245e-06, "epoch": 0.43875247615976415, "percentage": 43.88, "elapsed_time": "15:02:29", "remaining_time": "19:14:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4763, "total_steps": 10853, "loss": 0.1473, "learning_rate": 3.202670029397796e-06, "epoch": 0.43884461233703415, "percentage": 43.89, "elapsed_time": "15:02:40", "remaining_time": "19:14:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4764, "total_steps": 10853, "loss": 0.1527, "learning_rate": 3.2019389229988794e-06, "epoch": 0.43893674851430414, "percentage": 43.9, "elapsed_time": "15:02:50", "remaining_time": "19:13:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4765, "total_steps": 10853, "loss": 0.1365, "learning_rate": 3.2012077514248592e-06, "epoch": 0.43902888469157414, "percentage": 43.9, "elapsed_time": "15:03:00", "remaining_time": "19:13:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4766, "total_steps": 10853, "loss": 0.1555, "learning_rate": 3.2004765147436228e-06, "epoch": 0.43912102086884414, "percentage": 43.91, "elapsed_time": "15:03:11", "remaining_time": "19:13:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4767, "total_steps": 10853, "loss": 0.1395, "learning_rate": 3.1997452130230664e-06, "epoch": 0.43921315704611413, "percentage": 43.92, "elapsed_time": "15:03:23", "remaining_time": "19:13:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4768, "total_steps": 10853, "loss": 0.1405, "learning_rate": 3.1990138463310923e-06, "epoch": 0.4393052932233842, "percentage": 43.93, "elapsed_time": "15:03:33", "remaining_time": "19:13:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4769, "total_steps": 10853, "loss": 0.1447, "learning_rate": 3.1982824147356078e-06, "epoch": 0.4393974294006542, "percentage": 43.94, "elapsed_time": "15:03:43", "remaining_time": "19:12:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4770, "total_steps": 10853, "loss": 0.141, "learning_rate": 3.197550918304525e-06, "epoch": 0.4394895655779242, "percentage": 43.95, "elapsed_time": "15:03:55", "remaining_time": "19:12:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4771, "total_steps": 10853, "loss": 0.1416, "learning_rate": 3.196819357105764e-06, "epoch": 0.4395817017551942, "percentage": 43.96, "elapsed_time": "15:04:04", "remaining_time": "19:12:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4772, "total_steps": 10853, "loss": 0.1539, "learning_rate": 3.196087731207252e-06, "epoch": 0.4396738379324642, "percentage": 43.97, "elapsed_time": "15:04:16", "remaining_time": "19:12:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4773, "total_steps": 10853, "loss": 0.15, "learning_rate": 3.1953560406769184e-06, "epoch": 0.43976597410973417, "percentage": 43.98, "elapsed_time": "15:04:27", "remaining_time": "19:12:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4774, "total_steps": 10853, "loss": 0.1563, "learning_rate": 3.194624285582702e-06, "epoch": 0.43985811028700417, "percentage": 43.99, "elapsed_time": "15:04:40", "remaining_time": "19:11:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4775, "total_steps": 10853, "loss": 0.1416, "learning_rate": 3.1938924659925457e-06, "epoch": 0.4399502464642742, "percentage": 44.0, "elapsed_time": "15:04:51", "remaining_time": "19:11:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4776, "total_steps": 10853, "loss": 0.1275, "learning_rate": 3.193160581974399e-06, "epoch": 0.4400423826415442, "percentage": 44.01, "elapsed_time": "15:05:02", "remaining_time": "19:11:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4777, "total_steps": 10853, "loss": 0.1475, "learning_rate": 3.1924286335962177e-06, "epoch": 0.4401345188188142, "percentage": 44.02, "elapsed_time": "15:05:12", "remaining_time": "19:11:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4778, "total_steps": 10853, "loss": 0.1506, "learning_rate": 3.1916966209259636e-06, "epoch": 0.4402266549960842, "percentage": 44.02, "elapsed_time": "15:05:23", "remaining_time": "19:11:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4779, "total_steps": 10853, "loss": 0.1322, "learning_rate": 3.1909645440316034e-06, "epoch": 0.4403187911733542, "percentage": 44.03, "elapsed_time": "15:05:34", "remaining_time": "19:10:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4780, "total_steps": 10853, "loss": 0.1433, "learning_rate": 3.1902324029811115e-06, "epoch": 0.4404109273506242, "percentage": 44.04, "elapsed_time": "15:05:46", "remaining_time": "19:10:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4781, "total_steps": 10853, "loss": 0.148, "learning_rate": 3.1895001978424665e-06, "epoch": 0.4405030635278942, "percentage": 44.05, "elapsed_time": "15:05:56", "remaining_time": "19:10:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4782, "total_steps": 10853, "loss": 0.1572, "learning_rate": 3.188767928683654e-06, "epoch": 0.44059519970516425, "percentage": 44.06, "elapsed_time": "15:06:09", "remaining_time": "19:10:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4783, "total_steps": 10853, "loss": 0.1468, "learning_rate": 3.188035595572665e-06, "epoch": 0.44068733588243425, "percentage": 44.07, "elapsed_time": "15:06:19", "remaining_time": "19:10:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4784, "total_steps": 10853, "loss": 0.1417, "learning_rate": 3.1873031985774972e-06, "epoch": 0.44077947205970425, "percentage": 44.08, "elapsed_time": "15:06:30", "remaining_time": "19:09:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4785, "total_steps": 10853, "loss": 0.1524, "learning_rate": 3.186570737766153e-06, "epoch": 0.44087160823697424, "percentage": 44.09, "elapsed_time": "15:06:40", "remaining_time": "19:09:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4786, "total_steps": 10853, "loss": 0.1428, "learning_rate": 3.1858382132066422e-06, "epoch": 0.44096374441424424, "percentage": 44.1, "elapsed_time": "15:06:50", "remaining_time": "19:09:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4787, "total_steps": 10853, "loss": 0.1396, "learning_rate": 3.1851056249669786e-06, "epoch": 0.44105588059151424, "percentage": 44.11, "elapsed_time": "15:07:02", "remaining_time": "19:09:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4788, "total_steps": 10853, "loss": 0.1506, "learning_rate": 3.1843729731151855e-06, "epoch": 0.4411480167687843, "percentage": 44.12, "elapsed_time": "15:07:14", "remaining_time": "19:09:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4789, "total_steps": 10853, "loss": 0.1399, "learning_rate": 3.183640257719287e-06, "epoch": 0.4412401529460543, "percentage": 44.13, "elapsed_time": "15:07:24", "remaining_time": "19:09:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4790, "total_steps": 10853, "loss": 0.1628, "learning_rate": 3.182907478847318e-06, "epoch": 0.4413322891233243, "percentage": 44.14, "elapsed_time": "15:07:37", "remaining_time": "19:08:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4791, "total_steps": 10853, "loss": 0.1507, "learning_rate": 3.1821746365673157e-06, "epoch": 0.4414244253005943, "percentage": 44.14, "elapsed_time": "15:07:47", "remaining_time": "19:08:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4792, "total_steps": 10853, "loss": 0.1401, "learning_rate": 3.1814417309473243e-06, "epoch": 0.4415165614778643, "percentage": 44.15, "elapsed_time": "15:07:57", "remaining_time": "19:08:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4793, "total_steps": 10853, "loss": 0.1535, "learning_rate": 3.1807087620553957e-06, "epoch": 0.4416086976551343, "percentage": 44.16, "elapsed_time": "15:08:06", "remaining_time": "19:08:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4794, "total_steps": 10853, "loss": 0.1532, "learning_rate": 3.179975729959585e-06, "epoch": 0.44170083383240427, "percentage": 44.17, "elapsed_time": "15:08:17", "remaining_time": "19:07:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4795, "total_steps": 10853, "loss": 0.1557, "learning_rate": 3.1792426347279544e-06, "epoch": 0.4417929700096743, "percentage": 44.18, "elapsed_time": "15:08:28", "remaining_time": "19:07:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4796, "total_steps": 10853, "loss": 0.1389, "learning_rate": 3.178509476428573e-06, "epoch": 0.4418851061869443, "percentage": 44.19, "elapsed_time": "15:08:38", "remaining_time": "19:07:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4797, "total_steps": 10853, "loss": 0.1564, "learning_rate": 3.177776255129512e-06, "epoch": 0.4419772423642143, "percentage": 44.2, "elapsed_time": "15:08:48", "remaining_time": "19:07:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4798, "total_steps": 10853, "loss": 0.1665, "learning_rate": 3.1770429708988536e-06, "epoch": 0.4420693785414843, "percentage": 44.21, "elapsed_time": "15:08:59", "remaining_time": "19:07:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4799, "total_steps": 10853, "loss": 0.1448, "learning_rate": 3.1763096238046833e-06, "epoch": 0.4421615147187543, "percentage": 44.22, "elapsed_time": "15:09:10", "remaining_time": "19:06:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4800, "total_steps": 10853, "loss": 0.1496, "learning_rate": 3.1755762139150905e-06, "epoch": 0.4422536508960243, "percentage": 44.23, "elapsed_time": "15:09:21", "remaining_time": "19:06:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4801, "total_steps": 10853, "loss": 0.1418, "learning_rate": 3.1748427412981742e-06, "epoch": 0.4423457870732943, "percentage": 44.24, "elapsed_time": "15:09:31", "remaining_time": "19:06:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4802, "total_steps": 10853, "loss": 0.1345, "learning_rate": 3.1741092060220364e-06, "epoch": 0.44243792325056436, "percentage": 44.25, "elapsed_time": "15:09:42", "remaining_time": "19:06:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4803, "total_steps": 10853, "loss": 0.1394, "learning_rate": 3.1733756081547864e-06, "epoch": 0.44253005942783435, "percentage": 44.26, "elapsed_time": "15:09:52", "remaining_time": "19:06:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4804, "total_steps": 10853, "loss": 0.1449, "learning_rate": 3.172641947764539e-06, "epoch": 0.44262219560510435, "percentage": 44.26, "elapsed_time": "15:10:03", "remaining_time": "19:05:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4805, "total_steps": 10853, "loss": 0.1456, "learning_rate": 3.1719082249194134e-06, "epoch": 0.44271433178237435, "percentage": 44.27, "elapsed_time": "15:10:15", "remaining_time": "19:05:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4806, "total_steps": 10853, "loss": 0.1377, "learning_rate": 3.171174439687538e-06, "epoch": 0.44280646795964435, "percentage": 44.28, "elapsed_time": "15:10:24", "remaining_time": "19:05:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4807, "total_steps": 10853, "loss": 0.1313, "learning_rate": 3.1704405921370428e-06, "epoch": 0.44289860413691434, "percentage": 44.29, "elapsed_time": "15:10:35", "remaining_time": "19:05:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4808, "total_steps": 10853, "loss": 0.1395, "learning_rate": 3.169706682336066e-06, "epoch": 0.44299074031418434, "percentage": 44.3, "elapsed_time": "15:10:46", "remaining_time": "19:05:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4809, "total_steps": 10853, "loss": 0.1408, "learning_rate": 3.1689727103527536e-06, "epoch": 0.4430828764914544, "percentage": 44.31, "elapsed_time": "15:10:57", "remaining_time": "19:04:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4810, "total_steps": 10853, "loss": 0.1433, "learning_rate": 3.168238676255251e-06, "epoch": 0.4431750126687244, "percentage": 44.32, "elapsed_time": "15:11:09", "remaining_time": "19:04:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4811, "total_steps": 10853, "loss": 0.1492, "learning_rate": 3.1675045801117167e-06, "epoch": 0.4432671488459944, "percentage": 44.33, "elapsed_time": "15:11:21", "remaining_time": "19:04:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4812, "total_steps": 10853, "loss": 0.1575, "learning_rate": 3.1667704219903095e-06, "epoch": 0.4433592850232644, "percentage": 44.34, "elapsed_time": "15:11:32", "remaining_time": "19:04:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4813, "total_steps": 10853, "loss": 0.1377, "learning_rate": 3.1660362019591972e-06, "epoch": 0.4434514212005344, "percentage": 44.35, "elapsed_time": "15:11:42", "remaining_time": "19:04:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4814, "total_steps": 10853, "loss": 0.1437, "learning_rate": 3.1653019200865513e-06, "epoch": 0.4435435573778044, "percentage": 44.36, "elapsed_time": "15:11:53", "remaining_time": "19:03:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4815, "total_steps": 10853, "loss": 0.1507, "learning_rate": 3.164567576440552e-06, "epoch": 0.4436356935550744, "percentage": 44.37, "elapsed_time": "15:12:04", "remaining_time": "19:03:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4816, "total_steps": 10853, "loss": 0.1562, "learning_rate": 3.1638331710893804e-06, "epoch": 0.4437278297323444, "percentage": 44.37, "elapsed_time": "15:12:13", "remaining_time": "19:03:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4817, "total_steps": 10853, "loss": 0.1554, "learning_rate": 3.163098704101228e-06, "epoch": 0.4438199659096144, "percentage": 44.38, "elapsed_time": "15:12:24", "remaining_time": "19:03:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4818, "total_steps": 10853, "loss": 0.1472, "learning_rate": 3.162364175544289e-06, "epoch": 0.4439121020868844, "percentage": 44.39, "elapsed_time": "15:12:34", "remaining_time": "19:03:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4819, "total_steps": 10853, "loss": 0.1409, "learning_rate": 3.161629585486766e-06, "epoch": 0.4440042382641544, "percentage": 44.4, "elapsed_time": "15:12:44", "remaining_time": "19:02:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4820, "total_steps": 10853, "loss": 0.149, "learning_rate": 3.160894933996864e-06, "epoch": 0.4440963744414244, "percentage": 44.41, "elapsed_time": "15:12:55", "remaining_time": "19:02:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4821, "total_steps": 10853, "loss": 0.1364, "learning_rate": 3.160160221142797e-06, "epoch": 0.4441885106186944, "percentage": 44.42, "elapsed_time": "15:13:04", "remaining_time": "19:02:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4822, "total_steps": 10853, "loss": 0.143, "learning_rate": 3.159425446992781e-06, "epoch": 0.44428064679596446, "percentage": 44.43, "elapsed_time": "15:13:15", "remaining_time": "19:02:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4823, "total_steps": 10853, "loss": 0.1482, "learning_rate": 3.1586906116150428e-06, "epoch": 0.44437278297323446, "percentage": 44.44, "elapsed_time": "15:13:25", "remaining_time": "19:02:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4824, "total_steps": 10853, "loss": 0.1601, "learning_rate": 3.1579557150778094e-06, "epoch": 0.44446491915050446, "percentage": 44.45, "elapsed_time": "15:13:38", "remaining_time": "19:01:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4825, "total_steps": 10853, "loss": 0.1428, "learning_rate": 3.1572207574493174e-06, "epoch": 0.44455705532777445, "percentage": 44.46, "elapsed_time": "15:13:48", "remaining_time": "19:01:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4826, "total_steps": 10853, "loss": 0.1456, "learning_rate": 3.1564857387978075e-06, "epoch": 0.44464919150504445, "percentage": 44.47, "elapsed_time": "15:13:58", "remaining_time": "19:01:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4827, "total_steps": 10853, "loss": 0.1594, "learning_rate": 3.155750659191526e-06, "epoch": 0.44474132768231445, "percentage": 44.48, "elapsed_time": "15:14:10", "remaining_time": "19:01:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4828, "total_steps": 10853, "loss": 0.1443, "learning_rate": 3.155015518698725e-06, "epoch": 0.44483346385958444, "percentage": 44.49, "elapsed_time": "15:14:22", "remaining_time": "19:01:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4829, "total_steps": 10853, "loss": 0.152, "learning_rate": 3.154280317387663e-06, "epoch": 0.4449256000368545, "percentage": 44.49, "elapsed_time": "15:14:33", "remaining_time": "19:00:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4830, "total_steps": 10853, "loss": 0.1467, "learning_rate": 3.1535450553266024e-06, "epoch": 0.4450177362141245, "percentage": 44.5, "elapsed_time": "15:14:43", "remaining_time": "19:00:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4831, "total_steps": 10853, "loss": 0.1496, "learning_rate": 3.1528097325838143e-06, "epoch": 0.4451098723913945, "percentage": 44.51, "elapsed_time": "15:14:53", "remaining_time": "19:00:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4832, "total_steps": 10853, "loss": 0.1504, "learning_rate": 3.1520743492275714e-06, "epoch": 0.4452020085686645, "percentage": 44.52, "elapsed_time": "15:15:04", "remaining_time": "19:00:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4833, "total_steps": 10853, "loss": 0.1536, "learning_rate": 3.151338905326155e-06, "epoch": 0.4452941447459345, "percentage": 44.53, "elapsed_time": "15:15:13", "remaining_time": "19:00:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4834, "total_steps": 10853, "loss": 0.1513, "learning_rate": 3.1506034009478515e-06, "epoch": 0.4453862809232045, "percentage": 44.54, "elapsed_time": "15:15:23", "remaining_time": "18:59:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4835, "total_steps": 10853, "loss": 0.1379, "learning_rate": 3.1498678361609514e-06, "epoch": 0.4454784171004745, "percentage": 44.55, "elapsed_time": "15:15:34", "remaining_time": "18:59:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4836, "total_steps": 10853, "loss": 0.1352, "learning_rate": 3.149132211033754e-06, "epoch": 0.44557055327774453, "percentage": 44.56, "elapsed_time": "15:15:44", "remaining_time": "18:59:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4837, "total_steps": 10853, "loss": 0.1409, "learning_rate": 3.1483965256345596e-06, "epoch": 0.4456626894550145, "percentage": 44.57, "elapsed_time": "15:15:54", "remaining_time": "18:59:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4838, "total_steps": 10853, "loss": 0.1584, "learning_rate": 3.147660780031679e-06, "epoch": 0.4457548256322845, "percentage": 44.58, "elapsed_time": "15:16:05", "remaining_time": "18:58:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4839, "total_steps": 10853, "loss": 0.1532, "learning_rate": 3.146924974293425e-06, "epoch": 0.4458469618095545, "percentage": 44.59, "elapsed_time": "15:16:14", "remaining_time": "18:58:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4840, "total_steps": 10853, "loss": 0.1604, "learning_rate": 3.1461891084881175e-06, "epoch": 0.4459390979868245, "percentage": 44.6, "elapsed_time": "15:16:25", "remaining_time": "18:58:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4841, "total_steps": 10853, "loss": 0.1515, "learning_rate": 3.1454531826840816e-06, "epoch": 0.4460312341640945, "percentage": 44.61, "elapsed_time": "15:16:35", "remaining_time": "18:58:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4842, "total_steps": 10853, "loss": 0.1515, "learning_rate": 3.1447171969496487e-06, "epoch": 0.4461233703413645, "percentage": 44.61, "elapsed_time": "15:16:46", "remaining_time": "18:58:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4843, "total_steps": 10853, "loss": 0.1302, "learning_rate": 3.1439811513531537e-06, "epoch": 0.44621550651863456, "percentage": 44.62, "elapsed_time": "15:16:58", "remaining_time": "18:57:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4844, "total_steps": 10853, "loss": 0.134, "learning_rate": 3.143245045962941e-06, "epoch": 0.44630764269590456, "percentage": 44.63, "elapsed_time": "15:17:10", "remaining_time": "18:57:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4845, "total_steps": 10853, "loss": 0.1572, "learning_rate": 3.142508880847355e-06, "epoch": 0.44639977887317456, "percentage": 44.64, "elapsed_time": "15:17:21", "remaining_time": "18:57:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4846, "total_steps": 10853, "loss": 0.1414, "learning_rate": 3.1417726560747507e-06, "epoch": 0.44649191505044455, "percentage": 44.65, "elapsed_time": "15:17:31", "remaining_time": "18:57:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4847, "total_steps": 10853, "loss": 0.1362, "learning_rate": 3.1410363717134868e-06, "epoch": 0.44658405122771455, "percentage": 44.66, "elapsed_time": "15:17:41", "remaining_time": "18:57:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4848, "total_steps": 10853, "loss": 0.156, "learning_rate": 3.140300027831927e-06, "epoch": 0.44667618740498455, "percentage": 44.67, "elapsed_time": "15:17:52", "remaining_time": "18:56:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4849, "total_steps": 10853, "loss": 0.1441, "learning_rate": 3.1395636244984397e-06, "epoch": 0.44676832358225455, "percentage": 44.68, "elapsed_time": "15:18:03", "remaining_time": "18:56:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4850, "total_steps": 10853, "loss": 0.1348, "learning_rate": 3.1388271617814015e-06, "epoch": 0.4468604597595246, "percentage": 44.69, "elapsed_time": "15:18:14", "remaining_time": "18:56:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4851, "total_steps": 10853, "loss": 0.1314, "learning_rate": 3.1380906397491923e-06, "epoch": 0.4469525959367946, "percentage": 44.7, "elapsed_time": "15:18:22", "remaining_time": "18:56:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4852, "total_steps": 10853, "loss": 0.1537, "learning_rate": 3.1373540584701997e-06, "epoch": 0.4470447321140646, "percentage": 44.71, "elapsed_time": "15:18:34", "remaining_time": "18:56:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4853, "total_steps": 10853, "loss": 0.1364, "learning_rate": 3.1366174180128127e-06, "epoch": 0.4471368682913346, "percentage": 44.72, "elapsed_time": "15:18:46", "remaining_time": "18:55:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4854, "total_steps": 10853, "loss": 0.1493, "learning_rate": 3.1358807184454305e-06, "epoch": 0.4472290044686046, "percentage": 44.72, "elapsed_time": "15:18:55", "remaining_time": "18:55:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4855, "total_steps": 10853, "loss": 0.1481, "learning_rate": 3.1351439598364554e-06, "epoch": 0.4473211406458746, "percentage": 44.73, "elapsed_time": "15:19:06", "remaining_time": "18:55:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4856, "total_steps": 10853, "loss": 0.1257, "learning_rate": 3.134407142254295e-06, "epoch": 0.44741327682314463, "percentage": 44.74, "elapsed_time": "15:19:17", "remaining_time": "18:55:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4857, "total_steps": 10853, "loss": 0.1446, "learning_rate": 3.1336702657673625e-06, "epoch": 0.44750541300041463, "percentage": 44.75, "elapsed_time": "15:19:27", "remaining_time": "18:55:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4858, "total_steps": 10853, "loss": 0.1375, "learning_rate": 3.132933330444079e-06, "epoch": 0.44759754917768463, "percentage": 44.76, "elapsed_time": "15:19:38", "remaining_time": "18:54:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4859, "total_steps": 10853, "loss": 0.1317, "learning_rate": 3.132196336352867e-06, "epoch": 0.4476896853549546, "percentage": 44.77, "elapsed_time": "15:19:48", "remaining_time": "18:54:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4860, "total_steps": 10853, "loss": 0.1494, "learning_rate": 3.131459283562157e-06, "epoch": 0.4477818215322246, "percentage": 44.78, "elapsed_time": "15:19:59", "remaining_time": "18:54:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4861, "total_steps": 10853, "loss": 0.1465, "learning_rate": 3.1307221721403846e-06, "epoch": 0.4478739577094946, "percentage": 44.79, "elapsed_time": "15:20:09", "remaining_time": "18:54:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4862, "total_steps": 10853, "loss": 0.1375, "learning_rate": 3.129985002155991e-06, "epoch": 0.4479660938867646, "percentage": 44.8, "elapsed_time": "15:20:20", "remaining_time": "18:54:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4863, "total_steps": 10853, "loss": 0.1459, "learning_rate": 3.129247773677422e-06, "epoch": 0.44805823006403467, "percentage": 44.81, "elapsed_time": "15:20:30", "remaining_time": "18:53:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4864, "total_steps": 10853, "loss": 0.1435, "learning_rate": 3.128510486773129e-06, "epoch": 0.44815036624130467, "percentage": 44.82, "elapsed_time": "15:20:41", "remaining_time": "18:53:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4865, "total_steps": 10853, "loss": 0.1521, "learning_rate": 3.1277731415115696e-06, "epoch": 0.44824250241857466, "percentage": 44.83, "elapsed_time": "15:20:53", "remaining_time": "18:53:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4866, "total_steps": 10853, "loss": 0.1475, "learning_rate": 3.127035737961207e-06, "epoch": 0.44833463859584466, "percentage": 44.84, "elapsed_time": "15:21:05", "remaining_time": "18:53:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4867, "total_steps": 10853, "loss": 0.1483, "learning_rate": 3.1262982761905084e-06, "epoch": 0.44842677477311466, "percentage": 44.84, "elapsed_time": "15:21:14", "remaining_time": "18:53:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4868, "total_steps": 10853, "loss": 0.1431, "learning_rate": 3.125560756267948e-06, "epoch": 0.44851891095038465, "percentage": 44.85, "elapsed_time": "15:21:24", "remaining_time": "18:52:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4869, "total_steps": 10853, "loss": 0.1291, "learning_rate": 3.1248231782620035e-06, "epoch": 0.44861104712765465, "percentage": 44.86, "elapsed_time": "15:21:35", "remaining_time": "18:52:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4870, "total_steps": 10853, "loss": 0.1535, "learning_rate": 3.1240855422411593e-06, "epoch": 0.4487031833049247, "percentage": 44.87, "elapsed_time": "15:21:46", "remaining_time": "18:52:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4871, "total_steps": 10853, "loss": 0.1509, "learning_rate": 3.1233478482739065e-06, "epoch": 0.4487953194821947, "percentage": 44.88, "elapsed_time": "15:21:56", "remaining_time": "18:52:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4872, "total_steps": 10853, "loss": 0.1387, "learning_rate": 3.1226100964287378e-06, "epoch": 0.4488874556594647, "percentage": 44.89, "elapsed_time": "15:22:06", "remaining_time": "18:52:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4873, "total_steps": 10853, "loss": 0.1547, "learning_rate": 3.1218722867741553e-06, "epoch": 0.4489795918367347, "percentage": 44.9, "elapsed_time": "15:22:16", "remaining_time": "18:51:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4874, "total_steps": 10853, "loss": 0.1432, "learning_rate": 3.1211344193786636e-06, "epoch": 0.4490717280140047, "percentage": 44.91, "elapsed_time": "15:22:26", "remaining_time": "18:51:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4875, "total_steps": 10853, "loss": 0.1533, "learning_rate": 3.1203964943107747e-06, "epoch": 0.4491638641912747, "percentage": 44.92, "elapsed_time": "15:22:36", "remaining_time": "18:51:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4876, "total_steps": 10853, "loss": 0.1282, "learning_rate": 3.1196585116390045e-06, "epoch": 0.4492560003685447, "percentage": 44.93, "elapsed_time": "15:22:47", "remaining_time": "18:51:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4877, "total_steps": 10853, "loss": 0.1355, "learning_rate": 3.1189204714318743e-06, "epoch": 0.44934813654581474, "percentage": 44.94, "elapsed_time": "15:22:57", "remaining_time": "18:50:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4878, "total_steps": 10853, "loss": 0.1649, "learning_rate": 3.1181823737579115e-06, "epoch": 0.44944027272308473, "percentage": 44.95, "elapsed_time": "15:23:08", "remaining_time": "18:50:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4879, "total_steps": 10853, "loss": 0.1458, "learning_rate": 3.11744421868565e-06, "epoch": 0.44953240890035473, "percentage": 44.96, "elapsed_time": "15:23:19", "remaining_time": "18:50:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4880, "total_steps": 10853, "loss": 0.148, "learning_rate": 3.1167060062836253e-06, "epoch": 0.4496245450776247, "percentage": 44.96, "elapsed_time": "15:23:30", "remaining_time": "18:50:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4881, "total_steps": 10853, "loss": 0.1443, "learning_rate": 3.1159677366203815e-06, "epoch": 0.4497166812548947, "percentage": 44.97, "elapsed_time": "15:23:41", "remaining_time": "18:50:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4882, "total_steps": 10853, "loss": 0.1631, "learning_rate": 3.1152294097644677e-06, "epoch": 0.4498088174321647, "percentage": 44.98, "elapsed_time": "15:23:52", "remaining_time": "18:49:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4883, "total_steps": 10853, "loss": 0.1562, "learning_rate": 3.1144910257844367e-06, "epoch": 0.4499009536094347, "percentage": 44.99, "elapsed_time": "15:24:01", "remaining_time": "18:49:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4884, "total_steps": 10853, "loss": 0.1413, "learning_rate": 3.113752584748848e-06, "epoch": 0.44999308978670477, "percentage": 45.0, "elapsed_time": "15:24:11", "remaining_time": "18:49:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4885, "total_steps": 10853, "loss": 0.1435, "learning_rate": 3.1130140867262653e-06, "epoch": 0.45008522596397477, "percentage": 45.01, "elapsed_time": "15:24:22", "remaining_time": "18:49:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4886, "total_steps": 10853, "loss": 0.1502, "learning_rate": 3.112275531785259e-06, "epoch": 0.45017736214124476, "percentage": 45.02, "elapsed_time": "15:24:33", "remaining_time": "18:49:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4887, "total_steps": 10853, "loss": 0.1384, "learning_rate": 3.111536919994404e-06, "epoch": 0.45026949831851476, "percentage": 45.03, "elapsed_time": "15:24:45", "remaining_time": "18:48:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4888, "total_steps": 10853, "loss": 0.1376, "learning_rate": 3.110798251422279e-06, "epoch": 0.45036163449578476, "percentage": 45.04, "elapsed_time": "15:24:56", "remaining_time": "18:48:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4889, "total_steps": 10853, "loss": 0.1393, "learning_rate": 3.1100595261374718e-06, "epoch": 0.45045377067305475, "percentage": 45.05, "elapsed_time": "15:25:05", "remaining_time": "18:48:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4890, "total_steps": 10853, "loss": 0.1404, "learning_rate": 3.1093207442085716e-06, "epoch": 0.4505459068503248, "percentage": 45.06, "elapsed_time": "15:25:16", "remaining_time": "18:48:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4891, "total_steps": 10853, "loss": 0.1401, "learning_rate": 3.108581905704175e-06, "epoch": 0.4506380430275948, "percentage": 45.07, "elapsed_time": "15:25:26", "remaining_time": "18:48:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4892, "total_steps": 10853, "loss": 0.1522, "learning_rate": 3.107843010692882e-06, "epoch": 0.4507301792048648, "percentage": 45.08, "elapsed_time": "15:25:37", "remaining_time": "18:47:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4893, "total_steps": 10853, "loss": 0.1625, "learning_rate": 3.1071040592433003e-06, "epoch": 0.4508223153821348, "percentage": 45.08, "elapsed_time": "15:25:49", "remaining_time": "18:47:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4894, "total_steps": 10853, "loss": 0.141, "learning_rate": 3.1063650514240425e-06, "epoch": 0.4509144515594048, "percentage": 45.09, "elapsed_time": "15:26:00", "remaining_time": "18:47:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4895, "total_steps": 10853, "loss": 0.1403, "learning_rate": 3.105625987303723e-06, "epoch": 0.4510065877366748, "percentage": 45.1, "elapsed_time": "15:26:11", "remaining_time": "18:47:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4896, "total_steps": 10853, "loss": 0.1351, "learning_rate": 3.104886866950966e-06, "epoch": 0.4510987239139448, "percentage": 45.11, "elapsed_time": "15:26:22", "remaining_time": "18:47:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4897, "total_steps": 10853, "loss": 0.148, "learning_rate": 3.104147690434398e-06, "epoch": 0.45119086009121484, "percentage": 45.12, "elapsed_time": "15:26:33", "remaining_time": "18:46:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4898, "total_steps": 10853, "loss": 0.1458, "learning_rate": 3.103408457822653e-06, "epoch": 0.45128299626848484, "percentage": 45.13, "elapsed_time": "15:26:43", "remaining_time": "18:46:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4899, "total_steps": 10853, "loss": 0.1448, "learning_rate": 3.1026691691843667e-06, "epoch": 0.45137513244575483, "percentage": 45.14, "elapsed_time": "15:26:55", "remaining_time": "18:46:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4900, "total_steps": 10853, "loss": 0.1261, "learning_rate": 3.1019298245881836e-06, "epoch": 0.45146726862302483, "percentage": 45.15, "elapsed_time": "15:27:06", "remaining_time": "18:46:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4901, "total_steps": 10853, "loss": 0.1444, "learning_rate": 3.101190424102752e-06, "epoch": 0.45155940480029483, "percentage": 45.16, "elapsed_time": "15:27:16", "remaining_time": "18:46:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4902, "total_steps": 10853, "loss": 0.1435, "learning_rate": 3.100450967796724e-06, "epoch": 0.4516515409775648, "percentage": 45.17, "elapsed_time": "15:27:25", "remaining_time": "18:45:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4903, "total_steps": 10853, "loss": 0.1498, "learning_rate": 3.099711455738759e-06, "epoch": 0.4517436771548348, "percentage": 45.18, "elapsed_time": "15:27:36", "remaining_time": "18:45:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4904, "total_steps": 10853, "loss": 0.1261, "learning_rate": 3.0989718879975216e-06, "epoch": 0.4518358133321049, "percentage": 45.19, "elapsed_time": "15:27:48", "remaining_time": "18:45:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4905, "total_steps": 10853, "loss": 0.1539, "learning_rate": 3.098232264641679e-06, "epoch": 0.45192794950937487, "percentage": 45.19, "elapsed_time": "15:27:59", "remaining_time": "18:45:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4906, "total_steps": 10853, "loss": 0.1469, "learning_rate": 3.0974925857399067e-06, "epoch": 0.45202008568664487, "percentage": 45.2, "elapsed_time": "15:28:11", "remaining_time": "18:45:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4907, "total_steps": 10853, "loss": 0.1505, "learning_rate": 3.0967528513608834e-06, "epoch": 0.45211222186391486, "percentage": 45.21, "elapsed_time": "15:28:22", "remaining_time": "18:44:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4908, "total_steps": 10853, "loss": 0.1359, "learning_rate": 3.0960130615732934e-06, "epoch": 0.45220435804118486, "percentage": 45.22, "elapsed_time": "15:28:34", "remaining_time": "18:44:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4909, "total_steps": 10853, "loss": 0.1545, "learning_rate": 3.095273216445827e-06, "epoch": 0.45229649421845486, "percentage": 45.23, "elapsed_time": "15:28:44", "remaining_time": "18:44:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4910, "total_steps": 10853, "loss": 0.1419, "learning_rate": 3.0945333160471784e-06, "epoch": 0.45238863039572486, "percentage": 45.24, "elapsed_time": "15:28:56", "remaining_time": "18:44:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4911, "total_steps": 10853, "loss": 0.1411, "learning_rate": 3.0937933604460475e-06, "epoch": 0.4524807665729949, "percentage": 45.25, "elapsed_time": "15:29:06", "remaining_time": "18:44:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4912, "total_steps": 10853, "loss": 0.1452, "learning_rate": 3.0930533497111385e-06, "epoch": 0.4525729027502649, "percentage": 45.26, "elapsed_time": "15:29:16", "remaining_time": "18:43:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4913, "total_steps": 10853, "loss": 0.1308, "learning_rate": 3.0923132839111623e-06, "epoch": 0.4526650389275349, "percentage": 45.27, "elapsed_time": "15:29:27", "remaining_time": "18:43:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4914, "total_steps": 10853, "loss": 0.1394, "learning_rate": 3.0915731631148347e-06, "epoch": 0.4527571751048049, "percentage": 45.28, "elapsed_time": "15:29:38", "remaining_time": "18:43:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4915, "total_steps": 10853, "loss": 0.1442, "learning_rate": 3.0908329873908744e-06, "epoch": 0.4528493112820749, "percentage": 45.29, "elapsed_time": "15:29:49", "remaining_time": "18:43:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4916, "total_steps": 10853, "loss": 0.1393, "learning_rate": 3.0900927568080074e-06, "epoch": 0.4529414474593449, "percentage": 45.3, "elapsed_time": "15:30:01", "remaining_time": "18:43:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4917, "total_steps": 10853, "loss": 0.1449, "learning_rate": 3.0893524714349655e-06, "epoch": 0.4530335836366149, "percentage": 45.31, "elapsed_time": "15:30:13", "remaining_time": "18:43:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4918, "total_steps": 10853, "loss": 0.1475, "learning_rate": 3.0886121313404827e-06, "epoch": 0.45312571981388494, "percentage": 45.31, "elapsed_time": "15:30:25", "remaining_time": "18:42:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4919, "total_steps": 10853, "loss": 0.1521, "learning_rate": 3.0878717365933005e-06, "epoch": 0.45321785599115494, "percentage": 45.32, "elapsed_time": "15:30:37", "remaining_time": "18:42:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4920, "total_steps": 10853, "loss": 0.1435, "learning_rate": 3.087131287262163e-06, "epoch": 0.45330999216842494, "percentage": 45.33, "elapsed_time": "15:30:48", "remaining_time": "18:42:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4921, "total_steps": 10853, "loss": 0.1489, "learning_rate": 3.0863907834158236e-06, "epoch": 0.45340212834569493, "percentage": 45.34, "elapsed_time": "15:30:58", "remaining_time": "18:42:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4922, "total_steps": 10853, "loss": 0.1406, "learning_rate": 3.0856502251230363e-06, "epoch": 0.45349426452296493, "percentage": 45.35, "elapsed_time": "15:31:09", "remaining_time": "18:42:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4923, "total_steps": 10853, "loss": 0.14, "learning_rate": 3.084909612452563e-06, "epoch": 0.4535864007002349, "percentage": 45.36, "elapsed_time": "15:31:20", "remaining_time": "18:41:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4924, "total_steps": 10853, "loss": 0.1543, "learning_rate": 3.0841689454731686e-06, "epoch": 0.453678536877505, "percentage": 45.37, "elapsed_time": "15:31:31", "remaining_time": "18:41:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4925, "total_steps": 10853, "loss": 0.1433, "learning_rate": 3.0834282242536253e-06, "epoch": 0.453770673054775, "percentage": 45.38, "elapsed_time": "15:31:42", "remaining_time": "18:41:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4926, "total_steps": 10853, "loss": 0.1415, "learning_rate": 3.082687448862708e-06, "epoch": 0.453862809232045, "percentage": 45.39, "elapsed_time": "15:31:53", "remaining_time": "18:41:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4927, "total_steps": 10853, "loss": 0.1366, "learning_rate": 3.0819466193691995e-06, "epoch": 0.45395494540931497, "percentage": 45.4, "elapsed_time": "15:32:05", "remaining_time": "18:41:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4928, "total_steps": 10853, "loss": 0.1516, "learning_rate": 3.0812057358418834e-06, "epoch": 0.45404708158658497, "percentage": 45.41, "elapsed_time": "15:32:16", "remaining_time": "18:40:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4929, "total_steps": 10853, "loss": 0.144, "learning_rate": 3.0804647983495527e-06, "epoch": 0.45413921776385496, "percentage": 45.42, "elapsed_time": "15:32:26", "remaining_time": "18:40:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4930, "total_steps": 10853, "loss": 0.1415, "learning_rate": 3.079723806961003e-06, "epoch": 0.45423135394112496, "percentage": 45.43, "elapsed_time": "15:32:36", "remaining_time": "18:40:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4931, "total_steps": 10853, "loss": 0.1356, "learning_rate": 3.078982761745036e-06, "epoch": 0.454323490118395, "percentage": 45.43, "elapsed_time": "15:32:48", "remaining_time": "18:40:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4932, "total_steps": 10853, "loss": 0.1459, "learning_rate": 3.078241662770456e-06, "epoch": 0.454415626295665, "percentage": 45.44, "elapsed_time": "15:32:58", "remaining_time": "18:40:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4933, "total_steps": 10853, "loss": 0.1334, "learning_rate": 3.0775005101060766e-06, "epoch": 0.454507762472935, "percentage": 45.45, "elapsed_time": "15:33:09", "remaining_time": "18:39:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4934, "total_steps": 10853, "loss": 0.1483, "learning_rate": 3.076759303820712e-06, "epoch": 0.454599898650205, "percentage": 45.46, "elapsed_time": "15:33:20", "remaining_time": "18:39:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4935, "total_steps": 10853, "loss": 0.1461, "learning_rate": 3.0760180439831844e-06, "epoch": 0.454692034827475, "percentage": 45.47, "elapsed_time": "15:33:32", "remaining_time": "18:39:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4936, "total_steps": 10853, "loss": 0.1549, "learning_rate": 3.0752767306623193e-06, "epoch": 0.454784171004745, "percentage": 45.48, "elapsed_time": "15:33:43", "remaining_time": "18:39:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4937, "total_steps": 10853, "loss": 0.1468, "learning_rate": 3.0745353639269476e-06, "epoch": 0.454876307182015, "percentage": 45.49, "elapsed_time": "15:33:54", "remaining_time": "18:39:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4938, "total_steps": 10853, "loss": 0.1312, "learning_rate": 3.073793943845906e-06, "epoch": 0.45496844335928505, "percentage": 45.5, "elapsed_time": "15:34:04", "remaining_time": "18:38:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4939, "total_steps": 10853, "loss": 0.1368, "learning_rate": 3.073052470488035e-06, "epoch": 0.45506057953655504, "percentage": 45.51, "elapsed_time": "15:34:16", "remaining_time": "18:38:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4940, "total_steps": 10853, "loss": 0.1219, "learning_rate": 3.0723109439221794e-06, "epoch": 0.45515271571382504, "percentage": 45.52, "elapsed_time": "15:34:27", "remaining_time": "18:38:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4941, "total_steps": 10853, "loss": 0.1488, "learning_rate": 3.071569364217192e-06, "epoch": 0.45524485189109504, "percentage": 45.53, "elapsed_time": "15:34:39", "remaining_time": "18:38:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4942, "total_steps": 10853, "loss": 0.145, "learning_rate": 3.070827731441927e-06, "epoch": 0.45533698806836503, "percentage": 45.54, "elapsed_time": "15:34:50", "remaining_time": "18:38:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4943, "total_steps": 10853, "loss": 0.1527, "learning_rate": 3.0700860456652467e-06, "epoch": 0.45542912424563503, "percentage": 45.55, "elapsed_time": "15:35:02", "remaining_time": "18:37:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4944, "total_steps": 10853, "loss": 0.1645, "learning_rate": 3.0693443069560147e-06, "epoch": 0.455521260422905, "percentage": 45.55, "elapsed_time": "15:35:13", "remaining_time": "18:37:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4945, "total_steps": 10853, "loss": 0.14, "learning_rate": 3.0686025153831033e-06, "epoch": 0.4556133966001751, "percentage": 45.56, "elapsed_time": "15:35:24", "remaining_time": "18:37:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4946, "total_steps": 10853, "loss": 0.1393, "learning_rate": 3.067860671015387e-06, "epoch": 0.4557055327774451, "percentage": 45.57, "elapsed_time": "15:35:35", "remaining_time": "18:37:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4947, "total_steps": 10853, "loss": 0.1453, "learning_rate": 3.0671187739217455e-06, "epoch": 0.4557976689547151, "percentage": 45.58, "elapsed_time": "15:35:46", "remaining_time": "18:37:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4948, "total_steps": 10853, "loss": 0.1404, "learning_rate": 3.0663768241710653e-06, "epoch": 0.45588980513198507, "percentage": 45.59, "elapsed_time": "15:35:57", "remaining_time": "18:36:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4949, "total_steps": 10853, "loss": 0.1453, "learning_rate": 3.065634821832237e-06, "epoch": 0.45598194130925507, "percentage": 45.6, "elapsed_time": "15:36:08", "remaining_time": "18:36:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4950, "total_steps": 10853, "loss": 0.1337, "learning_rate": 3.064892766974153e-06, "epoch": 0.45607407748652506, "percentage": 45.61, "elapsed_time": "15:36:18", "remaining_time": "18:36:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4951, "total_steps": 10853, "loss": 0.1525, "learning_rate": 3.0641506596657155e-06, "epoch": 0.45616621366379506, "percentage": 45.62, "elapsed_time": "15:36:29", "remaining_time": "18:36:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4952, "total_steps": 10853, "loss": 0.1481, "learning_rate": 3.0634084999758283e-06, "epoch": 0.4562583498410651, "percentage": 45.63, "elapsed_time": "15:36:38", "remaining_time": "18:36:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4953, "total_steps": 10853, "loss": 0.1542, "learning_rate": 3.0626662879734015e-06, "epoch": 0.4563504860183351, "percentage": 45.64, "elapsed_time": "15:36:50", "remaining_time": "18:35:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4954, "total_steps": 10853, "loss": 0.1467, "learning_rate": 3.0619240237273496e-06, "epoch": 0.4564426221956051, "percentage": 45.65, "elapsed_time": "15:37:01", "remaining_time": "18:35:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4955, "total_steps": 10853, "loss": 0.1411, "learning_rate": 3.0611817073065906e-06, "epoch": 0.4565347583728751, "percentage": 45.66, "elapsed_time": "15:37:12", "remaining_time": "18:35:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4956, "total_steps": 10853, "loss": 0.133, "learning_rate": 3.0604393387800506e-06, "epoch": 0.4566268945501451, "percentage": 45.66, "elapsed_time": "15:37:23", "remaining_time": "18:35:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4957, "total_steps": 10853, "loss": 0.1517, "learning_rate": 3.059696918216658e-06, "epoch": 0.4567190307274151, "percentage": 45.67, "elapsed_time": "15:37:35", "remaining_time": "18:35:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4958, "total_steps": 10853, "loss": 0.139, "learning_rate": 3.058954445685346e-06, "epoch": 0.45681116690468515, "percentage": 45.68, "elapsed_time": "15:37:45", "remaining_time": "18:34:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4959, "total_steps": 10853, "loss": 0.1503, "learning_rate": 3.058211921255053e-06, "epoch": 0.45690330308195515, "percentage": 45.69, "elapsed_time": "15:37:55", "remaining_time": "18:34:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4960, "total_steps": 10853, "loss": 0.1369, "learning_rate": 3.0574693449947234e-06, "epoch": 0.45699543925922514, "percentage": 45.7, "elapsed_time": "15:38:06", "remaining_time": "18:34:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4961, "total_steps": 10853, "loss": 0.1402, "learning_rate": 3.056726716973305e-06, "epoch": 0.45708757543649514, "percentage": 45.71, "elapsed_time": "15:38:16", "remaining_time": "18:34:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4962, "total_steps": 10853, "loss": 0.158, "learning_rate": 3.0559840372597516e-06, "epoch": 0.45717971161376514, "percentage": 45.72, "elapsed_time": "15:38:27", "remaining_time": "18:34:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4963, "total_steps": 10853, "loss": 0.1497, "learning_rate": 3.0552413059230196e-06, "epoch": 0.45727184779103514, "percentage": 45.73, "elapsed_time": "15:38:38", "remaining_time": "18:33:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4964, "total_steps": 10853, "loss": 0.1606, "learning_rate": 3.054498523032073e-06, "epoch": 0.45736398396830513, "percentage": 45.74, "elapsed_time": "15:38:48", "remaining_time": "18:33:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4965, "total_steps": 10853, "loss": 0.1419, "learning_rate": 3.053755688655879e-06, "epoch": 0.4574561201455752, "percentage": 45.75, "elapsed_time": "15:38:58", "remaining_time": "18:33:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4966, "total_steps": 10853, "loss": 0.1379, "learning_rate": 3.05301280286341e-06, "epoch": 0.4575482563228452, "percentage": 45.76, "elapsed_time": "15:39:09", "remaining_time": "18:33:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4967, "total_steps": 10853, "loss": 0.1364, "learning_rate": 3.0522698657236417e-06, "epoch": 0.4576403925001152, "percentage": 45.77, "elapsed_time": "15:39:19", "remaining_time": "18:33:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4968, "total_steps": 10853, "loss": 0.1574, "learning_rate": 3.0515268773055577e-06, "epoch": 0.4577325286773852, "percentage": 45.78, "elapsed_time": "15:39:30", "remaining_time": "18:32:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4969, "total_steps": 10853, "loss": 0.1599, "learning_rate": 3.0507838376781433e-06, "epoch": 0.4578246648546552, "percentage": 45.78, "elapsed_time": "15:39:40", "remaining_time": "18:32:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4970, "total_steps": 10853, "loss": 0.1615, "learning_rate": 3.050040746910391e-06, "epoch": 0.45791680103192517, "percentage": 45.79, "elapsed_time": "15:39:51", "remaining_time": "18:32:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4971, "total_steps": 10853, "loss": 0.1472, "learning_rate": 3.049297605071296e-06, "epoch": 0.45800893720919517, "percentage": 45.8, "elapsed_time": "15:40:02", "remaining_time": "18:32:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4972, "total_steps": 10853, "loss": 0.1539, "learning_rate": 3.0485544122298586e-06, "epoch": 0.4581010733864652, "percentage": 45.81, "elapsed_time": "15:40:13", "remaining_time": "18:32:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4973, "total_steps": 10853, "loss": 0.1349, "learning_rate": 3.0478111684550855e-06, "epoch": 0.4581932095637352, "percentage": 45.82, "elapsed_time": "15:40:25", "remaining_time": "18:31:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4974, "total_steps": 10853, "loss": 0.1393, "learning_rate": 3.0470678738159865e-06, "epoch": 0.4582853457410052, "percentage": 45.83, "elapsed_time": "15:40:36", "remaining_time": "18:31:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4975, "total_steps": 10853, "loss": 0.1544, "learning_rate": 3.046324528381576e-06, "epoch": 0.4583774819182752, "percentage": 45.84, "elapsed_time": "15:40:47", "remaining_time": "18:31:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4976, "total_steps": 10853, "loss": 0.144, "learning_rate": 3.045581132220875e-06, "epoch": 0.4584696180955452, "percentage": 45.85, "elapsed_time": "15:40:58", "remaining_time": "18:31:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4977, "total_steps": 10853, "loss": 0.158, "learning_rate": 3.0448376854029067e-06, "epoch": 0.4585617542728152, "percentage": 45.86, "elapsed_time": "15:41:09", "remaining_time": "18:31:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4978, "total_steps": 10853, "loss": 0.1349, "learning_rate": 3.0440941879967007e-06, "epoch": 0.4586538904500852, "percentage": 45.87, "elapsed_time": "15:41:20", "remaining_time": "18:30:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4979, "total_steps": 10853, "loss": 0.1498, "learning_rate": 3.043350640071291e-06, "epoch": 0.45874602662735525, "percentage": 45.88, "elapsed_time": "15:41:29", "remaining_time": "18:30:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4980, "total_steps": 10853, "loss": 0.1367, "learning_rate": 3.0426070416957155e-06, "epoch": 0.45883816280462525, "percentage": 45.89, "elapsed_time": "15:41:41", "remaining_time": "18:30:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4981, "total_steps": 10853, "loss": 0.133, "learning_rate": 3.0418633929390184e-06, "epoch": 0.45893029898189525, "percentage": 45.9, "elapsed_time": "15:41:51", "remaining_time": "18:30:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4982, "total_steps": 10853, "loss": 0.1491, "learning_rate": 3.0411196938702465e-06, "epoch": 0.45902243515916524, "percentage": 45.9, "elapsed_time": "15:42:02", "remaining_time": "18:30:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4983, "total_steps": 10853, "loss": 0.1487, "learning_rate": 3.040375944558453e-06, "epoch": 0.45911457133643524, "percentage": 45.91, "elapsed_time": "15:42:13", "remaining_time": "18:29:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4984, "total_steps": 10853, "loss": 0.1454, "learning_rate": 3.0396321450726946e-06, "epoch": 0.45920670751370524, "percentage": 45.92, "elapsed_time": "15:42:23", "remaining_time": "18:29:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4985, "total_steps": 10853, "loss": 0.1364, "learning_rate": 3.0388882954820336e-06, "epoch": 0.4592988436909753, "percentage": 45.93, "elapsed_time": "15:42:34", "remaining_time": "18:29:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4986, "total_steps": 10853, "loss": 0.139, "learning_rate": 3.0381443958555367e-06, "epoch": 0.4593909798682453, "percentage": 45.94, "elapsed_time": "15:42:45", "remaining_time": "18:29:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4987, "total_steps": 10853, "loss": 0.1471, "learning_rate": 3.037400446262274e-06, "epoch": 0.4594831160455153, "percentage": 45.95, "elapsed_time": "15:42:56", "remaining_time": "18:29:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4988, "total_steps": 10853, "loss": 0.1486, "learning_rate": 3.036656446771322e-06, "epoch": 0.4595752522227853, "percentage": 45.96, "elapsed_time": "15:43:05", "remaining_time": "18:28:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4989, "total_steps": 10853, "loss": 0.1412, "learning_rate": 3.035912397451763e-06, "epoch": 0.4596673884000553, "percentage": 45.97, "elapsed_time": "15:43:15", "remaining_time": "18:28:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4990, "total_steps": 10853, "loss": 0.1395, "learning_rate": 3.035168298372678e-06, "epoch": 0.4597595245773253, "percentage": 45.98, "elapsed_time": "15:43:27", "remaining_time": "18:28:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4991, "total_steps": 10853, "loss": 0.1467, "learning_rate": 3.0344241496031602e-06, "epoch": 0.45985166075459527, "percentage": 45.99, "elapsed_time": "15:43:37", "remaining_time": "18:28:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4992, "total_steps": 10853, "loss": 0.15, "learning_rate": 3.0336799512123017e-06, "epoch": 0.4599437969318653, "percentage": 46.0, "elapsed_time": "15:43:49", "remaining_time": "18:28:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4993, "total_steps": 10853, "loss": 0.145, "learning_rate": 3.032935703269203e-06, "epoch": 0.4600359331091353, "percentage": 46.01, "elapsed_time": "15:44:00", "remaining_time": "18:27:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4994, "total_steps": 10853, "loss": 0.1517, "learning_rate": 3.0321914058429668e-06, "epoch": 0.4601280692864053, "percentage": 46.01, "elapsed_time": "15:44:09", "remaining_time": "18:27:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4995, "total_steps": 10853, "loss": 0.1586, "learning_rate": 3.0314470590027012e-06, "epoch": 0.4602202054636753, "percentage": 46.02, "elapsed_time": "15:44:20", "remaining_time": "18:27:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4996, "total_steps": 10853, "loss": 0.1454, "learning_rate": 3.0307026628175183e-06, "epoch": 0.4603123416409453, "percentage": 46.03, "elapsed_time": "15:44:31", "remaining_time": "18:27:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4997, "total_steps": 10853, "loss": 0.1423, "learning_rate": 3.029958217356537e-06, "epoch": 0.4604044778182153, "percentage": 46.04, "elapsed_time": "15:44:41", "remaining_time": "18:27:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4998, "total_steps": 10853, "loss": 0.1422, "learning_rate": 3.029213722688878e-06, "epoch": 0.4604966139954853, "percentage": 46.05, "elapsed_time": "15:44:53", "remaining_time": "18:26:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4999, "total_steps": 10853, "loss": 0.1535, "learning_rate": 3.0284691788836672e-06, "epoch": 0.46058875017275536, "percentage": 46.06, "elapsed_time": "15:45:04", "remaining_time": "18:26:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5000, "total_steps": 10853, "loss": 0.1536, "learning_rate": 3.027724586010037e-06, "epoch": 0.46068088635002535, "percentage": 46.07, "elapsed_time": "15:45:14", "remaining_time": "18:26:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5000, "total_steps": 10853, "eval_loss": 0.14408743381500244, "epoch": 0.46068088635002535, "percentage": 46.07, "elapsed_time": "15:50:14", "remaining_time": "18:32:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5001, "total_steps": 10853, "loss": 0.1453, "learning_rate": 3.0269799441371224e-06, "epoch": 0.46077302252729535, "percentage": 46.08, "elapsed_time": "15:50:24", "remaining_time": "18:32:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5002, "total_steps": 10853, "loss": 0.1445, "learning_rate": 3.026235253334063e-06, "epoch": 0.46086515870456535, "percentage": 46.09, "elapsed_time": "15:50:34", "remaining_time": "18:31:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5003, "total_steps": 10853, "loss": 0.1415, "learning_rate": 3.0254905136700038e-06, "epoch": 0.46095729488183534, "percentage": 46.1, "elapsed_time": "15:50:45", "remaining_time": "18:31:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5004, "total_steps": 10853, "loss": 0.1404, "learning_rate": 3.024745725214093e-06, "epoch": 0.46104943105910534, "percentage": 46.11, "elapsed_time": "15:50:55", "remaining_time": "18:31:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5005, "total_steps": 10853, "loss": 0.1327, "learning_rate": 3.024000888035486e-06, "epoch": 0.46114156723637534, "percentage": 46.12, "elapsed_time": "15:51:06", "remaining_time": "18:31:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5006, "total_steps": 10853, "loss": 0.1389, "learning_rate": 3.0232560022033398e-06, "epoch": 0.4612337034136454, "percentage": 46.13, "elapsed_time": "15:51:18", "remaining_time": "18:31:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5007, "total_steps": 10853, "loss": 0.1444, "learning_rate": 3.022511067786817e-06, "epoch": 0.4613258395909154, "percentage": 46.13, "elapsed_time": "15:51:30", "remaining_time": "18:30:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5008, "total_steps": 10853, "loss": 0.1616, "learning_rate": 3.0217660848550863e-06, "epoch": 0.4614179757681854, "percentage": 46.14, "elapsed_time": "15:51:40", "remaining_time": "18:30:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5009, "total_steps": 10853, "loss": 0.1461, "learning_rate": 3.0210210534773175e-06, "epoch": 0.4615101119454554, "percentage": 46.15, "elapsed_time": "15:51:52", "remaining_time": "18:30:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5010, "total_steps": 10853, "loss": 0.1413, "learning_rate": 3.020275973722688e-06, "epoch": 0.4616022481227254, "percentage": 46.16, "elapsed_time": "15:52:03", "remaining_time": "18:30:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5011, "total_steps": 10853, "loss": 0.1444, "learning_rate": 3.0195308456603795e-06, "epoch": 0.4616943842999954, "percentage": 46.17, "elapsed_time": "15:52:14", "remaining_time": "18:30:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5012, "total_steps": 10853, "loss": 0.1349, "learning_rate": 3.018785669359575e-06, "epoch": 0.46178652047726537, "percentage": 46.18, "elapsed_time": "15:52:24", "remaining_time": "18:29:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5013, "total_steps": 10853, "loss": 0.1357, "learning_rate": 3.018040444889466e-06, "epoch": 0.4618786566545354, "percentage": 46.19, "elapsed_time": "15:52:35", "remaining_time": "18:29:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5014, "total_steps": 10853, "loss": 0.1374, "learning_rate": 3.0172951723192456e-06, "epoch": 0.4619707928318054, "percentage": 46.2, "elapsed_time": "15:52:47", "remaining_time": "18:29:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5015, "total_steps": 10853, "loss": 0.1456, "learning_rate": 3.016549851718112e-06, "epoch": 0.4620629290090754, "percentage": 46.21, "elapsed_time": "15:52:56", "remaining_time": "18:29:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5016, "total_steps": 10853, "loss": 0.1508, "learning_rate": 3.0158044831552703e-06, "epoch": 0.4621550651863454, "percentage": 46.22, "elapsed_time": "15:53:07", "remaining_time": "18:29:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5017, "total_steps": 10853, "loss": 0.1343, "learning_rate": 3.015059066699926e-06, "epoch": 0.4622472013636154, "percentage": 46.23, "elapsed_time": "15:53:18", "remaining_time": "18:28:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5018, "total_steps": 10853, "loss": 0.1362, "learning_rate": 3.0143136024212923e-06, "epoch": 0.4623393375408854, "percentage": 46.24, "elapsed_time": "15:53:28", "remaining_time": "18:28:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5019, "total_steps": 10853, "loss": 0.145, "learning_rate": 3.013568090388585e-06, "epoch": 0.46243147371815546, "percentage": 46.25, "elapsed_time": "15:53:40", "remaining_time": "18:28:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5020, "total_steps": 10853, "loss": 0.1437, "learning_rate": 3.012822530671026e-06, "epoch": 0.46252360989542546, "percentage": 46.25, "elapsed_time": "15:53:51", "remaining_time": "18:28:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5021, "total_steps": 10853, "loss": 0.1569, "learning_rate": 3.012076923337839e-06, "epoch": 0.46261574607269546, "percentage": 46.26, "elapsed_time": "15:54:02", "remaining_time": "18:28:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5022, "total_steps": 10853, "loss": 0.1424, "learning_rate": 3.011331268458255e-06, "epoch": 0.46270788224996545, "percentage": 46.27, "elapsed_time": "15:54:12", "remaining_time": "18:27:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5023, "total_steps": 10853, "loss": 0.1437, "learning_rate": 3.010585566101507e-06, "epoch": 0.46280001842723545, "percentage": 46.28, "elapsed_time": "15:54:22", "remaining_time": "18:27:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5024, "total_steps": 10853, "loss": 0.1385, "learning_rate": 3.0098398163368353e-06, "epoch": 0.46289215460450545, "percentage": 46.29, "elapsed_time": "15:54:33", "remaining_time": "18:27:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5025, "total_steps": 10853, "loss": 0.1351, "learning_rate": 3.0090940192334805e-06, "epoch": 0.46298429078177544, "percentage": 46.3, "elapsed_time": "15:54:44", "remaining_time": "18:27:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5026, "total_steps": 10853, "loss": 0.1499, "learning_rate": 3.0083481748606923e-06, "epoch": 0.4630764269590455, "percentage": 46.31, "elapsed_time": "15:54:56", "remaining_time": "18:27:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5027, "total_steps": 10853, "loss": 0.1435, "learning_rate": 3.007602283287721e-06, "epoch": 0.4631685631363155, "percentage": 46.32, "elapsed_time": "15:55:06", "remaining_time": "18:26:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5028, "total_steps": 10853, "loss": 0.1496, "learning_rate": 3.0068563445838234e-06, "epoch": 0.4632606993135855, "percentage": 46.33, "elapsed_time": "15:55:17", "remaining_time": "18:26:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5029, "total_steps": 10853, "loss": 0.1532, "learning_rate": 3.0061103588182592e-06, "epoch": 0.4633528354908555, "percentage": 46.34, "elapsed_time": "15:55:27", "remaining_time": "18:26:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5030, "total_steps": 10853, "loss": 0.1267, "learning_rate": 3.005364326060294e-06, "epoch": 0.4634449716681255, "percentage": 46.35, "elapsed_time": "15:55:35", "remaining_time": "18:26:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5031, "total_steps": 10853, "loss": 0.1395, "learning_rate": 3.0046182463791962e-06, "epoch": 0.4635371078453955, "percentage": 46.36, "elapsed_time": "15:55:46", "remaining_time": "18:26:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5032, "total_steps": 10853, "loss": 0.1495, "learning_rate": 3.0038721198442406e-06, "epoch": 0.4636292440226655, "percentage": 46.37, "elapsed_time": "15:55:57", "remaining_time": "18:25:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5033, "total_steps": 10853, "loss": 0.1374, "learning_rate": 3.003125946524704e-06, "epoch": 0.46372138019993553, "percentage": 46.37, "elapsed_time": "15:56:08", "remaining_time": "18:25:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5034, "total_steps": 10853, "loss": 0.1443, "learning_rate": 3.002379726489869e-06, "epoch": 0.4638135163772055, "percentage": 46.38, "elapsed_time": "15:56:19", "remaining_time": "18:25:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5035, "total_steps": 10853, "loss": 0.1544, "learning_rate": 3.001633459809023e-06, "epoch": 0.4639056525544755, "percentage": 46.39, "elapsed_time": "15:56:30", "remaining_time": "18:25:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5036, "total_steps": 10853, "loss": 0.1447, "learning_rate": 3.000887146551455e-06, "epoch": 0.4639977887317455, "percentage": 46.4, "elapsed_time": "15:56:41", "remaining_time": "18:25:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5037, "total_steps": 10853, "loss": 0.1351, "learning_rate": 3.000140786786463e-06, "epoch": 0.4640899249090155, "percentage": 46.41, "elapsed_time": "15:56:51", "remaining_time": "18:24:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5038, "total_steps": 10853, "loss": 0.1449, "learning_rate": 2.9993943805833444e-06, "epoch": 0.4641820610862855, "percentage": 46.42, "elapsed_time": "15:57:02", "remaining_time": "18:24:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5039, "total_steps": 10853, "loss": 0.1423, "learning_rate": 2.998647928011404e-06, "epoch": 0.4642741972635555, "percentage": 46.43, "elapsed_time": "15:57:12", "remaining_time": "18:24:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5040, "total_steps": 10853, "loss": 0.1381, "learning_rate": 2.9979014291399495e-06, "epoch": 0.46436633344082556, "percentage": 46.44, "elapsed_time": "15:57:23", "remaining_time": "18:24:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5041, "total_steps": 10853, "loss": 0.1457, "learning_rate": 2.997154884038294e-06, "epoch": 0.46445846961809556, "percentage": 46.45, "elapsed_time": "15:57:33", "remaining_time": "18:24:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5042, "total_steps": 10853, "loss": 0.1434, "learning_rate": 2.9964082927757537e-06, "epoch": 0.46455060579536556, "percentage": 46.46, "elapsed_time": "15:57:44", "remaining_time": "18:23:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5043, "total_steps": 10853, "loss": 0.1422, "learning_rate": 2.995661655421651e-06, "epoch": 0.46464274197263555, "percentage": 46.47, "elapsed_time": "15:57:56", "remaining_time": "18:23:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5044, "total_steps": 10853, "loss": 0.1519, "learning_rate": 2.994914972045309e-06, "epoch": 0.46473487814990555, "percentage": 46.48, "elapsed_time": "15:58:07", "remaining_time": "18:23:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5045, "total_steps": 10853, "loss": 0.1439, "learning_rate": 2.994168242716059e-06, "epoch": 0.46482701432717555, "percentage": 46.48, "elapsed_time": "15:58:16", "remaining_time": "18:23:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5046, "total_steps": 10853, "loss": 0.1444, "learning_rate": 2.9934214675032346e-06, "epoch": 0.46491915050444554, "percentage": 46.49, "elapsed_time": "15:58:27", "remaining_time": "18:23:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5047, "total_steps": 10853, "loss": 0.1519, "learning_rate": 2.9926746464761743e-06, "epoch": 0.4650112866817156, "percentage": 46.5, "elapsed_time": "15:58:38", "remaining_time": "18:22:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5048, "total_steps": 10853, "loss": 0.1358, "learning_rate": 2.9919277797042196e-06, "epoch": 0.4651034228589856, "percentage": 46.51, "elapsed_time": "15:58:49", "remaining_time": "18:22:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5049, "total_steps": 10853, "loss": 0.1421, "learning_rate": 2.991180867256718e-06, "epoch": 0.4651955590362556, "percentage": 46.52, "elapsed_time": "15:59:02", "remaining_time": "18:22:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5050, "total_steps": 10853, "loss": 0.1419, "learning_rate": 2.990433909203019e-06, "epoch": 0.4652876952135256, "percentage": 46.53, "elapsed_time": "15:59:13", "remaining_time": "18:22:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5051, "total_steps": 10853, "loss": 0.1408, "learning_rate": 2.9896869056124795e-06, "epoch": 0.4653798313907956, "percentage": 46.54, "elapsed_time": "15:59:24", "remaining_time": "18:22:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5052, "total_steps": 10853, "loss": 0.1476, "learning_rate": 2.9889398565544576e-06, "epoch": 0.4654719675680656, "percentage": 46.55, "elapsed_time": "15:59:36", "remaining_time": "18:21:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5053, "total_steps": 10853, "loss": 0.1455, "learning_rate": 2.9881927620983175e-06, "epoch": 0.46556410374533563, "percentage": 46.56, "elapsed_time": "15:59:47", "remaining_time": "18:21:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5054, "total_steps": 10853, "loss": 0.1395, "learning_rate": 2.9874456223134273e-06, "epoch": 0.46565623992260563, "percentage": 46.57, "elapsed_time": "15:59:57", "remaining_time": "18:21:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5055, "total_steps": 10853, "loss": 0.1461, "learning_rate": 2.9866984372691586e-06, "epoch": 0.4657483760998756, "percentage": 46.58, "elapsed_time": "16:00:08", "remaining_time": "18:21:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5056, "total_steps": 10853, "loss": 0.1566, "learning_rate": 2.985951207034888e-06, "epoch": 0.4658405122771456, "percentage": 46.59, "elapsed_time": "16:00:19", "remaining_time": "18:21:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5057, "total_steps": 10853, "loss": 0.1524, "learning_rate": 2.985203931679995e-06, "epoch": 0.4659326484544156, "percentage": 46.6, "elapsed_time": "16:00:32", "remaining_time": "18:20:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5058, "total_steps": 10853, "loss": 0.1522, "learning_rate": 2.984456611273864e-06, "epoch": 0.4660247846316856, "percentage": 46.6, "elapsed_time": "16:00:43", "remaining_time": "18:20:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5059, "total_steps": 10853, "loss": 0.1425, "learning_rate": 2.9837092458858862e-06, "epoch": 0.4661169208089556, "percentage": 46.61, "elapsed_time": "16:00:55", "remaining_time": "18:20:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5060, "total_steps": 10853, "loss": 0.1508, "learning_rate": 2.982961835585451e-06, "epoch": 0.46620905698622567, "percentage": 46.62, "elapsed_time": "16:01:06", "remaining_time": "18:20:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5061, "total_steps": 10853, "loss": 0.1443, "learning_rate": 2.9822143804419586e-06, "epoch": 0.46630119316349566, "percentage": 46.63, "elapsed_time": "16:01:16", "remaining_time": "18:20:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5062, "total_steps": 10853, "loss": 0.1619, "learning_rate": 2.981466880524809e-06, "epoch": 0.46639332934076566, "percentage": 46.64, "elapsed_time": "16:01:26", "remaining_time": "18:19:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5063, "total_steps": 10853, "loss": 0.1437, "learning_rate": 2.9807193359034077e-06, "epoch": 0.46648546551803566, "percentage": 46.65, "elapsed_time": "16:01:36", "remaining_time": "18:19:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5064, "total_steps": 10853, "loss": 0.1503, "learning_rate": 2.979971746647164e-06, "epoch": 0.46657760169530565, "percentage": 46.66, "elapsed_time": "16:01:46", "remaining_time": "18:19:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5065, "total_steps": 10853, "loss": 0.1526, "learning_rate": 2.9792241128254916e-06, "epoch": 0.46666973787257565, "percentage": 46.67, "elapsed_time": "16:01:58", "remaining_time": "18:19:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5066, "total_steps": 10853, "loss": 0.1406, "learning_rate": 2.978476434507809e-06, "epoch": 0.46676187404984565, "percentage": 46.68, "elapsed_time": "16:02:08", "remaining_time": "18:19:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5067, "total_steps": 10853, "loss": 0.1501, "learning_rate": 2.9777287117635387e-06, "epoch": 0.4668540102271157, "percentage": 46.69, "elapsed_time": "16:02:19", "remaining_time": "18:18:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5068, "total_steps": 10853, "loss": 0.1398, "learning_rate": 2.9769809446621057e-06, "epoch": 0.4669461464043857, "percentage": 46.7, "elapsed_time": "16:02:28", "remaining_time": "18:18:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5069, "total_steps": 10853, "loss": 0.1374, "learning_rate": 2.9762331332729405e-06, "epoch": 0.4670382825816557, "percentage": 46.71, "elapsed_time": "16:02:38", "remaining_time": "18:18:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5070, "total_steps": 10853, "loss": 0.1469, "learning_rate": 2.975485277665478e-06, "epoch": 0.4671304187589257, "percentage": 46.72, "elapsed_time": "16:02:48", "remaining_time": "18:18:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5071, "total_steps": 10853, "loss": 0.1442, "learning_rate": 2.9747373779091552e-06, "epoch": 0.4672225549361957, "percentage": 46.72, "elapsed_time": "16:02:58", "remaining_time": "18:17:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5072, "total_steps": 10853, "loss": 0.1485, "learning_rate": 2.9739894340734177e-06, "epoch": 0.4673146911134657, "percentage": 46.73, "elapsed_time": "16:03:09", "remaining_time": "18:17:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5073, "total_steps": 10853, "loss": 0.1361, "learning_rate": 2.9732414462277083e-06, "epoch": 0.4674068272907357, "percentage": 46.74, "elapsed_time": "16:03:20", "remaining_time": "18:17:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5074, "total_steps": 10853, "loss": 0.1392, "learning_rate": 2.9724934144414807e-06, "epoch": 0.46749896346800573, "percentage": 46.75, "elapsed_time": "16:03:30", "remaining_time": "18:17:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5075, "total_steps": 10853, "loss": 0.1477, "learning_rate": 2.9717453387841884e-06, "epoch": 0.46759109964527573, "percentage": 46.76, "elapsed_time": "16:03:40", "remaining_time": "18:17:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5076, "total_steps": 10853, "loss": 0.1448, "learning_rate": 2.9709972193252905e-06, "epoch": 0.46768323582254573, "percentage": 46.77, "elapsed_time": "16:03:50", "remaining_time": "18:16:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5077, "total_steps": 10853, "loss": 0.1384, "learning_rate": 2.9702490561342505e-06, "epoch": 0.4677753719998157, "percentage": 46.78, "elapsed_time": "16:04:00", "remaining_time": "18:16:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5078, "total_steps": 10853, "loss": 0.1306, "learning_rate": 2.969500849280535e-06, "epoch": 0.4678675081770857, "percentage": 46.79, "elapsed_time": "16:04:12", "remaining_time": "18:16:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5079, "total_steps": 10853, "loss": 0.144, "learning_rate": 2.9687525988336147e-06, "epoch": 0.4679596443543557, "percentage": 46.8, "elapsed_time": "16:04:24", "remaining_time": "18:16:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5080, "total_steps": 10853, "loss": 0.1363, "learning_rate": 2.968004304862966e-06, "epoch": 0.4680517805316257, "percentage": 46.81, "elapsed_time": "16:04:33", "remaining_time": "18:16:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5081, "total_steps": 10853, "loss": 0.149, "learning_rate": 2.9672559674380664e-06, "epoch": 0.46814391670889577, "percentage": 46.82, "elapsed_time": "16:04:44", "remaining_time": "18:15:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5082, "total_steps": 10853, "loss": 0.1455, "learning_rate": 2.9665075866284e-06, "epoch": 0.46823605288616577, "percentage": 46.83, "elapsed_time": "16:04:55", "remaining_time": "18:15:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5083, "total_steps": 10853, "loss": 0.1342, "learning_rate": 2.9657591625034543e-06, "epoch": 0.46832818906343576, "percentage": 46.83, "elapsed_time": "16:05:06", "remaining_time": "18:15:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5084, "total_steps": 10853, "loss": 0.1346, "learning_rate": 2.9650106951327202e-06, "epoch": 0.46842032524070576, "percentage": 46.84, "elapsed_time": "16:05:16", "remaining_time": "18:15:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5085, "total_steps": 10853, "loss": 0.1434, "learning_rate": 2.964262184585692e-06, "epoch": 0.46851246141797576, "percentage": 46.85, "elapsed_time": "16:05:25", "remaining_time": "18:15:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5086, "total_steps": 10853, "loss": 0.1576, "learning_rate": 2.963513630931872e-06, "epoch": 0.46860459759524575, "percentage": 46.86, "elapsed_time": "16:05:37", "remaining_time": "18:14:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5087, "total_steps": 10853, "loss": 0.1542, "learning_rate": 2.96276503424076e-06, "epoch": 0.4686967337725158, "percentage": 46.87, "elapsed_time": "16:05:47", "remaining_time": "18:14:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5088, "total_steps": 10853, "loss": 0.1441, "learning_rate": 2.9620163945818648e-06, "epoch": 0.4687888699497858, "percentage": 46.88, "elapsed_time": "16:05:57", "remaining_time": "18:14:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5089, "total_steps": 10853, "loss": 0.1608, "learning_rate": 2.961267712024698e-06, "epoch": 0.4688810061270558, "percentage": 46.89, "elapsed_time": "16:06:08", "remaining_time": "18:14:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5090, "total_steps": 10853, "loss": 0.15, "learning_rate": 2.9605189866387746e-06, "epoch": 0.4689731423043258, "percentage": 46.9, "elapsed_time": "16:06:20", "remaining_time": "18:14:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5091, "total_steps": 10853, "loss": 0.1494, "learning_rate": 2.9597702184936137e-06, "epoch": 0.4690652784815958, "percentage": 46.91, "elapsed_time": "16:06:30", "remaining_time": "18:13:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5092, "total_steps": 10853, "loss": 0.1425, "learning_rate": 2.9590214076587386e-06, "epoch": 0.4691574146588658, "percentage": 46.92, "elapsed_time": "16:06:41", "remaining_time": "18:13:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5093, "total_steps": 10853, "loss": 0.1422, "learning_rate": 2.958272554203676e-06, "epoch": 0.4692495508361358, "percentage": 46.93, "elapsed_time": "16:06:51", "remaining_time": "18:13:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5094, "total_steps": 10853, "loss": 0.1467, "learning_rate": 2.9575236581979576e-06, "epoch": 0.46934168701340584, "percentage": 46.94, "elapsed_time": "16:07:01", "remaining_time": "18:13:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5095, "total_steps": 10853, "loss": 0.1387, "learning_rate": 2.9567747197111186e-06, "epoch": 0.46943382319067584, "percentage": 46.95, "elapsed_time": "16:07:12", "remaining_time": "18:13:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5096, "total_steps": 10853, "loss": 0.1473, "learning_rate": 2.9560257388126973e-06, "epoch": 0.46952595936794583, "percentage": 46.95, "elapsed_time": "16:07:22", "remaining_time": "18:12:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5097, "total_steps": 10853, "loss": 0.132, "learning_rate": 2.9552767155722375e-06, "epoch": 0.46961809554521583, "percentage": 46.96, "elapsed_time": "16:07:33", "remaining_time": "18:12:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5098, "total_steps": 10853, "loss": 0.1394, "learning_rate": 2.954527650059285e-06, "epoch": 0.4697102317224858, "percentage": 46.97, "elapsed_time": "16:07:44", "remaining_time": "18:12:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5099, "total_steps": 10853, "loss": 0.1301, "learning_rate": 2.9537785423433925e-06, "epoch": 0.4698023678997558, "percentage": 46.98, "elapsed_time": "16:07:54", "remaining_time": "18:12:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5100, "total_steps": 10853, "loss": 0.1542, "learning_rate": 2.9530293924941123e-06, "epoch": 0.4698945040770258, "percentage": 46.99, "elapsed_time": "16:08:05", "remaining_time": "18:12:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5101, "total_steps": 10853, "loss": 0.1526, "learning_rate": 2.9522802005810043e-06, "epoch": 0.4699866402542959, "percentage": 47.0, "elapsed_time": "16:08:16", "remaining_time": "18:11:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5102, "total_steps": 10853, "loss": 0.1359, "learning_rate": 2.9515309666736312e-06, "epoch": 0.47007877643156587, "percentage": 47.01, "elapsed_time": "16:08:28", "remaining_time": "18:11:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5103, "total_steps": 10853, "loss": 0.1363, "learning_rate": 2.95078169084156e-06, "epoch": 0.47017091260883587, "percentage": 47.02, "elapsed_time": "16:08:40", "remaining_time": "18:11:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5104, "total_steps": 10853, "loss": 0.1252, "learning_rate": 2.9500323731543596e-06, "epoch": 0.47026304878610586, "percentage": 47.03, "elapsed_time": "16:08:50", "remaining_time": "18:11:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5105, "total_steps": 10853, "loss": 0.1407, "learning_rate": 2.9492830136816053e-06, "epoch": 0.47035518496337586, "percentage": 47.04, "elapsed_time": "16:09:02", "remaining_time": "18:11:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5106, "total_steps": 10853, "loss": 0.1543, "learning_rate": 2.948533612492874e-06, "epoch": 0.47044732114064586, "percentage": 47.05, "elapsed_time": "16:09:11", "remaining_time": "18:10:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5107, "total_steps": 10853, "loss": 0.1342, "learning_rate": 2.947784169657749e-06, "epoch": 0.47053945731791585, "percentage": 47.06, "elapsed_time": "16:09:22", "remaining_time": "18:10:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5108, "total_steps": 10853, "loss": 0.1528, "learning_rate": 2.947034685245816e-06, "epoch": 0.4706315934951859, "percentage": 47.07, "elapsed_time": "16:09:32", "remaining_time": "18:10:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5109, "total_steps": 10853, "loss": 0.146, "learning_rate": 2.946285159326664e-06, "epoch": 0.4707237296724559, "percentage": 47.07, "elapsed_time": "16:09:43", "remaining_time": "18:10:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5110, "total_steps": 10853, "loss": 0.1366, "learning_rate": 2.945535591969887e-06, "epoch": 0.4708158658497259, "percentage": 47.08, "elapsed_time": "16:09:54", "remaining_time": "18:10:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5111, "total_steps": 10853, "loss": 0.1327, "learning_rate": 2.944785983245082e-06, "epoch": 0.4709080020269959, "percentage": 47.09, "elapsed_time": "16:10:06", "remaining_time": "18:09:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5112, "total_steps": 10853, "loss": 0.1538, "learning_rate": 2.944036333221851e-06, "epoch": 0.4710001382042659, "percentage": 47.1, "elapsed_time": "16:10:17", "remaining_time": "18:09:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5113, "total_steps": 10853, "loss": 0.1289, "learning_rate": 2.9432866419697993e-06, "epoch": 0.4710922743815359, "percentage": 47.11, "elapsed_time": "16:10:28", "remaining_time": "18:09:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5114, "total_steps": 10853, "loss": 0.133, "learning_rate": 2.9425369095585337e-06, "epoch": 0.4711844105588059, "percentage": 47.12, "elapsed_time": "16:10:38", "remaining_time": "18:09:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5115, "total_steps": 10853, "loss": 0.1358, "learning_rate": 2.94178713605767e-06, "epoch": 0.47127654673607594, "percentage": 47.13, "elapsed_time": "16:10:49", "remaining_time": "18:09:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5116, "total_steps": 10853, "loss": 0.1402, "learning_rate": 2.9410373215368216e-06, "epoch": 0.47136868291334594, "percentage": 47.14, "elapsed_time": "16:11:00", "remaining_time": "18:08:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5117, "total_steps": 10853, "loss": 0.141, "learning_rate": 2.9402874660656113e-06, "epoch": 0.47146081909061593, "percentage": 47.15, "elapsed_time": "16:11:11", "remaining_time": "18:08:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5118, "total_steps": 10853, "loss": 0.1388, "learning_rate": 2.9395375697136623e-06, "epoch": 0.47155295526788593, "percentage": 47.16, "elapsed_time": "16:11:21", "remaining_time": "18:08:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5119, "total_steps": 10853, "loss": 0.14, "learning_rate": 2.9387876325506025e-06, "epoch": 0.47164509144515593, "percentage": 47.17, "elapsed_time": "16:11:31", "remaining_time": "18:08:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5120, "total_steps": 10853, "loss": 0.1344, "learning_rate": 2.9380376546460643e-06, "epoch": 0.4717372276224259, "percentage": 47.18, "elapsed_time": "16:11:42", "remaining_time": "18:08:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5121, "total_steps": 10853, "loss": 0.1398, "learning_rate": 2.9372876360696823e-06, "epoch": 0.471829363799696, "percentage": 47.19, "elapsed_time": "16:11:54", "remaining_time": "18:07:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5122, "total_steps": 10853, "loss": 0.1398, "learning_rate": 2.9365375768910957e-06, "epoch": 0.471921499976966, "percentage": 47.19, "elapsed_time": "16:12:04", "remaining_time": "18:07:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5123, "total_steps": 10853, "loss": 0.128, "learning_rate": 2.935787477179949e-06, "epoch": 0.47201363615423597, "percentage": 47.2, "elapsed_time": "16:12:14", "remaining_time": "18:07:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5124, "total_steps": 10853, "loss": 0.1482, "learning_rate": 2.9350373370058882e-06, "epoch": 0.47210577233150597, "percentage": 47.21, "elapsed_time": "16:12:24", "remaining_time": "18:07:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5125, "total_steps": 10853, "loss": 0.1445, "learning_rate": 2.9342871564385627e-06, "epoch": 0.47219790850877597, "percentage": 47.22, "elapsed_time": "16:12:34", "remaining_time": "18:07:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5126, "total_steps": 10853, "loss": 0.14, "learning_rate": 2.9335369355476295e-06, "epoch": 0.47229004468604596, "percentage": 47.23, "elapsed_time": "16:12:45", "remaining_time": "18:06:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5127, "total_steps": 10853, "loss": 0.1467, "learning_rate": 2.932786674402744e-06, "epoch": 0.47238218086331596, "percentage": 47.24, "elapsed_time": "16:12:55", "remaining_time": "18:06:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5128, "total_steps": 10853, "loss": 0.1528, "learning_rate": 2.9320363730735696e-06, "epoch": 0.472474317040586, "percentage": 47.25, "elapsed_time": "16:13:05", "remaining_time": "18:06:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5129, "total_steps": 10853, "loss": 0.1349, "learning_rate": 2.9312860316297716e-06, "epoch": 0.472566453217856, "percentage": 47.26, "elapsed_time": "16:13:15", "remaining_time": "18:06:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5130, "total_steps": 10853, "loss": 0.147, "learning_rate": 2.930535650141019e-06, "epoch": 0.472658589395126, "percentage": 47.27, "elapsed_time": "16:13:26", "remaining_time": "18:05:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5131, "total_steps": 10853, "loss": 0.1452, "learning_rate": 2.9297852286769852e-06, "epoch": 0.472750725572396, "percentage": 47.28, "elapsed_time": "16:13:38", "remaining_time": "18:05:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5132, "total_steps": 10853, "loss": 0.1353, "learning_rate": 2.9290347673073466e-06, "epoch": 0.472842861749666, "percentage": 47.29, "elapsed_time": "16:13:48", "remaining_time": "18:05:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5133, "total_steps": 10853, "loss": 0.1379, "learning_rate": 2.928284266101783e-06, "epoch": 0.472934997926936, "percentage": 47.3, "elapsed_time": "16:13:58", "remaining_time": "18:05:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5134, "total_steps": 10853, "loss": 0.1373, "learning_rate": 2.9275337251299808e-06, "epoch": 0.473027134104206, "percentage": 47.3, "elapsed_time": "16:14:08", "remaining_time": "18:05:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5135, "total_steps": 10853, "loss": 0.1358, "learning_rate": 2.9267831444616244e-06, "epoch": 0.47311927028147605, "percentage": 47.31, "elapsed_time": "16:14:20", "remaining_time": "18:04:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5136, "total_steps": 10853, "loss": 0.1382, "learning_rate": 2.926032524166408e-06, "epoch": 0.47321140645874604, "percentage": 47.32, "elapsed_time": "16:14:31", "remaining_time": "18:04:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5137, "total_steps": 10853, "loss": 0.143, "learning_rate": 2.9252818643140256e-06, "epoch": 0.47330354263601604, "percentage": 47.33, "elapsed_time": "16:14:41", "remaining_time": "18:04:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5138, "total_steps": 10853, "loss": 0.1354, "learning_rate": 2.9245311649741765e-06, "epoch": 0.47339567881328604, "percentage": 47.34, "elapsed_time": "16:14:52", "remaining_time": "18:04:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5139, "total_steps": 10853, "loss": 0.1494, "learning_rate": 2.9237804262165632e-06, "epoch": 0.47348781499055603, "percentage": 47.35, "elapsed_time": "16:15:01", "remaining_time": "18:04:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5140, "total_steps": 10853, "loss": 0.1491, "learning_rate": 2.9230296481108916e-06, "epoch": 0.47357995116782603, "percentage": 47.36, "elapsed_time": "16:15:13", "remaining_time": "18:03:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5141, "total_steps": 10853, "loss": 0.1469, "learning_rate": 2.922278830726871e-06, "epoch": 0.473672087345096, "percentage": 47.37, "elapsed_time": "16:15:25", "remaining_time": "18:03:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5142, "total_steps": 10853, "loss": 0.1248, "learning_rate": 2.9215279741342165e-06, "epoch": 0.4737642235223661, "percentage": 47.38, "elapsed_time": "16:15:36", "remaining_time": "18:03:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5143, "total_steps": 10853, "loss": 0.1375, "learning_rate": 2.9207770784026436e-06, "epoch": 0.4738563596996361, "percentage": 47.39, "elapsed_time": "16:15:45", "remaining_time": "18:03:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5144, "total_steps": 10853, "loss": 0.1277, "learning_rate": 2.920026143601874e-06, "epoch": 0.4739484958769061, "percentage": 47.4, "elapsed_time": "16:15:56", "remaining_time": "18:03:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5145, "total_steps": 10853, "loss": 0.1368, "learning_rate": 2.9192751698016317e-06, "epoch": 0.47404063205417607, "percentage": 47.41, "elapsed_time": "16:16:07", "remaining_time": "18:02:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5146, "total_steps": 10853, "loss": 0.1509, "learning_rate": 2.918524157071645e-06, "epoch": 0.47413276823144607, "percentage": 47.42, "elapsed_time": "16:16:19", "remaining_time": "18:02:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5147, "total_steps": 10853, "loss": 0.1535, "learning_rate": 2.917773105481645e-06, "epoch": 0.47422490440871606, "percentage": 47.42, "elapsed_time": "16:16:30", "remaining_time": "18:02:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5148, "total_steps": 10853, "loss": 0.1312, "learning_rate": 2.917022015101367e-06, "epoch": 0.47431704058598606, "percentage": 47.43, "elapsed_time": "16:16:40", "remaining_time": "18:02:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5149, "total_steps": 10853, "loss": 0.1525, "learning_rate": 2.91627088600055e-06, "epoch": 0.4744091767632561, "percentage": 47.44, "elapsed_time": "16:16:52", "remaining_time": "18:02:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5150, "total_steps": 10853, "loss": 0.133, "learning_rate": 2.9155197182489375e-06, "epoch": 0.4745013129405261, "percentage": 47.45, "elapsed_time": "16:17:03", "remaining_time": "18:01:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5151, "total_steps": 10853, "loss": 0.1194, "learning_rate": 2.9147685119162735e-06, "epoch": 0.4745934491177961, "percentage": 47.46, "elapsed_time": "16:17:13", "remaining_time": "18:01:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5152, "total_steps": 10853, "loss": 0.1364, "learning_rate": 2.9140172670723083e-06, "epoch": 0.4746855852950661, "percentage": 47.47, "elapsed_time": "16:17:24", "remaining_time": "18:01:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5153, "total_steps": 10853, "loss": 0.1367, "learning_rate": 2.913265983786796e-06, "epoch": 0.4747777214723361, "percentage": 47.48, "elapsed_time": "16:17:34", "remaining_time": "18:01:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5154, "total_steps": 10853, "loss": 0.1585, "learning_rate": 2.9125146621294915e-06, "epoch": 0.4748698576496061, "percentage": 47.49, "elapsed_time": "16:17:45", "remaining_time": "18:01:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5155, "total_steps": 10853, "loss": 0.1482, "learning_rate": 2.9117633021701574e-06, "epoch": 0.47496199382687615, "percentage": 47.5, "elapsed_time": "16:17:56", "remaining_time": "18:00:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5156, "total_steps": 10853, "loss": 0.1425, "learning_rate": 2.9110119039785554e-06, "epoch": 0.47505413000414615, "percentage": 47.51, "elapsed_time": "16:18:07", "remaining_time": "18:00:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5157, "total_steps": 10853, "loss": 0.153, "learning_rate": 2.910260467624455e-06, "epoch": 0.47514626618141614, "percentage": 47.52, "elapsed_time": "16:18:18", "remaining_time": "18:00:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5158, "total_steps": 10853, "loss": 0.1476, "learning_rate": 2.9095089931776255e-06, "epoch": 0.47523840235868614, "percentage": 47.53, "elapsed_time": "16:18:28", "remaining_time": "18:00:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5159, "total_steps": 10853, "loss": 0.1553, "learning_rate": 2.908757480707842e-06, "epoch": 0.47533053853595614, "percentage": 47.54, "elapsed_time": "16:18:38", "remaining_time": "18:00:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5160, "total_steps": 10853, "loss": 0.1523, "learning_rate": 2.908005930284882e-06, "epoch": 0.47542267471322613, "percentage": 47.54, "elapsed_time": "16:18:50", "remaining_time": "17:59:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5161, "total_steps": 10853, "loss": 0.1479, "learning_rate": 2.907254341978528e-06, "epoch": 0.47551481089049613, "percentage": 47.55, "elapsed_time": "16:19:01", "remaining_time": "17:59:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5162, "total_steps": 10853, "loss": 0.1532, "learning_rate": 2.906502715858564e-06, "epoch": 0.4756069470677662, "percentage": 47.56, "elapsed_time": "16:19:13", "remaining_time": "17:59:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5163, "total_steps": 10853, "loss": 0.1359, "learning_rate": 2.9057510519947794e-06, "epoch": 0.4756990832450362, "percentage": 47.57, "elapsed_time": "16:19:26", "remaining_time": "17:59:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5164, "total_steps": 10853, "loss": 0.1465, "learning_rate": 2.9049993504569663e-06, "epoch": 0.4757912194223062, "percentage": 47.58, "elapsed_time": "16:19:37", "remaining_time": "17:59:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5165, "total_steps": 10853, "loss": 0.136, "learning_rate": 2.9042476113149193e-06, "epoch": 0.4758833555995762, "percentage": 47.59, "elapsed_time": "16:19:48", "remaining_time": "17:59:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5166, "total_steps": 10853, "loss": 0.1507, "learning_rate": 2.9034958346384385e-06, "epoch": 0.47597549177684617, "percentage": 47.6, "elapsed_time": "16:19:58", "remaining_time": "17:58:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5167, "total_steps": 10853, "loss": 0.1503, "learning_rate": 2.9027440204973263e-06, "epoch": 0.47606762795411617, "percentage": 47.61, "elapsed_time": "16:20:11", "remaining_time": "17:58:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5168, "total_steps": 10853, "loss": 0.1339, "learning_rate": 2.9019921689613874e-06, "epoch": 0.47615976413138617, "percentage": 47.62, "elapsed_time": "16:20:22", "remaining_time": "17:58:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5169, "total_steps": 10853, "loss": 0.1389, "learning_rate": 2.9012402801004334e-06, "epoch": 0.4762519003086562, "percentage": 47.63, "elapsed_time": "16:20:32", "remaining_time": "17:58:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5170, "total_steps": 10853, "loss": 0.1456, "learning_rate": 2.9004883539842756e-06, "epoch": 0.4763440364859262, "percentage": 47.64, "elapsed_time": "16:20:45", "remaining_time": "17:58:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5171, "total_steps": 10853, "loss": 0.1365, "learning_rate": 2.8997363906827315e-06, "epoch": 0.4764361726631962, "percentage": 47.65, "elapsed_time": "16:20:56", "remaining_time": "17:57:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5172, "total_steps": 10853, "loss": 0.1291, "learning_rate": 2.8989843902656202e-06, "epoch": 0.4765283088404662, "percentage": 47.66, "elapsed_time": "16:21:06", "remaining_time": "17:57:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5173, "total_steps": 10853, "loss": 0.1453, "learning_rate": 2.898232352802765e-06, "epoch": 0.4766204450177362, "percentage": 47.66, "elapsed_time": "16:21:16", "remaining_time": "17:57:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5174, "total_steps": 10853, "loss": 0.133, "learning_rate": 2.8974802783639934e-06, "epoch": 0.4767125811950062, "percentage": 47.67, "elapsed_time": "16:21:26", "remaining_time": "17:57:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5175, "total_steps": 10853, "loss": 0.146, "learning_rate": 2.8967281670191357e-06, "epoch": 0.4768047173722762, "percentage": 47.68, "elapsed_time": "16:21:37", "remaining_time": "17:57:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5176, "total_steps": 10853, "loss": 0.1397, "learning_rate": 2.895976018838024e-06, "epoch": 0.47689685354954625, "percentage": 47.69, "elapsed_time": "16:21:48", "remaining_time": "17:56:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5177, "total_steps": 10853, "loss": 0.1368, "learning_rate": 2.895223833890497e-06, "epoch": 0.47698898972681625, "percentage": 47.7, "elapsed_time": "16:21:58", "remaining_time": "17:56:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5178, "total_steps": 10853, "loss": 0.127, "learning_rate": 2.8944716122463933e-06, "epoch": 0.47708112590408625, "percentage": 47.71, "elapsed_time": "16:22:10", "remaining_time": "17:56:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5179, "total_steps": 10853, "loss": 0.133, "learning_rate": 2.8937193539755593e-06, "epoch": 0.47717326208135624, "percentage": 47.72, "elapsed_time": "16:22:21", "remaining_time": "17:56:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5180, "total_steps": 10853, "loss": 0.1597, "learning_rate": 2.8929670591478404e-06, "epoch": 0.47726539825862624, "percentage": 47.73, "elapsed_time": "16:22:33", "remaining_time": "17:56:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5181, "total_steps": 10853, "loss": 0.1544, "learning_rate": 2.8922147278330876e-06, "epoch": 0.47735753443589624, "percentage": 47.74, "elapsed_time": "16:22:44", "remaining_time": "17:55:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5182, "total_steps": 10853, "loss": 0.1517, "learning_rate": 2.891462360101156e-06, "epoch": 0.47744967061316623, "percentage": 47.75, "elapsed_time": "16:22:54", "remaining_time": "17:55:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5183, "total_steps": 10853, "loss": 0.14, "learning_rate": 2.890709956021901e-06, "epoch": 0.4775418067904363, "percentage": 47.76, "elapsed_time": "16:23:06", "remaining_time": "17:55:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5184, "total_steps": 10853, "loss": 0.1374, "learning_rate": 2.8899575156651847e-06, "epoch": 0.4776339429677063, "percentage": 47.77, "elapsed_time": "16:23:17", "remaining_time": "17:55:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5185, "total_steps": 10853, "loss": 0.1415, "learning_rate": 2.889205039100872e-06, "epoch": 0.4777260791449763, "percentage": 47.77, "elapsed_time": "16:23:29", "remaining_time": "17:55:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5186, "total_steps": 10853, "loss": 0.1265, "learning_rate": 2.8884525263988288e-06, "epoch": 0.4778182153222463, "percentage": 47.78, "elapsed_time": "16:23:41", "remaining_time": "17:54:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5187, "total_steps": 10853, "loss": 0.1262, "learning_rate": 2.887699977628927e-06, "epoch": 0.4779103514995163, "percentage": 47.79, "elapsed_time": "16:23:51", "remaining_time": "17:54:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5188, "total_steps": 10853, "loss": 0.1349, "learning_rate": 2.886947392861041e-06, "epoch": 0.47800248767678627, "percentage": 47.8, "elapsed_time": "16:24:02", "remaining_time": "17:54:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5189, "total_steps": 10853, "loss": 0.1479, "learning_rate": 2.886194772165046e-06, "epoch": 0.4780946238540563, "percentage": 47.81, "elapsed_time": "16:24:14", "remaining_time": "17:54:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5190, "total_steps": 10853, "loss": 0.15, "learning_rate": 2.8854421156108276e-06, "epoch": 0.4781867600313263, "percentage": 47.82, "elapsed_time": "16:24:25", "remaining_time": "17:54:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5191, "total_steps": 10853, "loss": 0.1476, "learning_rate": 2.8846894232682654e-06, "epoch": 0.4782788962085963, "percentage": 47.83, "elapsed_time": "16:24:35", "remaining_time": "17:53:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5192, "total_steps": 10853, "loss": 0.147, "learning_rate": 2.883936695207249e-06, "epoch": 0.4783710323858663, "percentage": 47.84, "elapsed_time": "16:24:46", "remaining_time": "17:53:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5193, "total_steps": 10853, "loss": 0.1506, "learning_rate": 2.8831839314976696e-06, "epoch": 0.4784631685631363, "percentage": 47.85, "elapsed_time": "16:24:57", "remaining_time": "17:53:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5194, "total_steps": 10853, "loss": 0.137, "learning_rate": 2.8824311322094213e-06, "epoch": 0.4785553047404063, "percentage": 47.86, "elapsed_time": "16:25:08", "remaining_time": "17:53:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5195, "total_steps": 10853, "loss": 0.1586, "learning_rate": 2.8816782974124007e-06, "epoch": 0.4786474409176763, "percentage": 47.87, "elapsed_time": "16:25:20", "remaining_time": "17:53:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5196, "total_steps": 10853, "loss": 0.1361, "learning_rate": 2.880925427176509e-06, "epoch": 0.47873957709494636, "percentage": 47.88, "elapsed_time": "16:25:30", "remaining_time": "17:52:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5197, "total_steps": 10853, "loss": 0.1474, "learning_rate": 2.8801725215716504e-06, "epoch": 0.47883171327221635, "percentage": 47.89, "elapsed_time": "16:25:40", "remaining_time": "17:52:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5198, "total_steps": 10853, "loss": 0.1216, "learning_rate": 2.879419580667733e-06, "epoch": 0.47892384944948635, "percentage": 47.89, "elapsed_time": "16:25:50", "remaining_time": "17:52:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5199, "total_steps": 10853, "loss": 0.1295, "learning_rate": 2.878666604534665e-06, "epoch": 0.47901598562675635, "percentage": 47.9, "elapsed_time": "16:26:00", "remaining_time": "17:52:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5200, "total_steps": 10853, "loss": 0.1377, "learning_rate": 2.8779135932423633e-06, "epoch": 0.47910812180402634, "percentage": 47.91, "elapsed_time": "16:26:12", "remaining_time": "17:52:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5201, "total_steps": 10853, "loss": 0.1505, "learning_rate": 2.877160546860744e-06, "epoch": 0.47920025798129634, "percentage": 47.92, "elapsed_time": "16:26:22", "remaining_time": "17:51:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5202, "total_steps": 10853, "loss": 0.1312, "learning_rate": 2.8764074654597267e-06, "epoch": 0.47929239415856634, "percentage": 47.93, "elapsed_time": "16:26:32", "remaining_time": "17:51:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5203, "total_steps": 10853, "loss": 0.1472, "learning_rate": 2.8756543491092352e-06, "epoch": 0.4793845303358364, "percentage": 47.94, "elapsed_time": "16:26:43", "remaining_time": "17:51:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5204, "total_steps": 10853, "loss": 0.1528, "learning_rate": 2.8749011978791984e-06, "epoch": 0.4794766665131064, "percentage": 47.95, "elapsed_time": "16:26:54", "remaining_time": "17:51:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5205, "total_steps": 10853, "loss": 0.1167, "learning_rate": 2.8741480118395443e-06, "epoch": 0.4795688026903764, "percentage": 47.96, "elapsed_time": "16:27:05", "remaining_time": "17:51:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5206, "total_steps": 10853, "loss": 0.1477, "learning_rate": 2.873394791060207e-06, "epoch": 0.4796609388676464, "percentage": 47.97, "elapsed_time": "16:27:15", "remaining_time": "17:50:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5207, "total_steps": 10853, "loss": 0.1526, "learning_rate": 2.872641535611123e-06, "epoch": 0.4797530750449164, "percentage": 47.98, "elapsed_time": "16:27:28", "remaining_time": "17:50:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5208, "total_steps": 10853, "loss": 0.1596, "learning_rate": 2.8718882455622334e-06, "epoch": 0.4798452112221864, "percentage": 47.99, "elapsed_time": "16:27:39", "remaining_time": "17:50:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5209, "total_steps": 10853, "loss": 0.1333, "learning_rate": 2.871134920983479e-06, "epoch": 0.47993734739945637, "percentage": 48.0, "elapsed_time": "16:27:49", "remaining_time": "17:50:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5210, "total_steps": 10853, "loss": 0.1379, "learning_rate": 2.8703815619448072e-06, "epoch": 0.4800294835767264, "percentage": 48.01, "elapsed_time": "16:28:00", "remaining_time": "17:50:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5211, "total_steps": 10853, "loss": 0.1366, "learning_rate": 2.8696281685161676e-06, "epoch": 0.4801216197539964, "percentage": 48.01, "elapsed_time": "16:28:11", "remaining_time": "17:49:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5212, "total_steps": 10853, "loss": 0.1359, "learning_rate": 2.868874740767513e-06, "epoch": 0.4802137559312664, "percentage": 48.02, "elapsed_time": "16:28:22", "remaining_time": "17:49:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5213, "total_steps": 10853, "loss": 0.1468, "learning_rate": 2.8681212787687997e-06, "epoch": 0.4803058921085364, "percentage": 48.03, "elapsed_time": "16:28:31", "remaining_time": "17:49:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5214, "total_steps": 10853, "loss": 0.156, "learning_rate": 2.8673677825899852e-06, "epoch": 0.4803980282858064, "percentage": 48.04, "elapsed_time": "16:28:42", "remaining_time": "17:49:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5215, "total_steps": 10853, "loss": 0.1298, "learning_rate": 2.866614252301033e-06, "epoch": 0.4804901644630764, "percentage": 48.05, "elapsed_time": "16:28:52", "remaining_time": "17:49:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5216, "total_steps": 10853, "loss": 0.1504, "learning_rate": 2.865860687971907e-06, "epoch": 0.4805823006403464, "percentage": 48.06, "elapsed_time": "16:29:02", "remaining_time": "17:48:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5217, "total_steps": 10853, "loss": 0.1438, "learning_rate": 2.8651070896725786e-06, "epoch": 0.48067443681761646, "percentage": 48.07, "elapsed_time": "16:29:13", "remaining_time": "17:48:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5218, "total_steps": 10853, "loss": 0.1456, "learning_rate": 2.864353457473016e-06, "epoch": 0.48076657299488645, "percentage": 48.08, "elapsed_time": "16:29:25", "remaining_time": "17:48:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5219, "total_steps": 10853, "loss": 0.1452, "learning_rate": 2.863599791443196e-06, "epoch": 0.48085870917215645, "percentage": 48.09, "elapsed_time": "16:29:36", "remaining_time": "17:48:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5220, "total_steps": 10853, "loss": 0.1484, "learning_rate": 2.8628460916530967e-06, "epoch": 0.48095084534942645, "percentage": 48.1, "elapsed_time": "16:29:46", "remaining_time": "17:48:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5221, "total_steps": 10853, "loss": 0.1481, "learning_rate": 2.8620923581726983e-06, "epoch": 0.48104298152669644, "percentage": 48.11, "elapsed_time": "16:29:57", "remaining_time": "17:47:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5222, "total_steps": 10853, "loss": 0.1434, "learning_rate": 2.861338591071986e-06, "epoch": 0.48113511770396644, "percentage": 48.12, "elapsed_time": "16:30:08", "remaining_time": "17:47:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5223, "total_steps": 10853, "loss": 0.1362, "learning_rate": 2.860584790420946e-06, "epoch": 0.4812272538812365, "percentage": 48.12, "elapsed_time": "16:30:18", "remaining_time": "17:47:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5224, "total_steps": 10853, "loss": 0.1554, "learning_rate": 2.85983095628957e-06, "epoch": 0.4813193900585065, "percentage": 48.13, "elapsed_time": "16:30:28", "remaining_time": "17:47:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5225, "total_steps": 10853, "loss": 0.1425, "learning_rate": 2.8590770887478507e-06, "epoch": 0.4814115262357765, "percentage": 48.14, "elapsed_time": "16:30:38", "remaining_time": "17:47:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5226, "total_steps": 10853, "loss": 0.1329, "learning_rate": 2.8583231878657847e-06, "epoch": 0.4815036624130465, "percentage": 48.15, "elapsed_time": "16:30:50", "remaining_time": "17:46:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5227, "total_steps": 10853, "loss": 0.1499, "learning_rate": 2.8575692537133726e-06, "epoch": 0.4815957985903165, "percentage": 48.16, "elapsed_time": "16:31:00", "remaining_time": "17:46:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5228, "total_steps": 10853, "loss": 0.1433, "learning_rate": 2.8568152863606167e-06, "epoch": 0.4816879347675865, "percentage": 48.17, "elapsed_time": "16:31:11", "remaining_time": "17:46:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5229, "total_steps": 10853, "loss": 0.1303, "learning_rate": 2.8560612858775233e-06, "epoch": 0.4817800709448565, "percentage": 48.18, "elapsed_time": "16:31:22", "remaining_time": "17:46:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5230, "total_steps": 10853, "loss": 0.1498, "learning_rate": 2.8553072523341008e-06, "epoch": 0.48187220712212653, "percentage": 48.19, "elapsed_time": "16:31:34", "remaining_time": "17:46:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5231, "total_steps": 10853, "loss": 0.1238, "learning_rate": 2.8545531858003623e-06, "epoch": 0.4819643432993965, "percentage": 48.2, "elapsed_time": "16:31:43", "remaining_time": "17:45:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5232, "total_steps": 10853, "loss": 0.1298, "learning_rate": 2.8537990863463212e-06, "epoch": 0.4820564794766665, "percentage": 48.21, "elapsed_time": "16:31:54", "remaining_time": "17:45:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5233, "total_steps": 10853, "loss": 0.1454, "learning_rate": 2.853044954041998e-06, "epoch": 0.4821486156539365, "percentage": 48.22, "elapsed_time": "16:32:05", "remaining_time": "17:45:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5234, "total_steps": 10853, "loss": 0.1524, "learning_rate": 2.8522907889574117e-06, "epoch": 0.4822407518312065, "percentage": 48.23, "elapsed_time": "16:32:16", "remaining_time": "17:45:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5235, "total_steps": 10853, "loss": 0.1529, "learning_rate": 2.851536591162589e-06, "epoch": 0.4823328880084765, "percentage": 48.24, "elapsed_time": "16:32:27", "remaining_time": "17:45:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5236, "total_steps": 10853, "loss": 0.1484, "learning_rate": 2.8507823607275554e-06, "epoch": 0.4824250241857465, "percentage": 48.24, "elapsed_time": "16:32:37", "remaining_time": "17:44:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5237, "total_steps": 10853, "loss": 0.1247, "learning_rate": 2.8500280977223416e-06, "epoch": 0.48251716036301656, "percentage": 48.25, "elapsed_time": "16:32:46", "remaining_time": "17:44:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5238, "total_steps": 10853, "loss": 0.1393, "learning_rate": 2.8492738022169815e-06, "epoch": 0.48260929654028656, "percentage": 48.26, "elapsed_time": "16:32:57", "remaining_time": "17:44:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5239, "total_steps": 10853, "loss": 0.1298, "learning_rate": 2.848519474281511e-06, "epoch": 0.48270143271755656, "percentage": 48.27, "elapsed_time": "16:33:07", "remaining_time": "17:44:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5240, "total_steps": 10853, "loss": 0.1498, "learning_rate": 2.84776511398597e-06, "epoch": 0.48279356889482655, "percentage": 48.28, "elapsed_time": "16:33:18", "remaining_time": "17:44:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5241, "total_steps": 10853, "loss": 0.1477, "learning_rate": 2.847010721400401e-06, "epoch": 0.48288570507209655, "percentage": 48.29, "elapsed_time": "16:33:29", "remaining_time": "17:43:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5242, "total_steps": 10853, "loss": 0.1316, "learning_rate": 2.8462562965948493e-06, "epoch": 0.48297784124936655, "percentage": 48.3, "elapsed_time": "16:33:40", "remaining_time": "17:43:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5243, "total_steps": 10853, "loss": 0.1386, "learning_rate": 2.8455018396393618e-06, "epoch": 0.48306997742663654, "percentage": 48.31, "elapsed_time": "16:33:50", "remaining_time": "17:43:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5244, "total_steps": 10853, "loss": 0.1274, "learning_rate": 2.8447473506039934e-06, "epoch": 0.4831621136039066, "percentage": 48.32, "elapsed_time": "16:34:00", "remaining_time": "17:43:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5245, "total_steps": 10853, "loss": 0.1402, "learning_rate": 2.8439928295587948e-06, "epoch": 0.4832542497811766, "percentage": 48.33, "elapsed_time": "16:34:10", "remaining_time": "17:42:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5246, "total_steps": 10853, "loss": 0.1395, "learning_rate": 2.843238276573826e-06, "epoch": 0.4833463859584466, "percentage": 48.34, "elapsed_time": "16:34:22", "remaining_time": "17:42:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5247, "total_steps": 10853, "loss": 0.1397, "learning_rate": 2.8424836917191455e-06, "epoch": 0.4834385221357166, "percentage": 48.35, "elapsed_time": "16:34:32", "remaining_time": "17:42:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5248, "total_steps": 10853, "loss": 0.1326, "learning_rate": 2.841729075064818e-06, "epoch": 0.4835306583129866, "percentage": 48.36, "elapsed_time": "16:34:44", "remaining_time": "17:42:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5249, "total_steps": 10853, "loss": 0.1308, "learning_rate": 2.840974426680909e-06, "epoch": 0.4836227944902566, "percentage": 48.36, "elapsed_time": "16:34:54", "remaining_time": "17:42:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5250, "total_steps": 10853, "loss": 0.1499, "learning_rate": 2.840219746637487e-06, "epoch": 0.4837149306675266, "percentage": 48.37, "elapsed_time": "16:35:05", "remaining_time": "17:41:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5251, "total_steps": 10853, "loss": 0.1326, "learning_rate": 2.8394650350046256e-06, "epoch": 0.48380706684479663, "percentage": 48.38, "elapsed_time": "16:35:16", "remaining_time": "17:41:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5252, "total_steps": 10853, "loss": 0.1516, "learning_rate": 2.8387102918523995e-06, "epoch": 0.4838992030220666, "percentage": 48.39, "elapsed_time": "16:35:27", "remaining_time": "17:41:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5253, "total_steps": 10853, "loss": 0.125, "learning_rate": 2.8379555172508853e-06, "epoch": 0.4839913391993366, "percentage": 48.4, "elapsed_time": "16:35:38", "remaining_time": "17:41:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5254, "total_steps": 10853, "loss": 0.1415, "learning_rate": 2.8372007112701657e-06, "epoch": 0.4840834753766066, "percentage": 48.41, "elapsed_time": "16:35:49", "remaining_time": "17:41:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5255, "total_steps": 10853, "loss": 0.1394, "learning_rate": 2.8364458739803237e-06, "epoch": 0.4841756115538766, "percentage": 48.42, "elapsed_time": "16:36:00", "remaining_time": "17:41:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5256, "total_steps": 10853, "loss": 0.1497, "learning_rate": 2.835691005451446e-06, "epoch": 0.4842677477311466, "percentage": 48.43, "elapsed_time": "16:36:10", "remaining_time": "17:40:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5257, "total_steps": 10853, "loss": 0.1438, "learning_rate": 2.8349361057536223e-06, "epoch": 0.48435988390841667, "percentage": 48.44, "elapsed_time": "16:36:23", "remaining_time": "17:40:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5258, "total_steps": 10853, "loss": 0.1391, "learning_rate": 2.8341811749569452e-06, "epoch": 0.48445202008568666, "percentage": 48.45, "elapsed_time": "16:36:34", "remaining_time": "17:40:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5259, "total_steps": 10853, "loss": 0.1476, "learning_rate": 2.8334262131315094e-06, "epoch": 0.48454415626295666, "percentage": 48.46, "elapsed_time": "16:36:46", "remaining_time": "17:40:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5260, "total_steps": 10853, "loss": 0.1265, "learning_rate": 2.832671220347415e-06, "epoch": 0.48463629244022666, "percentage": 48.47, "elapsed_time": "16:36:57", "remaining_time": "17:40:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5261, "total_steps": 10853, "loss": 0.1506, "learning_rate": 2.831916196674761e-06, "epoch": 0.48472842861749665, "percentage": 48.48, "elapsed_time": "16:37:08", "remaining_time": "17:39:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5262, "total_steps": 10853, "loss": 0.1442, "learning_rate": 2.831161142183653e-06, "epoch": 0.48482056479476665, "percentage": 48.48, "elapsed_time": "16:37:18", "remaining_time": "17:39:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5263, "total_steps": 10853, "loss": 0.1395, "learning_rate": 2.830406056944197e-06, "epoch": 0.48491270097203665, "percentage": 48.49, "elapsed_time": "16:37:29", "remaining_time": "17:39:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5264, "total_steps": 10853, "loss": 0.1478, "learning_rate": 2.8296509410265032e-06, "epoch": 0.4850048371493067, "percentage": 48.5, "elapsed_time": "16:37:40", "remaining_time": "17:39:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5265, "total_steps": 10853, "loss": 0.1462, "learning_rate": 2.8288957945006845e-06, "epoch": 0.4850969733265767, "percentage": 48.51, "elapsed_time": "16:37:51", "remaining_time": "17:39:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5266, "total_steps": 10853, "loss": 0.1419, "learning_rate": 2.8281406174368555e-06, "epoch": 0.4851891095038467, "percentage": 48.52, "elapsed_time": "16:38:02", "remaining_time": "17:38:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5267, "total_steps": 10853, "loss": 0.1488, "learning_rate": 2.827385409905134e-06, "epoch": 0.4852812456811167, "percentage": 48.53, "elapsed_time": "16:38:15", "remaining_time": "17:38:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5268, "total_steps": 10853, "loss": 0.1428, "learning_rate": 2.8266301719756427e-06, "epoch": 0.4853733818583867, "percentage": 48.54, "elapsed_time": "16:38:26", "remaining_time": "17:38:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5269, "total_steps": 10853, "loss": 0.1478, "learning_rate": 2.825874903718505e-06, "epoch": 0.4854655180356567, "percentage": 48.55, "elapsed_time": "16:38:38", "remaining_time": "17:38:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5270, "total_steps": 10853, "loss": 0.1551, "learning_rate": 2.8251196052038475e-06, "epoch": 0.4855576542129267, "percentage": 48.56, "elapsed_time": "16:38:49", "remaining_time": "17:38:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5271, "total_steps": 10853, "loss": 0.1507, "learning_rate": 2.8243642765017993e-06, "epoch": 0.48564979039019673, "percentage": 48.57, "elapsed_time": "16:38:59", "remaining_time": "17:37:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5272, "total_steps": 10853, "loss": 0.123, "learning_rate": 2.8236089176824926e-06, "epoch": 0.48574192656746673, "percentage": 48.58, "elapsed_time": "16:39:08", "remaining_time": "17:37:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5273, "total_steps": 10853, "loss": 0.1285, "learning_rate": 2.8228535288160647e-06, "epoch": 0.4858340627447367, "percentage": 48.59, "elapsed_time": "16:39:18", "remaining_time": "17:37:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5274, "total_steps": 10853, "loss": 0.1501, "learning_rate": 2.8220981099726503e-06, "epoch": 0.4859261989220067, "percentage": 48.59, "elapsed_time": "16:39:28", "remaining_time": "17:37:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5275, "total_steps": 10853, "loss": 0.1459, "learning_rate": 2.821342661222392e-06, "epoch": 0.4860183350992767, "percentage": 48.6, "elapsed_time": "16:39:38", "remaining_time": "17:37:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5276, "total_steps": 10853, "loss": 0.1447, "learning_rate": 2.8205871826354336e-06, "epoch": 0.4861104712765467, "percentage": 48.61, "elapsed_time": "16:39:49", "remaining_time": "17:36:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5277, "total_steps": 10853, "loss": 0.1372, "learning_rate": 2.819831674281921e-06, "epoch": 0.4862026074538167, "percentage": 48.62, "elapsed_time": "16:40:00", "remaining_time": "17:36:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5278, "total_steps": 10853, "loss": 0.1374, "learning_rate": 2.819076136232002e-06, "epoch": 0.48629474363108677, "percentage": 48.63, "elapsed_time": "16:40:08", "remaining_time": "17:36:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5279, "total_steps": 10853, "loss": 0.1486, "learning_rate": 2.81832056855583e-06, "epoch": 0.48638687980835676, "percentage": 48.64, "elapsed_time": "16:40:18", "remaining_time": "17:36:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5280, "total_steps": 10853, "loss": 0.1447, "learning_rate": 2.8175649713235586e-06, "epoch": 0.48647901598562676, "percentage": 48.65, "elapsed_time": "16:40:29", "remaining_time": "17:36:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5281, "total_steps": 10853, "loss": 0.1321, "learning_rate": 2.8168093446053455e-06, "epoch": 0.48657115216289676, "percentage": 48.66, "elapsed_time": "16:40:40", "remaining_time": "17:35:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5282, "total_steps": 10853, "loss": 0.1351, "learning_rate": 2.816053688471351e-06, "epoch": 0.48666328834016676, "percentage": 48.67, "elapsed_time": "16:40:51", "remaining_time": "17:35:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5283, "total_steps": 10853, "loss": 0.1382, "learning_rate": 2.815298002991738e-06, "epoch": 0.48675542451743675, "percentage": 48.68, "elapsed_time": "16:41:03", "remaining_time": "17:35:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5284, "total_steps": 10853, "loss": 0.1251, "learning_rate": 2.8145422882366707e-06, "epoch": 0.48684756069470675, "percentage": 48.69, "elapsed_time": "16:41:14", "remaining_time": "17:35:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5285, "total_steps": 10853, "loss": 0.155, "learning_rate": 2.8137865442763186e-06, "epoch": 0.4869396968719768, "percentage": 48.7, "elapsed_time": "16:41:25", "remaining_time": "17:35:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5286, "total_steps": 10853, "loss": 0.1389, "learning_rate": 2.813030771180851e-06, "epoch": 0.4870318330492468, "percentage": 48.71, "elapsed_time": "16:41:36", "remaining_time": "17:34:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5287, "total_steps": 10853, "loss": 0.1375, "learning_rate": 2.8122749690204443e-06, "epoch": 0.4871239692265168, "percentage": 48.71, "elapsed_time": "16:41:46", "remaining_time": "17:34:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5288, "total_steps": 10853, "loss": 0.1402, "learning_rate": 2.8115191378652716e-06, "epoch": 0.4872161054037868, "percentage": 48.72, "elapsed_time": "16:41:57", "remaining_time": "17:34:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5289, "total_steps": 10853, "loss": 0.1345, "learning_rate": 2.810763277785514e-06, "epoch": 0.4873082415810568, "percentage": 48.73, "elapsed_time": "16:42:08", "remaining_time": "17:34:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5290, "total_steps": 10853, "loss": 0.1616, "learning_rate": 2.810007388851353e-06, "epoch": 0.4874003777583268, "percentage": 48.74, "elapsed_time": "16:42:18", "remaining_time": "17:34:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5291, "total_steps": 10853, "loss": 0.1513, "learning_rate": 2.809251471132972e-06, "epoch": 0.48749251393559684, "percentage": 48.75, "elapsed_time": "16:42:28", "remaining_time": "17:33:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5292, "total_steps": 10853, "loss": 0.1291, "learning_rate": 2.808495524700559e-06, "epoch": 0.48758465011286684, "percentage": 48.76, "elapsed_time": "16:42:40", "remaining_time": "17:33:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5293, "total_steps": 10853, "loss": 0.1389, "learning_rate": 2.807739549624303e-06, "epoch": 0.48767678629013683, "percentage": 48.77, "elapsed_time": "16:42:50", "remaining_time": "17:33:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5294, "total_steps": 10853, "loss": 0.1393, "learning_rate": 2.8069835459743965e-06, "epoch": 0.48776892246740683, "percentage": 48.78, "elapsed_time": "16:43:00", "remaining_time": "17:33:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5295, "total_steps": 10853, "loss": 0.1351, "learning_rate": 2.8062275138210355e-06, "epoch": 0.4878610586446768, "percentage": 48.79, "elapsed_time": "16:43:10", "remaining_time": "17:33:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5296, "total_steps": 10853, "loss": 0.1308, "learning_rate": 2.805471453234416e-06, "epoch": 0.4879531948219468, "percentage": 48.8, "elapsed_time": "16:43:21", "remaining_time": "17:32:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5297, "total_steps": 10853, "loss": 0.1431, "learning_rate": 2.80471536428474e-06, "epoch": 0.4880453309992168, "percentage": 48.81, "elapsed_time": "16:43:31", "remaining_time": "17:32:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5298, "total_steps": 10853, "loss": 0.147, "learning_rate": 2.8039592470422096e-06, "epoch": 0.48813746717648687, "percentage": 48.82, "elapsed_time": "16:43:43", "remaining_time": "17:32:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5299, "total_steps": 10853, "loss": 0.1493, "learning_rate": 2.8032031015770296e-06, "epoch": 0.48822960335375687, "percentage": 48.83, "elapsed_time": "16:43:55", "remaining_time": "17:32:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5300, "total_steps": 10853, "loss": 0.1383, "learning_rate": 2.8024469279594102e-06, "epoch": 0.48832173953102687, "percentage": 48.83, "elapsed_time": "16:44:06", "remaining_time": "17:32:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5301, "total_steps": 10853, "loss": 0.1333, "learning_rate": 2.80169072625956e-06, "epoch": 0.48841387570829686, "percentage": 48.84, "elapsed_time": "16:44:15", "remaining_time": "17:31:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5302, "total_steps": 10853, "loss": 0.134, "learning_rate": 2.8009344965476935e-06, "epoch": 0.48850601188556686, "percentage": 48.85, "elapsed_time": "16:44:24", "remaining_time": "17:31:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5303, "total_steps": 10853, "loss": 0.1547, "learning_rate": 2.8001782388940267e-06, "epoch": 0.48859814806283686, "percentage": 48.86, "elapsed_time": "16:44:36", "remaining_time": "17:31:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5304, "total_steps": 10853, "loss": 0.1417, "learning_rate": 2.7994219533687784e-06, "epoch": 0.48869028424010685, "percentage": 48.87, "elapsed_time": "16:44:45", "remaining_time": "17:31:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5305, "total_steps": 10853, "loss": 0.1372, "learning_rate": 2.79866564004217e-06, "epoch": 0.4887824204173769, "percentage": 48.88, "elapsed_time": "16:44:57", "remaining_time": "17:30:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5306, "total_steps": 10853, "loss": 0.1501, "learning_rate": 2.797909298984424e-06, "epoch": 0.4888745565946469, "percentage": 48.89, "elapsed_time": "16:45:08", "remaining_time": "17:30:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5307, "total_steps": 10853, "loss": 0.143, "learning_rate": 2.797152930265767e-06, "epoch": 0.4889666927719169, "percentage": 48.9, "elapsed_time": "16:45:19", "remaining_time": "17:30:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5308, "total_steps": 10853, "loss": 0.1418, "learning_rate": 2.796396533956429e-06, "epoch": 0.4890588289491869, "percentage": 48.91, "elapsed_time": "16:45:29", "remaining_time": "17:30:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5309, "total_steps": 10853, "loss": 0.1504, "learning_rate": 2.7956401101266407e-06, "epoch": 0.4891509651264569, "percentage": 48.92, "elapsed_time": "16:45:40", "remaining_time": "17:30:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5310, "total_steps": 10853, "loss": 0.1456, "learning_rate": 2.7948836588466373e-06, "epoch": 0.4892431013037269, "percentage": 48.93, "elapsed_time": "16:45:51", "remaining_time": "17:29:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5311, "total_steps": 10853, "loss": 0.1401, "learning_rate": 2.794127180186653e-06, "epoch": 0.4893352374809969, "percentage": 48.94, "elapsed_time": "16:46:02", "remaining_time": "17:29:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5312, "total_steps": 10853, "loss": 0.1482, "learning_rate": 2.7933706742169297e-06, "epoch": 0.48942737365826694, "percentage": 48.94, "elapsed_time": "16:46:13", "remaining_time": "17:29:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5313, "total_steps": 10853, "loss": 0.1437, "learning_rate": 2.792614141007707e-06, "epoch": 0.48951950983553694, "percentage": 48.95, "elapsed_time": "16:46:22", "remaining_time": "17:29:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5314, "total_steps": 10853, "loss": 0.1432, "learning_rate": 2.7918575806292305e-06, "epoch": 0.48961164601280693, "percentage": 48.96, "elapsed_time": "16:46:33", "remaining_time": "17:29:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5315, "total_steps": 10853, "loss": 0.1449, "learning_rate": 2.791100993151745e-06, "epoch": 0.48970378219007693, "percentage": 48.97, "elapsed_time": "16:46:43", "remaining_time": "17:28:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5316, "total_steps": 10853, "loss": 0.1503, "learning_rate": 2.790344378645502e-06, "epoch": 0.4897959183673469, "percentage": 48.98, "elapsed_time": "16:46:53", "remaining_time": "17:28:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5317, "total_steps": 10853, "loss": 0.1546, "learning_rate": 2.7895877371807516e-06, "epoch": 0.4898880545446169, "percentage": 48.99, "elapsed_time": "16:47:05", "remaining_time": "17:28:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5318, "total_steps": 10853, "loss": 0.1412, "learning_rate": 2.7888310688277493e-06, "epoch": 0.4899801907218869, "percentage": 49.0, "elapsed_time": "16:47:17", "remaining_time": "17:28:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5319, "total_steps": 10853, "loss": 0.141, "learning_rate": 2.7880743736567505e-06, "epoch": 0.490072326899157, "percentage": 49.01, "elapsed_time": "16:47:28", "remaining_time": "17:28:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5320, "total_steps": 10853, "loss": 0.1545, "learning_rate": 2.7873176517380157e-06, "epoch": 0.49016446307642697, "percentage": 49.02, "elapsed_time": "16:47:39", "remaining_time": "17:28:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5321, "total_steps": 10853, "loss": 0.1348, "learning_rate": 2.786560903141805e-06, "epoch": 0.49025659925369697, "percentage": 49.03, "elapsed_time": "16:47:50", "remaining_time": "17:27:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5322, "total_steps": 10853, "loss": 0.1457, "learning_rate": 2.7858041279383854e-06, "epoch": 0.49034873543096696, "percentage": 49.04, "elapsed_time": "16:48:00", "remaining_time": "17:27:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5323, "total_steps": 10853, "loss": 0.1396, "learning_rate": 2.7850473261980197e-06, "epoch": 0.49044087160823696, "percentage": 49.05, "elapsed_time": "16:48:11", "remaining_time": "17:27:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5324, "total_steps": 10853, "loss": 0.1548, "learning_rate": 2.78429049799098e-06, "epoch": 0.49053300778550696, "percentage": 49.06, "elapsed_time": "16:48:22", "remaining_time": "17:27:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5325, "total_steps": 10853, "loss": 0.1438, "learning_rate": 2.783533643387537e-06, "epoch": 0.490625143962777, "percentage": 49.06, "elapsed_time": "16:48:32", "remaining_time": "17:26:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5326, "total_steps": 10853, "loss": 0.1307, "learning_rate": 2.7827767624579645e-06, "epoch": 0.490717280140047, "percentage": 49.07, "elapsed_time": "16:48:42", "remaining_time": "17:26:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5327, "total_steps": 10853, "loss": 0.1478, "learning_rate": 2.7820198552725404e-06, "epoch": 0.490809416317317, "percentage": 49.08, "elapsed_time": "16:48:52", "remaining_time": "17:26:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5328, "total_steps": 10853, "loss": 0.1323, "learning_rate": 2.781262921901541e-06, "epoch": 0.490901552494587, "percentage": 49.09, "elapsed_time": "16:49:02", "remaining_time": "17:26:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5329, "total_steps": 10853, "loss": 0.1403, "learning_rate": 2.780505962415249e-06, "epoch": 0.490993688671857, "percentage": 49.1, "elapsed_time": "16:49:12", "remaining_time": "17:26:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5330, "total_steps": 10853, "loss": 0.1419, "learning_rate": 2.779748976883949e-06, "epoch": 0.491085824849127, "percentage": 49.11, "elapsed_time": "16:49:24", "remaining_time": "17:25:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5331, "total_steps": 10853, "loss": 0.1374, "learning_rate": 2.7789919653779257e-06, "epoch": 0.491177961026397, "percentage": 49.12, "elapsed_time": "16:49:35", "remaining_time": "17:25:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5332, "total_steps": 10853, "loss": 0.1587, "learning_rate": 2.7782349279674684e-06, "epoch": 0.49127009720366704, "percentage": 49.13, "elapsed_time": "16:49:46", "remaining_time": "17:25:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5333, "total_steps": 10853, "loss": 0.1406, "learning_rate": 2.7774778647228688e-06, "epoch": 0.49136223338093704, "percentage": 49.14, "elapsed_time": "16:49:56", "remaining_time": "17:25:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5334, "total_steps": 10853, "loss": 0.1417, "learning_rate": 2.7767207757144186e-06, "epoch": 0.49145436955820704, "percentage": 49.15, "elapsed_time": "16:50:07", "remaining_time": "17:25:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5335, "total_steps": 10853, "loss": 0.142, "learning_rate": 2.7759636610124158e-06, "epoch": 0.49154650573547704, "percentage": 49.16, "elapsed_time": "16:50:18", "remaining_time": "17:24:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5336, "total_steps": 10853, "loss": 0.1375, "learning_rate": 2.7752065206871564e-06, "epoch": 0.49163864191274703, "percentage": 49.17, "elapsed_time": "16:50:27", "remaining_time": "17:24:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5337, "total_steps": 10853, "loss": 0.1304, "learning_rate": 2.7744493548089425e-06, "epoch": 0.49173077809001703, "percentage": 49.18, "elapsed_time": "16:50:37", "remaining_time": "17:24:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5338, "total_steps": 10853, "loss": 0.1346, "learning_rate": 2.773692163448076e-06, "epoch": 0.491822914267287, "percentage": 49.18, "elapsed_time": "16:50:46", "remaining_time": "17:24:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5339, "total_steps": 10853, "loss": 0.1347, "learning_rate": 2.7729349466748634e-06, "epoch": 0.4919150504445571, "percentage": 49.19, "elapsed_time": "16:50:58", "remaining_time": "17:24:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5340, "total_steps": 10853, "loss": 0.1553, "learning_rate": 2.772177704559611e-06, "epoch": 0.4920071866218271, "percentage": 49.2, "elapsed_time": "16:51:08", "remaining_time": "17:23:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5341, "total_steps": 10853, "loss": 0.148, "learning_rate": 2.7714204371726293e-06, "epoch": 0.49209932279909707, "percentage": 49.21, "elapsed_time": "16:51:19", "remaining_time": "17:23:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5342, "total_steps": 10853, "loss": 0.1315, "learning_rate": 2.770663144584231e-06, "epoch": 0.49219145897636707, "percentage": 49.22, "elapsed_time": "16:51:28", "remaining_time": "17:23:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5343, "total_steps": 10853, "loss": 0.1541, "learning_rate": 2.769905826864731e-06, "epoch": 0.49228359515363707, "percentage": 49.23, "elapsed_time": "16:51:39", "remaining_time": "17:23:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5344, "total_steps": 10853, "loss": 0.1323, "learning_rate": 2.769148484084445e-06, "epoch": 0.49237573133090706, "percentage": 49.24, "elapsed_time": "16:51:51", "remaining_time": "17:23:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5345, "total_steps": 10853, "loss": 0.1356, "learning_rate": 2.7683911163136944e-06, "epoch": 0.49246786750817706, "percentage": 49.25, "elapsed_time": "16:52:01", "remaining_time": "17:22:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5346, "total_steps": 10853, "loss": 0.1327, "learning_rate": 2.767633723622799e-06, "epoch": 0.4925600036854471, "percentage": 49.26, "elapsed_time": "16:52:12", "remaining_time": "17:22:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5347, "total_steps": 10853, "loss": 0.1397, "learning_rate": 2.7668763060820842e-06, "epoch": 0.4926521398627171, "percentage": 49.27, "elapsed_time": "16:52:23", "remaining_time": "17:22:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5348, "total_steps": 10853, "loss": 0.1432, "learning_rate": 2.7661188637618752e-06, "epoch": 0.4927442760399871, "percentage": 49.28, "elapsed_time": "16:52:34", "remaining_time": "17:22:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5349, "total_steps": 10853, "loss": 0.1452, "learning_rate": 2.7653613967325018e-06, "epoch": 0.4928364122172571, "percentage": 49.29, "elapsed_time": "16:52:44", "remaining_time": "17:22:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5350, "total_steps": 10853, "loss": 0.141, "learning_rate": 2.7646039050642926e-06, "epoch": 0.4929285483945271, "percentage": 49.3, "elapsed_time": "16:52:55", "remaining_time": "17:21:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5351, "total_steps": 10853, "loss": 0.1323, "learning_rate": 2.763846388827584e-06, "epoch": 0.4930206845717971, "percentage": 49.3, "elapsed_time": "16:53:07", "remaining_time": "17:21:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5352, "total_steps": 10853, "loss": 0.143, "learning_rate": 2.7630888480927082e-06, "epoch": 0.49311282074906715, "percentage": 49.31, "elapsed_time": "16:53:17", "remaining_time": "17:21:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5353, "total_steps": 10853, "loss": 0.1317, "learning_rate": 2.7623312829300053e-06, "epoch": 0.49320495692633715, "percentage": 49.32, "elapsed_time": "16:53:28", "remaining_time": "17:21:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5354, "total_steps": 10853, "loss": 0.1598, "learning_rate": 2.7615736934098146e-06, "epoch": 0.49329709310360714, "percentage": 49.33, "elapsed_time": "16:53:38", "remaining_time": "17:21:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5355, "total_steps": 10853, "loss": 0.146, "learning_rate": 2.760816079602478e-06, "epoch": 0.49338922928087714, "percentage": 49.34, "elapsed_time": "16:53:49", "remaining_time": "17:20:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5356, "total_steps": 10853, "loss": 0.1339, "learning_rate": 2.760058441578341e-06, "epoch": 0.49348136545814714, "percentage": 49.35, "elapsed_time": "16:53:59", "remaining_time": "17:20:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5357, "total_steps": 10853, "loss": 0.1279, "learning_rate": 2.7593007794077493e-06, "epoch": 0.49357350163541713, "percentage": 49.36, "elapsed_time": "16:54:09", "remaining_time": "17:20:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5358, "total_steps": 10853, "loss": 0.1336, "learning_rate": 2.7585430931610526e-06, "epoch": 0.49366563781268713, "percentage": 49.37, "elapsed_time": "16:54:20", "remaining_time": "17:20:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5359, "total_steps": 10853, "loss": 0.133, "learning_rate": 2.7577853829086014e-06, "epoch": 0.4937577739899572, "percentage": 49.38, "elapsed_time": "16:54:30", "remaining_time": "17:20:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5360, "total_steps": 10853, "loss": 0.1546, "learning_rate": 2.7570276487207504e-06, "epoch": 0.4938499101672272, "percentage": 49.39, "elapsed_time": "16:54:41", "remaining_time": "17:19:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5361, "total_steps": 10853, "loss": 0.1281, "learning_rate": 2.7562698906678537e-06, "epoch": 0.4939420463444972, "percentage": 49.4, "elapsed_time": "16:54:51", "remaining_time": "17:19:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5362, "total_steps": 10853, "loss": 0.1499, "learning_rate": 2.755512108820271e-06, "epoch": 0.4940341825217672, "percentage": 49.41, "elapsed_time": "16:55:02", "remaining_time": "17:19:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5363, "total_steps": 10853, "loss": 0.1268, "learning_rate": 2.7547543032483604e-06, "epoch": 0.49412631869903717, "percentage": 49.41, "elapsed_time": "16:55:12", "remaining_time": "17:19:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5364, "total_steps": 10853, "loss": 0.1355, "learning_rate": 2.753996474022486e-06, "epoch": 0.49421845487630717, "percentage": 49.42, "elapsed_time": "16:55:23", "remaining_time": "17:19:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5365, "total_steps": 10853, "loss": 0.1412, "learning_rate": 2.753238621213012e-06, "epoch": 0.49431059105357716, "percentage": 49.43, "elapsed_time": "16:55:34", "remaining_time": "17:18:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5366, "total_steps": 10853, "loss": 0.1555, "learning_rate": 2.752480744890304e-06, "epoch": 0.4944027272308472, "percentage": 49.44, "elapsed_time": "16:55:44", "remaining_time": "17:18:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5367, "total_steps": 10853, "loss": 0.1392, "learning_rate": 2.751722845124732e-06, "epoch": 0.4944948634081172, "percentage": 49.45, "elapsed_time": "16:55:54", "remaining_time": "17:18:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5368, "total_steps": 10853, "loss": 0.1488, "learning_rate": 2.750964921986667e-06, "epoch": 0.4945869995853872, "percentage": 49.46, "elapsed_time": "16:56:05", "remaining_time": "17:18:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5369, "total_steps": 10853, "loss": 0.1361, "learning_rate": 2.750206975546481e-06, "epoch": 0.4946791357626572, "percentage": 49.47, "elapsed_time": "16:56:17", "remaining_time": "17:18:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5370, "total_steps": 10853, "loss": 0.1425, "learning_rate": 2.7494490058745514e-06, "epoch": 0.4947712719399272, "percentage": 49.48, "elapsed_time": "16:56:28", "remaining_time": "17:17:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5371, "total_steps": 10853, "loss": 0.1505, "learning_rate": 2.7486910130412543e-06, "epoch": 0.4948634081171972, "percentage": 49.49, "elapsed_time": "16:56:38", "remaining_time": "17:17:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5372, "total_steps": 10853, "loss": 0.1312, "learning_rate": 2.74793299711697e-06, "epoch": 0.4949555442944672, "percentage": 49.5, "elapsed_time": "16:56:50", "remaining_time": "17:17:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5373, "total_steps": 10853, "loss": 0.1349, "learning_rate": 2.747174958172081e-06, "epoch": 0.49504768047173725, "percentage": 49.51, "elapsed_time": "16:57:00", "remaining_time": "17:17:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5374, "total_steps": 10853, "loss": 0.1314, "learning_rate": 2.7464168962769696e-06, "epoch": 0.49513981664900725, "percentage": 49.52, "elapsed_time": "16:57:11", "remaining_time": "17:17:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5375, "total_steps": 10853, "loss": 0.1363, "learning_rate": 2.745658811502023e-06, "epoch": 0.49523195282627724, "percentage": 49.53, "elapsed_time": "16:57:21", "remaining_time": "17:16:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5376, "total_steps": 10853, "loss": 0.1473, "learning_rate": 2.7449007039176296e-06, "epoch": 0.49532408900354724, "percentage": 49.53, "elapsed_time": "16:57:32", "remaining_time": "17:16:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5377, "total_steps": 10853, "loss": 0.1443, "learning_rate": 2.7441425735941787e-06, "epoch": 0.49541622518081724, "percentage": 49.54, "elapsed_time": "16:57:43", "remaining_time": "17:16:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5378, "total_steps": 10853, "loss": 0.1395, "learning_rate": 2.7433844206020643e-06, "epoch": 0.49550836135808723, "percentage": 49.55, "elapsed_time": "16:57:54", "remaining_time": "17:16:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5379, "total_steps": 10853, "loss": 0.1301, "learning_rate": 2.7426262450116798e-06, "epoch": 0.49560049753535723, "percentage": 49.56, "elapsed_time": "16:58:05", "remaining_time": "17:16:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5380, "total_steps": 10853, "loss": 0.141, "learning_rate": 2.7418680468934227e-06, "epoch": 0.4956926337126273, "percentage": 49.57, "elapsed_time": "16:58:16", "remaining_time": "17:15:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5381, "total_steps": 10853, "loss": 0.1474, "learning_rate": 2.7411098263176917e-06, "epoch": 0.4957847698898973, "percentage": 49.58, "elapsed_time": "16:58:28", "remaining_time": "17:15:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5382, "total_steps": 10853, "loss": 0.1466, "learning_rate": 2.740351583354886e-06, "epoch": 0.4958769060671673, "percentage": 49.59, "elapsed_time": "16:58:38", "remaining_time": "17:15:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5383, "total_steps": 10853, "loss": 0.1511, "learning_rate": 2.739593318075412e-06, "epoch": 0.4959690422444373, "percentage": 49.6, "elapsed_time": "16:58:49", "remaining_time": "17:15:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5384, "total_steps": 10853, "loss": 0.1531, "learning_rate": 2.7388350305496708e-06, "epoch": 0.49606117842170727, "percentage": 49.61, "elapsed_time": "16:58:58", "remaining_time": "17:15:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5385, "total_steps": 10853, "loss": 0.1335, "learning_rate": 2.7380767208480726e-06, "epoch": 0.49615331459897727, "percentage": 49.62, "elapsed_time": "16:59:09", "remaining_time": "17:14:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5386, "total_steps": 10853, "loss": 0.1266, "learning_rate": 2.7373183890410245e-06, "epoch": 0.4962454507762473, "percentage": 49.63, "elapsed_time": "16:59:20", "remaining_time": "17:14:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5387, "total_steps": 10853, "loss": 0.139, "learning_rate": 2.7365600351989386e-06, "epoch": 0.4963375869535173, "percentage": 49.64, "elapsed_time": "16:59:31", "remaining_time": "17:14:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5388, "total_steps": 10853, "loss": 0.147, "learning_rate": 2.7358016593922283e-06, "epoch": 0.4964297231307873, "percentage": 49.65, "elapsed_time": "16:59:41", "remaining_time": "17:14:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5389, "total_steps": 10853, "loss": 0.1345, "learning_rate": 2.7350432616913083e-06, "epoch": 0.4965218593080573, "percentage": 49.65, "elapsed_time": "16:59:53", "remaining_time": "17:14:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5390, "total_steps": 10853, "loss": 0.1558, "learning_rate": 2.734284842166596e-06, "epoch": 0.4966139954853273, "percentage": 49.66, "elapsed_time": "17:00:03", "remaining_time": "17:13:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5391, "total_steps": 10853, "loss": 0.1562, "learning_rate": 2.733526400888511e-06, "epoch": 0.4967061316625973, "percentage": 49.67, "elapsed_time": "17:00:14", "remaining_time": "17:13:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5392, "total_steps": 10853, "loss": 0.1365, "learning_rate": 2.732767937927474e-06, "epoch": 0.4967982678398673, "percentage": 49.68, "elapsed_time": "17:00:25", "remaining_time": "17:13:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5393, "total_steps": 10853, "loss": 0.1372, "learning_rate": 2.73200945335391e-06, "epoch": 0.49689040401713735, "percentage": 49.69, "elapsed_time": "17:00:35", "remaining_time": "17:13:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5394, "total_steps": 10853, "loss": 0.151, "learning_rate": 2.7312509472382425e-06, "epoch": 0.49698254019440735, "percentage": 49.7, "elapsed_time": "17:00:47", "remaining_time": "17:13:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5395, "total_steps": 10853, "loss": 0.125, "learning_rate": 2.7304924196509004e-06, "epoch": 0.49707467637167735, "percentage": 49.71, "elapsed_time": "17:00:57", "remaining_time": "17:12:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5396, "total_steps": 10853, "loss": 0.1392, "learning_rate": 2.7297338706623113e-06, "epoch": 0.49716681254894735, "percentage": 49.72, "elapsed_time": "17:01:08", "remaining_time": "17:12:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5397, "total_steps": 10853, "loss": 0.1349, "learning_rate": 2.728975300342909e-06, "epoch": 0.49725894872621734, "percentage": 49.73, "elapsed_time": "17:01:19", "remaining_time": "17:12:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5398, "total_steps": 10853, "loss": 0.1487, "learning_rate": 2.7282167087631234e-06, "epoch": 0.49735108490348734, "percentage": 49.74, "elapsed_time": "17:01:30", "remaining_time": "17:12:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5399, "total_steps": 10853, "loss": 0.1452, "learning_rate": 2.7274580959933933e-06, "epoch": 0.49744322108075734, "percentage": 49.75, "elapsed_time": "17:01:41", "remaining_time": "17:12:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5400, "total_steps": 10853, "loss": 0.1327, "learning_rate": 2.726699462104154e-06, "epoch": 0.4975353572580274, "percentage": 49.76, "elapsed_time": "17:01:52", "remaining_time": "17:11:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5401, "total_steps": 10853, "loss": 0.1439, "learning_rate": 2.7259408071658456e-06, "epoch": 0.4976274934352974, "percentage": 49.77, "elapsed_time": "17:02:02", "remaining_time": "17:11:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5402, "total_steps": 10853, "loss": 0.1409, "learning_rate": 2.725182131248909e-06, "epoch": 0.4977196296125674, "percentage": 49.77, "elapsed_time": "17:02:12", "remaining_time": "17:11:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5403, "total_steps": 10853, "loss": 0.1477, "learning_rate": 2.724423434423787e-06, "epoch": 0.4978117657898374, "percentage": 49.78, "elapsed_time": "17:02:23", "remaining_time": "17:11:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5404, "total_steps": 10853, "loss": 0.1345, "learning_rate": 2.7236647167609246e-06, "epoch": 0.4979039019671074, "percentage": 49.79, "elapsed_time": "17:02:33", "remaining_time": "17:11:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5405, "total_steps": 10853, "loss": 0.1501, "learning_rate": 2.7229059783307703e-06, "epoch": 0.4979960381443774, "percentage": 49.8, "elapsed_time": "17:02:45", "remaining_time": "17:10:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5406, "total_steps": 10853, "loss": 0.1408, "learning_rate": 2.7221472192037707e-06, "epoch": 0.49808817432164737, "percentage": 49.81, "elapsed_time": "17:02:55", "remaining_time": "17:10:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5407, "total_steps": 10853, "loss": 0.1447, "learning_rate": 2.721388439450379e-06, "epoch": 0.4981803104989174, "percentage": 49.82, "elapsed_time": "17:03:07", "remaining_time": "17:10:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5408, "total_steps": 10853, "loss": 0.1448, "learning_rate": 2.7206296391410457e-06, "epoch": 0.4982724466761874, "percentage": 49.83, "elapsed_time": "17:03:17", "remaining_time": "17:10:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5409, "total_steps": 10853, "loss": 0.1367, "learning_rate": 2.7198708183462275e-06, "epoch": 0.4983645828534574, "percentage": 49.84, "elapsed_time": "17:03:28", "remaining_time": "17:10:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5410, "total_steps": 10853, "loss": 0.1422, "learning_rate": 2.71911197713638e-06, "epoch": 0.4984567190307274, "percentage": 49.85, "elapsed_time": "17:03:39", "remaining_time": "17:09:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5411, "total_steps": 10853, "loss": 0.1421, "learning_rate": 2.7183531155819607e-06, "epoch": 0.4985488552079974, "percentage": 49.86, "elapsed_time": "17:03:49", "remaining_time": "17:09:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5412, "total_steps": 10853, "loss": 0.1242, "learning_rate": 2.7175942337534326e-06, "epoch": 0.4986409913852674, "percentage": 49.87, "elapsed_time": "17:04:01", "remaining_time": "17:09:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5413, "total_steps": 10853, "loss": 0.1435, "learning_rate": 2.7168353317212565e-06, "epoch": 0.4987331275625374, "percentage": 49.88, "elapsed_time": "17:04:10", "remaining_time": "17:09:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5414, "total_steps": 10853, "loss": 0.1385, "learning_rate": 2.7160764095558954e-06, "epoch": 0.49882526373980746, "percentage": 49.88, "elapsed_time": "17:04:22", "remaining_time": "17:09:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5415, "total_steps": 10853, "loss": 0.139, "learning_rate": 2.7153174673278174e-06, "epoch": 0.49891739991707745, "percentage": 49.89, "elapsed_time": "17:04:33", "remaining_time": "17:08:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5416, "total_steps": 10853, "loss": 0.1388, "learning_rate": 2.7145585051074893e-06, "epoch": 0.49900953609434745, "percentage": 49.9, "elapsed_time": "17:04:44", "remaining_time": "17:08:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5417, "total_steps": 10853, "loss": 0.1457, "learning_rate": 2.7137995229653803e-06, "epoch": 0.49910167227161745, "percentage": 49.91, "elapsed_time": "17:04:54", "remaining_time": "17:08:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5418, "total_steps": 10853, "loss": 0.1307, "learning_rate": 2.7130405209719637e-06, "epoch": 0.49919380844888744, "percentage": 49.92, "elapsed_time": "17:05:06", "remaining_time": "17:08:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5419, "total_steps": 10853, "loss": 0.1405, "learning_rate": 2.7122814991977104e-06, "epoch": 0.49928594462615744, "percentage": 49.93, "elapsed_time": "17:05:18", "remaining_time": "17:08:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5420, "total_steps": 10853, "loss": 0.1334, "learning_rate": 2.711522457713098e-06, "epoch": 0.4993780808034275, "percentage": 49.94, "elapsed_time": "17:05:28", "remaining_time": "17:07:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5421, "total_steps": 10853, "loss": 0.1307, "learning_rate": 2.710763396588602e-06, "epoch": 0.4994702169806975, "percentage": 49.95, "elapsed_time": "17:05:39", "remaining_time": "17:07:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5422, "total_steps": 10853, "loss": 0.1405, "learning_rate": 2.7100043158947027e-06, "epoch": 0.4995623531579675, "percentage": 49.96, "elapsed_time": "17:05:49", "remaining_time": "17:07:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5423, "total_steps": 10853, "loss": 0.1536, "learning_rate": 2.7092452157018795e-06, "epoch": 0.4996544893352375, "percentage": 49.97, "elapsed_time": "17:06:00", "remaining_time": "17:07:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5424, "total_steps": 10853, "loss": 0.1362, "learning_rate": 2.708486096080616e-06, "epoch": 0.4997466255125075, "percentage": 49.98, "elapsed_time": "17:06:10", "remaining_time": "17:07:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5425, "total_steps": 10853, "loss": 0.1311, "learning_rate": 2.7077269571013947e-06, "epoch": 0.4998387616897775, "percentage": 49.99, "elapsed_time": "17:06:21", "remaining_time": "17:06:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5426, "total_steps": 10853, "loss": 0.1466, "learning_rate": 2.7069677988347048e-06, "epoch": 0.4999308978670475, "percentage": 50.0, "elapsed_time": "17:06:31", "remaining_time": "17:06:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5427, "total_steps": 10853, "loss": 0.1392, "learning_rate": 2.7062086213510315e-06, "epoch": 0.5000230340443175, "percentage": 50.0, "elapsed_time": "17:06:42", "remaining_time": "17:06:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5428, "total_steps": 10853, "loss": 0.1393, "learning_rate": 2.705449424720866e-06, "epoch": 0.5001151702215875, "percentage": 50.01, "elapsed_time": "17:06:52", "remaining_time": "17:06:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5429, "total_steps": 10853, "loss": 0.1332, "learning_rate": 2.7046902090146986e-06, "epoch": 0.5002073063988575, "percentage": 50.02, "elapsed_time": "17:07:02", "remaining_time": "17:06:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5430, "total_steps": 10853, "loss": 0.1257, "learning_rate": 2.703930974303024e-06, "epoch": 0.5002994425761275, "percentage": 50.03, "elapsed_time": "17:07:13", "remaining_time": "17:05:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5431, "total_steps": 10853, "loss": 0.1377, "learning_rate": 2.703171720656336e-06, "epoch": 0.5003915787533976, "percentage": 50.04, "elapsed_time": "17:07:24", "remaining_time": "17:05:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5432, "total_steps": 10853, "loss": 0.1342, "learning_rate": 2.7024124481451323e-06, "epoch": 0.5004837149306676, "percentage": 50.05, "elapsed_time": "17:07:34", "remaining_time": "17:05:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5433, "total_steps": 10853, "loss": 0.1407, "learning_rate": 2.701653156839911e-06, "epoch": 0.5005758511079376, "percentage": 50.06, "elapsed_time": "17:07:45", "remaining_time": "17:05:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5434, "total_steps": 10853, "loss": 0.1474, "learning_rate": 2.700893846811172e-06, "epoch": 0.5006679872852076, "percentage": 50.07, "elapsed_time": "17:07:57", "remaining_time": "17:05:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5435, "total_steps": 10853, "loss": 0.1483, "learning_rate": 2.700134518129418e-06, "epoch": 0.5007601234624776, "percentage": 50.08, "elapsed_time": "17:08:09", "remaining_time": "17:04:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5436, "total_steps": 10853, "loss": 0.1331, "learning_rate": 2.699375170865152e-06, "epoch": 0.5008522596397476, "percentage": 50.09, "elapsed_time": "17:08:20", "remaining_time": "17:04:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5437, "total_steps": 10853, "loss": 0.1182, "learning_rate": 2.6986158050888804e-06, "epoch": 0.5009443958170176, "percentage": 50.1, "elapsed_time": "17:08:31", "remaining_time": "17:04:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5438, "total_steps": 10853, "loss": 0.138, "learning_rate": 2.6978564208711098e-06, "epoch": 0.5010365319942875, "percentage": 50.11, "elapsed_time": "17:08:42", "remaining_time": "17:04:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5439, "total_steps": 10853, "loss": 0.1225, "learning_rate": 2.697097018282349e-06, "epoch": 0.5011286681715575, "percentage": 50.12, "elapsed_time": "17:08:52", "remaining_time": "17:04:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5440, "total_steps": 10853, "loss": 0.1456, "learning_rate": 2.6963375973931095e-06, "epoch": 0.5012208043488275, "percentage": 50.12, "elapsed_time": "17:09:02", "remaining_time": "17:03:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5441, "total_steps": 10853, "loss": 0.1421, "learning_rate": 2.6955781582739028e-06, "epoch": 0.5013129405260975, "percentage": 50.13, "elapsed_time": "17:09:14", "remaining_time": "17:03:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5442, "total_steps": 10853, "loss": 0.1469, "learning_rate": 2.6948187009952426e-06, "epoch": 0.5014050767033675, "percentage": 50.14, "elapsed_time": "17:09:26", "remaining_time": "17:03:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5443, "total_steps": 10853, "loss": 0.1338, "learning_rate": 2.6940592256276455e-06, "epoch": 0.5014972128806375, "percentage": 50.15, "elapsed_time": "17:09:37", "remaining_time": "17:03:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5444, "total_steps": 10853, "loss": 0.1418, "learning_rate": 2.6932997322416276e-06, "epoch": 0.5015893490579076, "percentage": 50.16, "elapsed_time": "17:09:47", "remaining_time": "17:03:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5445, "total_steps": 10853, "loss": 0.1493, "learning_rate": 2.6925402209077096e-06, "epoch": 0.5016814852351776, "percentage": 50.17, "elapsed_time": "17:09:59", "remaining_time": "17:02:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5446, "total_steps": 10853, "loss": 0.133, "learning_rate": 2.6917806916964107e-06, "epoch": 0.5017736214124476, "percentage": 50.18, "elapsed_time": "17:10:09", "remaining_time": "17:02:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5447, "total_steps": 10853, "loss": 0.139, "learning_rate": 2.691021144678254e-06, "epoch": 0.5018657575897176, "percentage": 50.19, "elapsed_time": "17:10:20", "remaining_time": "17:02:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5448, "total_steps": 10853, "loss": 0.1487, "learning_rate": 2.690261579923764e-06, "epoch": 0.5019578937669876, "percentage": 50.2, "elapsed_time": "17:10:31", "remaining_time": "17:02:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5449, "total_steps": 10853, "loss": 0.138, "learning_rate": 2.689501997503466e-06, "epoch": 0.5020500299442576, "percentage": 50.21, "elapsed_time": "17:10:42", "remaining_time": "17:02:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5450, "total_steps": 10853, "loss": 0.1475, "learning_rate": 2.688742397487887e-06, "epoch": 0.5021421661215276, "percentage": 50.22, "elapsed_time": "17:10:54", "remaining_time": "17:02:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5451, "total_steps": 10853, "loss": 0.1432, "learning_rate": 2.6879827799475557e-06, "epoch": 0.5022343022987976, "percentage": 50.23, "elapsed_time": "17:11:05", "remaining_time": "17:01:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5452, "total_steps": 10853, "loss": 0.1456, "learning_rate": 2.6872231449530027e-06, "epoch": 0.5023264384760676, "percentage": 50.23, "elapsed_time": "17:11:14", "remaining_time": "17:01:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5453, "total_steps": 10853, "loss": 0.1537, "learning_rate": 2.686463492574761e-06, "epoch": 0.5024185746533376, "percentage": 50.24, "elapsed_time": "17:11:26", "remaining_time": "17:01:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5454, "total_steps": 10853, "loss": 0.1485, "learning_rate": 2.6857038228833644e-06, "epoch": 0.5025107108306076, "percentage": 50.25, "elapsed_time": "17:11:36", "remaining_time": "17:01:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5455, "total_steps": 10853, "loss": 0.1158, "learning_rate": 2.6849441359493474e-06, "epoch": 0.5026028470078776, "percentage": 50.26, "elapsed_time": "17:11:48", "remaining_time": "17:01:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5456, "total_steps": 10853, "loss": 0.1396, "learning_rate": 2.6841844318432476e-06, "epoch": 0.5026949831851476, "percentage": 50.27, "elapsed_time": "17:11:59", "remaining_time": "17:00:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5457, "total_steps": 10853, "loss": 0.1284, "learning_rate": 2.683424710635603e-06, "epoch": 0.5027871193624176, "percentage": 50.28, "elapsed_time": "17:12:10", "remaining_time": "17:00:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5458, "total_steps": 10853, "loss": 0.1283, "learning_rate": 2.682664972396955e-06, "epoch": 0.5028792555396877, "percentage": 50.29, "elapsed_time": "17:12:22", "remaining_time": "17:00:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5459, "total_steps": 10853, "loss": 0.1394, "learning_rate": 2.6819052171978443e-06, "epoch": 0.5029713917169577, "percentage": 50.3, "elapsed_time": "17:12:31", "remaining_time": "17:00:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5460, "total_steps": 10853, "loss": 0.1299, "learning_rate": 2.681145445108814e-06, "epoch": 0.5030635278942277, "percentage": 50.31, "elapsed_time": "17:12:43", "remaining_time": "17:00:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5461, "total_steps": 10853, "loss": 0.1446, "learning_rate": 2.6803856562004112e-06, "epoch": 0.5031556640714977, "percentage": 50.32, "elapsed_time": "17:12:53", "remaining_time": "16:59:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5462, "total_steps": 10853, "loss": 0.1287, "learning_rate": 2.6796258505431786e-06, "epoch": 0.5032478002487677, "percentage": 50.33, "elapsed_time": "17:13:02", "remaining_time": "16:59:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5463, "total_steps": 10853, "loss": 0.1397, "learning_rate": 2.6788660282076682e-06, "epoch": 0.5033399364260377, "percentage": 50.34, "elapsed_time": "17:13:12", "remaining_time": "16:59:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5464, "total_steps": 10853, "loss": 0.1333, "learning_rate": 2.6781061892644273e-06, "epoch": 0.5034320726033077, "percentage": 50.35, "elapsed_time": "17:13:22", "remaining_time": "16:59:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5465, "total_steps": 10853, "loss": 0.1392, "learning_rate": 2.6773463337840078e-06, "epoch": 0.5035242087805777, "percentage": 50.35, "elapsed_time": "17:13:33", "remaining_time": "16:58:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5466, "total_steps": 10853, "loss": 0.1554, "learning_rate": 2.676586461836962e-06, "epoch": 0.5036163449578477, "percentage": 50.36, "elapsed_time": "17:13:43", "remaining_time": "16:58:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5467, "total_steps": 10853, "loss": 0.1443, "learning_rate": 2.6758265734938444e-06, "epoch": 0.5037084811351177, "percentage": 50.37, "elapsed_time": "17:13:54", "remaining_time": "16:58:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5468, "total_steps": 10853, "loss": 0.1383, "learning_rate": 2.67506666882521e-06, "epoch": 0.5038006173123877, "percentage": 50.38, "elapsed_time": "17:14:04", "remaining_time": "16:58:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5469, "total_steps": 10853, "loss": 0.147, "learning_rate": 2.6743067479016166e-06, "epoch": 0.5038927534896577, "percentage": 50.39, "elapsed_time": "17:14:15", "remaining_time": "16:58:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5470, "total_steps": 10853, "loss": 0.1298, "learning_rate": 2.673546810793623e-06, "epoch": 0.5039848896669277, "percentage": 50.4, "elapsed_time": "17:14:26", "remaining_time": "16:57:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5471, "total_steps": 10853, "loss": 0.1472, "learning_rate": 2.6727868575717893e-06, "epoch": 0.5040770258441978, "percentage": 50.41, "elapsed_time": "17:14:37", "remaining_time": "16:57:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5472, "total_steps": 10853, "loss": 0.1291, "learning_rate": 2.6720268883066773e-06, "epoch": 0.5041691620214678, "percentage": 50.42, "elapsed_time": "17:14:48", "remaining_time": "16:57:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5473, "total_steps": 10853, "loss": 0.1502, "learning_rate": 2.6712669030688503e-06, "epoch": 0.5042612981987378, "percentage": 50.43, "elapsed_time": "17:14:58", "remaining_time": "16:57:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5474, "total_steps": 10853, "loss": 0.1463, "learning_rate": 2.6705069019288733e-06, "epoch": 0.5043534343760078, "percentage": 50.44, "elapsed_time": "17:15:09", "remaining_time": "16:57:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5475, "total_steps": 10853, "loss": 0.1598, "learning_rate": 2.6697468849573114e-06, "epoch": 0.5044455705532778, "percentage": 50.45, "elapsed_time": "17:15:22", "remaining_time": "16:57:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5476, "total_steps": 10853, "loss": 0.1521, "learning_rate": 2.6689868522247334e-06, "epoch": 0.5045377067305478, "percentage": 50.46, "elapsed_time": "17:15:32", "remaining_time": "16:56:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5477, "total_steps": 10853, "loss": 0.1385, "learning_rate": 2.668226803801708e-06, "epoch": 0.5046298429078178, "percentage": 50.47, "elapsed_time": "17:15:42", "remaining_time": "16:56:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5478, "total_steps": 10853, "loss": 0.1335, "learning_rate": 2.6674667397588056e-06, "epoch": 0.5047219790850878, "percentage": 50.47, "elapsed_time": "17:15:52", "remaining_time": "16:56:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5479, "total_steps": 10853, "loss": 0.1539, "learning_rate": 2.666706660166598e-06, "epoch": 0.5048141152623578, "percentage": 50.48, "elapsed_time": "17:16:04", "remaining_time": "16:56:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5480, "total_steps": 10853, "loss": 0.1436, "learning_rate": 2.66594656509566e-06, "epoch": 0.5049062514396278, "percentage": 50.49, "elapsed_time": "17:16:14", "remaining_time": "16:56:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5481, "total_steps": 10853, "loss": 0.131, "learning_rate": 2.665186454616565e-06, "epoch": 0.5049983876168977, "percentage": 50.5, "elapsed_time": "17:16:24", "remaining_time": "16:55:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5482, "total_steps": 10853, "loss": 0.1465, "learning_rate": 2.66442632879989e-06, "epoch": 0.5050905237941677, "percentage": 50.51, "elapsed_time": "17:16:35", "remaining_time": "16:55:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5483, "total_steps": 10853, "loss": 0.1257, "learning_rate": 2.663666187716213e-06, "epoch": 0.5051826599714377, "percentage": 50.52, "elapsed_time": "17:16:46", "remaining_time": "16:55:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5484, "total_steps": 10853, "loss": 0.1379, "learning_rate": 2.662906031436112e-06, "epoch": 0.5052747961487077, "percentage": 50.53, "elapsed_time": "17:16:56", "remaining_time": "16:55:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5485, "total_steps": 10853, "loss": 0.1457, "learning_rate": 2.662145860030169e-06, "epoch": 0.5053669323259778, "percentage": 50.54, "elapsed_time": "17:17:06", "remaining_time": "16:54:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5486, "total_steps": 10853, "loss": 0.1315, "learning_rate": 2.6613856735689656e-06, "epoch": 0.5054590685032478, "percentage": 50.55, "elapsed_time": "17:17:16", "remaining_time": "16:54:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5487, "total_steps": 10853, "loss": 0.1325, "learning_rate": 2.6606254721230845e-06, "epoch": 0.5055512046805178, "percentage": 50.56, "elapsed_time": "17:17:25", "remaining_time": "16:54:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5488, "total_steps": 10853, "loss": 0.1525, "learning_rate": 2.6598652557631123e-06, "epoch": 0.5056433408577878, "percentage": 50.57, "elapsed_time": "17:17:36", "remaining_time": "16:54:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5489, "total_steps": 10853, "loss": 0.1298, "learning_rate": 2.6591050245596322e-06, "epoch": 0.5057354770350578, "percentage": 50.58, "elapsed_time": "17:17:46", "remaining_time": "16:54:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5490, "total_steps": 10853, "loss": 0.1389, "learning_rate": 2.6583447785832343e-06, "epoch": 0.5058276132123278, "percentage": 50.59, "elapsed_time": "17:17:57", "remaining_time": "16:53:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5491, "total_steps": 10853, "loss": 0.13, "learning_rate": 2.657584517904507e-06, "epoch": 0.5059197493895978, "percentage": 50.59, "elapsed_time": "17:18:08", "remaining_time": "16:53:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5492, "total_steps": 10853, "loss": 0.1443, "learning_rate": 2.65682424259404e-06, "epoch": 0.5060118855668678, "percentage": 50.6, "elapsed_time": "17:18:19", "remaining_time": "16:53:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5493, "total_steps": 10853, "loss": 0.1368, "learning_rate": 2.6560639527224246e-06, "epoch": 0.5061040217441378, "percentage": 50.61, "elapsed_time": "17:18:30", "remaining_time": "16:53:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5494, "total_steps": 10853, "loss": 0.1528, "learning_rate": 2.6553036483602553e-06, "epoch": 0.5061961579214078, "percentage": 50.62, "elapsed_time": "17:18:41", "remaining_time": "16:53:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5495, "total_steps": 10853, "loss": 0.1417, "learning_rate": 2.6545433295781242e-06, "epoch": 0.5062882940986778, "percentage": 50.63, "elapsed_time": "17:18:53", "remaining_time": "16:52:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5496, "total_steps": 10853, "loss": 0.1406, "learning_rate": 2.65378299644663e-06, "epoch": 0.5063804302759478, "percentage": 50.64, "elapsed_time": "17:19:04", "remaining_time": "16:52:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5497, "total_steps": 10853, "loss": 0.1236, "learning_rate": 2.653022649036367e-06, "epoch": 0.5064725664532178, "percentage": 50.65, "elapsed_time": "17:19:15", "remaining_time": "16:52:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5498, "total_steps": 10853, "loss": 0.1372, "learning_rate": 2.652262287417935e-06, "epoch": 0.5065647026304878, "percentage": 50.66, "elapsed_time": "17:19:26", "remaining_time": "16:52:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5499, "total_steps": 10853, "loss": 0.1374, "learning_rate": 2.6515019116619327e-06, "epoch": 0.5066568388077579, "percentage": 50.67, "elapsed_time": "17:19:36", "remaining_time": "16:52:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5500, "total_steps": 10853, "loss": 0.1344, "learning_rate": 2.6507415218389616e-06, "epoch": 0.5067489749850279, "percentage": 50.68, "elapsed_time": "17:19:46", "remaining_time": "16:51:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5500, "total_steps": 10853, "eval_loss": 0.13985012471675873, "epoch": 0.5067489749850279, "percentage": 50.68, "elapsed_time": "17:24:46", "remaining_time": "16:56:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5501, "total_steps": 10853, "loss": 0.1325, "learning_rate": 2.649981118019625e-06, "epoch": 0.5068411111622979, "percentage": 50.69, "elapsed_time": "17:24:57", "remaining_time": "16:56:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5502, "total_steps": 10853, "loss": 0.1421, "learning_rate": 2.649220700274524e-06, "epoch": 0.5069332473395679, "percentage": 50.7, "elapsed_time": "17:25:07", "remaining_time": "16:56:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5503, "total_steps": 10853, "loss": 0.1502, "learning_rate": 2.648460268674266e-06, "epoch": 0.5070253835168379, "percentage": 50.7, "elapsed_time": "17:25:18", "remaining_time": "16:56:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5504, "total_steps": 10853, "loss": 0.1352, "learning_rate": 2.6476998232894557e-06, "epoch": 0.5071175196941079, "percentage": 50.71, "elapsed_time": "17:25:30", "remaining_time": "16:56:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5505, "total_steps": 10853, "loss": 0.1425, "learning_rate": 2.646939364190701e-06, "epoch": 0.5072096558713779, "percentage": 50.72, "elapsed_time": "17:25:41", "remaining_time": "16:55:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5506, "total_steps": 10853, "loss": 0.1458, "learning_rate": 2.6461788914486098e-06, "epoch": 0.5073017920486479, "percentage": 50.73, "elapsed_time": "17:25:53", "remaining_time": "16:55:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5507, "total_steps": 10853, "loss": 0.1581, "learning_rate": 2.6454184051337946e-06, "epoch": 0.5073939282259179, "percentage": 50.74, "elapsed_time": "17:26:05", "remaining_time": "16:55:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5508, "total_steps": 10853, "loss": 0.1316, "learning_rate": 2.644657905316863e-06, "epoch": 0.5074860644031879, "percentage": 50.75, "elapsed_time": "17:26:17", "remaining_time": "16:55:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5509, "total_steps": 10853, "loss": 0.1482, "learning_rate": 2.64389739206843e-06, "epoch": 0.5075782005804579, "percentage": 50.76, "elapsed_time": "17:26:27", "remaining_time": "16:55:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5510, "total_steps": 10853, "loss": 0.1519, "learning_rate": 2.6431368654591087e-06, "epoch": 0.5076703367577279, "percentage": 50.77, "elapsed_time": "17:26:38", "remaining_time": "16:54:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5511, "total_steps": 10853, "loss": 0.146, "learning_rate": 2.6423763255595143e-06, "epoch": 0.5077624729349979, "percentage": 50.78, "elapsed_time": "17:26:50", "remaining_time": "16:54:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5512, "total_steps": 10853, "loss": 0.1381, "learning_rate": 2.6416157724402626e-06, "epoch": 0.507854609112268, "percentage": 50.79, "elapsed_time": "17:27:01", "remaining_time": "16:54:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5513, "total_steps": 10853, "loss": 0.1371, "learning_rate": 2.640855206171971e-06, "epoch": 0.507946745289538, "percentage": 50.8, "elapsed_time": "17:27:11", "remaining_time": "16:54:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5514, "total_steps": 10853, "loss": 0.1355, "learning_rate": 2.640094626825258e-06, "epoch": 0.508038881466808, "percentage": 50.81, "elapsed_time": "17:27:21", "remaining_time": "16:54:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5515, "total_steps": 10853, "loss": 0.1459, "learning_rate": 2.6393340344707448e-06, "epoch": 0.508131017644078, "percentage": 50.82, "elapsed_time": "17:27:32", "remaining_time": "16:53:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5516, "total_steps": 10853, "loss": 0.1307, "learning_rate": 2.6385734291790506e-06, "epoch": 0.508223153821348, "percentage": 50.82, "elapsed_time": "17:27:41", "remaining_time": "16:53:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5517, "total_steps": 10853, "loss": 0.1428, "learning_rate": 2.637812811020799e-06, "epoch": 0.508315289998618, "percentage": 50.83, "elapsed_time": "17:27:51", "remaining_time": "16:53:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5518, "total_steps": 10853, "loss": 0.1323, "learning_rate": 2.6370521800666127e-06, "epoch": 0.508407426175888, "percentage": 50.84, "elapsed_time": "17:28:03", "remaining_time": "16:53:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5519, "total_steps": 10853, "loss": 0.136, "learning_rate": 2.636291536387117e-06, "epoch": 0.508499562353158, "percentage": 50.85, "elapsed_time": "17:28:12", "remaining_time": "16:53:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5520, "total_steps": 10853, "loss": 0.1356, "learning_rate": 2.6355308800529377e-06, "epoch": 0.508591698530428, "percentage": 50.86, "elapsed_time": "17:28:23", "remaining_time": "16:52:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5521, "total_steps": 10853, "loss": 0.144, "learning_rate": 2.6347702111347017e-06, "epoch": 0.508683834707698, "percentage": 50.87, "elapsed_time": "17:28:34", "remaining_time": "16:52:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5522, "total_steps": 10853, "loss": 0.1344, "learning_rate": 2.634009529703036e-06, "epoch": 0.508775970884968, "percentage": 50.88, "elapsed_time": "17:28:46", "remaining_time": "16:52:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5523, "total_steps": 10853, "loss": 0.1177, "learning_rate": 2.633248835828573e-06, "epoch": 0.508868107062238, "percentage": 50.89, "elapsed_time": "17:28:54", "remaining_time": "16:52:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5524, "total_steps": 10853, "loss": 0.1525, "learning_rate": 2.6324881295819394e-06, "epoch": 0.508960243239508, "percentage": 50.9, "elapsed_time": "17:29:06", "remaining_time": "16:52:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5525, "total_steps": 10853, "loss": 0.1277, "learning_rate": 2.6317274110337692e-06, "epoch": 0.509052379416778, "percentage": 50.91, "elapsed_time": "17:29:17", "remaining_time": "16:51:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5526, "total_steps": 10853, "loss": 0.1294, "learning_rate": 2.6309666802546953e-06, "epoch": 0.509144515594048, "percentage": 50.92, "elapsed_time": "17:29:28", "remaining_time": "16:51:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5527, "total_steps": 10853, "loss": 0.1291, "learning_rate": 2.63020593731535e-06, "epoch": 0.509236651771318, "percentage": 50.93, "elapsed_time": "17:29:39", "remaining_time": "16:51:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5528, "total_steps": 10853, "loss": 0.145, "learning_rate": 2.629445182286371e-06, "epoch": 0.509328787948588, "percentage": 50.94, "elapsed_time": "17:29:51", "remaining_time": "16:51:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5529, "total_steps": 10853, "loss": 0.1384, "learning_rate": 2.6286844152383913e-06, "epoch": 0.509420924125858, "percentage": 50.94, "elapsed_time": "17:30:01", "remaining_time": "16:51:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5530, "total_steps": 10853, "loss": 0.1403, "learning_rate": 2.6279236362420503e-06, "epoch": 0.509513060303128, "percentage": 50.95, "elapsed_time": "17:30:12", "remaining_time": "16:50:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5531, "total_steps": 10853, "loss": 0.1391, "learning_rate": 2.6271628453679865e-06, "epoch": 0.509605196480398, "percentage": 50.96, "elapsed_time": "17:30:23", "remaining_time": "16:50:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5532, "total_steps": 10853, "loss": 0.1477, "learning_rate": 2.6264020426868382e-06, "epoch": 0.509697332657668, "percentage": 50.97, "elapsed_time": "17:30:34", "remaining_time": "16:50:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5533, "total_steps": 10853, "loss": 0.1334, "learning_rate": 2.6256412282692467e-06, "epoch": 0.509789468834938, "percentage": 50.98, "elapsed_time": "17:30:44", "remaining_time": "16:50:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5534, "total_steps": 10853, "loss": 0.1312, "learning_rate": 2.6248804021858538e-06, "epoch": 0.509881605012208, "percentage": 50.99, "elapsed_time": "17:30:55", "remaining_time": "16:50:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5535, "total_steps": 10853, "loss": 0.139, "learning_rate": 2.624119564507302e-06, "epoch": 0.509973741189478, "percentage": 51.0, "elapsed_time": "17:31:05", "remaining_time": "16:49:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5536, "total_steps": 10853, "loss": 0.1279, "learning_rate": 2.6233587153042356e-06, "epoch": 0.510065877366748, "percentage": 51.01, "elapsed_time": "17:31:16", "remaining_time": "16:49:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5537, "total_steps": 10853, "loss": 0.1267, "learning_rate": 2.6225978546472985e-06, "epoch": 0.510158013544018, "percentage": 51.02, "elapsed_time": "17:31:27", "remaining_time": "16:49:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5538, "total_steps": 10853, "loss": 0.133, "learning_rate": 2.621836982607138e-06, "epoch": 0.510250149721288, "percentage": 51.03, "elapsed_time": "17:31:38", "remaining_time": "16:49:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5539, "total_steps": 10853, "loss": 0.1357, "learning_rate": 2.6210760992544004e-06, "epoch": 0.5103422858985581, "percentage": 51.04, "elapsed_time": "17:31:49", "remaining_time": "16:49:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5540, "total_steps": 10853, "loss": 0.1423, "learning_rate": 2.6203152046597343e-06, "epoch": 0.5104344220758281, "percentage": 51.05, "elapsed_time": "17:31:59", "remaining_time": "16:48:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5541, "total_steps": 10853, "loss": 0.1395, "learning_rate": 2.6195542988937882e-06, "epoch": 0.5105265582530981, "percentage": 51.06, "elapsed_time": "17:32:09", "remaining_time": "16:48:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5542, "total_steps": 10853, "loss": 0.142, "learning_rate": 2.6187933820272128e-06, "epoch": 0.5106186944303681, "percentage": 51.06, "elapsed_time": "17:32:19", "remaining_time": "16:48:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5543, "total_steps": 10853, "loss": 0.1385, "learning_rate": 2.6180324541306577e-06, "epoch": 0.5107108306076381, "percentage": 51.07, "elapsed_time": "17:32:30", "remaining_time": "16:48:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5544, "total_steps": 10853, "loss": 0.129, "learning_rate": 2.6172715152747784e-06, "epoch": 0.5108029667849081, "percentage": 51.08, "elapsed_time": "17:32:40", "remaining_time": "16:48:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5545, "total_steps": 10853, "loss": 0.1359, "learning_rate": 2.6165105655302252e-06, "epoch": 0.5108951029621781, "percentage": 51.09, "elapsed_time": "17:32:51", "remaining_time": "16:47:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5546, "total_steps": 10853, "loss": 0.1406, "learning_rate": 2.615749604967654e-06, "epoch": 0.5109872391394481, "percentage": 51.1, "elapsed_time": "17:33:04", "remaining_time": "16:47:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5547, "total_steps": 10853, "loss": 0.1361, "learning_rate": 2.614988633657719e-06, "epoch": 0.5110793753167181, "percentage": 51.11, "elapsed_time": "17:33:16", "remaining_time": "16:47:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5548, "total_steps": 10853, "loss": 0.1335, "learning_rate": 2.614227651671078e-06, "epoch": 0.5111715114939881, "percentage": 51.12, "elapsed_time": "17:33:27", "remaining_time": "16:47:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5549, "total_steps": 10853, "loss": 0.1453, "learning_rate": 2.6134666590783856e-06, "epoch": 0.5112636476712581, "percentage": 51.13, "elapsed_time": "17:33:38", "remaining_time": "16:47:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5550, "total_steps": 10853, "loss": 0.1392, "learning_rate": 2.6127056559503035e-06, "epoch": 0.5113557838485281, "percentage": 51.14, "elapsed_time": "17:33:48", "remaining_time": "16:46:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5551, "total_steps": 10853, "loss": 0.1307, "learning_rate": 2.611944642357488e-06, "epoch": 0.5114479200257981, "percentage": 51.15, "elapsed_time": "17:34:00", "remaining_time": "16:46:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5552, "total_steps": 10853, "loss": 0.1424, "learning_rate": 2.611183618370601e-06, "epoch": 0.5115400562030681, "percentage": 51.16, "elapsed_time": "17:34:11", "remaining_time": "16:46:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5553, "total_steps": 10853, "loss": 0.1447, "learning_rate": 2.6104225840603026e-06, "epoch": 0.5116321923803382, "percentage": 51.17, "elapsed_time": "17:34:22", "remaining_time": "16:46:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5554, "total_steps": 10853, "loss": 0.1294, "learning_rate": 2.609661539497255e-06, "epoch": 0.5117243285576082, "percentage": 51.17, "elapsed_time": "17:34:32", "remaining_time": "16:46:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5555, "total_steps": 10853, "loss": 0.1384, "learning_rate": 2.6089004847521227e-06, "epoch": 0.5118164647348782, "percentage": 51.18, "elapsed_time": "17:34:43", "remaining_time": "16:45:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5556, "total_steps": 10853, "loss": 0.1349, "learning_rate": 2.608139419895568e-06, "epoch": 0.5119086009121482, "percentage": 51.19, "elapsed_time": "17:34:54", "remaining_time": "16:45:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5557, "total_steps": 10853, "loss": 0.138, "learning_rate": 2.6073783449982563e-06, "epoch": 0.5120007370894182, "percentage": 51.2, "elapsed_time": "17:35:04", "remaining_time": "16:45:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5558, "total_steps": 10853, "loss": 0.1302, "learning_rate": 2.6066172601308544e-06, "epoch": 0.5120928732666882, "percentage": 51.21, "elapsed_time": "17:35:15", "remaining_time": "16:45:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5559, "total_steps": 10853, "loss": 0.1362, "learning_rate": 2.605856165364028e-06, "epoch": 0.5121850094439582, "percentage": 51.22, "elapsed_time": "17:35:27", "remaining_time": "16:45:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5560, "total_steps": 10853, "loss": 0.1289, "learning_rate": 2.6050950607684454e-06, "epoch": 0.5122771456212282, "percentage": 51.23, "elapsed_time": "17:35:38", "remaining_time": "16:44:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5561, "total_steps": 10853, "loss": 0.1369, "learning_rate": 2.6043339464147754e-06, "epoch": 0.5123692817984982, "percentage": 51.24, "elapsed_time": "17:35:50", "remaining_time": "16:44:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5562, "total_steps": 10853, "loss": 0.1531, "learning_rate": 2.603572822373686e-06, "epoch": 0.5124614179757682, "percentage": 51.25, "elapsed_time": "17:36:02", "remaining_time": "16:44:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5563, "total_steps": 10853, "loss": 0.1504, "learning_rate": 2.6028116887158503e-06, "epoch": 0.5125535541530382, "percentage": 51.26, "elapsed_time": "17:36:15", "remaining_time": "16:44:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5564, "total_steps": 10853, "loss": 0.1276, "learning_rate": 2.6020505455119375e-06, "epoch": 0.5126456903303082, "percentage": 51.27, "elapsed_time": "17:36:25", "remaining_time": "16:44:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5565, "total_steps": 10853, "loss": 0.1335, "learning_rate": 2.601289392832621e-06, "epoch": 0.5127378265075782, "percentage": 51.28, "elapsed_time": "17:36:35", "remaining_time": "16:43:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5566, "total_steps": 10853, "loss": 0.1249, "learning_rate": 2.6005282307485735e-06, "epoch": 0.5128299626848482, "percentage": 51.29, "elapsed_time": "17:36:45", "remaining_time": "16:43:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5567, "total_steps": 10853, "loss": 0.1383, "learning_rate": 2.5997670593304688e-06, "epoch": 0.5129220988621183, "percentage": 51.29, "elapsed_time": "17:36:55", "remaining_time": "16:43:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5568, "total_steps": 10853, "loss": 0.1339, "learning_rate": 2.5990058786489818e-06, "epoch": 0.5130142350393883, "percentage": 51.3, "elapsed_time": "17:37:06", "remaining_time": "16:43:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5569, "total_steps": 10853, "loss": 0.125, "learning_rate": 2.5982446887747885e-06, "epoch": 0.5131063712166583, "percentage": 51.31, "elapsed_time": "17:37:16", "remaining_time": "16:43:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5570, "total_steps": 10853, "loss": 0.141, "learning_rate": 2.5974834897785646e-06, "epoch": 0.5131985073939282, "percentage": 51.32, "elapsed_time": "17:37:26", "remaining_time": "16:42:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5571, "total_steps": 10853, "loss": 0.1276, "learning_rate": 2.5967222817309893e-06, "epoch": 0.5132906435711982, "percentage": 51.33, "elapsed_time": "17:37:36", "remaining_time": "16:42:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5572, "total_steps": 10853, "loss": 0.1456, "learning_rate": 2.5959610647027388e-06, "epoch": 0.5133827797484682, "percentage": 51.34, "elapsed_time": "17:37:48", "remaining_time": "16:42:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5573, "total_steps": 10853, "loss": 0.1424, "learning_rate": 2.595199838764493e-06, "epoch": 0.5134749159257382, "percentage": 51.35, "elapsed_time": "17:38:00", "remaining_time": "16:42:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5574, "total_steps": 10853, "loss": 0.127, "learning_rate": 2.5944386039869328e-06, "epoch": 0.5135670521030082, "percentage": 51.36, "elapsed_time": "17:38:11", "remaining_time": "16:42:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5575, "total_steps": 10853, "loss": 0.1535, "learning_rate": 2.593677360440738e-06, "epoch": 0.5136591882802782, "percentage": 51.37, "elapsed_time": "17:38:22", "remaining_time": "16:41:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5576, "total_steps": 10853, "loss": 0.1252, "learning_rate": 2.5929161081965898e-06, "epoch": 0.5137513244575482, "percentage": 51.38, "elapsed_time": "17:38:34", "remaining_time": "16:41:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5577, "total_steps": 10853, "loss": 0.1411, "learning_rate": 2.592154847325171e-06, "epoch": 0.5138434606348182, "percentage": 51.39, "elapsed_time": "17:38:45", "remaining_time": "16:41:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5578, "total_steps": 10853, "loss": 0.1363, "learning_rate": 2.5913935778971644e-06, "epoch": 0.5139355968120882, "percentage": 51.4, "elapsed_time": "17:38:56", "remaining_time": "16:41:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5579, "total_steps": 10853, "loss": 0.1401, "learning_rate": 2.590632299983255e-06, "epoch": 0.5140277329893582, "percentage": 51.41, "elapsed_time": "17:39:05", "remaining_time": "16:41:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5580, "total_steps": 10853, "loss": 0.134, "learning_rate": 2.589871013654126e-06, "epoch": 0.5141198691666283, "percentage": 51.41, "elapsed_time": "17:39:15", "remaining_time": "16:40:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5581, "total_steps": 10853, "loss": 0.1469, "learning_rate": 2.589109718980464e-06, "epoch": 0.5142120053438983, "percentage": 51.42, "elapsed_time": "17:39:27", "remaining_time": "16:40:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5582, "total_steps": 10853, "loss": 0.1255, "learning_rate": 2.5883484160329552e-06, "epoch": 0.5143041415211683, "percentage": 51.43, "elapsed_time": "17:39:36", "remaining_time": "16:40:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5583, "total_steps": 10853, "loss": 0.14, "learning_rate": 2.587587104882286e-06, "epoch": 0.5143962776984383, "percentage": 51.44, "elapsed_time": "17:39:48", "remaining_time": "16:40:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5584, "total_steps": 10853, "loss": 0.1277, "learning_rate": 2.586825785599145e-06, "epoch": 0.5144884138757083, "percentage": 51.45, "elapsed_time": "17:39:58", "remaining_time": "16:40:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5585, "total_steps": 10853, "loss": 0.1567, "learning_rate": 2.5860644582542206e-06, "epoch": 0.5145805500529783, "percentage": 51.46, "elapsed_time": "17:40:08", "remaining_time": "16:39:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5586, "total_steps": 10853, "loss": 0.1218, "learning_rate": 2.5853031229182017e-06, "epoch": 0.5146726862302483, "percentage": 51.47, "elapsed_time": "17:40:18", "remaining_time": "16:39:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5587, "total_steps": 10853, "loss": 0.1325, "learning_rate": 2.584541779661779e-06, "epoch": 0.5147648224075183, "percentage": 51.48, "elapsed_time": "17:40:30", "remaining_time": "16:39:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5588, "total_steps": 10853, "loss": 0.1309, "learning_rate": 2.583780428555643e-06, "epoch": 0.5148569585847883, "percentage": 51.49, "elapsed_time": "17:40:41", "remaining_time": "16:39:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5589, "total_steps": 10853, "loss": 0.1328, "learning_rate": 2.5830190696704843e-06, "epoch": 0.5149490947620583, "percentage": 51.5, "elapsed_time": "17:40:53", "remaining_time": "16:39:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5590, "total_steps": 10853, "loss": 0.1353, "learning_rate": 2.5822577030769972e-06, "epoch": 0.5150412309393283, "percentage": 51.51, "elapsed_time": "17:41:05", "remaining_time": "16:39:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5591, "total_steps": 10853, "loss": 0.1382, "learning_rate": 2.581496328845873e-06, "epoch": 0.5151333671165983, "percentage": 51.52, "elapsed_time": "17:41:15", "remaining_time": "16:38:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5592, "total_steps": 10853, "loss": 0.1294, "learning_rate": 2.580734947047806e-06, "epoch": 0.5152255032938683, "percentage": 51.52, "elapsed_time": "17:41:25", "remaining_time": "16:38:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5593, "total_steps": 10853, "loss": 0.1582, "learning_rate": 2.57997355775349e-06, "epoch": 0.5153176394711383, "percentage": 51.53, "elapsed_time": "17:41:37", "remaining_time": "16:38:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5594, "total_steps": 10853, "loss": 0.138, "learning_rate": 2.5792121610336215e-06, "epoch": 0.5154097756484084, "percentage": 51.54, "elapsed_time": "17:41:48", "remaining_time": "16:38:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5595, "total_steps": 10853, "loss": 0.133, "learning_rate": 2.5784507569588947e-06, "epoch": 0.5155019118256784, "percentage": 51.55, "elapsed_time": "17:41:58", "remaining_time": "16:38:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5596, "total_steps": 10853, "loss": 0.1398, "learning_rate": 2.577689345600007e-06, "epoch": 0.5155940480029484, "percentage": 51.56, "elapsed_time": "17:42:09", "remaining_time": "16:37:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5597, "total_steps": 10853, "loss": 0.1359, "learning_rate": 2.5769279270276544e-06, "epoch": 0.5156861841802184, "percentage": 51.57, "elapsed_time": "17:42:19", "remaining_time": "16:37:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5598, "total_steps": 10853, "loss": 0.1266, "learning_rate": 2.5761665013125364e-06, "epoch": 0.5157783203574884, "percentage": 51.58, "elapsed_time": "17:42:31", "remaining_time": "16:37:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5599, "total_steps": 10853, "loss": 0.1495, "learning_rate": 2.5754050685253503e-06, "epoch": 0.5158704565347584, "percentage": 51.59, "elapsed_time": "17:42:43", "remaining_time": "16:37:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5600, "total_steps": 10853, "loss": 0.1411, "learning_rate": 2.5746436287367956e-06, "epoch": 0.5159625927120284, "percentage": 51.6, "elapsed_time": "17:42:55", "remaining_time": "16:37:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5601, "total_steps": 10853, "loss": 0.1462, "learning_rate": 2.5738821820175713e-06, "epoch": 0.5160547288892984, "percentage": 51.61, "elapsed_time": "17:43:06", "remaining_time": "16:36:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5602, "total_steps": 10853, "loss": 0.1567, "learning_rate": 2.573120728438379e-06, "epoch": 0.5161468650665684, "percentage": 51.62, "elapsed_time": "17:43:16", "remaining_time": "16:36:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5603, "total_steps": 10853, "loss": 0.1141, "learning_rate": 2.5723592680699194e-06, "epoch": 0.5162390012438384, "percentage": 51.63, "elapsed_time": "17:43:25", "remaining_time": "16:36:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5604, "total_steps": 10853, "loss": 0.1252, "learning_rate": 2.5715978009828934e-06, "epoch": 0.5163311374211084, "percentage": 51.64, "elapsed_time": "17:43:36", "remaining_time": "16:36:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5605, "total_steps": 10853, "loss": 0.1471, "learning_rate": 2.5708363272480034e-06, "epoch": 0.5164232735983784, "percentage": 51.64, "elapsed_time": "17:43:48", "remaining_time": "16:36:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5606, "total_steps": 10853, "loss": 0.1462, "learning_rate": 2.5700748469359542e-06, "epoch": 0.5165154097756484, "percentage": 51.65, "elapsed_time": "17:43:59", "remaining_time": "16:35:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5607, "total_steps": 10853, "loss": 0.1435, "learning_rate": 2.569313360117447e-06, "epoch": 0.5166075459529185, "percentage": 51.66, "elapsed_time": "17:44:09", "remaining_time": "16:35:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5608, "total_steps": 10853, "loss": 0.1342, "learning_rate": 2.568551866863187e-06, "epoch": 0.5166996821301885, "percentage": 51.67, "elapsed_time": "17:44:20", "remaining_time": "16:35:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5609, "total_steps": 10853, "loss": 0.1358, "learning_rate": 2.567790367243879e-06, "epoch": 0.5167918183074585, "percentage": 51.68, "elapsed_time": "17:44:32", "remaining_time": "16:35:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5610, "total_steps": 10853, "loss": 0.1363, "learning_rate": 2.5670288613302278e-06, "epoch": 0.5168839544847285, "percentage": 51.69, "elapsed_time": "17:44:42", "remaining_time": "16:35:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5611, "total_steps": 10853, "loss": 0.131, "learning_rate": 2.56626734919294e-06, "epoch": 0.5169760906619985, "percentage": 51.7, "elapsed_time": "17:44:53", "remaining_time": "16:34:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5612, "total_steps": 10853, "loss": 0.133, "learning_rate": 2.5655058309027216e-06, "epoch": 0.5170682268392685, "percentage": 51.71, "elapsed_time": "17:45:04", "remaining_time": "16:34:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5613, "total_steps": 10853, "loss": 0.1337, "learning_rate": 2.5647443065302797e-06, "epoch": 0.5171603630165384, "percentage": 51.72, "elapsed_time": "17:45:14", "remaining_time": "16:34:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5614, "total_steps": 10853, "loss": 0.1385, "learning_rate": 2.5639827761463217e-06, "epoch": 0.5172524991938084, "percentage": 51.73, "elapsed_time": "17:45:24", "remaining_time": "16:34:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5615, "total_steps": 10853, "loss": 0.1277, "learning_rate": 2.5632212398215563e-06, "epoch": 0.5173446353710784, "percentage": 51.74, "elapsed_time": "17:45:34", "remaining_time": "16:34:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5616, "total_steps": 10853, "loss": 0.1322, "learning_rate": 2.562459697626692e-06, "epoch": 0.5174367715483484, "percentage": 51.75, "elapsed_time": "17:45:45", "remaining_time": "16:33:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5617, "total_steps": 10853, "loss": 0.1425, "learning_rate": 2.561698149632438e-06, "epoch": 0.5175289077256184, "percentage": 51.76, "elapsed_time": "17:45:55", "remaining_time": "16:33:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5618, "total_steps": 10853, "loss": 0.1314, "learning_rate": 2.560936595909504e-06, "epoch": 0.5176210439028884, "percentage": 51.76, "elapsed_time": "17:46:06", "remaining_time": "16:33:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5619, "total_steps": 10853, "loss": 0.13, "learning_rate": 2.560175036528601e-06, "epoch": 0.5177131800801584, "percentage": 51.77, "elapsed_time": "17:46:16", "remaining_time": "16:33:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5620, "total_steps": 10853, "loss": 0.136, "learning_rate": 2.5594134715604384e-06, "epoch": 0.5178053162574284, "percentage": 51.78, "elapsed_time": "17:46:28", "remaining_time": "16:33:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5621, "total_steps": 10853, "loss": 0.1416, "learning_rate": 2.5586519010757295e-06, "epoch": 0.5178974524346985, "percentage": 51.79, "elapsed_time": "17:46:39", "remaining_time": "16:32:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5622, "total_steps": 10853, "loss": 0.1449, "learning_rate": 2.557890325145185e-06, "epoch": 0.5179895886119685, "percentage": 51.8, "elapsed_time": "17:46:49", "remaining_time": "16:32:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5623, "total_steps": 10853, "loss": 0.1402, "learning_rate": 2.5571287438395175e-06, "epoch": 0.5180817247892385, "percentage": 51.81, "elapsed_time": "17:47:00", "remaining_time": "16:32:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5624, "total_steps": 10853, "loss": 0.1331, "learning_rate": 2.5563671572294396e-06, "epoch": 0.5181738609665085, "percentage": 51.82, "elapsed_time": "17:47:13", "remaining_time": "16:32:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5625, "total_steps": 10853, "loss": 0.1401, "learning_rate": 2.5556055653856667e-06, "epoch": 0.5182659971437785, "percentage": 51.83, "elapsed_time": "17:47:22", "remaining_time": "16:32:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5626, "total_steps": 10853, "loss": 0.1356, "learning_rate": 2.554843968378909e-06, "epoch": 0.5183581333210485, "percentage": 51.84, "elapsed_time": "17:47:32", "remaining_time": "16:31:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5627, "total_steps": 10853, "loss": 0.1291, "learning_rate": 2.5540823662798843e-06, "epoch": 0.5184502694983185, "percentage": 51.85, "elapsed_time": "17:47:43", "remaining_time": "16:31:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5628, "total_steps": 10853, "loss": 0.1457, "learning_rate": 2.553320759159305e-06, "epoch": 0.5185424056755885, "percentage": 51.86, "elapsed_time": "17:47:54", "remaining_time": "16:31:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5629, "total_steps": 10853, "loss": 0.1322, "learning_rate": 2.5525591470878886e-06, "epoch": 0.5186345418528585, "percentage": 51.87, "elapsed_time": "17:48:04", "remaining_time": "16:31:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5630, "total_steps": 10853, "loss": 0.1291, "learning_rate": 2.551797530136349e-06, "epoch": 0.5187266780301285, "percentage": 51.88, "elapsed_time": "17:48:15", "remaining_time": "16:31:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5631, "total_steps": 10853, "loss": 0.138, "learning_rate": 2.5510359083754038e-06, "epoch": 0.5188188142073985, "percentage": 51.88, "elapsed_time": "17:48:26", "remaining_time": "16:30:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5632, "total_steps": 10853, "loss": 0.1348, "learning_rate": 2.5502742818757683e-06, "epoch": 0.5189109503846685, "percentage": 51.89, "elapsed_time": "17:48:36", "remaining_time": "16:30:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5633, "total_steps": 10853, "loss": 0.1373, "learning_rate": 2.549512650708161e-06, "epoch": 0.5190030865619385, "percentage": 51.9, "elapsed_time": "17:48:46", "remaining_time": "16:30:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5634, "total_steps": 10853, "loss": 0.1372, "learning_rate": 2.5487510149432974e-06, "epoch": 0.5190952227392085, "percentage": 51.91, "elapsed_time": "17:48:57", "remaining_time": "16:30:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5635, "total_steps": 10853, "loss": 0.1362, "learning_rate": 2.547989374651898e-06, "epoch": 0.5191873589164786, "percentage": 51.92, "elapsed_time": "17:49:08", "remaining_time": "16:30:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5636, "total_steps": 10853, "loss": 0.1312, "learning_rate": 2.54722772990468e-06, "epoch": 0.5192794950937486, "percentage": 51.93, "elapsed_time": "17:49:20", "remaining_time": "16:29:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5637, "total_steps": 10853, "loss": 0.1393, "learning_rate": 2.546466080772362e-06, "epoch": 0.5193716312710186, "percentage": 51.94, "elapsed_time": "17:49:31", "remaining_time": "16:29:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5638, "total_steps": 10853, "loss": 0.1419, "learning_rate": 2.5457044273256635e-06, "epoch": 0.5194637674482886, "percentage": 51.95, "elapsed_time": "17:49:42", "remaining_time": "16:29:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5639, "total_steps": 10853, "loss": 0.1371, "learning_rate": 2.544942769635304e-06, "epoch": 0.5195559036255586, "percentage": 51.96, "elapsed_time": "17:49:53", "remaining_time": "16:29:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5640, "total_steps": 10853, "loss": 0.1416, "learning_rate": 2.544181107772003e-06, "epoch": 0.5196480398028286, "percentage": 51.97, "elapsed_time": "17:50:05", "remaining_time": "16:29:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5641, "total_steps": 10853, "loss": 0.1418, "learning_rate": 2.543419441806482e-06, "epoch": 0.5197401759800986, "percentage": 51.98, "elapsed_time": "17:50:16", "remaining_time": "16:28:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5642, "total_steps": 10853, "loss": 0.1266, "learning_rate": 2.5426577718094607e-06, "epoch": 0.5198323121573686, "percentage": 51.99, "elapsed_time": "17:50:27", "remaining_time": "16:28:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5643, "total_steps": 10853, "loss": 0.1409, "learning_rate": 2.541896097851661e-06, "epoch": 0.5199244483346386, "percentage": 51.99, "elapsed_time": "17:50:37", "remaining_time": "16:28:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5644, "total_steps": 10853, "loss": 0.1365, "learning_rate": 2.541134420003804e-06, "epoch": 0.5200165845119086, "percentage": 52.0, "elapsed_time": "17:50:47", "remaining_time": "16:28:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5645, "total_steps": 10853, "loss": 0.1383, "learning_rate": 2.5403727383366116e-06, "epoch": 0.5201087206891786, "percentage": 52.01, "elapsed_time": "17:50:56", "remaining_time": "16:28:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5646, "total_steps": 10853, "loss": 0.1141, "learning_rate": 2.5396110529208066e-06, "epoch": 0.5202008568664486, "percentage": 52.02, "elapsed_time": "17:51:07", "remaining_time": "16:27:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5647, "total_steps": 10853, "loss": 0.1369, "learning_rate": 2.53884936382711e-06, "epoch": 0.5202929930437186, "percentage": 52.03, "elapsed_time": "17:51:17", "remaining_time": "16:27:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5648, "total_steps": 10853, "loss": 0.1406, "learning_rate": 2.538087671126247e-06, "epoch": 0.5203851292209887, "percentage": 52.04, "elapsed_time": "17:51:28", "remaining_time": "16:27:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5649, "total_steps": 10853, "loss": 0.1386, "learning_rate": 2.537325974888939e-06, "epoch": 0.5204772653982587, "percentage": 52.05, "elapsed_time": "17:51:39", "remaining_time": "16:27:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5650, "total_steps": 10853, "loss": 0.1348, "learning_rate": 2.5365642751859103e-06, "epoch": 0.5205694015755287, "percentage": 52.06, "elapsed_time": "17:51:50", "remaining_time": "16:27:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5651, "total_steps": 10853, "loss": 0.135, "learning_rate": 2.5358025720878847e-06, "epoch": 0.5206615377527987, "percentage": 52.07, "elapsed_time": "17:52:01", "remaining_time": "16:26:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5652, "total_steps": 10853, "loss": 0.1449, "learning_rate": 2.535040865665587e-06, "epoch": 0.5207536739300687, "percentage": 52.08, "elapsed_time": "17:52:13", "remaining_time": "16:26:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5653, "total_steps": 10853, "loss": 0.1393, "learning_rate": 2.53427915598974e-06, "epoch": 0.5208458101073387, "percentage": 52.09, "elapsed_time": "17:52:24", "remaining_time": "16:26:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5654, "total_steps": 10853, "loss": 0.1392, "learning_rate": 2.5335174431310705e-06, "epoch": 0.5209379462846087, "percentage": 52.1, "elapsed_time": "17:52:36", "remaining_time": "16:26:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5655, "total_steps": 10853, "loss": 0.1455, "learning_rate": 2.532755727160302e-06, "epoch": 0.5210300824618787, "percentage": 52.11, "elapsed_time": "17:52:46", "remaining_time": "16:26:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5656, "total_steps": 10853, "loss": 0.1235, "learning_rate": 2.5319940081481612e-06, "epoch": 0.5211222186391486, "percentage": 52.11, "elapsed_time": "17:52:57", "remaining_time": "16:25:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5657, "total_steps": 10853, "loss": 0.1438, "learning_rate": 2.531232286165374e-06, "epoch": 0.5212143548164186, "percentage": 52.12, "elapsed_time": "17:53:07", "remaining_time": "16:25:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5658, "total_steps": 10853, "loss": 0.1308, "learning_rate": 2.530470561282665e-06, "epoch": 0.5213064909936886, "percentage": 52.13, "elapsed_time": "17:53:18", "remaining_time": "16:25:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5659, "total_steps": 10853, "loss": 0.1461, "learning_rate": 2.5297088335707607e-06, "epoch": 0.5213986271709586, "percentage": 52.14, "elapsed_time": "17:53:28", "remaining_time": "16:25:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5660, "total_steps": 10853, "loss": 0.1396, "learning_rate": 2.5289471031003894e-06, "epoch": 0.5214907633482286, "percentage": 52.15, "elapsed_time": "17:53:38", "remaining_time": "16:25:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5661, "total_steps": 10853, "loss": 0.1323, "learning_rate": 2.528185369942275e-06, "epoch": 0.5215828995254986, "percentage": 52.16, "elapsed_time": "17:53:49", "remaining_time": "16:24:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5662, "total_steps": 10853, "loss": 0.1437, "learning_rate": 2.5274236341671464e-06, "epoch": 0.5216750357027687, "percentage": 52.17, "elapsed_time": "17:54:00", "remaining_time": "16:24:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5663, "total_steps": 10853, "loss": 0.1501, "learning_rate": 2.5266618958457305e-06, "epoch": 0.5217671718800387, "percentage": 52.18, "elapsed_time": "17:54:10", "remaining_time": "16:24:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5664, "total_steps": 10853, "loss": 0.1351, "learning_rate": 2.525900155048755e-06, "epoch": 0.5218593080573087, "percentage": 52.19, "elapsed_time": "17:54:21", "remaining_time": "16:24:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5665, "total_steps": 10853, "loss": 0.155, "learning_rate": 2.525138411846947e-06, "epoch": 0.5219514442345787, "percentage": 52.2, "elapsed_time": "17:54:33", "remaining_time": "16:24:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5666, "total_steps": 10853, "loss": 0.1552, "learning_rate": 2.524376666311035e-06, "epoch": 0.5220435804118487, "percentage": 52.21, "elapsed_time": "17:54:44", "remaining_time": "16:23:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5667, "total_steps": 10853, "loss": 0.1253, "learning_rate": 2.523614918511746e-06, "epoch": 0.5221357165891187, "percentage": 52.22, "elapsed_time": "17:54:56", "remaining_time": "16:23:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5668, "total_steps": 10853, "loss": 0.1265, "learning_rate": 2.5228531685198105e-06, "epoch": 0.5222278527663887, "percentage": 52.23, "elapsed_time": "17:55:06", "remaining_time": "16:23:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5669, "total_steps": 10853, "loss": 0.1339, "learning_rate": 2.522091416405955e-06, "epoch": 0.5223199889436587, "percentage": 52.23, "elapsed_time": "17:55:17", "remaining_time": "16:23:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5670, "total_steps": 10853, "loss": 0.1418, "learning_rate": 2.5213296622409094e-06, "epoch": 0.5224121251209287, "percentage": 52.24, "elapsed_time": "17:55:26", "remaining_time": "16:23:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5671, "total_steps": 10853, "loss": 0.1439, "learning_rate": 2.5205679060954025e-06, "epoch": 0.5225042612981987, "percentage": 52.25, "elapsed_time": "17:55:37", "remaining_time": "16:22:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5672, "total_steps": 10853, "loss": 0.1449, "learning_rate": 2.5198061480401623e-06, "epoch": 0.5225963974754687, "percentage": 52.26, "elapsed_time": "17:55:49", "remaining_time": "16:22:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5673, "total_steps": 10853, "loss": 0.1326, "learning_rate": 2.519044388145921e-06, "epoch": 0.5226885336527387, "percentage": 52.27, "elapsed_time": "17:55:58", "remaining_time": "16:22:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5674, "total_steps": 10853, "loss": 0.1359, "learning_rate": 2.5182826264834046e-06, "epoch": 0.5227806698300087, "percentage": 52.28, "elapsed_time": "17:56:09", "remaining_time": "16:22:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5675, "total_steps": 10853, "loss": 0.145, "learning_rate": 2.5175208631233454e-06, "epoch": 0.5228728060072788, "percentage": 52.29, "elapsed_time": "17:56:21", "remaining_time": "16:22:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5676, "total_steps": 10853, "loss": 0.1362, "learning_rate": 2.516759098136472e-06, "epoch": 0.5229649421845488, "percentage": 52.3, "elapsed_time": "17:56:31", "remaining_time": "16:21:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5677, "total_steps": 10853, "loss": 0.1458, "learning_rate": 2.515997331593514e-06, "epoch": 0.5230570783618188, "percentage": 52.31, "elapsed_time": "17:56:44", "remaining_time": "16:21:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5678, "total_steps": 10853, "loss": 0.137, "learning_rate": 2.5152355635652027e-06, "epoch": 0.5231492145390888, "percentage": 52.32, "elapsed_time": "17:56:56", "remaining_time": "16:21:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5679, "total_steps": 10853, "loss": 0.1471, "learning_rate": 2.5144737941222673e-06, "epoch": 0.5232413507163588, "percentage": 52.33, "elapsed_time": "17:57:06", "remaining_time": "16:21:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5680, "total_steps": 10853, "loss": 0.1413, "learning_rate": 2.513712023335438e-06, "epoch": 0.5233334868936288, "percentage": 52.34, "elapsed_time": "17:57:17", "remaining_time": "16:21:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5681, "total_steps": 10853, "loss": 0.1347, "learning_rate": 2.512950251275447e-06, "epoch": 0.5234256230708988, "percentage": 52.34, "elapsed_time": "17:57:29", "remaining_time": "16:20:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5682, "total_steps": 10853, "loss": 0.1366, "learning_rate": 2.512188478013023e-06, "epoch": 0.5235177592481688, "percentage": 52.35, "elapsed_time": "17:57:41", "remaining_time": "16:20:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5683, "total_steps": 10853, "loss": 0.13, "learning_rate": 2.5114267036188975e-06, "epoch": 0.5236098954254388, "percentage": 52.36, "elapsed_time": "17:57:50", "remaining_time": "16:20:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5684, "total_steps": 10853, "loss": 0.1517, "learning_rate": 2.510664928163802e-06, "epoch": 0.5237020316027088, "percentage": 52.37, "elapsed_time": "17:58:02", "remaining_time": "16:20:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5685, "total_steps": 10853, "loss": 0.1235, "learning_rate": 2.5099031517184665e-06, "epoch": 0.5237941677799788, "percentage": 52.38, "elapsed_time": "17:58:13", "remaining_time": "16:20:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5686, "total_steps": 10853, "loss": 0.1339, "learning_rate": 2.509141374353622e-06, "epoch": 0.5238863039572488, "percentage": 52.39, "elapsed_time": "17:58:24", "remaining_time": "16:19:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5687, "total_steps": 10853, "loss": 0.1489, "learning_rate": 2.50837959614e-06, "epoch": 0.5239784401345188, "percentage": 52.4, "elapsed_time": "17:58:35", "remaining_time": "16:19:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5688, "total_steps": 10853, "loss": 0.1415, "learning_rate": 2.5076178171483312e-06, "epoch": 0.5240705763117888, "percentage": 52.41, "elapsed_time": "17:58:45", "remaining_time": "16:19:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5689, "total_steps": 10853, "loss": 0.14, "learning_rate": 2.506856037449348e-06, "epoch": 0.5241627124890589, "percentage": 52.42, "elapsed_time": "17:58:57", "remaining_time": "16:19:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5690, "total_steps": 10853, "loss": 0.1549, "learning_rate": 2.50609425711378e-06, "epoch": 0.5242548486663289, "percentage": 52.43, "elapsed_time": "17:59:07", "remaining_time": "16:19:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5691, "total_steps": 10853, "loss": 0.1547, "learning_rate": 2.505332476212361e-06, "epoch": 0.5243469848435989, "percentage": 52.44, "elapsed_time": "17:59:18", "remaining_time": "16:18:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5692, "total_steps": 10853, "loss": 0.1412, "learning_rate": 2.50457069481582e-06, "epoch": 0.5244391210208689, "percentage": 52.45, "elapsed_time": "17:59:29", "remaining_time": "16:18:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5693, "total_steps": 10853, "loss": 0.14, "learning_rate": 2.50380891299489e-06, "epoch": 0.5245312571981389, "percentage": 52.46, "elapsed_time": "17:59:40", "remaining_time": "16:18:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5694, "total_steps": 10853, "loss": 0.1305, "learning_rate": 2.503047130820302e-06, "epoch": 0.5246233933754089, "percentage": 52.46, "elapsed_time": "17:59:50", "remaining_time": "16:18:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5695, "total_steps": 10853, "loss": 0.1291, "learning_rate": 2.5022853483627876e-06, "epoch": 0.5247155295526789, "percentage": 52.47, "elapsed_time": "18:00:01", "remaining_time": "16:18:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5696, "total_steps": 10853, "loss": 0.1468, "learning_rate": 2.5015235656930774e-06, "epoch": 0.5248076657299489, "percentage": 52.48, "elapsed_time": "18:00:11", "remaining_time": "16:17:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5697, "total_steps": 10853, "loss": 0.1402, "learning_rate": 2.500761782881905e-06, "epoch": 0.5248998019072189, "percentage": 52.49, "elapsed_time": "18:00:21", "remaining_time": "16:17:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5698, "total_steps": 10853, "loss": 0.1319, "learning_rate": 2.5e-06, "epoch": 0.5249919380844889, "percentage": 52.5, "elapsed_time": "18:00:31", "remaining_time": "16:17:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5699, "total_steps": 10853, "loss": 0.1341, "learning_rate": 2.499238217118095e-06, "epoch": 0.5250840742617588, "percentage": 52.51, "elapsed_time": "18:00:42", "remaining_time": "16:17:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5700, "total_steps": 10853, "loss": 0.1414, "learning_rate": 2.498476434306923e-06, "epoch": 0.5251762104390288, "percentage": 52.52, "elapsed_time": "18:00:53", "remaining_time": "16:17:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5701, "total_steps": 10853, "loss": 0.135, "learning_rate": 2.4977146516372137e-06, "epoch": 0.5252683466162988, "percentage": 52.53, "elapsed_time": "18:01:05", "remaining_time": "16:16:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5702, "total_steps": 10853, "loss": 0.1414, "learning_rate": 2.496952869179699e-06, "epoch": 0.525360482793569, "percentage": 52.54, "elapsed_time": "18:01:16", "remaining_time": "16:16:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5703, "total_steps": 10853, "loss": 0.1304, "learning_rate": 2.4961910870051105e-06, "epoch": 0.525452618970839, "percentage": 52.55, "elapsed_time": "18:01:26", "remaining_time": "16:16:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5704, "total_steps": 10853, "loss": 0.1421, "learning_rate": 2.49542930518418e-06, "epoch": 0.5255447551481089, "percentage": 52.56, "elapsed_time": "18:01:36", "remaining_time": "16:16:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5705, "total_steps": 10853, "loss": 0.1425, "learning_rate": 2.49466752378764e-06, "epoch": 0.5256368913253789, "percentage": 52.57, "elapsed_time": "18:01:47", "remaining_time": "16:16:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5706, "total_steps": 10853, "loss": 0.1284, "learning_rate": 2.4939057428862203e-06, "epoch": 0.5257290275026489, "percentage": 52.58, "elapsed_time": "18:02:00", "remaining_time": "16:16:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5707, "total_steps": 10853, "loss": 0.1276, "learning_rate": 2.4931439625506522e-06, "epoch": 0.5258211636799189, "percentage": 52.58, "elapsed_time": "18:02:10", "remaining_time": "16:15:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5708, "total_steps": 10853, "loss": 0.1426, "learning_rate": 2.4923821828516688e-06, "epoch": 0.5259132998571889, "percentage": 52.59, "elapsed_time": "18:02:20", "remaining_time": "16:15:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5709, "total_steps": 10853, "loss": 0.1377, "learning_rate": 2.491620403860001e-06, "epoch": 0.5260054360344589, "percentage": 52.6, "elapsed_time": "18:02:31", "remaining_time": "16:15:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5710, "total_steps": 10853, "loss": 0.1482, "learning_rate": 2.4908586256463788e-06, "epoch": 0.5260975722117289, "percentage": 52.61, "elapsed_time": "18:02:42", "remaining_time": "16:15:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5711, "total_steps": 10853, "loss": 0.1391, "learning_rate": 2.4900968482815344e-06, "epoch": 0.5261897083889989, "percentage": 52.62, "elapsed_time": "18:02:51", "remaining_time": "16:14:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5712, "total_steps": 10853, "loss": 0.1323, "learning_rate": 2.4893350718361984e-06, "epoch": 0.5262818445662689, "percentage": 52.63, "elapsed_time": "18:03:02", "remaining_time": "16:14:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5713, "total_steps": 10853, "loss": 0.1392, "learning_rate": 2.488573296381103e-06, "epoch": 0.5263739807435389, "percentage": 52.64, "elapsed_time": "18:03:12", "remaining_time": "16:14:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5714, "total_steps": 10853, "loss": 0.1366, "learning_rate": 2.487811521986978e-06, "epoch": 0.5264661169208089, "percentage": 52.65, "elapsed_time": "18:03:24", "remaining_time": "16:14:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5715, "total_steps": 10853, "loss": 0.1469, "learning_rate": 2.4870497487245534e-06, "epoch": 0.5265582530980789, "percentage": 52.66, "elapsed_time": "18:03:35", "remaining_time": "16:14:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5716, "total_steps": 10853, "loss": 0.1516, "learning_rate": 2.486287976664562e-06, "epoch": 0.526650389275349, "percentage": 52.67, "elapsed_time": "18:03:46", "remaining_time": "16:13:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5717, "total_steps": 10853, "loss": 0.1329, "learning_rate": 2.485526205877734e-06, "epoch": 0.526742525452619, "percentage": 52.68, "elapsed_time": "18:03:57", "remaining_time": "16:13:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5718, "total_steps": 10853, "loss": 0.1435, "learning_rate": 2.484764436434798e-06, "epoch": 0.526834661629889, "percentage": 52.69, "elapsed_time": "18:04:08", "remaining_time": "16:13:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5719, "total_steps": 10853, "loss": 0.1249, "learning_rate": 2.4840026684064867e-06, "epoch": 0.526926797807159, "percentage": 52.7, "elapsed_time": "18:04:17", "remaining_time": "16:13:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5720, "total_steps": 10853, "loss": 0.1428, "learning_rate": 2.4832409018635283e-06, "epoch": 0.527018933984429, "percentage": 52.7, "elapsed_time": "18:04:28", "remaining_time": "16:13:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5721, "total_steps": 10853, "loss": 0.1412, "learning_rate": 2.4824791368766555e-06, "epoch": 0.527111070161699, "percentage": 52.71, "elapsed_time": "18:04:39", "remaining_time": "16:12:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5722, "total_steps": 10853, "loss": 0.1406, "learning_rate": 2.4817173735165958e-06, "epoch": 0.527203206338969, "percentage": 52.72, "elapsed_time": "18:04:50", "remaining_time": "16:12:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5723, "total_steps": 10853, "loss": 0.1333, "learning_rate": 2.4809556118540795e-06, "epoch": 0.527295342516239, "percentage": 52.73, "elapsed_time": "18:05:01", "remaining_time": "16:12:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5724, "total_steps": 10853, "loss": 0.1201, "learning_rate": 2.4801938519598372e-06, "epoch": 0.527387478693509, "percentage": 52.74, "elapsed_time": "18:05:11", "remaining_time": "16:12:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5725, "total_steps": 10853, "loss": 0.1418, "learning_rate": 2.4794320939045988e-06, "epoch": 0.527479614870779, "percentage": 52.75, "elapsed_time": "18:05:22", "remaining_time": "16:12:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5726, "total_steps": 10853, "loss": 0.1314, "learning_rate": 2.4786703377590914e-06, "epoch": 0.527571751048049, "percentage": 52.76, "elapsed_time": "18:05:32", "remaining_time": "16:11:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5727, "total_steps": 10853, "loss": 0.1501, "learning_rate": 2.4779085835940457e-06, "epoch": 0.527663887225319, "percentage": 52.77, "elapsed_time": "18:05:43", "remaining_time": "16:11:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5728, "total_steps": 10853, "loss": 0.1368, "learning_rate": 2.47714683148019e-06, "epoch": 0.527756023402589, "percentage": 52.78, "elapsed_time": "18:05:54", "remaining_time": "16:11:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5729, "total_steps": 10853, "loss": 0.1416, "learning_rate": 2.476385081488254e-06, "epoch": 0.527848159579859, "percentage": 52.79, "elapsed_time": "18:06:06", "remaining_time": "16:11:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5730, "total_steps": 10853, "loss": 0.1331, "learning_rate": 2.4756233336889663e-06, "epoch": 0.5279402957571291, "percentage": 52.8, "elapsed_time": "18:06:17", "remaining_time": "16:11:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5731, "total_steps": 10853, "loss": 0.1434, "learning_rate": 2.474861588153054e-06, "epoch": 0.5280324319343991, "percentage": 52.81, "elapsed_time": "18:06:28", "remaining_time": "16:11:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5732, "total_steps": 10853, "loss": 0.1405, "learning_rate": 2.4740998449512456e-06, "epoch": 0.5281245681116691, "percentage": 52.81, "elapsed_time": "18:06:37", "remaining_time": "16:10:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5733, "total_steps": 10853, "loss": 0.1442, "learning_rate": 2.4733381041542695e-06, "epoch": 0.5282167042889391, "percentage": 52.82, "elapsed_time": "18:06:47", "remaining_time": "16:10:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5734, "total_steps": 10853, "loss": 0.128, "learning_rate": 2.4725763658328544e-06, "epoch": 0.5283088404662091, "percentage": 52.83, "elapsed_time": "18:06:58", "remaining_time": "16:10:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5735, "total_steps": 10853, "loss": 0.1368, "learning_rate": 2.471814630057726e-06, "epoch": 0.5284009766434791, "percentage": 52.84, "elapsed_time": "18:07:09", "remaining_time": "16:10:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5736, "total_steps": 10853, "loss": 0.149, "learning_rate": 2.4710528968996114e-06, "epoch": 0.5284931128207491, "percentage": 52.85, "elapsed_time": "18:07:20", "remaining_time": "16:09:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5737, "total_steps": 10853, "loss": 0.1365, "learning_rate": 2.4702911664292397e-06, "epoch": 0.5285852489980191, "percentage": 52.86, "elapsed_time": "18:07:30", "remaining_time": "16:09:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5738, "total_steps": 10853, "loss": 0.1373, "learning_rate": 2.469529438717336e-06, "epoch": 0.5286773851752891, "percentage": 52.87, "elapsed_time": "18:07:41", "remaining_time": "16:09:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5739, "total_steps": 10853, "loss": 0.137, "learning_rate": 2.4687677138346265e-06, "epoch": 0.5287695213525591, "percentage": 52.88, "elapsed_time": "18:07:51", "remaining_time": "16:09:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5740, "total_steps": 10853, "loss": 0.1547, "learning_rate": 2.468005991851839e-06, "epoch": 0.528861657529829, "percentage": 52.89, "elapsed_time": "18:08:02", "remaining_time": "16:09:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5741, "total_steps": 10853, "loss": 0.1402, "learning_rate": 2.467244272839698e-06, "epoch": 0.528953793707099, "percentage": 52.9, "elapsed_time": "18:08:12", "remaining_time": "16:08:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5742, "total_steps": 10853, "loss": 0.1316, "learning_rate": 2.4664825568689303e-06, "epoch": 0.529045929884369, "percentage": 52.91, "elapsed_time": "18:08:24", "remaining_time": "16:08:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5743, "total_steps": 10853, "loss": 0.1346, "learning_rate": 2.4657208440102607e-06, "epoch": 0.5291380660616392, "percentage": 52.92, "elapsed_time": "18:08:34", "remaining_time": "16:08:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5744, "total_steps": 10853, "loss": 0.1398, "learning_rate": 2.464959134334414e-06, "epoch": 0.5292302022389092, "percentage": 52.93, "elapsed_time": "18:08:44", "remaining_time": "16:08:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5745, "total_steps": 10853, "loss": 0.1338, "learning_rate": 2.4641974279121157e-06, "epoch": 0.5293223384161792, "percentage": 52.93, "elapsed_time": "18:08:55", "remaining_time": "16:08:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5746, "total_steps": 10853, "loss": 0.1363, "learning_rate": 2.463435724814091e-06, "epoch": 0.5294144745934491, "percentage": 52.94, "elapsed_time": "18:09:06", "remaining_time": "16:07:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5747, "total_steps": 10853, "loss": 0.1451, "learning_rate": 2.4626740251110615e-06, "epoch": 0.5295066107707191, "percentage": 52.95, "elapsed_time": "18:09:17", "remaining_time": "16:07:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5748, "total_steps": 10853, "loss": 0.1357, "learning_rate": 2.461912328873754e-06, "epoch": 0.5295987469479891, "percentage": 52.96, "elapsed_time": "18:09:28", "remaining_time": "16:07:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5749, "total_steps": 10853, "loss": 0.1492, "learning_rate": 2.46115063617289e-06, "epoch": 0.5296908831252591, "percentage": 52.97, "elapsed_time": "18:09:40", "remaining_time": "16:07:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5750, "total_steps": 10853, "loss": 0.128, "learning_rate": 2.4603889470791946e-06, "epoch": 0.5297830193025291, "percentage": 52.98, "elapsed_time": "18:09:50", "remaining_time": "16:07:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5751, "total_steps": 10853, "loss": 0.1339, "learning_rate": 2.4596272616633892e-06, "epoch": 0.5298751554797991, "percentage": 52.99, "elapsed_time": "18:10:01", "remaining_time": "16:07:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5752, "total_steps": 10853, "loss": 0.1365, "learning_rate": 2.4588655799961968e-06, "epoch": 0.5299672916570691, "percentage": 53.0, "elapsed_time": "18:10:13", "remaining_time": "16:06:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5753, "total_steps": 10853, "loss": 0.1388, "learning_rate": 2.45810390214834e-06, "epoch": 0.5300594278343391, "percentage": 53.01, "elapsed_time": "18:10:23", "remaining_time": "16:06:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5754, "total_steps": 10853, "loss": 0.1451, "learning_rate": 2.4573422281905405e-06, "epoch": 0.5301515640116091, "percentage": 53.02, "elapsed_time": "18:10:33", "remaining_time": "16:06:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5755, "total_steps": 10853, "loss": 0.1378, "learning_rate": 2.456580558193519e-06, "epoch": 0.5302437001888791, "percentage": 53.03, "elapsed_time": "18:10:43", "remaining_time": "16:06:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5756, "total_steps": 10853, "loss": 0.147, "learning_rate": 2.4558188922279977e-06, "epoch": 0.5303358363661491, "percentage": 53.04, "elapsed_time": "18:10:55", "remaining_time": "16:06:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5757, "total_steps": 10853, "loss": 0.155, "learning_rate": 2.4550572303646965e-06, "epoch": 0.5304279725434192, "percentage": 53.05, "elapsed_time": "18:11:06", "remaining_time": "16:05:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5758, "total_steps": 10853, "loss": 0.14, "learning_rate": 2.454295572674337e-06, "epoch": 0.5305201087206892, "percentage": 53.05, "elapsed_time": "18:11:16", "remaining_time": "16:05:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5759, "total_steps": 10853, "loss": 0.1378, "learning_rate": 2.453533919227639e-06, "epoch": 0.5306122448979592, "percentage": 53.06, "elapsed_time": "18:11:27", "remaining_time": "16:05:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5760, "total_steps": 10853, "loss": 0.1348, "learning_rate": 2.4527722700953205e-06, "epoch": 0.5307043810752292, "percentage": 53.07, "elapsed_time": "18:11:39", "remaining_time": "16:05:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5761, "total_steps": 10853, "loss": 0.1408, "learning_rate": 2.4520106253481025e-06, "epoch": 0.5307965172524992, "percentage": 53.08, "elapsed_time": "18:11:52", "remaining_time": "16:05:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5762, "total_steps": 10853, "loss": 0.1464, "learning_rate": 2.451248985056702e-06, "epoch": 0.5308886534297692, "percentage": 53.09, "elapsed_time": "18:12:04", "remaining_time": "16:04:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5763, "total_steps": 10853, "loss": 0.1252, "learning_rate": 2.4504873492918404e-06, "epoch": 0.5309807896070392, "percentage": 53.1, "elapsed_time": "18:12:13", "remaining_time": "16:04:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5764, "total_steps": 10853, "loss": 0.1401, "learning_rate": 2.449725718124233e-06, "epoch": 0.5310729257843092, "percentage": 53.11, "elapsed_time": "18:12:24", "remaining_time": "16:04:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5765, "total_steps": 10853, "loss": 0.1383, "learning_rate": 2.448964091624597e-06, "epoch": 0.5311650619615792, "percentage": 53.12, "elapsed_time": "18:12:35", "remaining_time": "16:04:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5766, "total_steps": 10853, "loss": 0.1334, "learning_rate": 2.4482024698636514e-06, "epoch": 0.5312571981388492, "percentage": 53.13, "elapsed_time": "18:12:46", "remaining_time": "16:04:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5767, "total_steps": 10853, "loss": 0.1379, "learning_rate": 2.4474408529121126e-06, "epoch": 0.5313493343161192, "percentage": 53.14, "elapsed_time": "18:12:57", "remaining_time": "16:03:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5768, "total_steps": 10853, "loss": 0.1158, "learning_rate": 2.4466792408406953e-06, "epoch": 0.5314414704933892, "percentage": 53.15, "elapsed_time": "18:13:08", "remaining_time": "16:03:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5769, "total_steps": 10853, "loss": 0.1366, "learning_rate": 2.445917633720117e-06, "epoch": 0.5315336066706592, "percentage": 53.16, "elapsed_time": "18:13:20", "remaining_time": "16:03:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5770, "total_steps": 10853, "loss": 0.1298, "learning_rate": 2.4451560316210913e-06, "epoch": 0.5316257428479293, "percentage": 53.17, "elapsed_time": "18:13:32", "remaining_time": "16:03:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5771, "total_steps": 10853, "loss": 0.1448, "learning_rate": 2.444394434614335e-06, "epoch": 0.5317178790251993, "percentage": 53.17, "elapsed_time": "18:13:42", "remaining_time": "16:03:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5772, "total_steps": 10853, "loss": 0.1484, "learning_rate": 2.4436328427705612e-06, "epoch": 0.5318100152024693, "percentage": 53.18, "elapsed_time": "18:13:53", "remaining_time": "16:02:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5773, "total_steps": 10853, "loss": 0.1463, "learning_rate": 2.442871256160483e-06, "epoch": 0.5319021513797393, "percentage": 53.19, "elapsed_time": "18:14:05", "remaining_time": "16:02:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5774, "total_steps": 10853, "loss": 0.1435, "learning_rate": 2.442109674854815e-06, "epoch": 0.5319942875570093, "percentage": 53.2, "elapsed_time": "18:14:15", "remaining_time": "16:02:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5775, "total_steps": 10853, "loss": 0.1247, "learning_rate": 2.4413480989242718e-06, "epoch": 0.5320864237342793, "percentage": 53.21, "elapsed_time": "18:14:25", "remaining_time": "16:02:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5776, "total_steps": 10853, "loss": 0.1404, "learning_rate": 2.440586528439562e-06, "epoch": 0.5321785599115493, "percentage": 53.22, "elapsed_time": "18:14:37", "remaining_time": "16:02:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5777, "total_steps": 10853, "loss": 0.1332, "learning_rate": 2.4398249634713996e-06, "epoch": 0.5322706960888193, "percentage": 53.23, "elapsed_time": "18:14:47", "remaining_time": "16:01:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5778, "total_steps": 10853, "loss": 0.1182, "learning_rate": 2.4390634040904965e-06, "epoch": 0.5323628322660893, "percentage": 53.24, "elapsed_time": "18:14:58", "remaining_time": "16:01:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5779, "total_steps": 10853, "loss": 0.1345, "learning_rate": 2.4383018503675633e-06, "epoch": 0.5324549684433593, "percentage": 53.25, "elapsed_time": "18:15:09", "remaining_time": "16:01:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5780, "total_steps": 10853, "loss": 0.125, "learning_rate": 2.437540302373309e-06, "epoch": 0.5325471046206293, "percentage": 53.26, "elapsed_time": "18:15:21", "remaining_time": "16:01:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5781, "total_steps": 10853, "loss": 0.1371, "learning_rate": 2.4367787601784446e-06, "epoch": 0.5326392407978993, "percentage": 53.27, "elapsed_time": "18:15:33", "remaining_time": "16:01:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5782, "total_steps": 10853, "loss": 0.1364, "learning_rate": 2.4360172238536787e-06, "epoch": 0.5327313769751693, "percentage": 53.28, "elapsed_time": "18:15:43", "remaining_time": "16:00:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5783, "total_steps": 10853, "loss": 0.1423, "learning_rate": 2.435255693469721e-06, "epoch": 0.5328235131524393, "percentage": 53.28, "elapsed_time": "18:15:54", "remaining_time": "16:00:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5784, "total_steps": 10853, "loss": 0.1498, "learning_rate": 2.4344941690972797e-06, "epoch": 0.5329156493297094, "percentage": 53.29, "elapsed_time": "18:16:05", "remaining_time": "16:00:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5785, "total_steps": 10853, "loss": 0.139, "learning_rate": 2.4337326508070604e-06, "epoch": 0.5330077855069794, "percentage": 53.3, "elapsed_time": "18:16:15", "remaining_time": "16:00:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5786, "total_steps": 10853, "loss": 0.1298, "learning_rate": 2.4329711386697726e-06, "epoch": 0.5330999216842494, "percentage": 53.31, "elapsed_time": "18:16:28", "remaining_time": "16:00:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5787, "total_steps": 10853, "loss": 0.1489, "learning_rate": 2.432209632756121e-06, "epoch": 0.5331920578615194, "percentage": 53.32, "elapsed_time": "18:16:37", "remaining_time": "16:00:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5788, "total_steps": 10853, "loss": 0.135, "learning_rate": 2.4314481331368133e-06, "epoch": 0.5332841940387893, "percentage": 53.33, "elapsed_time": "18:16:49", "remaining_time": "15:59:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5789, "total_steps": 10853, "loss": 0.132, "learning_rate": 2.430686639882554e-06, "epoch": 0.5333763302160593, "percentage": 53.34, "elapsed_time": "18:17:00", "remaining_time": "15:59:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5790, "total_steps": 10853, "loss": 0.1237, "learning_rate": 2.429925153064046e-06, "epoch": 0.5334684663933293, "percentage": 53.35, "elapsed_time": "18:17:10", "remaining_time": "15:59:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5791, "total_steps": 10853, "loss": 0.1287, "learning_rate": 2.4291636727519966e-06, "epoch": 0.5335606025705993, "percentage": 53.36, "elapsed_time": "18:17:20", "remaining_time": "15:59:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5792, "total_steps": 10853, "loss": 0.1265, "learning_rate": 2.428402199017108e-06, "epoch": 0.5336527387478693, "percentage": 53.37, "elapsed_time": "18:17:31", "remaining_time": "15:59:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5793, "total_steps": 10853, "loss": 0.1515, "learning_rate": 2.4276407319300815e-06, "epoch": 0.5337448749251393, "percentage": 53.38, "elapsed_time": "18:17:42", "remaining_time": "15:58:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5794, "total_steps": 10853, "loss": 0.1386, "learning_rate": 2.4268792715616217e-06, "epoch": 0.5338370111024093, "percentage": 53.39, "elapsed_time": "18:17:52", "remaining_time": "15:58:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5795, "total_steps": 10853, "loss": 0.1312, "learning_rate": 2.4261178179824287e-06, "epoch": 0.5339291472796793, "percentage": 53.4, "elapsed_time": "18:18:03", "remaining_time": "15:58:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5796, "total_steps": 10853, "loss": 0.1329, "learning_rate": 2.4253563712632057e-06, "epoch": 0.5340212834569493, "percentage": 53.4, "elapsed_time": "18:18:13", "remaining_time": "15:58:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5797, "total_steps": 10853, "loss": 0.1367, "learning_rate": 2.4245949314746506e-06, "epoch": 0.5341134196342193, "percentage": 53.41, "elapsed_time": "18:18:24", "remaining_time": "15:58:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5798, "total_steps": 10853, "loss": 0.1374, "learning_rate": 2.423833498687464e-06, "epoch": 0.5342055558114894, "percentage": 53.42, "elapsed_time": "18:18:35", "remaining_time": "15:57:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5799, "total_steps": 10853, "loss": 0.1346, "learning_rate": 2.423072072972346e-06, "epoch": 0.5342976919887594, "percentage": 53.43, "elapsed_time": "18:18:47", "remaining_time": "15:57:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5800, "total_steps": 10853, "loss": 0.1378, "learning_rate": 2.4223106543999943e-06, "epoch": 0.5343898281660294, "percentage": 53.44, "elapsed_time": "18:18:59", "remaining_time": "15:57:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5801, "total_steps": 10853, "loss": 0.1275, "learning_rate": 2.4215492430411057e-06, "epoch": 0.5344819643432994, "percentage": 53.45, "elapsed_time": "18:19:10", "remaining_time": "15:57:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5802, "total_steps": 10853, "loss": 0.1372, "learning_rate": 2.4207878389663794e-06, "epoch": 0.5345741005205694, "percentage": 53.46, "elapsed_time": "18:19:20", "remaining_time": "15:57:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5803, "total_steps": 10853, "loss": 0.1415, "learning_rate": 2.4200264422465096e-06, "epoch": 0.5346662366978394, "percentage": 53.47, "elapsed_time": "18:19:31", "remaining_time": "15:56:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5804, "total_steps": 10853, "loss": 0.131, "learning_rate": 2.4192650529521948e-06, "epoch": 0.5347583728751094, "percentage": 53.48, "elapsed_time": "18:19:42", "remaining_time": "15:56:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5805, "total_steps": 10853, "loss": 0.1416, "learning_rate": 2.418503671154128e-06, "epoch": 0.5348505090523794, "percentage": 53.49, "elapsed_time": "18:19:52", "remaining_time": "15:56:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5806, "total_steps": 10853, "loss": 0.1298, "learning_rate": 2.417742296923003e-06, "epoch": 0.5349426452296494, "percentage": 53.5, "elapsed_time": "18:20:04", "remaining_time": "15:56:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5807, "total_steps": 10853, "loss": 0.1372, "learning_rate": 2.4169809303295157e-06, "epoch": 0.5350347814069194, "percentage": 53.51, "elapsed_time": "18:20:15", "remaining_time": "15:56:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5808, "total_steps": 10853, "loss": 0.1336, "learning_rate": 2.4162195714443584e-06, "epoch": 0.5351269175841894, "percentage": 53.52, "elapsed_time": "18:20:27", "remaining_time": "15:55:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5809, "total_steps": 10853, "loss": 0.1377, "learning_rate": 2.4154582203382216e-06, "epoch": 0.5352190537614594, "percentage": 53.52, "elapsed_time": "18:20:36", "remaining_time": "15:55:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5810, "total_steps": 10853, "loss": 0.1252, "learning_rate": 2.4146968770817988e-06, "epoch": 0.5353111899387294, "percentage": 53.53, "elapsed_time": "18:20:47", "remaining_time": "15:55:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5811, "total_steps": 10853, "loss": 0.1499, "learning_rate": 2.41393554174578e-06, "epoch": 0.5354033261159995, "percentage": 53.54, "elapsed_time": "18:20:58", "remaining_time": "15:55:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5812, "total_steps": 10853, "loss": 0.1366, "learning_rate": 2.4131742144008557e-06, "epoch": 0.5354954622932695, "percentage": 53.55, "elapsed_time": "18:21:08", "remaining_time": "15:55:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5813, "total_steps": 10853, "loss": 0.119, "learning_rate": 2.4124128951177146e-06, "epoch": 0.5355875984705395, "percentage": 53.56, "elapsed_time": "18:21:18", "remaining_time": "15:54:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5814, "total_steps": 10853, "loss": 0.1358, "learning_rate": 2.4116515839670456e-06, "epoch": 0.5356797346478095, "percentage": 53.57, "elapsed_time": "18:21:29", "remaining_time": "15:54:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5815, "total_steps": 10853, "loss": 0.1468, "learning_rate": 2.4108902810195367e-06, "epoch": 0.5357718708250795, "percentage": 53.58, "elapsed_time": "18:21:41", "remaining_time": "15:54:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5816, "total_steps": 10853, "loss": 0.1255, "learning_rate": 2.4101289863458744e-06, "epoch": 0.5358640070023495, "percentage": 53.59, "elapsed_time": "18:21:52", "remaining_time": "15:54:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5817, "total_steps": 10853, "loss": 0.1344, "learning_rate": 2.409367700016746e-06, "epoch": 0.5359561431796195, "percentage": 53.6, "elapsed_time": "18:22:03", "remaining_time": "15:54:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5818, "total_steps": 10853, "loss": 0.1302, "learning_rate": 2.4086064221028365e-06, "epoch": 0.5360482793568895, "percentage": 53.61, "elapsed_time": "18:22:12", "remaining_time": "15:53:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5819, "total_steps": 10853, "loss": 0.1407, "learning_rate": 2.40784515267483e-06, "epoch": 0.5361404155341595, "percentage": 53.62, "elapsed_time": "18:22:23", "remaining_time": "15:53:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5820, "total_steps": 10853, "loss": 0.1394, "learning_rate": 2.407083891803411e-06, "epoch": 0.5362325517114295, "percentage": 53.63, "elapsed_time": "18:22:34", "remaining_time": "15:53:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5821, "total_steps": 10853, "loss": 0.1358, "learning_rate": 2.4063226395592635e-06, "epoch": 0.5363246878886995, "percentage": 53.63, "elapsed_time": "18:22:44", "remaining_time": "15:53:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5822, "total_steps": 10853, "loss": 0.1376, "learning_rate": 2.4055613960130676e-06, "epoch": 0.5364168240659695, "percentage": 53.64, "elapsed_time": "18:22:55", "remaining_time": "15:53:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5823, "total_steps": 10853, "loss": 0.1375, "learning_rate": 2.4048001612355072e-06, "epoch": 0.5365089602432395, "percentage": 53.65, "elapsed_time": "18:23:05", "remaining_time": "15:52:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5824, "total_steps": 10853, "loss": 0.1345, "learning_rate": 2.4040389352972616e-06, "epoch": 0.5366010964205095, "percentage": 53.66, "elapsed_time": "18:23:15", "remaining_time": "15:52:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5825, "total_steps": 10853, "loss": 0.1287, "learning_rate": 2.403277718269012e-06, "epoch": 0.5366932325977796, "percentage": 53.67, "elapsed_time": "18:23:25", "remaining_time": "15:52:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5826, "total_steps": 10853, "loss": 0.1274, "learning_rate": 2.4025165102214363e-06, "epoch": 0.5367853687750496, "percentage": 53.68, "elapsed_time": "18:23:35", "remaining_time": "15:52:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5827, "total_steps": 10853, "loss": 0.1427, "learning_rate": 2.4017553112252123e-06, "epoch": 0.5368775049523196, "percentage": 53.69, "elapsed_time": "18:23:45", "remaining_time": "15:52:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5828, "total_steps": 10853, "loss": 0.1422, "learning_rate": 2.400994121351019e-06, "epoch": 0.5369696411295896, "percentage": 53.7, "elapsed_time": "18:23:57", "remaining_time": "15:51:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5829, "total_steps": 10853, "loss": 0.135, "learning_rate": 2.4002329406695325e-06, "epoch": 0.5370617773068596, "percentage": 53.71, "elapsed_time": "18:24:08", "remaining_time": "15:51:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5830, "total_steps": 10853, "loss": 0.1479, "learning_rate": 2.3994717692514274e-06, "epoch": 0.5371539134841296, "percentage": 53.72, "elapsed_time": "18:24:18", "remaining_time": "15:51:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5831, "total_steps": 10853, "loss": 0.1339, "learning_rate": 2.3987106071673797e-06, "epoch": 0.5372460496613995, "percentage": 53.73, "elapsed_time": "18:24:30", "remaining_time": "15:51:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5832, "total_steps": 10853, "loss": 0.117, "learning_rate": 2.3979494544880625e-06, "epoch": 0.5373381858386695, "percentage": 53.74, "elapsed_time": "18:24:41", "remaining_time": "15:51:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5833, "total_steps": 10853, "loss": 0.1481, "learning_rate": 2.3971883112841505e-06, "epoch": 0.5374303220159395, "percentage": 53.75, "elapsed_time": "18:24:52", "remaining_time": "15:50:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5834, "total_steps": 10853, "loss": 0.1448, "learning_rate": 2.3964271776263146e-06, "epoch": 0.5375224581932095, "percentage": 53.75, "elapsed_time": "18:25:02", "remaining_time": "15:50:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5835, "total_steps": 10853, "loss": 0.1403, "learning_rate": 2.3956660535852254e-06, "epoch": 0.5376145943704795, "percentage": 53.76, "elapsed_time": "18:25:12", "remaining_time": "15:50:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5836, "total_steps": 10853, "loss": 0.1313, "learning_rate": 2.3949049392315555e-06, "epoch": 0.5377067305477495, "percentage": 53.77, "elapsed_time": "18:25:23", "remaining_time": "15:50:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5837, "total_steps": 10853, "loss": 0.132, "learning_rate": 2.394143834635973e-06, "epoch": 0.5377988667250195, "percentage": 53.78, "elapsed_time": "18:25:35", "remaining_time": "15:50:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5838, "total_steps": 10853, "loss": 0.1291, "learning_rate": 2.3933827398691464e-06, "epoch": 0.5378910029022896, "percentage": 53.79, "elapsed_time": "18:25:45", "remaining_time": "15:49:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5839, "total_steps": 10853, "loss": 0.1402, "learning_rate": 2.3926216550017445e-06, "epoch": 0.5379831390795596, "percentage": 53.8, "elapsed_time": "18:25:56", "remaining_time": "15:49:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5840, "total_steps": 10853, "loss": 0.1403, "learning_rate": 2.3918605801044325e-06, "epoch": 0.5380752752568296, "percentage": 53.81, "elapsed_time": "18:26:07", "remaining_time": "15:49:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5841, "total_steps": 10853, "loss": 0.1399, "learning_rate": 2.3910995152478786e-06, "epoch": 0.5381674114340996, "percentage": 53.82, "elapsed_time": "18:26:18", "remaining_time": "15:49:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5842, "total_steps": 10853, "loss": 0.1339, "learning_rate": 2.3903384605027462e-06, "epoch": 0.5382595476113696, "percentage": 53.83, "elapsed_time": "18:26:29", "remaining_time": "15:49:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5843, "total_steps": 10853, "loss": 0.1425, "learning_rate": 2.3895774159396982e-06, "epoch": 0.5383516837886396, "percentage": 53.84, "elapsed_time": "18:26:39", "remaining_time": "15:48:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5844, "total_steps": 10853, "loss": 0.1345, "learning_rate": 2.3888163816294e-06, "epoch": 0.5384438199659096, "percentage": 53.85, "elapsed_time": "18:26:50", "remaining_time": "15:48:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5845, "total_steps": 10853, "loss": 0.1313, "learning_rate": 2.3880553576425124e-06, "epoch": 0.5385359561431796, "percentage": 53.86, "elapsed_time": "18:27:01", "remaining_time": "15:48:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5846, "total_steps": 10853, "loss": 0.1472, "learning_rate": 2.3872943440496978e-06, "epoch": 0.5386280923204496, "percentage": 53.87, "elapsed_time": "18:27:13", "remaining_time": "15:48:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5847, "total_steps": 10853, "loss": 0.1413, "learning_rate": 2.386533340921615e-06, "epoch": 0.5387202284977196, "percentage": 53.87, "elapsed_time": "18:27:25", "remaining_time": "15:48:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5848, "total_steps": 10853, "loss": 0.1584, "learning_rate": 2.385772348328923e-06, "epoch": 0.5388123646749896, "percentage": 53.88, "elapsed_time": "18:27:36", "remaining_time": "15:47:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5849, "total_steps": 10853, "loss": 0.1407, "learning_rate": 2.385011366342281e-06, "epoch": 0.5389045008522596, "percentage": 53.89, "elapsed_time": "18:27:47", "remaining_time": "15:47:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5850, "total_steps": 10853, "loss": 0.136, "learning_rate": 2.3842503950323473e-06, "epoch": 0.5389966370295296, "percentage": 53.9, "elapsed_time": "18:27:57", "remaining_time": "15:47:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5851, "total_steps": 10853, "loss": 0.1426, "learning_rate": 2.383489434469775e-06, "epoch": 0.5390887732067996, "percentage": 53.91, "elapsed_time": "18:28:08", "remaining_time": "15:47:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5852, "total_steps": 10853, "loss": 0.1341, "learning_rate": 2.382728484725222e-06, "epoch": 0.5391809093840697, "percentage": 53.92, "elapsed_time": "18:28:20", "remaining_time": "15:47:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5853, "total_steps": 10853, "loss": 0.1409, "learning_rate": 2.3819675458693422e-06, "epoch": 0.5392730455613397, "percentage": 53.93, "elapsed_time": "18:28:31", "remaining_time": "15:46:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5854, "total_steps": 10853, "loss": 0.1444, "learning_rate": 2.381206617972789e-06, "epoch": 0.5393651817386097, "percentage": 53.94, "elapsed_time": "18:28:43", "remaining_time": "15:46:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5855, "total_steps": 10853, "loss": 0.1398, "learning_rate": 2.3804457011062126e-06, "epoch": 0.5394573179158797, "percentage": 53.95, "elapsed_time": "18:28:52", "remaining_time": "15:46:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5856, "total_steps": 10853, "loss": 0.1225, "learning_rate": 2.3796847953402665e-06, "epoch": 0.5395494540931497, "percentage": 53.96, "elapsed_time": "18:29:01", "remaining_time": "15:46:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5857, "total_steps": 10853, "loss": 0.1405, "learning_rate": 2.3789239007455996e-06, "epoch": 0.5396415902704197, "percentage": 53.97, "elapsed_time": "18:29:13", "remaining_time": "15:46:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5858, "total_steps": 10853, "loss": 0.1347, "learning_rate": 2.3781630173928627e-06, "epoch": 0.5397337264476897, "percentage": 53.98, "elapsed_time": "18:29:22", "remaining_time": "15:45:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5859, "total_steps": 10853, "loss": 0.1193, "learning_rate": 2.3774021453527023e-06, "epoch": 0.5398258626249597, "percentage": 53.99, "elapsed_time": "18:29:33", "remaining_time": "15:45:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5860, "total_steps": 10853, "loss": 0.1485, "learning_rate": 2.3766412846957652e-06, "epoch": 0.5399179988022297, "percentage": 53.99, "elapsed_time": "18:29:44", "remaining_time": "15:45:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5861, "total_steps": 10853, "loss": 0.1391, "learning_rate": 2.3758804354926986e-06, "epoch": 0.5400101349794997, "percentage": 54.0, "elapsed_time": "18:29:56", "remaining_time": "15:45:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5862, "total_steps": 10853, "loss": 0.1455, "learning_rate": 2.375119597814147e-06, "epoch": 0.5401022711567697, "percentage": 54.01, "elapsed_time": "18:30:05", "remaining_time": "15:45:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5863, "total_steps": 10853, "loss": 0.1285, "learning_rate": 2.374358771730754e-06, "epoch": 0.5401944073340397, "percentage": 54.02, "elapsed_time": "18:30:15", "remaining_time": "15:44:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5864, "total_steps": 10853, "loss": 0.147, "learning_rate": 2.3735979573131626e-06, "epoch": 0.5402865435113097, "percentage": 54.03, "elapsed_time": "18:30:26", "remaining_time": "15:44:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5865, "total_steps": 10853, "loss": 0.1289, "learning_rate": 2.372837154632014e-06, "epoch": 0.5403786796885797, "percentage": 54.04, "elapsed_time": "18:30:37", "remaining_time": "15:44:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5866, "total_steps": 10853, "loss": 0.132, "learning_rate": 2.37207636375795e-06, "epoch": 0.5404708158658498, "percentage": 54.05, "elapsed_time": "18:30:47", "remaining_time": "15:44:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5867, "total_steps": 10853, "loss": 0.1444, "learning_rate": 2.3713155847616095e-06, "epoch": 0.5405629520431198, "percentage": 54.06, "elapsed_time": "18:30:58", "remaining_time": "15:44:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5868, "total_steps": 10853, "loss": 0.1257, "learning_rate": 2.37055481771363e-06, "epoch": 0.5406550882203898, "percentage": 54.07, "elapsed_time": "18:31:08", "remaining_time": "15:43:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5869, "total_steps": 10853, "loss": 0.1366, "learning_rate": 2.3697940626846504e-06, "epoch": 0.5407472243976598, "percentage": 54.08, "elapsed_time": "18:31:21", "remaining_time": "15:43:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5870, "total_steps": 10853, "loss": 0.1278, "learning_rate": 2.369033319745306e-06, "epoch": 0.5408393605749298, "percentage": 54.09, "elapsed_time": "18:31:32", "remaining_time": "15:43:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5871, "total_steps": 10853, "loss": 0.1316, "learning_rate": 2.3682725889662316e-06, "epoch": 0.5409314967521998, "percentage": 54.1, "elapsed_time": "18:31:43", "remaining_time": "15:43:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5872, "total_steps": 10853, "loss": 0.1375, "learning_rate": 2.3675118704180614e-06, "epoch": 0.5410236329294698, "percentage": 54.1, "elapsed_time": "18:31:54", "remaining_time": "15:43:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5873, "total_steps": 10853, "loss": 0.1433, "learning_rate": 2.366751164171428e-06, "epoch": 0.5411157691067398, "percentage": 54.11, "elapsed_time": "18:32:06", "remaining_time": "15:43:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5874, "total_steps": 10853, "loss": 0.1339, "learning_rate": 2.3659904702969636e-06, "epoch": 0.5412079052840097, "percentage": 54.12, "elapsed_time": "18:32:16", "remaining_time": "15:42:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5875, "total_steps": 10853, "loss": 0.1409, "learning_rate": 2.3652297888653e-06, "epoch": 0.5413000414612797, "percentage": 54.13, "elapsed_time": "18:32:28", "remaining_time": "15:42:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5876, "total_steps": 10853, "loss": 0.1369, "learning_rate": 2.3644691199470628e-06, "epoch": 0.5413921776385497, "percentage": 54.14, "elapsed_time": "18:32:39", "remaining_time": "15:42:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5877, "total_steps": 10853, "loss": 0.1356, "learning_rate": 2.3637084636128836e-06, "epoch": 0.5414843138158197, "percentage": 54.15, "elapsed_time": "18:32:50", "remaining_time": "15:42:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5878, "total_steps": 10853, "loss": 0.1328, "learning_rate": 2.3629478199333873e-06, "epoch": 0.5415764499930897, "percentage": 54.16, "elapsed_time": "18:33:01", "remaining_time": "15:42:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5879, "total_steps": 10853, "loss": 0.1368, "learning_rate": 2.362187188979202e-06, "epoch": 0.5416685861703598, "percentage": 54.17, "elapsed_time": "18:33:13", "remaining_time": "15:41:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5880, "total_steps": 10853, "loss": 0.1324, "learning_rate": 2.3614265708209503e-06, "epoch": 0.5417607223476298, "percentage": 54.18, "elapsed_time": "18:33:24", "remaining_time": "15:41:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5881, "total_steps": 10853, "loss": 0.1336, "learning_rate": 2.360665965529256e-06, "epoch": 0.5418528585248998, "percentage": 54.19, "elapsed_time": "18:33:35", "remaining_time": "15:41:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5882, "total_steps": 10853, "loss": 0.1396, "learning_rate": 2.3599053731747424e-06, "epoch": 0.5419449947021698, "percentage": 54.2, "elapsed_time": "18:33:44", "remaining_time": "15:41:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5883, "total_steps": 10853, "loss": 0.1349, "learning_rate": 2.3591447938280304e-06, "epoch": 0.5420371308794398, "percentage": 54.21, "elapsed_time": "18:33:56", "remaining_time": "15:41:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5884, "total_steps": 10853, "loss": 0.1362, "learning_rate": 2.3583842275597382e-06, "epoch": 0.5421292670567098, "percentage": 54.22, "elapsed_time": "18:34:06", "remaining_time": "15:40:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5885, "total_steps": 10853, "loss": 0.1383, "learning_rate": 2.3576236744404866e-06, "epoch": 0.5422214032339798, "percentage": 54.22, "elapsed_time": "18:34:16", "remaining_time": "15:40:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5886, "total_steps": 10853, "loss": 0.1326, "learning_rate": 2.3568631345408912e-06, "epoch": 0.5423135394112498, "percentage": 54.23, "elapsed_time": "18:34:27", "remaining_time": "15:40:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5887, "total_steps": 10853, "loss": 0.1271, "learning_rate": 2.3561026079315707e-06, "epoch": 0.5424056755885198, "percentage": 54.24, "elapsed_time": "18:34:36", "remaining_time": "15:40:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5888, "total_steps": 10853, "loss": 0.159, "learning_rate": 2.3553420946831377e-06, "epoch": 0.5424978117657898, "percentage": 54.25, "elapsed_time": "18:34:47", "remaining_time": "15:40:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5889, "total_steps": 10853, "loss": 0.1246, "learning_rate": 2.3545815948662066e-06, "epoch": 0.5425899479430598, "percentage": 54.26, "elapsed_time": "18:34:58", "remaining_time": "15:39:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5890, "total_steps": 10853, "loss": 0.1258, "learning_rate": 2.3538211085513902e-06, "epoch": 0.5426820841203298, "percentage": 54.27, "elapsed_time": "18:35:09", "remaining_time": "15:39:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5891, "total_steps": 10853, "loss": 0.1336, "learning_rate": 2.3530606358093e-06, "epoch": 0.5427742202975998, "percentage": 54.28, "elapsed_time": "18:35:19", "remaining_time": "15:39:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5892, "total_steps": 10853, "loss": 0.1367, "learning_rate": 2.352300176710545e-06, "epoch": 0.5428663564748698, "percentage": 54.29, "elapsed_time": "18:35:29", "remaining_time": "15:39:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5893, "total_steps": 10853, "loss": 0.1397, "learning_rate": 2.351539731325735e-06, "epoch": 0.5429584926521399, "percentage": 54.3, "elapsed_time": "18:35:41", "remaining_time": "15:39:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5894, "total_steps": 10853, "loss": 0.1364, "learning_rate": 2.350779299725476e-06, "epoch": 0.5430506288294099, "percentage": 54.31, "elapsed_time": "18:35:51", "remaining_time": "15:38:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5895, "total_steps": 10853, "loss": 0.1488, "learning_rate": 2.3500188819803764e-06, "epoch": 0.5431427650066799, "percentage": 54.32, "elapsed_time": "18:36:02", "remaining_time": "15:38:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5896, "total_steps": 10853, "loss": 0.1199, "learning_rate": 2.3492584781610392e-06, "epoch": 0.5432349011839499, "percentage": 54.33, "elapsed_time": "18:36:12", "remaining_time": "15:38:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5897, "total_steps": 10853, "loss": 0.1389, "learning_rate": 2.3484980883380677e-06, "epoch": 0.5433270373612199, "percentage": 54.34, "elapsed_time": "18:36:22", "remaining_time": "15:38:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5898, "total_steps": 10853, "loss": 0.1288, "learning_rate": 2.347737712582066e-06, "epoch": 0.5434191735384899, "percentage": 54.34, "elapsed_time": "18:36:34", "remaining_time": "15:38:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5899, "total_steps": 10853, "loss": 0.1253, "learning_rate": 2.3469773509636346e-06, "epoch": 0.5435113097157599, "percentage": 54.35, "elapsed_time": "18:36:44", "remaining_time": "15:37:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5900, "total_steps": 10853, "loss": 0.1383, "learning_rate": 2.3462170035533713e-06, "epoch": 0.5436034458930299, "percentage": 54.36, "elapsed_time": "18:36:55", "remaining_time": "15:37:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5901, "total_steps": 10853, "loss": 0.1444, "learning_rate": 2.345456670421876e-06, "epoch": 0.5436955820702999, "percentage": 54.37, "elapsed_time": "18:37:06", "remaining_time": "15:37:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5902, "total_steps": 10853, "loss": 0.1432, "learning_rate": 2.3446963516397455e-06, "epoch": 0.5437877182475699, "percentage": 54.38, "elapsed_time": "18:37:17", "remaining_time": "15:37:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5903, "total_steps": 10853, "loss": 0.1398, "learning_rate": 2.3439360472775758e-06, "epoch": 0.5438798544248399, "percentage": 54.39, "elapsed_time": "18:37:27", "remaining_time": "15:37:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5904, "total_steps": 10853, "loss": 0.1324, "learning_rate": 2.3431757574059616e-06, "epoch": 0.5439719906021099, "percentage": 54.4, "elapsed_time": "18:37:38", "remaining_time": "15:36:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5905, "total_steps": 10853, "loss": 0.1322, "learning_rate": 2.342415482095494e-06, "epoch": 0.5440641267793799, "percentage": 54.41, "elapsed_time": "18:37:49", "remaining_time": "15:36:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5906, "total_steps": 10853, "loss": 0.1367, "learning_rate": 2.341655221416766e-06, "epoch": 0.54415626295665, "percentage": 54.42, "elapsed_time": "18:38:00", "remaining_time": "15:36:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5907, "total_steps": 10853, "loss": 0.1257, "learning_rate": 2.3408949754403678e-06, "epoch": 0.54424839913392, "percentage": 54.43, "elapsed_time": "18:38:10", "remaining_time": "15:36:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5908, "total_steps": 10853, "loss": 0.1194, "learning_rate": 2.340134744236889e-06, "epoch": 0.54434053531119, "percentage": 54.44, "elapsed_time": "18:38:21", "remaining_time": "15:36:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5909, "total_steps": 10853, "loss": 0.1393, "learning_rate": 2.3393745278769163e-06, "epoch": 0.54443267148846, "percentage": 54.45, "elapsed_time": "18:38:32", "remaining_time": "15:35:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5910, "total_steps": 10853, "loss": 0.1338, "learning_rate": 2.3386143264310348e-06, "epoch": 0.54452480766573, "percentage": 54.45, "elapsed_time": "18:38:43", "remaining_time": "15:35:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5911, "total_steps": 10853, "loss": 0.1367, "learning_rate": 2.3378541399698314e-06, "epoch": 0.544616943843, "percentage": 54.46, "elapsed_time": "18:38:53", "remaining_time": "15:35:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5912, "total_steps": 10853, "loss": 0.1267, "learning_rate": 2.337093968563889e-06, "epoch": 0.54470908002027, "percentage": 54.47, "elapsed_time": "18:39:04", "remaining_time": "15:35:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5913, "total_steps": 10853, "loss": 0.1214, "learning_rate": 2.336333812283788e-06, "epoch": 0.54480121619754, "percentage": 54.48, "elapsed_time": "18:39:14", "remaining_time": "15:35:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5914, "total_steps": 10853, "loss": 0.1425, "learning_rate": 2.3355736712001107e-06, "epoch": 0.54489335237481, "percentage": 54.49, "elapsed_time": "18:39:25", "remaining_time": "15:34:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5915, "total_steps": 10853, "loss": 0.1477, "learning_rate": 2.3348135453834353e-06, "epoch": 0.54498548855208, "percentage": 54.5, "elapsed_time": "18:39:36", "remaining_time": "15:34:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5916, "total_steps": 10853, "loss": 0.1324, "learning_rate": 2.3340534349043407e-06, "epoch": 0.54507762472935, "percentage": 54.51, "elapsed_time": "18:39:47", "remaining_time": "15:34:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5917, "total_steps": 10853, "loss": 0.1348, "learning_rate": 2.3332933398334028e-06, "epoch": 0.54516976090662, "percentage": 54.52, "elapsed_time": "18:39:58", "remaining_time": "15:34:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5918, "total_steps": 10853, "loss": 0.146, "learning_rate": 2.332533260241195e-06, "epoch": 0.54526189708389, "percentage": 54.53, "elapsed_time": "18:40:10", "remaining_time": "15:34:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5919, "total_steps": 10853, "loss": 0.1422, "learning_rate": 2.3317731961982926e-06, "epoch": 0.5453540332611599, "percentage": 54.54, "elapsed_time": "18:40:21", "remaining_time": "15:33:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5920, "total_steps": 10853, "loss": 0.1322, "learning_rate": 2.331013147775268e-06, "epoch": 0.54544616943843, "percentage": 54.55, "elapsed_time": "18:40:33", "remaining_time": "15:33:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5921, "total_steps": 10853, "loss": 0.1514, "learning_rate": 2.3302531150426894e-06, "epoch": 0.5455383056157, "percentage": 54.56, "elapsed_time": "18:40:43", "remaining_time": "15:33:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5922, "total_steps": 10853, "loss": 0.1377, "learning_rate": 2.329493098071128e-06, "epoch": 0.54563044179297, "percentage": 54.57, "elapsed_time": "18:40:54", "remaining_time": "15:33:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5923, "total_steps": 10853, "loss": 0.1292, "learning_rate": 2.32873309693115e-06, "epoch": 0.54572257797024, "percentage": 54.57, "elapsed_time": "18:41:04", "remaining_time": "15:33:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5924, "total_steps": 10853, "loss": 0.1382, "learning_rate": 2.3279731116933235e-06, "epoch": 0.54581471414751, "percentage": 54.58, "elapsed_time": "18:41:17", "remaining_time": "15:32:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5925, "total_steps": 10853, "loss": 0.1412, "learning_rate": 2.327213142428212e-06, "epoch": 0.54590685032478, "percentage": 54.59, "elapsed_time": "18:41:28", "remaining_time": "15:32:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5926, "total_steps": 10853, "loss": 0.137, "learning_rate": 2.326453189206378e-06, "epoch": 0.54599898650205, "percentage": 54.6, "elapsed_time": "18:41:39", "remaining_time": "15:32:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5927, "total_steps": 10853, "loss": 0.1302, "learning_rate": 2.325693252098384e-06, "epoch": 0.54609112267932, "percentage": 54.61, "elapsed_time": "18:41:49", "remaining_time": "15:32:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5928, "total_steps": 10853, "loss": 0.1399, "learning_rate": 2.324933331174792e-06, "epoch": 0.54618325885659, "percentage": 54.62, "elapsed_time": "18:42:00", "remaining_time": "15:32:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5929, "total_steps": 10853, "loss": 0.134, "learning_rate": 2.3241734265061573e-06, "epoch": 0.54627539503386, "percentage": 54.63, "elapsed_time": "18:42:10", "remaining_time": "15:31:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5930, "total_steps": 10853, "loss": 0.137, "learning_rate": 2.323413538163039e-06, "epoch": 0.54636753121113, "percentage": 54.64, "elapsed_time": "18:42:21", "remaining_time": "15:31:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5931, "total_steps": 10853, "loss": 0.1499, "learning_rate": 2.322653666215993e-06, "epoch": 0.5464596673884, "percentage": 54.65, "elapsed_time": "18:42:33", "remaining_time": "15:31:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5932, "total_steps": 10853, "loss": 0.1367, "learning_rate": 2.3218938107355727e-06, "epoch": 0.54655180356567, "percentage": 54.66, "elapsed_time": "18:42:44", "remaining_time": "15:31:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5933, "total_steps": 10853, "loss": 0.1226, "learning_rate": 2.3211339717923326e-06, "epoch": 0.54664393974294, "percentage": 54.67, "elapsed_time": "18:42:52", "remaining_time": "15:31:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5934, "total_steps": 10853, "loss": 0.1346, "learning_rate": 2.320374149456822e-06, "epoch": 0.5467360759202101, "percentage": 54.68, "elapsed_time": "18:43:04", "remaining_time": "15:30:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5935, "total_steps": 10853, "loss": 0.1442, "learning_rate": 2.31961434379959e-06, "epoch": 0.5468282120974801, "percentage": 54.69, "elapsed_time": "18:43:13", "remaining_time": "15:30:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5936, "total_steps": 10853, "loss": 0.1176, "learning_rate": 2.3188545548911863e-06, "epoch": 0.5469203482747501, "percentage": 54.69, "elapsed_time": "18:43:24", "remaining_time": "15:30:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5937, "total_steps": 10853, "loss": 0.1255, "learning_rate": 2.3180947828021574e-06, "epoch": 0.5470124844520201, "percentage": 54.7, "elapsed_time": "18:43:35", "remaining_time": "15:30:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5938, "total_steps": 10853, "loss": 0.1382, "learning_rate": 2.317335027603046e-06, "epoch": 0.5471046206292901, "percentage": 54.71, "elapsed_time": "18:43:46", "remaining_time": "15:30:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5939, "total_steps": 10853, "loss": 0.1218, "learning_rate": 2.3165752893643974e-06, "epoch": 0.5471967568065601, "percentage": 54.72, "elapsed_time": "18:43:56", "remaining_time": "15:29:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5940, "total_steps": 10853, "loss": 0.1274, "learning_rate": 2.315815568156753e-06, "epoch": 0.5472888929838301, "percentage": 54.73, "elapsed_time": "18:44:06", "remaining_time": "15:29:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5941, "total_steps": 10853, "loss": 0.1343, "learning_rate": 2.315055864050654e-06, "epoch": 0.5473810291611001, "percentage": 54.74, "elapsed_time": "18:44:16", "remaining_time": "15:29:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5942, "total_steps": 10853, "loss": 0.1456, "learning_rate": 2.314296177116637e-06, "epoch": 0.5474731653383701, "percentage": 54.75, "elapsed_time": "18:44:28", "remaining_time": "15:29:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5943, "total_steps": 10853, "loss": 0.1229, "learning_rate": 2.3135365074252393e-06, "epoch": 0.5475653015156401, "percentage": 54.76, "elapsed_time": "18:44:38", "remaining_time": "15:29:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5944, "total_steps": 10853, "loss": 0.1517, "learning_rate": 2.3127768550469977e-06, "epoch": 0.5476574376929101, "percentage": 54.77, "elapsed_time": "18:44:50", "remaining_time": "15:28:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5945, "total_steps": 10853, "loss": 0.1409, "learning_rate": 2.3120172200524456e-06, "epoch": 0.5477495738701801, "percentage": 54.78, "elapsed_time": "18:45:00", "remaining_time": "15:28:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5946, "total_steps": 10853, "loss": 0.1375, "learning_rate": 2.311257602512114e-06, "epoch": 0.5478417100474501, "percentage": 54.79, "elapsed_time": "18:45:11", "remaining_time": "15:28:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5947, "total_steps": 10853, "loss": 0.125, "learning_rate": 2.310498002496535e-06, "epoch": 0.5479338462247202, "percentage": 54.8, "elapsed_time": "18:45:22", "remaining_time": "15:28:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5948, "total_steps": 10853, "loss": 0.1362, "learning_rate": 2.309738420076236e-06, "epoch": 0.5480259824019902, "percentage": 54.81, "elapsed_time": "18:45:31", "remaining_time": "15:28:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5949, "total_steps": 10853, "loss": 0.1381, "learning_rate": 2.308978855321746e-06, "epoch": 0.5481181185792602, "percentage": 54.81, "elapsed_time": "18:45:42", "remaining_time": "15:27:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5950, "total_steps": 10853, "loss": 0.1344, "learning_rate": 2.30821930830359e-06, "epoch": 0.5482102547565302, "percentage": 54.82, "elapsed_time": "18:45:52", "remaining_time": "15:27:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5951, "total_steps": 10853, "loss": 0.1391, "learning_rate": 2.307459779092291e-06, "epoch": 0.5483023909338002, "percentage": 54.83, "elapsed_time": "18:46:02", "remaining_time": "15:27:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5952, "total_steps": 10853, "loss": 0.1244, "learning_rate": 2.306700267758373e-06, "epoch": 0.5483945271110702, "percentage": 54.84, "elapsed_time": "18:46:12", "remaining_time": "15:27:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5953, "total_steps": 10853, "loss": 0.1236, "learning_rate": 2.3059407743723562e-06, "epoch": 0.5484866632883402, "percentage": 54.85, "elapsed_time": "18:46:22", "remaining_time": "15:27:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5954, "total_steps": 10853, "loss": 0.1319, "learning_rate": 2.305181299004758e-06, "epoch": 0.5485787994656102, "percentage": 54.86, "elapsed_time": "18:46:32", "remaining_time": "15:26:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5955, "total_steps": 10853, "loss": 0.1375, "learning_rate": 2.304421841726098e-06, "epoch": 0.5486709356428802, "percentage": 54.87, "elapsed_time": "18:46:44", "remaining_time": "15:26:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5956, "total_steps": 10853, "loss": 0.1394, "learning_rate": 2.303662402606891e-06, "epoch": 0.5487630718201502, "percentage": 54.88, "elapsed_time": "18:46:56", "remaining_time": "15:26:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5957, "total_steps": 10853, "loss": 0.1241, "learning_rate": 2.3029029817176513e-06, "epoch": 0.5488552079974202, "percentage": 54.89, "elapsed_time": "18:47:07", "remaining_time": "15:26:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5958, "total_steps": 10853, "loss": 0.1452, "learning_rate": 2.302143579128891e-06, "epoch": 0.5489473441746902, "percentage": 54.9, "elapsed_time": "18:47:19", "remaining_time": "15:26:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5959, "total_steps": 10853, "loss": 0.1393, "learning_rate": 2.30138419491112e-06, "epoch": 0.5490394803519602, "percentage": 54.91, "elapsed_time": "18:47:30", "remaining_time": "15:25:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5960, "total_steps": 10853, "loss": 0.1458, "learning_rate": 2.3006248291348483e-06, "epoch": 0.5491316165292301, "percentage": 54.92, "elapsed_time": "18:47:41", "remaining_time": "15:25:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5961, "total_steps": 10853, "loss": 0.1258, "learning_rate": 2.2998654818705824e-06, "epoch": 0.5492237527065003, "percentage": 54.92, "elapsed_time": "18:47:50", "remaining_time": "15:25:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5962, "total_steps": 10853, "loss": 0.146, "learning_rate": 2.2991061531888285e-06, "epoch": 0.5493158888837703, "percentage": 54.93, "elapsed_time": "18:48:02", "remaining_time": "15:25:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5963, "total_steps": 10853, "loss": 0.1387, "learning_rate": 2.29834684316009e-06, "epoch": 0.5494080250610403, "percentage": 54.94, "elapsed_time": "18:48:13", "remaining_time": "15:25:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5964, "total_steps": 10853, "loss": 0.1313, "learning_rate": 2.297587551854868e-06, "epoch": 0.5495001612383102, "percentage": 54.95, "elapsed_time": "18:48:25", "remaining_time": "15:25:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5965, "total_steps": 10853, "loss": 0.1291, "learning_rate": 2.296828279343664e-06, "epoch": 0.5495922974155802, "percentage": 54.96, "elapsed_time": "18:48:36", "remaining_time": "15:24:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5966, "total_steps": 10853, "loss": 0.1261, "learning_rate": 2.2960690256969774e-06, "epoch": 0.5496844335928502, "percentage": 54.97, "elapsed_time": "18:48:47", "remaining_time": "15:24:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5967, "total_steps": 10853, "loss": 0.15, "learning_rate": 2.2953097909853018e-06, "epoch": 0.5497765697701202, "percentage": 54.98, "elapsed_time": "18:48:59", "remaining_time": "15:24:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5968, "total_steps": 10853, "loss": 0.1263, "learning_rate": 2.294550575279135e-06, "epoch": 0.5498687059473902, "percentage": 54.99, "elapsed_time": "18:49:10", "remaining_time": "15:24:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5969, "total_steps": 10853, "loss": 0.1267, "learning_rate": 2.293791378648969e-06, "epoch": 0.5499608421246602, "percentage": 55.0, "elapsed_time": "18:49:21", "remaining_time": "15:24:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5970, "total_steps": 10853, "loss": 0.1332, "learning_rate": 2.2930322011652965e-06, "epoch": 0.5500529783019302, "percentage": 55.01, "elapsed_time": "18:49:32", "remaining_time": "15:23:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5971, "total_steps": 10853, "loss": 0.1323, "learning_rate": 2.2922730428986057e-06, "epoch": 0.5501451144792002, "percentage": 55.02, "elapsed_time": "18:49:41", "remaining_time": "15:23:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5972, "total_steps": 10853, "loss": 0.1587, "learning_rate": 2.291513903919385e-06, "epoch": 0.5502372506564702, "percentage": 55.03, "elapsed_time": "18:49:52", "remaining_time": "15:23:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5973, "total_steps": 10853, "loss": 0.1322, "learning_rate": 2.2907547842981213e-06, "epoch": 0.5503293868337402, "percentage": 55.04, "elapsed_time": "18:50:03", "remaining_time": "15:23:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5974, "total_steps": 10853, "loss": 0.1416, "learning_rate": 2.289995684105299e-06, "epoch": 0.5504215230110103, "percentage": 55.04, "elapsed_time": "18:50:15", "remaining_time": "15:23:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5975, "total_steps": 10853, "loss": 0.1305, "learning_rate": 2.2892366034113988e-06, "epoch": 0.5505136591882803, "percentage": 55.05, "elapsed_time": "18:50:26", "remaining_time": "15:22:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5976, "total_steps": 10853, "loss": 0.1392, "learning_rate": 2.288477542286903e-06, "epoch": 0.5506057953655503, "percentage": 55.06, "elapsed_time": "18:50:36", "remaining_time": "15:22:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5977, "total_steps": 10853, "loss": 0.143, "learning_rate": 2.2877185008022896e-06, "epoch": 0.5506979315428203, "percentage": 55.07, "elapsed_time": "18:50:48", "remaining_time": "15:22:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5978, "total_steps": 10853, "loss": 0.1456, "learning_rate": 2.2869594790280376e-06, "epoch": 0.5507900677200903, "percentage": 55.08, "elapsed_time": "18:50:58", "remaining_time": "15:22:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5979, "total_steps": 10853, "loss": 0.1407, "learning_rate": 2.2862004770346205e-06, "epoch": 0.5508822038973603, "percentage": 55.09, "elapsed_time": "18:51:09", "remaining_time": "15:22:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5980, "total_steps": 10853, "loss": 0.1245, "learning_rate": 2.285441494892511e-06, "epoch": 0.5509743400746303, "percentage": 55.1, "elapsed_time": "18:51:19", "remaining_time": "15:21:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5981, "total_steps": 10853, "loss": 0.1445, "learning_rate": 2.284682532672183e-06, "epoch": 0.5510664762519003, "percentage": 55.11, "elapsed_time": "18:51:30", "remaining_time": "15:21:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5982, "total_steps": 10853, "loss": 0.1344, "learning_rate": 2.2839235904441054e-06, "epoch": 0.5511586124291703, "percentage": 55.12, "elapsed_time": "18:51:40", "remaining_time": "15:21:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5983, "total_steps": 10853, "loss": 0.1343, "learning_rate": 2.2831646682787443e-06, "epoch": 0.5512507486064403, "percentage": 55.13, "elapsed_time": "18:51:51", "remaining_time": "15:21:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5984, "total_steps": 10853, "loss": 0.1287, "learning_rate": 2.282405766246568e-06, "epoch": 0.5513428847837103, "percentage": 55.14, "elapsed_time": "18:52:02", "remaining_time": "15:21:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5985, "total_steps": 10853, "loss": 0.1135, "learning_rate": 2.281646884418039e-06, "epoch": 0.5514350209609803, "percentage": 55.15, "elapsed_time": "18:52:12", "remaining_time": "15:20:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5986, "total_steps": 10853, "loss": 0.1405, "learning_rate": 2.280888022863621e-06, "epoch": 0.5515271571382503, "percentage": 55.16, "elapsed_time": "18:52:22", "remaining_time": "15:20:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5987, "total_steps": 10853, "loss": 0.1265, "learning_rate": 2.2801291816537738e-06, "epoch": 0.5516192933155203, "percentage": 55.16, "elapsed_time": "18:52:33", "remaining_time": "15:20:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5988, "total_steps": 10853, "loss": 0.1432, "learning_rate": 2.2793703608589547e-06, "epoch": 0.5517114294927904, "percentage": 55.17, "elapsed_time": "18:52:45", "remaining_time": "15:20:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5989, "total_steps": 10853, "loss": 0.1372, "learning_rate": 2.2786115605496224e-06, "epoch": 0.5518035656700604, "percentage": 55.18, "elapsed_time": "18:52:57", "remaining_time": "15:20:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5990, "total_steps": 10853, "loss": 0.1289, "learning_rate": 2.2778527807962297e-06, "epoch": 0.5518957018473304, "percentage": 55.19, "elapsed_time": "18:53:08", "remaining_time": "15:19:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5991, "total_steps": 10853, "loss": 0.1451, "learning_rate": 2.277094021669231e-06, "epoch": 0.5519878380246004, "percentage": 55.2, "elapsed_time": "18:53:19", "remaining_time": "15:19:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5992, "total_steps": 10853, "loss": 0.1209, "learning_rate": 2.2763352832390762e-06, "epoch": 0.5520799742018704, "percentage": 55.21, "elapsed_time": "18:53:30", "remaining_time": "15:19:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5993, "total_steps": 10853, "loss": 0.1273, "learning_rate": 2.2755765655762135e-06, "epoch": 0.5521721103791404, "percentage": 55.22, "elapsed_time": "18:53:42", "remaining_time": "15:19:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5994, "total_steps": 10853, "loss": 0.1426, "learning_rate": 2.2748178687510915e-06, "epoch": 0.5522642465564104, "percentage": 55.23, "elapsed_time": "18:53:53", "remaining_time": "15:19:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5995, "total_steps": 10853, "loss": 0.1335, "learning_rate": 2.2740591928341552e-06, "epoch": 0.5523563827336804, "percentage": 55.24, "elapsed_time": "18:54:03", "remaining_time": "15:18:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5996, "total_steps": 10853, "loss": 0.1343, "learning_rate": 2.2733005378958462e-06, "epoch": 0.5524485189109504, "percentage": 55.25, "elapsed_time": "18:54:14", "remaining_time": "15:18:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5997, "total_steps": 10853, "loss": 0.1346, "learning_rate": 2.2725419040066075e-06, "epoch": 0.5525406550882204, "percentage": 55.26, "elapsed_time": "18:54:25", "remaining_time": "15:18:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5998, "total_steps": 10853, "loss": 0.133, "learning_rate": 2.2717832912368766e-06, "epoch": 0.5526327912654904, "percentage": 55.27, "elapsed_time": "18:54:35", "remaining_time": "15:18:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5999, "total_steps": 10853, "loss": 0.1397, "learning_rate": 2.271024699657093e-06, "epoch": 0.5527249274427604, "percentage": 55.28, "elapsed_time": "18:54:46", "remaining_time": "15:18:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6000, "total_steps": 10853, "loss": 0.1195, "learning_rate": 2.2702661293376895e-06, "epoch": 0.5528170636200304, "percentage": 55.28, "elapsed_time": "18:54:56", "remaining_time": "15:17:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6000, "total_steps": 10853, "eval_loss": 0.13545145094394684, "epoch": 0.5528170636200304, "percentage": 55.28, "elapsed_time": "18:59:56", "remaining_time": "15:22:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6001, "total_steps": 10853, "loss": 0.1426, "learning_rate": 2.269507580349101e-06, "epoch": 0.5529091997973004, "percentage": 55.29, "elapsed_time": "19:00:08", "remaining_time": "15:21:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6002, "total_steps": 10853, "loss": 0.1308, "learning_rate": 2.2687490527617575e-06, "epoch": 0.5530013359745705, "percentage": 55.3, "elapsed_time": "19:00:19", "remaining_time": "15:21:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6003, "total_steps": 10853, "loss": 0.1319, "learning_rate": 2.2679905466460917e-06, "epoch": 0.5530934721518405, "percentage": 55.31, "elapsed_time": "19:00:29", "remaining_time": "15:21:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6004, "total_steps": 10853, "loss": 0.143, "learning_rate": 2.2672320620725265e-06, "epoch": 0.5531856083291105, "percentage": 55.32, "elapsed_time": "19:00:40", "remaining_time": "15:21:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6005, "total_steps": 10853, "loss": 0.1325, "learning_rate": 2.2664735991114893e-06, "epoch": 0.5532777445063805, "percentage": 55.33, "elapsed_time": "19:00:51", "remaining_time": "15:21:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6006, "total_steps": 10853, "loss": 0.131, "learning_rate": 2.2657151578334046e-06, "epoch": 0.5533698806836505, "percentage": 55.34, "elapsed_time": "19:01:03", "remaining_time": "15:20:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6007, "total_steps": 10853, "loss": 0.1286, "learning_rate": 2.264956738308693e-06, "epoch": 0.5534620168609204, "percentage": 55.35, "elapsed_time": "19:01:13", "remaining_time": "15:20:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6008, "total_steps": 10853, "loss": 0.1287, "learning_rate": 2.2641983406077726e-06, "epoch": 0.5535541530381904, "percentage": 55.36, "elapsed_time": "19:01:23", "remaining_time": "15:20:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6009, "total_steps": 10853, "loss": 0.1358, "learning_rate": 2.2634399648010623e-06, "epoch": 0.5536462892154604, "percentage": 55.37, "elapsed_time": "19:01:33", "remaining_time": "15:20:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6010, "total_steps": 10853, "loss": 0.1461, "learning_rate": 2.262681610958976e-06, "epoch": 0.5537384253927304, "percentage": 55.38, "elapsed_time": "19:01:45", "remaining_time": "15:20:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6011, "total_steps": 10853, "loss": 0.1358, "learning_rate": 2.2619232791519287e-06, "epoch": 0.5538305615700004, "percentage": 55.39, "elapsed_time": "19:01:55", "remaining_time": "15:19:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6012, "total_steps": 10853, "loss": 0.1298, "learning_rate": 2.26116496945033e-06, "epoch": 0.5539226977472704, "percentage": 55.39, "elapsed_time": "19:02:06", "remaining_time": "15:19:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6013, "total_steps": 10853, "loss": 0.1398, "learning_rate": 2.260406681924589e-06, "epoch": 0.5540148339245404, "percentage": 55.4, "elapsed_time": "19:02:16", "remaining_time": "15:19:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6014, "total_steps": 10853, "loss": 0.1393, "learning_rate": 2.2596484166451136e-06, "epoch": 0.5541069701018104, "percentage": 55.41, "elapsed_time": "19:02:26", "remaining_time": "15:19:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6015, "total_steps": 10853, "loss": 0.1195, "learning_rate": 2.2588901736823087e-06, "epoch": 0.5541991062790805, "percentage": 55.42, "elapsed_time": "19:02:36", "remaining_time": "15:19:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6016, "total_steps": 10853, "loss": 0.1411, "learning_rate": 2.2581319531065777e-06, "epoch": 0.5542912424563505, "percentage": 55.43, "elapsed_time": "19:02:47", "remaining_time": "15:18:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6017, "total_steps": 10853, "loss": 0.1265, "learning_rate": 2.257373754988321e-06, "epoch": 0.5543833786336205, "percentage": 55.44, "elapsed_time": "19:02:58", "remaining_time": "15:18:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6018, "total_steps": 10853, "loss": 0.1339, "learning_rate": 2.256615579397936e-06, "epoch": 0.5544755148108905, "percentage": 55.45, "elapsed_time": "19:03:09", "remaining_time": "15:18:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6019, "total_steps": 10853, "loss": 0.145, "learning_rate": 2.2558574264058218e-06, "epoch": 0.5545676509881605, "percentage": 55.46, "elapsed_time": "19:03:20", "remaining_time": "15:18:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6020, "total_steps": 10853, "loss": 0.1253, "learning_rate": 2.255099296082372e-06, "epoch": 0.5546597871654305, "percentage": 55.47, "elapsed_time": "19:03:30", "remaining_time": "15:18:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6021, "total_steps": 10853, "loss": 0.131, "learning_rate": 2.2543411884979775e-06, "epoch": 0.5547519233427005, "percentage": 55.48, "elapsed_time": "19:03:41", "remaining_time": "15:17:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6022, "total_steps": 10853, "loss": 0.129, "learning_rate": 2.2535831037230313e-06, "epoch": 0.5548440595199705, "percentage": 55.49, "elapsed_time": "19:03:51", "remaining_time": "15:17:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6023, "total_steps": 10853, "loss": 0.1421, "learning_rate": 2.2528250418279196e-06, "epoch": 0.5549361956972405, "percentage": 55.5, "elapsed_time": "19:04:02", "remaining_time": "15:17:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6024, "total_steps": 10853, "loss": 0.1337, "learning_rate": 2.2520670028830305e-06, "epoch": 0.5550283318745105, "percentage": 55.51, "elapsed_time": "19:04:12", "remaining_time": "15:17:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6025, "total_steps": 10853, "loss": 0.1342, "learning_rate": 2.251308986958746e-06, "epoch": 0.5551204680517805, "percentage": 55.51, "elapsed_time": "19:04:23", "remaining_time": "15:17:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6026, "total_steps": 10853, "loss": 0.1377, "learning_rate": 2.250550994125449e-06, "epoch": 0.5552126042290505, "percentage": 55.52, "elapsed_time": "19:04:34", "remaining_time": "15:16:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6027, "total_steps": 10853, "loss": 0.1243, "learning_rate": 2.249793024453519e-06, "epoch": 0.5553047404063205, "percentage": 55.53, "elapsed_time": "19:04:43", "remaining_time": "15:16:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6028, "total_steps": 10853, "loss": 0.1447, "learning_rate": 2.2490350780133344e-06, "epoch": 0.5553968765835905, "percentage": 55.54, "elapsed_time": "19:04:53", "remaining_time": "15:16:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6029, "total_steps": 10853, "loss": 0.137, "learning_rate": 2.2482771548752684e-06, "epoch": 0.5554890127608606, "percentage": 55.55, "elapsed_time": "19:05:06", "remaining_time": "15:16:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6030, "total_steps": 10853, "loss": 0.1369, "learning_rate": 2.247519255109697e-06, "epoch": 0.5555811489381306, "percentage": 55.56, "elapsed_time": "19:05:16", "remaining_time": "15:16:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6031, "total_steps": 10853, "loss": 0.1387, "learning_rate": 2.2467613787869886e-06, "epoch": 0.5556732851154006, "percentage": 55.57, "elapsed_time": "19:05:26", "remaining_time": "15:15:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6032, "total_steps": 10853, "loss": 0.1373, "learning_rate": 2.2460035259775147e-06, "epoch": 0.5557654212926706, "percentage": 55.58, "elapsed_time": "19:05:38", "remaining_time": "15:15:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6033, "total_steps": 10853, "loss": 0.1349, "learning_rate": 2.2452456967516404e-06, "epoch": 0.5558575574699406, "percentage": 55.59, "elapsed_time": "19:05:48", "remaining_time": "15:15:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6034, "total_steps": 10853, "loss": 0.1378, "learning_rate": 2.2444878911797295e-06, "epoch": 0.5559496936472106, "percentage": 55.6, "elapsed_time": "19:05:59", "remaining_time": "15:15:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6035, "total_steps": 10853, "loss": 0.149, "learning_rate": 2.2437301093321467e-06, "epoch": 0.5560418298244806, "percentage": 55.61, "elapsed_time": "19:06:10", "remaining_time": "15:15:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6036, "total_steps": 10853, "loss": 0.133, "learning_rate": 2.242972351279251e-06, "epoch": 0.5561339660017506, "percentage": 55.62, "elapsed_time": "19:06:20", "remaining_time": "15:14:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6037, "total_steps": 10853, "loss": 0.1269, "learning_rate": 2.242214617091399e-06, "epoch": 0.5562261021790206, "percentage": 55.63, "elapsed_time": "19:06:31", "remaining_time": "15:14:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6038, "total_steps": 10853, "loss": 0.1248, "learning_rate": 2.241456906838948e-06, "epoch": 0.5563182383562906, "percentage": 55.63, "elapsed_time": "19:06:42", "remaining_time": "15:14:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6039, "total_steps": 10853, "loss": 0.1332, "learning_rate": 2.2406992205922506e-06, "epoch": 0.5564103745335606, "percentage": 55.64, "elapsed_time": "19:06:52", "remaining_time": "15:14:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6040, "total_steps": 10853, "loss": 0.1199, "learning_rate": 2.2399415584216595e-06, "epoch": 0.5565025107108306, "percentage": 55.65, "elapsed_time": "19:07:02", "remaining_time": "15:14:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6041, "total_steps": 10853, "loss": 0.1291, "learning_rate": 2.2391839203975225e-06, "epoch": 0.5565946468881006, "percentage": 55.66, "elapsed_time": "19:07:12", "remaining_time": "15:13:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6042, "total_steps": 10853, "loss": 0.1504, "learning_rate": 2.238426306590186e-06, "epoch": 0.5566867830653707, "percentage": 55.67, "elapsed_time": "19:07:23", "remaining_time": "15:13:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6043, "total_steps": 10853, "loss": 0.1338, "learning_rate": 2.237668717069995e-06, "epoch": 0.5567789192426407, "percentage": 55.68, "elapsed_time": "19:07:35", "remaining_time": "15:13:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6044, "total_steps": 10853, "loss": 0.1402, "learning_rate": 2.2369111519072917e-06, "epoch": 0.5568710554199107, "percentage": 55.69, "elapsed_time": "19:07:45", "remaining_time": "15:13:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6045, "total_steps": 10853, "loss": 0.1285, "learning_rate": 2.2361536111724176e-06, "epoch": 0.5569631915971807, "percentage": 55.7, "elapsed_time": "19:07:56", "remaining_time": "15:13:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6046, "total_steps": 10853, "loss": 0.1327, "learning_rate": 2.2353960949357082e-06, "epoch": 0.5570553277744507, "percentage": 55.71, "elapsed_time": "19:08:06", "remaining_time": "15:12:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6047, "total_steps": 10853, "loss": 0.137, "learning_rate": 2.2346386032674995e-06, "epoch": 0.5571474639517207, "percentage": 55.72, "elapsed_time": "19:08:16", "remaining_time": "15:12:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6048, "total_steps": 10853, "loss": 0.1324, "learning_rate": 2.2338811362381256e-06, "epoch": 0.5572396001289907, "percentage": 55.73, "elapsed_time": "19:08:26", "remaining_time": "15:12:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6049, "total_steps": 10853, "loss": 0.1322, "learning_rate": 2.233123693917917e-06, "epoch": 0.5573317363062606, "percentage": 55.74, "elapsed_time": "19:08:37", "remaining_time": "15:12:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6050, "total_steps": 10853, "loss": 0.1258, "learning_rate": 2.232366276377201e-06, "epoch": 0.5574238724835306, "percentage": 55.74, "elapsed_time": "19:08:49", "remaining_time": "15:12:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6051, "total_steps": 10853, "loss": 0.1243, "learning_rate": 2.2316088836863064e-06, "epoch": 0.5575160086608006, "percentage": 55.75, "elapsed_time": "19:09:01", "remaining_time": "15:11:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6052, "total_steps": 10853, "loss": 0.1417, "learning_rate": 2.2308515159155546e-06, "epoch": 0.5576081448380706, "percentage": 55.76, "elapsed_time": "19:09:12", "remaining_time": "15:11:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6053, "total_steps": 10853, "loss": 0.1259, "learning_rate": 2.23009417313527e-06, "epoch": 0.5577002810153406, "percentage": 55.77, "elapsed_time": "19:09:24", "remaining_time": "15:11:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6054, "total_steps": 10853, "loss": 0.1311, "learning_rate": 2.2293368554157695e-06, "epoch": 0.5577924171926106, "percentage": 55.78, "elapsed_time": "19:09:36", "remaining_time": "15:11:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6055, "total_steps": 10853, "loss": 0.1452, "learning_rate": 2.228579562827371e-06, "epoch": 0.5578845533698806, "percentage": 55.79, "elapsed_time": "19:09:48", "remaining_time": "15:11:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6056, "total_steps": 10853, "loss": 0.1345, "learning_rate": 2.2278222954403895e-06, "epoch": 0.5579766895471507, "percentage": 55.8, "elapsed_time": "19:09:59", "remaining_time": "15:10:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6057, "total_steps": 10853, "loss": 0.1531, "learning_rate": 2.2270650533251383e-06, "epoch": 0.5580688257244207, "percentage": 55.81, "elapsed_time": "19:10:09", "remaining_time": "15:10:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6058, "total_steps": 10853, "loss": 0.1315, "learning_rate": 2.2263078365519244e-06, "epoch": 0.5581609619016907, "percentage": 55.82, "elapsed_time": "19:10:20", "remaining_time": "15:10:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6059, "total_steps": 10853, "loss": 0.1389, "learning_rate": 2.2255506451910584e-06, "epoch": 0.5582530980789607, "percentage": 55.83, "elapsed_time": "19:10:30", "remaining_time": "15:10:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6060, "total_steps": 10853, "loss": 0.1507, "learning_rate": 2.2247934793128436e-06, "epoch": 0.5583452342562307, "percentage": 55.84, "elapsed_time": "19:10:41", "remaining_time": "15:10:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6061, "total_steps": 10853, "loss": 0.1416, "learning_rate": 2.224036338987585e-06, "epoch": 0.5584373704335007, "percentage": 55.85, "elapsed_time": "19:10:50", "remaining_time": "15:09:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6062, "total_steps": 10853, "loss": 0.1465, "learning_rate": 2.223279224285582e-06, "epoch": 0.5585295066107707, "percentage": 55.86, "elapsed_time": "19:11:01", "remaining_time": "15:09:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6063, "total_steps": 10853, "loss": 0.1333, "learning_rate": 2.2225221352771316e-06, "epoch": 0.5586216427880407, "percentage": 55.86, "elapsed_time": "19:11:13", "remaining_time": "15:09:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6064, "total_steps": 10853, "loss": 0.1354, "learning_rate": 2.221765072032532e-06, "epoch": 0.5587137789653107, "percentage": 55.87, "elapsed_time": "19:11:22", "remaining_time": "15:09:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6065, "total_steps": 10853, "loss": 0.1495, "learning_rate": 2.2210080346220755e-06, "epoch": 0.5588059151425807, "percentage": 55.88, "elapsed_time": "19:11:34", "remaining_time": "15:09:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6066, "total_steps": 10853, "loss": 0.1395, "learning_rate": 2.220251023116052e-06, "epoch": 0.5588980513198507, "percentage": 55.89, "elapsed_time": "19:11:46", "remaining_time": "15:08:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6067, "total_steps": 10853, "loss": 0.1491, "learning_rate": 2.2194940375847517e-06, "epoch": 0.5589901874971207, "percentage": 55.9, "elapsed_time": "19:11:58", "remaining_time": "15:08:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6068, "total_steps": 10853, "loss": 0.1489, "learning_rate": 2.2187370780984596e-06, "epoch": 0.5590823236743907, "percentage": 55.91, "elapsed_time": "19:12:09", "remaining_time": "15:08:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6069, "total_steps": 10853, "loss": 0.1385, "learning_rate": 2.2179801447274613e-06, "epoch": 0.5591744598516608, "percentage": 55.92, "elapsed_time": "19:12:20", "remaining_time": "15:08:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6070, "total_steps": 10853, "loss": 0.1235, "learning_rate": 2.217223237542036e-06, "epoch": 0.5592665960289308, "percentage": 55.93, "elapsed_time": "19:12:31", "remaining_time": "15:08:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6071, "total_steps": 10853, "loss": 0.1376, "learning_rate": 2.2164663566124635e-06, "epoch": 0.5593587322062008, "percentage": 55.94, "elapsed_time": "19:12:42", "remaining_time": "15:07:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6072, "total_steps": 10853, "loss": 0.1316, "learning_rate": 2.2157095020090207e-06, "epoch": 0.5594508683834708, "percentage": 55.95, "elapsed_time": "19:12:53", "remaining_time": "15:07:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6073, "total_steps": 10853, "loss": 0.1233, "learning_rate": 2.2149526738019802e-06, "epoch": 0.5595430045607408, "percentage": 55.96, "elapsed_time": "19:13:04", "remaining_time": "15:07:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6074, "total_steps": 10853, "loss": 0.1279, "learning_rate": 2.2141958720616163e-06, "epoch": 0.5596351407380108, "percentage": 55.97, "elapsed_time": "19:13:12", "remaining_time": "15:07:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6075, "total_steps": 10853, "loss": 0.1243, "learning_rate": 2.2134390968581958e-06, "epoch": 0.5597272769152808, "percentage": 55.98, "elapsed_time": "19:13:23", "remaining_time": "15:07:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6076, "total_steps": 10853, "loss": 0.1242, "learning_rate": 2.212682348261985e-06, "epoch": 0.5598194130925508, "percentage": 55.98, "elapsed_time": "19:13:34", "remaining_time": "15:06:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6077, "total_steps": 10853, "loss": 0.1336, "learning_rate": 2.21192562634325e-06, "epoch": 0.5599115492698208, "percentage": 55.99, "elapsed_time": "19:13:45", "remaining_time": "15:06:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6078, "total_steps": 10853, "loss": 0.1327, "learning_rate": 2.2111689311722524e-06, "epoch": 0.5600036854470908, "percentage": 56.0, "elapsed_time": "19:13:55", "remaining_time": "15:06:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6079, "total_steps": 10853, "loss": 0.1314, "learning_rate": 2.210412262819249e-06, "epoch": 0.5600958216243608, "percentage": 56.01, "elapsed_time": "19:14:06", "remaining_time": "15:06:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6080, "total_steps": 10853, "loss": 0.1288, "learning_rate": 2.209655621354499e-06, "epoch": 0.5601879578016308, "percentage": 56.02, "elapsed_time": "19:14:17", "remaining_time": "15:06:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6081, "total_steps": 10853, "loss": 0.1638, "learning_rate": 2.2088990068482554e-06, "epoch": 0.5602800939789008, "percentage": 56.03, "elapsed_time": "19:14:27", "remaining_time": "15:05:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6082, "total_steps": 10853, "loss": 0.1286, "learning_rate": 2.208142419370771e-06, "epoch": 0.5603722301561708, "percentage": 56.04, "elapsed_time": "19:14:38", "remaining_time": "15:05:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6083, "total_steps": 10853, "loss": 0.1303, "learning_rate": 2.207385858992294e-06, "epoch": 0.5604643663334409, "percentage": 56.05, "elapsed_time": "19:14:48", "remaining_time": "15:05:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6084, "total_steps": 10853, "loss": 0.1278, "learning_rate": 2.206629325783071e-06, "epoch": 0.5605565025107109, "percentage": 56.06, "elapsed_time": "19:14:58", "remaining_time": "15:05:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6085, "total_steps": 10853, "loss": 0.1449, "learning_rate": 2.2058728198133466e-06, "epoch": 0.5606486386879809, "percentage": 56.07, "elapsed_time": "19:15:08", "remaining_time": "15:05:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6086, "total_steps": 10853, "loss": 0.1308, "learning_rate": 2.2051163411533644e-06, "epoch": 0.5607407748652509, "percentage": 56.08, "elapsed_time": "19:15:20", "remaining_time": "15:04:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6087, "total_steps": 10853, "loss": 0.1243, "learning_rate": 2.2043598898733597e-06, "epoch": 0.5608329110425209, "percentage": 56.09, "elapsed_time": "19:15:31", "remaining_time": "15:04:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6088, "total_steps": 10853, "loss": 0.1404, "learning_rate": 2.2036034660435714e-06, "epoch": 0.5609250472197909, "percentage": 56.1, "elapsed_time": "19:15:43", "remaining_time": "15:04:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6089, "total_steps": 10853, "loss": 0.1459, "learning_rate": 2.2028470697342334e-06, "epoch": 0.5610171833970609, "percentage": 56.1, "elapsed_time": "19:15:55", "remaining_time": "15:04:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6090, "total_steps": 10853, "loss": 0.136, "learning_rate": 2.2020907010155775e-06, "epoch": 0.5611093195743309, "percentage": 56.11, "elapsed_time": "19:16:05", "remaining_time": "15:04:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6091, "total_steps": 10853, "loss": 0.1334, "learning_rate": 2.2013343599578314e-06, "epoch": 0.5612014557516009, "percentage": 56.12, "elapsed_time": "19:16:16", "remaining_time": "15:03:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6092, "total_steps": 10853, "loss": 0.1453, "learning_rate": 2.2005780466312224e-06, "epoch": 0.5612935919288708, "percentage": 56.13, "elapsed_time": "19:16:28", "remaining_time": "15:03:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6093, "total_steps": 10853, "loss": 0.118, "learning_rate": 2.1998217611059733e-06, "epoch": 0.5613857281061408, "percentage": 56.14, "elapsed_time": "19:16:38", "remaining_time": "15:03:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6094, "total_steps": 10853, "loss": 0.1483, "learning_rate": 2.1990655034523073e-06, "epoch": 0.5614778642834108, "percentage": 56.15, "elapsed_time": "19:16:49", "remaining_time": "15:03:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6095, "total_steps": 10853, "loss": 0.1184, "learning_rate": 2.198309273740441e-06, "epoch": 0.5615700004606808, "percentage": 56.16, "elapsed_time": "19:17:00", "remaining_time": "15:03:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6096, "total_steps": 10853, "loss": 0.1316, "learning_rate": 2.1975530720405906e-06, "epoch": 0.5616621366379508, "percentage": 56.17, "elapsed_time": "19:17:12", "remaining_time": "15:03:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6097, "total_steps": 10853, "loss": 0.131, "learning_rate": 2.1967968984229704e-06, "epoch": 0.561754272815221, "percentage": 56.18, "elapsed_time": "19:17:23", "remaining_time": "15:02:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6098, "total_steps": 10853, "loss": 0.1323, "learning_rate": 2.1960407529577917e-06, "epoch": 0.5618464089924909, "percentage": 56.19, "elapsed_time": "19:17:34", "remaining_time": "15:02:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6099, "total_steps": 10853, "loss": 0.1332, "learning_rate": 2.1952846357152603e-06, "epoch": 0.5619385451697609, "percentage": 56.2, "elapsed_time": "19:17:45", "remaining_time": "15:02:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6100, "total_steps": 10853, "loss": 0.1312, "learning_rate": 2.1945285467655843e-06, "epoch": 0.5620306813470309, "percentage": 56.21, "elapsed_time": "19:17:56", "remaining_time": "15:02:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6101, "total_steps": 10853, "loss": 0.1443, "learning_rate": 2.1937724861789645e-06, "epoch": 0.5621228175243009, "percentage": 56.21, "elapsed_time": "19:18:06", "remaining_time": "15:02:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6102, "total_steps": 10853, "loss": 0.1343, "learning_rate": 2.1930164540256035e-06, "epoch": 0.5622149537015709, "percentage": 56.22, "elapsed_time": "19:18:16", "remaining_time": "15:01:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6103, "total_steps": 10853, "loss": 0.1312, "learning_rate": 2.1922604503756977e-06, "epoch": 0.5623070898788409, "percentage": 56.23, "elapsed_time": "19:18:27", "remaining_time": "15:01:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6104, "total_steps": 10853, "loss": 0.1254, "learning_rate": 2.1915044752994417e-06, "epoch": 0.5623992260561109, "percentage": 56.24, "elapsed_time": "19:18:38", "remaining_time": "15:01:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6105, "total_steps": 10853, "loss": 0.1367, "learning_rate": 2.1907485288670288e-06, "epoch": 0.5624913622333809, "percentage": 56.25, "elapsed_time": "19:18:50", "remaining_time": "15:01:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6106, "total_steps": 10853, "loss": 0.1374, "learning_rate": 2.1899926111486473e-06, "epoch": 0.5625834984106509, "percentage": 56.26, "elapsed_time": "19:19:02", "remaining_time": "15:01:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6107, "total_steps": 10853, "loss": 0.1449, "learning_rate": 2.1892367222144863e-06, "epoch": 0.5626756345879209, "percentage": 56.27, "elapsed_time": "19:19:13", "remaining_time": "15:00:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6108, "total_steps": 10853, "loss": 0.1249, "learning_rate": 2.1884808621347288e-06, "epoch": 0.5627677707651909, "percentage": 56.28, "elapsed_time": "19:19:23", "remaining_time": "15:00:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6109, "total_steps": 10853, "loss": 0.1458, "learning_rate": 2.1877250309795565e-06, "epoch": 0.5628599069424609, "percentage": 56.29, "elapsed_time": "19:19:34", "remaining_time": "15:00:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6110, "total_steps": 10853, "loss": 0.1356, "learning_rate": 2.186969228819149e-06, "epoch": 0.562952043119731, "percentage": 56.3, "elapsed_time": "19:19:44", "remaining_time": "15:00:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6111, "total_steps": 10853, "loss": 0.1358, "learning_rate": 2.1862134557236826e-06, "epoch": 0.563044179297001, "percentage": 56.31, "elapsed_time": "19:19:56", "remaining_time": "15:00:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6112, "total_steps": 10853, "loss": 0.1459, "learning_rate": 2.1854577117633297e-06, "epoch": 0.563136315474271, "percentage": 56.32, "elapsed_time": "19:20:07", "remaining_time": "14:59:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6113, "total_steps": 10853, "loss": 0.1366, "learning_rate": 2.1847019970082628e-06, "epoch": 0.563228451651541, "percentage": 56.33, "elapsed_time": "19:20:18", "remaining_time": "14:59:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6114, "total_steps": 10853, "loss": 0.1188, "learning_rate": 2.1839463115286484e-06, "epoch": 0.563320587828811, "percentage": 56.33, "elapsed_time": "19:20:28", "remaining_time": "14:59:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6115, "total_steps": 10853, "loss": 0.1404, "learning_rate": 2.183190655394655e-06, "epoch": 0.563412724006081, "percentage": 56.34, "elapsed_time": "19:20:39", "remaining_time": "14:59:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6116, "total_steps": 10853, "loss": 0.1413, "learning_rate": 2.182435028676442e-06, "epoch": 0.563504860183351, "percentage": 56.35, "elapsed_time": "19:20:49", "remaining_time": "14:59:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6117, "total_steps": 10853, "loss": 0.1234, "learning_rate": 2.1816794314441704e-06, "epoch": 0.563596996360621, "percentage": 56.36, "elapsed_time": "19:21:00", "remaining_time": "14:58:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6118, "total_steps": 10853, "loss": 0.1295, "learning_rate": 2.1809238637679984e-06, "epoch": 0.563689132537891, "percentage": 56.37, "elapsed_time": "19:21:10", "remaining_time": "14:58:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6119, "total_steps": 10853, "loss": 0.1291, "learning_rate": 2.1801683257180807e-06, "epoch": 0.563781268715161, "percentage": 56.38, "elapsed_time": "19:21:20", "remaining_time": "14:58:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6120, "total_steps": 10853, "loss": 0.1305, "learning_rate": 2.179412817364567e-06, "epoch": 0.563873404892431, "percentage": 56.39, "elapsed_time": "19:21:30", "remaining_time": "14:58:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6121, "total_steps": 10853, "loss": 0.1385, "learning_rate": 2.1786573387776085e-06, "epoch": 0.563965541069701, "percentage": 56.4, "elapsed_time": "19:21:42", "remaining_time": "14:58:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6122, "total_steps": 10853, "loss": 0.1284, "learning_rate": 2.17790189002735e-06, "epoch": 0.564057677246971, "percentage": 56.41, "elapsed_time": "19:21:53", "remaining_time": "14:57:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6123, "total_steps": 10853, "loss": 0.1342, "learning_rate": 2.177146471183937e-06, "epoch": 0.564149813424241, "percentage": 56.42, "elapsed_time": "19:22:05", "remaining_time": "14:57:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6124, "total_steps": 10853, "loss": 0.141, "learning_rate": 2.176391082317508e-06, "epoch": 0.5642419496015111, "percentage": 56.43, "elapsed_time": "19:22:16", "remaining_time": "14:57:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6125, "total_steps": 10853, "loss": 0.1378, "learning_rate": 2.175635723498201e-06, "epoch": 0.5643340857787811, "percentage": 56.44, "elapsed_time": "19:22:27", "remaining_time": "14:57:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6126, "total_steps": 10853, "loss": 0.1264, "learning_rate": 2.1748803947961533e-06, "epoch": 0.5644262219560511, "percentage": 56.45, "elapsed_time": "19:22:38", "remaining_time": "14:57:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6127, "total_steps": 10853, "loss": 0.1409, "learning_rate": 2.174125096281496e-06, "epoch": 0.5645183581333211, "percentage": 56.45, "elapsed_time": "19:22:48", "remaining_time": "14:56:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6128, "total_steps": 10853, "loss": 0.1307, "learning_rate": 2.1733698280243578e-06, "epoch": 0.5646104943105911, "percentage": 56.46, "elapsed_time": "19:23:01", "remaining_time": "14:56:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6129, "total_steps": 10853, "loss": 0.1326, "learning_rate": 2.1726145900948664e-06, "epoch": 0.5647026304878611, "percentage": 56.47, "elapsed_time": "19:23:11", "remaining_time": "14:56:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6130, "total_steps": 10853, "loss": 0.1407, "learning_rate": 2.1718593825631454e-06, "epoch": 0.5647947666651311, "percentage": 56.48, "elapsed_time": "19:23:22", "remaining_time": "14:56:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6131, "total_steps": 10853, "loss": 0.144, "learning_rate": 2.1711042054993164e-06, "epoch": 0.5648869028424011, "percentage": 56.49, "elapsed_time": "19:23:34", "remaining_time": "14:56:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6132, "total_steps": 10853, "loss": 0.1406, "learning_rate": 2.1703490589734976e-06, "epoch": 0.5649790390196711, "percentage": 56.5, "elapsed_time": "19:23:44", "remaining_time": "14:55:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6133, "total_steps": 10853, "loss": 0.1337, "learning_rate": 2.1695939430558035e-06, "epoch": 0.5650711751969411, "percentage": 56.51, "elapsed_time": "19:23:56", "remaining_time": "14:55:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6134, "total_steps": 10853, "loss": 0.1334, "learning_rate": 2.1688388578163476e-06, "epoch": 0.565163311374211, "percentage": 56.52, "elapsed_time": "19:24:06", "remaining_time": "14:55:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6135, "total_steps": 10853, "loss": 0.1333, "learning_rate": 2.168083803325239e-06, "epoch": 0.565255447551481, "percentage": 56.53, "elapsed_time": "19:24:17", "remaining_time": "14:55:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6136, "total_steps": 10853, "loss": 0.134, "learning_rate": 2.167328779652586e-06, "epoch": 0.565347583728751, "percentage": 56.54, "elapsed_time": "19:24:27", "remaining_time": "14:55:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6137, "total_steps": 10853, "loss": 0.1385, "learning_rate": 2.166573786868491e-06, "epoch": 0.5654397199060212, "percentage": 56.55, "elapsed_time": "19:24:37", "remaining_time": "14:54:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6138, "total_steps": 10853, "loss": 0.1428, "learning_rate": 2.1658188250430556e-06, "epoch": 0.5655318560832912, "percentage": 56.56, "elapsed_time": "19:24:48", "remaining_time": "14:54:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6139, "total_steps": 10853, "loss": 0.131, "learning_rate": 2.1650638942463785e-06, "epoch": 0.5656239922605611, "percentage": 56.57, "elapsed_time": "19:24:59", "remaining_time": "14:54:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6140, "total_steps": 10853, "loss": 0.1335, "learning_rate": 2.1643089945485555e-06, "epoch": 0.5657161284378311, "percentage": 56.57, "elapsed_time": "19:25:10", "remaining_time": "14:54:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6141, "total_steps": 10853, "loss": 0.143, "learning_rate": 2.163554126019677e-06, "epoch": 0.5658082646151011, "percentage": 56.58, "elapsed_time": "19:25:21", "remaining_time": "14:54:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6142, "total_steps": 10853, "loss": 0.1359, "learning_rate": 2.162799288729835e-06, "epoch": 0.5659004007923711, "percentage": 56.59, "elapsed_time": "19:25:32", "remaining_time": "14:53:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6143, "total_steps": 10853, "loss": 0.142, "learning_rate": 2.162044482749115e-06, "epoch": 0.5659925369696411, "percentage": 56.6, "elapsed_time": "19:25:43", "remaining_time": "14:53:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6144, "total_steps": 10853, "loss": 0.1347, "learning_rate": 2.161289708147602e-06, "epoch": 0.5660846731469111, "percentage": 56.61, "elapsed_time": "19:25:55", "remaining_time": "14:53:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6145, "total_steps": 10853, "loss": 0.1568, "learning_rate": 2.1605349649953756e-06, "epoch": 0.5661768093241811, "percentage": 56.62, "elapsed_time": "19:26:06", "remaining_time": "14:53:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6146, "total_steps": 10853, "loss": 0.126, "learning_rate": 2.1597802533625135e-06, "epoch": 0.5662689455014511, "percentage": 56.63, "elapsed_time": "19:26:17", "remaining_time": "14:53:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6147, "total_steps": 10853, "loss": 0.129, "learning_rate": 2.159025573319092e-06, "epoch": 0.5663610816787211, "percentage": 56.64, "elapsed_time": "19:26:28", "remaining_time": "14:53:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6148, "total_steps": 10853, "loss": 0.1256, "learning_rate": 2.1582709249351834e-06, "epoch": 0.5664532178559911, "percentage": 56.65, "elapsed_time": "19:26:39", "remaining_time": "14:52:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6149, "total_steps": 10853, "loss": 0.1377, "learning_rate": 2.157516308280855e-06, "epoch": 0.5665453540332611, "percentage": 56.66, "elapsed_time": "19:26:49", "remaining_time": "14:52:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6150, "total_steps": 10853, "loss": 0.1191, "learning_rate": 2.156761723426175e-06, "epoch": 0.5666374902105311, "percentage": 56.67, "elapsed_time": "19:27:00", "remaining_time": "14:52:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6151, "total_steps": 10853, "loss": 0.1386, "learning_rate": 2.1560071704412052e-06, "epoch": 0.5667296263878012, "percentage": 56.68, "elapsed_time": "19:27:10", "remaining_time": "14:52:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6152, "total_steps": 10853, "loss": 0.124, "learning_rate": 2.155252649396008e-06, "epoch": 0.5668217625650712, "percentage": 56.68, "elapsed_time": "19:27:21", "remaining_time": "14:52:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6153, "total_steps": 10853, "loss": 0.131, "learning_rate": 2.1544981603606386e-06, "epoch": 0.5669138987423412, "percentage": 56.69, "elapsed_time": "19:27:32", "remaining_time": "14:51:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6154, "total_steps": 10853, "loss": 0.1221, "learning_rate": 2.1537437034051516e-06, "epoch": 0.5670060349196112, "percentage": 56.7, "elapsed_time": "19:27:43", "remaining_time": "14:51:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6155, "total_steps": 10853, "loss": 0.1279, "learning_rate": 2.1529892785995996e-06, "epoch": 0.5670981710968812, "percentage": 56.71, "elapsed_time": "19:27:53", "remaining_time": "14:51:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6156, "total_steps": 10853, "loss": 0.1314, "learning_rate": 2.152234886014031e-06, "epoch": 0.5671903072741512, "percentage": 56.72, "elapsed_time": "19:28:04", "remaining_time": "14:51:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6157, "total_steps": 10853, "loss": 0.1375, "learning_rate": 2.1514805257184894e-06, "epoch": 0.5672824434514212, "percentage": 56.73, "elapsed_time": "19:28:15", "remaining_time": "14:51:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6158, "total_steps": 10853, "loss": 0.1345, "learning_rate": 2.1507261977830198e-06, "epoch": 0.5673745796286912, "percentage": 56.74, "elapsed_time": "19:28:26", "remaining_time": "14:50:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6159, "total_steps": 10853, "loss": 0.1385, "learning_rate": 2.1499719022776588e-06, "epoch": 0.5674667158059612, "percentage": 56.75, "elapsed_time": "19:28:37", "remaining_time": "14:50:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6160, "total_steps": 10853, "loss": 0.1306, "learning_rate": 2.149217639272445e-06, "epoch": 0.5675588519832312, "percentage": 56.76, "elapsed_time": "19:28:47", "remaining_time": "14:50:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6161, "total_steps": 10853, "loss": 0.1327, "learning_rate": 2.1484634088374124e-06, "epoch": 0.5676509881605012, "percentage": 56.77, "elapsed_time": "19:28:57", "remaining_time": "14:50:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6162, "total_steps": 10853, "loss": 0.1435, "learning_rate": 2.1477092110425887e-06, "epoch": 0.5677431243377712, "percentage": 56.78, "elapsed_time": "19:29:08", "remaining_time": "14:50:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6163, "total_steps": 10853, "loss": 0.1493, "learning_rate": 2.1469550459580025e-06, "epoch": 0.5678352605150412, "percentage": 56.79, "elapsed_time": "19:29:19", "remaining_time": "14:49:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6164, "total_steps": 10853, "loss": 0.1302, "learning_rate": 2.1462009136536787e-06, "epoch": 0.5679273966923112, "percentage": 56.8, "elapsed_time": "19:29:31", "remaining_time": "14:49:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6165, "total_steps": 10853, "loss": 0.1317, "learning_rate": 2.145446814199639e-06, "epoch": 0.5680195328695813, "percentage": 56.8, "elapsed_time": "19:29:40", "remaining_time": "14:49:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6166, "total_steps": 10853, "loss": 0.1398, "learning_rate": 2.1446927476658996e-06, "epoch": 0.5681116690468513, "percentage": 56.81, "elapsed_time": "19:29:50", "remaining_time": "14:49:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6167, "total_steps": 10853, "loss": 0.1232, "learning_rate": 2.1439387141224775e-06, "epoch": 0.5682038052241213, "percentage": 56.82, "elapsed_time": "19:30:00", "remaining_time": "14:49:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6168, "total_steps": 10853, "loss": 0.1311, "learning_rate": 2.1431847136393832e-06, "epoch": 0.5682959414013913, "percentage": 56.83, "elapsed_time": "19:30:12", "remaining_time": "14:48:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6169, "total_steps": 10853, "loss": 0.1292, "learning_rate": 2.1424307462866283e-06, "epoch": 0.5683880775786613, "percentage": 56.84, "elapsed_time": "19:30:22", "remaining_time": "14:48:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6170, "total_steps": 10853, "loss": 0.1217, "learning_rate": 2.141676812134216e-06, "epoch": 0.5684802137559313, "percentage": 56.85, "elapsed_time": "19:30:34", "remaining_time": "14:48:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6171, "total_steps": 10853, "loss": 0.1394, "learning_rate": 2.1409229112521498e-06, "epoch": 0.5685723499332013, "percentage": 56.86, "elapsed_time": "19:30:46", "remaining_time": "14:48:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6172, "total_steps": 10853, "loss": 0.1227, "learning_rate": 2.1401690437104306e-06, "epoch": 0.5686644861104713, "percentage": 56.87, "elapsed_time": "19:30:58", "remaining_time": "14:48:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6173, "total_steps": 10853, "loss": 0.1361, "learning_rate": 2.139415209579055e-06, "epoch": 0.5687566222877413, "percentage": 56.88, "elapsed_time": "19:31:08", "remaining_time": "14:47:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6174, "total_steps": 10853, "loss": 0.1446, "learning_rate": 2.1386614089280145e-06, "epoch": 0.5688487584650113, "percentage": 56.89, "elapsed_time": "19:31:19", "remaining_time": "14:47:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6175, "total_steps": 10853, "loss": 0.1437, "learning_rate": 2.137907641827302e-06, "epoch": 0.5689408946422813, "percentage": 56.9, "elapsed_time": "19:31:30", "remaining_time": "14:47:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6176, "total_steps": 10853, "loss": 0.1397, "learning_rate": 2.1371539083469033e-06, "epoch": 0.5690330308195513, "percentage": 56.91, "elapsed_time": "19:31:40", "remaining_time": "14:47:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6177, "total_steps": 10853, "loss": 0.1355, "learning_rate": 2.1364002085568046e-06, "epoch": 0.5691251669968213, "percentage": 56.92, "elapsed_time": "19:31:51", "remaining_time": "14:47:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6178, "total_steps": 10853, "loss": 0.1288, "learning_rate": 2.135646542526985e-06, "epoch": 0.5692173031740914, "percentage": 56.92, "elapsed_time": "19:32:01", "remaining_time": "14:46:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6179, "total_steps": 10853, "loss": 0.1296, "learning_rate": 2.1348929103274223e-06, "epoch": 0.5693094393513614, "percentage": 56.93, "elapsed_time": "19:32:10", "remaining_time": "14:46:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6180, "total_steps": 10853, "loss": 0.1366, "learning_rate": 2.134139312028093e-06, "epoch": 0.5694015755286314, "percentage": 56.94, "elapsed_time": "19:32:22", "remaining_time": "14:46:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6181, "total_steps": 10853, "loss": 0.1348, "learning_rate": 2.1333857476989685e-06, "epoch": 0.5694937117059014, "percentage": 56.95, "elapsed_time": "19:32:34", "remaining_time": "14:46:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6182, "total_steps": 10853, "loss": 0.1265, "learning_rate": 2.1326322174100156e-06, "epoch": 0.5695858478831713, "percentage": 56.96, "elapsed_time": "19:32:44", "remaining_time": "14:46:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6183, "total_steps": 10853, "loss": 0.14, "learning_rate": 2.1318787212312015e-06, "epoch": 0.5696779840604413, "percentage": 56.97, "elapsed_time": "19:32:55", "remaining_time": "14:45:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6184, "total_steps": 10853, "loss": 0.1319, "learning_rate": 2.131125259232487e-06, "epoch": 0.5697701202377113, "percentage": 56.98, "elapsed_time": "19:33:05", "remaining_time": "14:45:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6185, "total_steps": 10853, "loss": 0.1226, "learning_rate": 2.130371831483833e-06, "epoch": 0.5698622564149813, "percentage": 56.99, "elapsed_time": "19:33:16", "remaining_time": "14:45:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6186, "total_steps": 10853, "loss": 0.128, "learning_rate": 2.1296184380551936e-06, "epoch": 0.5699543925922513, "percentage": 57.0, "elapsed_time": "19:33:28", "remaining_time": "14:45:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6187, "total_steps": 10853, "loss": 0.1402, "learning_rate": 2.128865079016522e-06, "epoch": 0.5700465287695213, "percentage": 57.01, "elapsed_time": "19:33:39", "remaining_time": "14:45:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6188, "total_steps": 10853, "loss": 0.1391, "learning_rate": 2.128111754437768e-06, "epoch": 0.5701386649467913, "percentage": 57.02, "elapsed_time": "19:33:49", "remaining_time": "14:44:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6189, "total_steps": 10853, "loss": 0.1366, "learning_rate": 2.127358464388877e-06, "epoch": 0.5702308011240613, "percentage": 57.03, "elapsed_time": "19:34:01", "remaining_time": "14:44:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6190, "total_steps": 10853, "loss": 0.1467, "learning_rate": 2.1266052089397936e-06, "epoch": 0.5703229373013313, "percentage": 57.03, "elapsed_time": "19:34:11", "remaining_time": "14:44:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6191, "total_steps": 10853, "loss": 0.1287, "learning_rate": 2.1258519881604566e-06, "epoch": 0.5704150734786013, "percentage": 57.04, "elapsed_time": "19:34:22", "remaining_time": "14:44:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6192, "total_steps": 10853, "loss": 0.1304, "learning_rate": 2.125098802120802e-06, "epoch": 0.5705072096558714, "percentage": 57.05, "elapsed_time": "19:34:32", "remaining_time": "14:44:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6193, "total_steps": 10853, "loss": 0.1394, "learning_rate": 2.1243456508907643e-06, "epoch": 0.5705993458331414, "percentage": 57.06, "elapsed_time": "19:34:43", "remaining_time": "14:43:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6194, "total_steps": 10853, "loss": 0.1232, "learning_rate": 2.1235925345402746e-06, "epoch": 0.5706914820104114, "percentage": 57.07, "elapsed_time": "19:34:54", "remaining_time": "14:43:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6195, "total_steps": 10853, "loss": 0.1274, "learning_rate": 2.122839453139257e-06, "epoch": 0.5707836181876814, "percentage": 57.08, "elapsed_time": "19:35:03", "remaining_time": "14:43:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6196, "total_steps": 10853, "loss": 0.1307, "learning_rate": 2.122086406757637e-06, "epoch": 0.5708757543649514, "percentage": 57.09, "elapsed_time": "19:35:14", "remaining_time": "14:43:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6197, "total_steps": 10853, "loss": 0.1343, "learning_rate": 2.121333395465335e-06, "epoch": 0.5709678905422214, "percentage": 57.1, "elapsed_time": "19:35:24", "remaining_time": "14:43:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6198, "total_steps": 10853, "loss": 0.138, "learning_rate": 2.1205804193322685e-06, "epoch": 0.5710600267194914, "percentage": 57.11, "elapsed_time": "19:35:35", "remaining_time": "14:42:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6199, "total_steps": 10853, "loss": 0.1314, "learning_rate": 2.119827478428351e-06, "epoch": 0.5711521628967614, "percentage": 57.12, "elapsed_time": "19:35:45", "remaining_time": "14:42:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6200, "total_steps": 10853, "loss": 0.1361, "learning_rate": 2.1190745728234916e-06, "epoch": 0.5712442990740314, "percentage": 57.13, "elapsed_time": "19:35:55", "remaining_time": "14:42:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6201, "total_steps": 10853, "loss": 0.1381, "learning_rate": 2.1183217025876e-06, "epoch": 0.5713364352513014, "percentage": 57.14, "elapsed_time": "19:36:06", "remaining_time": "14:42:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6202, "total_steps": 10853, "loss": 0.1211, "learning_rate": 2.1175688677905804e-06, "epoch": 0.5714285714285714, "percentage": 57.15, "elapsed_time": "19:36:18", "remaining_time": "14:42:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6203, "total_steps": 10853, "loss": 0.1392, "learning_rate": 2.116816068502331e-06, "epoch": 0.5715207076058414, "percentage": 57.15, "elapsed_time": "19:36:28", "remaining_time": "14:41:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6204, "total_steps": 10853, "loss": 0.1346, "learning_rate": 2.1160633047927515e-06, "epoch": 0.5716128437831114, "percentage": 57.16, "elapsed_time": "19:36:40", "remaining_time": "14:41:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6205, "total_steps": 10853, "loss": 0.132, "learning_rate": 2.115310576731735e-06, "epoch": 0.5717049799603815, "percentage": 57.17, "elapsed_time": "19:36:51", "remaining_time": "14:41:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6206, "total_steps": 10853, "loss": 0.1338, "learning_rate": 2.114557884389174e-06, "epoch": 0.5717971161376515, "percentage": 57.18, "elapsed_time": "19:37:02", "remaining_time": "14:41:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6207, "total_steps": 10853, "loss": 0.1359, "learning_rate": 2.1138052278349543e-06, "epoch": 0.5718892523149215, "percentage": 57.19, "elapsed_time": "19:37:13", "remaining_time": "14:41:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6208, "total_steps": 10853, "loss": 0.1155, "learning_rate": 2.1130526071389603e-06, "epoch": 0.5719813884921915, "percentage": 57.2, "elapsed_time": "19:37:23", "remaining_time": "14:40:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6209, "total_steps": 10853, "loss": 0.1303, "learning_rate": 2.1123000223710737e-06, "epoch": 0.5720735246694615, "percentage": 57.21, "elapsed_time": "19:37:34", "remaining_time": "14:40:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6210, "total_steps": 10853, "loss": 0.1321, "learning_rate": 2.1115474736011725e-06, "epoch": 0.5721656608467315, "percentage": 57.22, "elapsed_time": "19:37:45", "remaining_time": "14:40:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6211, "total_steps": 10853, "loss": 0.1383, "learning_rate": 2.110794960899129e-06, "epoch": 0.5722577970240015, "percentage": 57.23, "elapsed_time": "19:37:57", "remaining_time": "14:40:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6212, "total_steps": 10853, "loss": 0.1328, "learning_rate": 2.1100424843348157e-06, "epoch": 0.5723499332012715, "percentage": 57.24, "elapsed_time": "19:38:08", "remaining_time": "14:40:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6213, "total_steps": 10853, "loss": 0.1393, "learning_rate": 2.1092900439780993e-06, "epoch": 0.5724420693785415, "percentage": 57.25, "elapsed_time": "19:38:19", "remaining_time": "14:40:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6214, "total_steps": 10853, "loss": 0.1343, "learning_rate": 2.108537639898845e-06, "epoch": 0.5725342055558115, "percentage": 57.26, "elapsed_time": "19:38:28", "remaining_time": "14:39:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6215, "total_steps": 10853, "loss": 0.125, "learning_rate": 2.1077852721669132e-06, "epoch": 0.5726263417330815, "percentage": 57.27, "elapsed_time": "19:38:39", "remaining_time": "14:39:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6216, "total_steps": 10853, "loss": 0.1222, "learning_rate": 2.10703294085216e-06, "epoch": 0.5727184779103515, "percentage": 57.27, "elapsed_time": "19:38:49", "remaining_time": "14:39:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6217, "total_steps": 10853, "loss": 0.1351, "learning_rate": 2.1062806460244415e-06, "epoch": 0.5728106140876215, "percentage": 57.28, "elapsed_time": "19:38:59", "remaining_time": "14:39:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6218, "total_steps": 10853, "loss": 0.1376, "learning_rate": 2.1055283877536066e-06, "epoch": 0.5729027502648915, "percentage": 57.29, "elapsed_time": "19:39:10", "remaining_time": "14:38:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6219, "total_steps": 10853, "loss": 0.134, "learning_rate": 2.1047761661095043e-06, "epoch": 0.5729948864421616, "percentage": 57.3, "elapsed_time": "19:39:21", "remaining_time": "14:38:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6220, "total_steps": 10853, "loss": 0.1382, "learning_rate": 2.1040239811619774e-06, "epoch": 0.5730870226194316, "percentage": 57.31, "elapsed_time": "19:39:31", "remaining_time": "14:38:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6221, "total_steps": 10853, "loss": 0.135, "learning_rate": 2.1032718329808656e-06, "epoch": 0.5731791587967016, "percentage": 57.32, "elapsed_time": "19:39:41", "remaining_time": "14:38:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6222, "total_steps": 10853, "loss": 0.1269, "learning_rate": 2.102519721636007e-06, "epoch": 0.5732712949739716, "percentage": 57.33, "elapsed_time": "19:39:50", "remaining_time": "14:38:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6223, "total_steps": 10853, "loss": 0.1194, "learning_rate": 2.1017676471972363e-06, "epoch": 0.5733634311512416, "percentage": 57.34, "elapsed_time": "19:40:01", "remaining_time": "14:37:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6224, "total_steps": 10853, "loss": 0.1358, "learning_rate": 2.101015609734381e-06, "epoch": 0.5734555673285116, "percentage": 57.35, "elapsed_time": "19:40:11", "remaining_time": "14:37:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6225, "total_steps": 10853, "loss": 0.1404, "learning_rate": 2.1002636093172694e-06, "epoch": 0.5735477035057815, "percentage": 57.36, "elapsed_time": "19:40:20", "remaining_time": "14:37:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6226, "total_steps": 10853, "loss": 0.1358, "learning_rate": 2.099511646015725e-06, "epoch": 0.5736398396830515, "percentage": 57.37, "elapsed_time": "19:40:31", "remaining_time": "14:37:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6227, "total_steps": 10853, "loss": 0.1365, "learning_rate": 2.098759719899568e-06, "epoch": 0.5737319758603215, "percentage": 57.38, "elapsed_time": "19:40:41", "remaining_time": "14:37:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6228, "total_steps": 10853, "loss": 0.1368, "learning_rate": 2.0980078310386135e-06, "epoch": 0.5738241120375915, "percentage": 57.39, "elapsed_time": "19:40:52", "remaining_time": "14:36:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6229, "total_steps": 10853, "loss": 0.1374, "learning_rate": 2.097255979502675e-06, "epoch": 0.5739162482148615, "percentage": 57.39, "elapsed_time": "19:41:02", "remaining_time": "14:36:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6230, "total_steps": 10853, "loss": 0.1503, "learning_rate": 2.096504165361562e-06, "epoch": 0.5740083843921315, "percentage": 57.4, "elapsed_time": "19:41:13", "remaining_time": "14:36:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6231, "total_steps": 10853, "loss": 0.142, "learning_rate": 2.0957523886850815e-06, "epoch": 0.5741005205694015, "percentage": 57.41, "elapsed_time": "19:41:24", "remaining_time": "14:36:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6232, "total_steps": 10853, "loss": 0.1287, "learning_rate": 2.095000649543035e-06, "epoch": 0.5741926567466715, "percentage": 57.42, "elapsed_time": "19:41:35", "remaining_time": "14:36:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6233, "total_steps": 10853, "loss": 0.1242, "learning_rate": 2.0942489480052214e-06, "epoch": 0.5742847929239416, "percentage": 57.43, "elapsed_time": "19:41:46", "remaining_time": "14:35:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6234, "total_steps": 10853, "loss": 0.1393, "learning_rate": 2.093497284141436e-06, "epoch": 0.5743769291012116, "percentage": 57.44, "elapsed_time": "19:41:57", "remaining_time": "14:35:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6235, "total_steps": 10853, "loss": 0.1421, "learning_rate": 2.0927456580214733e-06, "epoch": 0.5744690652784816, "percentage": 57.45, "elapsed_time": "19:42:07", "remaining_time": "14:35:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6236, "total_steps": 10853, "loss": 0.1242, "learning_rate": 2.091994069715119e-06, "epoch": 0.5745612014557516, "percentage": 57.46, "elapsed_time": "19:42:18", "remaining_time": "14:35:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6237, "total_steps": 10853, "loss": 0.1312, "learning_rate": 2.0912425192921588e-06, "epoch": 0.5746533376330216, "percentage": 57.47, "elapsed_time": "19:42:29", "remaining_time": "14:35:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6238, "total_steps": 10853, "loss": 0.147, "learning_rate": 2.0904910068223745e-06, "epoch": 0.5747454738102916, "percentage": 57.48, "elapsed_time": "19:42:40", "remaining_time": "14:34:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6239, "total_steps": 10853, "loss": 0.115, "learning_rate": 2.0897395323755464e-06, "epoch": 0.5748376099875616, "percentage": 57.49, "elapsed_time": "19:42:49", "remaining_time": "14:34:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6240, "total_steps": 10853, "loss": 0.1237, "learning_rate": 2.088988096021445e-06, "epoch": 0.5749297461648316, "percentage": 57.5, "elapsed_time": "19:42:59", "remaining_time": "14:34:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6241, "total_steps": 10853, "loss": 0.1366, "learning_rate": 2.088236697829843e-06, "epoch": 0.5750218823421016, "percentage": 57.5, "elapsed_time": "19:43:09", "remaining_time": "14:34:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6242, "total_steps": 10853, "loss": 0.1229, "learning_rate": 2.0874853378705085e-06, "epoch": 0.5751140185193716, "percentage": 57.51, "elapsed_time": "19:43:19", "remaining_time": "14:34:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6243, "total_steps": 10853, "loss": 0.1303, "learning_rate": 2.0867340162132054e-06, "epoch": 0.5752061546966416, "percentage": 57.52, "elapsed_time": "19:43:32", "remaining_time": "14:33:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6244, "total_steps": 10853, "loss": 0.1418, "learning_rate": 2.0859827329276926e-06, "epoch": 0.5752982908739116, "percentage": 57.53, "elapsed_time": "19:43:42", "remaining_time": "14:33:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6245, "total_steps": 10853, "loss": 0.1397, "learning_rate": 2.0852314880837278e-06, "epoch": 0.5753904270511816, "percentage": 57.54, "elapsed_time": "19:43:54", "remaining_time": "14:33:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6246, "total_steps": 10853, "loss": 0.1341, "learning_rate": 2.0844802817510633e-06, "epoch": 0.5754825632284517, "percentage": 57.55, "elapsed_time": "19:44:05", "remaining_time": "14:33:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6247, "total_steps": 10853, "loss": 0.1185, "learning_rate": 2.08372911399945e-06, "epoch": 0.5755746994057217, "percentage": 57.56, "elapsed_time": "19:44:15", "remaining_time": "14:33:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6248, "total_steps": 10853, "loss": 0.1445, "learning_rate": 2.0829779848986337e-06, "epoch": 0.5756668355829917, "percentage": 57.57, "elapsed_time": "19:44:26", "remaining_time": "14:32:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6249, "total_steps": 10853, "loss": 0.1301, "learning_rate": 2.0822268945183555e-06, "epoch": 0.5757589717602617, "percentage": 57.58, "elapsed_time": "19:44:38", "remaining_time": "14:32:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6250, "total_steps": 10853, "loss": 0.1242, "learning_rate": 2.081475842928356e-06, "epoch": 0.5758511079375317, "percentage": 57.59, "elapsed_time": "19:44:47", "remaining_time": "14:32:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6251, "total_steps": 10853, "loss": 0.1479, "learning_rate": 2.0807248301983682e-06, "epoch": 0.5759432441148017, "percentage": 57.6, "elapsed_time": "19:44:59", "remaining_time": "14:32:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6252, "total_steps": 10853, "loss": 0.1287, "learning_rate": 2.0799738563981263e-06, "epoch": 0.5760353802920717, "percentage": 57.61, "elapsed_time": "19:45:09", "remaining_time": "14:32:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6253, "total_steps": 10853, "loss": 0.1386, "learning_rate": 2.079222921597357e-06, "epoch": 0.5761275164693417, "percentage": 57.62, "elapsed_time": "19:45:19", "remaining_time": "14:31:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6254, "total_steps": 10853, "loss": 0.1375, "learning_rate": 2.078472025865784e-06, "epoch": 0.5762196526466117, "percentage": 57.62, "elapsed_time": "19:45:30", "remaining_time": "14:31:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6255, "total_steps": 10853, "loss": 0.1344, "learning_rate": 2.077721169273129e-06, "epoch": 0.5763117888238817, "percentage": 57.63, "elapsed_time": "19:45:40", "remaining_time": "14:31:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6256, "total_steps": 10853, "loss": 0.1339, "learning_rate": 2.0769703518891096e-06, "epoch": 0.5764039250011517, "percentage": 57.64, "elapsed_time": "19:45:51", "remaining_time": "14:31:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6257, "total_steps": 10853, "loss": 0.1295, "learning_rate": 2.076219573783437e-06, "epoch": 0.5764960611784217, "percentage": 57.65, "elapsed_time": "19:46:02", "remaining_time": "14:31:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6258, "total_steps": 10853, "loss": 0.1332, "learning_rate": 2.075468835025824e-06, "epoch": 0.5765881973556917, "percentage": 57.66, "elapsed_time": "19:46:13", "remaining_time": "14:30:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6259, "total_steps": 10853, "loss": 0.1383, "learning_rate": 2.0747181356859743e-06, "epoch": 0.5766803335329617, "percentage": 57.67, "elapsed_time": "19:46:25", "remaining_time": "14:30:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6260, "total_steps": 10853, "loss": 0.1301, "learning_rate": 2.073967475833593e-06, "epoch": 0.5767724697102318, "percentage": 57.68, "elapsed_time": "19:46:36", "remaining_time": "14:30:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6261, "total_steps": 10853, "loss": 0.1358, "learning_rate": 2.0732168555383764e-06, "epoch": 0.5768646058875018, "percentage": 57.69, "elapsed_time": "19:46:47", "remaining_time": "14:30:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6262, "total_steps": 10853, "loss": 0.1328, "learning_rate": 2.0724662748700205e-06, "epoch": 0.5769567420647718, "percentage": 57.7, "elapsed_time": "19:46:59", "remaining_time": "14:30:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6263, "total_steps": 10853, "loss": 0.1328, "learning_rate": 2.0717157338982172e-06, "epoch": 0.5770488782420418, "percentage": 57.71, "elapsed_time": "19:47:10", "remaining_time": "14:30:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6264, "total_steps": 10853, "loss": 0.1309, "learning_rate": 2.0709652326926547e-06, "epoch": 0.5771410144193118, "percentage": 57.72, "elapsed_time": "19:47:21", "remaining_time": "14:29:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6265, "total_steps": 10853, "loss": 0.1547, "learning_rate": 2.070214771323015e-06, "epoch": 0.5772331505965818, "percentage": 57.73, "elapsed_time": "19:47:33", "remaining_time": "14:29:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6266, "total_steps": 10853, "loss": 0.1291, "learning_rate": 2.0694643498589816e-06, "epoch": 0.5773252867738518, "percentage": 57.74, "elapsed_time": "19:47:43", "remaining_time": "14:29:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6267, "total_steps": 10853, "loss": 0.1235, "learning_rate": 2.0687139683702284e-06, "epoch": 0.5774174229511218, "percentage": 57.74, "elapsed_time": "19:47:55", "remaining_time": "14:29:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6268, "total_steps": 10853, "loss": 0.1375, "learning_rate": 2.067963626926431e-06, "epoch": 0.5775095591283917, "percentage": 57.75, "elapsed_time": "19:48:04", "remaining_time": "14:29:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6269, "total_steps": 10853, "loss": 0.1354, "learning_rate": 2.0672133255972567e-06, "epoch": 0.5776016953056617, "percentage": 57.76, "elapsed_time": "19:48:15", "remaining_time": "14:28:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6270, "total_steps": 10853, "loss": 0.1378, "learning_rate": 2.066463064452371e-06, "epoch": 0.5776938314829317, "percentage": 57.77, "elapsed_time": "19:48:26", "remaining_time": "14:28:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6271, "total_steps": 10853, "loss": 0.1426, "learning_rate": 2.0657128435614372e-06, "epoch": 0.5777859676602017, "percentage": 57.78, "elapsed_time": "19:48:38", "remaining_time": "14:28:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6272, "total_steps": 10853, "loss": 0.1383, "learning_rate": 2.0649626629941134e-06, "epoch": 0.5778781038374717, "percentage": 57.79, "elapsed_time": "19:48:49", "remaining_time": "14:28:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6273, "total_steps": 10853, "loss": 0.1231, "learning_rate": 2.0642125228200515e-06, "epoch": 0.5779702400147418, "percentage": 57.8, "elapsed_time": "19:49:00", "remaining_time": "14:28:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6274, "total_steps": 10853, "loss": 0.1317, "learning_rate": 2.0634624231089047e-06, "epoch": 0.5780623761920118, "percentage": 57.81, "elapsed_time": "19:49:11", "remaining_time": "14:27:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6275, "total_steps": 10853, "loss": 0.1306, "learning_rate": 2.062712363930318e-06, "epoch": 0.5781545123692818, "percentage": 57.82, "elapsed_time": "19:49:21", "remaining_time": "14:27:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6276, "total_steps": 10853, "loss": 0.1311, "learning_rate": 2.0619623453539365e-06, "epoch": 0.5782466485465518, "percentage": 57.83, "elapsed_time": "19:49:32", "remaining_time": "14:27:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6277, "total_steps": 10853, "loss": 0.1349, "learning_rate": 2.0612123674493983e-06, "epoch": 0.5783387847238218, "percentage": 57.84, "elapsed_time": "19:49:42", "remaining_time": "14:27:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6278, "total_steps": 10853, "loss": 0.1488, "learning_rate": 2.060462430286338e-06, "epoch": 0.5784309209010918, "percentage": 57.85, "elapsed_time": "19:49:53", "remaining_time": "14:27:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6279, "total_steps": 10853, "loss": 0.1353, "learning_rate": 2.059712533934389e-06, "epoch": 0.5785230570783618, "percentage": 57.85, "elapsed_time": "19:50:04", "remaining_time": "14:26:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6280, "total_steps": 10853, "loss": 0.1323, "learning_rate": 2.0589626784631784e-06, "epoch": 0.5786151932556318, "percentage": 57.86, "elapsed_time": "19:50:14", "remaining_time": "14:26:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6281, "total_steps": 10853, "loss": 0.1536, "learning_rate": 2.0582128639423316e-06, "epoch": 0.5787073294329018, "percentage": 57.87, "elapsed_time": "19:50:25", "remaining_time": "14:26:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6282, "total_steps": 10853, "loss": 0.1436, "learning_rate": 2.057463090441467e-06, "epoch": 0.5787994656101718, "percentage": 57.88, "elapsed_time": "19:50:35", "remaining_time": "14:26:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6283, "total_steps": 10853, "loss": 0.1441, "learning_rate": 2.056713358030202e-06, "epoch": 0.5788916017874418, "percentage": 57.89, "elapsed_time": "19:50:47", "remaining_time": "14:26:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6284, "total_steps": 10853, "loss": 0.1318, "learning_rate": 2.0559636667781493e-06, "epoch": 0.5789837379647118, "percentage": 57.9, "elapsed_time": "19:50:57", "remaining_time": "14:25:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6285, "total_steps": 10853, "loss": 0.1303, "learning_rate": 2.055214016754919e-06, "epoch": 0.5790758741419818, "percentage": 57.91, "elapsed_time": "19:51:07", "remaining_time": "14:25:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6286, "total_steps": 10853, "loss": 0.1401, "learning_rate": 2.0544644080301138e-06, "epoch": 0.5791680103192518, "percentage": 57.92, "elapsed_time": "19:51:18", "remaining_time": "14:25:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6287, "total_steps": 10853, "loss": 0.1358, "learning_rate": 2.053714840673337e-06, "epoch": 0.5792601464965219, "percentage": 57.93, "elapsed_time": "19:51:30", "remaining_time": "14:25:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6288, "total_steps": 10853, "loss": 0.1357, "learning_rate": 2.0529653147541844e-06, "epoch": 0.5793522826737919, "percentage": 57.94, "elapsed_time": "19:51:40", "remaining_time": "14:25:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6289, "total_steps": 10853, "loss": 0.1441, "learning_rate": 2.0522158303422518e-06, "epoch": 0.5794444188510619, "percentage": 57.95, "elapsed_time": "19:51:51", "remaining_time": "14:24:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6290, "total_steps": 10853, "loss": 0.1353, "learning_rate": 2.051466387507127e-06, "epoch": 0.5795365550283319, "percentage": 57.96, "elapsed_time": "19:52:04", "remaining_time": "14:24:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6291, "total_steps": 10853, "loss": 0.1207, "learning_rate": 2.0507169863183956e-06, "epoch": 0.5796286912056019, "percentage": 57.97, "elapsed_time": "19:52:14", "remaining_time": "14:24:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6292, "total_steps": 10853, "loss": 0.1329, "learning_rate": 2.0499676268456412e-06, "epoch": 0.5797208273828719, "percentage": 57.97, "elapsed_time": "19:52:24", "remaining_time": "14:24:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6293, "total_steps": 10853, "loss": 0.1381, "learning_rate": 2.0492183091584414e-06, "epoch": 0.5798129635601419, "percentage": 57.98, "elapsed_time": "19:52:34", "remaining_time": "14:24:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6294, "total_steps": 10853, "loss": 0.139, "learning_rate": 2.048469033326369e-06, "epoch": 0.5799050997374119, "percentage": 57.99, "elapsed_time": "19:52:46", "remaining_time": "14:23:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6295, "total_steps": 10853, "loss": 0.1408, "learning_rate": 2.047719799418996e-06, "epoch": 0.5799972359146819, "percentage": 58.0, "elapsed_time": "19:52:57", "remaining_time": "14:23:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6296, "total_steps": 10853, "loss": 0.1238, "learning_rate": 2.046970607505888e-06, "epoch": 0.5800893720919519, "percentage": 58.01, "elapsed_time": "19:53:08", "remaining_time": "14:23:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6297, "total_steps": 10853, "loss": 0.1467, "learning_rate": 2.046221457656609e-06, "epoch": 0.5801815082692219, "percentage": 58.02, "elapsed_time": "19:53:19", "remaining_time": "14:23:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6298, "total_steps": 10853, "loss": 0.142, "learning_rate": 2.0454723499407158e-06, "epoch": 0.5802736444464919, "percentage": 58.03, "elapsed_time": "19:53:30", "remaining_time": "14:23:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6299, "total_steps": 10853, "loss": 0.1337, "learning_rate": 2.044723284427763e-06, "epoch": 0.5803657806237619, "percentage": 58.04, "elapsed_time": "19:53:39", "remaining_time": "14:22:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6300, "total_steps": 10853, "loss": 0.1311, "learning_rate": 2.043974261187303e-06, "epoch": 0.5804579168010319, "percentage": 58.05, "elapsed_time": "19:53:50", "remaining_time": "14:22:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6301, "total_steps": 10853, "loss": 0.1319, "learning_rate": 2.0432252802888827e-06, "epoch": 0.580550052978302, "percentage": 58.06, "elapsed_time": "19:54:01", "remaining_time": "14:22:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6302, "total_steps": 10853, "loss": 0.1321, "learning_rate": 2.042476341802043e-06, "epoch": 0.580642189155572, "percentage": 58.07, "elapsed_time": "19:54:11", "remaining_time": "14:22:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6303, "total_steps": 10853, "loss": 0.1351, "learning_rate": 2.0417274457963247e-06, "epoch": 0.580734325332842, "percentage": 58.08, "elapsed_time": "19:54:20", "remaining_time": "14:22:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6304, "total_steps": 10853, "loss": 0.1174, "learning_rate": 2.040978592341262e-06, "epoch": 0.580826461510112, "percentage": 58.09, "elapsed_time": "19:54:30", "remaining_time": "14:21:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6305, "total_steps": 10853, "loss": 0.1301, "learning_rate": 2.0402297815063867e-06, "epoch": 0.580918597687382, "percentage": 58.09, "elapsed_time": "19:54:43", "remaining_time": "14:21:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6306, "total_steps": 10853, "loss": 0.1365, "learning_rate": 2.0394810133612263e-06, "epoch": 0.581010733864652, "percentage": 58.1, "elapsed_time": "19:54:52", "remaining_time": "14:21:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6307, "total_steps": 10853, "loss": 0.1295, "learning_rate": 2.0387322879753025e-06, "epoch": 0.581102870041922, "percentage": 58.11, "elapsed_time": "19:55:02", "remaining_time": "14:21:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6308, "total_steps": 10853, "loss": 0.1348, "learning_rate": 2.0379836054181356e-06, "epoch": 0.581195006219192, "percentage": 58.12, "elapsed_time": "19:55:15", "remaining_time": "14:21:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6309, "total_steps": 10853, "loss": 0.1422, "learning_rate": 2.0372349657592404e-06, "epoch": 0.581287142396462, "percentage": 58.13, "elapsed_time": "19:55:26", "remaining_time": "14:21:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6310, "total_steps": 10853, "loss": 0.1291, "learning_rate": 2.0364863690681293e-06, "epoch": 0.581379278573732, "percentage": 58.14, "elapsed_time": "19:55:35", "remaining_time": "14:20:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6311, "total_steps": 10853, "loss": 0.1305, "learning_rate": 2.0357378154143083e-06, "epoch": 0.581471414751002, "percentage": 58.15, "elapsed_time": "19:55:45", "remaining_time": "14:20:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6312, "total_steps": 10853, "loss": 0.1249, "learning_rate": 2.0349893048672806e-06, "epoch": 0.5815635509282719, "percentage": 58.16, "elapsed_time": "19:55:55", "remaining_time": "14:20:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6313, "total_steps": 10853, "loss": 0.136, "learning_rate": 2.0342408374965457e-06, "epoch": 0.5816556871055419, "percentage": 58.17, "elapsed_time": "19:56:06", "remaining_time": "14:20:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6314, "total_steps": 10853, "loss": 0.137, "learning_rate": 2.033492413371601e-06, "epoch": 0.581747823282812, "percentage": 58.18, "elapsed_time": "19:56:18", "remaining_time": "14:20:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6315, "total_steps": 10853, "loss": 0.1299, "learning_rate": 2.0327440325619345e-06, "epoch": 0.581839959460082, "percentage": 58.19, "elapsed_time": "19:56:29", "remaining_time": "14:19:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6316, "total_steps": 10853, "loss": 0.1427, "learning_rate": 2.0319956951370346e-06, "epoch": 0.581932095637352, "percentage": 58.2, "elapsed_time": "19:56:40", "remaining_time": "14:19:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6317, "total_steps": 10853, "loss": 0.1479, "learning_rate": 2.0312474011663857e-06, "epoch": 0.582024231814622, "percentage": 58.21, "elapsed_time": "19:56:51", "remaining_time": "14:19:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6318, "total_steps": 10853, "loss": 0.1337, "learning_rate": 2.030499150719466e-06, "epoch": 0.582116367991892, "percentage": 58.21, "elapsed_time": "19:57:01", "remaining_time": "14:19:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6319, "total_steps": 10853, "loss": 0.1309, "learning_rate": 2.02975094386575e-06, "epoch": 0.582208504169162, "percentage": 58.22, "elapsed_time": "19:57:13", "remaining_time": "14:19:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6320, "total_steps": 10853, "loss": 0.1258, "learning_rate": 2.02900278067471e-06, "epoch": 0.582300640346432, "percentage": 58.23, "elapsed_time": "19:57:23", "remaining_time": "14:18:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6321, "total_steps": 10853, "loss": 0.1372, "learning_rate": 2.0282546612158116e-06, "epoch": 0.582392776523702, "percentage": 58.24, "elapsed_time": "19:57:34", "remaining_time": "14:18:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6322, "total_steps": 10853, "loss": 0.1211, "learning_rate": 2.02750658555852e-06, "epoch": 0.582484912700972, "percentage": 58.25, "elapsed_time": "19:57:43", "remaining_time": "14:18:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6323, "total_steps": 10853, "loss": 0.1305, "learning_rate": 2.026758553772292e-06, "epoch": 0.582577048878242, "percentage": 58.26, "elapsed_time": "19:57:54", "remaining_time": "14:18:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6324, "total_steps": 10853, "loss": 0.152, "learning_rate": 2.026010565926583e-06, "epoch": 0.582669185055512, "percentage": 58.27, "elapsed_time": "19:58:06", "remaining_time": "14:18:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6325, "total_steps": 10853, "loss": 0.1376, "learning_rate": 2.0252626220908448e-06, "epoch": 0.582761321232782, "percentage": 58.28, "elapsed_time": "19:58:18", "remaining_time": "14:17:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6326, "total_steps": 10853, "loss": 0.1316, "learning_rate": 2.0245147223345235e-06, "epoch": 0.582853457410052, "percentage": 58.29, "elapsed_time": "19:58:31", "remaining_time": "14:17:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6327, "total_steps": 10853, "loss": 0.1303, "learning_rate": 2.0237668667270603e-06, "epoch": 0.582945593587322, "percentage": 58.3, "elapsed_time": "19:58:43", "remaining_time": "14:17:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6328, "total_steps": 10853, "loss": 0.1328, "learning_rate": 2.023019055337895e-06, "epoch": 0.5830377297645921, "percentage": 58.31, "elapsed_time": "19:58:55", "remaining_time": "14:17:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6329, "total_steps": 10853, "loss": 0.1386, "learning_rate": 2.0222712882364617e-06, "epoch": 0.5831298659418621, "percentage": 58.32, "elapsed_time": "19:59:05", "remaining_time": "14:17:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6330, "total_steps": 10853, "loss": 0.1362, "learning_rate": 2.0215235654921912e-06, "epoch": 0.5832220021191321, "percentage": 58.32, "elapsed_time": "19:59:15", "remaining_time": "14:16:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6331, "total_steps": 10853, "loss": 0.1229, "learning_rate": 2.0207758871745088e-06, "epoch": 0.5833141382964021, "percentage": 58.33, "elapsed_time": "19:59:27", "remaining_time": "14:16:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6332, "total_steps": 10853, "loss": 0.1373, "learning_rate": 2.0200282533528367e-06, "epoch": 0.5834062744736721, "percentage": 58.34, "elapsed_time": "19:59:38", "remaining_time": "14:16:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6333, "total_steps": 10853, "loss": 0.1378, "learning_rate": 2.019280664096593e-06, "epoch": 0.5834984106509421, "percentage": 58.35, "elapsed_time": "19:59:48", "remaining_time": "14:16:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6334, "total_steps": 10853, "loss": 0.1215, "learning_rate": 2.018533119475191e-06, "epoch": 0.5835905468282121, "percentage": 58.36, "elapsed_time": "19:59:58", "remaining_time": "14:16:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6335, "total_steps": 10853, "loss": 0.1355, "learning_rate": 2.017785619558042e-06, "epoch": 0.5836826830054821, "percentage": 58.37, "elapsed_time": "20:00:09", "remaining_time": "14:15:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6336, "total_steps": 10853, "loss": 0.1224, "learning_rate": 2.0170381644145492e-06, "epoch": 0.5837748191827521, "percentage": 58.38, "elapsed_time": "20:00:19", "remaining_time": "14:15:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6337, "total_steps": 10853, "loss": 0.1348, "learning_rate": 2.0162907541141146e-06, "epoch": 0.5838669553600221, "percentage": 58.39, "elapsed_time": "20:00:31", "remaining_time": "14:15:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6338, "total_steps": 10853, "loss": 0.1289, "learning_rate": 2.0155433887261362e-06, "epoch": 0.5839590915372921, "percentage": 58.4, "elapsed_time": "20:00:42", "remaining_time": "14:15:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6339, "total_steps": 10853, "loss": 0.1351, "learning_rate": 2.0147960683200064e-06, "epoch": 0.5840512277145621, "percentage": 58.41, "elapsed_time": "20:00:52", "remaining_time": "14:15:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6340, "total_steps": 10853, "loss": 0.1306, "learning_rate": 2.014048792965113e-06, "epoch": 0.5841433638918321, "percentage": 58.42, "elapsed_time": "20:01:03", "remaining_time": "14:14:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6341, "total_steps": 10853, "loss": 0.1384, "learning_rate": 2.013301562730842e-06, "epoch": 0.5842355000691022, "percentage": 58.43, "elapsed_time": "20:01:15", "remaining_time": "14:14:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6342, "total_steps": 10853, "loss": 0.1213, "learning_rate": 2.0125543776865723e-06, "epoch": 0.5843276362463722, "percentage": 58.44, "elapsed_time": "20:01:25", "remaining_time": "14:14:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6343, "total_steps": 10853, "loss": 0.1168, "learning_rate": 2.011807237901683e-06, "epoch": 0.5844197724236422, "percentage": 58.44, "elapsed_time": "20:01:35", "remaining_time": "14:14:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6344, "total_steps": 10853, "loss": 0.141, "learning_rate": 2.011060143445543e-06, "epoch": 0.5845119086009122, "percentage": 58.45, "elapsed_time": "20:01:46", "remaining_time": "14:14:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6345, "total_steps": 10853, "loss": 0.1324, "learning_rate": 2.010313094387521e-06, "epoch": 0.5846040447781822, "percentage": 58.46, "elapsed_time": "20:01:57", "remaining_time": "14:13:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6346, "total_steps": 10853, "loss": 0.1331, "learning_rate": 2.0095660907969816e-06, "epoch": 0.5846961809554522, "percentage": 58.47, "elapsed_time": "20:02:08", "remaining_time": "14:13:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6347, "total_steps": 10853, "loss": 0.1205, "learning_rate": 2.0088191327432838e-06, "epoch": 0.5847883171327222, "percentage": 58.48, "elapsed_time": "20:02:18", "remaining_time": "14:13:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6348, "total_steps": 10853, "loss": 0.1269, "learning_rate": 2.0080722202957813e-06, "epoch": 0.5848804533099922, "percentage": 58.49, "elapsed_time": "20:02:30", "remaining_time": "14:13:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6349, "total_steps": 10853, "loss": 0.1348, "learning_rate": 2.0073253535238266e-06, "epoch": 0.5849725894872622, "percentage": 58.5, "elapsed_time": "20:02:40", "remaining_time": "14:13:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6350, "total_steps": 10853, "loss": 0.1231, "learning_rate": 2.0065785324967654e-06, "epoch": 0.5850647256645322, "percentage": 58.51, "elapsed_time": "20:02:51", "remaining_time": "14:12:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6351, "total_steps": 10853, "loss": 0.1361, "learning_rate": 2.0058317572839418e-06, "epoch": 0.5851568618418022, "percentage": 58.52, "elapsed_time": "20:03:01", "remaining_time": "14:12:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6352, "total_steps": 10853, "loss": 0.1421, "learning_rate": 2.0050850279546918e-06, "epoch": 0.5852489980190722, "percentage": 58.53, "elapsed_time": "20:03:12", "remaining_time": "14:12:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6353, "total_steps": 10853, "loss": 0.1311, "learning_rate": 2.00433834457835e-06, "epoch": 0.5853411341963421, "percentage": 58.54, "elapsed_time": "20:03:22", "remaining_time": "14:12:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6354, "total_steps": 10853, "loss": 0.1365, "learning_rate": 2.0035917072242463e-06, "epoch": 0.5854332703736121, "percentage": 58.55, "elapsed_time": "20:03:33", "remaining_time": "14:12:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6355, "total_steps": 10853, "loss": 0.1304, "learning_rate": 2.002845115961707e-06, "epoch": 0.5855254065508823, "percentage": 58.56, "elapsed_time": "20:03:45", "remaining_time": "14:12:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6356, "total_steps": 10853, "loss": 0.1341, "learning_rate": 2.002098570860051e-06, "epoch": 0.5856175427281523, "percentage": 58.56, "elapsed_time": "20:03:56", "remaining_time": "14:11:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6357, "total_steps": 10853, "loss": 0.1395, "learning_rate": 2.001352071988597e-06, "epoch": 0.5857096789054222, "percentage": 58.57, "elapsed_time": "20:04:07", "remaining_time": "14:11:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6358, "total_steps": 10853, "loss": 0.133, "learning_rate": 2.000605619416656e-06, "epoch": 0.5858018150826922, "percentage": 58.58, "elapsed_time": "20:04:18", "remaining_time": "14:11:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6359, "total_steps": 10853, "loss": 0.1437, "learning_rate": 1.999859213213538e-06, "epoch": 0.5858939512599622, "percentage": 58.59, "elapsed_time": "20:04:29", "remaining_time": "14:11:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6360, "total_steps": 10853, "loss": 0.1315, "learning_rate": 1.9991128534485454e-06, "epoch": 0.5859860874372322, "percentage": 58.6, "elapsed_time": "20:04:40", "remaining_time": "14:11:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6361, "total_steps": 10853, "loss": 0.1228, "learning_rate": 1.998366540190978e-06, "epoch": 0.5860782236145022, "percentage": 58.61, "elapsed_time": "20:04:52", "remaining_time": "14:10:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6362, "total_steps": 10853, "loss": 0.1385, "learning_rate": 1.9976202735101314e-06, "epoch": 0.5861703597917722, "percentage": 58.62, "elapsed_time": "20:05:03", "remaining_time": "14:10:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6363, "total_steps": 10853, "loss": 0.1201, "learning_rate": 1.9968740534752965e-06, "epoch": 0.5862624959690422, "percentage": 58.63, "elapsed_time": "20:05:14", "remaining_time": "14:10:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6364, "total_steps": 10853, "loss": 0.1402, "learning_rate": 1.9961278801557606e-06, "epoch": 0.5863546321463122, "percentage": 58.64, "elapsed_time": "20:05:25", "remaining_time": "14:10:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6365, "total_steps": 10853, "loss": 0.1289, "learning_rate": 1.9953817536208046e-06, "epoch": 0.5864467683235822, "percentage": 58.65, "elapsed_time": "20:05:35", "remaining_time": "14:10:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6366, "total_steps": 10853, "loss": 0.1401, "learning_rate": 1.994635673939707e-06, "epoch": 0.5865389045008522, "percentage": 58.66, "elapsed_time": "20:05:47", "remaining_time": "14:09:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6367, "total_steps": 10853, "loss": 0.1389, "learning_rate": 1.9938896411817416e-06, "epoch": 0.5866310406781222, "percentage": 58.67, "elapsed_time": "20:05:57", "remaining_time": "14:09:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6368, "total_steps": 10853, "loss": 0.1194, "learning_rate": 1.9931436554161783e-06, "epoch": 0.5867231768553922, "percentage": 58.68, "elapsed_time": "20:06:07", "remaining_time": "14:09:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6369, "total_steps": 10853, "loss": 0.1489, "learning_rate": 1.9923977167122797e-06, "epoch": 0.5868153130326623, "percentage": 58.68, "elapsed_time": "20:06:18", "remaining_time": "14:09:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6370, "total_steps": 10853, "loss": 0.1354, "learning_rate": 1.9916518251393085e-06, "epoch": 0.5869074492099323, "percentage": 58.69, "elapsed_time": "20:06:30", "remaining_time": "14:09:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6371, "total_steps": 10853, "loss": 0.1257, "learning_rate": 1.9909059807665195e-06, "epoch": 0.5869995853872023, "percentage": 58.7, "elapsed_time": "20:06:41", "remaining_time": "14:08:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6372, "total_steps": 10853, "loss": 0.1348, "learning_rate": 1.990160183663166e-06, "epoch": 0.5870917215644723, "percentage": 58.71, "elapsed_time": "20:06:52", "remaining_time": "14:08:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6373, "total_steps": 10853, "loss": 0.132, "learning_rate": 1.9894144338984937e-06, "epoch": 0.5871838577417423, "percentage": 58.72, "elapsed_time": "20:07:03", "remaining_time": "14:08:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6374, "total_steps": 10853, "loss": 0.1344, "learning_rate": 1.9886687315417456e-06, "epoch": 0.5872759939190123, "percentage": 58.73, "elapsed_time": "20:07:14", "remaining_time": "14:08:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6375, "total_steps": 10853, "loss": 0.1354, "learning_rate": 1.9879230766621616e-06, "epoch": 0.5873681300962823, "percentage": 58.74, "elapsed_time": "20:07:25", "remaining_time": "14:08:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6376, "total_steps": 10853, "loss": 0.1279, "learning_rate": 1.9871774693289754e-06, "epoch": 0.5874602662735523, "percentage": 58.75, "elapsed_time": "20:07:35", "remaining_time": "14:07:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6377, "total_steps": 10853, "loss": 0.1301, "learning_rate": 1.9864319096114152e-06, "epoch": 0.5875524024508223, "percentage": 58.76, "elapsed_time": "20:07:46", "remaining_time": "14:07:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6378, "total_steps": 10853, "loss": 0.1477, "learning_rate": 1.985686397578708e-06, "epoch": 0.5876445386280923, "percentage": 58.77, "elapsed_time": "20:07:58", "remaining_time": "14:07:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6379, "total_steps": 10853, "loss": 0.1174, "learning_rate": 1.984940933300074e-06, "epoch": 0.5877366748053623, "percentage": 58.78, "elapsed_time": "20:08:08", "remaining_time": "14:07:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6380, "total_steps": 10853, "loss": 0.1329, "learning_rate": 1.984195516844731e-06, "epoch": 0.5878288109826323, "percentage": 58.79, "elapsed_time": "20:08:18", "remaining_time": "14:07:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6381, "total_steps": 10853, "loss": 0.1394, "learning_rate": 1.9834501482818885e-06, "epoch": 0.5879209471599023, "percentage": 58.79, "elapsed_time": "20:08:29", "remaining_time": "14:06:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6382, "total_steps": 10853, "loss": 0.1361, "learning_rate": 1.9827048276807552e-06, "epoch": 0.5880130833371724, "percentage": 58.8, "elapsed_time": "20:08:41", "remaining_time": "14:06:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6383, "total_steps": 10853, "loss": 0.142, "learning_rate": 1.9819595551105346e-06, "epoch": 0.5881052195144424, "percentage": 58.81, "elapsed_time": "20:08:52", "remaining_time": "14:06:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6384, "total_steps": 10853, "loss": 0.1325, "learning_rate": 1.9812143306404262e-06, "epoch": 0.5881973556917124, "percentage": 58.82, "elapsed_time": "20:09:02", "remaining_time": "14:06:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6385, "total_steps": 10853, "loss": 0.1255, "learning_rate": 1.9804691543396213e-06, "epoch": 0.5882894918689824, "percentage": 58.83, "elapsed_time": "20:09:12", "remaining_time": "14:06:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6386, "total_steps": 10853, "loss": 0.1325, "learning_rate": 1.9797240262773122e-06, "epoch": 0.5883816280462524, "percentage": 58.84, "elapsed_time": "20:09:23", "remaining_time": "14:05:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6387, "total_steps": 10853, "loss": 0.1253, "learning_rate": 1.9789789465226825e-06, "epoch": 0.5884737642235224, "percentage": 58.85, "elapsed_time": "20:09:34", "remaining_time": "14:05:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6388, "total_steps": 10853, "loss": 0.1401, "learning_rate": 1.978233915144915e-06, "epoch": 0.5885659004007924, "percentage": 58.86, "elapsed_time": "20:09:45", "remaining_time": "14:05:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6389, "total_steps": 10853, "loss": 0.1397, "learning_rate": 1.977488932213184e-06, "epoch": 0.5886580365780624, "percentage": 58.87, "elapsed_time": "20:09:56", "remaining_time": "14:05:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6390, "total_steps": 10853, "loss": 0.1431, "learning_rate": 1.976743997796661e-06, "epoch": 0.5887501727553324, "percentage": 58.88, "elapsed_time": "20:10:08", "remaining_time": "14:05:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6391, "total_steps": 10853, "loss": 0.1311, "learning_rate": 1.975999111964515e-06, "epoch": 0.5888423089326024, "percentage": 58.89, "elapsed_time": "20:10:20", "remaining_time": "14:05:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6392, "total_steps": 10853, "loss": 0.1332, "learning_rate": 1.9752542747859076e-06, "epoch": 0.5889344451098724, "percentage": 58.9, "elapsed_time": "20:10:30", "remaining_time": "14:04:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6393, "total_steps": 10853, "loss": 0.1185, "learning_rate": 1.974509486329998e-06, "epoch": 0.5890265812871424, "percentage": 58.91, "elapsed_time": "20:10:40", "remaining_time": "14:04:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6394, "total_steps": 10853, "loss": 0.1244, "learning_rate": 1.973764746665938e-06, "epoch": 0.5891187174644124, "percentage": 58.91, "elapsed_time": "20:10:52", "remaining_time": "14:04:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6395, "total_steps": 10853, "loss": 0.1361, "learning_rate": 1.9730200558628784e-06, "epoch": 0.5892108536416824, "percentage": 58.92, "elapsed_time": "20:11:03", "remaining_time": "14:04:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6396, "total_steps": 10853, "loss": 0.1276, "learning_rate": 1.972275413989963e-06, "epoch": 0.5893029898189525, "percentage": 58.93, "elapsed_time": "20:11:14", "remaining_time": "14:04:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6397, "total_steps": 10853, "loss": 0.1351, "learning_rate": 1.971530821116333e-06, "epoch": 0.5893951259962225, "percentage": 58.94, "elapsed_time": "20:11:26", "remaining_time": "14:03:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6398, "total_steps": 10853, "loss": 0.135, "learning_rate": 1.970786277311123e-06, "epoch": 0.5894872621734925, "percentage": 58.95, "elapsed_time": "20:11:36", "remaining_time": "14:03:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6399, "total_steps": 10853, "loss": 0.1351, "learning_rate": 1.9700417826434633e-06, "epoch": 0.5895793983507625, "percentage": 58.96, "elapsed_time": "20:11:47", "remaining_time": "14:03:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6400, "total_steps": 10853, "loss": 0.1521, "learning_rate": 1.969297337182482e-06, "epoch": 0.5896715345280324, "percentage": 58.97, "elapsed_time": "20:11:59", "remaining_time": "14:03:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6401, "total_steps": 10853, "loss": 0.1278, "learning_rate": 1.9685529409973e-06, "epoch": 0.5897636707053024, "percentage": 58.98, "elapsed_time": "20:12:08", "remaining_time": "14:03:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6402, "total_steps": 10853, "loss": 0.1267, "learning_rate": 1.967808594157034e-06, "epoch": 0.5898558068825724, "percentage": 58.99, "elapsed_time": "20:12:19", "remaining_time": "14:02:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6403, "total_steps": 10853, "loss": 0.1399, "learning_rate": 1.9670642967307974e-06, "epoch": 0.5899479430598424, "percentage": 59.0, "elapsed_time": "20:12:28", "remaining_time": "14:02:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6404, "total_steps": 10853, "loss": 0.1282, "learning_rate": 1.9663200487876983e-06, "epoch": 0.5900400792371124, "percentage": 59.01, "elapsed_time": "20:12:39", "remaining_time": "14:02:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6405, "total_steps": 10853, "loss": 0.1313, "learning_rate": 1.965575850396841e-06, "epoch": 0.5901322154143824, "percentage": 59.02, "elapsed_time": "20:12:49", "remaining_time": "14:02:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6406, "total_steps": 10853, "loss": 0.1169, "learning_rate": 1.9648317016273227e-06, "epoch": 0.5902243515916524, "percentage": 59.03, "elapsed_time": "20:13:00", "remaining_time": "14:02:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6407, "total_steps": 10853, "loss": 0.134, "learning_rate": 1.964087602548238e-06, "epoch": 0.5903164877689224, "percentage": 59.03, "elapsed_time": "20:13:11", "remaining_time": "14:01:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6408, "total_steps": 10853, "loss": 0.1397, "learning_rate": 1.9633435532286775e-06, "epoch": 0.5904086239461924, "percentage": 59.04, "elapsed_time": "20:13:21", "remaining_time": "14:01:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6409, "total_steps": 10853, "loss": 0.1155, "learning_rate": 1.9625995537377268e-06, "epoch": 0.5905007601234625, "percentage": 59.05, "elapsed_time": "20:13:30", "remaining_time": "14:01:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6410, "total_steps": 10853, "loss": 0.1409, "learning_rate": 1.961855604144464e-06, "epoch": 0.5905928963007325, "percentage": 59.06, "elapsed_time": "20:13:42", "remaining_time": "14:01:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6411, "total_steps": 10853, "loss": 0.1441, "learning_rate": 1.961111704517967e-06, "epoch": 0.5906850324780025, "percentage": 59.07, "elapsed_time": "20:13:52", "remaining_time": "14:01:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6412, "total_steps": 10853, "loss": 0.1392, "learning_rate": 1.9603678549273054e-06, "epoch": 0.5907771686552725, "percentage": 59.08, "elapsed_time": "20:14:03", "remaining_time": "14:00:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6413, "total_steps": 10853, "loss": 0.1309, "learning_rate": 1.959624055441548e-06, "epoch": 0.5908693048325425, "percentage": 59.09, "elapsed_time": "20:14:14", "remaining_time": "14:00:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6414, "total_steps": 10853, "loss": 0.1469, "learning_rate": 1.9588803061297544e-06, "epoch": 0.5909614410098125, "percentage": 59.1, "elapsed_time": "20:14:25", "remaining_time": "14:00:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6415, "total_steps": 10853, "loss": 0.1137, "learning_rate": 1.9581366070609824e-06, "epoch": 0.5910535771870825, "percentage": 59.11, "elapsed_time": "20:14:35", "remaining_time": "14:00:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6416, "total_steps": 10853, "loss": 0.1302, "learning_rate": 1.957392958304285e-06, "epoch": 0.5911457133643525, "percentage": 59.12, "elapsed_time": "20:14:46", "remaining_time": "14:00:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6417, "total_steps": 10853, "loss": 0.1378, "learning_rate": 1.9566493599287103e-06, "epoch": 0.5912378495416225, "percentage": 59.13, "elapsed_time": "20:14:57", "remaining_time": "13:59:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6418, "total_steps": 10853, "loss": 0.1172, "learning_rate": 1.9559058120032997e-06, "epoch": 0.5913299857188925, "percentage": 59.14, "elapsed_time": "20:15:08", "remaining_time": "13:59:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6419, "total_steps": 10853, "loss": 0.1382, "learning_rate": 1.955162314597094e-06, "epoch": 0.5914221218961625, "percentage": 59.14, "elapsed_time": "20:15:18", "remaining_time": "13:59:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6420, "total_steps": 10853, "loss": 0.1395, "learning_rate": 1.9544188677791253e-06, "epoch": 0.5915142580734325, "percentage": 59.15, "elapsed_time": "20:15:29", "remaining_time": "13:59:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6421, "total_steps": 10853, "loss": 0.1324, "learning_rate": 1.9536754716184244e-06, "epoch": 0.5916063942507025, "percentage": 59.16, "elapsed_time": "20:15:41", "remaining_time": "13:59:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6422, "total_steps": 10853, "loss": 0.1286, "learning_rate": 1.9529321261840148e-06, "epoch": 0.5916985304279725, "percentage": 59.17, "elapsed_time": "20:15:51", "remaining_time": "13:58:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6423, "total_steps": 10853, "loss": 0.1425, "learning_rate": 1.952188831544915e-06, "epoch": 0.5917906666052426, "percentage": 59.18, "elapsed_time": "20:16:02", "remaining_time": "13:58:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6424, "total_steps": 10853, "loss": 0.1236, "learning_rate": 1.951445587770142e-06, "epoch": 0.5918828027825126, "percentage": 59.19, "elapsed_time": "20:16:12", "remaining_time": "13:58:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6425, "total_steps": 10853, "loss": 0.135, "learning_rate": 1.9507023949287045e-06, "epoch": 0.5919749389597826, "percentage": 59.2, "elapsed_time": "20:16:23", "remaining_time": "13:58:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6426, "total_steps": 10853, "loss": 0.1191, "learning_rate": 1.94995925308961e-06, "epoch": 0.5920670751370526, "percentage": 59.21, "elapsed_time": "20:16:33", "remaining_time": "13:58:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6427, "total_steps": 10853, "loss": 0.1347, "learning_rate": 1.9492161623218576e-06, "epoch": 0.5921592113143226, "percentage": 59.22, "elapsed_time": "20:16:44", "remaining_time": "13:57:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6428, "total_steps": 10853, "loss": 0.1301, "learning_rate": 1.9484731226944427e-06, "epoch": 0.5922513474915926, "percentage": 59.23, "elapsed_time": "20:16:56", "remaining_time": "13:57:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6429, "total_steps": 10853, "loss": 0.1356, "learning_rate": 1.9477301342763587e-06, "epoch": 0.5923434836688626, "percentage": 59.24, "elapsed_time": "20:17:08", "remaining_time": "13:57:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6430, "total_steps": 10853, "loss": 0.1356, "learning_rate": 1.946987197136592e-06, "epoch": 0.5924356198461326, "percentage": 59.25, "elapsed_time": "20:17:20", "remaining_time": "13:57:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6431, "total_steps": 10853, "loss": 0.1442, "learning_rate": 1.946244311344122e-06, "epoch": 0.5925277560234026, "percentage": 59.26, "elapsed_time": "20:17:30", "remaining_time": "13:57:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6432, "total_steps": 10853, "loss": 0.1334, "learning_rate": 1.945501476967928e-06, "epoch": 0.5926198922006726, "percentage": 59.26, "elapsed_time": "20:17:41", "remaining_time": "13:56:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6433, "total_steps": 10853, "loss": 0.1251, "learning_rate": 1.9447586940769808e-06, "epoch": 0.5927120283779426, "percentage": 59.27, "elapsed_time": "20:17:52", "remaining_time": "13:56:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6434, "total_steps": 10853, "loss": 0.1224, "learning_rate": 1.9440159627402497e-06, "epoch": 0.5928041645552126, "percentage": 59.28, "elapsed_time": "20:18:04", "remaining_time": "13:56:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6435, "total_steps": 10853, "loss": 0.1314, "learning_rate": 1.9432732830266958e-06, "epoch": 0.5928963007324826, "percentage": 59.29, "elapsed_time": "20:18:16", "remaining_time": "13:56:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6436, "total_steps": 10853, "loss": 0.1438, "learning_rate": 1.9425306550052774e-06, "epoch": 0.5929884369097527, "percentage": 59.3, "elapsed_time": "20:18:26", "remaining_time": "13:56:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6437, "total_steps": 10853, "loss": 0.1359, "learning_rate": 1.9417880787449476e-06, "epoch": 0.5930805730870227, "percentage": 59.31, "elapsed_time": "20:18:37", "remaining_time": "13:56:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6438, "total_steps": 10853, "loss": 0.1305, "learning_rate": 1.9410455543146554e-06, "epoch": 0.5931727092642927, "percentage": 59.32, "elapsed_time": "20:18:48", "remaining_time": "13:55:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6439, "total_steps": 10853, "loss": 0.134, "learning_rate": 1.9403030817833428e-06, "epoch": 0.5932648454415627, "percentage": 59.33, "elapsed_time": "20:18:58", "remaining_time": "13:55:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6440, "total_steps": 10853, "loss": 0.1367, "learning_rate": 1.93956066121995e-06, "epoch": 0.5933569816188327, "percentage": 59.34, "elapsed_time": "20:19:09", "remaining_time": "13:55:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6441, "total_steps": 10853, "loss": 0.1379, "learning_rate": 1.938818292693409e-06, "epoch": 0.5934491177961027, "percentage": 59.35, "elapsed_time": "20:19:21", "remaining_time": "13:55:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6442, "total_steps": 10853, "loss": 0.1439, "learning_rate": 1.9380759762726512e-06, "epoch": 0.5935412539733727, "percentage": 59.36, "elapsed_time": "20:19:32", "remaining_time": "13:55:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6443, "total_steps": 10853, "loss": 0.1262, "learning_rate": 1.9373337120265993e-06, "epoch": 0.5936333901506426, "percentage": 59.37, "elapsed_time": "20:19:43", "remaining_time": "13:54:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6444, "total_steps": 10853, "loss": 0.1448, "learning_rate": 1.936591500024172e-06, "epoch": 0.5937255263279126, "percentage": 59.38, "elapsed_time": "20:19:54", "remaining_time": "13:54:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6445, "total_steps": 10853, "loss": 0.1316, "learning_rate": 1.935849340334285e-06, "epoch": 0.5938176625051826, "percentage": 59.38, "elapsed_time": "20:20:04", "remaining_time": "13:54:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6446, "total_steps": 10853, "loss": 0.1345, "learning_rate": 1.9351072330258483e-06, "epoch": 0.5939097986824526, "percentage": 59.39, "elapsed_time": "20:20:15", "remaining_time": "13:54:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6447, "total_steps": 10853, "loss": 0.142, "learning_rate": 1.9343651781677648e-06, "epoch": 0.5940019348597226, "percentage": 59.4, "elapsed_time": "20:20:25", "remaining_time": "13:54:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6448, "total_steps": 10853, "loss": 0.1385, "learning_rate": 1.933623175828935e-06, "epoch": 0.5940940710369926, "percentage": 59.41, "elapsed_time": "20:20:34", "remaining_time": "13:53:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6449, "total_steps": 10853, "loss": 0.1287, "learning_rate": 1.932881226078255e-06, "epoch": 0.5941862072142626, "percentage": 59.42, "elapsed_time": "20:20:46", "remaining_time": "13:53:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6450, "total_steps": 10853, "loss": 0.1265, "learning_rate": 1.932139328984614e-06, "epoch": 0.5942783433915327, "percentage": 59.43, "elapsed_time": "20:20:57", "remaining_time": "13:53:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6451, "total_steps": 10853, "loss": 0.1322, "learning_rate": 1.931397484616898e-06, "epoch": 0.5943704795688027, "percentage": 59.44, "elapsed_time": "20:21:08", "remaining_time": "13:53:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6452, "total_steps": 10853, "loss": 0.1389, "learning_rate": 1.9306556930439857e-06, "epoch": 0.5944626157460727, "percentage": 59.45, "elapsed_time": "20:21:18", "remaining_time": "13:53:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6453, "total_steps": 10853, "loss": 0.1404, "learning_rate": 1.929913954334754e-06, "epoch": 0.5945547519233427, "percentage": 59.46, "elapsed_time": "20:21:28", "remaining_time": "13:52:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6454, "total_steps": 10853, "loss": 0.1386, "learning_rate": 1.929172268558073e-06, "epoch": 0.5946468881006127, "percentage": 59.47, "elapsed_time": "20:21:40", "remaining_time": "13:52:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6455, "total_steps": 10853, "loss": 0.1194, "learning_rate": 1.928430635782809e-06, "epoch": 0.5947390242778827, "percentage": 59.48, "elapsed_time": "20:21:51", "remaining_time": "13:52:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6456, "total_steps": 10853, "loss": 0.1148, "learning_rate": 1.9276890560778215e-06, "epoch": 0.5948311604551527, "percentage": 59.49, "elapsed_time": "20:22:02", "remaining_time": "13:52:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6457, "total_steps": 10853, "loss": 0.1354, "learning_rate": 1.9269475295119663e-06, "epoch": 0.5949232966324227, "percentage": 59.5, "elapsed_time": "20:22:14", "remaining_time": "13:52:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6458, "total_steps": 10853, "loss": 0.1336, "learning_rate": 1.9262060561540946e-06, "epoch": 0.5950154328096927, "percentage": 59.5, "elapsed_time": "20:22:25", "remaining_time": "13:51:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6459, "total_steps": 10853, "loss": 0.1215, "learning_rate": 1.9254646360730533e-06, "epoch": 0.5951075689869627, "percentage": 59.51, "elapsed_time": "20:22:35", "remaining_time": "13:51:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6460, "total_steps": 10853, "loss": 0.1241, "learning_rate": 1.9247232693376815e-06, "epoch": 0.5951997051642327, "percentage": 59.52, "elapsed_time": "20:22:45", "remaining_time": "13:51:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6461, "total_steps": 10853, "loss": 0.1386, "learning_rate": 1.9239819560168165e-06, "epoch": 0.5952918413415027, "percentage": 59.53, "elapsed_time": "20:22:56", "remaining_time": "13:51:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6462, "total_steps": 10853, "loss": 0.1361, "learning_rate": 1.9232406961792884e-06, "epoch": 0.5953839775187727, "percentage": 59.54, "elapsed_time": "20:23:06", "remaining_time": "13:51:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6463, "total_steps": 10853, "loss": 0.1223, "learning_rate": 1.9224994898939247e-06, "epoch": 0.5954761136960427, "percentage": 59.55, "elapsed_time": "20:23:18", "remaining_time": "13:50:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6464, "total_steps": 10853, "loss": 0.1257, "learning_rate": 1.9217583372295446e-06, "epoch": 0.5955682498733128, "percentage": 59.56, "elapsed_time": "20:23:28", "remaining_time": "13:50:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6465, "total_steps": 10853, "loss": 0.145, "learning_rate": 1.921017238254965e-06, "epoch": 0.5956603860505828, "percentage": 59.57, "elapsed_time": "20:23:38", "remaining_time": "13:50:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6466, "total_steps": 10853, "loss": 0.1299, "learning_rate": 1.920276193038997e-06, "epoch": 0.5957525222278528, "percentage": 59.58, "elapsed_time": "20:23:48", "remaining_time": "13:50:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6467, "total_steps": 10853, "loss": 0.1288, "learning_rate": 1.9195352016504486e-06, "epoch": 0.5958446584051228, "percentage": 59.59, "elapsed_time": "20:23:59", "remaining_time": "13:50:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6468, "total_steps": 10853, "loss": 0.1367, "learning_rate": 1.9187942641581174e-06, "epoch": 0.5959367945823928, "percentage": 59.6, "elapsed_time": "20:24:09", "remaining_time": "13:49:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6469, "total_steps": 10853, "loss": 0.1256, "learning_rate": 1.9180533806308017e-06, "epoch": 0.5960289307596628, "percentage": 59.61, "elapsed_time": "20:24:20", "remaining_time": "13:49:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6470, "total_steps": 10853, "loss": 0.1349, "learning_rate": 1.9173125511372923e-06, "epoch": 0.5961210669369328, "percentage": 59.61, "elapsed_time": "20:24:31", "remaining_time": "13:49:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6471, "total_steps": 10853, "loss": 0.1375, "learning_rate": 1.916571775746376e-06, "epoch": 0.5962132031142028, "percentage": 59.62, "elapsed_time": "20:24:40", "remaining_time": "13:49:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6472, "total_steps": 10853, "loss": 0.1412, "learning_rate": 1.915831054526832e-06, "epoch": 0.5963053392914728, "percentage": 59.63, "elapsed_time": "20:24:52", "remaining_time": "13:49:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6473, "total_steps": 10853, "loss": 0.1223, "learning_rate": 1.915090387547438e-06, "epoch": 0.5963974754687428, "percentage": 59.64, "elapsed_time": "20:25:04", "remaining_time": "13:48:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6474, "total_steps": 10853, "loss": 0.1307, "learning_rate": 1.914349774876964e-06, "epoch": 0.5964896116460128, "percentage": 59.65, "elapsed_time": "20:25:16", "remaining_time": "13:48:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6475, "total_steps": 10853, "loss": 0.1385, "learning_rate": 1.9136092165841776e-06, "epoch": 0.5965817478232828, "percentage": 59.66, "elapsed_time": "20:25:27", "remaining_time": "13:48:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6476, "total_steps": 10853, "loss": 0.1324, "learning_rate": 1.9128687127378376e-06, "epoch": 0.5966738840005528, "percentage": 59.67, "elapsed_time": "20:25:38", "remaining_time": "13:48:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6477, "total_steps": 10853, "loss": 0.1299, "learning_rate": 1.9121282634067008e-06, "epoch": 0.5967660201778229, "percentage": 59.68, "elapsed_time": "20:25:49", "remaining_time": "13:48:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6478, "total_steps": 10853, "loss": 0.1314, "learning_rate": 1.911387868659518e-06, "epoch": 0.5968581563550929, "percentage": 59.69, "elapsed_time": "20:25:59", "remaining_time": "13:47:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6479, "total_steps": 10853, "loss": 0.1144, "learning_rate": 1.9106475285650345e-06, "epoch": 0.5969502925323629, "percentage": 59.7, "elapsed_time": "20:26:09", "remaining_time": "13:47:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6480, "total_steps": 10853, "loss": 0.1352, "learning_rate": 1.909907243191993e-06, "epoch": 0.5970424287096329, "percentage": 59.71, "elapsed_time": "20:26:20", "remaining_time": "13:47:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6481, "total_steps": 10853, "loss": 0.1368, "learning_rate": 1.9091670126091264e-06, "epoch": 0.5971345648869029, "percentage": 59.72, "elapsed_time": "20:26:31", "remaining_time": "13:47:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6482, "total_steps": 10853, "loss": 0.1277, "learning_rate": 1.908426836885166e-06, "epoch": 0.5972267010641729, "percentage": 59.73, "elapsed_time": "20:26:42", "remaining_time": "13:47:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6483, "total_steps": 10853, "loss": 0.13, "learning_rate": 1.907686716088838e-06, "epoch": 0.5973188372414429, "percentage": 59.73, "elapsed_time": "20:26:51", "remaining_time": "13:46:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6484, "total_steps": 10853, "loss": 0.123, "learning_rate": 1.9069466502888625e-06, "epoch": 0.5974109734187129, "percentage": 59.74, "elapsed_time": "20:27:02", "remaining_time": "13:46:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6485, "total_steps": 10853, "loss": 0.1436, "learning_rate": 1.9062066395539535e-06, "epoch": 0.5975031095959829, "percentage": 59.75, "elapsed_time": "20:27:12", "remaining_time": "13:46:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6486, "total_steps": 10853, "loss": 0.1232, "learning_rate": 1.9054666839528225e-06, "epoch": 0.5975952457732528, "percentage": 59.76, "elapsed_time": "20:27:23", "remaining_time": "13:46:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6487, "total_steps": 10853, "loss": 0.1331, "learning_rate": 1.904726783554173e-06, "epoch": 0.5976873819505228, "percentage": 59.77, "elapsed_time": "20:27:33", "remaining_time": "13:46:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6488, "total_steps": 10853, "loss": 0.1305, "learning_rate": 1.903986938426707e-06, "epoch": 0.5977795181277928, "percentage": 59.78, "elapsed_time": "20:27:44", "remaining_time": "13:46:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6489, "total_steps": 10853, "loss": 0.1359, "learning_rate": 1.9032471486391175e-06, "epoch": 0.5978716543050628, "percentage": 59.79, "elapsed_time": "20:27:56", "remaining_time": "13:45:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6490, "total_steps": 10853, "loss": 0.1244, "learning_rate": 1.9025074142600935e-06, "epoch": 0.5979637904823328, "percentage": 59.8, "elapsed_time": "20:28:06", "remaining_time": "13:45:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6491, "total_steps": 10853, "loss": 0.1312, "learning_rate": 1.9017677353583213e-06, "epoch": 0.5980559266596029, "percentage": 59.81, "elapsed_time": "20:28:18", "remaining_time": "13:45:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6492, "total_steps": 10853, "loss": 0.1354, "learning_rate": 1.90102811200248e-06, "epoch": 0.5981480628368729, "percentage": 59.82, "elapsed_time": "20:28:30", "remaining_time": "13:45:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6493, "total_steps": 10853, "loss": 0.1296, "learning_rate": 1.9002885442612413e-06, "epoch": 0.5982401990141429, "percentage": 59.83, "elapsed_time": "20:28:40", "remaining_time": "13:45:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6494, "total_steps": 10853, "loss": 0.1177, "learning_rate": 1.8995490322032767e-06, "epoch": 0.5983323351914129, "percentage": 59.84, "elapsed_time": "20:28:49", "remaining_time": "13:44:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6495, "total_steps": 10853, "loss": 0.126, "learning_rate": 1.8988095758972485e-06, "epoch": 0.5984244713686829, "percentage": 59.85, "elapsed_time": "20:29:00", "remaining_time": "13:44:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6496, "total_steps": 10853, "loss": 0.1407, "learning_rate": 1.8980701754118168e-06, "epoch": 0.5985166075459529, "percentage": 59.85, "elapsed_time": "20:29:10", "remaining_time": "13:44:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6497, "total_steps": 10853, "loss": 0.146, "learning_rate": 1.8973308308156337e-06, "epoch": 0.5986087437232229, "percentage": 59.86, "elapsed_time": "20:29:21", "remaining_time": "13:44:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6498, "total_steps": 10853, "loss": 0.1385, "learning_rate": 1.8965915421773473e-06, "epoch": 0.5987008799004929, "percentage": 59.87, "elapsed_time": "20:29:31", "remaining_time": "13:44:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6499, "total_steps": 10853, "loss": 0.1264, "learning_rate": 1.8958523095656016e-06, "epoch": 0.5987930160777629, "percentage": 59.88, "elapsed_time": "20:29:41", "remaining_time": "13:43:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6500, "total_steps": 10853, "loss": 0.1209, "learning_rate": 1.8951131330490347e-06, "epoch": 0.5988851522550329, "percentage": 59.89, "elapsed_time": "20:29:51", "remaining_time": "13:43:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6500, "total_steps": 10853, "eval_loss": 0.1315893828868866, "epoch": 0.5988851522550329, "percentage": 59.89, "elapsed_time": "20:34:50", "remaining_time": "13:46:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6501, "total_steps": 10853, "loss": 0.1333, "learning_rate": 1.8943740126962774e-06, "epoch": 0.5989772884323029, "percentage": 59.9, "elapsed_time": "20:35:00", "remaining_time": "13:46:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6502, "total_steps": 10853, "loss": 0.1216, "learning_rate": 1.8936349485759586e-06, "epoch": 0.5990694246095729, "percentage": 59.91, "elapsed_time": "20:35:11", "remaining_time": "13:46:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6503, "total_steps": 10853, "loss": 0.1378, "learning_rate": 1.8928959407566994e-06, "epoch": 0.5991615607868429, "percentage": 59.92, "elapsed_time": "20:35:22", "remaining_time": "13:46:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6504, "total_steps": 10853, "loss": 0.1238, "learning_rate": 1.8921569893071187e-06, "epoch": 0.599253696964113, "percentage": 59.93, "elapsed_time": "20:35:32", "remaining_time": "13:46:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6505, "total_steps": 10853, "loss": 0.1328, "learning_rate": 1.8914180942958265e-06, "epoch": 0.599345833141383, "percentage": 59.94, "elapsed_time": "20:35:43", "remaining_time": "13:45:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6506, "total_steps": 10853, "loss": 0.1387, "learning_rate": 1.890679255791429e-06, "epoch": 0.599437969318653, "percentage": 59.95, "elapsed_time": "20:35:56", "remaining_time": "13:45:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6507, "total_steps": 10853, "loss": 0.1357, "learning_rate": 1.8899404738625288e-06, "epoch": 0.599530105495923, "percentage": 59.96, "elapsed_time": "20:36:09", "remaining_time": "13:45:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6508, "total_steps": 10853, "loss": 0.1314, "learning_rate": 1.8892017485777208e-06, "epoch": 0.599622241673193, "percentage": 59.96, "elapsed_time": "20:36:20", "remaining_time": "13:45:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6509, "total_steps": 10853, "loss": 0.1223, "learning_rate": 1.8884630800055973e-06, "epoch": 0.599714377850463, "percentage": 59.97, "elapsed_time": "20:36:29", "remaining_time": "13:45:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6510, "total_steps": 10853, "loss": 0.1371, "learning_rate": 1.8877244682147419e-06, "epoch": 0.599806514027733, "percentage": 59.98, "elapsed_time": "20:36:41", "remaining_time": "13:45:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6511, "total_steps": 10853, "loss": 0.1346, "learning_rate": 1.886985913273735e-06, "epoch": 0.599898650205003, "percentage": 59.99, "elapsed_time": "20:36:51", "remaining_time": "13:44:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6512, "total_steps": 10853, "loss": 0.1506, "learning_rate": 1.8862474152511529e-06, "epoch": 0.599990786382273, "percentage": 60.0, "elapsed_time": "20:37:02", "remaining_time": "13:44:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6513, "total_steps": 10853, "loss": 0.1314, "learning_rate": 1.8855089742155647e-06, "epoch": 0.600082922559543, "percentage": 60.01, "elapsed_time": "20:37:13", "remaining_time": "13:44:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6514, "total_steps": 10853, "loss": 0.1349, "learning_rate": 1.8847705902355332e-06, "epoch": 0.600175058736813, "percentage": 60.02, "elapsed_time": "20:37:24", "remaining_time": "13:44:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6515, "total_steps": 10853, "loss": 0.126, "learning_rate": 1.8840322633796191e-06, "epoch": 0.600267194914083, "percentage": 60.03, "elapsed_time": "20:37:34", "remaining_time": "13:44:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6516, "total_steps": 10853, "loss": 0.1241, "learning_rate": 1.8832939937163753e-06, "epoch": 0.600359331091353, "percentage": 60.04, "elapsed_time": "20:37:45", "remaining_time": "13:43:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6517, "total_steps": 10853, "loss": 0.1313, "learning_rate": 1.8825557813143513e-06, "epoch": 0.600451467268623, "percentage": 60.05, "elapsed_time": "20:37:57", "remaining_time": "13:43:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6518, "total_steps": 10853, "loss": 0.1217, "learning_rate": 1.8818176262420893e-06, "epoch": 0.6005436034458931, "percentage": 60.06, "elapsed_time": "20:38:07", "remaining_time": "13:43:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6519, "total_steps": 10853, "loss": 0.1133, "learning_rate": 1.8810795285681263e-06, "epoch": 0.6006357396231631, "percentage": 60.07, "elapsed_time": "20:38:18", "remaining_time": "13:43:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6520, "total_steps": 10853, "loss": 0.1384, "learning_rate": 1.8803414883609967e-06, "epoch": 0.6007278758004331, "percentage": 60.08, "elapsed_time": "20:38:28", "remaining_time": "13:43:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6521, "total_steps": 10853, "loss": 0.1218, "learning_rate": 1.8796035056892268e-06, "epoch": 0.6008200119777031, "percentage": 60.08, "elapsed_time": "20:38:38", "remaining_time": "13:42:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6522, "total_steps": 10853, "loss": 0.1251, "learning_rate": 1.8788655806213372e-06, "epoch": 0.6009121481549731, "percentage": 60.09, "elapsed_time": "20:38:49", "remaining_time": "13:42:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6523, "total_steps": 10853, "loss": 0.1349, "learning_rate": 1.8781277132258458e-06, "epoch": 0.6010042843322431, "percentage": 60.1, "elapsed_time": "20:38:59", "remaining_time": "13:42:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6524, "total_steps": 10853, "loss": 0.1349, "learning_rate": 1.8773899035712622e-06, "epoch": 0.6010964205095131, "percentage": 60.11, "elapsed_time": "20:39:09", "remaining_time": "13:42:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6525, "total_steps": 10853, "loss": 0.1216, "learning_rate": 1.8766521517260946e-06, "epoch": 0.6011885566867831, "percentage": 60.12, "elapsed_time": "20:39:18", "remaining_time": "13:42:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6526, "total_steps": 10853, "loss": 0.1414, "learning_rate": 1.875914457758841e-06, "epoch": 0.6012806928640531, "percentage": 60.13, "elapsed_time": "20:39:29", "remaining_time": "13:41:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6527, "total_steps": 10853, "loss": 0.1283, "learning_rate": 1.8751768217379973e-06, "epoch": 0.601372829041323, "percentage": 60.14, "elapsed_time": "20:39:39", "remaining_time": "13:41:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6528, "total_steps": 10853, "loss": 0.1317, "learning_rate": 1.874439243732053e-06, "epoch": 0.601464965218593, "percentage": 60.15, "elapsed_time": "20:39:48", "remaining_time": "13:41:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6529, "total_steps": 10853, "loss": 0.1323, "learning_rate": 1.8737017238094926e-06, "epoch": 0.601557101395863, "percentage": 60.16, "elapsed_time": "20:40:00", "remaining_time": "13:41:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6530, "total_steps": 10853, "loss": 0.1264, "learning_rate": 1.8729642620387935e-06, "epoch": 0.601649237573133, "percentage": 60.17, "elapsed_time": "20:40:11", "remaining_time": "13:41:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6531, "total_steps": 10853, "loss": 0.1385, "learning_rate": 1.8722268584884312e-06, "epoch": 0.601741373750403, "percentage": 60.18, "elapsed_time": "20:40:22", "remaining_time": "13:40:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6532, "total_steps": 10853, "loss": 0.1387, "learning_rate": 1.8714895132268718e-06, "epoch": 0.6018335099276731, "percentage": 60.19, "elapsed_time": "20:40:34", "remaining_time": "13:40:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6533, "total_steps": 10853, "loss": 0.1388, "learning_rate": 1.8707522263225797e-06, "epoch": 0.6019256461049431, "percentage": 60.2, "elapsed_time": "20:40:45", "remaining_time": "13:40:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6534, "total_steps": 10853, "loss": 0.1287, "learning_rate": 1.8700149978440105e-06, "epoch": 0.6020177822822131, "percentage": 60.2, "elapsed_time": "20:40:55", "remaining_time": "13:40:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6535, "total_steps": 10853, "loss": 0.1321, "learning_rate": 1.8692778278596162e-06, "epoch": 0.6021099184594831, "percentage": 60.21, "elapsed_time": "20:41:06", "remaining_time": "13:40:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6536, "total_steps": 10853, "loss": 0.1338, "learning_rate": 1.868540716437844e-06, "epoch": 0.6022020546367531, "percentage": 60.22, "elapsed_time": "20:41:16", "remaining_time": "13:39:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6537, "total_steps": 10853, "loss": 0.1269, "learning_rate": 1.8678036636471336e-06, "epoch": 0.6022941908140231, "percentage": 60.23, "elapsed_time": "20:41:27", "remaining_time": "13:39:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6538, "total_steps": 10853, "loss": 0.1431, "learning_rate": 1.867066669555922e-06, "epoch": 0.6023863269912931, "percentage": 60.24, "elapsed_time": "20:41:38", "remaining_time": "13:39:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6539, "total_steps": 10853, "loss": 0.1363, "learning_rate": 1.8663297342326381e-06, "epoch": 0.6024784631685631, "percentage": 60.25, "elapsed_time": "20:41:49", "remaining_time": "13:39:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6540, "total_steps": 10853, "loss": 0.1231, "learning_rate": 1.8655928577457058e-06, "epoch": 0.6025705993458331, "percentage": 60.26, "elapsed_time": "20:42:00", "remaining_time": "13:39:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6541, "total_steps": 10853, "loss": 0.134, "learning_rate": 1.8648560401635448e-06, "epoch": 0.6026627355231031, "percentage": 60.27, "elapsed_time": "20:42:10", "remaining_time": "13:38:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6542, "total_steps": 10853, "loss": 0.1301, "learning_rate": 1.8641192815545705e-06, "epoch": 0.6027548717003731, "percentage": 60.28, "elapsed_time": "20:42:20", "remaining_time": "13:38:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6543, "total_steps": 10853, "loss": 0.1347, "learning_rate": 1.8633825819871881e-06, "epoch": 0.6028470078776431, "percentage": 60.29, "elapsed_time": "20:42:31", "remaining_time": "13:38:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6544, "total_steps": 10853, "loss": 0.122, "learning_rate": 1.8626459415298012e-06, "epoch": 0.6029391440549131, "percentage": 60.3, "elapsed_time": "20:42:42", "remaining_time": "13:38:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6545, "total_steps": 10853, "loss": 0.1173, "learning_rate": 1.8619093602508075e-06, "epoch": 0.6030312802321832, "percentage": 60.31, "elapsed_time": "20:42:53", "remaining_time": "13:38:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6546, "total_steps": 10853, "loss": 0.1338, "learning_rate": 1.8611728382185995e-06, "epoch": 0.6031234164094532, "percentage": 60.32, "elapsed_time": "20:43:05", "remaining_time": "13:37:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6547, "total_steps": 10853, "loss": 0.1228, "learning_rate": 1.860436375501561e-06, "epoch": 0.6032155525867232, "percentage": 60.32, "elapsed_time": "20:43:16", "remaining_time": "13:37:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6548, "total_steps": 10853, "loss": 0.138, "learning_rate": 1.8596999721680743e-06, "epoch": 0.6033076887639932, "percentage": 60.33, "elapsed_time": "20:43:26", "remaining_time": "13:37:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6549, "total_steps": 10853, "loss": 0.136, "learning_rate": 1.858963628286513e-06, "epoch": 0.6033998249412632, "percentage": 60.34, "elapsed_time": "20:43:37", "remaining_time": "13:37:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6550, "total_steps": 10853, "loss": 0.1295, "learning_rate": 1.8582273439252497e-06, "epoch": 0.6034919611185332, "percentage": 60.35, "elapsed_time": "20:43:47", "remaining_time": "13:37:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6551, "total_steps": 10853, "loss": 0.1199, "learning_rate": 1.8574911191526456e-06, "epoch": 0.6035840972958032, "percentage": 60.36, "elapsed_time": "20:43:58", "remaining_time": "13:36:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6552, "total_steps": 10853, "loss": 0.1419, "learning_rate": 1.85675495403706e-06, "epoch": 0.6036762334730732, "percentage": 60.37, "elapsed_time": "20:44:10", "remaining_time": "13:36:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6553, "total_steps": 10853, "loss": 0.1257, "learning_rate": 1.8560188486468463e-06, "epoch": 0.6037683696503432, "percentage": 60.38, "elapsed_time": "20:44:22", "remaining_time": "13:36:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6554, "total_steps": 10853, "loss": 0.1362, "learning_rate": 1.8552828030503528e-06, "epoch": 0.6038605058276132, "percentage": 60.39, "elapsed_time": "20:44:32", "remaining_time": "13:36:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6555, "total_steps": 10853, "loss": 0.1247, "learning_rate": 1.854546817315919e-06, "epoch": 0.6039526420048832, "percentage": 60.4, "elapsed_time": "20:44:42", "remaining_time": "13:36:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6556, "total_steps": 10853, "loss": 0.1385, "learning_rate": 1.8538108915118833e-06, "epoch": 0.6040447781821532, "percentage": 60.41, "elapsed_time": "20:44:54", "remaining_time": "13:35:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6557, "total_steps": 10853, "loss": 0.1299, "learning_rate": 1.8530750257065752e-06, "epoch": 0.6041369143594232, "percentage": 60.42, "elapsed_time": "20:45:06", "remaining_time": "13:35:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6558, "total_steps": 10853, "loss": 0.1232, "learning_rate": 1.8523392199683218e-06, "epoch": 0.6042290505366932, "percentage": 60.43, "elapsed_time": "20:45:17", "remaining_time": "13:35:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6559, "total_steps": 10853, "loss": 0.1381, "learning_rate": 1.851603474365441e-06, "epoch": 0.6043211867139633, "percentage": 60.43, "elapsed_time": "20:45:27", "remaining_time": "13:35:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6560, "total_steps": 10853, "loss": 0.1425, "learning_rate": 1.8508677889662469e-06, "epoch": 0.6044133228912333, "percentage": 60.44, "elapsed_time": "20:45:37", "remaining_time": "13:35:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6561, "total_steps": 10853, "loss": 0.1305, "learning_rate": 1.850132163839049e-06, "epoch": 0.6045054590685033, "percentage": 60.45, "elapsed_time": "20:45:48", "remaining_time": "13:34:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6562, "total_steps": 10853, "loss": 0.1161, "learning_rate": 1.849396599052149e-06, "epoch": 0.6045975952457733, "percentage": 60.46, "elapsed_time": "20:45:59", "remaining_time": "13:34:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6563, "total_steps": 10853, "loss": 0.126, "learning_rate": 1.848661094673846e-06, "epoch": 0.6046897314230433, "percentage": 60.47, "elapsed_time": "20:46:09", "remaining_time": "13:34:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6564, "total_steps": 10853, "loss": 0.1187, "learning_rate": 1.8479256507724297e-06, "epoch": 0.6047818676003133, "percentage": 60.48, "elapsed_time": "20:46:20", "remaining_time": "13:34:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6565, "total_steps": 10853, "loss": 0.1475, "learning_rate": 1.8471902674161863e-06, "epoch": 0.6048740037775833, "percentage": 60.49, "elapsed_time": "20:46:31", "remaining_time": "13:34:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6566, "total_steps": 10853, "loss": 0.1355, "learning_rate": 1.8464549446733976e-06, "epoch": 0.6049661399548533, "percentage": 60.5, "elapsed_time": "20:46:42", "remaining_time": "13:33:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6567, "total_steps": 10853, "loss": 0.1254, "learning_rate": 1.8457196826123381e-06, "epoch": 0.6050582761321233, "percentage": 60.51, "elapsed_time": "20:46:52", "remaining_time": "13:33:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6568, "total_steps": 10853, "loss": 0.1238, "learning_rate": 1.8449844813012755e-06, "epoch": 0.6051504123093933, "percentage": 60.52, "elapsed_time": "20:47:01", "remaining_time": "13:33:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6569, "total_steps": 10853, "loss": 0.135, "learning_rate": 1.8442493408084746e-06, "epoch": 0.6052425484866633, "percentage": 60.53, "elapsed_time": "20:47:11", "remaining_time": "13:33:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6570, "total_steps": 10853, "loss": 0.1356, "learning_rate": 1.8435142612021929e-06, "epoch": 0.6053346846639333, "percentage": 60.54, "elapsed_time": "20:47:22", "remaining_time": "13:33:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6571, "total_steps": 10853, "loss": 0.1255, "learning_rate": 1.8427792425506833e-06, "epoch": 0.6054268208412033, "percentage": 60.55, "elapsed_time": "20:47:33", "remaining_time": "13:32:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6572, "total_steps": 10853, "loss": 0.136, "learning_rate": 1.8420442849221915e-06, "epoch": 0.6055189570184734, "percentage": 60.55, "elapsed_time": "20:47:44", "remaining_time": "13:32:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6573, "total_steps": 10853, "loss": 0.1181, "learning_rate": 1.8413093883849579e-06, "epoch": 0.6056110931957434, "percentage": 60.56, "elapsed_time": "20:47:54", "remaining_time": "13:32:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6574, "total_steps": 10853, "loss": 0.1281, "learning_rate": 1.840574553007219e-06, "epoch": 0.6057032293730134, "percentage": 60.57, "elapsed_time": "20:48:05", "remaining_time": "13:32:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6575, "total_steps": 10853, "loss": 0.1345, "learning_rate": 1.8398397788572046e-06, "epoch": 0.6057953655502833, "percentage": 60.58, "elapsed_time": "20:48:15", "remaining_time": "13:32:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6576, "total_steps": 10853, "loss": 0.142, "learning_rate": 1.8391050660031364e-06, "epoch": 0.6058875017275533, "percentage": 60.59, "elapsed_time": "20:48:27", "remaining_time": "13:31:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6577, "total_steps": 10853, "loss": 0.1328, "learning_rate": 1.8383704145132347e-06, "epoch": 0.6059796379048233, "percentage": 60.6, "elapsed_time": "20:48:38", "remaining_time": "13:31:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6578, "total_steps": 10853, "loss": 0.1405, "learning_rate": 1.8376358244557108e-06, "epoch": 0.6060717740820933, "percentage": 60.61, "elapsed_time": "20:48:49", "remaining_time": "13:31:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6579, "total_steps": 10853, "loss": 0.1294, "learning_rate": 1.8369012958987728e-06, "epoch": 0.6061639102593633, "percentage": 60.62, "elapsed_time": "20:49:00", "remaining_time": "13:31:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6580, "total_steps": 10853, "loss": 0.1404, "learning_rate": 1.8361668289106204e-06, "epoch": 0.6062560464366333, "percentage": 60.63, "elapsed_time": "20:49:11", "remaining_time": "13:31:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6581, "total_steps": 10853, "loss": 0.1409, "learning_rate": 1.8354324235594488e-06, "epoch": 0.6063481826139033, "percentage": 60.64, "elapsed_time": "20:49:21", "remaining_time": "13:31:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6582, "total_steps": 10853, "loss": 0.1232, "learning_rate": 1.8346980799134485e-06, "epoch": 0.6064403187911733, "percentage": 60.65, "elapsed_time": "20:49:31", "remaining_time": "13:30:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6583, "total_steps": 10853, "loss": 0.1153, "learning_rate": 1.8339637980408038e-06, "epoch": 0.6065324549684433, "percentage": 60.66, "elapsed_time": "20:49:42", "remaining_time": "13:30:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6584, "total_steps": 10853, "loss": 0.1303, "learning_rate": 1.833229578009691e-06, "epoch": 0.6066245911457133, "percentage": 60.67, "elapsed_time": "20:49:54", "remaining_time": "13:30:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6585, "total_steps": 10853, "loss": 0.1438, "learning_rate": 1.8324954198882843e-06, "epoch": 0.6067167273229833, "percentage": 60.67, "elapsed_time": "20:50:06", "remaining_time": "13:30:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6586, "total_steps": 10853, "loss": 0.1214, "learning_rate": 1.831761323744749e-06, "epoch": 0.6068088635002534, "percentage": 60.68, "elapsed_time": "20:50:16", "remaining_time": "13:30:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6587, "total_steps": 10853, "loss": 0.1257, "learning_rate": 1.831027289647248e-06, "epoch": 0.6069009996775234, "percentage": 60.69, "elapsed_time": "20:50:26", "remaining_time": "13:29:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6588, "total_steps": 10853, "loss": 0.1326, "learning_rate": 1.8302933176639346e-06, "epoch": 0.6069931358547934, "percentage": 60.7, "elapsed_time": "20:50:37", "remaining_time": "13:29:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6589, "total_steps": 10853, "loss": 0.1313, "learning_rate": 1.829559407862958e-06, "epoch": 0.6070852720320634, "percentage": 60.71, "elapsed_time": "20:50:48", "remaining_time": "13:29:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6590, "total_steps": 10853, "loss": 0.1338, "learning_rate": 1.8288255603124632e-06, "epoch": 0.6071774082093334, "percentage": 60.72, "elapsed_time": "20:50:59", "remaining_time": "13:29:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6591, "total_steps": 10853, "loss": 0.1259, "learning_rate": 1.8280917750805865e-06, "epoch": 0.6072695443866034, "percentage": 60.73, "elapsed_time": "20:51:10", "remaining_time": "13:29:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6592, "total_steps": 10853, "loss": 0.1189, "learning_rate": 1.8273580522354622e-06, "epoch": 0.6073616805638734, "percentage": 60.74, "elapsed_time": "20:51:18", "remaining_time": "13:28:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6593, "total_steps": 10853, "loss": 0.128, "learning_rate": 1.8266243918452149e-06, "epoch": 0.6074538167411434, "percentage": 60.75, "elapsed_time": "20:51:30", "remaining_time": "13:28:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6594, "total_steps": 10853, "loss": 0.128, "learning_rate": 1.825890793977964e-06, "epoch": 0.6075459529184134, "percentage": 60.76, "elapsed_time": "20:51:40", "remaining_time": "13:28:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6595, "total_steps": 10853, "loss": 0.1515, "learning_rate": 1.8251572587018268e-06, "epoch": 0.6076380890956834, "percentage": 60.77, "elapsed_time": "20:51:50", "remaining_time": "13:28:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6596, "total_steps": 10853, "loss": 0.1322, "learning_rate": 1.8244237860849108e-06, "epoch": 0.6077302252729534, "percentage": 60.78, "elapsed_time": "20:52:01", "remaining_time": "13:28:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6597, "total_steps": 10853, "loss": 0.1176, "learning_rate": 1.8236903761953178e-06, "epoch": 0.6078223614502234, "percentage": 60.79, "elapsed_time": "20:52:12", "remaining_time": "13:27:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6598, "total_steps": 10853, "loss": 0.1168, "learning_rate": 1.8229570291011468e-06, "epoch": 0.6079144976274934, "percentage": 60.79, "elapsed_time": "20:52:24", "remaining_time": "13:27:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6599, "total_steps": 10853, "loss": 0.1301, "learning_rate": 1.8222237448704882e-06, "epoch": 0.6080066338047634, "percentage": 60.8, "elapsed_time": "20:52:37", "remaining_time": "13:27:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6600, "total_steps": 10853, "loss": 0.128, "learning_rate": 1.8214905235714286e-06, "epoch": 0.6080987699820335, "percentage": 60.81, "elapsed_time": "20:52:47", "remaining_time": "13:27:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6601, "total_steps": 10853, "loss": 0.1161, "learning_rate": 1.8207573652720467e-06, "epoch": 0.6081909061593035, "percentage": 60.82, "elapsed_time": "20:52:58", "remaining_time": "13:27:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6602, "total_steps": 10853, "loss": 0.1201, "learning_rate": 1.8200242700404159e-06, "epoch": 0.6082830423365735, "percentage": 60.83, "elapsed_time": "20:53:09", "remaining_time": "13:26:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6603, "total_steps": 10853, "loss": 0.1226, "learning_rate": 1.8192912379446048e-06, "epoch": 0.6083751785138435, "percentage": 60.84, "elapsed_time": "20:53:18", "remaining_time": "13:26:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6604, "total_steps": 10853, "loss": 0.1332, "learning_rate": 1.8185582690526765e-06, "epoch": 0.6084673146911135, "percentage": 60.85, "elapsed_time": "20:53:29", "remaining_time": "13:26:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6605, "total_steps": 10853, "loss": 0.1323, "learning_rate": 1.8178253634326854e-06, "epoch": 0.6085594508683835, "percentage": 60.86, "elapsed_time": "20:53:39", "remaining_time": "13:26:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6606, "total_steps": 10853, "loss": 0.1243, "learning_rate": 1.817092521152683e-06, "epoch": 0.6086515870456535, "percentage": 60.87, "elapsed_time": "20:53:50", "remaining_time": "13:26:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6607, "total_steps": 10853, "loss": 0.1309, "learning_rate": 1.816359742280713e-06, "epoch": 0.6087437232229235, "percentage": 60.88, "elapsed_time": "20:54:01", "remaining_time": "13:25:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6608, "total_steps": 10853, "loss": 0.1183, "learning_rate": 1.8156270268848155e-06, "epoch": 0.6088358594001935, "percentage": 60.89, "elapsed_time": "20:54:11", "remaining_time": "13:25:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6609, "total_steps": 10853, "loss": 0.1296, "learning_rate": 1.8148943750330216e-06, "epoch": 0.6089279955774635, "percentage": 60.9, "elapsed_time": "20:54:23", "remaining_time": "13:25:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6610, "total_steps": 10853, "loss": 0.1215, "learning_rate": 1.8141617867933586e-06, "epoch": 0.6090201317547335, "percentage": 60.9, "elapsed_time": "20:54:33", "remaining_time": "13:25:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6611, "total_steps": 10853, "loss": 0.1316, "learning_rate": 1.813429262233848e-06, "epoch": 0.6091122679320035, "percentage": 60.91, "elapsed_time": "20:54:45", "remaining_time": "13:25:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6612, "total_steps": 10853, "loss": 0.1381, "learning_rate": 1.8126968014225044e-06, "epoch": 0.6092044041092735, "percentage": 60.92, "elapsed_time": "20:54:58", "remaining_time": "13:24:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6613, "total_steps": 10853, "loss": 0.1357, "learning_rate": 1.811964404427336e-06, "epoch": 0.6092965402865436, "percentage": 60.93, "elapsed_time": "20:55:08", "remaining_time": "13:24:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6614, "total_steps": 10853, "loss": 0.1118, "learning_rate": 1.811232071316347e-06, "epoch": 0.6093886764638136, "percentage": 60.94, "elapsed_time": "20:55:19", "remaining_time": "13:24:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6615, "total_steps": 10853, "loss": 0.1295, "learning_rate": 1.8104998021575337e-06, "epoch": 0.6094808126410836, "percentage": 60.95, "elapsed_time": "20:55:30", "remaining_time": "13:24:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6616, "total_steps": 10853, "loss": 0.1327, "learning_rate": 1.8097675970188894e-06, "epoch": 0.6095729488183536, "percentage": 60.96, "elapsed_time": "20:55:40", "remaining_time": "13:24:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6617, "total_steps": 10853, "loss": 0.1378, "learning_rate": 1.8090354559683972e-06, "epoch": 0.6096650849956236, "percentage": 60.97, "elapsed_time": "20:55:50", "remaining_time": "13:23:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6618, "total_steps": 10853, "loss": 0.1289, "learning_rate": 1.8083033790740368e-06, "epoch": 0.6097572211728935, "percentage": 60.98, "elapsed_time": "20:56:01", "remaining_time": "13:23:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6619, "total_steps": 10853, "loss": 0.1289, "learning_rate": 1.8075713664037823e-06, "epoch": 0.6098493573501635, "percentage": 60.99, "elapsed_time": "20:56:11", "remaining_time": "13:23:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6620, "total_steps": 10853, "loss": 0.1275, "learning_rate": 1.806839418025601e-06, "epoch": 0.6099414935274335, "percentage": 61.0, "elapsed_time": "20:56:22", "remaining_time": "13:23:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6621, "total_steps": 10853, "loss": 0.1297, "learning_rate": 1.8061075340074556e-06, "epoch": 0.6100336297047035, "percentage": 61.01, "elapsed_time": "20:56:33", "remaining_time": "13:23:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6622, "total_steps": 10853, "loss": 0.1237, "learning_rate": 1.8053757144172987e-06, "epoch": 0.6101257658819735, "percentage": 61.02, "elapsed_time": "20:56:44", "remaining_time": "13:22:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6623, "total_steps": 10853, "loss": 0.1147, "learning_rate": 1.8046439593230822e-06, "epoch": 0.6102179020592435, "percentage": 61.02, "elapsed_time": "20:56:55", "remaining_time": "13:22:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6624, "total_steps": 10853, "loss": 0.1386, "learning_rate": 1.8039122687927485e-06, "epoch": 0.6103100382365135, "percentage": 61.03, "elapsed_time": "20:57:06", "remaining_time": "13:22:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6625, "total_steps": 10853, "loss": 0.1389, "learning_rate": 1.803180642894236e-06, "epoch": 0.6104021744137835, "percentage": 61.04, "elapsed_time": "20:57:18", "remaining_time": "13:22:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6626, "total_steps": 10853, "loss": 0.1269, "learning_rate": 1.802449081695476e-06, "epoch": 0.6104943105910535, "percentage": 61.05, "elapsed_time": "20:57:29", "remaining_time": "13:22:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6627, "total_steps": 10853, "loss": 0.1282, "learning_rate": 1.801717585264393e-06, "epoch": 0.6105864467683236, "percentage": 61.06, "elapsed_time": "20:57:40", "remaining_time": "13:22:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6628, "total_steps": 10853, "loss": 0.125, "learning_rate": 1.800986153668908e-06, "epoch": 0.6106785829455936, "percentage": 61.07, "elapsed_time": "20:57:52", "remaining_time": "13:21:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6629, "total_steps": 10853, "loss": 0.1297, "learning_rate": 1.8002547869769344e-06, "epoch": 0.6107707191228636, "percentage": 61.08, "elapsed_time": "20:58:02", "remaining_time": "13:21:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6630, "total_steps": 10853, "loss": 0.1228, "learning_rate": 1.7995234852563779e-06, "epoch": 0.6108628553001336, "percentage": 61.09, "elapsed_time": "20:58:11", "remaining_time": "13:21:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6631, "total_steps": 10853, "loss": 0.1383, "learning_rate": 1.7987922485751418e-06, "epoch": 0.6109549914774036, "percentage": 61.1, "elapsed_time": "20:58:22", "remaining_time": "13:21:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6632, "total_steps": 10853, "loss": 0.1217, "learning_rate": 1.7980610770011203e-06, "epoch": 0.6110471276546736, "percentage": 61.11, "elapsed_time": "20:58:32", "remaining_time": "13:21:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6633, "total_steps": 10853, "loss": 0.1289, "learning_rate": 1.7973299706022046e-06, "epoch": 0.6111392638319436, "percentage": 61.12, "elapsed_time": "20:58:42", "remaining_time": "13:20:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6634, "total_steps": 10853, "loss": 0.1196, "learning_rate": 1.796598929446276e-06, "epoch": 0.6112314000092136, "percentage": 61.13, "elapsed_time": "20:58:53", "remaining_time": "13:20:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6635, "total_steps": 10853, "loss": 0.1207, "learning_rate": 1.7958679536012118e-06, "epoch": 0.6113235361864836, "percentage": 61.14, "elapsed_time": "20:59:04", "remaining_time": "13:20:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6636, "total_steps": 10853, "loss": 0.1232, "learning_rate": 1.795137043134885e-06, "epoch": 0.6114156723637536, "percentage": 61.14, "elapsed_time": "20:59:16", "remaining_time": "13:20:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6637, "total_steps": 10853, "loss": 0.1374, "learning_rate": 1.7944061981151598e-06, "epoch": 0.6115078085410236, "percentage": 61.15, "elapsed_time": "20:59:27", "remaining_time": "13:20:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6638, "total_steps": 10853, "loss": 0.124, "learning_rate": 1.793675418609894e-06, "epoch": 0.6115999447182936, "percentage": 61.16, "elapsed_time": "20:59:38", "remaining_time": "13:19:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6639, "total_steps": 10853, "loss": 0.1253, "learning_rate": 1.792944704686942e-06, "epoch": 0.6116920808955636, "percentage": 61.17, "elapsed_time": "20:59:50", "remaining_time": "13:19:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6640, "total_steps": 10853, "loss": 0.1204, "learning_rate": 1.79221405641415e-06, "epoch": 0.6117842170728337, "percentage": 61.18, "elapsed_time": "21:00:01", "remaining_time": "13:19:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6641, "total_steps": 10853, "loss": 0.1339, "learning_rate": 1.79148347385936e-06, "epoch": 0.6118763532501037, "percentage": 61.19, "elapsed_time": "21:00:11", "remaining_time": "13:19:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6642, "total_steps": 10853, "loss": 0.1285, "learning_rate": 1.790752957090405e-06, "epoch": 0.6119684894273737, "percentage": 61.2, "elapsed_time": "21:00:22", "remaining_time": "13:19:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6643, "total_steps": 10853, "loss": 0.1305, "learning_rate": 1.7900225061751136e-06, "epoch": 0.6120606256046437, "percentage": 61.21, "elapsed_time": "21:00:33", "remaining_time": "13:18:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6644, "total_steps": 10853, "loss": 0.1205, "learning_rate": 1.78929212118131e-06, "epoch": 0.6121527617819137, "percentage": 61.22, "elapsed_time": "21:00:44", "remaining_time": "13:18:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6645, "total_steps": 10853, "loss": 0.1253, "learning_rate": 1.7885618021768097e-06, "epoch": 0.6122448979591837, "percentage": 61.23, "elapsed_time": "21:00:55", "remaining_time": "13:18:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6646, "total_steps": 10853, "loss": 0.1248, "learning_rate": 1.7878315492294213e-06, "epoch": 0.6123370341364537, "percentage": 61.24, "elapsed_time": "21:01:04", "remaining_time": "13:18:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6647, "total_steps": 10853, "loss": 0.1391, "learning_rate": 1.7871013624069511e-06, "epoch": 0.6124291703137237, "percentage": 61.25, "elapsed_time": "21:01:13", "remaining_time": "13:18:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6648, "total_steps": 10853, "loss": 0.1348, "learning_rate": 1.7863712417771956e-06, "epoch": 0.6125213064909937, "percentage": 61.25, "elapsed_time": "21:01:24", "remaining_time": "13:17:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6649, "total_steps": 10853, "loss": 0.1402, "learning_rate": 1.7856411874079475e-06, "epoch": 0.6126134426682637, "percentage": 61.26, "elapsed_time": "21:01:35", "remaining_time": "13:17:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6650, "total_steps": 10853, "loss": 0.1345, "learning_rate": 1.7849111993669924e-06, "epoch": 0.6127055788455337, "percentage": 61.27, "elapsed_time": "21:01:46", "remaining_time": "13:17:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6651, "total_steps": 10853, "loss": 0.1246, "learning_rate": 1.7841812777221085e-06, "epoch": 0.6127977150228037, "percentage": 61.28, "elapsed_time": "21:01:57", "remaining_time": "13:17:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6652, "total_steps": 10853, "loss": 0.1283, "learning_rate": 1.7834514225410704e-06, "epoch": 0.6128898512000737, "percentage": 61.29, "elapsed_time": "21:02:08", "remaining_time": "13:17:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6653, "total_steps": 10853, "loss": 0.1362, "learning_rate": 1.7827216338916444e-06, "epoch": 0.6129819873773437, "percentage": 61.3, "elapsed_time": "21:02:20", "remaining_time": "13:16:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6654, "total_steps": 10853, "loss": 0.1384, "learning_rate": 1.781991911841593e-06, "epoch": 0.6130741235546138, "percentage": 61.31, "elapsed_time": "21:02:30", "remaining_time": "13:16:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6655, "total_steps": 10853, "loss": 0.1197, "learning_rate": 1.7812622564586695e-06, "epoch": 0.6131662597318838, "percentage": 61.32, "elapsed_time": "21:02:40", "remaining_time": "13:16:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6656, "total_steps": 10853, "loss": 0.1306, "learning_rate": 1.7805326678106221e-06, "epoch": 0.6132583959091538, "percentage": 61.33, "elapsed_time": "21:02:51", "remaining_time": "13:16:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6657, "total_steps": 10853, "loss": 0.1205, "learning_rate": 1.7798031459651942e-06, "epoch": 0.6133505320864238, "percentage": 61.34, "elapsed_time": "21:03:02", "remaining_time": "13:16:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6658, "total_steps": 10853, "loss": 0.1251, "learning_rate": 1.7790736909901228e-06, "epoch": 0.6134426682636938, "percentage": 61.35, "elapsed_time": "21:03:12", "remaining_time": "13:15:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6659, "total_steps": 10853, "loss": 0.1252, "learning_rate": 1.7783443029531352e-06, "epoch": 0.6135348044409638, "percentage": 61.36, "elapsed_time": "21:03:22", "remaining_time": "13:15:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6660, "total_steps": 10853, "loss": 0.1355, "learning_rate": 1.7776149819219574e-06, "epoch": 0.6136269406182338, "percentage": 61.37, "elapsed_time": "21:03:33", "remaining_time": "13:15:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6661, "total_steps": 10853, "loss": 0.1263, "learning_rate": 1.776885727964306e-06, "epoch": 0.6137190767955037, "percentage": 61.37, "elapsed_time": "21:03:41", "remaining_time": "13:15:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6662, "total_steps": 10853, "loss": 0.1341, "learning_rate": 1.7761565411478935e-06, "epoch": 0.6138112129727737, "percentage": 61.38, "elapsed_time": "21:03:53", "remaining_time": "13:15:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6663, "total_steps": 10853, "loss": 0.139, "learning_rate": 1.7754274215404234e-06, "epoch": 0.6139033491500437, "percentage": 61.39, "elapsed_time": "21:04:04", "remaining_time": "13:14:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6664, "total_steps": 10853, "loss": 0.1273, "learning_rate": 1.7746983692095947e-06, "epoch": 0.6139954853273137, "percentage": 61.4, "elapsed_time": "21:04:14", "remaining_time": "13:14:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6665, "total_steps": 10853, "loss": 0.1192, "learning_rate": 1.7739693842231008e-06, "epoch": 0.6140876215045837, "percentage": 61.41, "elapsed_time": "21:04:24", "remaining_time": "13:14:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6666, "total_steps": 10853, "loss": 0.1402, "learning_rate": 1.7732404666486289e-06, "epoch": 0.6141797576818537, "percentage": 61.42, "elapsed_time": "21:04:36", "remaining_time": "13:14:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6667, "total_steps": 10853, "loss": 0.1391, "learning_rate": 1.7725116165538564e-06, "epoch": 0.6142718938591237, "percentage": 61.43, "elapsed_time": "21:04:46", "remaining_time": "13:14:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6668, "total_steps": 10853, "loss": 0.1262, "learning_rate": 1.7717828340064592e-06, "epoch": 0.6143640300363938, "percentage": 61.44, "elapsed_time": "21:04:57", "remaining_time": "13:13:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6669, "total_steps": 10853, "loss": 0.1242, "learning_rate": 1.7710541190741037e-06, "epoch": 0.6144561662136638, "percentage": 61.45, "elapsed_time": "21:05:08", "remaining_time": "13:13:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6670, "total_steps": 10853, "loss": 0.1339, "learning_rate": 1.7703254718244525e-06, "epoch": 0.6145483023909338, "percentage": 61.46, "elapsed_time": "21:05:18", "remaining_time": "13:13:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6671, "total_steps": 10853, "loss": 0.1309, "learning_rate": 1.7695968923251593e-06, "epoch": 0.6146404385682038, "percentage": 61.47, "elapsed_time": "21:05:29", "remaining_time": "13:13:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6672, "total_steps": 10853, "loss": 0.1339, "learning_rate": 1.7688683806438731e-06, "epoch": 0.6147325747454738, "percentage": 61.48, "elapsed_time": "21:05:37", "remaining_time": "13:13:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6673, "total_steps": 10853, "loss": 0.1306, "learning_rate": 1.7681399368482367e-06, "epoch": 0.6148247109227438, "percentage": 61.49, "elapsed_time": "21:05:48", "remaining_time": "13:12:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6674, "total_steps": 10853, "loss": 0.133, "learning_rate": 1.7674115610058864e-06, "epoch": 0.6149168471000138, "percentage": 61.49, "elapsed_time": "21:05:58", "remaining_time": "13:12:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6675, "total_steps": 10853, "loss": 0.1258, "learning_rate": 1.7666832531844508e-06, "epoch": 0.6150089832772838, "percentage": 61.5, "elapsed_time": "21:06:09", "remaining_time": "13:12:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6676, "total_steps": 10853, "loss": 0.1313, "learning_rate": 1.765955013451554e-06, "epoch": 0.6151011194545538, "percentage": 61.51, "elapsed_time": "21:06:18", "remaining_time": "13:12:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6677, "total_steps": 10853, "loss": 0.1447, "learning_rate": 1.765226841874813e-06, "epoch": 0.6151932556318238, "percentage": 61.52, "elapsed_time": "21:06:30", "remaining_time": "13:12:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6678, "total_steps": 10853, "loss": 0.1345, "learning_rate": 1.7644987385218395e-06, "epoch": 0.6152853918090938, "percentage": 61.53, "elapsed_time": "21:06:41", "remaining_time": "13:11:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6679, "total_steps": 10853, "loss": 0.1464, "learning_rate": 1.7637707034602378e-06, "epoch": 0.6153775279863638, "percentage": 61.54, "elapsed_time": "21:06:52", "remaining_time": "13:11:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6680, "total_steps": 10853, "loss": 0.131, "learning_rate": 1.7630427367576042e-06, "epoch": 0.6154696641636338, "percentage": 61.55, "elapsed_time": "21:07:01", "remaining_time": "13:11:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6681, "total_steps": 10853, "loss": 0.1251, "learning_rate": 1.7623148384815326e-06, "epoch": 0.6155618003409039, "percentage": 61.56, "elapsed_time": "21:07:13", "remaining_time": "13:11:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6682, "total_steps": 10853, "loss": 0.1384, "learning_rate": 1.7615870086996067e-06, "epoch": 0.6156539365181739, "percentage": 61.57, "elapsed_time": "21:07:24", "remaining_time": "13:11:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6683, "total_steps": 10853, "loss": 0.1295, "learning_rate": 1.7608592474794078e-06, "epoch": 0.6157460726954439, "percentage": 61.58, "elapsed_time": "21:07:34", "remaining_time": "13:10:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6684, "total_steps": 10853, "loss": 0.1295, "learning_rate": 1.760131554888507e-06, "epoch": 0.6158382088727139, "percentage": 61.59, "elapsed_time": "21:07:45", "remaining_time": "13:10:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6685, "total_steps": 10853, "loss": 0.1392, "learning_rate": 1.7594039309944702e-06, "epoch": 0.6159303450499839, "percentage": 61.6, "elapsed_time": "21:07:56", "remaining_time": "13:10:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6686, "total_steps": 10853, "loss": 0.1485, "learning_rate": 1.7586763758648587e-06, "epoch": 0.6160224812272539, "percentage": 61.61, "elapsed_time": "21:08:05", "remaining_time": "13:10:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6687, "total_steps": 10853, "loss": 0.1287, "learning_rate": 1.757948889567226e-06, "epoch": 0.6161146174045239, "percentage": 61.61, "elapsed_time": "21:08:16", "remaining_time": "13:10:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6688, "total_steps": 10853, "loss": 0.1213, "learning_rate": 1.7572214721691178e-06, "epoch": 0.6162067535817939, "percentage": 61.62, "elapsed_time": "21:08:26", "remaining_time": "13:09:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6689, "total_steps": 10853, "loss": 0.1293, "learning_rate": 1.7564941237380761e-06, "epoch": 0.6162988897590639, "percentage": 61.63, "elapsed_time": "21:08:37", "remaining_time": "13:09:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6690, "total_steps": 10853, "loss": 0.124, "learning_rate": 1.7557668443416348e-06, "epoch": 0.6163910259363339, "percentage": 61.64, "elapsed_time": "21:08:47", "remaining_time": "13:09:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6691, "total_steps": 10853, "loss": 0.1228, "learning_rate": 1.755039634047323e-06, "epoch": 0.6164831621136039, "percentage": 61.65, "elapsed_time": "21:08:57", "remaining_time": "13:09:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6692, "total_steps": 10853, "loss": 0.1355, "learning_rate": 1.7543124929226608e-06, "epoch": 0.6165752982908739, "percentage": 61.66, "elapsed_time": "21:09:09", "remaining_time": "13:09:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6693, "total_steps": 10853, "loss": 0.1368, "learning_rate": 1.7535854210351635e-06, "epoch": 0.6166674344681439, "percentage": 61.67, "elapsed_time": "21:09:20", "remaining_time": "13:08:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6694, "total_steps": 10853, "loss": 0.1232, "learning_rate": 1.7528584184523407e-06, "epoch": 0.6167595706454139, "percentage": 61.68, "elapsed_time": "21:09:30", "remaining_time": "13:08:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6695, "total_steps": 10853, "loss": 0.1412, "learning_rate": 1.7521314852416946e-06, "epoch": 0.616851706822684, "percentage": 61.69, "elapsed_time": "21:09:42", "remaining_time": "13:08:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6696, "total_steps": 10853, "loss": 0.1163, "learning_rate": 1.7514046214707195e-06, "epoch": 0.616943842999954, "percentage": 61.7, "elapsed_time": "21:09:54", "remaining_time": "13:08:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6697, "total_steps": 10853, "loss": 0.1381, "learning_rate": 1.7506778272069064e-06, "epoch": 0.617035979177224, "percentage": 61.71, "elapsed_time": "21:10:06", "remaining_time": "13:08:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6698, "total_steps": 10853, "loss": 0.1264, "learning_rate": 1.7499511025177373e-06, "epoch": 0.617128115354494, "percentage": 61.72, "elapsed_time": "21:10:17", "remaining_time": "13:08:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6699, "total_steps": 10853, "loss": 0.1423, "learning_rate": 1.7492244474706898e-06, "epoch": 0.617220251531764, "percentage": 61.72, "elapsed_time": "21:10:28", "remaining_time": "13:07:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6700, "total_steps": 10853, "loss": 0.1265, "learning_rate": 1.748497862133233e-06, "epoch": 0.617312387709034, "percentage": 61.73, "elapsed_time": "21:10:38", "remaining_time": "13:07:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6701, "total_steps": 10853, "loss": 0.1246, "learning_rate": 1.7477713465728296e-06, "epoch": 0.617404523886304, "percentage": 61.74, "elapsed_time": "21:10:49", "remaining_time": "13:07:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6702, "total_steps": 10853, "loss": 0.1244, "learning_rate": 1.747044900856938e-06, "epoch": 0.617496660063574, "percentage": 61.75, "elapsed_time": "21:10:59", "remaining_time": "13:07:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6703, "total_steps": 10853, "loss": 0.1309, "learning_rate": 1.7463185250530102e-06, "epoch": 0.617588796240844, "percentage": 61.76, "elapsed_time": "21:11:09", "remaining_time": "13:07:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6704, "total_steps": 10853, "loss": 0.1313, "learning_rate": 1.7455922192284864e-06, "epoch": 0.617680932418114, "percentage": 61.77, "elapsed_time": "21:11:19", "remaining_time": "13:06:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6705, "total_steps": 10853, "loss": 0.1298, "learning_rate": 1.7448659834508064e-06, "epoch": 0.617773068595384, "percentage": 61.78, "elapsed_time": "21:11:30", "remaining_time": "13:06:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6706, "total_steps": 10853, "loss": 0.1308, "learning_rate": 1.7441398177874015e-06, "epoch": 0.6178652047726539, "percentage": 61.79, "elapsed_time": "21:11:42", "remaining_time": "13:06:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6707, "total_steps": 10853, "loss": 0.1253, "learning_rate": 1.7434137223056954e-06, "epoch": 0.6179573409499239, "percentage": 61.8, "elapsed_time": "21:11:52", "remaining_time": "13:06:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6708, "total_steps": 10853, "loss": 0.1267, "learning_rate": 1.7426876970731076e-06, "epoch": 0.618049477127194, "percentage": 61.81, "elapsed_time": "21:12:04", "remaining_time": "13:06:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6709, "total_steps": 10853, "loss": 0.1298, "learning_rate": 1.7419617421570483e-06, "epoch": 0.618141613304464, "percentage": 61.82, "elapsed_time": "21:12:15", "remaining_time": "13:05:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6710, "total_steps": 10853, "loss": 0.1242, "learning_rate": 1.7412358576249222e-06, "epoch": 0.618233749481734, "percentage": 61.83, "elapsed_time": "21:12:27", "remaining_time": "13:05:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6711, "total_steps": 10853, "loss": 0.1433, "learning_rate": 1.740510043544129e-06, "epoch": 0.618325885659004, "percentage": 61.84, "elapsed_time": "21:12:39", "remaining_time": "13:05:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6712, "total_steps": 10853, "loss": 0.1228, "learning_rate": 1.7397842999820605e-06, "epoch": 0.618418021836274, "percentage": 61.84, "elapsed_time": "21:12:49", "remaining_time": "13:05:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6713, "total_steps": 10853, "loss": 0.1304, "learning_rate": 1.7390586270061005e-06, "epoch": 0.618510158013544, "percentage": 61.85, "elapsed_time": "21:13:00", "remaining_time": "13:05:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6714, "total_steps": 10853, "loss": 0.1266, "learning_rate": 1.7383330246836294e-06, "epoch": 0.618602294190814, "percentage": 61.86, "elapsed_time": "21:13:11", "remaining_time": "13:04:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6715, "total_steps": 10853, "loss": 0.1252, "learning_rate": 1.737607493082018e-06, "epoch": 0.618694430368084, "percentage": 61.87, "elapsed_time": "21:13:21", "remaining_time": "13:04:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6716, "total_steps": 10853, "loss": 0.1294, "learning_rate": 1.7368820322686345e-06, "epoch": 0.618786566545354, "percentage": 61.88, "elapsed_time": "21:13:33", "remaining_time": "13:04:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6717, "total_steps": 10853, "loss": 0.1312, "learning_rate": 1.7361566423108355e-06, "epoch": 0.618878702722624, "percentage": 61.89, "elapsed_time": "21:13:44", "remaining_time": "13:04:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6718, "total_steps": 10853, "loss": 0.1179, "learning_rate": 1.7354313232759745e-06, "epoch": 0.618970838899894, "percentage": 61.9, "elapsed_time": "21:13:54", "remaining_time": "13:04:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6719, "total_steps": 10853, "loss": 0.1235, "learning_rate": 1.7347060752313978e-06, "epoch": 0.619062975077164, "percentage": 61.91, "elapsed_time": "21:14:04", "remaining_time": "13:03:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6720, "total_steps": 10853, "loss": 0.1394, "learning_rate": 1.7339808982444444e-06, "epoch": 0.619155111254434, "percentage": 61.92, "elapsed_time": "21:14:15", "remaining_time": "13:03:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6721, "total_steps": 10853, "loss": 0.1355, "learning_rate": 1.7332557923824463e-06, "epoch": 0.619247247431704, "percentage": 61.93, "elapsed_time": "21:14:26", "remaining_time": "13:03:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6722, "total_steps": 10853, "loss": 0.121, "learning_rate": 1.732530757712731e-06, "epoch": 0.6193393836089741, "percentage": 61.94, "elapsed_time": "21:14:37", "remaining_time": "13:03:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6723, "total_steps": 10853, "loss": 0.1194, "learning_rate": 1.7318057943026169e-06, "epoch": 0.6194315197862441, "percentage": 61.95, "elapsed_time": "21:14:48", "remaining_time": "13:03:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6724, "total_steps": 10853, "loss": 0.1279, "learning_rate": 1.7310809022194184e-06, "epoch": 0.6195236559635141, "percentage": 61.96, "elapsed_time": "21:14:58", "remaining_time": "13:02:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6725, "total_steps": 10853, "loss": 0.1274, "learning_rate": 1.7303560815304404e-06, "epoch": 0.6196157921407841, "percentage": 61.96, "elapsed_time": "21:15:10", "remaining_time": "13:02:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6726, "total_steps": 10853, "loss": 0.129, "learning_rate": 1.7296313323029825e-06, "epoch": 0.6197079283180541, "percentage": 61.97, "elapsed_time": "21:15:21", "remaining_time": "13:02:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6727, "total_steps": 10853, "loss": 0.1189, "learning_rate": 1.7289066546043386e-06, "epoch": 0.6198000644953241, "percentage": 61.98, "elapsed_time": "21:15:32", "remaining_time": "13:02:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6728, "total_steps": 10853, "loss": 0.1359, "learning_rate": 1.7281820485017958e-06, "epoch": 0.6198922006725941, "percentage": 61.99, "elapsed_time": "21:15:44", "remaining_time": "13:02:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6729, "total_steps": 10853, "loss": 0.1287, "learning_rate": 1.7274575140626318e-06, "epoch": 0.6199843368498641, "percentage": 62.0, "elapsed_time": "21:15:54", "remaining_time": "13:01:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6730, "total_steps": 10853, "loss": 0.1325, "learning_rate": 1.726733051354121e-06, "epoch": 0.6200764730271341, "percentage": 62.01, "elapsed_time": "21:16:05", "remaining_time": "13:01:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6731, "total_steps": 10853, "loss": 0.1222, "learning_rate": 1.7260086604435295e-06, "epoch": 0.6201686092044041, "percentage": 62.02, "elapsed_time": "21:16:15", "remaining_time": "13:01:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6732, "total_steps": 10853, "loss": 0.1291, "learning_rate": 1.7252843413981176e-06, "epoch": 0.6202607453816741, "percentage": 62.03, "elapsed_time": "21:16:25", "remaining_time": "13:01:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6733, "total_steps": 10853, "loss": 0.1168, "learning_rate": 1.7245600942851378e-06, "epoch": 0.6203528815589441, "percentage": 62.04, "elapsed_time": "21:16:36", "remaining_time": "13:01:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6734, "total_steps": 10853, "loss": 0.1158, "learning_rate": 1.7238359191718362e-06, "epoch": 0.6204450177362141, "percentage": 62.05, "elapsed_time": "21:16:46", "remaining_time": "13:00:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6735, "total_steps": 10853, "loss": 0.1201, "learning_rate": 1.7231118161254534e-06, "epoch": 0.6205371539134841, "percentage": 62.06, "elapsed_time": "21:16:56", "remaining_time": "13:00:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6736, "total_steps": 10853, "loss": 0.1349, "learning_rate": 1.7223877852132218e-06, "epoch": 0.6206292900907542, "percentage": 62.07, "elapsed_time": "21:17:07", "remaining_time": "13:00:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6737, "total_steps": 10853, "loss": 0.1218, "learning_rate": 1.721663826502369e-06, "epoch": 0.6207214262680242, "percentage": 62.08, "elapsed_time": "21:17:19", "remaining_time": "13:00:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6738, "total_steps": 10853, "loss": 0.1346, "learning_rate": 1.7209399400601128e-06, "epoch": 0.6208135624452942, "percentage": 62.08, "elapsed_time": "21:17:30", "remaining_time": "13:00:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6739, "total_steps": 10853, "loss": 0.1334, "learning_rate": 1.720216125953667e-06, "epoch": 0.6209056986225642, "percentage": 62.09, "elapsed_time": "21:17:40", "remaining_time": "12:59:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6740, "total_steps": 10853, "loss": 0.1324, "learning_rate": 1.7194923842502382e-06, "epoch": 0.6209978347998342, "percentage": 62.1, "elapsed_time": "21:17:51", "remaining_time": "12:59:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6741, "total_steps": 10853, "loss": 0.1345, "learning_rate": 1.7187687150170257e-06, "epoch": 0.6210899709771042, "percentage": 62.11, "elapsed_time": "21:18:01", "remaining_time": "12:59:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6742, "total_steps": 10853, "loss": 0.1211, "learning_rate": 1.7180451183212217e-06, "epoch": 0.6211821071543742, "percentage": 62.12, "elapsed_time": "21:18:12", "remaining_time": "12:59:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6743, "total_steps": 10853, "loss": 0.1428, "learning_rate": 1.7173215942300125e-06, "epoch": 0.6212742433316442, "percentage": 62.13, "elapsed_time": "21:18:23", "remaining_time": "12:59:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6744, "total_steps": 10853, "loss": 0.14, "learning_rate": 1.7165981428105771e-06, "epoch": 0.6213663795089142, "percentage": 62.14, "elapsed_time": "21:18:34", "remaining_time": "12:59:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6745, "total_steps": 10853, "loss": 0.1354, "learning_rate": 1.71587476413009e-06, "epoch": 0.6214585156861842, "percentage": 62.15, "elapsed_time": "21:18:46", "remaining_time": "12:58:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6746, "total_steps": 10853, "loss": 0.1295, "learning_rate": 1.7151514582557144e-06, "epoch": 0.6215506518634542, "percentage": 62.16, "elapsed_time": "21:18:58", "remaining_time": "12:58:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6747, "total_steps": 10853, "loss": 0.1472, "learning_rate": 1.71442822525461e-06, "epoch": 0.6216427880407241, "percentage": 62.17, "elapsed_time": "21:19:09", "remaining_time": "12:58:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6748, "total_steps": 10853, "loss": 0.1251, "learning_rate": 1.71370506519393e-06, "epoch": 0.6217349242179941, "percentage": 62.18, "elapsed_time": "21:19:18", "remaining_time": "12:58:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6749, "total_steps": 10853, "loss": 0.1278, "learning_rate": 1.7129819781408197e-06, "epoch": 0.6218270603952643, "percentage": 62.19, "elapsed_time": "21:19:30", "remaining_time": "12:58:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6750, "total_steps": 10853, "loss": 0.1181, "learning_rate": 1.7122589641624166e-06, "epoch": 0.6219191965725342, "percentage": 62.19, "elapsed_time": "21:19:41", "remaining_time": "12:57:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6751, "total_steps": 10853, "loss": 0.1202, "learning_rate": 1.7115360233258537e-06, "epoch": 0.6220113327498042, "percentage": 62.2, "elapsed_time": "21:19:52", "remaining_time": "12:57:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6752, "total_steps": 10853, "loss": 0.1372, "learning_rate": 1.7108131556982554e-06, "epoch": 0.6221034689270742, "percentage": 62.21, "elapsed_time": "21:20:02", "remaining_time": "12:57:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6753, "total_steps": 10853, "loss": 0.1214, "learning_rate": 1.7100903613467419e-06, "epoch": 0.6221956051043442, "percentage": 62.22, "elapsed_time": "21:20:12", "remaining_time": "12:57:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6754, "total_steps": 10853, "loss": 0.1301, "learning_rate": 1.7093676403384223e-06, "epoch": 0.6222877412816142, "percentage": 62.23, "elapsed_time": "21:20:23", "remaining_time": "12:57:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6755, "total_steps": 10853, "loss": 0.1243, "learning_rate": 1.7086449927404025e-06, "epoch": 0.6223798774588842, "percentage": 62.24, "elapsed_time": "21:20:34", "remaining_time": "12:56:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6756, "total_steps": 10853, "loss": 0.1294, "learning_rate": 1.7079224186197804e-06, "epoch": 0.6224720136361542, "percentage": 62.25, "elapsed_time": "21:20:46", "remaining_time": "12:56:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6757, "total_steps": 10853, "loss": 0.133, "learning_rate": 1.7071999180436477e-06, "epoch": 0.6225641498134242, "percentage": 62.26, "elapsed_time": "21:20:58", "remaining_time": "12:56:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6758, "total_steps": 10853, "loss": 0.1234, "learning_rate": 1.7064774910790865e-06, "epoch": 0.6226562859906942, "percentage": 62.27, "elapsed_time": "21:21:08", "remaining_time": "12:56:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6759, "total_steps": 10853, "loss": 0.1307, "learning_rate": 1.7057551377931767e-06, "epoch": 0.6227484221679642, "percentage": 62.28, "elapsed_time": "21:21:20", "remaining_time": "12:56:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6760, "total_steps": 10853, "loss": 0.1422, "learning_rate": 1.705032858252987e-06, "epoch": 0.6228405583452342, "percentage": 62.29, "elapsed_time": "21:21:31", "remaining_time": "12:55:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6761, "total_steps": 10853, "loss": 0.1395, "learning_rate": 1.7043106525255831e-06, "epoch": 0.6229326945225042, "percentage": 62.3, "elapsed_time": "21:21:42", "remaining_time": "12:55:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6762, "total_steps": 10853, "loss": 0.1226, "learning_rate": 1.70358852067802e-06, "epoch": 0.6230248306997742, "percentage": 62.31, "elapsed_time": "21:21:53", "remaining_time": "12:55:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6763, "total_steps": 10853, "loss": 0.138, "learning_rate": 1.7028664627773483e-06, "epoch": 0.6231169668770443, "percentage": 62.31, "elapsed_time": "21:22:04", "remaining_time": "12:55:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6764, "total_steps": 10853, "loss": 0.1271, "learning_rate": 1.7021444788906117e-06, "epoch": 0.6232091030543143, "percentage": 62.32, "elapsed_time": "21:22:14", "remaining_time": "12:55:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6765, "total_steps": 10853, "loss": 0.1285, "learning_rate": 1.7014225690848458e-06, "epoch": 0.6233012392315843, "percentage": 62.33, "elapsed_time": "21:22:26", "remaining_time": "12:54:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6766, "total_steps": 10853, "loss": 0.1205, "learning_rate": 1.7007007334270809e-06, "epoch": 0.6233933754088543, "percentage": 62.34, "elapsed_time": "21:22:37", "remaining_time": "12:54:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6767, "total_steps": 10853, "loss": 0.1272, "learning_rate": 1.6999789719843388e-06, "epoch": 0.6234855115861243, "percentage": 62.35, "elapsed_time": "21:22:49", "remaining_time": "12:54:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6768, "total_steps": 10853, "loss": 0.1181, "learning_rate": 1.6992572848236343e-06, "epoch": 0.6235776477633943, "percentage": 62.36, "elapsed_time": "21:23:01", "remaining_time": "12:54:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6769, "total_steps": 10853, "loss": 0.1341, "learning_rate": 1.698535672011978e-06, "epoch": 0.6236697839406643, "percentage": 62.37, "elapsed_time": "21:23:11", "remaining_time": "12:54:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6770, "total_steps": 10853, "loss": 0.1263, "learning_rate": 1.6978141336163713e-06, "epoch": 0.6237619201179343, "percentage": 62.38, "elapsed_time": "21:23:20", "remaining_time": "12:53:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6771, "total_steps": 10853, "loss": 0.1247, "learning_rate": 1.6970926697038073e-06, "epoch": 0.6238540562952043, "percentage": 62.39, "elapsed_time": "21:23:30", "remaining_time": "12:53:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6772, "total_steps": 10853, "loss": 0.126, "learning_rate": 1.6963712803412761e-06, "epoch": 0.6239461924724743, "percentage": 62.4, "elapsed_time": "21:23:41", "remaining_time": "12:53:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6773, "total_steps": 10853, "loss": 0.1434, "learning_rate": 1.6956499655957577e-06, "epoch": 0.6240383286497443, "percentage": 62.41, "elapsed_time": "21:23:53", "remaining_time": "12:53:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6774, "total_steps": 10853, "loss": 0.1342, "learning_rate": 1.694928725534227e-06, "epoch": 0.6241304648270143, "percentage": 62.42, "elapsed_time": "21:24:03", "remaining_time": "12:53:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6775, "total_steps": 10853, "loss": 0.125, "learning_rate": 1.6942075602236507e-06, "epoch": 0.6242226010042843, "percentage": 62.43, "elapsed_time": "21:24:13", "remaining_time": "12:53:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6776, "total_steps": 10853, "loss": 0.1469, "learning_rate": 1.6934864697309883e-06, "epoch": 0.6243147371815544, "percentage": 62.43, "elapsed_time": "21:24:25", "remaining_time": "12:52:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6777, "total_steps": 10853, "loss": 0.1304, "learning_rate": 1.6927654541231941e-06, "epoch": 0.6244068733588244, "percentage": 62.44, "elapsed_time": "21:24:35", "remaining_time": "12:52:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6778, "total_steps": 10853, "loss": 0.126, "learning_rate": 1.6920445134672162e-06, "epoch": 0.6244990095360944, "percentage": 62.45, "elapsed_time": "21:24:46", "remaining_time": "12:52:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6779, "total_steps": 10853, "loss": 0.1314, "learning_rate": 1.6913236478299906e-06, "epoch": 0.6245911457133644, "percentage": 62.46, "elapsed_time": "21:24:56", "remaining_time": "12:52:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6780, "total_steps": 10853, "loss": 0.1298, "learning_rate": 1.6906028572784511e-06, "epoch": 0.6246832818906344, "percentage": 62.47, "elapsed_time": "21:25:06", "remaining_time": "12:52:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6781, "total_steps": 10853, "loss": 0.1349, "learning_rate": 1.6898821418795237e-06, "epoch": 0.6247754180679044, "percentage": 62.48, "elapsed_time": "21:25:16", "remaining_time": "12:51:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6782, "total_steps": 10853, "loss": 0.1137, "learning_rate": 1.6891615017001272e-06, "epoch": 0.6248675542451744, "percentage": 62.49, "elapsed_time": "21:25:26", "remaining_time": "12:51:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6783, "total_steps": 10853, "loss": 0.1231, "learning_rate": 1.6884409368071718e-06, "epoch": 0.6249596904224444, "percentage": 62.5, "elapsed_time": "21:25:37", "remaining_time": "12:51:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6784, "total_steps": 10853, "loss": 0.1291, "learning_rate": 1.6877204472675634e-06, "epoch": 0.6250518265997144, "percentage": 62.51, "elapsed_time": "21:25:49", "remaining_time": "12:51:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6785, "total_steps": 10853, "loss": 0.1289, "learning_rate": 1.687000033148198e-06, "epoch": 0.6251439627769844, "percentage": 62.52, "elapsed_time": "21:26:00", "remaining_time": "12:51:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6786, "total_steps": 10853, "loss": 0.1313, "learning_rate": 1.686279694515968e-06, "epoch": 0.6252360989542544, "percentage": 62.53, "elapsed_time": "21:26:10", "remaining_time": "12:50:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6787, "total_steps": 10853, "loss": 0.1176, "learning_rate": 1.685559431437756e-06, "epoch": 0.6253282351315244, "percentage": 62.54, "elapsed_time": "21:26:22", "remaining_time": "12:50:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6788, "total_steps": 10853, "loss": 0.1247, "learning_rate": 1.6848392439804374e-06, "epoch": 0.6254203713087944, "percentage": 62.54, "elapsed_time": "21:26:31", "remaining_time": "12:50:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6789, "total_steps": 10853, "loss": 0.1316, "learning_rate": 1.6841191322108835e-06, "epoch": 0.6255125074860644, "percentage": 62.55, "elapsed_time": "21:26:41", "remaining_time": "12:50:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6790, "total_steps": 10853, "loss": 0.1105, "learning_rate": 1.6833990961959562e-06, "epoch": 0.6256046436633345, "percentage": 62.56, "elapsed_time": "21:26:51", "remaining_time": "12:50:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6791, "total_steps": 10853, "loss": 0.118, "learning_rate": 1.6826791360025103e-06, "epoch": 0.6256967798406045, "percentage": 62.57, "elapsed_time": "21:27:01", "remaining_time": "12:49:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6792, "total_steps": 10853, "loss": 0.1294, "learning_rate": 1.6819592516973942e-06, "epoch": 0.6257889160178745, "percentage": 62.58, "elapsed_time": "21:27:11", "remaining_time": "12:49:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6793, "total_steps": 10853, "loss": 0.1303, "learning_rate": 1.6812394433474497e-06, "epoch": 0.6258810521951444, "percentage": 62.59, "elapsed_time": "21:27:23", "remaining_time": "12:49:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6794, "total_steps": 10853, "loss": 0.1366, "learning_rate": 1.6805197110195115e-06, "epoch": 0.6259731883724144, "percentage": 62.6, "elapsed_time": "21:27:34", "remaining_time": "12:49:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6795, "total_steps": 10853, "loss": 0.1138, "learning_rate": 1.6798000547804066e-06, "epoch": 0.6260653245496844, "percentage": 62.61, "elapsed_time": "21:27:45", "remaining_time": "12:49:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6796, "total_steps": 10853, "loss": 0.1318, "learning_rate": 1.6790804746969542e-06, "epoch": 0.6261574607269544, "percentage": 62.62, "elapsed_time": "21:27:56", "remaining_time": "12:48:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6797, "total_steps": 10853, "loss": 0.1272, "learning_rate": 1.6783609708359683e-06, "epoch": 0.6262495969042244, "percentage": 62.63, "elapsed_time": "21:28:07", "remaining_time": "12:48:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6798, "total_steps": 10853, "loss": 0.1356, "learning_rate": 1.677641543264254e-06, "epoch": 0.6263417330814944, "percentage": 62.64, "elapsed_time": "21:28:19", "remaining_time": "12:48:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6799, "total_steps": 10853, "loss": 0.1333, "learning_rate": 1.6769221920486123e-06, "epoch": 0.6264338692587644, "percentage": 62.65, "elapsed_time": "21:28:30", "remaining_time": "12:48:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6800, "total_steps": 10853, "loss": 0.1236, "learning_rate": 1.676202917255833e-06, "epoch": 0.6265260054360344, "percentage": 62.66, "elapsed_time": "21:28:41", "remaining_time": "12:48:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6801, "total_steps": 10853, "loss": 0.1505, "learning_rate": 1.675483718952701e-06, "epoch": 0.6266181416133044, "percentage": 62.66, "elapsed_time": "21:28:53", "remaining_time": "12:47:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6802, "total_steps": 10853, "loss": 0.1156, "learning_rate": 1.6747645972059949e-06, "epoch": 0.6267102777905744, "percentage": 62.67, "elapsed_time": "21:29:03", "remaining_time": "12:47:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6803, "total_steps": 10853, "loss": 0.1311, "learning_rate": 1.6740455520824852e-06, "epoch": 0.6268024139678445, "percentage": 62.68, "elapsed_time": "21:29:14", "remaining_time": "12:47:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6804, "total_steps": 10853, "loss": 0.1223, "learning_rate": 1.673326583648934e-06, "epoch": 0.6268945501451145, "percentage": 62.69, "elapsed_time": "21:29:25", "remaining_time": "12:47:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6805, "total_steps": 10853, "loss": 0.1327, "learning_rate": 1.672607691972099e-06, "epoch": 0.6269866863223845, "percentage": 62.7, "elapsed_time": "21:29:37", "remaining_time": "12:47:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6806, "total_steps": 10853, "loss": 0.1394, "learning_rate": 1.671888877118728e-06, "epoch": 0.6270788224996545, "percentage": 62.71, "elapsed_time": "21:29:49", "remaining_time": "12:46:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6807, "total_steps": 10853, "loss": 0.1458, "learning_rate": 1.6711701391555654e-06, "epoch": 0.6271709586769245, "percentage": 62.72, "elapsed_time": "21:30:00", "remaining_time": "12:46:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6808, "total_steps": 10853, "loss": 0.1318, "learning_rate": 1.6704514781493439e-06, "epoch": 0.6272630948541945, "percentage": 62.73, "elapsed_time": "21:30:11", "remaining_time": "12:46:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6809, "total_steps": 10853, "loss": 0.1309, "learning_rate": 1.6697328941667911e-06, "epoch": 0.6273552310314645, "percentage": 62.74, "elapsed_time": "21:30:22", "remaining_time": "12:46:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6810, "total_steps": 10853, "loss": 0.1359, "learning_rate": 1.6690143872746295e-06, "epoch": 0.6274473672087345, "percentage": 62.75, "elapsed_time": "21:30:33", "remaining_time": "12:46:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6811, "total_steps": 10853, "loss": 0.13, "learning_rate": 1.6682959575395717e-06, "epoch": 0.6275395033860045, "percentage": 62.76, "elapsed_time": "21:30:44", "remaining_time": "12:45:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6812, "total_steps": 10853, "loss": 0.1117, "learning_rate": 1.6675776050283228e-06, "epoch": 0.6276316395632745, "percentage": 62.77, "elapsed_time": "21:30:55", "remaining_time": "12:45:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6813, "total_steps": 10853, "loss": 0.1362, "learning_rate": 1.666859329807583e-06, "epoch": 0.6277237757405445, "percentage": 62.78, "elapsed_time": "21:31:05", "remaining_time": "12:45:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6814, "total_steps": 10853, "loss": 0.1323, "learning_rate": 1.666141131944044e-06, "epoch": 0.6278159119178145, "percentage": 62.78, "elapsed_time": "21:31:16", "remaining_time": "12:45:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6815, "total_steps": 10853, "loss": 0.1275, "learning_rate": 1.6654230115043915e-06, "epoch": 0.6279080480950845, "percentage": 62.79, "elapsed_time": "21:31:27", "remaining_time": "12:45:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6816, "total_steps": 10853, "loss": 0.1295, "learning_rate": 1.6647049685553018e-06, "epoch": 0.6280001842723545, "percentage": 62.8, "elapsed_time": "21:31:38", "remaining_time": "12:45:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6817, "total_steps": 10853, "loss": 0.1289, "learning_rate": 1.663987003163445e-06, "epoch": 0.6280923204496246, "percentage": 62.81, "elapsed_time": "21:31:49", "remaining_time": "12:44:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6818, "total_steps": 10853, "loss": 0.1281, "learning_rate": 1.6632691153954855e-06, "epoch": 0.6281844566268946, "percentage": 62.82, "elapsed_time": "21:32:00", "remaining_time": "12:44:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6819, "total_steps": 10853, "loss": 0.1255, "learning_rate": 1.6625513053180791e-06, "epoch": 0.6282765928041646, "percentage": 62.83, "elapsed_time": "21:32:10", "remaining_time": "12:44:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6820, "total_steps": 10853, "loss": 0.1263, "learning_rate": 1.6618335729978736e-06, "epoch": 0.6283687289814346, "percentage": 62.84, "elapsed_time": "21:32:21", "remaining_time": "12:44:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6821, "total_steps": 10853, "loss": 0.1254, "learning_rate": 1.661115918501511e-06, "epoch": 0.6284608651587046, "percentage": 62.85, "elapsed_time": "21:32:33", "remaining_time": "12:44:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6822, "total_steps": 10853, "loss": 0.1328, "learning_rate": 1.6603983418956254e-06, "epoch": 0.6285530013359746, "percentage": 62.86, "elapsed_time": "21:32:43", "remaining_time": "12:43:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6823, "total_steps": 10853, "loss": 0.1394, "learning_rate": 1.6596808432468445e-06, "epoch": 0.6286451375132446, "percentage": 62.87, "elapsed_time": "21:32:54", "remaining_time": "12:43:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6824, "total_steps": 10853, "loss": 0.1328, "learning_rate": 1.6589634226217883e-06, "epoch": 0.6287372736905146, "percentage": 62.88, "elapsed_time": "21:33:07", "remaining_time": "12:43:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6825, "total_steps": 10853, "loss": 0.1284, "learning_rate": 1.6582460800870675e-06, "epoch": 0.6288294098677846, "percentage": 62.89, "elapsed_time": "21:33:18", "remaining_time": "12:43:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6826, "total_steps": 10853, "loss": 0.1236, "learning_rate": 1.6575288157092898e-06, "epoch": 0.6289215460450546, "percentage": 62.9, "elapsed_time": "21:33:27", "remaining_time": "12:43:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6827, "total_steps": 10853, "loss": 0.1313, "learning_rate": 1.6568116295550515e-06, "epoch": 0.6290136822223246, "percentage": 62.9, "elapsed_time": "21:33:38", "remaining_time": "12:42:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6828, "total_steps": 10853, "loss": 0.1144, "learning_rate": 1.6560945216909451e-06, "epoch": 0.6291058183995946, "percentage": 62.91, "elapsed_time": "21:33:48", "remaining_time": "12:42:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6829, "total_steps": 10853, "loss": 0.1107, "learning_rate": 1.6553774921835528e-06, "epoch": 0.6291979545768646, "percentage": 62.92, "elapsed_time": "21:33:59", "remaining_time": "12:42:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6830, "total_steps": 10853, "loss": 0.1255, "learning_rate": 1.6546605410994507e-06, "epoch": 0.6292900907541346, "percentage": 62.93, "elapsed_time": "21:34:10", "remaining_time": "12:42:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6831, "total_steps": 10853, "loss": 0.1263, "learning_rate": 1.6539436685052087e-06, "epoch": 0.6293822269314047, "percentage": 62.94, "elapsed_time": "21:34:21", "remaining_time": "12:42:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6832, "total_steps": 10853, "loss": 0.1154, "learning_rate": 1.6532268744673887e-06, "epoch": 0.6294743631086747, "percentage": 62.95, "elapsed_time": "21:34:30", "remaining_time": "12:41:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6833, "total_steps": 10853, "loss": 0.1241, "learning_rate": 1.6525101590525435e-06, "epoch": 0.6295664992859447, "percentage": 62.96, "elapsed_time": "21:34:41", "remaining_time": "12:41:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6834, "total_steps": 10853, "loss": 0.1275, "learning_rate": 1.651793522327222e-06, "epoch": 0.6296586354632147, "percentage": 62.97, "elapsed_time": "21:34:52", "remaining_time": "12:41:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6835, "total_steps": 10853, "loss": 0.133, "learning_rate": 1.6510769643579625e-06, "epoch": 0.6297507716404847, "percentage": 62.98, "elapsed_time": "21:35:03", "remaining_time": "12:41:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6836, "total_steps": 10853, "loss": 0.1174, "learning_rate": 1.6503604852112992e-06, "epoch": 0.6298429078177546, "percentage": 62.99, "elapsed_time": "21:35:14", "remaining_time": "12:41:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6837, "total_steps": 10853, "loss": 0.1335, "learning_rate": 1.649644084953756e-06, "epoch": 0.6299350439950246, "percentage": 63.0, "elapsed_time": "21:35:24", "remaining_time": "12:40:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6838, "total_steps": 10853, "loss": 0.1364, "learning_rate": 1.6489277636518503e-06, "epoch": 0.6300271801722946, "percentage": 63.01, "elapsed_time": "21:35:35", "remaining_time": "12:40:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6839, "total_steps": 10853, "loss": 0.128, "learning_rate": 1.6482115213720939e-06, "epoch": 0.6301193163495646, "percentage": 63.01, "elapsed_time": "21:35:45", "remaining_time": "12:40:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6840, "total_steps": 10853, "loss": 0.1234, "learning_rate": 1.64749535818099e-06, "epoch": 0.6302114525268346, "percentage": 63.02, "elapsed_time": "21:35:57", "remaining_time": "12:40:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6841, "total_steps": 10853, "loss": 0.1262, "learning_rate": 1.6467792741450328e-06, "epoch": 0.6303035887041046, "percentage": 63.03, "elapsed_time": "21:36:07", "remaining_time": "12:40:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6842, "total_steps": 10853, "loss": 0.1332, "learning_rate": 1.6460632693307122e-06, "epoch": 0.6303957248813746, "percentage": 63.04, "elapsed_time": "21:36:18", "remaining_time": "12:39:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6843, "total_steps": 10853, "loss": 0.1282, "learning_rate": 1.6453473438045088e-06, "epoch": 0.6304878610586446, "percentage": 63.05, "elapsed_time": "21:36:29", "remaining_time": "12:39:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6844, "total_steps": 10853, "loss": 0.1268, "learning_rate": 1.644631497632897e-06, "epoch": 0.6305799972359147, "percentage": 63.06, "elapsed_time": "21:36:41", "remaining_time": "12:39:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6845, "total_steps": 10853, "loss": 0.1281, "learning_rate": 1.6439157308823425e-06, "epoch": 0.6306721334131847, "percentage": 63.07, "elapsed_time": "21:36:53", "remaining_time": "12:39:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6846, "total_steps": 10853, "loss": 0.14, "learning_rate": 1.6432000436193042e-06, "epoch": 0.6307642695904547, "percentage": 63.08, "elapsed_time": "21:37:04", "remaining_time": "12:39:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6847, "total_steps": 10853, "loss": 0.1275, "learning_rate": 1.642484435910234e-06, "epoch": 0.6308564057677247, "percentage": 63.09, "elapsed_time": "21:37:15", "remaining_time": "12:38:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6848, "total_steps": 10853, "loss": 0.1317, "learning_rate": 1.6417689078215771e-06, "epoch": 0.6309485419449947, "percentage": 63.1, "elapsed_time": "21:37:26", "remaining_time": "12:38:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6849, "total_steps": 10853, "loss": 0.1243, "learning_rate": 1.6410534594197687e-06, "epoch": 0.6310406781222647, "percentage": 63.11, "elapsed_time": "21:37:36", "remaining_time": "12:38:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6850, "total_steps": 10853, "loss": 0.126, "learning_rate": 1.640338090771239e-06, "epoch": 0.6311328142995347, "percentage": 63.12, "elapsed_time": "21:37:46", "remaining_time": "12:38:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6851, "total_steps": 10853, "loss": 0.1193, "learning_rate": 1.6396228019424099e-06, "epoch": 0.6312249504768047, "percentage": 63.13, "elapsed_time": "21:37:58", "remaining_time": "12:38:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6852, "total_steps": 10853, "loss": 0.1425, "learning_rate": 1.6389075929996961e-06, "epoch": 0.6313170866540747, "percentage": 63.13, "elapsed_time": "21:38:09", "remaining_time": "12:38:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6853, "total_steps": 10853, "loss": 0.1232, "learning_rate": 1.6381924640095065e-06, "epoch": 0.6314092228313447, "percentage": 63.14, "elapsed_time": "21:38:20", "remaining_time": "12:37:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6854, "total_steps": 10853, "loss": 0.1191, "learning_rate": 1.6374774150382377e-06, "epoch": 0.6315013590086147, "percentage": 63.15, "elapsed_time": "21:38:31", "remaining_time": "12:37:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6855, "total_steps": 10853, "loss": 0.1303, "learning_rate": 1.6367624461522841e-06, "epoch": 0.6315934951858847, "percentage": 63.16, "elapsed_time": "21:38:42", "remaining_time": "12:37:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6856, "total_steps": 10853, "loss": 0.136, "learning_rate": 1.6360475574180306e-06, "epoch": 0.6316856313631547, "percentage": 63.17, "elapsed_time": "21:38:53", "remaining_time": "12:37:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6857, "total_steps": 10853, "loss": 0.1294, "learning_rate": 1.635332748901855e-06, "epoch": 0.6317777675404247, "percentage": 63.18, "elapsed_time": "21:39:03", "remaining_time": "12:37:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6858, "total_steps": 10853, "loss": 0.1237, "learning_rate": 1.6346180206701256e-06, "epoch": 0.6318699037176948, "percentage": 63.19, "elapsed_time": "21:39:15", "remaining_time": "12:36:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6859, "total_steps": 10853, "loss": 0.1271, "learning_rate": 1.6339033727892067e-06, "epoch": 0.6319620398949648, "percentage": 63.2, "elapsed_time": "21:39:25", "remaining_time": "12:36:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6860, "total_steps": 10853, "loss": 0.1287, "learning_rate": 1.6331888053254521e-06, "epoch": 0.6320541760722348, "percentage": 63.21, "elapsed_time": "21:39:36", "remaining_time": "12:36:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6861, "total_steps": 10853, "loss": 0.1316, "learning_rate": 1.6324743183452113e-06, "epoch": 0.6321463122495048, "percentage": 63.22, "elapsed_time": "21:39:47", "remaining_time": "12:36:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6862, "total_steps": 10853, "loss": 0.1232, "learning_rate": 1.631759911914823e-06, "epoch": 0.6322384484267748, "percentage": 63.23, "elapsed_time": "21:39:57", "remaining_time": "12:36:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6863, "total_steps": 10853, "loss": 0.1279, "learning_rate": 1.63104558610062e-06, "epoch": 0.6323305846040448, "percentage": 63.24, "elapsed_time": "21:40:08", "remaining_time": "12:35:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6864, "total_steps": 10853, "loss": 0.139, "learning_rate": 1.630331340968928e-06, "epoch": 0.6324227207813148, "percentage": 63.25, "elapsed_time": "21:40:19", "remaining_time": "12:35:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6865, "total_steps": 10853, "loss": 0.1392, "learning_rate": 1.6296171765860651e-06, "epoch": 0.6325148569585848, "percentage": 63.25, "elapsed_time": "21:40:31", "remaining_time": "12:35:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6866, "total_steps": 10853, "loss": 0.1261, "learning_rate": 1.6289030930183403e-06, "epoch": 0.6326069931358548, "percentage": 63.26, "elapsed_time": "21:40:41", "remaining_time": "12:35:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6867, "total_steps": 10853, "loss": 0.1349, "learning_rate": 1.6281890903320574e-06, "epoch": 0.6326991293131248, "percentage": 63.27, "elapsed_time": "21:40:51", "remaining_time": "12:35:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6868, "total_steps": 10853, "loss": 0.1232, "learning_rate": 1.627475168593511e-06, "epoch": 0.6327912654903948, "percentage": 63.28, "elapsed_time": "21:41:02", "remaining_time": "12:34:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6869, "total_steps": 10853, "loss": 0.1172, "learning_rate": 1.6267613278689898e-06, "epoch": 0.6328834016676648, "percentage": 63.29, "elapsed_time": "21:41:12", "remaining_time": "12:34:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6870, "total_steps": 10853, "loss": 0.1346, "learning_rate": 1.626047568224773e-06, "epoch": 0.6329755378449348, "percentage": 63.3, "elapsed_time": "21:41:22", "remaining_time": "12:34:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6871, "total_steps": 10853, "loss": 0.1305, "learning_rate": 1.625333889727133e-06, "epoch": 0.6330676740222049, "percentage": 63.31, "elapsed_time": "21:41:32", "remaining_time": "12:34:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6872, "total_steps": 10853, "loss": 0.1128, "learning_rate": 1.624620292442336e-06, "epoch": 0.6331598101994749, "percentage": 63.32, "elapsed_time": "21:41:42", "remaining_time": "12:34:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6873, "total_steps": 10853, "loss": 0.1295, "learning_rate": 1.6239067764366396e-06, "epoch": 0.6332519463767449, "percentage": 63.33, "elapsed_time": "21:41:52", "remaining_time": "12:33:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6874, "total_steps": 10853, "loss": 0.132, "learning_rate": 1.6231933417762918e-06, "epoch": 0.6333440825540149, "percentage": 63.34, "elapsed_time": "21:42:02", "remaining_time": "12:33:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6875, "total_steps": 10853, "loss": 0.131, "learning_rate": 1.6224799885275378e-06, "epoch": 0.6334362187312849, "percentage": 63.35, "elapsed_time": "21:42:14", "remaining_time": "12:33:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6876, "total_steps": 10853, "loss": 0.1214, "learning_rate": 1.6217667167566103e-06, "epoch": 0.6335283549085549, "percentage": 63.36, "elapsed_time": "21:42:26", "remaining_time": "12:33:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6877, "total_steps": 10853, "loss": 0.1195, "learning_rate": 1.6210535265297389e-06, "epoch": 0.6336204910858249, "percentage": 63.36, "elapsed_time": "21:42:37", "remaining_time": "12:33:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6878, "total_steps": 10853, "loss": 0.1269, "learning_rate": 1.6203404179131415e-06, "epoch": 0.6337126272630949, "percentage": 63.37, "elapsed_time": "21:42:48", "remaining_time": "12:32:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6879, "total_steps": 10853, "loss": 0.1291, "learning_rate": 1.6196273909730303e-06, "epoch": 0.6338047634403648, "percentage": 63.38, "elapsed_time": "21:42:59", "remaining_time": "12:32:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6880, "total_steps": 10853, "loss": 0.1282, "learning_rate": 1.6189144457756118e-06, "epoch": 0.6338968996176348, "percentage": 63.39, "elapsed_time": "21:43:10", "remaining_time": "12:32:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6881, "total_steps": 10853, "loss": 0.129, "learning_rate": 1.6182015823870805e-06, "epoch": 0.6339890357949048, "percentage": 63.4, "elapsed_time": "21:43:21", "remaining_time": "12:32:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6882, "total_steps": 10853, "loss": 0.1364, "learning_rate": 1.617488800873629e-06, "epoch": 0.6340811719721748, "percentage": 63.41, "elapsed_time": "21:43:32", "remaining_time": "12:32:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6883, "total_steps": 10853, "loss": 0.1343, "learning_rate": 1.616776101301436e-06, "epoch": 0.6341733081494448, "percentage": 63.42, "elapsed_time": "21:43:43", "remaining_time": "12:31:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6884, "total_steps": 10853, "loss": 0.1162, "learning_rate": 1.6160634837366771e-06, "epoch": 0.6342654443267148, "percentage": 63.43, "elapsed_time": "21:43:54", "remaining_time": "12:31:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6885, "total_steps": 10853, "loss": 0.1304, "learning_rate": 1.615350948245519e-06, "epoch": 0.6343575805039849, "percentage": 63.44, "elapsed_time": "21:44:06", "remaining_time": "12:31:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6886, "total_steps": 10853, "loss": 0.1257, "learning_rate": 1.6146384948941213e-06, "epoch": 0.6344497166812549, "percentage": 63.45, "elapsed_time": "21:44:15", "remaining_time": "12:31:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6887, "total_steps": 10853, "loss": 0.1316, "learning_rate": 1.6139261237486337e-06, "epoch": 0.6345418528585249, "percentage": 63.46, "elapsed_time": "21:44:26", "remaining_time": "12:31:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6888, "total_steps": 10853, "loss": 0.1396, "learning_rate": 1.6132138348752013e-06, "epoch": 0.6346339890357949, "percentage": 63.47, "elapsed_time": "21:44:37", "remaining_time": "12:30:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6889, "total_steps": 10853, "loss": 0.1238, "learning_rate": 1.6125016283399592e-06, "epoch": 0.6347261252130649, "percentage": 63.48, "elapsed_time": "21:44:47", "remaining_time": "12:30:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6890, "total_steps": 10853, "loss": 0.1369, "learning_rate": 1.6117895042090374e-06, "epoch": 0.6348182613903349, "percentage": 63.48, "elapsed_time": "21:44:58", "remaining_time": "12:30:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6891, "total_steps": 10853, "loss": 0.1277, "learning_rate": 1.6110774625485554e-06, "epoch": 0.6349103975676049, "percentage": 63.49, "elapsed_time": "21:45:09", "remaining_time": "12:30:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6892, "total_steps": 10853, "loss": 0.1293, "learning_rate": 1.6103655034246256e-06, "epoch": 0.6350025337448749, "percentage": 63.5, "elapsed_time": "21:45:19", "remaining_time": "12:30:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6893, "total_steps": 10853, "loss": 0.1253, "learning_rate": 1.6096536269033557e-06, "epoch": 0.6350946699221449, "percentage": 63.51, "elapsed_time": "21:45:30", "remaining_time": "12:30:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6894, "total_steps": 10853, "loss": 0.1303, "learning_rate": 1.6089418330508427e-06, "epoch": 0.6351868060994149, "percentage": 63.52, "elapsed_time": "21:45:40", "remaining_time": "12:29:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6895, "total_steps": 10853, "loss": 0.1361, "learning_rate": 1.6082301219331754e-06, "epoch": 0.6352789422766849, "percentage": 63.53, "elapsed_time": "21:45:51", "remaining_time": "12:29:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6896, "total_steps": 10853, "loss": 0.1186, "learning_rate": 1.6075184936164377e-06, "epoch": 0.6353710784539549, "percentage": 63.54, "elapsed_time": "21:46:02", "remaining_time": "12:29:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6897, "total_steps": 10853, "loss": 0.1283, "learning_rate": 1.606806948166703e-06, "epoch": 0.6354632146312249, "percentage": 63.55, "elapsed_time": "21:46:12", "remaining_time": "12:29:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6898, "total_steps": 10853, "loss": 0.1385, "learning_rate": 1.606095485650041e-06, "epoch": 0.6355553508084949, "percentage": 63.56, "elapsed_time": "21:46:24", "remaining_time": "12:29:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6899, "total_steps": 10853, "loss": 0.1298, "learning_rate": 1.6053841061325086e-06, "epoch": 0.635647486985765, "percentage": 63.57, "elapsed_time": "21:46:34", "remaining_time": "12:28:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6900, "total_steps": 10853, "loss": 0.1357, "learning_rate": 1.6046728096801575e-06, "epoch": 0.635739623163035, "percentage": 63.58, "elapsed_time": "21:46:45", "remaining_time": "12:28:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6901, "total_steps": 10853, "loss": 0.126, "learning_rate": 1.6039615963590332e-06, "epoch": 0.635831759340305, "percentage": 63.59, "elapsed_time": "21:46:56", "remaining_time": "12:28:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6902, "total_steps": 10853, "loss": 0.1325, "learning_rate": 1.6032504662351713e-06, "epoch": 0.635923895517575, "percentage": 63.6, "elapsed_time": "21:47:06", "remaining_time": "12:28:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6903, "total_steps": 10853, "loss": 0.1276, "learning_rate": 1.6025394193745993e-06, "epoch": 0.636016031694845, "percentage": 63.6, "elapsed_time": "21:47:17", "remaining_time": "12:28:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6904, "total_steps": 10853, "loss": 0.1302, "learning_rate": 1.6018284558433395e-06, "epoch": 0.636108167872115, "percentage": 63.61, "elapsed_time": "21:47:28", "remaining_time": "12:27:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6905, "total_steps": 10853, "loss": 0.1273, "learning_rate": 1.6011175757074035e-06, "epoch": 0.636200304049385, "percentage": 63.62, "elapsed_time": "21:47:38", "remaining_time": "12:27:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6906, "total_steps": 10853, "loss": 0.1332, "learning_rate": 1.6004067790327983e-06, "epoch": 0.636292440226655, "percentage": 63.63, "elapsed_time": "21:47:50", "remaining_time": "12:27:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6907, "total_steps": 10853, "loss": 0.1453, "learning_rate": 1.5996960658855201e-06, "epoch": 0.636384576403925, "percentage": 63.64, "elapsed_time": "21:48:01", "remaining_time": "12:27:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6908, "total_steps": 10853, "loss": 0.136, "learning_rate": 1.5989854363315585e-06, "epoch": 0.636476712581195, "percentage": 63.65, "elapsed_time": "21:48:12", "remaining_time": "12:27:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6909, "total_steps": 10853, "loss": 0.132, "learning_rate": 1.5982748904368966e-06, "epoch": 0.636568848758465, "percentage": 63.66, "elapsed_time": "21:48:24", "remaining_time": "12:26:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6910, "total_steps": 10853, "loss": 0.1229, "learning_rate": 1.5975644282675077e-06, "epoch": 0.636660984935735, "percentage": 63.67, "elapsed_time": "21:48:36", "remaining_time": "12:26:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6911, "total_steps": 10853, "loss": 0.1399, "learning_rate": 1.5968540498893598e-06, "epoch": 0.636753121113005, "percentage": 63.68, "elapsed_time": "21:48:46", "remaining_time": "12:26:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6912, "total_steps": 10853, "loss": 0.1325, "learning_rate": 1.59614375536841e-06, "epoch": 0.6368452572902751, "percentage": 63.69, "elapsed_time": "21:48:57", "remaining_time": "12:26:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6913, "total_steps": 10853, "loss": 0.1202, "learning_rate": 1.5954335447706093e-06, "epoch": 0.6369373934675451, "percentage": 63.7, "elapsed_time": "21:49:07", "remaining_time": "12:26:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6914, "total_steps": 10853, "loss": 0.126, "learning_rate": 1.5947234181619017e-06, "epoch": 0.6370295296448151, "percentage": 63.71, "elapsed_time": "21:49:17", "remaining_time": "12:25:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6915, "total_steps": 10853, "loss": 0.1235, "learning_rate": 1.5940133756082226e-06, "epoch": 0.6371216658220851, "percentage": 63.72, "elapsed_time": "21:49:29", "remaining_time": "12:25:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6916, "total_steps": 10853, "loss": 0.1233, "learning_rate": 1.5933034171754985e-06, "epoch": 0.6372138019993551, "percentage": 63.72, "elapsed_time": "21:49:39", "remaining_time": "12:25:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6917, "total_steps": 10853, "loss": 0.1227, "learning_rate": 1.5925935429296499e-06, "epoch": 0.6373059381766251, "percentage": 63.73, "elapsed_time": "21:49:50", "remaining_time": "12:25:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6918, "total_steps": 10853, "loss": 0.1197, "learning_rate": 1.5918837529365884e-06, "epoch": 0.6373980743538951, "percentage": 63.74, "elapsed_time": "21:50:01", "remaining_time": "12:25:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6919, "total_steps": 10853, "loss": 0.1325, "learning_rate": 1.5911740472622184e-06, "epoch": 0.6374902105311651, "percentage": 63.75, "elapsed_time": "21:50:11", "remaining_time": "12:24:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6920, "total_steps": 10853, "loss": 0.1369, "learning_rate": 1.590464425972436e-06, "epoch": 0.637582346708435, "percentage": 63.76, "elapsed_time": "21:50:22", "remaining_time": "12:24:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6921, "total_steps": 10853, "loss": 0.1424, "learning_rate": 1.5897548891331288e-06, "epoch": 0.637674482885705, "percentage": 63.77, "elapsed_time": "21:50:34", "remaining_time": "12:24:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6922, "total_steps": 10853, "loss": 0.1319, "learning_rate": 1.5890454368101788e-06, "epoch": 0.637766619062975, "percentage": 63.78, "elapsed_time": "21:50:45", "remaining_time": "12:24:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6923, "total_steps": 10853, "loss": 0.1248, "learning_rate": 1.5883360690694582e-06, "epoch": 0.637858755240245, "percentage": 63.79, "elapsed_time": "21:50:56", "remaining_time": "12:24:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6924, "total_steps": 10853, "loss": 0.1156, "learning_rate": 1.587626785976831e-06, "epoch": 0.637950891417515, "percentage": 63.8, "elapsed_time": "21:51:07", "remaining_time": "12:23:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6925, "total_steps": 10853, "loss": 0.1228, "learning_rate": 1.5869175875981551e-06, "epoch": 0.638043027594785, "percentage": 63.81, "elapsed_time": "21:51:18", "remaining_time": "12:23:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6926, "total_steps": 10853, "loss": 0.1425, "learning_rate": 1.5862084739992794e-06, "epoch": 0.6381351637720551, "percentage": 63.82, "elapsed_time": "21:51:28", "remaining_time": "12:23:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6927, "total_steps": 10853, "loss": 0.1381, "learning_rate": 1.585499445246046e-06, "epoch": 0.6382272999493251, "percentage": 63.83, "elapsed_time": "21:51:40", "remaining_time": "12:23:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6928, "total_steps": 10853, "loss": 0.1414, "learning_rate": 1.584790501404287e-06, "epoch": 0.6383194361265951, "percentage": 63.83, "elapsed_time": "21:51:50", "remaining_time": "12:23:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6929, "total_steps": 10853, "loss": 0.1329, "learning_rate": 1.5840816425398282e-06, "epoch": 0.6384115723038651, "percentage": 63.84, "elapsed_time": "21:52:01", "remaining_time": "12:23:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6930, "total_steps": 10853, "loss": 0.1288, "learning_rate": 1.5833728687184868e-06, "epoch": 0.6385037084811351, "percentage": 63.85, "elapsed_time": "21:52:13", "remaining_time": "12:22:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6931, "total_steps": 10853, "loss": 0.1235, "learning_rate": 1.5826641800060755e-06, "epoch": 0.6385958446584051, "percentage": 63.86, "elapsed_time": "21:52:24", "remaining_time": "12:22:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6932, "total_steps": 10853, "loss": 0.1297, "learning_rate": 1.581955576468392e-06, "epoch": 0.6386879808356751, "percentage": 63.87, "elapsed_time": "21:52:36", "remaining_time": "12:22:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6933, "total_steps": 10853, "loss": 0.1308, "learning_rate": 1.581247058171232e-06, "epoch": 0.6387801170129451, "percentage": 63.88, "elapsed_time": "21:52:47", "remaining_time": "12:22:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6934, "total_steps": 10853, "loss": 0.1183, "learning_rate": 1.5805386251803818e-06, "epoch": 0.6388722531902151, "percentage": 63.89, "elapsed_time": "21:52:57", "remaining_time": "12:22:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6935, "total_steps": 10853, "loss": 0.1257, "learning_rate": 1.5798302775616198e-06, "epoch": 0.6389643893674851, "percentage": 63.9, "elapsed_time": "21:53:06", "remaining_time": "12:21:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6936, "total_steps": 10853, "loss": 0.1099, "learning_rate": 1.5791220153807146e-06, "epoch": 0.6390565255447551, "percentage": 63.91, "elapsed_time": "21:53:17", "remaining_time": "12:21:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6937, "total_steps": 10853, "loss": 0.1283, "learning_rate": 1.5784138387034302e-06, "epoch": 0.6391486617220251, "percentage": 63.92, "elapsed_time": "21:53:28", "remaining_time": "12:21:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6938, "total_steps": 10853, "loss": 0.1332, "learning_rate": 1.5777057475955194e-06, "epoch": 0.6392407978992951, "percentage": 63.93, "elapsed_time": "21:53:39", "remaining_time": "12:21:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6939, "total_steps": 10853, "loss": 0.1201, "learning_rate": 1.5769977421227295e-06, "epoch": 0.6393329340765652, "percentage": 63.94, "elapsed_time": "21:53:50", "remaining_time": "12:21:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6940, "total_steps": 10853, "loss": 0.1368, "learning_rate": 1.5762898223507989e-06, "epoch": 0.6394250702538352, "percentage": 63.95, "elapsed_time": "21:54:01", "remaining_time": "12:20:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6941, "total_steps": 10853, "loss": 0.1377, "learning_rate": 1.575581988345457e-06, "epoch": 0.6395172064311052, "percentage": 63.95, "elapsed_time": "21:54:11", "remaining_time": "12:20:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6942, "total_steps": 10853, "loss": 0.1277, "learning_rate": 1.5748742401724276e-06, "epoch": 0.6396093426083752, "percentage": 63.96, "elapsed_time": "21:54:23", "remaining_time": "12:20:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6943, "total_steps": 10853, "loss": 0.1288, "learning_rate": 1.5741665778974239e-06, "epoch": 0.6397014787856452, "percentage": 63.97, "elapsed_time": "21:54:32", "remaining_time": "12:20:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6944, "total_steps": 10853, "loss": 0.1309, "learning_rate": 1.5734590015861539e-06, "epoch": 0.6397936149629152, "percentage": 63.98, "elapsed_time": "21:54:45", "remaining_time": "12:20:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6945, "total_steps": 10853, "loss": 0.1398, "learning_rate": 1.5727515113043152e-06, "epoch": 0.6398857511401852, "percentage": 63.99, "elapsed_time": "21:54:55", "remaining_time": "12:19:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6946, "total_steps": 10853, "loss": 0.1145, "learning_rate": 1.5720441071175976e-06, "epoch": 0.6399778873174552, "percentage": 64.0, "elapsed_time": "21:55:07", "remaining_time": "12:19:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6947, "total_steps": 10853, "loss": 0.1225, "learning_rate": 1.5713367890916852e-06, "epoch": 0.6400700234947252, "percentage": 64.01, "elapsed_time": "21:55:16", "remaining_time": "12:19:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6948, "total_steps": 10853, "loss": 0.1173, "learning_rate": 1.5706295572922524e-06, "epoch": 0.6401621596719952, "percentage": 64.02, "elapsed_time": "21:55:27", "remaining_time": "12:19:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6949, "total_steps": 10853, "loss": 0.1382, "learning_rate": 1.5699224117849644e-06, "epoch": 0.6402542958492652, "percentage": 64.03, "elapsed_time": "21:55:39", "remaining_time": "12:19:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6950, "total_steps": 10853, "loss": 0.1172, "learning_rate": 1.569215352635481e-06, "epoch": 0.6403464320265352, "percentage": 64.04, "elapsed_time": "21:55:51", "remaining_time": "12:18:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6951, "total_steps": 10853, "loss": 0.1246, "learning_rate": 1.5685083799094513e-06, "epoch": 0.6404385682038052, "percentage": 64.05, "elapsed_time": "21:56:01", "remaining_time": "12:18:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6952, "total_steps": 10853, "loss": 0.1306, "learning_rate": 1.56780149367252e-06, "epoch": 0.6405307043810752, "percentage": 64.06, "elapsed_time": "21:56:13", "remaining_time": "12:18:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6953, "total_steps": 10853, "loss": 0.1317, "learning_rate": 1.5670946939903201e-06, "epoch": 0.6406228405583453, "percentage": 64.07, "elapsed_time": "21:56:22", "remaining_time": "12:18:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6954, "total_steps": 10853, "loss": 0.1223, "learning_rate": 1.5663879809284777e-06, "epoch": 0.6407149767356153, "percentage": 64.07, "elapsed_time": "21:56:32", "remaining_time": "12:18:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6955, "total_steps": 10853, "loss": 0.1322, "learning_rate": 1.565681354552612e-06, "epoch": 0.6408071129128853, "percentage": 64.08, "elapsed_time": "21:56:41", "remaining_time": "12:17:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6956, "total_steps": 10853, "loss": 0.1156, "learning_rate": 1.5649748149283339e-06, "epoch": 0.6408992490901553, "percentage": 64.09, "elapsed_time": "21:56:52", "remaining_time": "12:17:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6957, "total_steps": 10853, "loss": 0.1264, "learning_rate": 1.5642683621212435e-06, "epoch": 0.6409913852674253, "percentage": 64.1, "elapsed_time": "21:57:03", "remaining_time": "12:17:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6958, "total_steps": 10853, "loss": 0.1224, "learning_rate": 1.5635619961969372e-06, "epoch": 0.6410835214446953, "percentage": 64.11, "elapsed_time": "21:57:13", "remaining_time": "12:17:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6959, "total_steps": 10853, "loss": 0.1242, "learning_rate": 1.5628557172209997e-06, "epoch": 0.6411756576219653, "percentage": 64.12, "elapsed_time": "21:57:23", "remaining_time": "12:17:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6960, "total_steps": 10853, "loss": 0.1232, "learning_rate": 1.5621495252590108e-06, "epoch": 0.6412677937992353, "percentage": 64.13, "elapsed_time": "21:57:34", "remaining_time": "12:16:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6961, "total_steps": 10853, "loss": 0.1318, "learning_rate": 1.561443420376539e-06, "epoch": 0.6413599299765053, "percentage": 64.14, "elapsed_time": "21:57:45", "remaining_time": "12:16:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6962, "total_steps": 10853, "loss": 0.1142, "learning_rate": 1.560737402639146e-06, "epoch": 0.6414520661537753, "percentage": 64.15, "elapsed_time": "21:57:57", "remaining_time": "12:16:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6963, "total_steps": 10853, "loss": 0.1305, "learning_rate": 1.5600314721123866e-06, "epoch": 0.6415442023310453, "percentage": 64.16, "elapsed_time": "21:58:09", "remaining_time": "12:16:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6964, "total_steps": 10853, "loss": 0.1388, "learning_rate": 1.5593256288618067e-06, "epoch": 0.6416363385083153, "percentage": 64.17, "elapsed_time": "21:58:20", "remaining_time": "12:16:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6965, "total_steps": 10853, "loss": 0.1224, "learning_rate": 1.5586198729529422e-06, "epoch": 0.6417284746855852, "percentage": 64.18, "elapsed_time": "21:58:31", "remaining_time": "12:16:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6966, "total_steps": 10853, "loss": 0.1296, "learning_rate": 1.5579142044513248e-06, "epoch": 0.6418206108628552, "percentage": 64.19, "elapsed_time": "21:58:42", "remaining_time": "12:15:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6967, "total_steps": 10853, "loss": 0.127, "learning_rate": 1.5572086234224743e-06, "epoch": 0.6419127470401254, "percentage": 64.19, "elapsed_time": "21:58:53", "remaining_time": "12:15:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6968, "total_steps": 10853, "loss": 0.1329, "learning_rate": 1.556503129931905e-06, "epoch": 0.6420048832173954, "percentage": 64.2, "elapsed_time": "21:59:04", "remaining_time": "12:15:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6969, "total_steps": 10853, "loss": 0.1153, "learning_rate": 1.5557977240451223e-06, "epoch": 0.6420970193946653, "percentage": 64.21, "elapsed_time": "21:59:15", "remaining_time": "12:15:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6970, "total_steps": 10853, "loss": 0.127, "learning_rate": 1.5550924058276213e-06, "epoch": 0.6421891555719353, "percentage": 64.22, "elapsed_time": "21:59:26", "remaining_time": "12:15:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6971, "total_steps": 10853, "loss": 0.1355, "learning_rate": 1.5543871753448924e-06, "epoch": 0.6422812917492053, "percentage": 64.23, "elapsed_time": "21:59:37", "remaining_time": "12:14:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6972, "total_steps": 10853, "loss": 0.1134, "learning_rate": 1.5536820326624159e-06, "epoch": 0.6423734279264753, "percentage": 64.24, "elapsed_time": "21:59:47", "remaining_time": "12:14:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6973, "total_steps": 10853, "loss": 0.1255, "learning_rate": 1.5529769778456654e-06, "epoch": 0.6424655641037453, "percentage": 64.25, "elapsed_time": "21:59:58", "remaining_time": "12:14:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6974, "total_steps": 10853, "loss": 0.1338, "learning_rate": 1.5522720109601039e-06, "epoch": 0.6425577002810153, "percentage": 64.26, "elapsed_time": "22:00:09", "remaining_time": "12:14:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6975, "total_steps": 10853, "loss": 0.1239, "learning_rate": 1.5515671320711877e-06, "epoch": 0.6426498364582853, "percentage": 64.27, "elapsed_time": "22:00:20", "remaining_time": "12:14:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6976, "total_steps": 10853, "loss": 0.1302, "learning_rate": 1.5508623412443657e-06, "epoch": 0.6427419726355553, "percentage": 64.28, "elapsed_time": "22:00:33", "remaining_time": "12:13:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6977, "total_steps": 10853, "loss": 0.138, "learning_rate": 1.5501576385450785e-06, "epoch": 0.6428341088128253, "percentage": 64.29, "elapsed_time": "22:00:44", "remaining_time": "12:13:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6978, "total_steps": 10853, "loss": 0.1157, "learning_rate": 1.5494530240387552e-06, "epoch": 0.6429262449900953, "percentage": 64.3, "elapsed_time": "22:00:55", "remaining_time": "12:13:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6979, "total_steps": 10853, "loss": 0.1209, "learning_rate": 1.5487484977908219e-06, "epoch": 0.6430183811673653, "percentage": 64.3, "elapsed_time": "22:01:05", "remaining_time": "12:13:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6980, "total_steps": 10853, "loss": 0.1286, "learning_rate": 1.5480440598666918e-06, "epoch": 0.6431105173446354, "percentage": 64.31, "elapsed_time": "22:01:16", "remaining_time": "12:13:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6981, "total_steps": 10853, "loss": 0.1289, "learning_rate": 1.5473397103317748e-06, "epoch": 0.6432026535219054, "percentage": 64.32, "elapsed_time": "22:01:25", "remaining_time": "12:12:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6982, "total_steps": 10853, "loss": 0.1234, "learning_rate": 1.5466354492514675e-06, "epoch": 0.6432947896991754, "percentage": 64.33, "elapsed_time": "22:01:37", "remaining_time": "12:12:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6983, "total_steps": 10853, "loss": 0.1147, "learning_rate": 1.5459312766911607e-06, "epoch": 0.6433869258764454, "percentage": 64.34, "elapsed_time": "22:01:49", "remaining_time": "12:12:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6984, "total_steps": 10853, "loss": 0.1332, "learning_rate": 1.5452271927162381e-06, "epoch": 0.6434790620537154, "percentage": 64.35, "elapsed_time": "22:01:59", "remaining_time": "12:12:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6985, "total_steps": 10853, "loss": 0.1383, "learning_rate": 1.5445231973920744e-06, "epoch": 0.6435711982309854, "percentage": 64.36, "elapsed_time": "22:02:10", "remaining_time": "12:12:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6986, "total_steps": 10853, "loss": 0.1203, "learning_rate": 1.543819290784033e-06, "epoch": 0.6436633344082554, "percentage": 64.37, "elapsed_time": "22:02:22", "remaining_time": "12:11:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6987, "total_steps": 10853, "loss": 0.1382, "learning_rate": 1.5431154729574743e-06, "epoch": 0.6437554705855254, "percentage": 64.38, "elapsed_time": "22:02:32", "remaining_time": "12:11:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6988, "total_steps": 10853, "loss": 0.1241, "learning_rate": 1.5424117439777458e-06, "epoch": 0.6438476067627954, "percentage": 64.39, "elapsed_time": "22:02:42", "remaining_time": "12:11:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6989, "total_steps": 10853, "loss": 0.1356, "learning_rate": 1.5417081039101916e-06, "epoch": 0.6439397429400654, "percentage": 64.4, "elapsed_time": "22:02:52", "remaining_time": "12:11:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6990, "total_steps": 10853, "loss": 0.1152, "learning_rate": 1.5410045528201423e-06, "epoch": 0.6440318791173354, "percentage": 64.41, "elapsed_time": "22:03:02", "remaining_time": "12:11:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6991, "total_steps": 10853, "loss": 0.1225, "learning_rate": 1.5403010907729233e-06, "epoch": 0.6441240152946054, "percentage": 64.42, "elapsed_time": "22:03:14", "remaining_time": "12:10:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6992, "total_steps": 10853, "loss": 0.1231, "learning_rate": 1.5395977178338511e-06, "epoch": 0.6442161514718754, "percentage": 64.42, "elapsed_time": "22:03:25", "remaining_time": "12:10:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6993, "total_steps": 10853, "loss": 0.1293, "learning_rate": 1.5388944340682352e-06, "epoch": 0.6443082876491454, "percentage": 64.43, "elapsed_time": "22:03:37", "remaining_time": "12:10:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6994, "total_steps": 10853, "loss": 0.1328, "learning_rate": 1.5381912395413733e-06, "epoch": 0.6444004238264155, "percentage": 64.44, "elapsed_time": "22:03:49", "remaining_time": "12:10:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6995, "total_steps": 10853, "loss": 0.1175, "learning_rate": 1.5374881343185592e-06, "epoch": 0.6444925600036855, "percentage": 64.45, "elapsed_time": "22:04:00", "remaining_time": "12:10:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6996, "total_steps": 10853, "loss": 0.1366, "learning_rate": 1.5367851184650745e-06, "epoch": 0.6445846961809555, "percentage": 64.46, "elapsed_time": "22:04:12", "remaining_time": "12:10:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6997, "total_steps": 10853, "loss": 0.1241, "learning_rate": 1.536082192046196e-06, "epoch": 0.6446768323582255, "percentage": 64.47, "elapsed_time": "22:04:21", "remaining_time": "12:09:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6998, "total_steps": 10853, "loss": 0.124, "learning_rate": 1.53537935512719e-06, "epoch": 0.6447689685354955, "percentage": 64.48, "elapsed_time": "22:04:33", "remaining_time": "12:09:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6999, "total_steps": 10853, "loss": 0.1266, "learning_rate": 1.5346766077733138e-06, "epoch": 0.6448611047127655, "percentage": 64.49, "elapsed_time": "22:04:45", "remaining_time": "12:09:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7000, "total_steps": 10853, "loss": 0.137, "learning_rate": 1.5339739500498189e-06, "epoch": 0.6449532408900355, "percentage": 64.5, "elapsed_time": "22:04:57", "remaining_time": "12:09:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7000, "total_steps": 10853, "eval_loss": 0.1284143477678299, "epoch": 0.6449532408900355, "percentage": 64.5, "elapsed_time": "22:09:56", "remaining_time": "12:12:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7001, "total_steps": 10853, "loss": 0.124, "learning_rate": 1.5332713820219461e-06, "epoch": 0.6450453770673055, "percentage": 64.51, "elapsed_time": "22:10:08", "remaining_time": "12:11:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7002, "total_steps": 10853, "loss": 0.1278, "learning_rate": 1.5325689037549307e-06, "epoch": 0.6451375132445755, "percentage": 64.52, "elapsed_time": "22:10:17", "remaining_time": "12:11:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7003, "total_steps": 10853, "loss": 0.1294, "learning_rate": 1.531866515313996e-06, "epoch": 0.6452296494218455, "percentage": 64.53, "elapsed_time": "22:10:27", "remaining_time": "12:11:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7004, "total_steps": 10853, "loss": 0.1127, "learning_rate": 1.5311642167643592e-06, "epoch": 0.6453217855991155, "percentage": 64.54, "elapsed_time": "22:10:38", "remaining_time": "12:11:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7005, "total_steps": 10853, "loss": 0.1284, "learning_rate": 1.530462008171229e-06, "epoch": 0.6454139217763855, "percentage": 64.54, "elapsed_time": "22:10:48", "remaining_time": "12:11:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7006, "total_steps": 10853, "loss": 0.128, "learning_rate": 1.5297598895998076e-06, "epoch": 0.6455060579536555, "percentage": 64.55, "elapsed_time": "22:10:59", "remaining_time": "12:10:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7007, "total_steps": 10853, "loss": 0.1225, "learning_rate": 1.529057861115283e-06, "epoch": 0.6455981941309256, "percentage": 64.56, "elapsed_time": "22:11:09", "remaining_time": "12:10:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7008, "total_steps": 10853, "loss": 0.1292, "learning_rate": 1.5283559227828404e-06, "epoch": 0.6456903303081956, "percentage": 64.57, "elapsed_time": "22:11:20", "remaining_time": "12:10:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7009, "total_steps": 10853, "loss": 0.1184, "learning_rate": 1.5276540746676558e-06, "epoch": 0.6457824664854656, "percentage": 64.58, "elapsed_time": "22:11:30", "remaining_time": "12:10:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7010, "total_steps": 10853, "loss": 0.1319, "learning_rate": 1.5269523168348954e-06, "epoch": 0.6458746026627356, "percentage": 64.59, "elapsed_time": "22:11:39", "remaining_time": "12:10:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7011, "total_steps": 10853, "loss": 0.1259, "learning_rate": 1.5262506493497159e-06, "epoch": 0.6459667388400055, "percentage": 64.6, "elapsed_time": "22:11:49", "remaining_time": "12:09:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7012, "total_steps": 10853, "loss": 0.1288, "learning_rate": 1.525549072277269e-06, "epoch": 0.6460588750172755, "percentage": 64.61, "elapsed_time": "22:12:00", "remaining_time": "12:09:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7013, "total_steps": 10853, "loss": 0.1265, "learning_rate": 1.524847585682695e-06, "epoch": 0.6461510111945455, "percentage": 64.62, "elapsed_time": "22:12:11", "remaining_time": "12:09:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7014, "total_steps": 10853, "loss": 0.1333, "learning_rate": 1.5241461896311288e-06, "epoch": 0.6462431473718155, "percentage": 64.63, "elapsed_time": "22:12:22", "remaining_time": "12:09:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7015, "total_steps": 10853, "loss": 0.1275, "learning_rate": 1.5234448841876935e-06, "epoch": 0.6463352835490855, "percentage": 64.64, "elapsed_time": "22:12:33", "remaining_time": "12:09:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7016, "total_steps": 10853, "loss": 0.1344, "learning_rate": 1.5227436694175052e-06, "epoch": 0.6464274197263555, "percentage": 64.65, "elapsed_time": "22:12:43", "remaining_time": "12:08:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7017, "total_steps": 10853, "loss": 0.1173, "learning_rate": 1.5220425453856728e-06, "epoch": 0.6465195559036255, "percentage": 64.65, "elapsed_time": "22:12:56", "remaining_time": "12:08:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7018, "total_steps": 10853, "loss": 0.1194, "learning_rate": 1.5213415121572959e-06, "epoch": 0.6466116920808955, "percentage": 64.66, "elapsed_time": "22:13:06", "remaining_time": "12:08:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7019, "total_steps": 10853, "loss": 0.1353, "learning_rate": 1.5206405697974635e-06, "epoch": 0.6467038282581655, "percentage": 64.67, "elapsed_time": "22:13:17", "remaining_time": "12:08:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7020, "total_steps": 10853, "loss": 0.1301, "learning_rate": 1.5199397183712606e-06, "epoch": 0.6467959644354355, "percentage": 64.68, "elapsed_time": "22:13:28", "remaining_time": "12:08:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7021, "total_steps": 10853, "loss": 0.1208, "learning_rate": 1.5192389579437596e-06, "epoch": 0.6468881006127056, "percentage": 64.69, "elapsed_time": "22:13:38", "remaining_time": "12:07:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7022, "total_steps": 10853, "loss": 0.13, "learning_rate": 1.5185382885800282e-06, "epoch": 0.6469802367899756, "percentage": 64.7, "elapsed_time": "22:13:51", "remaining_time": "12:07:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7023, "total_steps": 10853, "loss": 0.1284, "learning_rate": 1.5178377103451213e-06, "epoch": 0.6470723729672456, "percentage": 64.71, "elapsed_time": "22:14:03", "remaining_time": "12:07:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7024, "total_steps": 10853, "loss": 0.1427, "learning_rate": 1.5171372233040887e-06, "epoch": 0.6471645091445156, "percentage": 64.72, "elapsed_time": "22:14:13", "remaining_time": "12:07:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7025, "total_steps": 10853, "loss": 0.1308, "learning_rate": 1.516436827521971e-06, "epoch": 0.6472566453217856, "percentage": 64.73, "elapsed_time": "22:14:23", "remaining_time": "12:07:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7026, "total_steps": 10853, "loss": 0.1233, "learning_rate": 1.5157365230637993e-06, "epoch": 0.6473487814990556, "percentage": 64.74, "elapsed_time": "22:14:35", "remaining_time": "12:06:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7027, "total_steps": 10853, "loss": 0.133, "learning_rate": 1.5150363099945984e-06, "epoch": 0.6474409176763256, "percentage": 64.75, "elapsed_time": "22:14:45", "remaining_time": "12:06:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7028, "total_steps": 10853, "loss": 0.1379, "learning_rate": 1.5143361883793814e-06, "epoch": 0.6475330538535956, "percentage": 64.76, "elapsed_time": "22:14:57", "remaining_time": "12:06:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7029, "total_steps": 10853, "loss": 0.1252, "learning_rate": 1.513636158283155e-06, "epoch": 0.6476251900308656, "percentage": 64.77, "elapsed_time": "22:15:08", "remaining_time": "12:06:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7030, "total_steps": 10853, "loss": 0.1258, "learning_rate": 1.512936219770918e-06, "epoch": 0.6477173262081356, "percentage": 64.77, "elapsed_time": "22:15:18", "remaining_time": "12:06:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7031, "total_steps": 10853, "loss": 0.1152, "learning_rate": 1.5122363729076595e-06, "epoch": 0.6478094623854056, "percentage": 64.78, "elapsed_time": "22:15:29", "remaining_time": "12:05:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7032, "total_steps": 10853, "loss": 0.1245, "learning_rate": 1.5115366177583596e-06, "epoch": 0.6479015985626756, "percentage": 64.79, "elapsed_time": "22:15:38", "remaining_time": "12:05:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7033, "total_steps": 10853, "loss": 0.1258, "learning_rate": 1.510836954387991e-06, "epoch": 0.6479937347399456, "percentage": 64.8, "elapsed_time": "22:15:49", "remaining_time": "12:05:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7034, "total_steps": 10853, "loss": 0.1286, "learning_rate": 1.5101373828615172e-06, "epoch": 0.6480858709172156, "percentage": 64.81, "elapsed_time": "22:16:00", "remaining_time": "12:05:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7035, "total_steps": 10853, "loss": 0.1309, "learning_rate": 1.5094379032438956e-06, "epoch": 0.6481780070944857, "percentage": 64.82, "elapsed_time": "22:16:12", "remaining_time": "12:05:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7036, "total_steps": 10853, "loss": 0.1213, "learning_rate": 1.50873851560007e-06, "epoch": 0.6482701432717557, "percentage": 64.83, "elapsed_time": "22:16:25", "remaining_time": "12:05:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7037, "total_steps": 10853, "loss": 0.1277, "learning_rate": 1.50803921999498e-06, "epoch": 0.6483622794490257, "percentage": 64.84, "elapsed_time": "22:16:36", "remaining_time": "12:04:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7038, "total_steps": 10853, "loss": 0.1098, "learning_rate": 1.5073400164935554e-06, "epoch": 0.6484544156262957, "percentage": 64.85, "elapsed_time": "22:16:46", "remaining_time": "12:04:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7039, "total_steps": 10853, "loss": 0.1283, "learning_rate": 1.5066409051607175e-06, "epoch": 0.6485465518035657, "percentage": 64.86, "elapsed_time": "22:16:56", "remaining_time": "12:04:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7040, "total_steps": 10853, "loss": 0.1239, "learning_rate": 1.5059418860613779e-06, "epoch": 0.6486386879808357, "percentage": 64.87, "elapsed_time": "22:17:06", "remaining_time": "12:04:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7041, "total_steps": 10853, "loss": 0.1346, "learning_rate": 1.5052429592604411e-06, "epoch": 0.6487308241581057, "percentage": 64.88, "elapsed_time": "22:17:16", "remaining_time": "12:04:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7042, "total_steps": 10853, "loss": 0.1346, "learning_rate": 1.5045441248228024e-06, "epoch": 0.6488229603353757, "percentage": 64.89, "elapsed_time": "22:17:28", "remaining_time": "12:03:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7043, "total_steps": 10853, "loss": 0.1408, "learning_rate": 1.5038453828133498e-06, "epoch": 0.6489150965126457, "percentage": 64.89, "elapsed_time": "22:17:38", "remaining_time": "12:03:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7044, "total_steps": 10853, "loss": 0.1397, "learning_rate": 1.50314673329696e-06, "epoch": 0.6490072326899157, "percentage": 64.9, "elapsed_time": "22:17:49", "remaining_time": "12:03:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7045, "total_steps": 10853, "loss": 0.1207, "learning_rate": 1.502448176338503e-06, "epoch": 0.6490993688671857, "percentage": 64.91, "elapsed_time": "22:18:00", "remaining_time": "12:03:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7046, "total_steps": 10853, "loss": 0.1296, "learning_rate": 1.5017497120028404e-06, "epoch": 0.6491915050444557, "percentage": 64.92, "elapsed_time": "22:18:11", "remaining_time": "12:03:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7047, "total_steps": 10853, "loss": 0.1255, "learning_rate": 1.5010513403548253e-06, "epoch": 0.6492836412217257, "percentage": 64.93, "elapsed_time": "22:18:22", "remaining_time": "12:02:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7048, "total_steps": 10853, "loss": 0.1323, "learning_rate": 1.5003530614592995e-06, "epoch": 0.6493757773989958, "percentage": 64.94, "elapsed_time": "22:18:33", "remaining_time": "12:02:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7049, "total_steps": 10853, "loss": 0.1355, "learning_rate": 1.4996548753811001e-06, "epoch": 0.6494679135762658, "percentage": 64.95, "elapsed_time": "22:18:43", "remaining_time": "12:02:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7050, "total_steps": 10853, "loss": 0.1211, "learning_rate": 1.4989567821850527e-06, "epoch": 0.6495600497535358, "percentage": 64.96, "elapsed_time": "22:18:54", "remaining_time": "12:02:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7051, "total_steps": 10853, "loss": 0.1253, "learning_rate": 1.4982587819359767e-06, "epoch": 0.6496521859308058, "percentage": 64.97, "elapsed_time": "22:19:04", "remaining_time": "12:02:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7052, "total_steps": 10853, "loss": 0.1296, "learning_rate": 1.4975608746986802e-06, "epoch": 0.6497443221080758, "percentage": 64.98, "elapsed_time": "22:19:16", "remaining_time": "12:01:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7053, "total_steps": 10853, "loss": 0.1188, "learning_rate": 1.4968630605379642e-06, "epoch": 0.6498364582853458, "percentage": 64.99, "elapsed_time": "22:19:25", "remaining_time": "12:01:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7054, "total_steps": 10853, "loss": 0.1356, "learning_rate": 1.496165339518621e-06, "epoch": 0.6499285944626157, "percentage": 65.0, "elapsed_time": "22:19:35", "remaining_time": "12:01:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7055, "total_steps": 10853, "loss": 0.1427, "learning_rate": 1.495467711705434e-06, "epoch": 0.6500207306398857, "percentage": 65.01, "elapsed_time": "22:19:45", "remaining_time": "12:01:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7056, "total_steps": 10853, "loss": 0.1214, "learning_rate": 1.4947701771631788e-06, "epoch": 0.6501128668171557, "percentage": 65.01, "elapsed_time": "22:19:57", "remaining_time": "12:01:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7057, "total_steps": 10853, "loss": 0.14, "learning_rate": 1.4940727359566205e-06, "epoch": 0.6502050029944257, "percentage": 65.02, "elapsed_time": "22:20:08", "remaining_time": "12:00:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7058, "total_steps": 10853, "loss": 0.1211, "learning_rate": 1.493375388150516e-06, "epoch": 0.6502971391716957, "percentage": 65.03, "elapsed_time": "22:20:19", "remaining_time": "12:00:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7059, "total_steps": 10853, "loss": 0.135, "learning_rate": 1.4926781338096158e-06, "epoch": 0.6503892753489657, "percentage": 65.04, "elapsed_time": "22:20:30", "remaining_time": "12:00:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7060, "total_steps": 10853, "loss": 0.1308, "learning_rate": 1.4919809729986598e-06, "epoch": 0.6504814115262357, "percentage": 65.05, "elapsed_time": "22:20:40", "remaining_time": "12:00:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7061, "total_steps": 10853, "loss": 0.116, "learning_rate": 1.491283905782378e-06, "epoch": 0.6505735477035057, "percentage": 65.06, "elapsed_time": "22:20:50", "remaining_time": "12:00:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7062, "total_steps": 10853, "loss": 0.1253, "learning_rate": 1.4905869322254946e-06, "epoch": 0.6506656838807758, "percentage": 65.07, "elapsed_time": "22:21:00", "remaining_time": "11:59:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7063, "total_steps": 10853, "loss": 0.1217, "learning_rate": 1.4898900523927224e-06, "epoch": 0.6507578200580458, "percentage": 65.08, "elapsed_time": "22:21:10", "remaining_time": "11:59:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7064, "total_steps": 10853, "loss": 0.1323, "learning_rate": 1.489193266348769e-06, "epoch": 0.6508499562353158, "percentage": 65.09, "elapsed_time": "22:21:22", "remaining_time": "11:59:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7065, "total_steps": 10853, "loss": 0.1242, "learning_rate": 1.4884965741583288e-06, "epoch": 0.6509420924125858, "percentage": 65.1, "elapsed_time": "22:21:32", "remaining_time": "11:59:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7066, "total_steps": 10853, "loss": 0.1352, "learning_rate": 1.48779997588609e-06, "epoch": 0.6510342285898558, "percentage": 65.11, "elapsed_time": "22:21:43", "remaining_time": "11:59:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7067, "total_steps": 10853, "loss": 0.1321, "learning_rate": 1.4871034715967331e-06, "epoch": 0.6511263647671258, "percentage": 65.12, "elapsed_time": "22:21:54", "remaining_time": "11:58:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7068, "total_steps": 10853, "loss": 0.1234, "learning_rate": 1.4864070613549284e-06, "epoch": 0.6512185009443958, "percentage": 65.12, "elapsed_time": "22:22:04", "remaining_time": "11:58:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7069, "total_steps": 10853, "loss": 0.1177, "learning_rate": 1.485710745225336e-06, "epoch": 0.6513106371216658, "percentage": 65.13, "elapsed_time": "22:22:15", "remaining_time": "11:58:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7070, "total_steps": 10853, "loss": 0.1207, "learning_rate": 1.4850145232726104e-06, "epoch": 0.6514027732989358, "percentage": 65.14, "elapsed_time": "22:22:26", "remaining_time": "11:58:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7071, "total_steps": 10853, "loss": 0.1262, "learning_rate": 1.4843183955613955e-06, "epoch": 0.6514949094762058, "percentage": 65.15, "elapsed_time": "22:22:37", "remaining_time": "11:58:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7072, "total_steps": 10853, "loss": 0.1188, "learning_rate": 1.4836223621563272e-06, "epoch": 0.6515870456534758, "percentage": 65.16, "elapsed_time": "22:22:49", "remaining_time": "11:57:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7073, "total_steps": 10853, "loss": 0.1319, "learning_rate": 1.4829264231220319e-06, "epoch": 0.6516791818307458, "percentage": 65.17, "elapsed_time": "22:23:01", "remaining_time": "11:57:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7074, "total_steps": 10853, "loss": 0.1248, "learning_rate": 1.4822305785231273e-06, "epoch": 0.6517713180080158, "percentage": 65.18, "elapsed_time": "22:23:13", "remaining_time": "11:57:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7075, "total_steps": 10853, "loss": 0.1353, "learning_rate": 1.4815348284242234e-06, "epoch": 0.6518634541852859, "percentage": 65.19, "elapsed_time": "22:23:25", "remaining_time": "11:57:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7076, "total_steps": 10853, "loss": 0.1353, "learning_rate": 1.4808391728899206e-06, "epoch": 0.6519555903625559, "percentage": 65.2, "elapsed_time": "22:23:36", "remaining_time": "11:57:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7077, "total_steps": 10853, "loss": 0.1279, "learning_rate": 1.4801436119848096e-06, "epoch": 0.6520477265398259, "percentage": 65.21, "elapsed_time": "22:23:46", "remaining_time": "11:56:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7078, "total_steps": 10853, "loss": 0.1232, "learning_rate": 1.4794481457734743e-06, "epoch": 0.6521398627170959, "percentage": 65.22, "elapsed_time": "22:23:58", "remaining_time": "11:56:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7079, "total_steps": 10853, "loss": 0.1279, "learning_rate": 1.478752774320488e-06, "epoch": 0.6522319988943659, "percentage": 65.23, "elapsed_time": "22:24:10", "remaining_time": "11:56:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7080, "total_steps": 10853, "loss": 0.1159, "learning_rate": 1.4780574976904174e-06, "epoch": 0.6523241350716359, "percentage": 65.24, "elapsed_time": "22:24:21", "remaining_time": "11:56:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7081, "total_steps": 10853, "loss": 0.1102, "learning_rate": 1.4773623159478178e-06, "epoch": 0.6524162712489059, "percentage": 65.24, "elapsed_time": "22:24:31", "remaining_time": "11:56:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7082, "total_steps": 10853, "loss": 0.114, "learning_rate": 1.4766672291572364e-06, "epoch": 0.6525084074261759, "percentage": 65.25, "elapsed_time": "22:24:42", "remaining_time": "11:56:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7083, "total_steps": 10853, "loss": 0.1159, "learning_rate": 1.4759722373832135e-06, "epoch": 0.6526005436034459, "percentage": 65.26, "elapsed_time": "22:24:51", "remaining_time": "11:55:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7084, "total_steps": 10853, "loss": 0.1275, "learning_rate": 1.4752773406902788e-06, "epoch": 0.6526926797807159, "percentage": 65.27, "elapsed_time": "22:25:03", "remaining_time": "11:55:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7085, "total_steps": 10853, "loss": 0.1225, "learning_rate": 1.4745825391429537e-06, "epoch": 0.6527848159579859, "percentage": 65.28, "elapsed_time": "22:25:14", "remaining_time": "11:55:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7086, "total_steps": 10853, "loss": 0.1272, "learning_rate": 1.4738878328057493e-06, "epoch": 0.6528769521352559, "percentage": 65.29, "elapsed_time": "22:25:26", "remaining_time": "11:55:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7087, "total_steps": 10853, "loss": 0.1304, "learning_rate": 1.4731932217431704e-06, "epoch": 0.6529690883125259, "percentage": 65.3, "elapsed_time": "22:25:35", "remaining_time": "11:55:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7088, "total_steps": 10853, "loss": 0.1282, "learning_rate": 1.472498706019711e-06, "epoch": 0.6530612244897959, "percentage": 65.31, "elapsed_time": "22:25:46", "remaining_time": "11:54:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7089, "total_steps": 10853, "loss": 0.1323, "learning_rate": 1.4718042856998582e-06, "epoch": 0.653153360667066, "percentage": 65.32, "elapsed_time": "22:25:58", "remaining_time": "11:54:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7090, "total_steps": 10853, "loss": 0.126, "learning_rate": 1.4711099608480878e-06, "epoch": 0.653245496844336, "percentage": 65.33, "elapsed_time": "22:26:09", "remaining_time": "11:54:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7091, "total_steps": 10853, "loss": 0.1287, "learning_rate": 1.4704157315288676e-06, "epoch": 0.653337633021606, "percentage": 65.34, "elapsed_time": "22:26:20", "remaining_time": "11:54:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7092, "total_steps": 10853, "loss": 0.1358, "learning_rate": 1.469721597806658e-06, "epoch": 0.653429769198876, "percentage": 65.35, "elapsed_time": "22:26:30", "remaining_time": "11:54:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7093, "total_steps": 10853, "loss": 0.126, "learning_rate": 1.4690275597459097e-06, "epoch": 0.653521905376146, "percentage": 65.36, "elapsed_time": "22:26:41", "remaining_time": "11:53:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7094, "total_steps": 10853, "loss": 0.1302, "learning_rate": 1.4683336174110622e-06, "epoch": 0.653614041553416, "percentage": 65.36, "elapsed_time": "22:26:51", "remaining_time": "11:53:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7095, "total_steps": 10853, "loss": 0.1223, "learning_rate": 1.4676397708665496e-06, "epoch": 0.653706177730686, "percentage": 65.37, "elapsed_time": "22:27:02", "remaining_time": "11:53:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7096, "total_steps": 10853, "loss": 0.1439, "learning_rate": 1.4669460201767954e-06, "epoch": 0.653798313907956, "percentage": 65.38, "elapsed_time": "22:27:14", "remaining_time": "11:53:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7097, "total_steps": 10853, "loss": 0.1268, "learning_rate": 1.4662523654062153e-06, "epoch": 0.653890450085226, "percentage": 65.39, "elapsed_time": "22:27:25", "remaining_time": "11:53:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7098, "total_steps": 10853, "loss": 0.132, "learning_rate": 1.4655588066192135e-06, "epoch": 0.653982586262496, "percentage": 65.4, "elapsed_time": "22:27:35", "remaining_time": "11:52:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7099, "total_steps": 10853, "loss": 0.1213, "learning_rate": 1.4648653438801876e-06, "epoch": 0.6540747224397659, "percentage": 65.41, "elapsed_time": "22:27:46", "remaining_time": "11:52:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7100, "total_steps": 10853, "loss": 0.1157, "learning_rate": 1.4641719772535265e-06, "epoch": 0.6541668586170359, "percentage": 65.42, "elapsed_time": "22:27:55", "remaining_time": "11:52:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7101, "total_steps": 10853, "loss": 0.1344, "learning_rate": 1.463478706803609e-06, "epoch": 0.6542589947943059, "percentage": 65.43, "elapsed_time": "22:28:05", "remaining_time": "11:52:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7102, "total_steps": 10853, "loss": 0.1218, "learning_rate": 1.4627855325948044e-06, "epoch": 0.6543511309715759, "percentage": 65.44, "elapsed_time": "22:28:16", "remaining_time": "11:52:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7103, "total_steps": 10853, "loss": 0.1363, "learning_rate": 1.462092454691475e-06, "epoch": 0.654443267148846, "percentage": 65.45, "elapsed_time": "22:28:27", "remaining_time": "11:51:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7104, "total_steps": 10853, "loss": 0.1293, "learning_rate": 1.461399473157973e-06, "epoch": 0.654535403326116, "percentage": 65.46, "elapsed_time": "22:28:40", "remaining_time": "11:51:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7105, "total_steps": 10853, "loss": 0.1234, "learning_rate": 1.4607065880586418e-06, "epoch": 0.654627539503386, "percentage": 65.47, "elapsed_time": "22:28:50", "remaining_time": "11:51:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7106, "total_steps": 10853, "loss": 0.1248, "learning_rate": 1.4600137994578156e-06, "epoch": 0.654719675680656, "percentage": 65.47, "elapsed_time": "22:29:01", "remaining_time": "11:51:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7107, "total_steps": 10853, "loss": 0.1305, "learning_rate": 1.4593211074198202e-06, "epoch": 0.654811811857926, "percentage": 65.48, "elapsed_time": "22:29:11", "remaining_time": "11:51:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7108, "total_steps": 10853, "loss": 0.1321, "learning_rate": 1.4586285120089713e-06, "epoch": 0.654903948035196, "percentage": 65.49, "elapsed_time": "22:29:21", "remaining_time": "11:50:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7109, "total_steps": 10853, "loss": 0.1242, "learning_rate": 1.457936013289578e-06, "epoch": 0.654996084212466, "percentage": 65.5, "elapsed_time": "22:29:32", "remaining_time": "11:50:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7110, "total_steps": 10853, "loss": 0.138, "learning_rate": 1.4572436113259376e-06, "epoch": 0.655088220389736, "percentage": 65.51, "elapsed_time": "22:29:42", "remaining_time": "11:50:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7111, "total_steps": 10853, "loss": 0.1395, "learning_rate": 1.4565513061823394e-06, "epoch": 0.655180356567006, "percentage": 65.52, "elapsed_time": "22:29:53", "remaining_time": "11:50:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7112, "total_steps": 10853, "loss": 0.1288, "learning_rate": 1.4558590979230663e-06, "epoch": 0.655272492744276, "percentage": 65.53, "elapsed_time": "22:30:04", "remaining_time": "11:50:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7113, "total_steps": 10853, "loss": 0.1485, "learning_rate": 1.4551669866123868e-06, "epoch": 0.655364628921546, "percentage": 65.54, "elapsed_time": "22:30:15", "remaining_time": "11:49:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7114, "total_steps": 10853, "loss": 0.1385, "learning_rate": 1.4544749723145665e-06, "epoch": 0.655456765098816, "percentage": 65.55, "elapsed_time": "22:30:26", "remaining_time": "11:49:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7115, "total_steps": 10853, "loss": 0.1301, "learning_rate": 1.4537830550938563e-06, "epoch": 0.655548901276086, "percentage": 65.56, "elapsed_time": "22:30:37", "remaining_time": "11:49:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7116, "total_steps": 10853, "loss": 0.1304, "learning_rate": 1.453091235014502e-06, "epoch": 0.6556410374533561, "percentage": 65.57, "elapsed_time": "22:30:48", "remaining_time": "11:49:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7117, "total_steps": 10853, "loss": 0.1213, "learning_rate": 1.4523995121407402e-06, "epoch": 0.6557331736306261, "percentage": 65.58, "elapsed_time": "22:30:58", "remaining_time": "11:49:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7118, "total_steps": 10853, "loss": 0.1301, "learning_rate": 1.4517078865367968e-06, "epoch": 0.6558253098078961, "percentage": 65.59, "elapsed_time": "22:31:09", "remaining_time": "11:48:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7119, "total_steps": 10853, "loss": 0.1374, "learning_rate": 1.4510163582668876e-06, "epoch": 0.6559174459851661, "percentage": 65.59, "elapsed_time": "22:31:21", "remaining_time": "11:48:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7120, "total_steps": 10853, "loss": 0.1384, "learning_rate": 1.4503249273952224e-06, "epoch": 0.6560095821624361, "percentage": 65.6, "elapsed_time": "22:31:32", "remaining_time": "11:48:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7121, "total_steps": 10853, "loss": 0.1316, "learning_rate": 1.449633593986001e-06, "epoch": 0.6561017183397061, "percentage": 65.61, "elapsed_time": "22:31:43", "remaining_time": "11:48:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7122, "total_steps": 10853, "loss": 0.1249, "learning_rate": 1.448942358103414e-06, "epoch": 0.6561938545169761, "percentage": 65.62, "elapsed_time": "22:31:54", "remaining_time": "11:48:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7123, "total_steps": 10853, "loss": 0.1281, "learning_rate": 1.4482512198116424e-06, "epoch": 0.6562859906942461, "percentage": 65.63, "elapsed_time": "22:32:04", "remaining_time": "11:48:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7124, "total_steps": 10853, "loss": 0.1255, "learning_rate": 1.4475601791748572e-06, "epoch": 0.6563781268715161, "percentage": 65.64, "elapsed_time": "22:32:14", "remaining_time": "11:47:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7125, "total_steps": 10853, "loss": 0.1391, "learning_rate": 1.4468692362572228e-06, "epoch": 0.6564702630487861, "percentage": 65.65, "elapsed_time": "22:32:25", "remaining_time": "11:47:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7126, "total_steps": 10853, "loss": 0.1134, "learning_rate": 1.4461783911228938e-06, "epoch": 0.6565623992260561, "percentage": 65.66, "elapsed_time": "22:32:35", "remaining_time": "11:47:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7127, "total_steps": 10853, "loss": 0.1315, "learning_rate": 1.4454876438360138e-06, "epoch": 0.6566545354033261, "percentage": 65.67, "elapsed_time": "22:32:46", "remaining_time": "11:47:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7128, "total_steps": 10853, "loss": 0.143, "learning_rate": 1.4447969944607207e-06, "epoch": 0.6567466715805961, "percentage": 65.68, "elapsed_time": "22:32:55", "remaining_time": "11:47:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7129, "total_steps": 10853, "loss": 0.1223, "learning_rate": 1.444106443061139e-06, "epoch": 0.6568388077578661, "percentage": 65.69, "elapsed_time": "22:33:06", "remaining_time": "11:46:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7130, "total_steps": 10853, "loss": 0.1296, "learning_rate": 1.443415989701389e-06, "epoch": 0.6569309439351362, "percentage": 65.7, "elapsed_time": "22:33:16", "remaining_time": "11:46:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7131, "total_steps": 10853, "loss": 0.1304, "learning_rate": 1.4427256344455764e-06, "epoch": 0.6570230801124062, "percentage": 65.71, "elapsed_time": "22:33:27", "remaining_time": "11:46:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7132, "total_steps": 10853, "loss": 0.1175, "learning_rate": 1.442035377357803e-06, "epoch": 0.6571152162896762, "percentage": 65.71, "elapsed_time": "22:33:38", "remaining_time": "11:46:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7133, "total_steps": 10853, "loss": 0.1304, "learning_rate": 1.4413452185021594e-06, "epoch": 0.6572073524669462, "percentage": 65.72, "elapsed_time": "22:33:50", "remaining_time": "11:46:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7134, "total_steps": 10853, "loss": 0.1314, "learning_rate": 1.4406551579427264e-06, "epoch": 0.6572994886442162, "percentage": 65.73, "elapsed_time": "22:34:01", "remaining_time": "11:45:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7135, "total_steps": 10853, "loss": 0.1136, "learning_rate": 1.4399651957435751e-06, "epoch": 0.6573916248214862, "percentage": 65.74, "elapsed_time": "22:34:11", "remaining_time": "11:45:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7136, "total_steps": 10853, "loss": 0.1188, "learning_rate": 1.439275331968769e-06, "epoch": 0.6574837609987562, "percentage": 65.75, "elapsed_time": "22:34:22", "remaining_time": "11:45:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7137, "total_steps": 10853, "loss": 0.1298, "learning_rate": 1.4385855666823628e-06, "epoch": 0.6575758971760262, "percentage": 65.76, "elapsed_time": "22:34:32", "remaining_time": "11:45:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7138, "total_steps": 10853, "loss": 0.125, "learning_rate": 1.4378958999484021e-06, "epoch": 0.6576680333532962, "percentage": 65.77, "elapsed_time": "22:34:43", "remaining_time": "11:45:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7139, "total_steps": 10853, "loss": 0.1338, "learning_rate": 1.4372063318309213e-06, "epoch": 0.6577601695305662, "percentage": 65.78, "elapsed_time": "22:34:55", "remaining_time": "11:44:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7140, "total_steps": 10853, "loss": 0.1247, "learning_rate": 1.4365168623939458e-06, "epoch": 0.6578523057078361, "percentage": 65.79, "elapsed_time": "22:35:07", "remaining_time": "11:44:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7141, "total_steps": 10853, "loss": 0.1319, "learning_rate": 1.4358274917014942e-06, "epoch": 0.6579444418851061, "percentage": 65.8, "elapsed_time": "22:35:18", "remaining_time": "11:44:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7142, "total_steps": 10853, "loss": 0.1251, "learning_rate": 1.4351382198175745e-06, "epoch": 0.6580365780623761, "percentage": 65.81, "elapsed_time": "22:35:30", "remaining_time": "11:44:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7143, "total_steps": 10853, "loss": 0.115, "learning_rate": 1.4344490468061867e-06, "epoch": 0.6581287142396463, "percentage": 65.82, "elapsed_time": "22:35:42", "remaining_time": "11:44:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7144, "total_steps": 10853, "loss": 0.1347, "learning_rate": 1.4337599727313196e-06, "epoch": 0.6582208504169162, "percentage": 65.83, "elapsed_time": "22:35:54", "remaining_time": "11:43:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7145, "total_steps": 10853, "loss": 0.1285, "learning_rate": 1.4330709976569526e-06, "epoch": 0.6583129865941862, "percentage": 65.83, "elapsed_time": "22:36:05", "remaining_time": "11:43:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7146, "total_steps": 10853, "loss": 0.1313, "learning_rate": 1.4323821216470585e-06, "epoch": 0.6584051227714562, "percentage": 65.84, "elapsed_time": "22:36:15", "remaining_time": "11:43:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7147, "total_steps": 10853, "loss": 0.1316, "learning_rate": 1.4316933447656e-06, "epoch": 0.6584972589487262, "percentage": 65.85, "elapsed_time": "22:36:26", "remaining_time": "11:43:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7148, "total_steps": 10853, "loss": 0.1331, "learning_rate": 1.4310046670765288e-06, "epoch": 0.6585893951259962, "percentage": 65.86, "elapsed_time": "22:36:38", "remaining_time": "11:43:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7149, "total_steps": 10853, "loss": 0.1335, "learning_rate": 1.43031608864379e-06, "epoch": 0.6586815313032662, "percentage": 65.87, "elapsed_time": "22:36:48", "remaining_time": "11:42:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7150, "total_steps": 10853, "loss": 0.1274, "learning_rate": 1.4296276095313168e-06, "epoch": 0.6587736674805362, "percentage": 65.88, "elapsed_time": "22:36:57", "remaining_time": "11:42:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7151, "total_steps": 10853, "loss": 0.119, "learning_rate": 1.4289392298030362e-06, "epoch": 0.6588658036578062, "percentage": 65.89, "elapsed_time": "22:37:08", "remaining_time": "11:42:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7152, "total_steps": 10853, "loss": 0.1281, "learning_rate": 1.4282509495228622e-06, "epoch": 0.6589579398350762, "percentage": 65.9, "elapsed_time": "22:37:17", "remaining_time": "11:42:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7153, "total_steps": 10853, "loss": 0.122, "learning_rate": 1.4275627687547027e-06, "epoch": 0.6590500760123462, "percentage": 65.91, "elapsed_time": "22:37:29", "remaining_time": "11:42:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7154, "total_steps": 10853, "loss": 0.1361, "learning_rate": 1.4268746875624572e-06, "epoch": 0.6591422121896162, "percentage": 65.92, "elapsed_time": "22:37:40", "remaining_time": "11:41:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7155, "total_steps": 10853, "loss": 0.1279, "learning_rate": 1.426186706010012e-06, "epoch": 0.6592343483668862, "percentage": 65.93, "elapsed_time": "22:37:51", "remaining_time": "11:41:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7156, "total_steps": 10853, "loss": 0.1216, "learning_rate": 1.4254988241612456e-06, "epoch": 0.6593264845441562, "percentage": 65.94, "elapsed_time": "22:38:01", "remaining_time": "11:41:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7157, "total_steps": 10853, "loss": 0.1241, "learning_rate": 1.4248110420800293e-06, "epoch": 0.6594186207214263, "percentage": 65.94, "elapsed_time": "22:38:12", "remaining_time": "11:41:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7158, "total_steps": 10853, "loss": 0.1232, "learning_rate": 1.4241233598302233e-06, "epoch": 0.6595107568986963, "percentage": 65.95, "elapsed_time": "22:38:23", "remaining_time": "11:41:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7159, "total_steps": 10853, "loss": 0.1349, "learning_rate": 1.4234357774756802e-06, "epoch": 0.6596028930759663, "percentage": 65.96, "elapsed_time": "22:38:32", "remaining_time": "11:41:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7160, "total_steps": 10853, "loss": 0.1246, "learning_rate": 1.422748295080241e-06, "epoch": 0.6596950292532363, "percentage": 65.97, "elapsed_time": "22:38:44", "remaining_time": "11:40:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7161, "total_steps": 10853, "loss": 0.1195, "learning_rate": 1.4220609127077373e-06, "epoch": 0.6597871654305063, "percentage": 65.98, "elapsed_time": "22:38:55", "remaining_time": "11:40:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7162, "total_steps": 10853, "loss": 0.1328, "learning_rate": 1.4213736304219945e-06, "epoch": 0.6598793016077763, "percentage": 65.99, "elapsed_time": "22:39:05", "remaining_time": "11:40:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7163, "total_steps": 10853, "loss": 0.1263, "learning_rate": 1.4206864482868265e-06, "epoch": 0.6599714377850463, "percentage": 66.0, "elapsed_time": "22:39:16", "remaining_time": "11:40:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7164, "total_steps": 10853, "loss": 0.1315, "learning_rate": 1.4199993663660372e-06, "epoch": 0.6600635739623163, "percentage": 66.01, "elapsed_time": "22:39:28", "remaining_time": "11:40:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7165, "total_steps": 10853, "loss": 0.1255, "learning_rate": 1.419312384723423e-06, "epoch": 0.6601557101395863, "percentage": 66.02, "elapsed_time": "22:39:39", "remaining_time": "11:39:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7166, "total_steps": 10853, "loss": 0.1114, "learning_rate": 1.4186255034227714e-06, "epoch": 0.6602478463168563, "percentage": 66.03, "elapsed_time": "22:39:49", "remaining_time": "11:39:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7167, "total_steps": 10853, "loss": 0.1116, "learning_rate": 1.4179387225278568e-06, "epoch": 0.6603399824941263, "percentage": 66.04, "elapsed_time": "22:39:58", "remaining_time": "11:39:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7168, "total_steps": 10853, "loss": 0.1269, "learning_rate": 1.4172520421024493e-06, "epoch": 0.6604321186713963, "percentage": 66.05, "elapsed_time": "22:40:07", "remaining_time": "11:39:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7169, "total_steps": 10853, "loss": 0.1206, "learning_rate": 1.4165654622103054e-06, "epoch": 0.6605242548486663, "percentage": 66.06, "elapsed_time": "22:40:18", "remaining_time": "11:39:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7170, "total_steps": 10853, "loss": 0.1203, "learning_rate": 1.4158789829151747e-06, "epoch": 0.6606163910259364, "percentage": 66.06, "elapsed_time": "22:40:29", "remaining_time": "11:38:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7171, "total_steps": 10853, "loss": 0.1147, "learning_rate": 1.4151926042807985e-06, "epoch": 0.6607085272032064, "percentage": 66.07, "elapsed_time": "22:40:40", "remaining_time": "11:38:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7172, "total_steps": 10853, "loss": 0.1421, "learning_rate": 1.4145063263709056e-06, "epoch": 0.6608006633804764, "percentage": 66.08, "elapsed_time": "22:40:52", "remaining_time": "11:38:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7173, "total_steps": 10853, "loss": 0.1311, "learning_rate": 1.413820149249216e-06, "epoch": 0.6608927995577464, "percentage": 66.09, "elapsed_time": "22:41:02", "remaining_time": "11:38:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7174, "total_steps": 10853, "loss": 0.1288, "learning_rate": 1.4131340729794424e-06, "epoch": 0.6609849357350164, "percentage": 66.1, "elapsed_time": "22:41:14", "remaining_time": "11:38:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7175, "total_steps": 10853, "loss": 0.1257, "learning_rate": 1.4124480976252872e-06, "epoch": 0.6610770719122864, "percentage": 66.11, "elapsed_time": "22:41:25", "remaining_time": "11:37:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7176, "total_steps": 10853, "loss": 0.1186, "learning_rate": 1.4117622232504442e-06, "epoch": 0.6611692080895564, "percentage": 66.12, "elapsed_time": "22:41:36", "remaining_time": "11:37:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7177, "total_steps": 10853, "loss": 0.1368, "learning_rate": 1.4110764499185957e-06, "epoch": 0.6612613442668264, "percentage": 66.13, "elapsed_time": "22:41:46", "remaining_time": "11:37:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7178, "total_steps": 10853, "loss": 0.1287, "learning_rate": 1.410390777693415e-06, "epoch": 0.6613534804440964, "percentage": 66.14, "elapsed_time": "22:41:56", "remaining_time": "11:37:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7179, "total_steps": 10853, "loss": 0.1223, "learning_rate": 1.409705206638568e-06, "epoch": 0.6614456166213664, "percentage": 66.15, "elapsed_time": "22:42:08", "remaining_time": "11:37:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7180, "total_steps": 10853, "loss": 0.1313, "learning_rate": 1.409019736817711e-06, "epoch": 0.6615377527986364, "percentage": 66.16, "elapsed_time": "22:42:18", "remaining_time": "11:36:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7181, "total_steps": 10853, "loss": 0.14, "learning_rate": 1.4083343682944878e-06, "epoch": 0.6616298889759064, "percentage": 66.17, "elapsed_time": "22:42:30", "remaining_time": "11:36:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7182, "total_steps": 10853, "loss": 0.1366, "learning_rate": 1.4076491011325372e-06, "epoch": 0.6617220251531764, "percentage": 66.18, "elapsed_time": "22:42:40", "remaining_time": "11:36:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7183, "total_steps": 10853, "loss": 0.1335, "learning_rate": 1.4069639353954837e-06, "epoch": 0.6618141613304463, "percentage": 66.18, "elapsed_time": "22:42:51", "remaining_time": "11:36:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7184, "total_steps": 10853, "loss": 0.1259, "learning_rate": 1.4062788711469478e-06, "epoch": 0.6619062975077165, "percentage": 66.19, "elapsed_time": "22:43:01", "remaining_time": "11:36:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7185, "total_steps": 10853, "loss": 0.1272, "learning_rate": 1.405593908450535e-06, "epoch": 0.6619984336849865, "percentage": 66.2, "elapsed_time": "22:43:12", "remaining_time": "11:35:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7186, "total_steps": 10853, "loss": 0.1238, "learning_rate": 1.4049090473698457e-06, "epoch": 0.6620905698622565, "percentage": 66.21, "elapsed_time": "22:43:21", "remaining_time": "11:35:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7187, "total_steps": 10853, "loss": 0.1282, "learning_rate": 1.4042242879684703e-06, "epoch": 0.6621827060395264, "percentage": 66.22, "elapsed_time": "22:43:32", "remaining_time": "11:35:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7188, "total_steps": 10853, "loss": 0.121, "learning_rate": 1.403539630309988e-06, "epoch": 0.6622748422167964, "percentage": 66.23, "elapsed_time": "22:43:42", "remaining_time": "11:35:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7189, "total_steps": 10853, "loss": 0.1236, "learning_rate": 1.4028550744579677e-06, "epoch": 0.6623669783940664, "percentage": 66.24, "elapsed_time": "22:43:53", "remaining_time": "11:35:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7190, "total_steps": 10853, "loss": 0.1263, "learning_rate": 1.4021706204759716e-06, "epoch": 0.6624591145713364, "percentage": 66.25, "elapsed_time": "22:44:04", "remaining_time": "11:34:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7191, "total_steps": 10853, "loss": 0.1319, "learning_rate": 1.4014862684275522e-06, "epoch": 0.6625512507486064, "percentage": 66.26, "elapsed_time": "22:44:15", "remaining_time": "11:34:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7192, "total_steps": 10853, "loss": 0.1287, "learning_rate": 1.4008020183762513e-06, "epoch": 0.6626433869258764, "percentage": 66.27, "elapsed_time": "22:44:25", "remaining_time": "11:34:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7193, "total_steps": 10853, "loss": 0.1249, "learning_rate": 1.4001178703856016e-06, "epoch": 0.6627355231031464, "percentage": 66.28, "elapsed_time": "22:44:36", "remaining_time": "11:34:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7194, "total_steps": 10853, "loss": 0.1298, "learning_rate": 1.3994338245191249e-06, "epoch": 0.6628276592804164, "percentage": 66.29, "elapsed_time": "22:44:45", "remaining_time": "11:34:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7195, "total_steps": 10853, "loss": 0.1291, "learning_rate": 1.398749880840336e-06, "epoch": 0.6629197954576864, "percentage": 66.3, "elapsed_time": "22:44:56", "remaining_time": "11:33:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7196, "total_steps": 10853, "loss": 0.128, "learning_rate": 1.3980660394127394e-06, "epoch": 0.6630119316349564, "percentage": 66.3, "elapsed_time": "22:45:07", "remaining_time": "11:33:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7197, "total_steps": 10853, "loss": 0.1248, "learning_rate": 1.3973823002998305e-06, "epoch": 0.6631040678122264, "percentage": 66.31, "elapsed_time": "22:45:19", "remaining_time": "11:33:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7198, "total_steps": 10853, "loss": 0.1019, "learning_rate": 1.3966986635650936e-06, "epoch": 0.6631962039894965, "percentage": 66.32, "elapsed_time": "22:45:30", "remaining_time": "11:33:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7199, "total_steps": 10853, "loss": 0.1225, "learning_rate": 1.3960151292720039e-06, "epoch": 0.6632883401667665, "percentage": 66.33, "elapsed_time": "22:45:40", "remaining_time": "11:33:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7200, "total_steps": 10853, "loss": 0.1252, "learning_rate": 1.395331697484028e-06, "epoch": 0.6633804763440365, "percentage": 66.34, "elapsed_time": "22:45:51", "remaining_time": "11:32:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7201, "total_steps": 10853, "loss": 0.1179, "learning_rate": 1.394648368264624e-06, "epoch": 0.6634726125213065, "percentage": 66.35, "elapsed_time": "22:46:01", "remaining_time": "11:32:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7202, "total_steps": 10853, "loss": 0.1227, "learning_rate": 1.3939651416772365e-06, "epoch": 0.6635647486985765, "percentage": 66.36, "elapsed_time": "22:46:13", "remaining_time": "11:32:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7203, "total_steps": 10853, "loss": 0.1238, "learning_rate": 1.3932820177853062e-06, "epoch": 0.6636568848758465, "percentage": 66.37, "elapsed_time": "22:46:24", "remaining_time": "11:32:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7204, "total_steps": 10853, "loss": 0.1268, "learning_rate": 1.3925989966522585e-06, "epoch": 0.6637490210531165, "percentage": 66.38, "elapsed_time": "22:46:34", "remaining_time": "11:32:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7205, "total_steps": 10853, "loss": 0.1215, "learning_rate": 1.391916078341514e-06, "epoch": 0.6638411572303865, "percentage": 66.39, "elapsed_time": "22:46:43", "remaining_time": "11:31:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7206, "total_steps": 10853, "loss": 0.1179, "learning_rate": 1.3912332629164798e-06, "epoch": 0.6639332934076565, "percentage": 66.4, "elapsed_time": "22:46:54", "remaining_time": "11:31:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7207, "total_steps": 10853, "loss": 0.124, "learning_rate": 1.3905505504405567e-06, "epoch": 0.6640254295849265, "percentage": 66.41, "elapsed_time": "22:47:05", "remaining_time": "11:31:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7208, "total_steps": 10853, "loss": 0.1283, "learning_rate": 1.3898679409771355e-06, "epoch": 0.6641175657621965, "percentage": 66.41, "elapsed_time": "22:47:16", "remaining_time": "11:31:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7209, "total_steps": 10853, "loss": 0.1266, "learning_rate": 1.389185434589595e-06, "epoch": 0.6642097019394665, "percentage": 66.42, "elapsed_time": "22:47:27", "remaining_time": "11:31:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7210, "total_steps": 10853, "loss": 0.1196, "learning_rate": 1.3885030313413056e-06, "epoch": 0.6643018381167365, "percentage": 66.43, "elapsed_time": "22:47:38", "remaining_time": "11:31:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7211, "total_steps": 10853, "loss": 0.1351, "learning_rate": 1.3878207312956295e-06, "epoch": 0.6643939742940066, "percentage": 66.44, "elapsed_time": "22:47:48", "remaining_time": "11:30:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7212, "total_steps": 10853, "loss": 0.1323, "learning_rate": 1.3871385345159183e-06, "epoch": 0.6644861104712766, "percentage": 66.45, "elapsed_time": "22:47:58", "remaining_time": "11:30:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7213, "total_steps": 10853, "loss": 0.1225, "learning_rate": 1.3864564410655149e-06, "epoch": 0.6645782466485466, "percentage": 66.46, "elapsed_time": "22:48:09", "remaining_time": "11:30:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7214, "total_steps": 10853, "loss": 0.125, "learning_rate": 1.3857744510077507e-06, "epoch": 0.6646703828258166, "percentage": 66.47, "elapsed_time": "22:48:20", "remaining_time": "11:30:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7215, "total_steps": 10853, "loss": 0.1413, "learning_rate": 1.3850925644059475e-06, "epoch": 0.6647625190030866, "percentage": 66.48, "elapsed_time": "22:48:31", "remaining_time": "11:30:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7216, "total_steps": 10853, "loss": 0.1317, "learning_rate": 1.3844107813234197e-06, "epoch": 0.6648546551803566, "percentage": 66.49, "elapsed_time": "22:48:43", "remaining_time": "11:29:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7217, "total_steps": 10853, "loss": 0.1327, "learning_rate": 1.3837291018234723e-06, "epoch": 0.6649467913576266, "percentage": 66.5, "elapsed_time": "22:48:54", "remaining_time": "11:29:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7218, "total_steps": 10853, "loss": 0.1324, "learning_rate": 1.3830475259693964e-06, "epoch": 0.6650389275348966, "percentage": 66.51, "elapsed_time": "22:49:05", "remaining_time": "11:29:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7219, "total_steps": 10853, "loss": 0.114, "learning_rate": 1.3823660538244793e-06, "epoch": 0.6651310637121666, "percentage": 66.52, "elapsed_time": "22:49:16", "remaining_time": "11:29:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7220, "total_steps": 10853, "loss": 0.1366, "learning_rate": 1.3816846854519934e-06, "epoch": 0.6652231998894366, "percentage": 66.53, "elapsed_time": "22:49:26", "remaining_time": "11:29:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7221, "total_steps": 10853, "loss": 0.1224, "learning_rate": 1.3810034209152057e-06, "epoch": 0.6653153360667066, "percentage": 66.53, "elapsed_time": "22:49:38", "remaining_time": "11:28:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7222, "total_steps": 10853, "loss": 0.1209, "learning_rate": 1.3803222602773696e-06, "epoch": 0.6654074722439766, "percentage": 66.54, "elapsed_time": "22:49:48", "remaining_time": "11:28:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7223, "total_steps": 10853, "loss": 0.1295, "learning_rate": 1.379641203601732e-06, "epoch": 0.6654996084212466, "percentage": 66.55, "elapsed_time": "22:49:59", "remaining_time": "11:28:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7224, "total_steps": 10853, "loss": 0.126, "learning_rate": 1.3789602509515306e-06, "epoch": 0.6655917445985166, "percentage": 66.56, "elapsed_time": "22:50:10", "remaining_time": "11:28:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7225, "total_steps": 10853, "loss": 0.1271, "learning_rate": 1.3782794023899899e-06, "epoch": 0.6656838807757867, "percentage": 66.57, "elapsed_time": "22:50:19", "remaining_time": "11:28:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7226, "total_steps": 10853, "loss": 0.111, "learning_rate": 1.3775986579803276e-06, "epoch": 0.6657760169530567, "percentage": 66.58, "elapsed_time": "22:50:30", "remaining_time": "11:27:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7227, "total_steps": 10853, "loss": 0.1267, "learning_rate": 1.37691801778575e-06, "epoch": 0.6658681531303267, "percentage": 66.59, "elapsed_time": "22:50:41", "remaining_time": "11:27:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7228, "total_steps": 10853, "loss": 0.1273, "learning_rate": 1.3762374818694558e-06, "epoch": 0.6659602893075967, "percentage": 66.6, "elapsed_time": "22:50:52", "remaining_time": "11:27:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7229, "total_steps": 10853, "loss": 0.135, "learning_rate": 1.3755570502946324e-06, "epoch": 0.6660524254848667, "percentage": 66.61, "elapsed_time": "22:51:03", "remaining_time": "11:27:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7230, "total_steps": 10853, "loss": 0.1295, "learning_rate": 1.3748767231244587e-06, "epoch": 0.6661445616621366, "percentage": 66.62, "elapsed_time": "22:51:14", "remaining_time": "11:27:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7231, "total_steps": 10853, "loss": 0.1201, "learning_rate": 1.3741965004221012e-06, "epoch": 0.6662366978394066, "percentage": 66.63, "elapsed_time": "22:51:24", "remaining_time": "11:26:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7232, "total_steps": 10853, "loss": 0.1425, "learning_rate": 1.3735163822507196e-06, "epoch": 0.6663288340166766, "percentage": 66.64, "elapsed_time": "22:51:36", "remaining_time": "11:26:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7233, "total_steps": 10853, "loss": 0.1097, "learning_rate": 1.372836368673463e-06, "epoch": 0.6664209701939466, "percentage": 66.65, "elapsed_time": "22:51:47", "remaining_time": "11:26:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7234, "total_steps": 10853, "loss": 0.1303, "learning_rate": 1.3721564597534723e-06, "epoch": 0.6665131063712166, "percentage": 66.65, "elapsed_time": "22:51:58", "remaining_time": "11:26:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7235, "total_steps": 10853, "loss": 0.1259, "learning_rate": 1.3714766555538755e-06, "epoch": 0.6666052425484866, "percentage": 66.66, "elapsed_time": "22:52:09", "remaining_time": "11:26:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7236, "total_steps": 10853, "loss": 0.1465, "learning_rate": 1.3707969561377915e-06, "epoch": 0.6666973787257566, "percentage": 66.67, "elapsed_time": "22:52:18", "remaining_time": "11:25:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7237, "total_steps": 10853, "loss": 0.1137, "learning_rate": 1.370117361568332e-06, "epoch": 0.6667895149030266, "percentage": 66.68, "elapsed_time": "22:52:28", "remaining_time": "11:25:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7238, "total_steps": 10853, "loss": 0.1388, "learning_rate": 1.3694378719085976e-06, "epoch": 0.6668816510802967, "percentage": 66.69, "elapsed_time": "22:52:40", "remaining_time": "11:25:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7239, "total_steps": 10853, "loss": 0.1285, "learning_rate": 1.368758487221678e-06, "epoch": 0.6669737872575667, "percentage": 66.7, "elapsed_time": "22:52:51", "remaining_time": "11:25:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7240, "total_steps": 10853, "loss": 0.1397, "learning_rate": 1.3680792075706545e-06, "epoch": 0.6670659234348367, "percentage": 66.71, "elapsed_time": "22:53:01", "remaining_time": "11:25:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7241, "total_steps": 10853, "loss": 0.1148, "learning_rate": 1.367400033018599e-06, "epoch": 0.6671580596121067, "percentage": 66.72, "elapsed_time": "22:53:13", "remaining_time": "11:25:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7242, "total_steps": 10853, "loss": 0.131, "learning_rate": 1.3667209636285727e-06, "epoch": 0.6672501957893767, "percentage": 66.73, "elapsed_time": "22:53:23", "remaining_time": "11:24:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7243, "total_steps": 10853, "loss": 0.13, "learning_rate": 1.366041999463626e-06, "epoch": 0.6673423319666467, "percentage": 66.74, "elapsed_time": "22:53:35", "remaining_time": "11:24:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7244, "total_steps": 10853, "loss": 0.1232, "learning_rate": 1.3653631405868011e-06, "epoch": 0.6674344681439167, "percentage": 66.75, "elapsed_time": "22:53:46", "remaining_time": "11:24:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7245, "total_steps": 10853, "loss": 0.1277, "learning_rate": 1.3646843870611313e-06, "epoch": 0.6675266043211867, "percentage": 66.76, "elapsed_time": "22:53:56", "remaining_time": "11:24:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7246, "total_steps": 10853, "loss": 0.1319, "learning_rate": 1.3640057389496392e-06, "epoch": 0.6676187404984567, "percentage": 66.76, "elapsed_time": "22:54:08", "remaining_time": "11:24:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7247, "total_steps": 10853, "loss": 0.1258, "learning_rate": 1.3633271963153363e-06, "epoch": 0.6677108766757267, "percentage": 66.77, "elapsed_time": "22:54:19", "remaining_time": "11:23:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7248, "total_steps": 10853, "loss": 0.1285, "learning_rate": 1.3626487592212245e-06, "epoch": 0.6678030128529967, "percentage": 66.78, "elapsed_time": "22:54:30", "remaining_time": "11:23:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7249, "total_steps": 10853, "loss": 0.1221, "learning_rate": 1.361970427730298e-06, "epoch": 0.6678951490302667, "percentage": 66.79, "elapsed_time": "22:54:41", "remaining_time": "11:23:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7250, "total_steps": 10853, "loss": 0.1278, "learning_rate": 1.3612922019055409e-06, "epoch": 0.6679872852075367, "percentage": 66.8, "elapsed_time": "22:54:51", "remaining_time": "11:23:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7251, "total_steps": 10853, "loss": 0.1283, "learning_rate": 1.3606140818099243e-06, "epoch": 0.6680794213848067, "percentage": 66.81, "elapsed_time": "22:55:01", "remaining_time": "11:23:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7252, "total_steps": 10853, "loss": 0.1173, "learning_rate": 1.3599360675064139e-06, "epoch": 0.6681715575620768, "percentage": 66.82, "elapsed_time": "22:55:13", "remaining_time": "11:22:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7253, "total_steps": 10853, "loss": 0.1243, "learning_rate": 1.359258159057961e-06, "epoch": 0.6682636937393468, "percentage": 66.83, "elapsed_time": "22:55:24", "remaining_time": "11:22:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7254, "total_steps": 10853, "loss": 0.1271, "learning_rate": 1.358580356527511e-06, "epoch": 0.6683558299166168, "percentage": 66.84, "elapsed_time": "22:55:33", "remaining_time": "11:22:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7255, "total_steps": 10853, "loss": 0.1261, "learning_rate": 1.3579026599779988e-06, "epoch": 0.6684479660938868, "percentage": 66.85, "elapsed_time": "22:55:44", "remaining_time": "11:22:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7256, "total_steps": 10853, "loss": 0.1245, "learning_rate": 1.3572250694723465e-06, "epoch": 0.6685401022711568, "percentage": 66.86, "elapsed_time": "22:55:54", "remaining_time": "11:22:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7257, "total_steps": 10853, "loss": 0.1139, "learning_rate": 1.3565475850734706e-06, "epoch": 0.6686322384484268, "percentage": 66.87, "elapsed_time": "22:56:02", "remaining_time": "11:21:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7258, "total_steps": 10853, "loss": 0.111, "learning_rate": 1.355870206844273e-06, "epoch": 0.6687243746256968, "percentage": 66.88, "elapsed_time": "22:56:14", "remaining_time": "11:21:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7259, "total_steps": 10853, "loss": 0.125, "learning_rate": 1.3551929348476512e-06, "epoch": 0.6688165108029668, "percentage": 66.88, "elapsed_time": "22:56:24", "remaining_time": "11:21:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7260, "total_steps": 10853, "loss": 0.1212, "learning_rate": 1.3545157691464878e-06, "epoch": 0.6689086469802368, "percentage": 66.89, "elapsed_time": "22:56:35", "remaining_time": "11:21:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7261, "total_steps": 10853, "loss": 0.1246, "learning_rate": 1.353838709803658e-06, "epoch": 0.6690007831575068, "percentage": 66.9, "elapsed_time": "22:56:44", "remaining_time": "11:21:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7262, "total_steps": 10853, "loss": 0.1256, "learning_rate": 1.3531617568820287e-06, "epoch": 0.6690929193347768, "percentage": 66.91, "elapsed_time": "22:56:56", "remaining_time": "11:20:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7263, "total_steps": 10853, "loss": 0.1259, "learning_rate": 1.3524849104444537e-06, "epoch": 0.6691850555120468, "percentage": 66.92, "elapsed_time": "22:57:05", "remaining_time": "11:20:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7264, "total_steps": 10853, "loss": 0.1329, "learning_rate": 1.3518081705537771e-06, "epoch": 0.6692771916893168, "percentage": 66.93, "elapsed_time": "22:57:16", "remaining_time": "11:20:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7265, "total_steps": 10853, "loss": 0.1181, "learning_rate": 1.3511315372728357e-06, "epoch": 0.6693693278665868, "percentage": 66.94, "elapsed_time": "22:57:27", "remaining_time": "11:20:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7266, "total_steps": 10853, "loss": 0.1253, "learning_rate": 1.3504550106644542e-06, "epoch": 0.6694614640438569, "percentage": 66.95, "elapsed_time": "22:57:38", "remaining_time": "11:20:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7267, "total_steps": 10853, "loss": 0.1139, "learning_rate": 1.34977859079145e-06, "epoch": 0.6695536002211269, "percentage": 66.96, "elapsed_time": "22:57:48", "remaining_time": "11:19:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7268, "total_steps": 10853, "loss": 0.1156, "learning_rate": 1.3491022777166276e-06, "epoch": 0.6696457363983969, "percentage": 66.97, "elapsed_time": "22:57:59", "remaining_time": "11:19:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7269, "total_steps": 10853, "loss": 0.1436, "learning_rate": 1.3484260715027813e-06, "epoch": 0.6697378725756669, "percentage": 66.98, "elapsed_time": "22:58:11", "remaining_time": "11:19:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7270, "total_steps": 10853, "loss": 0.1323, "learning_rate": 1.3477499722126985e-06, "epoch": 0.6698300087529369, "percentage": 66.99, "elapsed_time": "22:58:22", "remaining_time": "11:19:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7271, "total_steps": 10853, "loss": 0.1322, "learning_rate": 1.3470739799091555e-06, "epoch": 0.6699221449302069, "percentage": 67.0, "elapsed_time": "22:58:31", "remaining_time": "11:19:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7272, "total_steps": 10853, "loss": 0.1382, "learning_rate": 1.3463980946549166e-06, "epoch": 0.6700142811074769, "percentage": 67.0, "elapsed_time": "22:58:42", "remaining_time": "11:18:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7273, "total_steps": 10853, "loss": 0.1088, "learning_rate": 1.3457223165127397e-06, "epoch": 0.6701064172847468, "percentage": 67.01, "elapsed_time": "22:58:52", "remaining_time": "11:18:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7274, "total_steps": 10853, "loss": 0.1342, "learning_rate": 1.3450466455453693e-06, "epoch": 0.6701985534620168, "percentage": 67.02, "elapsed_time": "22:59:04", "remaining_time": "11:18:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7275, "total_steps": 10853, "loss": 0.1191, "learning_rate": 1.3443710818155428e-06, "epoch": 0.6702906896392868, "percentage": 67.03, "elapsed_time": "22:59:13", "remaining_time": "11:18:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7276, "total_steps": 10853, "loss": 0.1119, "learning_rate": 1.3436956253859851e-06, "epoch": 0.6703828258165568, "percentage": 67.04, "elapsed_time": "22:59:23", "remaining_time": "11:18:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7277, "total_steps": 10853, "loss": 0.1242, "learning_rate": 1.3430202763194125e-06, "epoch": 0.6704749619938268, "percentage": 67.05, "elapsed_time": "22:59:34", "remaining_time": "11:17:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7278, "total_steps": 10853, "loss": 0.1207, "learning_rate": 1.342345034678533e-06, "epoch": 0.6705670981710968, "percentage": 67.06, "elapsed_time": "22:59:46", "remaining_time": "11:17:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7279, "total_steps": 10853, "loss": 0.131, "learning_rate": 1.3416699005260416e-06, "epoch": 0.6706592343483669, "percentage": 67.07, "elapsed_time": "22:59:56", "remaining_time": "11:17:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7280, "total_steps": 10853, "loss": 0.1193, "learning_rate": 1.3409948739246236e-06, "epoch": 0.6707513705256369, "percentage": 67.08, "elapsed_time": "23:00:06", "remaining_time": "11:17:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7281, "total_steps": 10853, "loss": 0.1288, "learning_rate": 1.3403199549369564e-06, "epoch": 0.6708435067029069, "percentage": 67.09, "elapsed_time": "23:00:17", "remaining_time": "11:17:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7282, "total_steps": 10853, "loss": 0.1307, "learning_rate": 1.3396451436257062e-06, "epoch": 0.6709356428801769, "percentage": 67.1, "elapsed_time": "23:00:28", "remaining_time": "11:16:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7283, "total_steps": 10853, "loss": 0.1294, "learning_rate": 1.3389704400535303e-06, "epoch": 0.6710277790574469, "percentage": 67.11, "elapsed_time": "23:00:38", "remaining_time": "11:16:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7284, "total_steps": 10853, "loss": 0.1239, "learning_rate": 1.3382958442830737e-06, "epoch": 0.6711199152347169, "percentage": 67.12, "elapsed_time": "23:00:48", "remaining_time": "11:16:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7285, "total_steps": 10853, "loss": 0.1264, "learning_rate": 1.337621356376972e-06, "epoch": 0.6712120514119869, "percentage": 67.12, "elapsed_time": "23:00:59", "remaining_time": "11:16:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7286, "total_steps": 10853, "loss": 0.1316, "learning_rate": 1.3369469763978527e-06, "epoch": 0.6713041875892569, "percentage": 67.13, "elapsed_time": "23:01:09", "remaining_time": "11:16:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7287, "total_steps": 10853, "loss": 0.1418, "learning_rate": 1.3362727044083318e-06, "epoch": 0.6713963237665269, "percentage": 67.14, "elapsed_time": "23:01:20", "remaining_time": "11:15:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7288, "total_steps": 10853, "loss": 0.1174, "learning_rate": 1.3355985404710164e-06, "epoch": 0.6714884599437969, "percentage": 67.15, "elapsed_time": "23:01:30", "remaining_time": "11:15:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7289, "total_steps": 10853, "loss": 0.1301, "learning_rate": 1.3349244846485022e-06, "epoch": 0.6715805961210669, "percentage": 67.16, "elapsed_time": "23:01:41", "remaining_time": "11:15:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7290, "total_steps": 10853, "loss": 0.1125, "learning_rate": 1.3342505370033736e-06, "epoch": 0.6716727322983369, "percentage": 67.17, "elapsed_time": "23:01:50", "remaining_time": "11:15:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7291, "total_steps": 10853, "loss": 0.1243, "learning_rate": 1.3335766975982082e-06, "epoch": 0.6717648684756069, "percentage": 67.18, "elapsed_time": "23:01:59", "remaining_time": "11:15:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7292, "total_steps": 10853, "loss": 0.1002, "learning_rate": 1.3329029664955729e-06, "epoch": 0.6718570046528769, "percentage": 67.19, "elapsed_time": "23:02:10", "remaining_time": "11:14:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7293, "total_steps": 10853, "loss": 0.1265, "learning_rate": 1.332229343758022e-06, "epoch": 0.671949140830147, "percentage": 67.2, "elapsed_time": "23:02:19", "remaining_time": "11:14:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7294, "total_steps": 10853, "loss": 0.1257, "learning_rate": 1.331555829448103e-06, "epoch": 0.672041277007417, "percentage": 67.21, "elapsed_time": "23:02:30", "remaining_time": "11:14:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7295, "total_steps": 10853, "loss": 0.1209, "learning_rate": 1.33088242362835e-06, "epoch": 0.672133413184687, "percentage": 67.22, "elapsed_time": "23:02:43", "remaining_time": "11:14:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7296, "total_steps": 10853, "loss": 0.1174, "learning_rate": 1.3302091263612907e-06, "epoch": 0.672225549361957, "percentage": 67.23, "elapsed_time": "23:02:54", "remaining_time": "11:14:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7297, "total_steps": 10853, "loss": 0.1295, "learning_rate": 1.3295359377094392e-06, "epoch": 0.672317685539227, "percentage": 67.23, "elapsed_time": "23:03:05", "remaining_time": "11:14:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7298, "total_steps": 10853, "loss": 0.1251, "learning_rate": 1.3288628577353014e-06, "epoch": 0.672409821716497, "percentage": 67.24, "elapsed_time": "23:03:16", "remaining_time": "11:13:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7299, "total_steps": 10853, "loss": 0.1422, "learning_rate": 1.3281898865013749e-06, "epoch": 0.672501957893767, "percentage": 67.25, "elapsed_time": "23:03:26", "remaining_time": "11:13:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7300, "total_steps": 10853, "loss": 0.129, "learning_rate": 1.327517024070143e-06, "epoch": 0.672594094071037, "percentage": 67.26, "elapsed_time": "23:03:36", "remaining_time": "11:13:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7301, "total_steps": 10853, "loss": 0.1319, "learning_rate": 1.3268442705040808e-06, "epoch": 0.672686230248307, "percentage": 67.27, "elapsed_time": "23:03:48", "remaining_time": "11:13:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7302, "total_steps": 10853, "loss": 0.127, "learning_rate": 1.3261716258656543e-06, "epoch": 0.672778366425577, "percentage": 67.28, "elapsed_time": "23:03:59", "remaining_time": "11:13:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7303, "total_steps": 10853, "loss": 0.1272, "learning_rate": 1.3254990902173187e-06, "epoch": 0.672870502602847, "percentage": 67.29, "elapsed_time": "23:04:10", "remaining_time": "11:12:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7304, "total_steps": 10853, "loss": 0.125, "learning_rate": 1.3248266636215202e-06, "epoch": 0.672962638780117, "percentage": 67.3, "elapsed_time": "23:04:23", "remaining_time": "11:12:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7305, "total_steps": 10853, "loss": 0.1094, "learning_rate": 1.324154346140692e-06, "epoch": 0.673054774957387, "percentage": 67.31, "elapsed_time": "23:04:32", "remaining_time": "11:12:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7306, "total_steps": 10853, "loss": 0.1299, "learning_rate": 1.3234821378372586e-06, "epoch": 0.6731469111346571, "percentage": 67.32, "elapsed_time": "23:04:42", "remaining_time": "11:12:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7307, "total_steps": 10853, "loss": 0.1377, "learning_rate": 1.3228100387736353e-06, "epoch": 0.6732390473119271, "percentage": 67.33, "elapsed_time": "23:04:53", "remaining_time": "11:12:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7308, "total_steps": 10853, "loss": 0.1286, "learning_rate": 1.3221380490122276e-06, "epoch": 0.6733311834891971, "percentage": 67.34, "elapsed_time": "23:05:04", "remaining_time": "11:11:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7309, "total_steps": 10853, "loss": 0.1281, "learning_rate": 1.321466168615428e-06, "epoch": 0.6734233196664671, "percentage": 67.35, "elapsed_time": "23:05:15", "remaining_time": "11:11:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7310, "total_steps": 10853, "loss": 0.1281, "learning_rate": 1.3207943976456223e-06, "epoch": 0.6735154558437371, "percentage": 67.35, "elapsed_time": "23:05:24", "remaining_time": "11:11:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7311, "total_steps": 10853, "loss": 0.1258, "learning_rate": 1.3201227361651824e-06, "epoch": 0.6736075920210071, "percentage": 67.36, "elapsed_time": "23:05:36", "remaining_time": "11:11:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7312, "total_steps": 10853, "loss": 0.1188, "learning_rate": 1.3194511842364738e-06, "epoch": 0.6736997281982771, "percentage": 67.37, "elapsed_time": "23:05:46", "remaining_time": "11:11:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7313, "total_steps": 10853, "loss": 0.1274, "learning_rate": 1.3187797419218506e-06, "epoch": 0.6737918643755471, "percentage": 67.38, "elapsed_time": "23:05:58", "remaining_time": "11:10:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7314, "total_steps": 10853, "loss": 0.1361, "learning_rate": 1.3181084092836544e-06, "epoch": 0.673884000552817, "percentage": 67.39, "elapsed_time": "23:06:06", "remaining_time": "11:10:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7315, "total_steps": 10853, "loss": 0.133, "learning_rate": 1.31743718638422e-06, "epoch": 0.673976136730087, "percentage": 67.4, "elapsed_time": "23:06:17", "remaining_time": "11:10:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7316, "total_steps": 10853, "loss": 0.145, "learning_rate": 1.3167660732858705e-06, "epoch": 0.674068272907357, "percentage": 67.41, "elapsed_time": "23:06:26", "remaining_time": "11:10:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7317, "total_steps": 10853, "loss": 0.1169, "learning_rate": 1.316095070050919e-06, "epoch": 0.674160409084627, "percentage": 67.42, "elapsed_time": "23:06:37", "remaining_time": "11:10:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7318, "total_steps": 10853, "loss": 0.1266, "learning_rate": 1.3154241767416665e-06, "epoch": 0.674252545261897, "percentage": 67.43, "elapsed_time": "23:06:48", "remaining_time": "11:09:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7319, "total_steps": 10853, "loss": 0.1148, "learning_rate": 1.3147533934204065e-06, "epoch": 0.674344681439167, "percentage": 67.44, "elapsed_time": "23:06:58", "remaining_time": "11:09:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7320, "total_steps": 10853, "loss": 0.1242, "learning_rate": 1.3140827201494215e-06, "epoch": 0.6744368176164371, "percentage": 67.45, "elapsed_time": "23:07:08", "remaining_time": "11:09:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7321, "total_steps": 10853, "loss": 0.1295, "learning_rate": 1.313412156990985e-06, "epoch": 0.6745289537937071, "percentage": 67.46, "elapsed_time": "23:07:18", "remaining_time": "11:09:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7322, "total_steps": 10853, "loss": 0.136, "learning_rate": 1.312741704007357e-06, "epoch": 0.6746210899709771, "percentage": 67.47, "elapsed_time": "23:07:29", "remaining_time": "11:09:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7323, "total_steps": 10853, "loss": 0.1259, "learning_rate": 1.3120713612607888e-06, "epoch": 0.6747132261482471, "percentage": 67.47, "elapsed_time": "23:07:40", "remaining_time": "11:08:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7324, "total_steps": 10853, "loss": 0.1264, "learning_rate": 1.3114011288135225e-06, "epoch": 0.6748053623255171, "percentage": 67.48, "elapsed_time": "23:07:51", "remaining_time": "11:08:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7325, "total_steps": 10853, "loss": 0.1181, "learning_rate": 1.31073100672779e-06, "epoch": 0.6748974985027871, "percentage": 67.49, "elapsed_time": "23:08:01", "remaining_time": "11:08:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7326, "total_steps": 10853, "loss": 0.1223, "learning_rate": 1.3100609950658109e-06, "epoch": 0.6749896346800571, "percentage": 67.5, "elapsed_time": "23:08:12", "remaining_time": "11:08:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7327, "total_steps": 10853, "loss": 0.1266, "learning_rate": 1.3093910938897972e-06, "epoch": 0.6750817708573271, "percentage": 67.51, "elapsed_time": "23:08:23", "remaining_time": "11:08:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7328, "total_steps": 10853, "loss": 0.117, "learning_rate": 1.3087213032619478e-06, "epoch": 0.6751739070345971, "percentage": 67.52, "elapsed_time": "23:08:34", "remaining_time": "11:07:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7329, "total_steps": 10853, "loss": 0.1212, "learning_rate": 1.3080516232444545e-06, "epoch": 0.6752660432118671, "percentage": 67.53, "elapsed_time": "23:08:46", "remaining_time": "11:07:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7330, "total_steps": 10853, "loss": 0.1307, "learning_rate": 1.3073820538994952e-06, "epoch": 0.6753581793891371, "percentage": 67.54, "elapsed_time": "23:08:57", "remaining_time": "11:07:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7331, "total_steps": 10853, "loss": 0.1074, "learning_rate": 1.3067125952892408e-06, "epoch": 0.6754503155664071, "percentage": 67.55, "elapsed_time": "23:09:09", "remaining_time": "11:07:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7332, "total_steps": 10853, "loss": 0.1121, "learning_rate": 1.3060432474758508e-06, "epoch": 0.6755424517436771, "percentage": 67.56, "elapsed_time": "23:09:20", "remaining_time": "11:07:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7333, "total_steps": 10853, "loss": 0.1374, "learning_rate": 1.3053740105214741e-06, "epoch": 0.6756345879209471, "percentage": 67.57, "elapsed_time": "23:09:31", "remaining_time": "11:07:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7334, "total_steps": 10853, "loss": 0.1158, "learning_rate": 1.3047048844882481e-06, "epoch": 0.6757267240982172, "percentage": 67.58, "elapsed_time": "23:09:42", "remaining_time": "11:06:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7335, "total_steps": 10853, "loss": 0.111, "learning_rate": 1.304035869438302e-06, "epoch": 0.6758188602754872, "percentage": 67.58, "elapsed_time": "23:09:52", "remaining_time": "11:06:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7336, "total_steps": 10853, "loss": 0.1406, "learning_rate": 1.3033669654337544e-06, "epoch": 0.6759109964527572, "percentage": 67.59, "elapsed_time": "23:10:03", "remaining_time": "11:06:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7337, "total_steps": 10853, "loss": 0.1214, "learning_rate": 1.302698172536714e-06, "epoch": 0.6760031326300272, "percentage": 67.6, "elapsed_time": "23:10:14", "remaining_time": "11:06:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7338, "total_steps": 10853, "loss": 0.1255, "learning_rate": 1.3020294908092767e-06, "epoch": 0.6760952688072972, "percentage": 67.61, "elapsed_time": "23:10:25", "remaining_time": "11:06:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7339, "total_steps": 10853, "loss": 0.1268, "learning_rate": 1.3013609203135297e-06, "epoch": 0.6761874049845672, "percentage": 67.62, "elapsed_time": "23:10:33", "remaining_time": "11:05:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7340, "total_steps": 10853, "loss": 0.1238, "learning_rate": 1.3006924611115495e-06, "epoch": 0.6762795411618372, "percentage": 67.63, "elapsed_time": "23:10:43", "remaining_time": "11:05:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7341, "total_steps": 10853, "loss": 0.1232, "learning_rate": 1.300024113265404e-06, "epoch": 0.6763716773391072, "percentage": 67.64, "elapsed_time": "23:10:53", "remaining_time": "11:05:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7342, "total_steps": 10853, "loss": 0.1262, "learning_rate": 1.2993558768371494e-06, "epoch": 0.6764638135163772, "percentage": 67.65, "elapsed_time": "23:11:04", "remaining_time": "11:05:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7343, "total_steps": 10853, "loss": 0.1272, "learning_rate": 1.2986877518888307e-06, "epoch": 0.6765559496936472, "percentage": 67.66, "elapsed_time": "23:11:14", "remaining_time": "11:05:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7344, "total_steps": 10853, "loss": 0.1189, "learning_rate": 1.2980197384824828e-06, "epoch": 0.6766480858709172, "percentage": 67.67, "elapsed_time": "23:11:25", "remaining_time": "11:04:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7345, "total_steps": 10853, "loss": 0.1124, "learning_rate": 1.2973518366801315e-06, "epoch": 0.6767402220481872, "percentage": 67.68, "elapsed_time": "23:11:37", "remaining_time": "11:04:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7346, "total_steps": 10853, "loss": 0.1333, "learning_rate": 1.2966840465437923e-06, "epoch": 0.6768323582254572, "percentage": 67.69, "elapsed_time": "23:11:48", "remaining_time": "11:04:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7347, "total_steps": 10853, "loss": 0.1216, "learning_rate": 1.2960163681354683e-06, "epoch": 0.6769244944027273, "percentage": 67.7, "elapsed_time": "23:11:59", "remaining_time": "11:04:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7348, "total_steps": 10853, "loss": 0.1186, "learning_rate": 1.2953488015171551e-06, "epoch": 0.6770166305799973, "percentage": 67.7, "elapsed_time": "23:12:11", "remaining_time": "11:04:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7349, "total_steps": 10853, "loss": 0.1117, "learning_rate": 1.294681346750834e-06, "epoch": 0.6771087667572673, "percentage": 67.71, "elapsed_time": "23:12:22", "remaining_time": "11:03:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7350, "total_steps": 10853, "loss": 0.1212, "learning_rate": 1.294014003898481e-06, "epoch": 0.6772009029345373, "percentage": 67.72, "elapsed_time": "23:12:33", "remaining_time": "11:03:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7351, "total_steps": 10853, "loss": 0.1429, "learning_rate": 1.2933467730220562e-06, "epoch": 0.6772930391118073, "percentage": 67.73, "elapsed_time": "23:12:44", "remaining_time": "11:03:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7352, "total_steps": 10853, "loss": 0.1338, "learning_rate": 1.2926796541835135e-06, "epoch": 0.6773851752890773, "percentage": 67.74, "elapsed_time": "23:12:55", "remaining_time": "11:03:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7353, "total_steps": 10853, "loss": 0.1153, "learning_rate": 1.2920126474447957e-06, "epoch": 0.6774773114663473, "percentage": 67.75, "elapsed_time": "23:13:06", "remaining_time": "11:03:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7354, "total_steps": 10853, "loss": 0.1418, "learning_rate": 1.2913457528678335e-06, "epoch": 0.6775694476436173, "percentage": 67.76, "elapsed_time": "23:13:17", "remaining_time": "11:02:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7355, "total_steps": 10853, "loss": 0.1257, "learning_rate": 1.2906789705145475e-06, "epoch": 0.6776615838208873, "percentage": 67.77, "elapsed_time": "23:13:28", "remaining_time": "11:02:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7356, "total_steps": 10853, "loss": 0.1156, "learning_rate": 1.2900123004468493e-06, "epoch": 0.6777537199981573, "percentage": 67.78, "elapsed_time": "23:13:40", "remaining_time": "11:02:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7357, "total_steps": 10853, "loss": 0.1326, "learning_rate": 1.289345742726639e-06, "epoch": 0.6778458561754273, "percentage": 67.79, "elapsed_time": "23:13:51", "remaining_time": "11:02:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7358, "total_steps": 10853, "loss": 0.1248, "learning_rate": 1.288679297415808e-06, "epoch": 0.6779379923526972, "percentage": 67.8, "elapsed_time": "23:14:01", "remaining_time": "11:02:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7359, "total_steps": 10853, "loss": 0.1176, "learning_rate": 1.2880129645762344e-06, "epoch": 0.6780301285299672, "percentage": 67.81, "elapsed_time": "23:14:11", "remaining_time": "11:01:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7360, "total_steps": 10853, "loss": 0.1354, "learning_rate": 1.2873467442697862e-06, "epoch": 0.6781222647072372, "percentage": 67.82, "elapsed_time": "23:14:23", "remaining_time": "11:01:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7361, "total_steps": 10853, "loss": 0.1179, "learning_rate": 1.286680636558324e-06, "epoch": 0.6782144008845074, "percentage": 67.82, "elapsed_time": "23:14:33", "remaining_time": "11:01:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7362, "total_steps": 10853, "loss": 0.1177, "learning_rate": 1.2860146415036957e-06, "epoch": 0.6783065370617773, "percentage": 67.83, "elapsed_time": "23:14:44", "remaining_time": "11:01:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7363, "total_steps": 10853, "loss": 0.1226, "learning_rate": 1.2853487591677377e-06, "epoch": 0.6783986732390473, "percentage": 67.84, "elapsed_time": "23:14:54", "remaining_time": "11:01:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7364, "total_steps": 10853, "loss": 0.1116, "learning_rate": 1.2846829896122792e-06, "epoch": 0.6784908094163173, "percentage": 67.85, "elapsed_time": "23:15:05", "remaining_time": "11:00:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7365, "total_steps": 10853, "loss": 0.1259, "learning_rate": 1.284017332899135e-06, "epoch": 0.6785829455935873, "percentage": 67.86, "elapsed_time": "23:15:15", "remaining_time": "11:00:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7366, "total_steps": 10853, "loss": 0.1182, "learning_rate": 1.283351789090113e-06, "epoch": 0.6786750817708573, "percentage": 67.87, "elapsed_time": "23:15:25", "remaining_time": "11:00:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7367, "total_steps": 10853, "loss": 0.1254, "learning_rate": 1.2826863582470078e-06, "epoch": 0.6787672179481273, "percentage": 67.88, "elapsed_time": "23:15:36", "remaining_time": "11:00:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7368, "total_steps": 10853, "loss": 0.1124, "learning_rate": 1.2820210404316053e-06, "epoch": 0.6788593541253973, "percentage": 67.89, "elapsed_time": "23:15:48", "remaining_time": "11:00:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7369, "total_steps": 10853, "loss": 0.1288, "learning_rate": 1.2813558357056806e-06, "epoch": 0.6789514903026673, "percentage": 67.9, "elapsed_time": "23:15:59", "remaining_time": "11:00:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7370, "total_steps": 10853, "loss": 0.1373, "learning_rate": 1.2806907441309974e-06, "epoch": 0.6790436264799373, "percentage": 67.91, "elapsed_time": "23:16:10", "remaining_time": "10:59:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7371, "total_steps": 10853, "loss": 0.1099, "learning_rate": 1.2800257657693105e-06, "epoch": 0.6791357626572073, "percentage": 67.92, "elapsed_time": "23:16:20", "remaining_time": "10:59:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7372, "total_steps": 10853, "loss": 0.1208, "learning_rate": 1.2793609006823615e-06, "epoch": 0.6792278988344773, "percentage": 67.93, "elapsed_time": "23:16:32", "remaining_time": "10:59:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7373, "total_steps": 10853, "loss": 0.1436, "learning_rate": 1.2786961489318842e-06, "epoch": 0.6793200350117473, "percentage": 67.94, "elapsed_time": "23:16:43", "remaining_time": "10:59:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7374, "total_steps": 10853, "loss": 0.1197, "learning_rate": 1.278031510579602e-06, "epoch": 0.6794121711890174, "percentage": 67.94, "elapsed_time": "23:16:54", "remaining_time": "10:59:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7375, "total_steps": 10853, "loss": 0.1398, "learning_rate": 1.2773669856872256e-06, "epoch": 0.6795043073662874, "percentage": 67.95, "elapsed_time": "23:17:05", "remaining_time": "10:58:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7376, "total_steps": 10853, "loss": 0.1183, "learning_rate": 1.2767025743164551e-06, "epoch": 0.6795964435435574, "percentage": 67.96, "elapsed_time": "23:17:15", "remaining_time": "10:58:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7377, "total_steps": 10853, "loss": 0.1192, "learning_rate": 1.2760382765289821e-06, "epoch": 0.6796885797208274, "percentage": 67.97, "elapsed_time": "23:17:24", "remaining_time": "10:58:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7378, "total_steps": 10853, "loss": 0.1281, "learning_rate": 1.275374092386487e-06, "epoch": 0.6797807158980974, "percentage": 67.98, "elapsed_time": "23:17:35", "remaining_time": "10:58:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7379, "total_steps": 10853, "loss": 0.1199, "learning_rate": 1.2747100219506404e-06, "epoch": 0.6798728520753674, "percentage": 67.99, "elapsed_time": "23:17:46", "remaining_time": "10:58:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7380, "total_steps": 10853, "loss": 0.1258, "learning_rate": 1.2740460652831e-06, "epoch": 0.6799649882526374, "percentage": 68.0, "elapsed_time": "23:17:58", "remaining_time": "10:57:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7381, "total_steps": 10853, "loss": 0.1309, "learning_rate": 1.2733822224455133e-06, "epoch": 0.6800571244299074, "percentage": 68.01, "elapsed_time": "23:18:09", "remaining_time": "10:57:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7382, "total_steps": 10853, "loss": 0.1378, "learning_rate": 1.272718493499519e-06, "epoch": 0.6801492606071774, "percentage": 68.02, "elapsed_time": "23:18:22", "remaining_time": "10:57:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7383, "total_steps": 10853, "loss": 0.126, "learning_rate": 1.272054878506746e-06, "epoch": 0.6802413967844474, "percentage": 68.03, "elapsed_time": "23:18:33", "remaining_time": "10:57:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7384, "total_steps": 10853, "loss": 0.1158, "learning_rate": 1.2713913775288086e-06, "epoch": 0.6803335329617174, "percentage": 68.04, "elapsed_time": "23:18:43", "remaining_time": "10:57:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7385, "total_steps": 10853, "loss": 0.1278, "learning_rate": 1.2707279906273152e-06, "epoch": 0.6804256691389874, "percentage": 68.05, "elapsed_time": "23:18:54", "remaining_time": "10:56:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7386, "total_steps": 10853, "loss": 0.1305, "learning_rate": 1.270064717863859e-06, "epoch": 0.6805178053162574, "percentage": 68.05, "elapsed_time": "23:19:06", "remaining_time": "10:56:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7387, "total_steps": 10853, "loss": 0.1273, "learning_rate": 1.269401559300027e-06, "epoch": 0.6806099414935274, "percentage": 68.06, "elapsed_time": "23:19:17", "remaining_time": "10:56:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7388, "total_steps": 10853, "loss": 0.1353, "learning_rate": 1.2687385149973919e-06, "epoch": 0.6807020776707975, "percentage": 68.07, "elapsed_time": "23:19:26", "remaining_time": "10:56:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7389, "total_steps": 10853, "loss": 0.1169, "learning_rate": 1.268075585017518e-06, "epoch": 0.6807942138480675, "percentage": 68.08, "elapsed_time": "23:19:37", "remaining_time": "10:56:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7390, "total_steps": 10853, "loss": 0.1258, "learning_rate": 1.2674127694219588e-06, "epoch": 0.6808863500253375, "percentage": 68.09, "elapsed_time": "23:19:48", "remaining_time": "10:55:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7391, "total_steps": 10853, "loss": 0.1295, "learning_rate": 1.2667500682722584e-06, "epoch": 0.6809784862026075, "percentage": 68.1, "elapsed_time": "23:19:59", "remaining_time": "10:55:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7392, "total_steps": 10853, "loss": 0.1222, "learning_rate": 1.266087481629945e-06, "epoch": 0.6810706223798775, "percentage": 68.11, "elapsed_time": "23:20:11", "remaining_time": "10:55:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7393, "total_steps": 10853, "loss": 0.1304, "learning_rate": 1.2654250095565417e-06, "epoch": 0.6811627585571475, "percentage": 68.12, "elapsed_time": "23:20:20", "remaining_time": "10:55:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7394, "total_steps": 10853, "loss": 0.1219, "learning_rate": 1.2647626521135592e-06, "epoch": 0.6812548947344175, "percentage": 68.13, "elapsed_time": "23:20:31", "remaining_time": "10:55:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7395, "total_steps": 10853, "loss": 0.131, "learning_rate": 1.2641004093624981e-06, "epoch": 0.6813470309116875, "percentage": 68.14, "elapsed_time": "23:20:43", "remaining_time": "10:54:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7396, "total_steps": 10853, "loss": 0.13, "learning_rate": 1.2634382813648462e-06, "epoch": 0.6814391670889575, "percentage": 68.15, "elapsed_time": "23:20:55", "remaining_time": "10:54:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7397, "total_steps": 10853, "loss": 0.1344, "learning_rate": 1.262776268182084e-06, "epoch": 0.6815313032662275, "percentage": 68.16, "elapsed_time": "23:21:06", "remaining_time": "10:54:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7398, "total_steps": 10853, "loss": 0.1256, "learning_rate": 1.2621143698756778e-06, "epoch": 0.6816234394434975, "percentage": 68.17, "elapsed_time": "23:21:16", "remaining_time": "10:54:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7399, "total_steps": 10853, "loss": 0.1283, "learning_rate": 1.2614525865070848e-06, "epoch": 0.6817155756207675, "percentage": 68.17, "elapsed_time": "23:21:28", "remaining_time": "10:54:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7400, "total_steps": 10853, "loss": 0.1319, "learning_rate": 1.260790918137754e-06, "epoch": 0.6818077117980375, "percentage": 68.18, "elapsed_time": "23:21:38", "remaining_time": "10:54:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7401, "total_steps": 10853, "loss": 0.1239, "learning_rate": 1.2601293648291184e-06, "epoch": 0.6818998479753074, "percentage": 68.19, "elapsed_time": "23:21:50", "remaining_time": "10:53:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7402, "total_steps": 10853, "loss": 0.1301, "learning_rate": 1.2594679266426063e-06, "epoch": 0.6819919841525776, "percentage": 68.2, "elapsed_time": "23:22:03", "remaining_time": "10:53:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7403, "total_steps": 10853, "loss": 0.1171, "learning_rate": 1.2588066036396294e-06, "epoch": 0.6820841203298476, "percentage": 68.21, "elapsed_time": "23:22:13", "remaining_time": "10:53:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7404, "total_steps": 10853, "loss": 0.1195, "learning_rate": 1.2581453958815937e-06, "epoch": 0.6821762565071176, "percentage": 68.22, "elapsed_time": "23:22:25", "remaining_time": "10:53:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7405, "total_steps": 10853, "loss": 0.1265, "learning_rate": 1.2574843034298912e-06, "epoch": 0.6822683926843875, "percentage": 68.23, "elapsed_time": "23:22:36", "remaining_time": "10:53:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7406, "total_steps": 10853, "loss": 0.1312, "learning_rate": 1.2568233263459042e-06, "epoch": 0.6823605288616575, "percentage": 68.24, "elapsed_time": "23:22:48", "remaining_time": "10:52:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7407, "total_steps": 10853, "loss": 0.1346, "learning_rate": 1.2561624646910064e-06, "epoch": 0.6824526650389275, "percentage": 68.25, "elapsed_time": "23:22:58", "remaining_time": "10:52:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7408, "total_steps": 10853, "loss": 0.1376, "learning_rate": 1.2555017185265578e-06, "epoch": 0.6825448012161975, "percentage": 68.26, "elapsed_time": "23:23:09", "remaining_time": "10:52:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7409, "total_steps": 10853, "loss": 0.105, "learning_rate": 1.2548410879139072e-06, "epoch": 0.6826369373934675, "percentage": 68.27, "elapsed_time": "23:23:19", "remaining_time": "10:52:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7410, "total_steps": 10853, "loss": 0.1309, "learning_rate": 1.254180572914396e-06, "epoch": 0.6827290735707375, "percentage": 68.28, "elapsed_time": "23:23:31", "remaining_time": "10:52:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7411, "total_steps": 10853, "loss": 0.1168, "learning_rate": 1.2535201735893526e-06, "epoch": 0.6828212097480075, "percentage": 68.29, "elapsed_time": "23:23:42", "remaining_time": "10:51:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7412, "total_steps": 10853, "loss": 0.1247, "learning_rate": 1.252859890000096e-06, "epoch": 0.6829133459252775, "percentage": 68.29, "elapsed_time": "23:23:51", "remaining_time": "10:51:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7413, "total_steps": 10853, "loss": 0.1182, "learning_rate": 1.252199722207933e-06, "epoch": 0.6830054821025475, "percentage": 68.3, "elapsed_time": "23:24:02", "remaining_time": "10:51:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7414, "total_steps": 10853, "loss": 0.1275, "learning_rate": 1.2515396702741593e-06, "epoch": 0.6830976182798175, "percentage": 68.31, "elapsed_time": "23:24:13", "remaining_time": "10:51:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7415, "total_steps": 10853, "loss": 0.137, "learning_rate": 1.2508797342600613e-06, "epoch": 0.6831897544570876, "percentage": 68.32, "elapsed_time": "23:24:23", "remaining_time": "10:51:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7416, "total_steps": 10853, "loss": 0.1262, "learning_rate": 1.2502199142269154e-06, "epoch": 0.6832818906343576, "percentage": 68.33, "elapsed_time": "23:24:34", "remaining_time": "10:50:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7417, "total_steps": 10853, "loss": 0.1159, "learning_rate": 1.2495602102359837e-06, "epoch": 0.6833740268116276, "percentage": 68.34, "elapsed_time": "23:24:45", "remaining_time": "10:50:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7418, "total_steps": 10853, "loss": 0.1318, "learning_rate": 1.2489006223485225e-06, "epoch": 0.6834661629888976, "percentage": 68.35, "elapsed_time": "23:24:55", "remaining_time": "10:50:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7419, "total_steps": 10853, "loss": 0.1217, "learning_rate": 1.2482411506257722e-06, "epoch": 0.6835582991661676, "percentage": 68.36, "elapsed_time": "23:25:04", "remaining_time": "10:50:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7420, "total_steps": 10853, "loss": 0.1219, "learning_rate": 1.2475817951289665e-06, "epoch": 0.6836504353434376, "percentage": 68.37, "elapsed_time": "23:25:13", "remaining_time": "10:50:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7421, "total_steps": 10853, "loss": 0.1351, "learning_rate": 1.2469225559193251e-06, "epoch": 0.6837425715207076, "percentage": 68.38, "elapsed_time": "23:25:25", "remaining_time": "10:49:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7422, "total_steps": 10853, "loss": 0.1179, "learning_rate": 1.2462634330580593e-06, "epoch": 0.6838347076979776, "percentage": 68.39, "elapsed_time": "23:25:35", "remaining_time": "10:49:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7423, "total_steps": 10853, "loss": 0.1231, "learning_rate": 1.2456044266063694e-06, "epoch": 0.6839268438752476, "percentage": 68.4, "elapsed_time": "23:25:44", "remaining_time": "10:49:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7424, "total_steps": 10853, "loss": 0.1342, "learning_rate": 1.2449455366254434e-06, "epoch": 0.6840189800525176, "percentage": 68.41, "elapsed_time": "23:25:55", "remaining_time": "10:49:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7425, "total_steps": 10853, "loss": 0.1214, "learning_rate": 1.2442867631764588e-06, "epoch": 0.6841111162297876, "percentage": 68.41, "elapsed_time": "23:26:06", "remaining_time": "10:49:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7426, "total_steps": 10853, "loss": 0.1264, "learning_rate": 1.2436281063205833e-06, "epoch": 0.6842032524070576, "percentage": 68.42, "elapsed_time": "23:26:17", "remaining_time": "10:48:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7427, "total_steps": 10853, "loss": 0.1297, "learning_rate": 1.2429695661189731e-06, "epoch": 0.6842953885843276, "percentage": 68.43, "elapsed_time": "23:26:27", "remaining_time": "10:48:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7428, "total_steps": 10853, "loss": 0.133, "learning_rate": 1.242311142632775e-06, "epoch": 0.6843875247615976, "percentage": 68.44, "elapsed_time": "23:26:37", "remaining_time": "10:48:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7429, "total_steps": 10853, "loss": 0.1201, "learning_rate": 1.2416528359231228e-06, "epoch": 0.6844796609388677, "percentage": 68.45, "elapsed_time": "23:26:48", "remaining_time": "10:48:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7430, "total_steps": 10853, "loss": 0.1336, "learning_rate": 1.240994646051139e-06, "epoch": 0.6845717971161377, "percentage": 68.46, "elapsed_time": "23:26:59", "remaining_time": "10:48:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7431, "total_steps": 10853, "loss": 0.1339, "learning_rate": 1.2403365730779383e-06, "epoch": 0.6846639332934077, "percentage": 68.47, "elapsed_time": "23:27:11", "remaining_time": "10:48:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7432, "total_steps": 10853, "loss": 0.128, "learning_rate": 1.2396786170646218e-06, "epoch": 0.6847560694706777, "percentage": 68.48, "elapsed_time": "23:27:21", "remaining_time": "10:47:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7433, "total_steps": 10853, "loss": 0.1191, "learning_rate": 1.2390207780722827e-06, "epoch": 0.6848482056479477, "percentage": 68.49, "elapsed_time": "23:27:33", "remaining_time": "10:47:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7434, "total_steps": 10853, "loss": 0.1268, "learning_rate": 1.238363056162e-06, "epoch": 0.6849403418252177, "percentage": 68.5, "elapsed_time": "23:27:44", "remaining_time": "10:47:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7435, "total_steps": 10853, "loss": 0.1317, "learning_rate": 1.2377054513948423e-06, "epoch": 0.6850324780024877, "percentage": 68.51, "elapsed_time": "23:27:55", "remaining_time": "10:47:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7436, "total_steps": 10853, "loss": 0.1263, "learning_rate": 1.2370479638318692e-06, "epoch": 0.6851246141797577, "percentage": 68.52, "elapsed_time": "23:28:07", "remaining_time": "10:47:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7437, "total_steps": 10853, "loss": 0.1237, "learning_rate": 1.2363905935341295e-06, "epoch": 0.6852167503570277, "percentage": 68.52, "elapsed_time": "23:28:18", "remaining_time": "10:46:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7438, "total_steps": 10853, "loss": 0.1302, "learning_rate": 1.235733340562658e-06, "epoch": 0.6853088865342977, "percentage": 68.53, "elapsed_time": "23:28:29", "remaining_time": "10:46:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7439, "total_steps": 10853, "loss": 0.1192, "learning_rate": 1.2350762049784835e-06, "epoch": 0.6854010227115677, "percentage": 68.54, "elapsed_time": "23:28:39", "remaining_time": "10:46:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7440, "total_steps": 10853, "loss": 0.1278, "learning_rate": 1.2344191868426181e-06, "epoch": 0.6854931588888377, "percentage": 68.55, "elapsed_time": "23:28:50", "remaining_time": "10:46:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7441, "total_steps": 10853, "loss": 0.1238, "learning_rate": 1.2337622862160687e-06, "epoch": 0.6855852950661077, "percentage": 68.56, "elapsed_time": "23:29:01", "remaining_time": "10:46:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7442, "total_steps": 10853, "loss": 0.1244, "learning_rate": 1.233105503159826e-06, "epoch": 0.6856774312433778, "percentage": 68.57, "elapsed_time": "23:29:11", "remaining_time": "10:45:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7443, "total_steps": 10853, "loss": 0.1087, "learning_rate": 1.2324488377348736e-06, "epoch": 0.6857695674206478, "percentage": 68.58, "elapsed_time": "23:29:21", "remaining_time": "10:45:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7444, "total_steps": 10853, "loss": 0.1223, "learning_rate": 1.2317922900021843e-06, "epoch": 0.6858617035979178, "percentage": 68.59, "elapsed_time": "23:29:32", "remaining_time": "10:45:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7445, "total_steps": 10853, "loss": 0.118, "learning_rate": 1.2311358600227172e-06, "epoch": 0.6859538397751878, "percentage": 68.6, "elapsed_time": "23:29:44", "remaining_time": "10:45:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7446, "total_steps": 10853, "loss": 0.1201, "learning_rate": 1.2304795478574211e-06, "epoch": 0.6860459759524578, "percentage": 68.61, "elapsed_time": "23:29:54", "remaining_time": "10:45:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7447, "total_steps": 10853, "loss": 0.1254, "learning_rate": 1.2298233535672357e-06, "epoch": 0.6861381121297278, "percentage": 68.62, "elapsed_time": "23:30:05", "remaining_time": "10:44:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7448, "total_steps": 10853, "loss": 0.1379, "learning_rate": 1.2291672772130885e-06, "epoch": 0.6862302483069977, "percentage": 68.63, "elapsed_time": "23:30:16", "remaining_time": "10:44:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7449, "total_steps": 10853, "loss": 0.1324, "learning_rate": 1.2285113188558975e-06, "epoch": 0.6863223844842677, "percentage": 68.64, "elapsed_time": "23:30:26", "remaining_time": "10:44:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7450, "total_steps": 10853, "loss": 0.1328, "learning_rate": 1.2278554785565671e-06, "epoch": 0.6864145206615377, "percentage": 68.64, "elapsed_time": "23:30:37", "remaining_time": "10:44:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7451, "total_steps": 10853, "loss": 0.1326, "learning_rate": 1.2271997563759918e-06, "epoch": 0.6865066568388077, "percentage": 68.65, "elapsed_time": "23:30:48", "remaining_time": "10:44:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7452, "total_steps": 10853, "loss": 0.1309, "learning_rate": 1.226544152375056e-06, "epoch": 0.6865987930160777, "percentage": 68.66, "elapsed_time": "23:31:00", "remaining_time": "10:43:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7453, "total_steps": 10853, "loss": 0.1204, "learning_rate": 1.2258886666146335e-06, "epoch": 0.6866909291933477, "percentage": 68.67, "elapsed_time": "23:31:12", "remaining_time": "10:43:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7454, "total_steps": 10853, "loss": 0.1168, "learning_rate": 1.2252332991555846e-06, "epoch": 0.6867830653706177, "percentage": 68.68, "elapsed_time": "23:31:23", "remaining_time": "10:43:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7455, "total_steps": 10853, "loss": 0.1382, "learning_rate": 1.224578050058762e-06, "epoch": 0.6868752015478877, "percentage": 68.69, "elapsed_time": "23:31:34", "remaining_time": "10:43:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7456, "total_steps": 10853, "loss": 0.1025, "learning_rate": 1.2239229193850039e-06, "epoch": 0.6869673377251578, "percentage": 68.7, "elapsed_time": "23:31:45", "remaining_time": "10:43:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7457, "total_steps": 10853, "loss": 0.129, "learning_rate": 1.2232679071951398e-06, "epoch": 0.6870594739024278, "percentage": 68.71, "elapsed_time": "23:31:54", "remaining_time": "10:42:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7458, "total_steps": 10853, "loss": 0.1215, "learning_rate": 1.2226130135499891e-06, "epoch": 0.6871516100796978, "percentage": 68.72, "elapsed_time": "23:32:05", "remaining_time": "10:42:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7459, "total_steps": 10853, "loss": 0.1186, "learning_rate": 1.2219582385103564e-06, "epoch": 0.6872437462569678, "percentage": 68.73, "elapsed_time": "23:32:15", "remaining_time": "10:42:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7460, "total_steps": 10853, "loss": 0.1193, "learning_rate": 1.2213035821370401e-06, "epoch": 0.6873358824342378, "percentage": 68.74, "elapsed_time": "23:32:26", "remaining_time": "10:42:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7461, "total_steps": 10853, "loss": 0.1184, "learning_rate": 1.2206490444908226e-06, "epoch": 0.6874280186115078, "percentage": 68.75, "elapsed_time": "23:32:37", "remaining_time": "10:42:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7462, "total_steps": 10853, "loss": 0.139, "learning_rate": 1.21999462563248e-06, "epoch": 0.6875201547887778, "percentage": 68.76, "elapsed_time": "23:32:49", "remaining_time": "10:42:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7463, "total_steps": 10853, "loss": 0.1412, "learning_rate": 1.2193403256227731e-06, "epoch": 0.6876122909660478, "percentage": 68.76, "elapsed_time": "23:33:01", "remaining_time": "10:41:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7464, "total_steps": 10853, "loss": 0.1279, "learning_rate": 1.2186861445224548e-06, "epoch": 0.6877044271433178, "percentage": 68.77, "elapsed_time": "23:33:13", "remaining_time": "10:41:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7465, "total_steps": 10853, "loss": 0.1307, "learning_rate": 1.2180320823922662e-06, "epoch": 0.6877965633205878, "percentage": 68.78, "elapsed_time": "23:33:23", "remaining_time": "10:41:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7466, "total_steps": 10853, "loss": 0.1119, "learning_rate": 1.2173781392929383e-06, "epoch": 0.6878886994978578, "percentage": 68.79, "elapsed_time": "23:33:34", "remaining_time": "10:41:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7467, "total_steps": 10853, "loss": 0.1236, "learning_rate": 1.2167243152851862e-06, "epoch": 0.6879808356751278, "percentage": 68.8, "elapsed_time": "23:33:47", "remaining_time": "10:41:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7468, "total_steps": 10853, "loss": 0.1231, "learning_rate": 1.21607061042972e-06, "epoch": 0.6880729718523978, "percentage": 68.81, "elapsed_time": "23:33:57", "remaining_time": "10:40:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7469, "total_steps": 10853, "loss": 0.1295, "learning_rate": 1.2154170247872354e-06, "epoch": 0.6881651080296678, "percentage": 68.82, "elapsed_time": "23:34:09", "remaining_time": "10:40:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7470, "total_steps": 10853, "loss": 0.1219, "learning_rate": 1.2147635584184194e-06, "epoch": 0.6882572442069379, "percentage": 68.83, "elapsed_time": "23:34:20", "remaining_time": "10:40:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7471, "total_steps": 10853, "loss": 0.126, "learning_rate": 1.2141102113839442e-06, "epoch": 0.6883493803842079, "percentage": 68.84, "elapsed_time": "23:34:30", "remaining_time": "10:40:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7472, "total_steps": 10853, "loss": 0.1192, "learning_rate": 1.2134569837444755e-06, "epoch": 0.6884415165614779, "percentage": 68.85, "elapsed_time": "23:34:40", "remaining_time": "10:40:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7473, "total_steps": 10853, "loss": 0.1312, "learning_rate": 1.2128038755606632e-06, "epoch": 0.6885336527387479, "percentage": 68.86, "elapsed_time": "23:34:51", "remaining_time": "10:39:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7474, "total_steps": 10853, "loss": 0.1272, "learning_rate": 1.2121508868931507e-06, "epoch": 0.6886257889160179, "percentage": 68.87, "elapsed_time": "23:35:03", "remaining_time": "10:39:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7475, "total_steps": 10853, "loss": 0.1238, "learning_rate": 1.2114980178025657e-06, "epoch": 0.6887179250932879, "percentage": 68.87, "elapsed_time": "23:35:13", "remaining_time": "10:39:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7476, "total_steps": 10853, "loss": 0.1275, "learning_rate": 1.2108452683495286e-06, "epoch": 0.6888100612705579, "percentage": 68.88, "elapsed_time": "23:35:25", "remaining_time": "10:39:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7477, "total_steps": 10853, "loss": 0.135, "learning_rate": 1.210192638594648e-06, "epoch": 0.6889021974478279, "percentage": 68.89, "elapsed_time": "23:35:37", "remaining_time": "10:39:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7478, "total_steps": 10853, "loss": 0.1333, "learning_rate": 1.2095401285985197e-06, "epoch": 0.6889943336250979, "percentage": 68.9, "elapsed_time": "23:35:48", "remaining_time": "10:38:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7479, "total_steps": 10853, "loss": 0.1293, "learning_rate": 1.2088877384217286e-06, "epoch": 0.6890864698023679, "percentage": 68.91, "elapsed_time": "23:36:00", "remaining_time": "10:38:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7480, "total_steps": 10853, "loss": 0.1212, "learning_rate": 1.2082354681248495e-06, "epoch": 0.6891786059796379, "percentage": 68.92, "elapsed_time": "23:36:11", "remaining_time": "10:38:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7481, "total_steps": 10853, "loss": 0.1144, "learning_rate": 1.2075833177684465e-06, "epoch": 0.6892707421569079, "percentage": 68.93, "elapsed_time": "23:36:21", "remaining_time": "10:38:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7482, "total_steps": 10853, "loss": 0.1121, "learning_rate": 1.2069312874130725e-06, "epoch": 0.6893628783341779, "percentage": 68.94, "elapsed_time": "23:36:32", "remaining_time": "10:38:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7483, "total_steps": 10853, "loss": 0.1246, "learning_rate": 1.2062793771192676e-06, "epoch": 0.689455014511448, "percentage": 68.95, "elapsed_time": "23:36:43", "remaining_time": "10:38:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7484, "total_steps": 10853, "loss": 0.1246, "learning_rate": 1.2056275869475606e-06, "epoch": 0.689547150688718, "percentage": 68.96, "elapsed_time": "23:36:55", "remaining_time": "10:37:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7485, "total_steps": 10853, "loss": 0.12, "learning_rate": 1.2049759169584718e-06, "epoch": 0.689639286865988, "percentage": 68.97, "elapsed_time": "23:37:06", "remaining_time": "10:37:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7486, "total_steps": 10853, "loss": 0.1231, "learning_rate": 1.2043243672125083e-06, "epoch": 0.689731423043258, "percentage": 68.98, "elapsed_time": "23:37:17", "remaining_time": "10:37:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7487, "total_steps": 10853, "loss": 0.1123, "learning_rate": 1.2036729377701679e-06, "epoch": 0.689823559220528, "percentage": 68.99, "elapsed_time": "23:37:28", "remaining_time": "10:37:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7488, "total_steps": 10853, "loss": 0.1241, "learning_rate": 1.2030216286919343e-06, "epoch": 0.689915695397798, "percentage": 68.99, "elapsed_time": "23:37:39", "remaining_time": "10:37:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7489, "total_steps": 10853, "loss": 0.1266, "learning_rate": 1.2023704400382813e-06, "epoch": 0.690007831575068, "percentage": 69.0, "elapsed_time": "23:37:48", "remaining_time": "10:36:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7490, "total_steps": 10853, "loss": 0.1259, "learning_rate": 1.201719371869673e-06, "epoch": 0.690099967752338, "percentage": 69.01, "elapsed_time": "23:38:00", "remaining_time": "10:36:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7491, "total_steps": 10853, "loss": 0.1364, "learning_rate": 1.2010684242465612e-06, "epoch": 0.690192103929608, "percentage": 69.02, "elapsed_time": "23:38:11", "remaining_time": "10:36:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7492, "total_steps": 10853, "loss": 0.1118, "learning_rate": 1.2004175972293852e-06, "epoch": 0.6902842401068779, "percentage": 69.03, "elapsed_time": "23:38:21", "remaining_time": "10:36:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7493, "total_steps": 10853, "loss": 0.1289, "learning_rate": 1.1997668908785761e-06, "epoch": 0.6903763762841479, "percentage": 69.04, "elapsed_time": "23:38:32", "remaining_time": "10:36:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7494, "total_steps": 10853, "loss": 0.1254, "learning_rate": 1.1991163052545502e-06, "epoch": 0.6904685124614179, "percentage": 69.05, "elapsed_time": "23:38:43", "remaining_time": "10:35:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7495, "total_steps": 10853, "loss": 0.1101, "learning_rate": 1.1984658404177162e-06, "epoch": 0.6905606486386879, "percentage": 69.06, "elapsed_time": "23:38:54", "remaining_time": "10:35:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7496, "total_steps": 10853, "loss": 0.1182, "learning_rate": 1.1978154964284683e-06, "epoch": 0.6906527848159579, "percentage": 69.07, "elapsed_time": "23:39:06", "remaining_time": "10:35:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7497, "total_steps": 10853, "loss": 0.1251, "learning_rate": 1.1971652733471915e-06, "epoch": 0.690744920993228, "percentage": 69.08, "elapsed_time": "23:39:17", "remaining_time": "10:35:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7498, "total_steps": 10853, "loss": 0.126, "learning_rate": 1.19651517123426e-06, "epoch": 0.690837057170498, "percentage": 69.09, "elapsed_time": "23:39:27", "remaining_time": "10:35:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7499, "total_steps": 10853, "loss": 0.1233, "learning_rate": 1.1958651901500356e-06, "epoch": 0.690929193347768, "percentage": 69.1, "elapsed_time": "23:39:39", "remaining_time": "10:34:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7500, "total_steps": 10853, "loss": 0.117, "learning_rate": 1.1952153301548674e-06, "epoch": 0.691021329525038, "percentage": 69.11, "elapsed_time": "23:39:49", "remaining_time": "10:34:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7500, "total_steps": 10853, "eval_loss": 0.12531189620494843, "epoch": 0.691021329525038, "percentage": 69.11, "elapsed_time": "23:44:48", "remaining_time": "10:36:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7501, "total_steps": 10853, "loss": 0.1273, "learning_rate": 1.1945655913090965e-06, "epoch": 0.691113465702308, "percentage": 69.11, "elapsed_time": "23:44:58", "remaining_time": "10:36:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7502, "total_steps": 10853, "loss": 0.1304, "learning_rate": 1.1939159736730508e-06, "epoch": 0.691205601879578, "percentage": 69.12, "elapsed_time": "23:45:09", "remaining_time": "10:36:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7503, "total_steps": 10853, "loss": 0.1305, "learning_rate": 1.1932664773070483e-06, "epoch": 0.691297738056848, "percentage": 69.13, "elapsed_time": "23:45:19", "remaining_time": "10:36:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7504, "total_steps": 10853, "loss": 0.1246, "learning_rate": 1.192617102271394e-06, "epoch": 0.691389874234118, "percentage": 69.14, "elapsed_time": "23:45:32", "remaining_time": "10:36:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7505, "total_steps": 10853, "loss": 0.1142, "learning_rate": 1.1919678486263817e-06, "epoch": 0.691482010411388, "percentage": 69.15, "elapsed_time": "23:45:41", "remaining_time": "10:36:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7506, "total_steps": 10853, "loss": 0.1268, "learning_rate": 1.1913187164322954e-06, "epoch": 0.691574146588658, "percentage": 69.16, "elapsed_time": "23:45:52", "remaining_time": "10:35:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7507, "total_steps": 10853, "loss": 0.1266, "learning_rate": 1.190669705749408e-06, "epoch": 0.691666282765928, "percentage": 69.17, "elapsed_time": "23:46:03", "remaining_time": "10:35:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7508, "total_steps": 10853, "loss": 0.1147, "learning_rate": 1.1900208166379784e-06, "epoch": 0.691758418943198, "percentage": 69.18, "elapsed_time": "23:46:15", "remaining_time": "10:35:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7509, "total_steps": 10853, "loss": 0.1236, "learning_rate": 1.1893720491582579e-06, "epoch": 0.691850555120468, "percentage": 69.19, "elapsed_time": "23:46:26", "remaining_time": "10:35:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7510, "total_steps": 10853, "loss": 0.1153, "learning_rate": 1.1887234033704827e-06, "epoch": 0.6919426912977381, "percentage": 69.2, "elapsed_time": "23:46:36", "remaining_time": "10:35:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7511, "total_steps": 10853, "loss": 0.1264, "learning_rate": 1.1880748793348818e-06, "epoch": 0.6920348274750081, "percentage": 69.21, "elapsed_time": "23:46:48", "remaining_time": "10:34:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7512, "total_steps": 10853, "loss": 0.1233, "learning_rate": 1.1874264771116684e-06, "epoch": 0.6921269636522781, "percentage": 69.22, "elapsed_time": "23:46:58", "remaining_time": "10:34:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7513, "total_steps": 10853, "loss": 0.1286, "learning_rate": 1.1867781967610478e-06, "epoch": 0.6922190998295481, "percentage": 69.23, "elapsed_time": "23:47:08", "remaining_time": "10:34:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7514, "total_steps": 10853, "loss": 0.1237, "learning_rate": 1.186130038343214e-06, "epoch": 0.6923112360068181, "percentage": 69.23, "elapsed_time": "23:47:20", "remaining_time": "10:34:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7515, "total_steps": 10853, "loss": 0.1213, "learning_rate": 1.1854820019183467e-06, "epoch": 0.6924033721840881, "percentage": 69.24, "elapsed_time": "23:47:32", "remaining_time": "10:34:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7516, "total_steps": 10853, "loss": 0.1241, "learning_rate": 1.1848340875466176e-06, "epoch": 0.6924955083613581, "percentage": 69.25, "elapsed_time": "23:47:43", "remaining_time": "10:33:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7517, "total_steps": 10853, "loss": 0.1216, "learning_rate": 1.1841862952881845e-06, "epoch": 0.6925876445386281, "percentage": 69.26, "elapsed_time": "23:47:54", "remaining_time": "10:33:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7518, "total_steps": 10853, "loss": 0.1161, "learning_rate": 1.183538625203195e-06, "epoch": 0.6926797807158981, "percentage": 69.27, "elapsed_time": "23:48:04", "remaining_time": "10:33:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7519, "total_steps": 10853, "loss": 0.1286, "learning_rate": 1.182891077351787e-06, "epoch": 0.6927719168931681, "percentage": 69.28, "elapsed_time": "23:48:16", "remaining_time": "10:33:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7520, "total_steps": 10853, "loss": 0.1376, "learning_rate": 1.1822436517940844e-06, "epoch": 0.6928640530704381, "percentage": 69.29, "elapsed_time": "23:48:27", "remaining_time": "10:33:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7521, "total_steps": 10853, "loss": 0.1233, "learning_rate": 1.1815963485901994e-06, "epoch": 0.6929561892477081, "percentage": 69.3, "elapsed_time": "23:48:38", "remaining_time": "10:32:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7522, "total_steps": 10853, "loss": 0.1235, "learning_rate": 1.1809491678002356e-06, "epoch": 0.6930483254249781, "percentage": 69.31, "elapsed_time": "23:48:48", "remaining_time": "10:32:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7523, "total_steps": 10853, "loss": 0.1257, "learning_rate": 1.1803021094842831e-06, "epoch": 0.6931404616022481, "percentage": 69.32, "elapsed_time": "23:48:59", "remaining_time": "10:32:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7524, "total_steps": 10853, "loss": 0.1131, "learning_rate": 1.179655173702423e-06, "epoch": 0.6932325977795182, "percentage": 69.33, "elapsed_time": "23:49:12", "remaining_time": "10:32:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7525, "total_steps": 10853, "loss": 0.1219, "learning_rate": 1.1790083605147221e-06, "epoch": 0.6933247339567882, "percentage": 69.34, "elapsed_time": "23:49:23", "remaining_time": "10:32:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7526, "total_steps": 10853, "loss": 0.1343, "learning_rate": 1.1783616699812362e-06, "epoch": 0.6934168701340582, "percentage": 69.34, "elapsed_time": "23:49:34", "remaining_time": "10:31:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7527, "total_steps": 10853, "loss": 0.1312, "learning_rate": 1.1777151021620113e-06, "epoch": 0.6935090063113282, "percentage": 69.35, "elapsed_time": "23:49:46", "remaining_time": "10:31:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7528, "total_steps": 10853, "loss": 0.1333, "learning_rate": 1.1770686571170824e-06, "epoch": 0.6936011424885982, "percentage": 69.36, "elapsed_time": "23:49:57", "remaining_time": "10:31:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7529, "total_steps": 10853, "loss": 0.1271, "learning_rate": 1.17642233490647e-06, "epoch": 0.6936932786658682, "percentage": 69.37, "elapsed_time": "23:50:08", "remaining_time": "10:31:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7530, "total_steps": 10853, "loss": 0.1104, "learning_rate": 1.1757761355901875e-06, "epoch": 0.6937854148431382, "percentage": 69.38, "elapsed_time": "23:50:17", "remaining_time": "10:31:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7531, "total_steps": 10853, "loss": 0.1385, "learning_rate": 1.1751300592282325e-06, "epoch": 0.6938775510204082, "percentage": 69.39, "elapsed_time": "23:50:28", "remaining_time": "10:30:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7532, "total_steps": 10853, "loss": 0.1143, "learning_rate": 1.1744841058805947e-06, "epoch": 0.6939696871976782, "percentage": 69.4, "elapsed_time": "23:50:39", "remaining_time": "10:30:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7533, "total_steps": 10853, "loss": 0.1469, "learning_rate": 1.1738382756072495e-06, "epoch": 0.6940618233749482, "percentage": 69.41, "elapsed_time": "23:50:50", "remaining_time": "10:30:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7534, "total_steps": 10853, "loss": 0.1203, "learning_rate": 1.1731925684681631e-06, "epoch": 0.6941539595522181, "percentage": 69.42, "elapsed_time": "23:51:00", "remaining_time": "10:30:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7535, "total_steps": 10853, "loss": 0.1331, "learning_rate": 1.1725469845232906e-06, "epoch": 0.6942460957294881, "percentage": 69.43, "elapsed_time": "23:51:11", "remaining_time": "10:30:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7536, "total_steps": 10853, "loss": 0.1205, "learning_rate": 1.1719015238325731e-06, "epoch": 0.6943382319067581, "percentage": 69.44, "elapsed_time": "23:51:21", "remaining_time": "10:30:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7537, "total_steps": 10853, "loss": 0.1173, "learning_rate": 1.1712561864559415e-06, "epoch": 0.6944303680840282, "percentage": 69.45, "elapsed_time": "23:51:31", "remaining_time": "10:29:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7538, "total_steps": 10853, "loss": 0.1277, "learning_rate": 1.1706109724533158e-06, "epoch": 0.6945225042612982, "percentage": 69.46, "elapsed_time": "23:51:42", "remaining_time": "10:29:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7539, "total_steps": 10853, "loss": 0.1225, "learning_rate": 1.1699658818846044e-06, "epoch": 0.6946146404385682, "percentage": 69.46, "elapsed_time": "23:51:53", "remaining_time": "10:29:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7540, "total_steps": 10853, "loss": 0.1134, "learning_rate": 1.1693209148097049e-06, "epoch": 0.6947067766158382, "percentage": 69.47, "elapsed_time": "23:52:03", "remaining_time": "10:29:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7541, "total_steps": 10853, "loss": 0.1421, "learning_rate": 1.1686760712885018e-06, "epoch": 0.6947989127931082, "percentage": 69.48, "elapsed_time": "23:52:14", "remaining_time": "10:29:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7542, "total_steps": 10853, "loss": 0.1273, "learning_rate": 1.1680313513808677e-06, "epoch": 0.6948910489703782, "percentage": 69.49, "elapsed_time": "23:52:26", "remaining_time": "10:28:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7543, "total_steps": 10853, "loss": 0.1231, "learning_rate": 1.1673867551466658e-06, "epoch": 0.6949831851476482, "percentage": 69.5, "elapsed_time": "23:52:37", "remaining_time": "10:28:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7544, "total_steps": 10853, "loss": 0.1212, "learning_rate": 1.1667422826457475e-06, "epoch": 0.6950753213249182, "percentage": 69.51, "elapsed_time": "23:52:47", "remaining_time": "10:28:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7545, "total_steps": 10853, "loss": 0.13, "learning_rate": 1.1660979339379524e-06, "epoch": 0.6951674575021882, "percentage": 69.52, "elapsed_time": "23:52:58", "remaining_time": "10:28:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7546, "total_steps": 10853, "loss": 0.1245, "learning_rate": 1.1654537090831069e-06, "epoch": 0.6952595936794582, "percentage": 69.53, "elapsed_time": "23:53:08", "remaining_time": "10:28:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7547, "total_steps": 10853, "loss": 0.1291, "learning_rate": 1.164809608141029e-06, "epoch": 0.6953517298567282, "percentage": 69.54, "elapsed_time": "23:53:19", "remaining_time": "10:27:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7548, "total_steps": 10853, "loss": 0.1357, "learning_rate": 1.1641656311715218e-06, "epoch": 0.6954438660339982, "percentage": 69.55, "elapsed_time": "23:53:30", "remaining_time": "10:27:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7549, "total_steps": 10853, "loss": 0.1119, "learning_rate": 1.1635217782343801e-06, "epoch": 0.6955360022112682, "percentage": 69.56, "elapsed_time": "23:53:40", "remaining_time": "10:27:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7550, "total_steps": 10853, "loss": 0.1146, "learning_rate": 1.1628780493893849e-06, "epoch": 0.6956281383885382, "percentage": 69.57, "elapsed_time": "23:53:52", "remaining_time": "10:27:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7551, "total_steps": 10853, "loss": 0.1108, "learning_rate": 1.162234444696306e-06, "epoch": 0.6957202745658083, "percentage": 69.58, "elapsed_time": "23:54:03", "remaining_time": "10:27:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7552, "total_steps": 10853, "loss": 0.1218, "learning_rate": 1.1615909642149042e-06, "epoch": 0.6958124107430783, "percentage": 69.58, "elapsed_time": "23:54:13", "remaining_time": "10:26:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7553, "total_steps": 10853, "loss": 0.1365, "learning_rate": 1.1609476080049254e-06, "epoch": 0.6959045469203483, "percentage": 69.59, "elapsed_time": "23:54:23", "remaining_time": "10:26:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7554, "total_steps": 10853, "loss": 0.1189, "learning_rate": 1.1603043761261043e-06, "epoch": 0.6959966830976183, "percentage": 69.6, "elapsed_time": "23:54:34", "remaining_time": "10:26:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7555, "total_steps": 10853, "loss": 0.119, "learning_rate": 1.159661268638166e-06, "epoch": 0.6960888192748883, "percentage": 69.61, "elapsed_time": "23:54:45", "remaining_time": "10:26:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7556, "total_steps": 10853, "loss": 0.1251, "learning_rate": 1.1590182856008233e-06, "epoch": 0.6961809554521583, "percentage": 69.62, "elapsed_time": "23:54:55", "remaining_time": "10:26:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7557, "total_steps": 10853, "loss": 0.1549, "learning_rate": 1.158375427073778e-06, "epoch": 0.6962730916294283, "percentage": 69.63, "elapsed_time": "23:55:06", "remaining_time": "10:25:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7558, "total_steps": 10853, "loss": 0.1194, "learning_rate": 1.1577326931167184e-06, "epoch": 0.6963652278066983, "percentage": 69.64, "elapsed_time": "23:55:17", "remaining_time": "10:25:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7559, "total_steps": 10853, "loss": 0.1276, "learning_rate": 1.1570900837893223e-06, "epoch": 0.6964573639839683, "percentage": 69.65, "elapsed_time": "23:55:29", "remaining_time": "10:25:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7560, "total_steps": 10853, "loss": 0.1195, "learning_rate": 1.1564475991512562e-06, "epoch": 0.6965495001612383, "percentage": 69.66, "elapsed_time": "23:55:41", "remaining_time": "10:25:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7561, "total_steps": 10853, "loss": 0.1386, "learning_rate": 1.1558052392621758e-06, "epoch": 0.6966416363385083, "percentage": 69.67, "elapsed_time": "23:55:52", "remaining_time": "10:25:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7562, "total_steps": 10853, "loss": 0.1104, "learning_rate": 1.155163004181723e-06, "epoch": 0.6967337725157783, "percentage": 69.68, "elapsed_time": "23:56:03", "remaining_time": "10:24:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7563, "total_steps": 10853, "loss": 0.1233, "learning_rate": 1.1545208939695306e-06, "epoch": 0.6968259086930483, "percentage": 69.69, "elapsed_time": "23:56:13", "remaining_time": "10:24:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7564, "total_steps": 10853, "loss": 0.1172, "learning_rate": 1.1538789086852173e-06, "epoch": 0.6969180448703183, "percentage": 69.7, "elapsed_time": "23:56:24", "remaining_time": "10:24:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7565, "total_steps": 10853, "loss": 0.1308, "learning_rate": 1.1532370483883931e-06, "epoch": 0.6970101810475884, "percentage": 69.7, "elapsed_time": "23:56:34", "remaining_time": "10:24:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7566, "total_steps": 10853, "loss": 0.1378, "learning_rate": 1.152595313138653e-06, "epoch": 0.6971023172248584, "percentage": 69.71, "elapsed_time": "23:56:46", "remaining_time": "10:24:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7567, "total_steps": 10853, "loss": 0.1221, "learning_rate": 1.151953702995583e-06, "epoch": 0.6971944534021284, "percentage": 69.72, "elapsed_time": "23:56:57", "remaining_time": "10:24:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7568, "total_steps": 10853, "loss": 0.127, "learning_rate": 1.1513122180187577e-06, "epoch": 0.6972865895793984, "percentage": 69.73, "elapsed_time": "23:57:07", "remaining_time": "10:23:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7569, "total_steps": 10853, "loss": 0.1254, "learning_rate": 1.150670858267738e-06, "epoch": 0.6973787257566684, "percentage": 69.74, "elapsed_time": "23:57:18", "remaining_time": "10:23:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7570, "total_steps": 10853, "loss": 0.1345, "learning_rate": 1.150029623802074e-06, "epoch": 0.6974708619339384, "percentage": 69.75, "elapsed_time": "23:57:30", "remaining_time": "10:23:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7571, "total_steps": 10853, "loss": 0.12, "learning_rate": 1.1493885146813042e-06, "epoch": 0.6975629981112084, "percentage": 69.76, "elapsed_time": "23:57:41", "remaining_time": "10:23:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7572, "total_steps": 10853, "loss": 0.1288, "learning_rate": 1.148747530964956e-06, "epoch": 0.6976551342884784, "percentage": 69.77, "elapsed_time": "23:57:53", "remaining_time": "10:23:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7573, "total_steps": 10853, "loss": 0.1291, "learning_rate": 1.1481066727125463e-06, "epoch": 0.6977472704657484, "percentage": 69.78, "elapsed_time": "23:58:03", "remaining_time": "10:22:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7574, "total_steps": 10853, "loss": 0.1309, "learning_rate": 1.1474659399835772e-06, "epoch": 0.6978394066430184, "percentage": 69.79, "elapsed_time": "23:58:14", "remaining_time": "10:22:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7575, "total_steps": 10853, "loss": 0.1156, "learning_rate": 1.1468253328375404e-06, "epoch": 0.6979315428202884, "percentage": 69.8, "elapsed_time": "23:58:24", "remaining_time": "10:22:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7576, "total_steps": 10853, "loss": 0.1199, "learning_rate": 1.1461848513339168e-06, "epoch": 0.6980236789975584, "percentage": 69.81, "elapsed_time": "23:58:35", "remaining_time": "10:22:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7577, "total_steps": 10853, "loss": 0.1276, "learning_rate": 1.145544495532176e-06, "epoch": 0.6981158151748283, "percentage": 69.81, "elapsed_time": "23:58:46", "remaining_time": "10:22:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7578, "total_steps": 10853, "loss": 0.1166, "learning_rate": 1.144904265491775e-06, "epoch": 0.6982079513520985, "percentage": 69.82, "elapsed_time": "23:58:57", "remaining_time": "10:21:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7579, "total_steps": 10853, "loss": 0.1264, "learning_rate": 1.1442641612721588e-06, "epoch": 0.6983000875293685, "percentage": 69.83, "elapsed_time": "23:59:08", "remaining_time": "10:21:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7580, "total_steps": 10853, "loss": 0.1265, "learning_rate": 1.1436241829327605e-06, "epoch": 0.6983922237066384, "percentage": 69.84, "elapsed_time": "23:59:19", "remaining_time": "10:21:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7581, "total_steps": 10853, "loss": 0.1258, "learning_rate": 1.1429843305330027e-06, "epoch": 0.6984843598839084, "percentage": 69.85, "elapsed_time": "23:59:30", "remaining_time": "10:21:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7582, "total_steps": 10853, "loss": 0.1166, "learning_rate": 1.1423446041322967e-06, "epoch": 0.6985764960611784, "percentage": 69.86, "elapsed_time": "23:59:39", "remaining_time": "10:21:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7583, "total_steps": 10853, "loss": 0.1187, "learning_rate": 1.1417050037900393e-06, "epoch": 0.6986686322384484, "percentage": 69.87, "elapsed_time": "23:59:49", "remaining_time": "10:20:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7584, "total_steps": 10853, "loss": 0.1289, "learning_rate": 1.1410655295656196e-06, "epoch": 0.6987607684157184, "percentage": 69.88, "elapsed_time": "23:59:59", "remaining_time": "10:20:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7585, "total_steps": 10853, "loss": 0.1297, "learning_rate": 1.1404261815184105e-06, "epoch": 0.6988529045929884, "percentage": 69.89, "elapsed_time": "1 day, 0:00:10", "remaining_time": "10:20:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7586, "total_steps": 10853, "loss": 0.1296, "learning_rate": 1.1397869597077783e-06, "epoch": 0.6989450407702584, "percentage": 69.9, "elapsed_time": "1 day, 0:00:23", "remaining_time": "10:20:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7587, "total_steps": 10853, "loss": 0.1199, "learning_rate": 1.1391478641930716e-06, "epoch": 0.6990371769475284, "percentage": 69.91, "elapsed_time": "1 day, 0:00:33", "remaining_time": "10:20:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7588, "total_steps": 10853, "loss": 0.1236, "learning_rate": 1.1385088950336329e-06, "epoch": 0.6991293131247984, "percentage": 69.92, "elapsed_time": "1 day, 0:00:45", "remaining_time": "10:19:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7589, "total_steps": 10853, "loss": 0.1101, "learning_rate": 1.1378700522887903e-06, "epoch": 0.6992214493020684, "percentage": 69.93, "elapsed_time": "1 day, 0:00:54", "remaining_time": "10:19:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7590, "total_steps": 10853, "loss": 0.1366, "learning_rate": 1.13723133601786e-06, "epoch": 0.6993135854793384, "percentage": 69.93, "elapsed_time": "1 day, 0:01:04", "remaining_time": "10:19:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7591, "total_steps": 10853, "loss": 0.1117, "learning_rate": 1.136592746280146e-06, "epoch": 0.6994057216566084, "percentage": 69.94, "elapsed_time": "1 day, 0:01:15", "remaining_time": "10:19:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7592, "total_steps": 10853, "loss": 0.1278, "learning_rate": 1.1359542831349422e-06, "epoch": 0.6994978578338785, "percentage": 69.95, "elapsed_time": "1 day, 0:01:26", "remaining_time": "10:19:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7593, "total_steps": 10853, "loss": 0.1139, "learning_rate": 1.1353159466415298e-06, "epoch": 0.6995899940111485, "percentage": 69.96, "elapsed_time": "1 day, 0:01:37", "remaining_time": "10:18:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7594, "total_steps": 10853, "loss": 0.1227, "learning_rate": 1.1346777368591797e-06, "epoch": 0.6996821301884185, "percentage": 69.97, "elapsed_time": "1 day, 0:01:48", "remaining_time": "10:18:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7595, "total_steps": 10853, "loss": 0.127, "learning_rate": 1.1340396538471488e-06, "epoch": 0.6997742663656885, "percentage": 69.98, "elapsed_time": "1 day, 0:01:58", "remaining_time": "10:18:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7596, "total_steps": 10853, "loss": 0.1247, "learning_rate": 1.133401697664682e-06, "epoch": 0.6998664025429585, "percentage": 69.99, "elapsed_time": "1 day, 0:02:08", "remaining_time": "10:18:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7597, "total_steps": 10853, "loss": 0.1195, "learning_rate": 1.1327638683710146e-06, "epoch": 0.6999585387202285, "percentage": 70.0, "elapsed_time": "1 day, 0:02:19", "remaining_time": "10:18:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7598, "total_steps": 10853, "loss": 0.1128, "learning_rate": 1.13212616602537e-06, "epoch": 0.7000506748974985, "percentage": 70.01, "elapsed_time": "1 day, 0:02:30", "remaining_time": "10:17:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7599, "total_steps": 10853, "loss": 0.1092, "learning_rate": 1.1314885906869575e-06, "epoch": 0.7001428110747685, "percentage": 70.02, "elapsed_time": "1 day, 0:02:42", "remaining_time": "10:17:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7600, "total_steps": 10853, "loss": 0.1093, "learning_rate": 1.1308511424149774e-06, "epoch": 0.7002349472520385, "percentage": 70.03, "elapsed_time": "1 day, 0:02:52", "remaining_time": "10:17:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7601, "total_steps": 10853, "loss": 0.1192, "learning_rate": 1.1302138212686152e-06, "epoch": 0.7003270834293085, "percentage": 70.04, "elapsed_time": "1 day, 0:03:03", "remaining_time": "10:17:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7602, "total_steps": 10853, "loss": 0.1218, "learning_rate": 1.1295766273070469e-06, "epoch": 0.7004192196065785, "percentage": 70.05, "elapsed_time": "1 day, 0:03:13", "remaining_time": "10:17:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7603, "total_steps": 10853, "loss": 0.1283, "learning_rate": 1.1289395605894374e-06, "epoch": 0.7005113557838485, "percentage": 70.05, "elapsed_time": "1 day, 0:03:24", "remaining_time": "10:17:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7604, "total_steps": 10853, "loss": 0.1368, "learning_rate": 1.1283026211749362e-06, "epoch": 0.7006034919611185, "percentage": 70.06, "elapsed_time": "1 day, 0:03:35", "remaining_time": "10:16:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7605, "total_steps": 10853, "loss": 0.1191, "learning_rate": 1.127665809122685e-06, "epoch": 0.7006956281383886, "percentage": 70.07, "elapsed_time": "1 day, 0:03:46", "remaining_time": "10:16:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7606, "total_steps": 10853, "loss": 0.1316, "learning_rate": 1.1270291244918106e-06, "epoch": 0.7007877643156586, "percentage": 70.08, "elapsed_time": "1 day, 0:03:56", "remaining_time": "10:16:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7607, "total_steps": 10853, "loss": 0.1207, "learning_rate": 1.1263925673414303e-06, "epoch": 0.7008799004929286, "percentage": 70.09, "elapsed_time": "1 day, 0:04:06", "remaining_time": "10:16:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7608, "total_steps": 10853, "loss": 0.1286, "learning_rate": 1.1257561377306471e-06, "epoch": 0.7009720366701986, "percentage": 70.1, "elapsed_time": "1 day, 0:04:17", "remaining_time": "10:16:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7609, "total_steps": 10853, "loss": 0.1295, "learning_rate": 1.1251198357185547e-06, "epoch": 0.7010641728474686, "percentage": 70.11, "elapsed_time": "1 day, 0:04:28", "remaining_time": "10:15:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7610, "total_steps": 10853, "loss": 0.1313, "learning_rate": 1.1244836613642342e-06, "epoch": 0.7011563090247386, "percentage": 70.12, "elapsed_time": "1 day, 0:04:39", "remaining_time": "10:15:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7611, "total_steps": 10853, "loss": 0.1225, "learning_rate": 1.1238476147267537e-06, "epoch": 0.7012484452020086, "percentage": 70.13, "elapsed_time": "1 day, 0:04:48", "remaining_time": "10:15:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7612, "total_steps": 10853, "loss": 0.1284, "learning_rate": 1.1232116958651695e-06, "epoch": 0.7013405813792786, "percentage": 70.14, "elapsed_time": "1 day, 0:04:59", "remaining_time": "10:15:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7613, "total_steps": 10853, "loss": 0.124, "learning_rate": 1.1225759048385276e-06, "epoch": 0.7014327175565486, "percentage": 70.15, "elapsed_time": "1 day, 0:05:09", "remaining_time": "10:15:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7614, "total_steps": 10853, "loss": 0.1252, "learning_rate": 1.1219402417058611e-06, "epoch": 0.7015248537338186, "percentage": 70.16, "elapsed_time": "1 day, 0:05:20", "remaining_time": "10:14:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7615, "total_steps": 10853, "loss": 0.1209, "learning_rate": 1.1213047065261922e-06, "epoch": 0.7016169899110886, "percentage": 70.16, "elapsed_time": "1 day, 0:05:30", "remaining_time": "10:14:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7616, "total_steps": 10853, "loss": 0.1197, "learning_rate": 1.12066929935853e-06, "epoch": 0.7017091260883586, "percentage": 70.17, "elapsed_time": "1 day, 0:05:41", "remaining_time": "10:14:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7617, "total_steps": 10853, "loss": 0.1194, "learning_rate": 1.1200340202618706e-06, "epoch": 0.7018012622656286, "percentage": 70.18, "elapsed_time": "1 day, 0:05:53", "remaining_time": "10:14:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7618, "total_steps": 10853, "loss": 0.1111, "learning_rate": 1.1193988692952012e-06, "epoch": 0.7018933984428986, "percentage": 70.19, "elapsed_time": "1 day, 0:06:04", "remaining_time": "10:14:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7619, "total_steps": 10853, "loss": 0.1183, "learning_rate": 1.118763846517496e-06, "epoch": 0.7019855346201687, "percentage": 70.2, "elapsed_time": "1 day, 0:06:14", "remaining_time": "10:13:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7620, "total_steps": 10853, "loss": 0.1249, "learning_rate": 1.1181289519877156e-06, "epoch": 0.7020776707974387, "percentage": 70.21, "elapsed_time": "1 day, 0:06:25", "remaining_time": "10:13:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7621, "total_steps": 10853, "loss": 0.126, "learning_rate": 1.1174941857648105e-06, "epoch": 0.7021698069747087, "percentage": 70.22, "elapsed_time": "1 day, 0:06:35", "remaining_time": "10:13:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7622, "total_steps": 10853, "loss": 0.1226, "learning_rate": 1.11685954790772e-06, "epoch": 0.7022619431519787, "percentage": 70.23, "elapsed_time": "1 day, 0:06:45", "remaining_time": "10:13:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7623, "total_steps": 10853, "loss": 0.1193, "learning_rate": 1.1162250384753697e-06, "epoch": 0.7023540793292486, "percentage": 70.24, "elapsed_time": "1 day, 0:06:56", "remaining_time": "10:13:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7624, "total_steps": 10853, "loss": 0.129, "learning_rate": 1.1155906575266722e-06, "epoch": 0.7024462155065186, "percentage": 70.25, "elapsed_time": "1 day, 0:07:08", "remaining_time": "10:12:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7625, "total_steps": 10853, "loss": 0.1347, "learning_rate": 1.1149564051205314e-06, "epoch": 0.7025383516837886, "percentage": 70.26, "elapsed_time": "1 day, 0:07:19", "remaining_time": "10:12:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7626, "total_steps": 10853, "loss": 0.1283, "learning_rate": 1.114322281315837e-06, "epoch": 0.7026304878610586, "percentage": 70.27, "elapsed_time": "1 day, 0:07:29", "remaining_time": "10:12:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7627, "total_steps": 10853, "loss": 0.1162, "learning_rate": 1.1136882861714692e-06, "epoch": 0.7027226240383286, "percentage": 70.28, "elapsed_time": "1 day, 0:07:40", "remaining_time": "10:12:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7628, "total_steps": 10853, "loss": 0.1226, "learning_rate": 1.1130544197462933e-06, "epoch": 0.7028147602155986, "percentage": 70.28, "elapsed_time": "1 day, 0:07:52", "remaining_time": "10:12:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7629, "total_steps": 10853, "loss": 0.1211, "learning_rate": 1.1124206820991628e-06, "epoch": 0.7029068963928686, "percentage": 70.29, "elapsed_time": "1 day, 0:08:03", "remaining_time": "10:11:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7630, "total_steps": 10853, "loss": 0.1249, "learning_rate": 1.1117870732889214e-06, "epoch": 0.7029990325701386, "percentage": 70.3, "elapsed_time": "1 day, 0:08:13", "remaining_time": "10:11:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7631, "total_steps": 10853, "loss": 0.129, "learning_rate": 1.111153593374399e-06, "epoch": 0.7030911687474086, "percentage": 70.31, "elapsed_time": "1 day, 0:08:25", "remaining_time": "10:11:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7632, "total_steps": 10853, "loss": 0.1297, "learning_rate": 1.1105202424144165e-06, "epoch": 0.7031833049246786, "percentage": 70.32, "elapsed_time": "1 day, 0:08:37", "remaining_time": "10:11:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7633, "total_steps": 10853, "loss": 0.1245, "learning_rate": 1.109887020467779e-06, "epoch": 0.7032754411019487, "percentage": 70.33, "elapsed_time": "1 day, 0:08:48", "remaining_time": "10:11:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7634, "total_steps": 10853, "loss": 0.1288, "learning_rate": 1.10925392759328e-06, "epoch": 0.7033675772792187, "percentage": 70.34, "elapsed_time": "1 day, 0:08:59", "remaining_time": "10:10:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7635, "total_steps": 10853, "loss": 0.1262, "learning_rate": 1.1086209638497038e-06, "epoch": 0.7034597134564887, "percentage": 70.35, "elapsed_time": "1 day, 0:09:09", "remaining_time": "10:10:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7636, "total_steps": 10853, "loss": 0.1417, "learning_rate": 1.1079881292958217e-06, "epoch": 0.7035518496337587, "percentage": 70.36, "elapsed_time": "1 day, 0:09:18", "remaining_time": "10:10:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7637, "total_steps": 10853, "loss": 0.1427, "learning_rate": 1.1073554239903905e-06, "epoch": 0.7036439858110287, "percentage": 70.37, "elapsed_time": "1 day, 0:09:29", "remaining_time": "10:10:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7638, "total_steps": 10853, "loss": 0.1191, "learning_rate": 1.106722847992159e-06, "epoch": 0.7037361219882987, "percentage": 70.38, "elapsed_time": "1 day, 0:09:41", "remaining_time": "10:10:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7639, "total_steps": 10853, "loss": 0.1183, "learning_rate": 1.1060904013598604e-06, "epoch": 0.7038282581655687, "percentage": 70.39, "elapsed_time": "1 day, 0:09:53", "remaining_time": "10:10:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7640, "total_steps": 10853, "loss": 0.1263, "learning_rate": 1.1054580841522188e-06, "epoch": 0.7039203943428387, "percentage": 70.4, "elapsed_time": "1 day, 0:10:04", "remaining_time": "10:09:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7641, "total_steps": 10853, "loss": 0.1206, "learning_rate": 1.1048258964279432e-06, "epoch": 0.7040125305201087, "percentage": 70.4, "elapsed_time": "1 day, 0:10:13", "remaining_time": "10:09:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7642, "total_steps": 10853, "loss": 0.1274, "learning_rate": 1.1041938382457332e-06, "epoch": 0.7041046666973787, "percentage": 70.41, "elapsed_time": "1 day, 0:10:23", "remaining_time": "10:09:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7643, "total_steps": 10853, "loss": 0.125, "learning_rate": 1.1035619096642766e-06, "epoch": 0.7041968028746487, "percentage": 70.42, "elapsed_time": "1 day, 0:10:35", "remaining_time": "10:09:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7644, "total_steps": 10853, "loss": 0.1305, "learning_rate": 1.102930110742247e-06, "epoch": 0.7042889390519187, "percentage": 70.43, "elapsed_time": "1 day, 0:10:45", "remaining_time": "10:09:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7645, "total_steps": 10853, "loss": 0.1262, "learning_rate": 1.102298441538306e-06, "epoch": 0.7043810752291887, "percentage": 70.44, "elapsed_time": "1 day, 0:10:56", "remaining_time": "10:08:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7646, "total_steps": 10853, "loss": 0.1188, "learning_rate": 1.101666902111105e-06, "epoch": 0.7044732114064588, "percentage": 70.45, "elapsed_time": "1 day, 0:11:07", "remaining_time": "10:08:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7647, "total_steps": 10853, "loss": 0.1153, "learning_rate": 1.1010354925192826e-06, "epoch": 0.7045653475837288, "percentage": 70.46, "elapsed_time": "1 day, 0:11:18", "remaining_time": "10:08:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7648, "total_steps": 10853, "loss": 0.1325, "learning_rate": 1.1004042128214664e-06, "epoch": 0.7046574837609988, "percentage": 70.47, "elapsed_time": "1 day, 0:11:30", "remaining_time": "10:08:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7649, "total_steps": 10853, "loss": 0.1183, "learning_rate": 1.0997730630762697e-06, "epoch": 0.7047496199382688, "percentage": 70.48, "elapsed_time": "1 day, 0:11:41", "remaining_time": "10:08:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7650, "total_steps": 10853, "loss": 0.1078, "learning_rate": 1.0991420433422936e-06, "epoch": 0.7048417561155388, "percentage": 70.49, "elapsed_time": "1 day, 0:11:52", "remaining_time": "10:07:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7651, "total_steps": 10853, "loss": 0.1178, "learning_rate": 1.0985111536781298e-06, "epoch": 0.7049338922928088, "percentage": 70.5, "elapsed_time": "1 day, 0:12:04", "remaining_time": "10:07:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7652, "total_steps": 10853, "loss": 0.129, "learning_rate": 1.0978803941423572e-06, "epoch": 0.7050260284700788, "percentage": 70.51, "elapsed_time": "1 day, 0:12:14", "remaining_time": "10:07:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7653, "total_steps": 10853, "loss": 0.122, "learning_rate": 1.0972497647935396e-06, "epoch": 0.7051181646473488, "percentage": 70.52, "elapsed_time": "1 day, 0:12:24", "remaining_time": "10:07:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7654, "total_steps": 10853, "loss": 0.1081, "learning_rate": 1.0966192656902335e-06, "epoch": 0.7052103008246188, "percentage": 70.52, "elapsed_time": "1 day, 0:12:35", "remaining_time": "10:07:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7655, "total_steps": 10853, "loss": 0.1314, "learning_rate": 1.0959888968909784e-06, "epoch": 0.7053024370018888, "percentage": 70.53, "elapsed_time": "1 day, 0:12:46", "remaining_time": "10:06:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7656, "total_steps": 10853, "loss": 0.1221, "learning_rate": 1.0953586584543066e-06, "epoch": 0.7053945731791588, "percentage": 70.54, "elapsed_time": "1 day, 0:12:58", "remaining_time": "10:06:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7657, "total_steps": 10853, "loss": 0.1217, "learning_rate": 1.0947285504387337e-06, "epoch": 0.7054867093564288, "percentage": 70.55, "elapsed_time": "1 day, 0:13:10", "remaining_time": "10:06:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7658, "total_steps": 10853, "loss": 0.114, "learning_rate": 1.094098572902766e-06, "epoch": 0.7055788455336988, "percentage": 70.56, "elapsed_time": "1 day, 0:13:19", "remaining_time": "10:06:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7659, "total_steps": 10853, "loss": 0.1178, "learning_rate": 1.0934687259048975e-06, "epoch": 0.7056709817109688, "percentage": 70.57, "elapsed_time": "1 day, 0:13:29", "remaining_time": "10:06:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7660, "total_steps": 10853, "loss": 0.1229, "learning_rate": 1.092839009503609e-06, "epoch": 0.7057631178882389, "percentage": 70.58, "elapsed_time": "1 day, 0:13:40", "remaining_time": "10:05:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7661, "total_steps": 10853, "loss": 0.1261, "learning_rate": 1.0922094237573706e-06, "epoch": 0.7058552540655089, "percentage": 70.59, "elapsed_time": "1 day, 0:13:49", "remaining_time": "10:05:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7662, "total_steps": 10853, "loss": 0.1221, "learning_rate": 1.0915799687246376e-06, "epoch": 0.7059473902427789, "percentage": 70.6, "elapsed_time": "1 day, 0:14:00", "remaining_time": "10:05:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7663, "total_steps": 10853, "loss": 0.1247, "learning_rate": 1.0909506444638563e-06, "epoch": 0.7060395264200489, "percentage": 70.61, "elapsed_time": "1 day, 0:14:12", "remaining_time": "10:05:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7664, "total_steps": 10853, "loss": 0.1145, "learning_rate": 1.09032145103346e-06, "epoch": 0.7061316625973189, "percentage": 70.62, "elapsed_time": "1 day, 0:14:22", "remaining_time": "10:05:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7665, "total_steps": 10853, "loss": 0.1172, "learning_rate": 1.0896923884918687e-06, "epoch": 0.7062237987745889, "percentage": 70.63, "elapsed_time": "1 day, 0:14:33", "remaining_time": "10:04:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7666, "total_steps": 10853, "loss": 0.1307, "learning_rate": 1.0890634568974901e-06, "epoch": 0.7063159349518588, "percentage": 70.63, "elapsed_time": "1 day, 0:14:45", "remaining_time": "10:04:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7667, "total_steps": 10853, "loss": 0.1148, "learning_rate": 1.0884346563087214e-06, "epoch": 0.7064080711291288, "percentage": 70.64, "elapsed_time": "1 day, 0:14:56", "remaining_time": "10:04:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7668, "total_steps": 10853, "loss": 0.1219, "learning_rate": 1.0878059867839469e-06, "epoch": 0.7065002073063988, "percentage": 70.65, "elapsed_time": "1 day, 0:15:07", "remaining_time": "10:04:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7669, "total_steps": 10853, "loss": 0.124, "learning_rate": 1.0871774483815393e-06, "epoch": 0.7065923434836688, "percentage": 70.66, "elapsed_time": "1 day, 0:15:17", "remaining_time": "10:04:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7670, "total_steps": 10853, "loss": 0.1226, "learning_rate": 1.0865490411598576e-06, "epoch": 0.7066844796609388, "percentage": 70.67, "elapsed_time": "1 day, 0:15:28", "remaining_time": "10:04:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7671, "total_steps": 10853, "loss": 0.1221, "learning_rate": 1.0859207651772485e-06, "epoch": 0.7067766158382088, "percentage": 70.68, "elapsed_time": "1 day, 0:15:40", "remaining_time": "10:03:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7672, "total_steps": 10853, "loss": 0.1254, "learning_rate": 1.0852926204920488e-06, "epoch": 0.7068687520154788, "percentage": 70.69, "elapsed_time": "1 day, 0:15:49", "remaining_time": "10:03:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7673, "total_steps": 10853, "loss": 0.1197, "learning_rate": 1.084664607162582e-06, "epoch": 0.7069608881927489, "percentage": 70.7, "elapsed_time": "1 day, 0:16:02", "remaining_time": "10:03:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7674, "total_steps": 10853, "loss": 0.123, "learning_rate": 1.0840367252471583e-06, "epoch": 0.7070530243700189, "percentage": 70.71, "elapsed_time": "1 day, 0:16:12", "remaining_time": "10:03:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7675, "total_steps": 10853, "loss": 0.1408, "learning_rate": 1.083408974804078e-06, "epoch": 0.7071451605472889, "percentage": 70.72, "elapsed_time": "1 day, 0:16:23", "remaining_time": "10:03:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7676, "total_steps": 10853, "loss": 0.1181, "learning_rate": 1.082781355891626e-06, "epoch": 0.7072372967245589, "percentage": 70.73, "elapsed_time": "1 day, 0:16:33", "remaining_time": "10:02:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7677, "total_steps": 10853, "loss": 0.1183, "learning_rate": 1.0821538685680783e-06, "epoch": 0.7073294329018289, "percentage": 70.74, "elapsed_time": "1 day, 0:16:43", "remaining_time": "10:02:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7678, "total_steps": 10853, "loss": 0.127, "learning_rate": 1.0815265128916955e-06, "epoch": 0.7074215690790989, "percentage": 70.75, "elapsed_time": "1 day, 0:16:54", "remaining_time": "10:02:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7679, "total_steps": 10853, "loss": 0.1134, "learning_rate": 1.0808992889207287e-06, "epoch": 0.7075137052563689, "percentage": 70.75, "elapsed_time": "1 day, 0:17:04", "remaining_time": "10:02:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7680, "total_steps": 10853, "loss": 0.1234, "learning_rate": 1.0802721967134167e-06, "epoch": 0.7076058414336389, "percentage": 70.76, "elapsed_time": "1 day, 0:17:14", "remaining_time": "10:02:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7681, "total_steps": 10853, "loss": 0.125, "learning_rate": 1.0796452363279838e-06, "epoch": 0.7076979776109089, "percentage": 70.77, "elapsed_time": "1 day, 0:17:24", "remaining_time": "10:01:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7682, "total_steps": 10853, "loss": 0.1178, "learning_rate": 1.079018407822643e-06, "epoch": 0.7077901137881789, "percentage": 70.78, "elapsed_time": "1 day, 0:17:35", "remaining_time": "10:01:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7683, "total_steps": 10853, "loss": 0.1213, "learning_rate": 1.0783917112555956e-06, "epoch": 0.7078822499654489, "percentage": 70.79, "elapsed_time": "1 day, 0:17:45", "remaining_time": "10:01:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7684, "total_steps": 10853, "loss": 0.123, "learning_rate": 1.0777651466850308e-06, "epoch": 0.7079743861427189, "percentage": 70.8, "elapsed_time": "1 day, 0:17:55", "remaining_time": "10:01:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7685, "total_steps": 10853, "loss": 0.1239, "learning_rate": 1.0771387141691265e-06, "epoch": 0.7080665223199889, "percentage": 70.81, "elapsed_time": "1 day, 0:18:06", "remaining_time": "10:01:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7686, "total_steps": 10853, "loss": 0.1199, "learning_rate": 1.0765124137660454e-06, "epoch": 0.7081586584972589, "percentage": 70.82, "elapsed_time": "1 day, 0:18:16", "remaining_time": "10:00:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7687, "total_steps": 10853, "loss": 0.1322, "learning_rate": 1.075886245533939e-06, "epoch": 0.708250794674529, "percentage": 70.83, "elapsed_time": "1 day, 0:18:26", "remaining_time": "10:00:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7688, "total_steps": 10853, "loss": 0.1346, "learning_rate": 1.075260209530948e-06, "epoch": 0.708342930851799, "percentage": 70.84, "elapsed_time": "1 day, 0:18:38", "remaining_time": "10:00:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7689, "total_steps": 10853, "loss": 0.1359, "learning_rate": 1.0746343058151998e-06, "epoch": 0.708435067029069, "percentage": 70.85, "elapsed_time": "1 day, 0:18:48", "remaining_time": "10:00:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7690, "total_steps": 10853, "loss": 0.1341, "learning_rate": 1.074008534444811e-06, "epoch": 0.708527203206339, "percentage": 70.86, "elapsed_time": "1 day, 0:18:59", "remaining_time": "10:00:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7691, "total_steps": 10853, "loss": 0.1127, "learning_rate": 1.0733828954778827e-06, "epoch": 0.708619339383609, "percentage": 70.87, "elapsed_time": "1 day, 0:19:10", "remaining_time": "9:59:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7692, "total_steps": 10853, "loss": 0.125, "learning_rate": 1.0727573889725053e-06, "epoch": 0.708711475560879, "percentage": 70.87, "elapsed_time": "1 day, 0:19:20", "remaining_time": "9:59:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7693, "total_steps": 10853, "loss": 0.1176, "learning_rate": 1.0721320149867582e-06, "epoch": 0.708803611738149, "percentage": 70.88, "elapsed_time": "1 day, 0:19:31", "remaining_time": "9:59:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7694, "total_steps": 10853, "loss": 0.1304, "learning_rate": 1.0715067735787079e-06, "epoch": 0.708895747915419, "percentage": 70.89, "elapsed_time": "1 day, 0:19:42", "remaining_time": "9:59:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7695, "total_steps": 10853, "loss": 0.1362, "learning_rate": 1.0708816648064067e-06, "epoch": 0.708987884092689, "percentage": 70.9, "elapsed_time": "1 day, 0:19:54", "remaining_time": "9:59:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7696, "total_steps": 10853, "loss": 0.1363, "learning_rate": 1.0702566887278975e-06, "epoch": 0.709080020269959, "percentage": 70.91, "elapsed_time": "1 day, 0:20:05", "remaining_time": "9:58:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7697, "total_steps": 10853, "loss": 0.1194, "learning_rate": 1.0696318454012074e-06, "epoch": 0.709172156447229, "percentage": 70.92, "elapsed_time": "1 day, 0:20:17", "remaining_time": "9:58:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7698, "total_steps": 10853, "loss": 0.1263, "learning_rate": 1.0690071348843559e-06, "epoch": 0.709264292624499, "percentage": 70.93, "elapsed_time": "1 day, 0:20:28", "remaining_time": "9:58:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7699, "total_steps": 10853, "loss": 0.1268, "learning_rate": 1.0683825572353447e-06, "epoch": 0.709356428801769, "percentage": 70.94, "elapsed_time": "1 day, 0:20:40", "remaining_time": "9:58:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7700, "total_steps": 10853, "loss": 0.1292, "learning_rate": 1.0677581125121672e-06, "epoch": 0.709448564979039, "percentage": 70.95, "elapsed_time": "1 day, 0:20:51", "remaining_time": "9:58:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7701, "total_steps": 10853, "loss": 0.1328, "learning_rate": 1.067133800772803e-06, "epoch": 0.7095407011563091, "percentage": 70.96, "elapsed_time": "1 day, 0:21:01", "remaining_time": "9:57:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7702, "total_steps": 10853, "loss": 0.1256, "learning_rate": 1.0665096220752214e-06, "epoch": 0.7096328373335791, "percentage": 70.97, "elapsed_time": "1 day, 0:21:10", "remaining_time": "9:57:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7703, "total_steps": 10853, "loss": 0.125, "learning_rate": 1.065885576477374e-06, "epoch": 0.7097249735108491, "percentage": 70.98, "elapsed_time": "1 day, 0:21:21", "remaining_time": "9:57:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7704, "total_steps": 10853, "loss": 0.1227, "learning_rate": 1.0652616640372051e-06, "epoch": 0.7098171096881191, "percentage": 70.98, "elapsed_time": "1 day, 0:21:33", "remaining_time": "9:57:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7705, "total_steps": 10853, "loss": 0.1225, "learning_rate": 1.064637884812645e-06, "epoch": 0.7099092458653891, "percentage": 70.99, "elapsed_time": "1 day, 0:21:44", "remaining_time": "9:57:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7706, "total_steps": 10853, "loss": 0.1216, "learning_rate": 1.0640142388616128e-06, "epoch": 0.7100013820426591, "percentage": 71.0, "elapsed_time": "1 day, 0:21:53", "remaining_time": "9:57:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7707, "total_steps": 10853, "loss": 0.1171, "learning_rate": 1.063390726242012e-06, "epoch": 0.710093518219929, "percentage": 71.01, "elapsed_time": "1 day, 0:22:03", "remaining_time": "9:56:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7708, "total_steps": 10853, "loss": 0.1179, "learning_rate": 1.062767347011738e-06, "epoch": 0.710185654397199, "percentage": 71.02, "elapsed_time": "1 day, 0:22:13", "remaining_time": "9:56:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7709, "total_steps": 10853, "loss": 0.1249, "learning_rate": 1.0621441012286696e-06, "epoch": 0.710277790574469, "percentage": 71.03, "elapsed_time": "1 day, 0:22:23", "remaining_time": "9:56:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7710, "total_steps": 10853, "loss": 0.1297, "learning_rate": 1.061520988950677e-06, "epoch": 0.710369926751739, "percentage": 71.04, "elapsed_time": "1 day, 0:22:34", "remaining_time": "9:56:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7711, "total_steps": 10853, "loss": 0.1155, "learning_rate": 1.0608980102356146e-06, "epoch": 0.710462062929009, "percentage": 71.05, "elapsed_time": "1 day, 0:22:44", "remaining_time": "9:56:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7712, "total_steps": 10853, "loss": 0.1335, "learning_rate": 1.0602751651413264e-06, "epoch": 0.710554199106279, "percentage": 71.06, "elapsed_time": "1 day, 0:22:55", "remaining_time": "9:55:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7713, "total_steps": 10853, "loss": 0.1095, "learning_rate": 1.0596524537256453e-06, "epoch": 0.710646335283549, "percentage": 71.07, "elapsed_time": "1 day, 0:23:07", "remaining_time": "9:55:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7714, "total_steps": 10853, "loss": 0.1199, "learning_rate": 1.0590298760463879e-06, "epoch": 0.7107384714608191, "percentage": 71.08, "elapsed_time": "1 day, 0:23:18", "remaining_time": "9:55:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7715, "total_steps": 10853, "loss": 0.1242, "learning_rate": 1.0584074321613625e-06, "epoch": 0.7108306076380891, "percentage": 71.09, "elapsed_time": "1 day, 0:23:28", "remaining_time": "9:55:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7716, "total_steps": 10853, "loss": 0.1165, "learning_rate": 1.0577851221283614e-06, "epoch": 0.7109227438153591, "percentage": 71.1, "elapsed_time": "1 day, 0:23:39", "remaining_time": "9:55:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7717, "total_steps": 10853, "loss": 0.1329, "learning_rate": 1.0571629460051665e-06, "epoch": 0.7110148799926291, "percentage": 71.1, "elapsed_time": "1 day, 0:23:50", "remaining_time": "9:54:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7718, "total_steps": 10853, "loss": 0.1371, "learning_rate": 1.0565409038495486e-06, "epoch": 0.7111070161698991, "percentage": 71.11, "elapsed_time": "1 day, 0:24:01", "remaining_time": "9:54:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7719, "total_steps": 10853, "loss": 0.1222, "learning_rate": 1.055918995719263e-06, "epoch": 0.7111991523471691, "percentage": 71.12, "elapsed_time": "1 day, 0:24:11", "remaining_time": "9:54:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7720, "total_steps": 10853, "loss": 0.121, "learning_rate": 1.0552972216720534e-06, "epoch": 0.7112912885244391, "percentage": 71.13, "elapsed_time": "1 day, 0:24:20", "remaining_time": "9:54:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7721, "total_steps": 10853, "loss": 0.1318, "learning_rate": 1.054675581765652e-06, "epoch": 0.7113834247017091, "percentage": 71.14, "elapsed_time": "1 day, 0:24:31", "remaining_time": "9:54:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7722, "total_steps": 10853, "loss": 0.1285, "learning_rate": 1.0540540760577785e-06, "epoch": 0.7114755608789791, "percentage": 71.15, "elapsed_time": "1 day, 0:24:43", "remaining_time": "9:53:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7723, "total_steps": 10853, "loss": 0.1306, "learning_rate": 1.0534327046061404e-06, "epoch": 0.7115676970562491, "percentage": 71.16, "elapsed_time": "1 day, 0:24:54", "remaining_time": "9:53:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7724, "total_steps": 10853, "loss": 0.1198, "learning_rate": 1.0528114674684318e-06, "epoch": 0.7116598332335191, "percentage": 71.17, "elapsed_time": "1 day, 0:25:06", "remaining_time": "9:53:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7725, "total_steps": 10853, "loss": 0.126, "learning_rate": 1.0521903647023327e-06, "epoch": 0.7117519694107891, "percentage": 71.18, "elapsed_time": "1 day, 0:25:17", "remaining_time": "9:53:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7726, "total_steps": 10853, "loss": 0.1087, "learning_rate": 1.0515693963655144e-06, "epoch": 0.7118441055880591, "percentage": 71.19, "elapsed_time": "1 day, 0:25:26", "remaining_time": "9:53:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7727, "total_steps": 10853, "loss": 0.1198, "learning_rate": 1.0509485625156342e-06, "epoch": 0.7119362417653291, "percentage": 71.2, "elapsed_time": "1 day, 0:25:37", "remaining_time": "9:52:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7728, "total_steps": 10853, "loss": 0.1204, "learning_rate": 1.0503278632103353e-06, "epoch": 0.7120283779425992, "percentage": 71.21, "elapsed_time": "1 day, 0:25:47", "remaining_time": "9:52:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7729, "total_steps": 10853, "loss": 0.138, "learning_rate": 1.0497072985072509e-06, "epoch": 0.7121205141198692, "percentage": 71.22, "elapsed_time": "1 day, 0:25:59", "remaining_time": "9:52:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7730, "total_steps": 10853, "loss": 0.1377, "learning_rate": 1.0490868684639994e-06, "epoch": 0.7122126502971392, "percentage": 71.22, "elapsed_time": "1 day, 0:26:10", "remaining_time": "9:52:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7731, "total_steps": 10853, "loss": 0.1275, "learning_rate": 1.0484665731381892e-06, "epoch": 0.7123047864744092, "percentage": 71.23, "elapsed_time": "1 day, 0:26:20", "remaining_time": "9:52:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7732, "total_steps": 10853, "loss": 0.1211, "learning_rate": 1.0478464125874126e-06, "epoch": 0.7123969226516792, "percentage": 71.24, "elapsed_time": "1 day, 0:26:31", "remaining_time": "9:51:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7733, "total_steps": 10853, "loss": 0.1144, "learning_rate": 1.047226386869253e-06, "epoch": 0.7124890588289492, "percentage": 71.25, "elapsed_time": "1 day, 0:26:42", "remaining_time": "9:51:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7734, "total_steps": 10853, "loss": 0.1236, "learning_rate": 1.046606496041281e-06, "epoch": 0.7125811950062192, "percentage": 71.26, "elapsed_time": "1 day, 0:26:53", "remaining_time": "9:51:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7735, "total_steps": 10853, "loss": 0.1174, "learning_rate": 1.0459867401610519e-06, "epoch": 0.7126733311834892, "percentage": 71.27, "elapsed_time": "1 day, 0:27:04", "remaining_time": "9:51:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7736, "total_steps": 10853, "loss": 0.1251, "learning_rate": 1.0453671192861095e-06, "epoch": 0.7127654673607592, "percentage": 71.28, "elapsed_time": "1 day, 0:27:15", "remaining_time": "9:51:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7737, "total_steps": 10853, "loss": 0.1321, "learning_rate": 1.0447476334739867e-06, "epoch": 0.7128576035380292, "percentage": 71.29, "elapsed_time": "1 day, 0:27:25", "remaining_time": "9:50:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7738, "total_steps": 10853, "loss": 0.1257, "learning_rate": 1.0441282827822027e-06, "epoch": 0.7129497397152992, "percentage": 71.3, "elapsed_time": "1 day, 0:27:35", "remaining_time": "9:50:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7739, "total_steps": 10853, "loss": 0.1311, "learning_rate": 1.0435090672682655e-06, "epoch": 0.7130418758925692, "percentage": 71.31, "elapsed_time": "1 day, 0:27:46", "remaining_time": "9:50:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7740, "total_steps": 10853, "loss": 0.1309, "learning_rate": 1.042889986989668e-06, "epoch": 0.7131340120698392, "percentage": 71.32, "elapsed_time": "1 day, 0:27:55", "remaining_time": "9:50:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7741, "total_steps": 10853, "loss": 0.1259, "learning_rate": 1.0422710420038912e-06, "epoch": 0.7132261482471093, "percentage": 71.33, "elapsed_time": "1 day, 0:28:05", "remaining_time": "9:50:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7742, "total_steps": 10853, "loss": 0.1116, "learning_rate": 1.0416522323684048e-06, "epoch": 0.7133182844243793, "percentage": 71.34, "elapsed_time": "1 day, 0:28:17", "remaining_time": "9:50:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7743, "total_steps": 10853, "loss": 0.1275, "learning_rate": 1.0410335581406657e-06, "epoch": 0.7134104206016493, "percentage": 71.34, "elapsed_time": "1 day, 0:28:29", "remaining_time": "9:49:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7744, "total_steps": 10853, "loss": 0.1285, "learning_rate": 1.0404150193781187e-06, "epoch": 0.7135025567789193, "percentage": 71.35, "elapsed_time": "1 day, 0:28:41", "remaining_time": "9:49:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7745, "total_steps": 10853, "loss": 0.1163, "learning_rate": 1.0397966161381943e-06, "epoch": 0.7135946929561893, "percentage": 71.36, "elapsed_time": "1 day, 0:28:51", "remaining_time": "9:49:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7746, "total_steps": 10853, "loss": 0.1261, "learning_rate": 1.03917834847831e-06, "epoch": 0.7136868291334593, "percentage": 71.37, "elapsed_time": "1 day, 0:29:00", "remaining_time": "9:49:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7747, "total_steps": 10853, "loss": 0.109, "learning_rate": 1.0385602164558735e-06, "epoch": 0.7137789653107293, "percentage": 71.38, "elapsed_time": "1 day, 0:29:11", "remaining_time": "9:49:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7748, "total_steps": 10853, "loss": 0.1214, "learning_rate": 1.037942220128279e-06, "epoch": 0.7138711014879993, "percentage": 71.39, "elapsed_time": "1 day, 0:29:21", "remaining_time": "9:48:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7749, "total_steps": 10853, "loss": 0.1218, "learning_rate": 1.0373243595529058e-06, "epoch": 0.7139632376652693, "percentage": 71.4, "elapsed_time": "1 day, 0:29:33", "remaining_time": "9:48:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7750, "total_steps": 10853, "loss": 0.118, "learning_rate": 1.0367066347871243e-06, "epoch": 0.7140553738425393, "percentage": 71.41, "elapsed_time": "1 day, 0:29:44", "remaining_time": "9:48:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7751, "total_steps": 10853, "loss": 0.1277, "learning_rate": 1.0360890458882882e-06, "epoch": 0.7141475100198093, "percentage": 71.42, "elapsed_time": "1 day, 0:29:54", "remaining_time": "9:48:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7752, "total_steps": 10853, "loss": 0.1118, "learning_rate": 1.0354715929137429e-06, "epoch": 0.7142396461970792, "percentage": 71.43, "elapsed_time": "1 day, 0:30:05", "remaining_time": "9:48:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7753, "total_steps": 10853, "loss": 0.1122, "learning_rate": 1.0348542759208166e-06, "epoch": 0.7143317823743492, "percentage": 71.44, "elapsed_time": "1 day, 0:30:16", "remaining_time": "9:47:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7754, "total_steps": 10853, "loss": 0.1282, "learning_rate": 1.0342370949668287e-06, "epoch": 0.7144239185516192, "percentage": 71.45, "elapsed_time": "1 day, 0:30:26", "remaining_time": "9:47:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7755, "total_steps": 10853, "loss": 0.118, "learning_rate": 1.0336200501090848e-06, "epoch": 0.7145160547288893, "percentage": 71.45, "elapsed_time": "1 day, 0:30:36", "remaining_time": "9:47:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7756, "total_steps": 10853, "loss": 0.1266, "learning_rate": 1.0330031414048775e-06, "epoch": 0.7146081909061593, "percentage": 71.46, "elapsed_time": "1 day, 0:30:47", "remaining_time": "9:47:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7757, "total_steps": 10853, "loss": 0.1212, "learning_rate": 1.0323863689114851e-06, "epoch": 0.7147003270834293, "percentage": 71.47, "elapsed_time": "1 day, 0:30:59", "remaining_time": "9:47:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7758, "total_steps": 10853, "loss": 0.1239, "learning_rate": 1.0317697326861766e-06, "epoch": 0.7147924632606993, "percentage": 71.48, "elapsed_time": "1 day, 0:31:10", "remaining_time": "9:46:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7759, "total_steps": 10853, "loss": 0.1219, "learning_rate": 1.0311532327862064e-06, "epoch": 0.7148845994379693, "percentage": 71.49, "elapsed_time": "1 day, 0:31:21", "remaining_time": "9:46:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7760, "total_steps": 10853, "loss": 0.1372, "learning_rate": 1.0305368692688175e-06, "epoch": 0.7149767356152393, "percentage": 71.5, "elapsed_time": "1 day, 0:31:31", "remaining_time": "9:46:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7761, "total_steps": 10853, "loss": 0.1201, "learning_rate": 1.0299206421912382e-06, "epoch": 0.7150688717925093, "percentage": 71.51, "elapsed_time": "1 day, 0:31:42", "remaining_time": "9:46:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7762, "total_steps": 10853, "loss": 0.1085, "learning_rate": 1.0293045516106848e-06, "epoch": 0.7151610079697793, "percentage": 71.52, "elapsed_time": "1 day, 0:31:53", "remaining_time": "9:46:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7763, "total_steps": 10853, "loss": 0.1145, "learning_rate": 1.0286885975843621e-06, "epoch": 0.7152531441470493, "percentage": 71.53, "elapsed_time": "1 day, 0:32:04", "remaining_time": "9:45:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7764, "total_steps": 10853, "loss": 0.1216, "learning_rate": 1.0280727801694624e-06, "epoch": 0.7153452803243193, "percentage": 71.54, "elapsed_time": "1 day, 0:32:14", "remaining_time": "9:45:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7765, "total_steps": 10853, "loss": 0.1254, "learning_rate": 1.0274570994231622e-06, "epoch": 0.7154374165015893, "percentage": 71.55, "elapsed_time": "1 day, 0:32:25", "remaining_time": "9:45:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7766, "total_steps": 10853, "loss": 0.1273, "learning_rate": 1.02684155540263e-06, "epoch": 0.7155295526788593, "percentage": 71.56, "elapsed_time": "1 day, 0:32:35", "remaining_time": "9:45:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7767, "total_steps": 10853, "loss": 0.1203, "learning_rate": 1.026226148165017e-06, "epoch": 0.7156216888561293, "percentage": 71.57, "elapsed_time": "1 day, 0:32:45", "remaining_time": "9:45:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7768, "total_steps": 10853, "loss": 0.1198, "learning_rate": 1.0256108777674656e-06, "epoch": 0.7157138250333993, "percentage": 71.57, "elapsed_time": "1 day, 0:32:56", "remaining_time": "9:44:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7769, "total_steps": 10853, "loss": 0.1157, "learning_rate": 1.024995744267102e-06, "epoch": 0.7158059612106694, "percentage": 71.58, "elapsed_time": "1 day, 0:33:06", "remaining_time": "9:44:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7770, "total_steps": 10853, "loss": 0.13, "learning_rate": 1.0243807477210423e-06, "epoch": 0.7158980973879394, "percentage": 71.59, "elapsed_time": "1 day, 0:33:17", "remaining_time": "9:44:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7771, "total_steps": 10853, "loss": 0.1114, "learning_rate": 1.0237658881863898e-06, "epoch": 0.7159902335652094, "percentage": 71.6, "elapsed_time": "1 day, 0:33:28", "remaining_time": "9:44:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7772, "total_steps": 10853, "loss": 0.1203, "learning_rate": 1.0231511657202327e-06, "epoch": 0.7160823697424794, "percentage": 71.61, "elapsed_time": "1 day, 0:33:39", "remaining_time": "9:44:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7773, "total_steps": 10853, "loss": 0.1236, "learning_rate": 1.0225365803796498e-06, "epoch": 0.7161745059197494, "percentage": 71.62, "elapsed_time": "1 day, 0:33:49", "remaining_time": "9:43:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7774, "total_steps": 10853, "loss": 0.1101, "learning_rate": 1.0219221322217032e-06, "epoch": 0.7162666420970194, "percentage": 71.63, "elapsed_time": "1 day, 0:33:59", "remaining_time": "9:43:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7775, "total_steps": 10853, "loss": 0.1358, "learning_rate": 1.0213078213034457e-06, "epoch": 0.7163587782742894, "percentage": 71.64, "elapsed_time": "1 day, 0:34:10", "remaining_time": "9:43:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7776, "total_steps": 10853, "loss": 0.1147, "learning_rate": 1.0206936476819165e-06, "epoch": 0.7164509144515594, "percentage": 71.65, "elapsed_time": "1 day, 0:34:20", "remaining_time": "9:43:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7777, "total_steps": 10853, "loss": 0.1173, "learning_rate": 1.0200796114141428e-06, "epoch": 0.7165430506288294, "percentage": 71.66, "elapsed_time": "1 day, 0:34:32", "remaining_time": "9:43:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7778, "total_steps": 10853, "loss": 0.1267, "learning_rate": 1.0194657125571347e-06, "epoch": 0.7166351868060994, "percentage": 71.67, "elapsed_time": "1 day, 0:34:42", "remaining_time": "9:43:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7779, "total_steps": 10853, "loss": 0.1134, "learning_rate": 1.0188519511678946e-06, "epoch": 0.7167273229833694, "percentage": 71.68, "elapsed_time": "1 day, 0:34:53", "remaining_time": "9:42:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7780, "total_steps": 10853, "loss": 0.1138, "learning_rate": 1.0182383273034102e-06, "epoch": 0.7168194591606394, "percentage": 71.69, "elapsed_time": "1 day, 0:35:05", "remaining_time": "9:42:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7781, "total_steps": 10853, "loss": 0.131, "learning_rate": 1.0176248410206577e-06, "epoch": 0.7169115953379094, "percentage": 71.69, "elapsed_time": "1 day, 0:35:16", "remaining_time": "9:42:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7782, "total_steps": 10853, "loss": 0.1226, "learning_rate": 1.017011492376597e-06, "epoch": 0.7170037315151795, "percentage": 71.7, "elapsed_time": "1 day, 0:35:27", "remaining_time": "9:42:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7783, "total_steps": 10853, "loss": 0.1081, "learning_rate": 1.0163982814281797e-06, "epoch": 0.7170958676924495, "percentage": 71.71, "elapsed_time": "1 day, 0:35:38", "remaining_time": "9:42:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7784, "total_steps": 10853, "loss": 0.117, "learning_rate": 1.0157852082323411e-06, "epoch": 0.7171880038697195, "percentage": 71.72, "elapsed_time": "1 day, 0:35:47", "remaining_time": "9:41:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7785, "total_steps": 10853, "loss": 0.1232, "learning_rate": 1.0151722728460064e-06, "epoch": 0.7172801400469895, "percentage": 71.73, "elapsed_time": "1 day, 0:35:57", "remaining_time": "9:41:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7786, "total_steps": 10853, "loss": 0.1162, "learning_rate": 1.0145594753260849e-06, "epoch": 0.7173722762242595, "percentage": 71.74, "elapsed_time": "1 day, 0:36:06", "remaining_time": "9:41:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7787, "total_steps": 10853, "loss": 0.1218, "learning_rate": 1.0139468157294762e-06, "epoch": 0.7174644124015295, "percentage": 71.75, "elapsed_time": "1 day, 0:36:18", "remaining_time": "9:41:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7788, "total_steps": 10853, "loss": 0.1112, "learning_rate": 1.0133342941130664e-06, "epoch": 0.7175565485787995, "percentage": 71.76, "elapsed_time": "1 day, 0:36:28", "remaining_time": "9:41:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7789, "total_steps": 10853, "loss": 0.1259, "learning_rate": 1.0127219105337274e-06, "epoch": 0.7176486847560695, "percentage": 71.77, "elapsed_time": "1 day, 0:36:39", "remaining_time": "9:40:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7790, "total_steps": 10853, "loss": 0.1169, "learning_rate": 1.0121096650483182e-06, "epoch": 0.7177408209333395, "percentage": 71.78, "elapsed_time": "1 day, 0:36:50", "remaining_time": "9:40:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7791, "total_steps": 10853, "loss": 0.1194, "learning_rate": 1.0114975577136866e-06, "epoch": 0.7178329571106095, "percentage": 71.79, "elapsed_time": "1 day, 0:37:01", "remaining_time": "9:40:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7792, "total_steps": 10853, "loss": 0.1277, "learning_rate": 1.010885588586667e-06, "epoch": 0.7179250932878795, "percentage": 71.8, "elapsed_time": "1 day, 0:37:12", "remaining_time": "9:40:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7793, "total_steps": 10853, "loss": 0.1202, "learning_rate": 1.0102737577240818e-06, "epoch": 0.7180172294651495, "percentage": 71.81, "elapsed_time": "1 day, 0:37:22", "remaining_time": "9:40:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7794, "total_steps": 10853, "loss": 0.1214, "learning_rate": 1.0096620651827382e-06, "epoch": 0.7181093656424195, "percentage": 71.81, "elapsed_time": "1 day, 0:37:33", "remaining_time": "9:39:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7795, "total_steps": 10853, "loss": 0.1128, "learning_rate": 1.0090505110194315e-06, "epoch": 0.7182015018196894, "percentage": 71.82, "elapsed_time": "1 day, 0:37:43", "remaining_time": "9:39:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7796, "total_steps": 10853, "loss": 0.1269, "learning_rate": 1.0084390952909456e-06, "epoch": 0.7182936379969596, "percentage": 71.83, "elapsed_time": "1 day, 0:37:55", "remaining_time": "9:39:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7797, "total_steps": 10853, "loss": 0.1154, "learning_rate": 1.0078278180540507e-06, "epoch": 0.7183857741742296, "percentage": 71.84, "elapsed_time": "1 day, 0:38:06", "remaining_time": "9:39:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7798, "total_steps": 10853, "loss": 0.1106, "learning_rate": 1.0072166793655027e-06, "epoch": 0.7184779103514995, "percentage": 71.85, "elapsed_time": "1 day, 0:38:17", "remaining_time": "9:39:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7799, "total_steps": 10853, "loss": 0.1301, "learning_rate": 1.0066056792820478e-06, "epoch": 0.7185700465287695, "percentage": 71.86, "elapsed_time": "1 day, 0:38:28", "remaining_time": "9:38:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7800, "total_steps": 10853, "loss": 0.1053, "learning_rate": 1.0059948178604154e-06, "epoch": 0.7186621827060395, "percentage": 71.87, "elapsed_time": "1 day, 0:38:38", "remaining_time": "9:38:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7801, "total_steps": 10853, "loss": 0.1349, "learning_rate": 1.0053840951573247e-06, "epoch": 0.7187543188833095, "percentage": 71.88, "elapsed_time": "1 day, 0:38:48", "remaining_time": "9:38:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7802, "total_steps": 10853, "loss": 0.1157, "learning_rate": 1.0047735112294827e-06, "epoch": 0.7188464550605795, "percentage": 71.89, "elapsed_time": "1 day, 0:38:59", "remaining_time": "9:38:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7803, "total_steps": 10853, "loss": 0.1197, "learning_rate": 1.00416306613358e-06, "epoch": 0.7189385912378495, "percentage": 71.9, "elapsed_time": "1 day, 0:39:10", "remaining_time": "9:38:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7804, "total_steps": 10853, "loss": 0.1341, "learning_rate": 1.0035527599262988e-06, "epoch": 0.7190307274151195, "percentage": 71.91, "elapsed_time": "1 day, 0:39:21", "remaining_time": "9:37:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7805, "total_steps": 10853, "loss": 0.1309, "learning_rate": 1.0029425926643035e-06, "epoch": 0.7191228635923895, "percentage": 71.92, "elapsed_time": "1 day, 0:39:32", "remaining_time": "9:37:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7806, "total_steps": 10853, "loss": 0.1228, "learning_rate": 1.0023325644042508e-06, "epoch": 0.7192149997696595, "percentage": 71.92, "elapsed_time": "1 day, 0:39:42", "remaining_time": "9:37:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7807, "total_steps": 10853, "loss": 0.1173, "learning_rate": 1.0017226752027798e-06, "epoch": 0.7193071359469295, "percentage": 71.93, "elapsed_time": "1 day, 0:39:52", "remaining_time": "9:37:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7808, "total_steps": 10853, "loss": 0.1264, "learning_rate": 1.0011129251165198e-06, "epoch": 0.7193992721241995, "percentage": 71.94, "elapsed_time": "1 day, 0:40:04", "remaining_time": "9:37:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7809, "total_steps": 10853, "loss": 0.1195, "learning_rate": 1.0005033142020868e-06, "epoch": 0.7194914083014696, "percentage": 71.95, "elapsed_time": "1 day, 0:40:15", "remaining_time": "9:37:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7810, "total_steps": 10853, "loss": 0.1127, "learning_rate": 9.998938425160822e-07, "epoch": 0.7195835444787396, "percentage": 71.96, "elapsed_time": "1 day, 0:40:27", "remaining_time": "9:36:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7811, "total_steps": 10853, "loss": 0.1177, "learning_rate": 9.992845101150949e-07, "epoch": 0.7196756806560096, "percentage": 71.97, "elapsed_time": "1 day, 0:40:38", "remaining_time": "9:36:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7812, "total_steps": 10853, "loss": 0.1272, "learning_rate": 9.986753170557026e-07, "epoch": 0.7197678168332796, "percentage": 71.98, "elapsed_time": "1 day, 0:40:49", "remaining_time": "9:36:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7813, "total_steps": 10853, "loss": 0.1306, "learning_rate": 9.980662633944687e-07, "epoch": 0.7198599530105496, "percentage": 71.99, "elapsed_time": "1 day, 0:40:58", "remaining_time": "9:36:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7814, "total_steps": 10853, "loss": 0.1187, "learning_rate": 9.974573491879447e-07, "epoch": 0.7199520891878196, "percentage": 72.0, "elapsed_time": "1 day, 0:41:10", "remaining_time": "9:36:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7815, "total_steps": 10853, "loss": 0.1422, "learning_rate": 9.968485744926673e-07, "epoch": 0.7200442253650896, "percentage": 72.01, "elapsed_time": "1 day, 0:41:21", "remaining_time": "9:35:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7816, "total_steps": 10853, "loss": 0.1283, "learning_rate": 9.962399393651608e-07, "epoch": 0.7201363615423596, "percentage": 72.02, "elapsed_time": "1 day, 0:41:32", "remaining_time": "9:35:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7817, "total_steps": 10853, "loss": 0.1113, "learning_rate": 9.95631443861938e-07, "epoch": 0.7202284977196296, "percentage": 72.03, "elapsed_time": "1 day, 0:41:42", "remaining_time": "9:35:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7818, "total_steps": 10853, "loss": 0.1239, "learning_rate": 9.95023088039498e-07, "epoch": 0.7203206338968996, "percentage": 72.04, "elapsed_time": "1 day, 0:41:53", "remaining_time": "9:35:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7819, "total_steps": 10853, "loss": 0.1211, "learning_rate": 9.94414871954326e-07, "epoch": 0.7204127700741696, "percentage": 72.04, "elapsed_time": "1 day, 0:42:04", "remaining_time": "9:35:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7820, "total_steps": 10853, "loss": 0.1275, "learning_rate": 9.938067956628955e-07, "epoch": 0.7205049062514396, "percentage": 72.05, "elapsed_time": "1 day, 0:42:15", "remaining_time": "9:34:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7821, "total_steps": 10853, "loss": 0.1234, "learning_rate": 9.931988592216654e-07, "epoch": 0.7205970424287096, "percentage": 72.06, "elapsed_time": "1 day, 0:42:26", "remaining_time": "9:34:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7822, "total_steps": 10853, "loss": 0.1247, "learning_rate": 9.925910626870841e-07, "epoch": 0.7206891786059796, "percentage": 72.07, "elapsed_time": "1 day, 0:42:37", "remaining_time": "9:34:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7823, "total_steps": 10853, "loss": 0.1403, "learning_rate": 9.919834061155841e-07, "epoch": 0.7207813147832497, "percentage": 72.08, "elapsed_time": "1 day, 0:42:48", "remaining_time": "9:34:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7824, "total_steps": 10853, "loss": 0.1207, "learning_rate": 9.913758895635872e-07, "epoch": 0.7208734509605197, "percentage": 72.09, "elapsed_time": "1 day, 0:42:58", "remaining_time": "9:34:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7825, "total_steps": 10853, "loss": 0.1305, "learning_rate": 9.907685130875022e-07, "epoch": 0.7209655871377897, "percentage": 72.1, "elapsed_time": "1 day, 0:43:09", "remaining_time": "9:33:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7826, "total_steps": 10853, "loss": 0.1322, "learning_rate": 9.901612767437233e-07, "epoch": 0.7210577233150597, "percentage": 72.11, "elapsed_time": "1 day, 0:43:21", "remaining_time": "9:33:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7827, "total_steps": 10853, "loss": 0.126, "learning_rate": 9.89554180588631e-07, "epoch": 0.7211498594923297, "percentage": 72.12, "elapsed_time": "1 day, 0:43:31", "remaining_time": "9:33:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7828, "total_steps": 10853, "loss": 0.1259, "learning_rate": 9.889472246785962e-07, "epoch": 0.7212419956695997, "percentage": 72.13, "elapsed_time": "1 day, 0:43:41", "remaining_time": "9:33:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7829, "total_steps": 10853, "loss": 0.123, "learning_rate": 9.883404090699739e-07, "epoch": 0.7213341318468697, "percentage": 72.14, "elapsed_time": "1 day, 0:43:51", "remaining_time": "9:33:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7830, "total_steps": 10853, "loss": 0.1255, "learning_rate": 9.877337338191081e-07, "epoch": 0.7214262680241397, "percentage": 72.15, "elapsed_time": "1 day, 0:44:01", "remaining_time": "9:32:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7831, "total_steps": 10853, "loss": 0.1257, "learning_rate": 9.871271989823279e-07, "epoch": 0.7215184042014097, "percentage": 72.16, "elapsed_time": "1 day, 0:44:12", "remaining_time": "9:32:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7832, "total_steps": 10853, "loss": 0.1222, "learning_rate": 9.865208046159493e-07, "epoch": 0.7216105403786797, "percentage": 72.16, "elapsed_time": "1 day, 0:44:22", "remaining_time": "9:32:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7833, "total_steps": 10853, "loss": 0.1315, "learning_rate": 9.85914550776277e-07, "epoch": 0.7217026765559497, "percentage": 72.17, "elapsed_time": "1 day, 0:44:33", "remaining_time": "9:32:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7834, "total_steps": 10853, "loss": 0.1376, "learning_rate": 9.853084375196013e-07, "epoch": 0.7217948127332197, "percentage": 72.18, "elapsed_time": "1 day, 0:44:46", "remaining_time": "9:32:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7835, "total_steps": 10853, "loss": 0.1134, "learning_rate": 9.847024649022014e-07, "epoch": 0.7218869489104897, "percentage": 72.19, "elapsed_time": "1 day, 0:44:55", "remaining_time": "9:31:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7836, "total_steps": 10853, "loss": 0.1229, "learning_rate": 9.840966329803404e-07, "epoch": 0.7219790850877598, "percentage": 72.2, "elapsed_time": "1 day, 0:45:05", "remaining_time": "9:31:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7837, "total_steps": 10853, "loss": 0.1241, "learning_rate": 9.834909418102694e-07, "epoch": 0.7220712212650298, "percentage": 72.21, "elapsed_time": "1 day, 0:45:15", "remaining_time": "9:31:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7838, "total_steps": 10853, "loss": 0.1148, "learning_rate": 9.828853914482276e-07, "epoch": 0.7221633574422998, "percentage": 72.22, "elapsed_time": "1 day, 0:45:26", "remaining_time": "9:31:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7839, "total_steps": 10853, "loss": 0.1161, "learning_rate": 9.822799819504413e-07, "epoch": 0.7222554936195698, "percentage": 72.23, "elapsed_time": "1 day, 0:45:38", "remaining_time": "9:31:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7840, "total_steps": 10853, "loss": 0.1116, "learning_rate": 9.816747133731213e-07, "epoch": 0.7223476297968398, "percentage": 72.24, "elapsed_time": "1 day, 0:45:49", "remaining_time": "9:31:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7841, "total_steps": 10853, "loss": 0.1177, "learning_rate": 9.810695857724685e-07, "epoch": 0.7224397659741097, "percentage": 72.25, "elapsed_time": "1 day, 0:45:59", "remaining_time": "9:30:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7842, "total_steps": 10853, "loss": 0.1274, "learning_rate": 9.80464599204667e-07, "epoch": 0.7225319021513797, "percentage": 72.26, "elapsed_time": "1 day, 0:46:12", "remaining_time": "9:30:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7843, "total_steps": 10853, "loss": 0.118, "learning_rate": 9.798597537258921e-07, "epoch": 0.7226240383286497, "percentage": 72.27, "elapsed_time": "1 day, 0:46:23", "remaining_time": "9:30:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7844, "total_steps": 10853, "loss": 0.1253, "learning_rate": 9.79255049392302e-07, "epoch": 0.7227161745059197, "percentage": 72.27, "elapsed_time": "1 day, 0:46:35", "remaining_time": "9:30:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7845, "total_steps": 10853, "loss": 0.1185, "learning_rate": 9.78650486260044e-07, "epoch": 0.7228083106831897, "percentage": 72.28, "elapsed_time": "1 day, 0:46:44", "remaining_time": "9:30:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7846, "total_steps": 10853, "loss": 0.1191, "learning_rate": 9.78046064385253e-07, "epoch": 0.7229004468604597, "percentage": 72.29, "elapsed_time": "1 day, 0:46:54", "remaining_time": "9:29:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7847, "total_steps": 10853, "loss": 0.1203, "learning_rate": 9.774417838240485e-07, "epoch": 0.7229925830377297, "percentage": 72.3, "elapsed_time": "1 day, 0:47:04", "remaining_time": "9:29:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7848, "total_steps": 10853, "loss": 0.1163, "learning_rate": 9.768376446325376e-07, "epoch": 0.7230847192149997, "percentage": 72.31, "elapsed_time": "1 day, 0:47:16", "remaining_time": "9:29:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7849, "total_steps": 10853, "loss": 0.1151, "learning_rate": 9.762336468668151e-07, "epoch": 0.7231768553922697, "percentage": 72.32, "elapsed_time": "1 day, 0:47:27", "remaining_time": "9:29:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7850, "total_steps": 10853, "loss": 0.111, "learning_rate": 9.756297905829627e-07, "epoch": 0.7232689915695398, "percentage": 72.33, "elapsed_time": "1 day, 0:47:37", "remaining_time": "9:29:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7851, "total_steps": 10853, "loss": 0.1085, "learning_rate": 9.75026075837049e-07, "epoch": 0.7233611277468098, "percentage": 72.34, "elapsed_time": "1 day, 0:47:47", "remaining_time": "9:28:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7852, "total_steps": 10853, "loss": 0.125, "learning_rate": 9.744225026851284e-07, "epoch": 0.7234532639240798, "percentage": 72.35, "elapsed_time": "1 day, 0:47:58", "remaining_time": "9:28:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7853, "total_steps": 10853, "loss": 0.1143, "learning_rate": 9.738190711832415e-07, "epoch": 0.7235454001013498, "percentage": 72.36, "elapsed_time": "1 day, 0:48:09", "remaining_time": "9:28:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7854, "total_steps": 10853, "loss": 0.1284, "learning_rate": 9.732157813874185e-07, "epoch": 0.7236375362786198, "percentage": 72.37, "elapsed_time": "1 day, 0:48:20", "remaining_time": "9:28:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7855, "total_steps": 10853, "loss": 0.1117, "learning_rate": 9.72612633353675e-07, "epoch": 0.7237296724558898, "percentage": 72.38, "elapsed_time": "1 day, 0:48:32", "remaining_time": "9:28:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7856, "total_steps": 10853, "loss": 0.1122, "learning_rate": 9.720096271380122e-07, "epoch": 0.7238218086331598, "percentage": 72.39, "elapsed_time": "1 day, 0:48:42", "remaining_time": "9:27:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7857, "total_steps": 10853, "loss": 0.1265, "learning_rate": 9.714067627964199e-07, "epoch": 0.7239139448104298, "percentage": 72.39, "elapsed_time": "1 day, 0:48:52", "remaining_time": "9:27:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7858, "total_steps": 10853, "loss": 0.1265, "learning_rate": 9.708040403848752e-07, "epoch": 0.7240060809876998, "percentage": 72.4, "elapsed_time": "1 day, 0:49:03", "remaining_time": "9:27:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7859, "total_steps": 10853, "loss": 0.1134, "learning_rate": 9.70201459959339e-07, "epoch": 0.7240982171649698, "percentage": 72.41, "elapsed_time": "1 day, 0:49:15", "remaining_time": "9:27:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7860, "total_steps": 10853, "loss": 0.1183, "learning_rate": 9.695990215757625e-07, "epoch": 0.7241903533422398, "percentage": 72.42, "elapsed_time": "1 day, 0:49:26", "remaining_time": "9:27:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7861, "total_steps": 10853, "loss": 0.1205, "learning_rate": 9.689967252900809e-07, "epoch": 0.7242824895195098, "percentage": 72.43, "elapsed_time": "1 day, 0:49:36", "remaining_time": "9:26:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7862, "total_steps": 10853, "loss": 0.1195, "learning_rate": 9.683945711582181e-07, "epoch": 0.7243746256967798, "percentage": 72.44, "elapsed_time": "1 day, 0:49:46", "remaining_time": "9:26:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7863, "total_steps": 10853, "loss": 0.1353, "learning_rate": 9.677925592360851e-07, "epoch": 0.7244667618740498, "percentage": 72.45, "elapsed_time": "1 day, 0:49:56", "remaining_time": "9:26:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7864, "total_steps": 10853, "loss": 0.1206, "learning_rate": 9.671906895795779e-07, "epoch": 0.7245588980513199, "percentage": 72.46, "elapsed_time": "1 day, 0:50:06", "remaining_time": "9:26:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7865, "total_steps": 10853, "loss": 0.1356, "learning_rate": 9.665889622445792e-07, "epoch": 0.7246510342285899, "percentage": 72.47, "elapsed_time": "1 day, 0:50:16", "remaining_time": "9:26:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7866, "total_steps": 10853, "loss": 0.121, "learning_rate": 9.659873772869601e-07, "epoch": 0.7247431704058599, "percentage": 72.48, "elapsed_time": "1 day, 0:50:26", "remaining_time": "9:25:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7867, "total_steps": 10853, "loss": 0.1267, "learning_rate": 9.653859347625786e-07, "epoch": 0.7248353065831299, "percentage": 72.49, "elapsed_time": "1 day, 0:50:38", "remaining_time": "9:25:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7868, "total_steps": 10853, "loss": 0.1128, "learning_rate": 9.647846347272788e-07, "epoch": 0.7249274427603999, "percentage": 72.5, "elapsed_time": "1 day, 0:50:50", "remaining_time": "9:25:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7869, "total_steps": 10853, "loss": 0.1276, "learning_rate": 9.64183477236891e-07, "epoch": 0.7250195789376699, "percentage": 72.51, "elapsed_time": "1 day, 0:51:00", "remaining_time": "9:25:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7870, "total_steps": 10853, "loss": 0.1354, "learning_rate": 9.635824623472317e-07, "epoch": 0.7251117151149399, "percentage": 72.51, "elapsed_time": "1 day, 0:51:11", "remaining_time": "9:25:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7871, "total_steps": 10853, "loss": 0.1242, "learning_rate": 9.629815901141062e-07, "epoch": 0.7252038512922099, "percentage": 72.52, "elapsed_time": "1 day, 0:51:21", "remaining_time": "9:25:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7872, "total_steps": 10853, "loss": 0.1182, "learning_rate": 9.623808605933063e-07, "epoch": 0.7252959874694799, "percentage": 72.53, "elapsed_time": "1 day, 0:51:32", "remaining_time": "9:24:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7873, "total_steps": 10853, "loss": 0.1125, "learning_rate": 9.617802738406082e-07, "epoch": 0.7253881236467499, "percentage": 72.54, "elapsed_time": "1 day, 0:51:43", "remaining_time": "9:24:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7874, "total_steps": 10853, "loss": 0.1193, "learning_rate": 9.611798299117778e-07, "epoch": 0.7254802598240199, "percentage": 72.55, "elapsed_time": "1 day, 0:51:52", "remaining_time": "9:24:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7875, "total_steps": 10853, "loss": 0.118, "learning_rate": 9.605795288625652e-07, "epoch": 0.7255723960012899, "percentage": 72.56, "elapsed_time": "1 day, 0:52:03", "remaining_time": "9:24:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7876, "total_steps": 10853, "loss": 0.1302, "learning_rate": 9.599793707487098e-07, "epoch": 0.7256645321785599, "percentage": 72.57, "elapsed_time": "1 day, 0:52:13", "remaining_time": "9:24:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7877, "total_steps": 10853, "loss": 0.1216, "learning_rate": 9.593793556259347e-07, "epoch": 0.72575666835583, "percentage": 72.58, "elapsed_time": "1 day, 0:52:23", "remaining_time": "9:23:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7878, "total_steps": 10853, "loss": 0.1231, "learning_rate": 9.587794835499523e-07, "epoch": 0.7258488045331, "percentage": 72.59, "elapsed_time": "1 day, 0:52:34", "remaining_time": "9:23:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7879, "total_steps": 10853, "loss": 0.1155, "learning_rate": 9.581797545764614e-07, "epoch": 0.72594094071037, "percentage": 72.6, "elapsed_time": "1 day, 0:52:45", "remaining_time": "9:23:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7880, "total_steps": 10853, "loss": 0.1185, "learning_rate": 9.575801687611464e-07, "epoch": 0.72603307688764, "percentage": 72.61, "elapsed_time": "1 day, 0:52:56", "remaining_time": "9:23:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7881, "total_steps": 10853, "loss": 0.1298, "learning_rate": 9.569807261596779e-07, "epoch": 0.72612521306491, "percentage": 72.62, "elapsed_time": "1 day, 0:53:06", "remaining_time": "9:23:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7882, "total_steps": 10853, "loss": 0.1248, "learning_rate": 9.56381426827715e-07, "epoch": 0.72621734924218, "percentage": 72.63, "elapsed_time": "1 day, 0:53:18", "remaining_time": "9:22:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7883, "total_steps": 10853, "loss": 0.1295, "learning_rate": 9.557822708209025e-07, "epoch": 0.72630948541945, "percentage": 72.63, "elapsed_time": "1 day, 0:53:28", "remaining_time": "9:22:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7884, "total_steps": 10853, "loss": 0.1181, "learning_rate": 9.551832581948733e-07, "epoch": 0.72640162159672, "percentage": 72.64, "elapsed_time": "1 day, 0:53:38", "remaining_time": "9:22:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7885, "total_steps": 10853, "loss": 0.1184, "learning_rate": 9.54584389005245e-07, "epoch": 0.72649375777399, "percentage": 72.65, "elapsed_time": "1 day, 0:53:49", "remaining_time": "9:22:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7886, "total_steps": 10853, "loss": 0.1144, "learning_rate": 9.539856633076217e-07, "epoch": 0.7265858939512599, "percentage": 72.66, "elapsed_time": "1 day, 0:54:00", "remaining_time": "9:22:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7887, "total_steps": 10853, "loss": 0.1206, "learning_rate": 9.533870811575957e-07, "epoch": 0.7266780301285299, "percentage": 72.67, "elapsed_time": "1 day, 0:54:10", "remaining_time": "9:21:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7888, "total_steps": 10853, "loss": 0.132, "learning_rate": 9.527886426107458e-07, "epoch": 0.7267701663057999, "percentage": 72.68, "elapsed_time": "1 day, 0:54:20", "remaining_time": "9:21:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7889, "total_steps": 10853, "loss": 0.1217, "learning_rate": 9.52190347722638e-07, "epoch": 0.7268623024830699, "percentage": 72.69, "elapsed_time": "1 day, 0:54:31", "remaining_time": "9:21:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7890, "total_steps": 10853, "loss": 0.1214, "learning_rate": 9.515921965488226e-07, "epoch": 0.7269544386603399, "percentage": 72.7, "elapsed_time": "1 day, 0:54:42", "remaining_time": "9:21:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7891, "total_steps": 10853, "loss": 0.113, "learning_rate": 9.509941891448376e-07, "epoch": 0.72704657483761, "percentage": 72.71, "elapsed_time": "1 day, 0:54:54", "remaining_time": "9:21:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7892, "total_steps": 10853, "loss": 0.1235, "learning_rate": 9.503963255662091e-07, "epoch": 0.72713871101488, "percentage": 72.72, "elapsed_time": "1 day, 0:55:06", "remaining_time": "9:20:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7893, "total_steps": 10853, "loss": 0.124, "learning_rate": 9.497986058684491e-07, "epoch": 0.72723084719215, "percentage": 72.73, "elapsed_time": "1 day, 0:55:18", "remaining_time": "9:20:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7894, "total_steps": 10853, "loss": 0.123, "learning_rate": 9.492010301070548e-07, "epoch": 0.72732298336942, "percentage": 72.74, "elapsed_time": "1 day, 0:55:30", "remaining_time": "9:20:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7895, "total_steps": 10853, "loss": 0.1203, "learning_rate": 9.486035983375125e-07, "epoch": 0.72741511954669, "percentage": 72.74, "elapsed_time": "1 day, 0:55:40", "remaining_time": "9:20:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7896, "total_steps": 10853, "loss": 0.1061, "learning_rate": 9.48006310615292e-07, "epoch": 0.72750725572396, "percentage": 72.75, "elapsed_time": "1 day, 0:55:52", "remaining_time": "9:20:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7897, "total_steps": 10853, "loss": 0.1166, "learning_rate": 9.474091669958538e-07, "epoch": 0.72759939190123, "percentage": 72.76, "elapsed_time": "1 day, 0:56:02", "remaining_time": "9:20:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7898, "total_steps": 10853, "loss": 0.1117, "learning_rate": 9.468121675346406e-07, "epoch": 0.7276915280785, "percentage": 72.77, "elapsed_time": "1 day, 0:56:13", "remaining_time": "9:19:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7899, "total_steps": 10853, "loss": 0.1227, "learning_rate": 9.462153122870846e-07, "epoch": 0.72778366425577, "percentage": 72.78, "elapsed_time": "1 day, 0:56:25", "remaining_time": "9:19:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7900, "total_steps": 10853, "loss": 0.1275, "learning_rate": 9.456186013086049e-07, "epoch": 0.72787580043304, "percentage": 72.79, "elapsed_time": "1 day, 0:56:36", "remaining_time": "9:19:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7901, "total_steps": 10853, "loss": 0.1252, "learning_rate": 9.450220346546057e-07, "epoch": 0.72796793661031, "percentage": 72.8, "elapsed_time": "1 day, 0:56:47", "remaining_time": "9:19:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7902, "total_steps": 10853, "loss": 0.1342, "learning_rate": 9.444256123804768e-07, "epoch": 0.72806007278758, "percentage": 72.81, "elapsed_time": "1 day, 0:56:57", "remaining_time": "9:19:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7903, "total_steps": 10853, "loss": 0.1233, "learning_rate": 9.438293345415972e-07, "epoch": 0.72815220896485, "percentage": 72.82, "elapsed_time": "1 day, 0:57:08", "remaining_time": "9:18:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7904, "total_steps": 10853, "loss": 0.119, "learning_rate": 9.432332011933315e-07, "epoch": 0.7282443451421201, "percentage": 72.83, "elapsed_time": "1 day, 0:57:20", "remaining_time": "9:18:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7905, "total_steps": 10853, "loss": 0.1209, "learning_rate": 9.426372123910313e-07, "epoch": 0.7283364813193901, "percentage": 72.84, "elapsed_time": "1 day, 0:57:32", "remaining_time": "9:18:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7906, "total_steps": 10853, "loss": 0.1126, "learning_rate": 9.420413681900337e-07, "epoch": 0.7284286174966601, "percentage": 72.85, "elapsed_time": "1 day, 0:57:42", "remaining_time": "9:18:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7907, "total_steps": 10853, "loss": 0.1184, "learning_rate": 9.414456686456619e-07, "epoch": 0.7285207536739301, "percentage": 72.86, "elapsed_time": "1 day, 0:57:53", "remaining_time": "9:18:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7908, "total_steps": 10853, "loss": 0.1154, "learning_rate": 9.408501138132273e-07, "epoch": 0.7286128898512001, "percentage": 72.86, "elapsed_time": "1 day, 0:58:02", "remaining_time": "9:17:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7909, "total_steps": 10853, "loss": 0.1241, "learning_rate": 9.402547037480284e-07, "epoch": 0.7287050260284701, "percentage": 72.87, "elapsed_time": "1 day, 0:58:12", "remaining_time": "9:17:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7910, "total_steps": 10853, "loss": 0.1188, "learning_rate": 9.396594385053473e-07, "epoch": 0.7287971622057401, "percentage": 72.88, "elapsed_time": "1 day, 0:58:23", "remaining_time": "9:17:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7911, "total_steps": 10853, "loss": 0.1157, "learning_rate": 9.39064318140456e-07, "epoch": 0.7288892983830101, "percentage": 72.89, "elapsed_time": "1 day, 0:58:34", "remaining_time": "9:17:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7912, "total_steps": 10853, "loss": 0.1129, "learning_rate": 9.3846934270861e-07, "epoch": 0.7289814345602801, "percentage": 72.9, "elapsed_time": "1 day, 0:58:45", "remaining_time": "9:17:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7913, "total_steps": 10853, "loss": 0.0989, "learning_rate": 9.378745122650545e-07, "epoch": 0.7290735707375501, "percentage": 72.91, "elapsed_time": "1 day, 0:58:54", "remaining_time": "9:16:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7914, "total_steps": 10853, "loss": 0.128, "learning_rate": 9.372798268650177e-07, "epoch": 0.7291657069148201, "percentage": 72.92, "elapsed_time": "1 day, 0:59:05", "remaining_time": "9:16:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7915, "total_steps": 10853, "loss": 0.1119, "learning_rate": 9.366852865637171e-07, "epoch": 0.7292578430920901, "percentage": 72.93, "elapsed_time": "1 day, 0:59:15", "remaining_time": "9:16:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7916, "total_steps": 10853, "loss": 0.1165, "learning_rate": 9.360908914163569e-07, "epoch": 0.7293499792693601, "percentage": 72.94, "elapsed_time": "1 day, 0:59:26", "remaining_time": "9:16:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7917, "total_steps": 10853, "loss": 0.1151, "learning_rate": 9.354966414781247e-07, "epoch": 0.7294421154466301, "percentage": 72.95, "elapsed_time": "1 day, 0:59:37", "remaining_time": "9:16:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7918, "total_steps": 10853, "loss": 0.1299, "learning_rate": 9.349025368041989e-07, "epoch": 0.7295342516239002, "percentage": 72.96, "elapsed_time": "1 day, 0:59:48", "remaining_time": "9:15:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7919, "total_steps": 10853, "loss": 0.1303, "learning_rate": 9.343085774497399e-07, "epoch": 0.7296263878011702, "percentage": 72.97, "elapsed_time": "1 day, 0:59:59", "remaining_time": "9:15:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7920, "total_steps": 10853, "loss": 0.1114, "learning_rate": 9.337147634698979e-07, "epoch": 0.7297185239784402, "percentage": 72.98, "elapsed_time": "1 day, 1:00:11", "remaining_time": "9:15:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7921, "total_steps": 10853, "loss": 0.1186, "learning_rate": 9.331210949198097e-07, "epoch": 0.7298106601557102, "percentage": 72.98, "elapsed_time": "1 day, 1:00:21", "remaining_time": "9:15:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7922, "total_steps": 10853, "loss": 0.1175, "learning_rate": 9.325275718545962e-07, "epoch": 0.7299027963329802, "percentage": 72.99, "elapsed_time": "1 day, 1:00:32", "remaining_time": "9:15:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7923, "total_steps": 10853, "loss": 0.1143, "learning_rate": 9.319341943293659e-07, "epoch": 0.7299949325102502, "percentage": 73.0, "elapsed_time": "1 day, 1:00:44", "remaining_time": "9:14:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7924, "total_steps": 10853, "loss": 0.1131, "learning_rate": 9.31340962399214e-07, "epoch": 0.7300870686875202, "percentage": 73.01, "elapsed_time": "1 day, 1:00:54", "remaining_time": "9:14:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7925, "total_steps": 10853, "loss": 0.1215, "learning_rate": 9.307478761192229e-07, "epoch": 0.7301792048647902, "percentage": 73.02, "elapsed_time": "1 day, 1:01:06", "remaining_time": "9:14:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7926, "total_steps": 10853, "loss": 0.1148, "learning_rate": 9.301549355444611e-07, "epoch": 0.7302713410420602, "percentage": 73.03, "elapsed_time": "1 day, 1:01:17", "remaining_time": "9:14:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7927, "total_steps": 10853, "loss": 0.1234, "learning_rate": 9.295621407299824e-07, "epoch": 0.7303634772193301, "percentage": 73.04, "elapsed_time": "1 day, 1:01:26", "remaining_time": "9:14:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7928, "total_steps": 10853, "loss": 0.1241, "learning_rate": 9.289694917308273e-07, "epoch": 0.7304556133966001, "percentage": 73.05, "elapsed_time": "1 day, 1:01:39", "remaining_time": "9:14:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7929, "total_steps": 10853, "loss": 0.1211, "learning_rate": 9.283769886020238e-07, "epoch": 0.7305477495738701, "percentage": 73.06, "elapsed_time": "1 day, 1:01:49", "remaining_time": "9:13:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7930, "total_steps": 10853, "loss": 0.1112, "learning_rate": 9.277846313985869e-07, "epoch": 0.7306398857511401, "percentage": 73.07, "elapsed_time": "1 day, 1:01:58", "remaining_time": "9:13:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7931, "total_steps": 10853, "loss": 0.1291, "learning_rate": 9.271924201755153e-07, "epoch": 0.7307320219284101, "percentage": 73.08, "elapsed_time": "1 day, 1:02:09", "remaining_time": "9:13:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7932, "total_steps": 10853, "loss": 0.1146, "learning_rate": 9.26600354987797e-07, "epoch": 0.7308241581056802, "percentage": 73.09, "elapsed_time": "1 day, 1:02:19", "remaining_time": "9:13:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7933, "total_steps": 10853, "loss": 0.1253, "learning_rate": 9.260084358904056e-07, "epoch": 0.7309162942829502, "percentage": 73.09, "elapsed_time": "1 day, 1:02:30", "remaining_time": "9:13:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7934, "total_steps": 10853, "loss": 0.118, "learning_rate": 9.254166629383005e-07, "epoch": 0.7310084304602202, "percentage": 73.1, "elapsed_time": "1 day, 1:02:40", "remaining_time": "9:12:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7935, "total_steps": 10853, "loss": 0.1155, "learning_rate": 9.24825036186427e-07, "epoch": 0.7311005666374902, "percentage": 73.11, "elapsed_time": "1 day, 1:02:52", "remaining_time": "9:12:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7936, "total_steps": 10853, "loss": 0.125, "learning_rate": 9.242335556897181e-07, "epoch": 0.7311927028147602, "percentage": 73.12, "elapsed_time": "1 day, 1:03:03", "remaining_time": "9:12:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7937, "total_steps": 10853, "loss": 0.1071, "learning_rate": 9.236422215030932e-07, "epoch": 0.7312848389920302, "percentage": 73.13, "elapsed_time": "1 day, 1:03:12", "remaining_time": "9:12:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7938, "total_steps": 10853, "loss": 0.1308, "learning_rate": 9.230510336814586e-07, "epoch": 0.7313769751693002, "percentage": 73.14, "elapsed_time": "1 day, 1:03:23", "remaining_time": "9:12:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7939, "total_steps": 10853, "loss": 0.1254, "learning_rate": 9.224599922797053e-07, "epoch": 0.7314691113465702, "percentage": 73.15, "elapsed_time": "1 day, 1:03:34", "remaining_time": "9:11:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7940, "total_steps": 10853, "loss": 0.1145, "learning_rate": 9.218690973527106e-07, "epoch": 0.7315612475238402, "percentage": 73.16, "elapsed_time": "1 day, 1:03:44", "remaining_time": "9:11:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7941, "total_steps": 10853, "loss": 0.1336, "learning_rate": 9.212783489553401e-07, "epoch": 0.7316533837011102, "percentage": 73.17, "elapsed_time": "1 day, 1:03:55", "remaining_time": "9:11:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7942, "total_steps": 10853, "loss": 0.1341, "learning_rate": 9.206877471424455e-07, "epoch": 0.7317455198783802, "percentage": 73.18, "elapsed_time": "1 day, 1:04:06", "remaining_time": "9:11:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7943, "total_steps": 10853, "loss": 0.1216, "learning_rate": 9.200972919688628e-07, "epoch": 0.7318376560556502, "percentage": 73.19, "elapsed_time": "1 day, 1:04:16", "remaining_time": "9:11:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7944, "total_steps": 10853, "loss": 0.1232, "learning_rate": 9.195069834894174e-07, "epoch": 0.7319297922329202, "percentage": 73.2, "elapsed_time": "1 day, 1:04:25", "remaining_time": "9:10:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7945, "total_steps": 10853, "loss": 0.1208, "learning_rate": 9.189168217589178e-07, "epoch": 0.7320219284101903, "percentage": 73.21, "elapsed_time": "1 day, 1:04:35", "remaining_time": "9:10:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7946, "total_steps": 10853, "loss": 0.1156, "learning_rate": 9.183268068321616e-07, "epoch": 0.7321140645874603, "percentage": 73.21, "elapsed_time": "1 day, 1:04:47", "remaining_time": "9:10:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7947, "total_steps": 10853, "loss": 0.1082, "learning_rate": 9.177369387639323e-07, "epoch": 0.7322062007647303, "percentage": 73.22, "elapsed_time": "1 day, 1:04:58", "remaining_time": "9:10:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7948, "total_steps": 10853, "loss": 0.1116, "learning_rate": 9.171472176089977e-07, "epoch": 0.7322983369420003, "percentage": 73.23, "elapsed_time": "1 day, 1:05:09", "remaining_time": "9:10:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7949, "total_steps": 10853, "loss": 0.1304, "learning_rate": 9.165576434221152e-07, "epoch": 0.7323904731192703, "percentage": 73.24, "elapsed_time": "1 day, 1:05:19", "remaining_time": "9:09:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7950, "total_steps": 10853, "loss": 0.11, "learning_rate": 9.15968216258025e-07, "epoch": 0.7324826092965403, "percentage": 73.25, "elapsed_time": "1 day, 1:05:30", "remaining_time": "9:09:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7951, "total_steps": 10853, "loss": 0.1214, "learning_rate": 9.153789361714573e-07, "epoch": 0.7325747454738103, "percentage": 73.26, "elapsed_time": "1 day, 1:05:41", "remaining_time": "9:09:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7952, "total_steps": 10853, "loss": 0.1265, "learning_rate": 9.147898032171251e-07, "epoch": 0.7326668816510803, "percentage": 73.27, "elapsed_time": "1 day, 1:05:51", "remaining_time": "9:09:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7953, "total_steps": 10853, "loss": 0.1164, "learning_rate": 9.142008174497302e-07, "epoch": 0.7327590178283503, "percentage": 73.28, "elapsed_time": "1 day, 1:06:03", "remaining_time": "9:09:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7954, "total_steps": 10853, "loss": 0.1167, "learning_rate": 9.136119789239612e-07, "epoch": 0.7328511540056203, "percentage": 73.29, "elapsed_time": "1 day, 1:06:13", "remaining_time": "9:08:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7955, "total_steps": 10853, "loss": 0.1242, "learning_rate": 9.130232876944903e-07, "epoch": 0.7329432901828903, "percentage": 73.3, "elapsed_time": "1 day, 1:06:25", "remaining_time": "9:08:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7956, "total_steps": 10853, "loss": 0.1272, "learning_rate": 9.124347438159772e-07, "epoch": 0.7330354263601603, "percentage": 73.31, "elapsed_time": "1 day, 1:06:36", "remaining_time": "9:08:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7957, "total_steps": 10853, "loss": 0.1247, "learning_rate": 9.118463473430689e-07, "epoch": 0.7331275625374303, "percentage": 73.32, "elapsed_time": "1 day, 1:06:46", "remaining_time": "9:08:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7958, "total_steps": 10853, "loss": 0.1175, "learning_rate": 9.112580983303984e-07, "epoch": 0.7332196987147003, "percentage": 73.33, "elapsed_time": "1 day, 1:06:59", "remaining_time": "9:08:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7959, "total_steps": 10853, "loss": 0.121, "learning_rate": 9.106699968325849e-07, "epoch": 0.7333118348919704, "percentage": 73.33, "elapsed_time": "1 day, 1:07:11", "remaining_time": "9:08:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7960, "total_steps": 10853, "loss": 0.1317, "learning_rate": 9.100820429042337e-07, "epoch": 0.7334039710692404, "percentage": 73.34, "elapsed_time": "1 day, 1:07:22", "remaining_time": "9:07:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7961, "total_steps": 10853, "loss": 0.1193, "learning_rate": 9.094942365999349e-07, "epoch": 0.7334961072465104, "percentage": 73.35, "elapsed_time": "1 day, 1:07:33", "remaining_time": "9:07:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7962, "total_steps": 10853, "loss": 0.1299, "learning_rate": 9.089065779742673e-07, "epoch": 0.7335882434237804, "percentage": 73.36, "elapsed_time": "1 day, 1:07:44", "remaining_time": "9:07:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7963, "total_steps": 10853, "loss": 0.1145, "learning_rate": 9.083190670817963e-07, "epoch": 0.7336803796010504, "percentage": 73.37, "elapsed_time": "1 day, 1:07:55", "remaining_time": "9:07:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7964, "total_steps": 10853, "loss": 0.1143, "learning_rate": 9.0773170397707e-07, "epoch": 0.7337725157783204, "percentage": 73.38, "elapsed_time": "1 day, 1:08:07", "remaining_time": "9:07:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7965, "total_steps": 10853, "loss": 0.125, "learning_rate": 9.071444887146275e-07, "epoch": 0.7338646519555904, "percentage": 73.39, "elapsed_time": "1 day, 1:08:17", "remaining_time": "9:06:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7966, "total_steps": 10853, "loss": 0.1177, "learning_rate": 9.065574213489897e-07, "epoch": 0.7339567881328604, "percentage": 73.4, "elapsed_time": "1 day, 1:08:28", "remaining_time": "9:06:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7967, "total_steps": 10853, "loss": 0.1147, "learning_rate": 9.059705019346676e-07, "epoch": 0.7340489243101304, "percentage": 73.41, "elapsed_time": "1 day, 1:08:39", "remaining_time": "9:06:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7968, "total_steps": 10853, "loss": 0.117, "learning_rate": 9.053837305261551e-07, "epoch": 0.7341410604874004, "percentage": 73.42, "elapsed_time": "1 day, 1:08:47", "remaining_time": "9:06:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7969, "total_steps": 10853, "loss": 0.1014, "learning_rate": 9.047971071779349e-07, "epoch": 0.7342331966646704, "percentage": 73.43, "elapsed_time": "1 day, 1:08:58", "remaining_time": "9:06:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7970, "total_steps": 10853, "loss": 0.1282, "learning_rate": 9.042106319444757e-07, "epoch": 0.7343253328419403, "percentage": 73.44, "elapsed_time": "1 day, 1:09:09", "remaining_time": "9:05:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7971, "total_steps": 10853, "loss": 0.1172, "learning_rate": 9.036243048802312e-07, "epoch": 0.7344174690192103, "percentage": 73.45, "elapsed_time": "1 day, 1:09:20", "remaining_time": "9:05:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7972, "total_steps": 10853, "loss": 0.1143, "learning_rate": 9.030381260396409e-07, "epoch": 0.7345096051964805, "percentage": 73.45, "elapsed_time": "1 day, 1:09:30", "remaining_time": "9:05:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7973, "total_steps": 10853, "loss": 0.131, "learning_rate": 9.024520954771326e-07, "epoch": 0.7346017413737504, "percentage": 73.46, "elapsed_time": "1 day, 1:09:41", "remaining_time": "9:05:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7974, "total_steps": 10853, "loss": 0.1241, "learning_rate": 9.018662132471189e-07, "epoch": 0.7346938775510204, "percentage": 73.47, "elapsed_time": "1 day, 1:09:51", "remaining_time": "9:05:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7975, "total_steps": 10853, "loss": 0.1179, "learning_rate": 9.012804794040003e-07, "epoch": 0.7347860137282904, "percentage": 73.48, "elapsed_time": "1 day, 1:10:01", "remaining_time": "9:04:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7976, "total_steps": 10853, "loss": 0.121, "learning_rate": 9.006948940021612e-07, "epoch": 0.7348781499055604, "percentage": 73.49, "elapsed_time": "1 day, 1:10:12", "remaining_time": "9:04:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7977, "total_steps": 10853, "loss": 0.1145, "learning_rate": 9.001094570959726e-07, "epoch": 0.7349702860828304, "percentage": 73.5, "elapsed_time": "1 day, 1:10:22", "remaining_time": "9:04:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7978, "total_steps": 10853, "loss": 0.1219, "learning_rate": 8.995241687397929e-07, "epoch": 0.7350624222601004, "percentage": 73.51, "elapsed_time": "1 day, 1:10:32", "remaining_time": "9:04:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7979, "total_steps": 10853, "loss": 0.1294, "learning_rate": 8.989390289879665e-07, "epoch": 0.7351545584373704, "percentage": 73.52, "elapsed_time": "1 day, 1:10:42", "remaining_time": "9:04:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7980, "total_steps": 10853, "loss": 0.1242, "learning_rate": 8.983540378948244e-07, "epoch": 0.7352466946146404, "percentage": 73.53, "elapsed_time": "1 day, 1:10:53", "remaining_time": "9:03:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7981, "total_steps": 10853, "loss": 0.1137, "learning_rate": 8.977691955146823e-07, "epoch": 0.7353388307919104, "percentage": 73.54, "elapsed_time": "1 day, 1:11:04", "remaining_time": "9:03:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7982, "total_steps": 10853, "loss": 0.1279, "learning_rate": 8.971845019018419e-07, "epoch": 0.7354309669691804, "percentage": 73.55, "elapsed_time": "1 day, 1:11:14", "remaining_time": "9:03:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7983, "total_steps": 10853, "loss": 0.1302, "learning_rate": 8.965999571105929e-07, "epoch": 0.7355231031464504, "percentage": 73.56, "elapsed_time": "1 day, 1:11:25", "remaining_time": "9:03:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7984, "total_steps": 10853, "loss": 0.139, "learning_rate": 8.960155611952115e-07, "epoch": 0.7356152393237204, "percentage": 73.56, "elapsed_time": "1 day, 1:11:36", "remaining_time": "9:03:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7985, "total_steps": 10853, "loss": 0.1162, "learning_rate": 8.954313142099568e-07, "epoch": 0.7357073755009904, "percentage": 73.57, "elapsed_time": "1 day, 1:11:47", "remaining_time": "9:02:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7986, "total_steps": 10853, "loss": 0.1218, "learning_rate": 8.948472162090782e-07, "epoch": 0.7357995116782605, "percentage": 73.58, "elapsed_time": "1 day, 1:11:58", "remaining_time": "9:02:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7987, "total_steps": 10853, "loss": 0.1146, "learning_rate": 8.942632672468077e-07, "epoch": 0.7358916478555305, "percentage": 73.59, "elapsed_time": "1 day, 1:12:08", "remaining_time": "9:02:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7988, "total_steps": 10853, "loss": 0.1266, "learning_rate": 8.936794673773661e-07, "epoch": 0.7359837840328005, "percentage": 73.6, "elapsed_time": "1 day, 1:12:19", "remaining_time": "9:02:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7989, "total_steps": 10853, "loss": 0.1266, "learning_rate": 8.930958166549583e-07, "epoch": 0.7360759202100705, "percentage": 73.61, "elapsed_time": "1 day, 1:12:29", "remaining_time": "9:02:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7990, "total_steps": 10853, "loss": 0.1176, "learning_rate": 8.925123151337767e-07, "epoch": 0.7361680563873405, "percentage": 73.62, "elapsed_time": "1 day, 1:12:40", "remaining_time": "9:02:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7991, "total_steps": 10853, "loss": 0.1205, "learning_rate": 8.919289628680005e-07, "epoch": 0.7362601925646105, "percentage": 73.63, "elapsed_time": "1 day, 1:12:52", "remaining_time": "9:01:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7992, "total_steps": 10853, "loss": 0.1156, "learning_rate": 8.913457599117933e-07, "epoch": 0.7363523287418805, "percentage": 73.64, "elapsed_time": "1 day, 1:13:03", "remaining_time": "9:01:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7993, "total_steps": 10853, "loss": 0.1165, "learning_rate": 8.907627063193045e-07, "epoch": 0.7364444649191505, "percentage": 73.65, "elapsed_time": "1 day, 1:13:14", "remaining_time": "9:01:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7994, "total_steps": 10853, "loss": 0.1275, "learning_rate": 8.901798021446714e-07, "epoch": 0.7365366010964205, "percentage": 73.66, "elapsed_time": "1 day, 1:13:24", "remaining_time": "9:01:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7995, "total_steps": 10853, "loss": 0.1101, "learning_rate": 8.895970474420171e-07, "epoch": 0.7366287372736905, "percentage": 73.67, "elapsed_time": "1 day, 1:13:36", "remaining_time": "9:01:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7996, "total_steps": 10853, "loss": 0.1194, "learning_rate": 8.890144422654512e-07, "epoch": 0.7367208734509605, "percentage": 73.68, "elapsed_time": "1 day, 1:13:47", "remaining_time": "9:00:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7997, "total_steps": 10853, "loss": 0.1174, "learning_rate": 8.884319866690674e-07, "epoch": 0.7368130096282305, "percentage": 73.68, "elapsed_time": "1 day, 1:13:58", "remaining_time": "9:00:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7998, "total_steps": 10853, "loss": 0.1168, "learning_rate": 8.878496807069464e-07, "epoch": 0.7369051458055005, "percentage": 73.69, "elapsed_time": "1 day, 1:14:10", "remaining_time": "9:00:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7999, "total_steps": 10853, "loss": 0.1199, "learning_rate": 8.87267524433156e-07, "epoch": 0.7369972819827705, "percentage": 73.7, "elapsed_time": "1 day, 1:14:20", "remaining_time": "9:00:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8000, "total_steps": 10853, "loss": 0.116, "learning_rate": 8.866855179017505e-07, "epoch": 0.7370894181600406, "percentage": 73.71, "elapsed_time": "1 day, 1:14:31", "remaining_time": "9:00:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8000, "total_steps": 10853, "eval_loss": 0.12275012582540512, "epoch": 0.7370894181600406, "percentage": 73.71, "elapsed_time": "1 day, 1:19:30", "remaining_time": "9:01:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8001, "total_steps": 10853, "loss": 0.1074, "learning_rate": 8.861036611667676e-07, "epoch": 0.7371815543373106, "percentage": 73.72, "elapsed_time": "1 day, 1:19:41", "remaining_time": "9:01:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8002, "total_steps": 10853, "loss": 0.1059, "learning_rate": 8.855219542822341e-07, "epoch": 0.7372736905145806, "percentage": 73.73, "elapsed_time": "1 day, 1:19:51", "remaining_time": "9:01:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8003, "total_steps": 10853, "loss": 0.1236, "learning_rate": 8.8494039730216e-07, "epoch": 0.7373658266918506, "percentage": 73.74, "elapsed_time": "1 day, 1:20:02", "remaining_time": "9:01:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8004, "total_steps": 10853, "loss": 0.1317, "learning_rate": 8.843589902805438e-07, "epoch": 0.7374579628691206, "percentage": 73.75, "elapsed_time": "1 day, 1:20:12", "remaining_time": "9:01:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8005, "total_steps": 10853, "loss": 0.1203, "learning_rate": 8.837777332713701e-07, "epoch": 0.7375500990463906, "percentage": 73.76, "elapsed_time": "1 day, 1:20:23", "remaining_time": "9:00:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8006, "total_steps": 10853, "loss": 0.1187, "learning_rate": 8.831966263286071e-07, "epoch": 0.7376422352236606, "percentage": 73.77, "elapsed_time": "1 day, 1:20:31", "remaining_time": "9:00:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8007, "total_steps": 10853, "loss": 0.1241, "learning_rate": 8.826156695062113e-07, "epoch": 0.7377343714009306, "percentage": 73.78, "elapsed_time": "1 day, 1:20:41", "remaining_time": "9:00:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8008, "total_steps": 10853, "loss": 0.1228, "learning_rate": 8.820348628581254e-07, "epoch": 0.7378265075782006, "percentage": 73.79, "elapsed_time": "1 day, 1:20:52", "remaining_time": "9:00:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8009, "total_steps": 10853, "loss": 0.1244, "learning_rate": 8.814542064382767e-07, "epoch": 0.7379186437554706, "percentage": 73.8, "elapsed_time": "1 day, 1:21:02", "remaining_time": "9:00:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8010, "total_steps": 10853, "loss": 0.1214, "learning_rate": 8.808737003005782e-07, "epoch": 0.7380107799327406, "percentage": 73.8, "elapsed_time": "1 day, 1:21:13", "remaining_time": "8:59:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8011, "total_steps": 10853, "loss": 0.1257, "learning_rate": 8.802933444989308e-07, "epoch": 0.7381029161100106, "percentage": 73.81, "elapsed_time": "1 day, 1:21:23", "remaining_time": "8:59:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8012, "total_steps": 10853, "loss": 0.1104, "learning_rate": 8.797131390872207e-07, "epoch": 0.7381950522872806, "percentage": 73.82, "elapsed_time": "1 day, 1:21:33", "remaining_time": "8:59:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8013, "total_steps": 10853, "loss": 0.1216, "learning_rate": 8.79133084119321e-07, "epoch": 0.7382871884645507, "percentage": 73.83, "elapsed_time": "1 day, 1:21:44", "remaining_time": "8:59:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8014, "total_steps": 10853, "loss": 0.1287, "learning_rate": 8.78553179649089e-07, "epoch": 0.7383793246418207, "percentage": 73.84, "elapsed_time": "1 day, 1:21:56", "remaining_time": "8:59:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8015, "total_steps": 10853, "loss": 0.1248, "learning_rate": 8.779734257303677e-07, "epoch": 0.7384714608190907, "percentage": 73.85, "elapsed_time": "1 day, 1:22:06", "remaining_time": "8:58:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8016, "total_steps": 10853, "loss": 0.119, "learning_rate": 8.773938224169884e-07, "epoch": 0.7385635969963606, "percentage": 73.86, "elapsed_time": "1 day, 1:22:16", "remaining_time": "8:58:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8017, "total_steps": 10853, "loss": 0.1301, "learning_rate": 8.768143697627681e-07, "epoch": 0.7386557331736306, "percentage": 73.87, "elapsed_time": "1 day, 1:22:27", "remaining_time": "8:58:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8018, "total_steps": 10853, "loss": 0.1085, "learning_rate": 8.762350678215076e-07, "epoch": 0.7387478693509006, "percentage": 73.88, "elapsed_time": "1 day, 1:22:39", "remaining_time": "8:58:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8019, "total_steps": 10853, "loss": 0.1299, "learning_rate": 8.756559166469966e-07, "epoch": 0.7388400055281706, "percentage": 73.89, "elapsed_time": "1 day, 1:22:52", "remaining_time": "8:58:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8020, "total_steps": 10853, "loss": 0.1221, "learning_rate": 8.750769162930076e-07, "epoch": 0.7389321417054406, "percentage": 73.9, "elapsed_time": "1 day, 1:23:04", "remaining_time": "8:58:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8021, "total_steps": 10853, "loss": 0.1208, "learning_rate": 8.744980668133026e-07, "epoch": 0.7390242778827106, "percentage": 73.91, "elapsed_time": "1 day, 1:23:15", "remaining_time": "8:57:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8022, "total_steps": 10853, "loss": 0.1197, "learning_rate": 8.739193682616265e-07, "epoch": 0.7391164140599806, "percentage": 73.92, "elapsed_time": "1 day, 1:23:26", "remaining_time": "8:57:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8023, "total_steps": 10853, "loss": 0.1226, "learning_rate": 8.733408206917118e-07, "epoch": 0.7392085502372506, "percentage": 73.92, "elapsed_time": "1 day, 1:23:37", "remaining_time": "8:57:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8024, "total_steps": 10853, "loss": 0.1292, "learning_rate": 8.727624241572779e-07, "epoch": 0.7393006864145206, "percentage": 73.93, "elapsed_time": "1 day, 1:23:49", "remaining_time": "8:57:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8025, "total_steps": 10853, "loss": 0.1146, "learning_rate": 8.72184178712028e-07, "epoch": 0.7393928225917906, "percentage": 73.94, "elapsed_time": "1 day, 1:23:58", "remaining_time": "8:57:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8026, "total_steps": 10853, "loss": 0.1159, "learning_rate": 8.716060844096514e-07, "epoch": 0.7394849587690606, "percentage": 73.95, "elapsed_time": "1 day, 1:24:08", "remaining_time": "8:56:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8027, "total_steps": 10853, "loss": 0.1127, "learning_rate": 8.710281413038252e-07, "epoch": 0.7395770949463307, "percentage": 73.96, "elapsed_time": "1 day, 1:24:18", "remaining_time": "8:56:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8028, "total_steps": 10853, "loss": 0.1323, "learning_rate": 8.704503494482114e-07, "epoch": 0.7396692311236007, "percentage": 73.97, "elapsed_time": "1 day, 1:24:29", "remaining_time": "8:56:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8029, "total_steps": 10853, "loss": 0.1144, "learning_rate": 8.698727088964587e-07, "epoch": 0.7397613673008707, "percentage": 73.98, "elapsed_time": "1 day, 1:24:39", "remaining_time": "8:56:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8030, "total_steps": 10853, "loss": 0.1126, "learning_rate": 8.692952197022006e-07, "epoch": 0.7398535034781407, "percentage": 73.99, "elapsed_time": "1 day, 1:24:50", "remaining_time": "8:56:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8031, "total_steps": 10853, "loss": 0.1252, "learning_rate": 8.687178819190558e-07, "epoch": 0.7399456396554107, "percentage": 74.0, "elapsed_time": "1 day, 1:24:59", "remaining_time": "8:55:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8032, "total_steps": 10853, "loss": 0.1327, "learning_rate": 8.681406956006316e-07, "epoch": 0.7400377758326807, "percentage": 74.01, "elapsed_time": "1 day, 1:25:11", "remaining_time": "8:55:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8033, "total_steps": 10853, "loss": 0.1218, "learning_rate": 8.675636608005191e-07, "epoch": 0.7401299120099507, "percentage": 74.02, "elapsed_time": "1 day, 1:25:21", "remaining_time": "8:55:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8034, "total_steps": 10853, "loss": 0.1308, "learning_rate": 8.669867775722973e-07, "epoch": 0.7402220481872207, "percentage": 74.03, "elapsed_time": "1 day, 1:25:32", "remaining_time": "8:55:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8035, "total_steps": 10853, "loss": 0.1094, "learning_rate": 8.66410045969529e-07, "epoch": 0.7403141843644907, "percentage": 74.03, "elapsed_time": "1 day, 1:25:43", "remaining_time": "8:55:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8036, "total_steps": 10853, "loss": 0.1215, "learning_rate": 8.658334660457629e-07, "epoch": 0.7404063205417607, "percentage": 74.04, "elapsed_time": "1 day, 1:25:51", "remaining_time": "8:54:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8037, "total_steps": 10853, "loss": 0.1024, "learning_rate": 8.652570378545355e-07, "epoch": 0.7404984567190307, "percentage": 74.05, "elapsed_time": "1 day, 1:26:01", "remaining_time": "8:54:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8038, "total_steps": 10853, "loss": 0.1074, "learning_rate": 8.646807614493685e-07, "epoch": 0.7405905928963007, "percentage": 74.06, "elapsed_time": "1 day, 1:26:12", "remaining_time": "8:54:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8039, "total_steps": 10853, "loss": 0.119, "learning_rate": 8.641046368837682e-07, "epoch": 0.7406827290735707, "percentage": 74.07, "elapsed_time": "1 day, 1:26:22", "remaining_time": "8:54:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8040, "total_steps": 10853, "loss": 0.1068, "learning_rate": 8.635286642112295e-07, "epoch": 0.7407748652508408, "percentage": 74.08, "elapsed_time": "1 day, 1:26:31", "remaining_time": "8:54:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8041, "total_steps": 10853, "loss": 0.1261, "learning_rate": 8.629528434852294e-07, "epoch": 0.7408670014281108, "percentage": 74.09, "elapsed_time": "1 day, 1:26:41", "remaining_time": "8:53:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8042, "total_steps": 10853, "loss": 0.1303, "learning_rate": 8.623771747592347e-07, "epoch": 0.7409591376053808, "percentage": 74.1, "elapsed_time": "1 day, 1:26:53", "remaining_time": "8:53:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8043, "total_steps": 10853, "loss": 0.113, "learning_rate": 8.618016580866947e-07, "epoch": 0.7410512737826508, "percentage": 74.11, "elapsed_time": "1 day, 1:27:04", "remaining_time": "8:53:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8044, "total_steps": 10853, "loss": 0.1088, "learning_rate": 8.612262935210472e-07, "epoch": 0.7411434099599208, "percentage": 74.12, "elapsed_time": "1 day, 1:27:15", "remaining_time": "8:53:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8045, "total_steps": 10853, "loss": 0.1181, "learning_rate": 8.606510811157154e-07, "epoch": 0.7412355461371908, "percentage": 74.13, "elapsed_time": "1 day, 1:27:26", "remaining_time": "8:53:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8046, "total_steps": 10853, "loss": 0.1277, "learning_rate": 8.600760209241074e-07, "epoch": 0.7413276823144608, "percentage": 74.14, "elapsed_time": "1 day, 1:27:37", "remaining_time": "8:52:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8047, "total_steps": 10853, "loss": 0.1219, "learning_rate": 8.595011129996164e-07, "epoch": 0.7414198184917308, "percentage": 74.15, "elapsed_time": "1 day, 1:27:48", "remaining_time": "8:52:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8048, "total_steps": 10853, "loss": 0.1226, "learning_rate": 8.589263573956236e-07, "epoch": 0.7415119546690008, "percentage": 74.15, "elapsed_time": "1 day, 1:27:58", "remaining_time": "8:52:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8049, "total_steps": 10853, "loss": 0.1117, "learning_rate": 8.583517541654951e-07, "epoch": 0.7416040908462708, "percentage": 74.16, "elapsed_time": "1 day, 1:28:10", "remaining_time": "8:52:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8050, "total_steps": 10853, "loss": 0.1226, "learning_rate": 8.577773033625836e-07, "epoch": 0.7416962270235408, "percentage": 74.17, "elapsed_time": "1 day, 1:28:21", "remaining_time": "8:52:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8051, "total_steps": 10853, "loss": 0.1094, "learning_rate": 8.572030050402264e-07, "epoch": 0.7417883632008108, "percentage": 74.18, "elapsed_time": "1 day, 1:28:32", "remaining_time": "8:51:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8052, "total_steps": 10853, "loss": 0.1222, "learning_rate": 8.566288592517461e-07, "epoch": 0.7418804993780808, "percentage": 74.19, "elapsed_time": "1 day, 1:28:41", "remaining_time": "8:51:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8053, "total_steps": 10853, "loss": 0.1109, "learning_rate": 8.560548660504531e-07, "epoch": 0.7419726355553508, "percentage": 74.2, "elapsed_time": "1 day, 1:28:53", "remaining_time": "8:51:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8054, "total_steps": 10853, "loss": 0.1222, "learning_rate": 8.554810254896434e-07, "epoch": 0.7420647717326209, "percentage": 74.21, "elapsed_time": "1 day, 1:29:03", "remaining_time": "8:51:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8055, "total_steps": 10853, "loss": 0.1051, "learning_rate": 8.54907337622597e-07, "epoch": 0.7421569079098909, "percentage": 74.22, "elapsed_time": "1 day, 1:29:13", "remaining_time": "8:51:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8056, "total_steps": 10853, "loss": 0.1295, "learning_rate": 8.543338025025818e-07, "epoch": 0.7422490440871609, "percentage": 74.23, "elapsed_time": "1 day, 1:29:23", "remaining_time": "8:50:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8057, "total_steps": 10853, "loss": 0.1194, "learning_rate": 8.537604201828495e-07, "epoch": 0.7423411802644309, "percentage": 74.24, "elapsed_time": "1 day, 1:29:32", "remaining_time": "8:50:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8058, "total_steps": 10853, "loss": 0.1215, "learning_rate": 8.5318719071664e-07, "epoch": 0.7424333164417009, "percentage": 74.25, "elapsed_time": "1 day, 1:29:44", "remaining_time": "8:50:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8059, "total_steps": 10853, "loss": 0.1263, "learning_rate": 8.526141141571764e-07, "epoch": 0.7425254526189708, "percentage": 74.26, "elapsed_time": "1 day, 1:29:55", "remaining_time": "8:50:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8060, "total_steps": 10853, "loss": 0.1238, "learning_rate": 8.520411905576697e-07, "epoch": 0.7426175887962408, "percentage": 74.27, "elapsed_time": "1 day, 1:30:06", "remaining_time": "8:50:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8061, "total_steps": 10853, "loss": 0.1126, "learning_rate": 8.514684199713166e-07, "epoch": 0.7427097249735108, "percentage": 74.27, "elapsed_time": "1 day, 1:30:16", "remaining_time": "8:50:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8062, "total_steps": 10853, "loss": 0.1186, "learning_rate": 8.508958024512972e-07, "epoch": 0.7428018611507808, "percentage": 74.28, "elapsed_time": "1 day, 1:30:26", "remaining_time": "8:49:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8063, "total_steps": 10853, "loss": 0.1221, "learning_rate": 8.503233380507808e-07, "epoch": 0.7428939973280508, "percentage": 74.29, "elapsed_time": "1 day, 1:30:37", "remaining_time": "8:49:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8064, "total_steps": 10853, "loss": 0.125, "learning_rate": 8.497510268229192e-07, "epoch": 0.7429861335053208, "percentage": 74.3, "elapsed_time": "1 day, 1:30:47", "remaining_time": "8:49:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8065, "total_steps": 10853, "loss": 0.1272, "learning_rate": 8.491788688208524e-07, "epoch": 0.7430782696825908, "percentage": 74.31, "elapsed_time": "1 day, 1:30:58", "remaining_time": "8:49:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8066, "total_steps": 10853, "loss": 0.1312, "learning_rate": 8.486068640977063e-07, "epoch": 0.7431704058598608, "percentage": 74.32, "elapsed_time": "1 day, 1:31:08", "remaining_time": "8:49:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8067, "total_steps": 10853, "loss": 0.1144, "learning_rate": 8.480350127065904e-07, "epoch": 0.7432625420371308, "percentage": 74.33, "elapsed_time": "1 day, 1:31:18", "remaining_time": "8:48:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8068, "total_steps": 10853, "loss": 0.116, "learning_rate": 8.474633147006006e-07, "epoch": 0.7433546782144009, "percentage": 74.34, "elapsed_time": "1 day, 1:31:28", "remaining_time": "8:48:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8069, "total_steps": 10853, "loss": 0.1281, "learning_rate": 8.468917701328197e-07, "epoch": 0.7434468143916709, "percentage": 74.35, "elapsed_time": "1 day, 1:31:39", "remaining_time": "8:48:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8070, "total_steps": 10853, "loss": 0.1262, "learning_rate": 8.46320379056316e-07, "epoch": 0.7435389505689409, "percentage": 74.36, "elapsed_time": "1 day, 1:31:50", "remaining_time": "8:48:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8071, "total_steps": 10853, "loss": 0.1239, "learning_rate": 8.45749141524144e-07, "epoch": 0.7436310867462109, "percentage": 74.37, "elapsed_time": "1 day, 1:32:00", "remaining_time": "8:48:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8072, "total_steps": 10853, "loss": 0.1068, "learning_rate": 8.45178057589342e-07, "epoch": 0.7437232229234809, "percentage": 74.38, "elapsed_time": "1 day, 1:32:10", "remaining_time": "8:47:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8073, "total_steps": 10853, "loss": 0.1309, "learning_rate": 8.446071273049347e-07, "epoch": 0.7438153591007509, "percentage": 74.38, "elapsed_time": "1 day, 1:32:21", "remaining_time": "8:47:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8074, "total_steps": 10853, "loss": 0.122, "learning_rate": 8.440363507239338e-07, "epoch": 0.7439074952780209, "percentage": 74.39, "elapsed_time": "1 day, 1:32:31", "remaining_time": "8:47:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8075, "total_steps": 10853, "loss": 0.1103, "learning_rate": 8.434657278993369e-07, "epoch": 0.7439996314552909, "percentage": 74.4, "elapsed_time": "1 day, 1:32:42", "remaining_time": "8:47:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8076, "total_steps": 10853, "loss": 0.1141, "learning_rate": 8.428952588841247e-07, "epoch": 0.7440917676325609, "percentage": 74.41, "elapsed_time": "1 day, 1:32:53", "remaining_time": "8:47:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8077, "total_steps": 10853, "loss": 0.1267, "learning_rate": 8.423249437312667e-07, "epoch": 0.7441839038098309, "percentage": 74.42, "elapsed_time": "1 day, 1:33:05", "remaining_time": "8:46:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8078, "total_steps": 10853, "loss": 0.1132, "learning_rate": 8.41754782493715e-07, "epoch": 0.7442760399871009, "percentage": 74.43, "elapsed_time": "1 day, 1:33:15", "remaining_time": "8:46:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8079, "total_steps": 10853, "loss": 0.1165, "learning_rate": 8.411847752244115e-07, "epoch": 0.7443681761643709, "percentage": 74.44, "elapsed_time": "1 day, 1:33:25", "remaining_time": "8:46:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8080, "total_steps": 10853, "loss": 0.1479, "learning_rate": 8.406149219762791e-07, "epoch": 0.7444603123416409, "percentage": 74.45, "elapsed_time": "1 day, 1:33:37", "remaining_time": "8:46:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8081, "total_steps": 10853, "loss": 0.1087, "learning_rate": 8.400452228022296e-07, "epoch": 0.744552448518911, "percentage": 74.46, "elapsed_time": "1 day, 1:33:48", "remaining_time": "8:46:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8082, "total_steps": 10853, "loss": 0.125, "learning_rate": 8.394756777551602e-07, "epoch": 0.744644584696181, "percentage": 74.47, "elapsed_time": "1 day, 1:33:59", "remaining_time": "8:45:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8083, "total_steps": 10853, "loss": 0.1173, "learning_rate": 8.389062868879541e-07, "epoch": 0.744736720873451, "percentage": 74.48, "elapsed_time": "1 day, 1:34:08", "remaining_time": "8:45:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8084, "total_steps": 10853, "loss": 0.1102, "learning_rate": 8.383370502534765e-07, "epoch": 0.744828857050721, "percentage": 74.49, "elapsed_time": "1 day, 1:34:19", "remaining_time": "8:45:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8085, "total_steps": 10853, "loss": 0.1245, "learning_rate": 8.377679679045828e-07, "epoch": 0.744920993227991, "percentage": 74.5, "elapsed_time": "1 day, 1:34:31", "remaining_time": "8:45:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8086, "total_steps": 10853, "loss": 0.1255, "learning_rate": 8.371990398941121e-07, "epoch": 0.745013129405261, "percentage": 74.5, "elapsed_time": "1 day, 1:34:42", "remaining_time": "8:45:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8087, "total_steps": 10853, "loss": 0.1198, "learning_rate": 8.366302662748901e-07, "epoch": 0.745105265582531, "percentage": 74.51, "elapsed_time": "1 day, 1:34:52", "remaining_time": "8:44:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8088, "total_steps": 10853, "loss": 0.1132, "learning_rate": 8.360616470997263e-07, "epoch": 0.745197401759801, "percentage": 74.52, "elapsed_time": "1 day, 1:35:02", "remaining_time": "8:44:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8089, "total_steps": 10853, "loss": 0.1203, "learning_rate": 8.354931824214185e-07, "epoch": 0.745289537937071, "percentage": 74.53, "elapsed_time": "1 day, 1:35:14", "remaining_time": "8:44:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8090, "total_steps": 10853, "loss": 0.1263, "learning_rate": 8.349248722927469e-07, "epoch": 0.745381674114341, "percentage": 74.54, "elapsed_time": "1 day, 1:35:24", "remaining_time": "8:44:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8091, "total_steps": 10853, "loss": 0.123, "learning_rate": 8.343567167664801e-07, "epoch": 0.745473810291611, "percentage": 74.55, "elapsed_time": "1 day, 1:35:36", "remaining_time": "8:44:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8092, "total_steps": 10853, "loss": 0.1203, "learning_rate": 8.337887158953723e-07, "epoch": 0.745565946468881, "percentage": 74.56, "elapsed_time": "1 day, 1:35:48", "remaining_time": "8:44:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8093, "total_steps": 10853, "loss": 0.1192, "learning_rate": 8.332208697321606e-07, "epoch": 0.745658082646151, "percentage": 74.57, "elapsed_time": "1 day, 1:36:00", "remaining_time": "8:43:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8094, "total_steps": 10853, "loss": 0.115, "learning_rate": 8.326531783295716e-07, "epoch": 0.745750218823421, "percentage": 74.58, "elapsed_time": "1 day, 1:36:12", "remaining_time": "8:43:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8095, "total_steps": 10853, "loss": 0.1287, "learning_rate": 8.320856417403134e-07, "epoch": 0.7458423550006911, "percentage": 74.59, "elapsed_time": "1 day, 1:36:23", "remaining_time": "8:43:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8096, "total_steps": 10853, "loss": 0.1241, "learning_rate": 8.315182600170838e-07, "epoch": 0.7459344911779611, "percentage": 74.6, "elapsed_time": "1 day, 1:36:33", "remaining_time": "8:43:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8097, "total_steps": 10853, "loss": 0.134, "learning_rate": 8.309510332125623e-07, "epoch": 0.7460266273552311, "percentage": 74.61, "elapsed_time": "1 day, 1:36:46", "remaining_time": "8:43:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8098, "total_steps": 10853, "loss": 0.1176, "learning_rate": 8.30383961379417e-07, "epoch": 0.7461187635325011, "percentage": 74.62, "elapsed_time": "1 day, 1:36:56", "remaining_time": "8:42:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8099, "total_steps": 10853, "loss": 0.1205, "learning_rate": 8.298170445703016e-07, "epoch": 0.7462108997097711, "percentage": 74.62, "elapsed_time": "1 day, 1:37:07", "remaining_time": "8:42:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8100, "total_steps": 10853, "loss": 0.1242, "learning_rate": 8.292502828378534e-07, "epoch": 0.746303035887041, "percentage": 74.63, "elapsed_time": "1 day, 1:37:18", "remaining_time": "8:42:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8101, "total_steps": 10853, "loss": 0.1261, "learning_rate": 8.286836762346953e-07, "epoch": 0.746395172064311, "percentage": 74.64, "elapsed_time": "1 day, 1:37:29", "remaining_time": "8:42:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8102, "total_steps": 10853, "loss": 0.1253, "learning_rate": 8.281172248134376e-07, "epoch": 0.746487308241581, "percentage": 74.65, "elapsed_time": "1 day, 1:37:40", "remaining_time": "8:42:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8103, "total_steps": 10853, "loss": 0.1213, "learning_rate": 8.275509286266755e-07, "epoch": 0.746579444418851, "percentage": 74.66, "elapsed_time": "1 day, 1:37:51", "remaining_time": "8:41:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8104, "total_steps": 10853, "loss": 0.124, "learning_rate": 8.26984787726991e-07, "epoch": 0.746671580596121, "percentage": 74.67, "elapsed_time": "1 day, 1:38:01", "remaining_time": "8:41:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8105, "total_steps": 10853, "loss": 0.1287, "learning_rate": 8.264188021669483e-07, "epoch": 0.746763716773391, "percentage": 74.68, "elapsed_time": "1 day, 1:38:12", "remaining_time": "8:41:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8106, "total_steps": 10853, "loss": 0.1213, "learning_rate": 8.258529719990996e-07, "epoch": 0.746855852950661, "percentage": 74.69, "elapsed_time": "1 day, 1:38:23", "remaining_time": "8:41:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8107, "total_steps": 10853, "loss": 0.1349, "learning_rate": 8.252872972759826e-07, "epoch": 0.746947989127931, "percentage": 74.7, "elapsed_time": "1 day, 1:38:34", "remaining_time": "8:41:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8108, "total_steps": 10853, "loss": 0.1182, "learning_rate": 8.24721778050121e-07, "epoch": 0.7470401253052011, "percentage": 74.71, "elapsed_time": "1 day, 1:38:44", "remaining_time": "8:40:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8109, "total_steps": 10853, "loss": 0.1245, "learning_rate": 8.241564143740216e-07, "epoch": 0.7471322614824711, "percentage": 74.72, "elapsed_time": "1 day, 1:38:55", "remaining_time": "8:40:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8110, "total_steps": 10853, "loss": 0.1196, "learning_rate": 8.235912063001805e-07, "epoch": 0.7472243976597411, "percentage": 74.73, "elapsed_time": "1 day, 1:39:06", "remaining_time": "8:40:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8111, "total_steps": 10853, "loss": 0.1161, "learning_rate": 8.230261538810755e-07, "epoch": 0.7473165338370111, "percentage": 74.74, "elapsed_time": "1 day, 1:39:17", "remaining_time": "8:40:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8112, "total_steps": 10853, "loss": 0.1207, "learning_rate": 8.224612571691734e-07, "epoch": 0.7474086700142811, "percentage": 74.74, "elapsed_time": "1 day, 1:39:29", "remaining_time": "8:40:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8113, "total_steps": 10853, "loss": 0.1223, "learning_rate": 8.218965162169232e-07, "epoch": 0.7475008061915511, "percentage": 74.75, "elapsed_time": "1 day, 1:39:39", "remaining_time": "8:39:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8114, "total_steps": 10853, "loss": 0.1238, "learning_rate": 8.21331931076762e-07, "epoch": 0.7475929423688211, "percentage": 74.76, "elapsed_time": "1 day, 1:39:50", "remaining_time": "8:39:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8115, "total_steps": 10853, "loss": 0.1277, "learning_rate": 8.207675018011127e-07, "epoch": 0.7476850785460911, "percentage": 74.77, "elapsed_time": "1 day, 1:40:01", "remaining_time": "8:39:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8116, "total_steps": 10853, "loss": 0.1207, "learning_rate": 8.202032284423817e-07, "epoch": 0.7477772147233611, "percentage": 74.78, "elapsed_time": "1 day, 1:40:13", "remaining_time": "8:39:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8117, "total_steps": 10853, "loss": 0.1241, "learning_rate": 8.196391110529606e-07, "epoch": 0.7478693509006311, "percentage": 74.79, "elapsed_time": "1 day, 1:40:25", "remaining_time": "8:39:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8118, "total_steps": 10853, "loss": 0.1097, "learning_rate": 8.19075149685229e-07, "epoch": 0.7479614870779011, "percentage": 74.8, "elapsed_time": "1 day, 1:40:36", "remaining_time": "8:39:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8119, "total_steps": 10853, "loss": 0.1178, "learning_rate": 8.185113443915504e-07, "epoch": 0.7480536232551711, "percentage": 74.81, "elapsed_time": "1 day, 1:40:47", "remaining_time": "8:38:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8120, "total_steps": 10853, "loss": 0.1184, "learning_rate": 8.179476952242757e-07, "epoch": 0.7481457594324411, "percentage": 74.82, "elapsed_time": "1 day, 1:40:59", "remaining_time": "8:38:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8121, "total_steps": 10853, "loss": 0.1134, "learning_rate": 8.173842022357381e-07, "epoch": 0.7482378956097111, "percentage": 74.83, "elapsed_time": "1 day, 1:41:10", "remaining_time": "8:38:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8122, "total_steps": 10853, "loss": 0.1188, "learning_rate": 8.168208654782578e-07, "epoch": 0.7483300317869812, "percentage": 74.84, "elapsed_time": "1 day, 1:41:21", "remaining_time": "8:38:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8123, "total_steps": 10853, "loss": 0.1269, "learning_rate": 8.162576850041415e-07, "epoch": 0.7484221679642512, "percentage": 74.85, "elapsed_time": "1 day, 1:41:31", "remaining_time": "8:38:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8124, "total_steps": 10853, "loss": 0.1197, "learning_rate": 8.156946608656799e-07, "epoch": 0.7485143041415212, "percentage": 74.85, "elapsed_time": "1 day, 1:41:42", "remaining_time": "8:37:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8125, "total_steps": 10853, "loss": 0.1065, "learning_rate": 8.151317931151514e-07, "epoch": 0.7486064403187912, "percentage": 74.86, "elapsed_time": "1 day, 1:41:53", "remaining_time": "8:37:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8126, "total_steps": 10853, "loss": 0.1379, "learning_rate": 8.145690818048171e-07, "epoch": 0.7486985764960612, "percentage": 74.87, "elapsed_time": "1 day, 1:42:06", "remaining_time": "8:37:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8127, "total_steps": 10853, "loss": 0.1245, "learning_rate": 8.140065269869244e-07, "epoch": 0.7487907126733312, "percentage": 74.88, "elapsed_time": "1 day, 1:42:16", "remaining_time": "8:37:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8128, "total_steps": 10853, "loss": 0.1114, "learning_rate": 8.134441287137068e-07, "epoch": 0.7488828488506012, "percentage": 74.89, "elapsed_time": "1 day, 1:42:26", "remaining_time": "8:37:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8129, "total_steps": 10853, "loss": 0.1084, "learning_rate": 8.128818870373845e-07, "epoch": 0.7489749850278712, "percentage": 74.9, "elapsed_time": "1 day, 1:42:37", "remaining_time": "8:36:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8130, "total_steps": 10853, "loss": 0.1278, "learning_rate": 8.123198020101594e-07, "epoch": 0.7490671212051412, "percentage": 74.91, "elapsed_time": "1 day, 1:42:48", "remaining_time": "8:36:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8131, "total_steps": 10853, "loss": 0.1276, "learning_rate": 8.117578736842232e-07, "epoch": 0.7491592573824112, "percentage": 74.92, "elapsed_time": "1 day, 1:42:59", "remaining_time": "8:36:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8132, "total_steps": 10853, "loss": 0.12, "learning_rate": 8.111961021117496e-07, "epoch": 0.7492513935596812, "percentage": 74.93, "elapsed_time": "1 day, 1:43:10", "remaining_time": "8:36:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8133, "total_steps": 10853, "loss": 0.1216, "learning_rate": 8.106344873449001e-07, "epoch": 0.7493435297369512, "percentage": 74.94, "elapsed_time": "1 day, 1:43:20", "remaining_time": "8:36:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8134, "total_steps": 10853, "loss": 0.1268, "learning_rate": 8.100730294358197e-07, "epoch": 0.7494356659142212, "percentage": 74.95, "elapsed_time": "1 day, 1:43:31", "remaining_time": "8:35:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8135, "total_steps": 10853, "loss": 0.1239, "learning_rate": 8.095117284366405e-07, "epoch": 0.7495278020914912, "percentage": 74.96, "elapsed_time": "1 day, 1:43:42", "remaining_time": "8:35:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8136, "total_steps": 10853, "loss": 0.1165, "learning_rate": 8.089505843994797e-07, "epoch": 0.7496199382687613, "percentage": 74.97, "elapsed_time": "1 day, 1:43:54", "remaining_time": "8:35:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8137, "total_steps": 10853, "loss": 0.1101, "learning_rate": 8.083895973764394e-07, "epoch": 0.7497120744460313, "percentage": 74.97, "elapsed_time": "1 day, 1:44:05", "remaining_time": "8:35:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8138, "total_steps": 10853, "loss": 0.1259, "learning_rate": 8.078287674196061e-07, "epoch": 0.7498042106233013, "percentage": 74.98, "elapsed_time": "1 day, 1:44:17", "remaining_time": "8:35:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8139, "total_steps": 10853, "loss": 0.1264, "learning_rate": 8.072680945810538e-07, "epoch": 0.7498963468005713, "percentage": 74.99, "elapsed_time": "1 day, 1:44:27", "remaining_time": "8:35:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8140, "total_steps": 10853, "loss": 0.1351, "learning_rate": 8.067075789128412e-07, "epoch": 0.7499884829778413, "percentage": 75.0, "elapsed_time": "1 day, 1:44:39", "remaining_time": "8:34:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8141, "total_steps": 10853, "loss": 0.1151, "learning_rate": 8.061472204670129e-07, "epoch": 0.7500806191551113, "percentage": 75.01, "elapsed_time": "1 day, 1:44:50", "remaining_time": "8:34:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8142, "total_steps": 10853, "loss": 0.1183, "learning_rate": 8.055870192955975e-07, "epoch": 0.7501727553323813, "percentage": 75.02, "elapsed_time": "1 day, 1:45:01", "remaining_time": "8:34:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8143, "total_steps": 10853, "loss": 0.1179, "learning_rate": 8.050269754506091e-07, "epoch": 0.7502648915096513, "percentage": 75.03, "elapsed_time": "1 day, 1:45:12", "remaining_time": "8:34:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8144, "total_steps": 10853, "loss": 0.1281, "learning_rate": 8.044670889840481e-07, "epoch": 0.7503570276869213, "percentage": 75.04, "elapsed_time": "1 day, 1:45:24", "remaining_time": "8:34:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8145, "total_steps": 10853, "loss": 0.1243, "learning_rate": 8.039073599479014e-07, "epoch": 0.7504491638641912, "percentage": 75.05, "elapsed_time": "1 day, 1:45:35", "remaining_time": "8:33:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8146, "total_steps": 10853, "loss": 0.1229, "learning_rate": 8.033477883941379e-07, "epoch": 0.7505413000414612, "percentage": 75.06, "elapsed_time": "1 day, 1:45:46", "remaining_time": "8:33:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8147, "total_steps": 10853, "loss": 0.1275, "learning_rate": 8.027883743747156e-07, "epoch": 0.7506334362187312, "percentage": 75.07, "elapsed_time": "1 day, 1:45:57", "remaining_time": "8:33:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8148, "total_steps": 10853, "loss": 0.1158, "learning_rate": 8.022291179415747e-07, "epoch": 0.7507255723960012, "percentage": 75.08, "elapsed_time": "1 day, 1:46:08", "remaining_time": "8:33:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8149, "total_steps": 10853, "loss": 0.1265, "learning_rate": 8.016700191466431e-07, "epoch": 0.7508177085732713, "percentage": 75.09, "elapsed_time": "1 day, 1:46:18", "remaining_time": "8:33:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8150, "total_steps": 10853, "loss": 0.1172, "learning_rate": 8.011110780418335e-07, "epoch": 0.7509098447505413, "percentage": 75.09, "elapsed_time": "1 day, 1:46:29", "remaining_time": "8:32:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8151, "total_steps": 10853, "loss": 0.1294, "learning_rate": 8.005522946790426e-07, "epoch": 0.7510019809278113, "percentage": 75.1, "elapsed_time": "1 day, 1:46:40", "remaining_time": "8:32:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8152, "total_steps": 10853, "loss": 0.1256, "learning_rate": 7.999936691101545e-07, "epoch": 0.7510941171050813, "percentage": 75.11, "elapsed_time": "1 day, 1:46:51", "remaining_time": "8:32:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8153, "total_steps": 10853, "loss": 0.1276, "learning_rate": 7.994352013870366e-07, "epoch": 0.7511862532823513, "percentage": 75.12, "elapsed_time": "1 day, 1:47:02", "remaining_time": "8:32:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8154, "total_steps": 10853, "loss": 0.1093, "learning_rate": 7.988768915615441e-07, "epoch": 0.7512783894596213, "percentage": 75.13, "elapsed_time": "1 day, 1:47:11", "remaining_time": "8:32:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8155, "total_steps": 10853, "loss": 0.1131, "learning_rate": 7.983187396855144e-07, "epoch": 0.7513705256368913, "percentage": 75.14, "elapsed_time": "1 day, 1:47:21", "remaining_time": "8:31:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8156, "total_steps": 10853, "loss": 0.1218, "learning_rate": 7.977607458107731e-07, "epoch": 0.7514626618141613, "percentage": 75.15, "elapsed_time": "1 day, 1:47:32", "remaining_time": "8:31:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8157, "total_steps": 10853, "loss": 0.1189, "learning_rate": 7.972029099891293e-07, "epoch": 0.7515547979914313, "percentage": 75.16, "elapsed_time": "1 day, 1:47:43", "remaining_time": "8:31:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8158, "total_steps": 10853, "loss": 0.1142, "learning_rate": 7.966452322723806e-07, "epoch": 0.7516469341687013, "percentage": 75.17, "elapsed_time": "1 day, 1:47:53", "remaining_time": "8:31:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8159, "total_steps": 10853, "loss": 0.1199, "learning_rate": 7.960877127123038e-07, "epoch": 0.7517390703459713, "percentage": 75.18, "elapsed_time": "1 day, 1:48:04", "remaining_time": "8:31:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8160, "total_steps": 10853, "loss": 0.1117, "learning_rate": 7.955303513606657e-07, "epoch": 0.7518312065232413, "percentage": 75.19, "elapsed_time": "1 day, 1:48:15", "remaining_time": "8:30:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8161, "total_steps": 10853, "loss": 0.1276, "learning_rate": 7.949731482692185e-07, "epoch": 0.7519233427005113, "percentage": 75.2, "elapsed_time": "1 day, 1:48:26", "remaining_time": "8:30:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8162, "total_steps": 10853, "loss": 0.1145, "learning_rate": 7.944161034896986e-07, "epoch": 0.7520154788777813, "percentage": 75.21, "elapsed_time": "1 day, 1:48:36", "remaining_time": "8:30:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8163, "total_steps": 10853, "loss": 0.1261, "learning_rate": 7.93859217073826e-07, "epoch": 0.7521076150550514, "percentage": 75.21, "elapsed_time": "1 day, 1:48:48", "remaining_time": "8:30:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8164, "total_steps": 10853, "loss": 0.1186, "learning_rate": 7.933024890733099e-07, "epoch": 0.7521997512323214, "percentage": 75.22, "elapsed_time": "1 day, 1:48:57", "remaining_time": "8:30:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8165, "total_steps": 10853, "loss": 0.1238, "learning_rate": 7.927459195398404e-07, "epoch": 0.7522918874095914, "percentage": 75.23, "elapsed_time": "1 day, 1:49:07", "remaining_time": "8:29:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8166, "total_steps": 10853, "loss": 0.1281, "learning_rate": 7.921895085250967e-07, "epoch": 0.7523840235868614, "percentage": 75.24, "elapsed_time": "1 day, 1:49:18", "remaining_time": "8:29:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8167, "total_steps": 10853, "loss": 0.1115, "learning_rate": 7.916332560807402e-07, "epoch": 0.7524761597641314, "percentage": 75.25, "elapsed_time": "1 day, 1:49:29", "remaining_time": "8:29:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8168, "total_steps": 10853, "loss": 0.1172, "learning_rate": 7.910771622584199e-07, "epoch": 0.7525682959414014, "percentage": 75.26, "elapsed_time": "1 day, 1:49:39", "remaining_time": "8:29:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8169, "total_steps": 10853, "loss": 0.1144, "learning_rate": 7.905212271097696e-07, "epoch": 0.7526604321186714, "percentage": 75.27, "elapsed_time": "1 day, 1:49:49", "remaining_time": "8:29:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8170, "total_steps": 10853, "loss": 0.1203, "learning_rate": 7.899654506864074e-07, "epoch": 0.7527525682959414, "percentage": 75.28, "elapsed_time": "1 day, 1:49:59", "remaining_time": "8:29:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8171, "total_steps": 10853, "loss": 0.1143, "learning_rate": 7.894098330399363e-07, "epoch": 0.7528447044732114, "percentage": 75.29, "elapsed_time": "1 day, 1:50:10", "remaining_time": "8:28:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8172, "total_steps": 10853, "loss": 0.1297, "learning_rate": 7.888543742219462e-07, "epoch": 0.7529368406504814, "percentage": 75.3, "elapsed_time": "1 day, 1:50:21", "remaining_time": "8:28:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8173, "total_steps": 10853, "loss": 0.1205, "learning_rate": 7.882990742840119e-07, "epoch": 0.7530289768277514, "percentage": 75.31, "elapsed_time": "1 day, 1:50:31", "remaining_time": "8:28:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8174, "total_steps": 10853, "loss": 0.1246, "learning_rate": 7.877439332776934e-07, "epoch": 0.7531211130050214, "percentage": 75.32, "elapsed_time": "1 day, 1:50:42", "remaining_time": "8:28:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8175, "total_steps": 10853, "loss": 0.1078, "learning_rate": 7.87188951254535e-07, "epoch": 0.7532132491822914, "percentage": 75.32, "elapsed_time": "1 day, 1:50:53", "remaining_time": "8:28:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8176, "total_steps": 10853, "loss": 0.1246, "learning_rate": 7.866341282660661e-07, "epoch": 0.7533053853595615, "percentage": 75.33, "elapsed_time": "1 day, 1:51:04", "remaining_time": "8:27:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8177, "total_steps": 10853, "loss": 0.1194, "learning_rate": 7.860794643638026e-07, "epoch": 0.7533975215368315, "percentage": 75.34, "elapsed_time": "1 day, 1:51:16", "remaining_time": "8:27:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8178, "total_steps": 10853, "loss": 0.1274, "learning_rate": 7.855249595992454e-07, "epoch": 0.7534896577141015, "percentage": 75.35, "elapsed_time": "1 day, 1:51:27", "remaining_time": "8:27:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8179, "total_steps": 10853, "loss": 0.1141, "learning_rate": 7.849706140238808e-07, "epoch": 0.7535817938913715, "percentage": 75.36, "elapsed_time": "1 day, 1:51:38", "remaining_time": "8:27:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8180, "total_steps": 10853, "loss": 0.1171, "learning_rate": 7.844164276891794e-07, "epoch": 0.7536739300686415, "percentage": 75.37, "elapsed_time": "1 day, 1:51:48", "remaining_time": "8:27:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8181, "total_steps": 10853, "loss": 0.124, "learning_rate": 7.838624006465967e-07, "epoch": 0.7537660662459115, "percentage": 75.38, "elapsed_time": "1 day, 1:51:59", "remaining_time": "8:26:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8182, "total_steps": 10853, "loss": 0.1174, "learning_rate": 7.833085329475748e-07, "epoch": 0.7538582024231815, "percentage": 75.39, "elapsed_time": "1 day, 1:52:08", "remaining_time": "8:26:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8183, "total_steps": 10853, "loss": 0.1298, "learning_rate": 7.82754824643541e-07, "epoch": 0.7539503386004515, "percentage": 75.4, "elapsed_time": "1 day, 1:52:20", "remaining_time": "8:26:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8184, "total_steps": 10853, "loss": 0.1291, "learning_rate": 7.822012757859057e-07, "epoch": 0.7540424747777215, "percentage": 75.41, "elapsed_time": "1 day, 1:52:31", "remaining_time": "8:26:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8185, "total_steps": 10853, "loss": 0.1147, "learning_rate": 7.816478864260677e-07, "epoch": 0.7541346109549915, "percentage": 75.42, "elapsed_time": "1 day, 1:52:42", "remaining_time": "8:26:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8186, "total_steps": 10853, "loss": 0.1255, "learning_rate": 7.810946566154076e-07, "epoch": 0.7542267471322615, "percentage": 75.43, "elapsed_time": "1 day, 1:52:52", "remaining_time": "8:25:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8187, "total_steps": 10853, "loss": 0.1261, "learning_rate": 7.805415864052942e-07, "epoch": 0.7543188833095315, "percentage": 75.44, "elapsed_time": "1 day, 1:53:03", "remaining_time": "8:25:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8188, "total_steps": 10853, "loss": 0.123, "learning_rate": 7.79988675847079e-07, "epoch": 0.7544110194868014, "percentage": 75.44, "elapsed_time": "1 day, 1:53:13", "remaining_time": "8:25:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8189, "total_steps": 10853, "loss": 0.1225, "learning_rate": 7.794359249921004e-07, "epoch": 0.7545031556640714, "percentage": 75.45, "elapsed_time": "1 day, 1:53:24", "remaining_time": "8:25:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8190, "total_steps": 10853, "loss": 0.1172, "learning_rate": 7.78883333891682e-07, "epoch": 0.7545952918413416, "percentage": 75.46, "elapsed_time": "1 day, 1:53:35", "remaining_time": "8:25:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8191, "total_steps": 10853, "loss": 0.1158, "learning_rate": 7.783309025971314e-07, "epoch": 0.7546874280186116, "percentage": 75.47, "elapsed_time": "1 day, 1:53:46", "remaining_time": "8:24:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8192, "total_steps": 10853, "loss": 0.1343, "learning_rate": 7.777786311597408e-07, "epoch": 0.7547795641958815, "percentage": 75.48, "elapsed_time": "1 day, 1:53:57", "remaining_time": "8:24:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8193, "total_steps": 10853, "loss": 0.1216, "learning_rate": 7.772265196307896e-07, "epoch": 0.7548717003731515, "percentage": 75.49, "elapsed_time": "1 day, 1:54:08", "remaining_time": "8:24:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8194, "total_steps": 10853, "loss": 0.1193, "learning_rate": 7.766745680615417e-07, "epoch": 0.7549638365504215, "percentage": 75.5, "elapsed_time": "1 day, 1:54:18", "remaining_time": "8:24:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8195, "total_steps": 10853, "loss": 0.1125, "learning_rate": 7.761227765032464e-07, "epoch": 0.7550559727276915, "percentage": 75.51, "elapsed_time": "1 day, 1:54:27", "remaining_time": "8:24:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8196, "total_steps": 10853, "loss": 0.1198, "learning_rate": 7.755711450071365e-07, "epoch": 0.7551481089049615, "percentage": 75.52, "elapsed_time": "1 day, 1:54:39", "remaining_time": "8:23:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8197, "total_steps": 10853, "loss": 0.1275, "learning_rate": 7.750196736244309e-07, "epoch": 0.7552402450822315, "percentage": 75.53, "elapsed_time": "1 day, 1:54:48", "remaining_time": "8:23:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8198, "total_steps": 10853, "loss": 0.1175, "learning_rate": 7.744683624063343e-07, "epoch": 0.7553323812595015, "percentage": 75.54, "elapsed_time": "1 day, 1:54:58", "remaining_time": "8:23:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8199, "total_steps": 10853, "loss": 0.1212, "learning_rate": 7.739172114040366e-07, "epoch": 0.7554245174367715, "percentage": 75.55, "elapsed_time": "1 day, 1:55:08", "remaining_time": "8:23:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8200, "total_steps": 10853, "loss": 0.1191, "learning_rate": 7.733662206687106e-07, "epoch": 0.7555166536140415, "percentage": 75.56, "elapsed_time": "1 day, 1:55:19", "remaining_time": "8:23:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8201, "total_steps": 10853, "loss": 0.13, "learning_rate": 7.728153902515181e-07, "epoch": 0.7556087897913115, "percentage": 75.56, "elapsed_time": "1 day, 1:55:30", "remaining_time": "8:23:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8202, "total_steps": 10853, "loss": 0.1409, "learning_rate": 7.722647202036012e-07, "epoch": 0.7557009259685815, "percentage": 75.57, "elapsed_time": "1 day, 1:55:40", "remaining_time": "8:22:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8203, "total_steps": 10853, "loss": 0.1164, "learning_rate": 7.717142105760922e-07, "epoch": 0.7557930621458516, "percentage": 75.58, "elapsed_time": "1 day, 1:55:50", "remaining_time": "8:22:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8204, "total_steps": 10853, "loss": 0.132, "learning_rate": 7.711638614201037e-07, "epoch": 0.7558851983231216, "percentage": 75.59, "elapsed_time": "1 day, 1:56:01", "remaining_time": "8:22:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8205, "total_steps": 10853, "loss": 0.1185, "learning_rate": 7.706136727867366e-07, "epoch": 0.7559773345003916, "percentage": 75.6, "elapsed_time": "1 day, 1:56:12", "remaining_time": "8:22:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8206, "total_steps": 10853, "loss": 0.1142, "learning_rate": 7.700636447270773e-07, "epoch": 0.7560694706776616, "percentage": 75.61, "elapsed_time": "1 day, 1:56:23", "remaining_time": "8:22:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8207, "total_steps": 10853, "loss": 0.125, "learning_rate": 7.695137772921938e-07, "epoch": 0.7561616068549316, "percentage": 75.62, "elapsed_time": "1 day, 1:56:34", "remaining_time": "8:21:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8208, "total_steps": 10853, "loss": 0.1211, "learning_rate": 7.68964070533143e-07, "epoch": 0.7562537430322016, "percentage": 75.63, "elapsed_time": "1 day, 1:56:45", "remaining_time": "8:21:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8209, "total_steps": 10853, "loss": 0.1332, "learning_rate": 7.684145245009639e-07, "epoch": 0.7563458792094716, "percentage": 75.64, "elapsed_time": "1 day, 1:56:56", "remaining_time": "8:21:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8210, "total_steps": 10853, "loss": 0.1177, "learning_rate": 7.678651392466824e-07, "epoch": 0.7564380153867416, "percentage": 75.65, "elapsed_time": "1 day, 1:57:06", "remaining_time": "8:21:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8211, "total_steps": 10853, "loss": 0.1197, "learning_rate": 7.6731591482131e-07, "epoch": 0.7565301515640116, "percentage": 75.66, "elapsed_time": "1 day, 1:57:17", "remaining_time": "8:21:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8212, "total_steps": 10853, "loss": 0.1129, "learning_rate": 7.667668512758414e-07, "epoch": 0.7566222877412816, "percentage": 75.67, "elapsed_time": "1 day, 1:57:28", "remaining_time": "8:20:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8213, "total_steps": 10853, "loss": 0.1158, "learning_rate": 7.662179486612561e-07, "epoch": 0.7567144239185516, "percentage": 75.67, "elapsed_time": "1 day, 1:57:38", "remaining_time": "8:20:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8214, "total_steps": 10853, "loss": 0.127, "learning_rate": 7.656692070285212e-07, "epoch": 0.7568065600958216, "percentage": 75.68, "elapsed_time": "1 day, 1:57:49", "remaining_time": "8:20:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8215, "total_steps": 10853, "loss": 0.1314, "learning_rate": 7.651206264285871e-07, "epoch": 0.7568986962730916, "percentage": 75.69, "elapsed_time": "1 day, 1:58:00", "remaining_time": "8:20:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8216, "total_steps": 10853, "loss": 0.118, "learning_rate": 7.645722069123904e-07, "epoch": 0.7569908324503616, "percentage": 75.7, "elapsed_time": "1 day, 1:58:10", "remaining_time": "8:20:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8217, "total_steps": 10853, "loss": 0.1108, "learning_rate": 7.640239485308506e-07, "epoch": 0.7570829686276317, "percentage": 75.71, "elapsed_time": "1 day, 1:58:20", "remaining_time": "8:19:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8218, "total_steps": 10853, "loss": 0.1242, "learning_rate": 7.634758513348737e-07, "epoch": 0.7571751048049017, "percentage": 75.72, "elapsed_time": "1 day, 1:58:32", "remaining_time": "8:19:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8219, "total_steps": 10853, "loss": 0.1134, "learning_rate": 7.629279153753508e-07, "epoch": 0.7572672409821717, "percentage": 75.73, "elapsed_time": "1 day, 1:58:42", "remaining_time": "8:19:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8220, "total_steps": 10853, "loss": 0.1257, "learning_rate": 7.623801407031586e-07, "epoch": 0.7573593771594417, "percentage": 75.74, "elapsed_time": "1 day, 1:58:52", "remaining_time": "8:19:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8221, "total_steps": 10853, "loss": 0.1285, "learning_rate": 7.618325273691565e-07, "epoch": 0.7574515133367117, "percentage": 75.75, "elapsed_time": "1 day, 1:59:03", "remaining_time": "8:19:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8222, "total_steps": 10853, "loss": 0.1191, "learning_rate": 7.612850754241921e-07, "epoch": 0.7575436495139817, "percentage": 75.76, "elapsed_time": "1 day, 1:59:14", "remaining_time": "8:18:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8223, "total_steps": 10853, "loss": 0.129, "learning_rate": 7.607377849190947e-07, "epoch": 0.7576357856912517, "percentage": 75.77, "elapsed_time": "1 day, 1:59:24", "remaining_time": "8:18:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8224, "total_steps": 10853, "loss": 0.1252, "learning_rate": 7.601906559046824e-07, "epoch": 0.7577279218685217, "percentage": 75.78, "elapsed_time": "1 day, 1:59:35", "remaining_time": "8:18:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8225, "total_steps": 10853, "loss": 0.1418, "learning_rate": 7.596436884317537e-07, "epoch": 0.7578200580457917, "percentage": 75.79, "elapsed_time": "1 day, 1:59:47", "remaining_time": "8:18:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8226, "total_steps": 10853, "loss": 0.1316, "learning_rate": 7.590968825510958e-07, "epoch": 0.7579121942230617, "percentage": 75.79, "elapsed_time": "1 day, 1:59:57", "remaining_time": "8:18:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8227, "total_steps": 10853, "loss": 0.1246, "learning_rate": 7.585502383134807e-07, "epoch": 0.7580043304003317, "percentage": 75.8, "elapsed_time": "1 day, 2:00:08", "remaining_time": "8:17:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8228, "total_steps": 10853, "loss": 0.1281, "learning_rate": 7.580037557696634e-07, "epoch": 0.7580964665776017, "percentage": 75.81, "elapsed_time": "1 day, 2:00:20", "remaining_time": "8:17:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8229, "total_steps": 10853, "loss": 0.1277, "learning_rate": 7.574574349703839e-07, "epoch": 0.7581886027548717, "percentage": 75.82, "elapsed_time": "1 day, 2:00:30", "remaining_time": "8:17:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8230, "total_steps": 10853, "loss": 0.1169, "learning_rate": 7.569112759663693e-07, "epoch": 0.7582807389321417, "percentage": 75.83, "elapsed_time": "1 day, 2:00:41", "remaining_time": "8:17:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8231, "total_steps": 10853, "loss": 0.1259, "learning_rate": 7.5636527880833e-07, "epoch": 0.7583728751094118, "percentage": 75.84, "elapsed_time": "1 day, 2:00:52", "remaining_time": "8:17:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8232, "total_steps": 10853, "loss": 0.1325, "learning_rate": 7.558194435469634e-07, "epoch": 0.7584650112866818, "percentage": 75.85, "elapsed_time": "1 day, 2:01:02", "remaining_time": "8:17:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8233, "total_steps": 10853, "loss": 0.1194, "learning_rate": 7.55273770232949e-07, "epoch": 0.7585571474639518, "percentage": 75.86, "elapsed_time": "1 day, 2:01:12", "remaining_time": "8:16:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8234, "total_steps": 10853, "loss": 0.1212, "learning_rate": 7.547282589169519e-07, "epoch": 0.7586492836412217, "percentage": 75.87, "elapsed_time": "1 day, 2:01:23", "remaining_time": "8:16:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8235, "total_steps": 10853, "loss": 0.1148, "learning_rate": 7.541829096496239e-07, "epoch": 0.7587414198184917, "percentage": 75.88, "elapsed_time": "1 day, 2:01:33", "remaining_time": "8:16:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8236, "total_steps": 10853, "loss": 0.1273, "learning_rate": 7.536377224816008e-07, "epoch": 0.7588335559957617, "percentage": 75.89, "elapsed_time": "1 day, 2:01:44", "remaining_time": "8:16:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8237, "total_steps": 10853, "loss": 0.1308, "learning_rate": 7.530926974635036e-07, "epoch": 0.7589256921730317, "percentage": 75.9, "elapsed_time": "1 day, 2:01:55", "remaining_time": "8:16:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8238, "total_steps": 10853, "loss": 0.1287, "learning_rate": 7.525478346459369e-07, "epoch": 0.7590178283503017, "percentage": 75.91, "elapsed_time": "1 day, 2:02:06", "remaining_time": "8:15:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8239, "total_steps": 10853, "loss": 0.131, "learning_rate": 7.520031340794926e-07, "epoch": 0.7591099645275717, "percentage": 75.91, "elapsed_time": "1 day, 2:02:16", "remaining_time": "8:15:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8240, "total_steps": 10853, "loss": 0.1231, "learning_rate": 7.514585958147444e-07, "epoch": 0.7592021007048417, "percentage": 75.92, "elapsed_time": "1 day, 2:02:27", "remaining_time": "8:15:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8241, "total_steps": 10853, "loss": 0.1251, "learning_rate": 7.509142199022545e-07, "epoch": 0.7592942368821117, "percentage": 75.93, "elapsed_time": "1 day, 2:02:38", "remaining_time": "8:15:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8242, "total_steps": 10853, "loss": 0.1167, "learning_rate": 7.50370006392567e-07, "epoch": 0.7593863730593817, "percentage": 75.94, "elapsed_time": "1 day, 2:02:49", "remaining_time": "8:15:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8243, "total_steps": 10853, "loss": 0.1197, "learning_rate": 7.498259553362128e-07, "epoch": 0.7594785092366517, "percentage": 75.95, "elapsed_time": "1 day, 2:02:59", "remaining_time": "8:14:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8244, "total_steps": 10853, "loss": 0.1209, "learning_rate": 7.492820667837075e-07, "epoch": 0.7595706454139218, "percentage": 75.96, "elapsed_time": "1 day, 2:03:09", "remaining_time": "8:14:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8245, "total_steps": 10853, "loss": 0.1313, "learning_rate": 7.487383407855508e-07, "epoch": 0.7596627815911918, "percentage": 75.97, "elapsed_time": "1 day, 2:03:20", "remaining_time": "8:14:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8246, "total_steps": 10853, "loss": 0.1056, "learning_rate": 7.481947773922269e-07, "epoch": 0.7597549177684618, "percentage": 75.98, "elapsed_time": "1 day, 2:03:32", "remaining_time": "8:14:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8247, "total_steps": 10853, "loss": 0.1188, "learning_rate": 7.476513766542065e-07, "epoch": 0.7598470539457318, "percentage": 75.99, "elapsed_time": "1 day, 2:03:42", "remaining_time": "8:14:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8248, "total_steps": 10853, "loss": 0.1308, "learning_rate": 7.471081386219442e-07, "epoch": 0.7599391901230018, "percentage": 76.0, "elapsed_time": "1 day, 2:03:53", "remaining_time": "8:13:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8249, "total_steps": 10853, "loss": 0.139, "learning_rate": 7.465650633458807e-07, "epoch": 0.7600313263002718, "percentage": 76.01, "elapsed_time": "1 day, 2:04:03", "remaining_time": "8:13:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8250, "total_steps": 10853, "loss": 0.124, "learning_rate": 7.460221508764398e-07, "epoch": 0.7601234624775418, "percentage": 76.02, "elapsed_time": "1 day, 2:04:14", "remaining_time": "8:13:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8251, "total_steps": 10853, "loss": 0.1086, "learning_rate": 7.454794012640301e-07, "epoch": 0.7602155986548118, "percentage": 76.03, "elapsed_time": "1 day, 2:04:24", "remaining_time": "8:13:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8252, "total_steps": 10853, "loss": 0.1212, "learning_rate": 7.449368145590469e-07, "epoch": 0.7603077348320818, "percentage": 76.03, "elapsed_time": "1 day, 2:04:35", "remaining_time": "8:13:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8253, "total_steps": 10853, "loss": 0.1256, "learning_rate": 7.443943908118703e-07, "epoch": 0.7603998710093518, "percentage": 76.04, "elapsed_time": "1 day, 2:04:47", "remaining_time": "8:12:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8254, "total_steps": 10853, "loss": 0.1354, "learning_rate": 7.438521300728624e-07, "epoch": 0.7604920071866218, "percentage": 76.05, "elapsed_time": "1 day, 2:04:57", "remaining_time": "8:12:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8255, "total_steps": 10853, "loss": 0.1264, "learning_rate": 7.433100323923742e-07, "epoch": 0.7605841433638918, "percentage": 76.06, "elapsed_time": "1 day, 2:05:09", "remaining_time": "8:12:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8256, "total_steps": 10853, "loss": 0.1195, "learning_rate": 7.427680978207378e-07, "epoch": 0.7606762795411618, "percentage": 76.07, "elapsed_time": "1 day, 2:05:18", "remaining_time": "8:12:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8257, "total_steps": 10853, "loss": 0.1026, "learning_rate": 7.422263264082732e-07, "epoch": 0.7607684157184318, "percentage": 76.08, "elapsed_time": "1 day, 2:05:29", "remaining_time": "8:12:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8258, "total_steps": 10853, "loss": 0.1048, "learning_rate": 7.416847182052825e-07, "epoch": 0.7608605518957019, "percentage": 76.09, "elapsed_time": "1 day, 2:05:38", "remaining_time": "8:11:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8259, "total_steps": 10853, "loss": 0.121, "learning_rate": 7.411432732620552e-07, "epoch": 0.7609526880729719, "percentage": 76.1, "elapsed_time": "1 day, 2:05:49", "remaining_time": "8:11:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8260, "total_steps": 10853, "loss": 0.1267, "learning_rate": 7.406019916288651e-07, "epoch": 0.7610448242502419, "percentage": 76.11, "elapsed_time": "1 day, 2:06:00", "remaining_time": "8:11:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8261, "total_steps": 10853, "loss": 0.1151, "learning_rate": 7.400608733559692e-07, "epoch": 0.7611369604275119, "percentage": 76.12, "elapsed_time": "1 day, 2:06:11", "remaining_time": "8:11:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8262, "total_steps": 10853, "loss": 0.1235, "learning_rate": 7.395199184936099e-07, "epoch": 0.7612290966047819, "percentage": 76.13, "elapsed_time": "1 day, 2:06:23", "remaining_time": "8:11:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8263, "total_steps": 10853, "loss": 0.1182, "learning_rate": 7.389791270920158e-07, "epoch": 0.7613212327820519, "percentage": 76.14, "elapsed_time": "1 day, 2:06:35", "remaining_time": "8:11:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8264, "total_steps": 10853, "loss": 0.1416, "learning_rate": 7.38438499201399e-07, "epoch": 0.7614133689593219, "percentage": 76.14, "elapsed_time": "1 day, 2:06:46", "remaining_time": "8:10:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8265, "total_steps": 10853, "loss": 0.1188, "learning_rate": 7.378980348719581e-07, "epoch": 0.7615055051365919, "percentage": 76.15, "elapsed_time": "1 day, 2:06:56", "remaining_time": "8:10:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8266, "total_steps": 10853, "loss": 0.1153, "learning_rate": 7.373577341538742e-07, "epoch": 0.7615976413138619, "percentage": 76.16, "elapsed_time": "1 day, 2:07:08", "remaining_time": "8:10:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8267, "total_steps": 10853, "loss": 0.11, "learning_rate": 7.368175970973138e-07, "epoch": 0.7616897774911319, "percentage": 76.17, "elapsed_time": "1 day, 2:07:19", "remaining_time": "8:10:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8268, "total_steps": 10853, "loss": 0.1197, "learning_rate": 7.362776237524291e-07, "epoch": 0.7617819136684019, "percentage": 76.18, "elapsed_time": "1 day, 2:07:28", "remaining_time": "8:10:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8269, "total_steps": 10853, "loss": 0.1197, "learning_rate": 7.357378141693569e-07, "epoch": 0.7618740498456719, "percentage": 76.19, "elapsed_time": "1 day, 2:07:38", "remaining_time": "8:09:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8270, "total_steps": 10853, "loss": 0.1239, "learning_rate": 7.351981683982193e-07, "epoch": 0.7619661860229419, "percentage": 76.2, "elapsed_time": "1 day, 2:07:49", "remaining_time": "8:09:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8271, "total_steps": 10853, "loss": 0.127, "learning_rate": 7.346586864891217e-07, "epoch": 0.762058322200212, "percentage": 76.21, "elapsed_time": "1 day, 2:08:00", "remaining_time": "8:09:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8272, "total_steps": 10853, "loss": 0.1118, "learning_rate": 7.341193684921541e-07, "epoch": 0.762150458377482, "percentage": 76.22, "elapsed_time": "1 day, 2:08:12", "remaining_time": "8:09:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8273, "total_steps": 10853, "loss": 0.1177, "learning_rate": 7.335802144573933e-07, "epoch": 0.762242594554752, "percentage": 76.23, "elapsed_time": "1 day, 2:08:23", "remaining_time": "8:09:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8274, "total_steps": 10853, "loss": 0.1163, "learning_rate": 7.330412244349005e-07, "epoch": 0.762334730732022, "percentage": 76.24, "elapsed_time": "1 day, 2:08:34", "remaining_time": "8:08:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8275, "total_steps": 10853, "loss": 0.1334, "learning_rate": 7.325023984747195e-07, "epoch": 0.762426866909292, "percentage": 76.25, "elapsed_time": "1 day, 2:08:45", "remaining_time": "8:08:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8276, "total_steps": 10853, "loss": 0.1225, "learning_rate": 7.319637366268817e-07, "epoch": 0.762519003086562, "percentage": 76.26, "elapsed_time": "1 day, 2:08:57", "remaining_time": "8:08:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8277, "total_steps": 10853, "loss": 0.1131, "learning_rate": 7.314252389414003e-07, "epoch": 0.762611139263832, "percentage": 76.26, "elapsed_time": "1 day, 2:09:09", "remaining_time": "8:08:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8278, "total_steps": 10853, "loss": 0.1247, "learning_rate": 7.308869054682769e-07, "epoch": 0.762703275441102, "percentage": 76.27, "elapsed_time": "1 day, 2:09:21", "remaining_time": "8:08:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8279, "total_steps": 10853, "loss": 0.1261, "learning_rate": 7.303487362574938e-07, "epoch": 0.7627954116183719, "percentage": 76.28, "elapsed_time": "1 day, 2:09:32", "remaining_time": "8:07:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8280, "total_steps": 10853, "loss": 0.1337, "learning_rate": 7.298107313590208e-07, "epoch": 0.7628875477956419, "percentage": 76.29, "elapsed_time": "1 day, 2:09:43", "remaining_time": "8:07:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8281, "total_steps": 10853, "loss": 0.1247, "learning_rate": 7.292728908228127e-07, "epoch": 0.7629796839729119, "percentage": 76.3, "elapsed_time": "1 day, 2:09:53", "remaining_time": "8:07:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8282, "total_steps": 10853, "loss": 0.1222, "learning_rate": 7.287352146988075e-07, "epoch": 0.7630718201501819, "percentage": 76.31, "elapsed_time": "1 day, 2:10:04", "remaining_time": "8:07:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8283, "total_steps": 10853, "loss": 0.1031, "learning_rate": 7.281977030369275e-07, "epoch": 0.7631639563274519, "percentage": 76.32, "elapsed_time": "1 day, 2:10:13", "remaining_time": "8:07:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8284, "total_steps": 10853, "loss": 0.1208, "learning_rate": 7.276603558870812e-07, "epoch": 0.7632560925047219, "percentage": 76.33, "elapsed_time": "1 day, 2:10:24", "remaining_time": "8:07:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8285, "total_steps": 10853, "loss": 0.1164, "learning_rate": 7.271231732991619e-07, "epoch": 0.763348228681992, "percentage": 76.34, "elapsed_time": "1 day, 2:10:35", "remaining_time": "8:06:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8286, "total_steps": 10853, "loss": 0.1222, "learning_rate": 7.265861553230472e-07, "epoch": 0.763440364859262, "percentage": 76.35, "elapsed_time": "1 day, 2:10:46", "remaining_time": "8:06:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8287, "total_steps": 10853, "loss": 0.1282, "learning_rate": 7.26049302008599e-07, "epoch": 0.763532501036532, "percentage": 76.36, "elapsed_time": "1 day, 2:10:56", "remaining_time": "8:06:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8288, "total_steps": 10853, "loss": 0.1399, "learning_rate": 7.255126134056631e-07, "epoch": 0.763624637213802, "percentage": 76.37, "elapsed_time": "1 day, 2:11:07", "remaining_time": "8:06:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8289, "total_steps": 10853, "loss": 0.1243, "learning_rate": 7.249760895640723e-07, "epoch": 0.763716773391072, "percentage": 76.38, "elapsed_time": "1 day, 2:11:17", "remaining_time": "8:06:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8290, "total_steps": 10853, "loss": 0.1155, "learning_rate": 7.244397305336423e-07, "epoch": 0.763808909568342, "percentage": 76.38, "elapsed_time": "1 day, 2:11:27", "remaining_time": "8:05:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8291, "total_steps": 10853, "loss": 0.1219, "learning_rate": 7.239035363641752e-07, "epoch": 0.763901045745612, "percentage": 76.39, "elapsed_time": "1 day, 2:11:37", "remaining_time": "8:05:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8292, "total_steps": 10853, "loss": 0.1287, "learning_rate": 7.233675071054564e-07, "epoch": 0.763993181922882, "percentage": 76.4, "elapsed_time": "1 day, 2:11:48", "remaining_time": "8:05:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8293, "total_steps": 10853, "loss": 0.1236, "learning_rate": 7.228316428072546e-07, "epoch": 0.764085318100152, "percentage": 76.41, "elapsed_time": "1 day, 2:12:00", "remaining_time": "8:05:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8294, "total_steps": 10853, "loss": 0.1158, "learning_rate": 7.222959435193258e-07, "epoch": 0.764177454277422, "percentage": 76.42, "elapsed_time": "1 day, 2:12:11", "remaining_time": "8:05:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8295, "total_steps": 10853, "loss": 0.1343, "learning_rate": 7.21760409291411e-07, "epoch": 0.764269590454692, "percentage": 76.43, "elapsed_time": "1 day, 2:12:22", "remaining_time": "8:04:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8296, "total_steps": 10853, "loss": 0.127, "learning_rate": 7.212250401732329e-07, "epoch": 0.764361726631962, "percentage": 76.44, "elapsed_time": "1 day, 2:12:33", "remaining_time": "8:04:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8297, "total_steps": 10853, "loss": 0.1196, "learning_rate": 7.206898362145021e-07, "epoch": 0.764453862809232, "percentage": 76.45, "elapsed_time": "1 day, 2:12:43", "remaining_time": "8:04:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8298, "total_steps": 10853, "loss": 0.1122, "learning_rate": 7.201547974649104e-07, "epoch": 0.764545998986502, "percentage": 76.46, "elapsed_time": "1 day, 2:12:55", "remaining_time": "8:04:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8299, "total_steps": 10853, "loss": 0.1236, "learning_rate": 7.196199239741383e-07, "epoch": 0.7646381351637721, "percentage": 76.47, "elapsed_time": "1 day, 2:13:05", "remaining_time": "8:04:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8300, "total_steps": 10853, "loss": 0.1167, "learning_rate": 7.190852157918468e-07, "epoch": 0.7647302713410421, "percentage": 76.48, "elapsed_time": "1 day, 2:13:17", "remaining_time": "8:03:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8301, "total_steps": 10853, "loss": 0.1136, "learning_rate": 7.185506729676849e-07, "epoch": 0.7648224075183121, "percentage": 76.49, "elapsed_time": "1 day, 2:13:29", "remaining_time": "8:03:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8302, "total_steps": 10853, "loss": 0.1223, "learning_rate": 7.180162955512856e-07, "epoch": 0.7649145436955821, "percentage": 76.49, "elapsed_time": "1 day, 2:13:38", "remaining_time": "8:03:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8303, "total_steps": 10853, "loss": 0.1136, "learning_rate": 7.174820835922649e-07, "epoch": 0.7650066798728521, "percentage": 76.5, "elapsed_time": "1 day, 2:13:49", "remaining_time": "8:03:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8304, "total_steps": 10853, "loss": 0.1164, "learning_rate": 7.16948037140224e-07, "epoch": 0.7650988160501221, "percentage": 76.51, "elapsed_time": "1 day, 2:13:59", "remaining_time": "8:03:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8305, "total_steps": 10853, "loss": 0.1411, "learning_rate": 7.164141562447497e-07, "epoch": 0.7651909522273921, "percentage": 76.52, "elapsed_time": "1 day, 2:14:10", "remaining_time": "8:02:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8306, "total_steps": 10853, "loss": 0.1118, "learning_rate": 7.158804409554126e-07, "epoch": 0.7652830884046621, "percentage": 76.53, "elapsed_time": "1 day, 2:14:20", "remaining_time": "8:02:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8307, "total_steps": 10853, "loss": 0.1277, "learning_rate": 7.153468913217695e-07, "epoch": 0.7653752245819321, "percentage": 76.54, "elapsed_time": "1 day, 2:14:32", "remaining_time": "8:02:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8308, "total_steps": 10853, "loss": 0.1164, "learning_rate": 7.148135073933599e-07, "epoch": 0.7654673607592021, "percentage": 76.55, "elapsed_time": "1 day, 2:14:41", "remaining_time": "8:02:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8309, "total_steps": 10853, "loss": 0.1253, "learning_rate": 7.142802892197071e-07, "epoch": 0.7655594969364721, "percentage": 76.56, "elapsed_time": "1 day, 2:14:51", "remaining_time": "8:02:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8310, "total_steps": 10853, "loss": 0.1269, "learning_rate": 7.137472368503217e-07, "epoch": 0.7656516331137421, "percentage": 76.57, "elapsed_time": "1 day, 2:15:02", "remaining_time": "8:01:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8311, "total_steps": 10853, "loss": 0.1159, "learning_rate": 7.132143503346986e-07, "epoch": 0.7657437692910121, "percentage": 76.58, "elapsed_time": "1 day, 2:15:13", "remaining_time": "8:01:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8312, "total_steps": 10853, "loss": 0.1301, "learning_rate": 7.126816297223147e-07, "epoch": 0.7658359054682822, "percentage": 76.59, "elapsed_time": "1 day, 2:15:24", "remaining_time": "8:01:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8313, "total_steps": 10853, "loss": 0.1231, "learning_rate": 7.121490750626342e-07, "epoch": 0.7659280416455522, "percentage": 76.6, "elapsed_time": "1 day, 2:15:34", "remaining_time": "8:01:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8314, "total_steps": 10853, "loss": 0.1137, "learning_rate": 7.116166864051038e-07, "epoch": 0.7660201778228222, "percentage": 76.61, "elapsed_time": "1 day, 2:15:44", "remaining_time": "8:01:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8315, "total_steps": 10853, "loss": 0.1232, "learning_rate": 7.110844637991574e-07, "epoch": 0.7661123140000922, "percentage": 76.61, "elapsed_time": "1 day, 2:15:56", "remaining_time": "8:01:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8316, "total_steps": 10853, "loss": 0.1164, "learning_rate": 7.105524072942105e-07, "epoch": 0.7662044501773622, "percentage": 76.62, "elapsed_time": "1 day, 2:16:06", "remaining_time": "8:00:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8317, "total_steps": 10853, "loss": 0.1227, "learning_rate": 7.100205169396649e-07, "epoch": 0.7662965863546322, "percentage": 76.63, "elapsed_time": "1 day, 2:16:18", "remaining_time": "8:00:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8318, "total_steps": 10853, "loss": 0.1218, "learning_rate": 7.09488792784907e-07, "epoch": 0.7663887225319022, "percentage": 76.64, "elapsed_time": "1 day, 2:16:28", "remaining_time": "8:00:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8319, "total_steps": 10853, "loss": 0.1202, "learning_rate": 7.089572348793081e-07, "epoch": 0.7664808587091722, "percentage": 76.65, "elapsed_time": "1 day, 2:16:38", "remaining_time": "8:00:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8320, "total_steps": 10853, "loss": 0.1177, "learning_rate": 7.084258432722227e-07, "epoch": 0.7665729948864421, "percentage": 76.66, "elapsed_time": "1 day, 2:16:48", "remaining_time": "8:00:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8321, "total_steps": 10853, "loss": 0.1164, "learning_rate": 7.078946180129898e-07, "epoch": 0.7666651310637121, "percentage": 76.67, "elapsed_time": "1 day, 2:17:00", "remaining_time": "7:59:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8322, "total_steps": 10853, "loss": 0.1064, "learning_rate": 7.073635591509345e-07, "epoch": 0.7667572672409821, "percentage": 76.68, "elapsed_time": "1 day, 2:17:12", "remaining_time": "7:59:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8323, "total_steps": 10853, "loss": 0.1205, "learning_rate": 7.068326667353659e-07, "epoch": 0.7668494034182521, "percentage": 76.69, "elapsed_time": "1 day, 2:17:23", "remaining_time": "7:59:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8324, "total_steps": 10853, "loss": 0.1213, "learning_rate": 7.063019408155777e-07, "epoch": 0.7669415395955221, "percentage": 76.7, "elapsed_time": "1 day, 2:17:32", "remaining_time": "7:59:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8325, "total_steps": 10853, "loss": 0.1217, "learning_rate": 7.057713814408473e-07, "epoch": 0.7670336757727921, "percentage": 76.71, "elapsed_time": "1 day, 2:17:45", "remaining_time": "7:59:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8326, "total_steps": 10853, "loss": 0.1292, "learning_rate": 7.052409886604364e-07, "epoch": 0.7671258119500622, "percentage": 76.72, "elapsed_time": "1 day, 2:17:56", "remaining_time": "7:58:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8327, "total_steps": 10853, "loss": 0.1229, "learning_rate": 7.04710762523593e-07, "epoch": 0.7672179481273322, "percentage": 76.73, "elapsed_time": "1 day, 2:18:08", "remaining_time": "7:58:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8328, "total_steps": 10853, "loss": 0.1302, "learning_rate": 7.041807030795495e-07, "epoch": 0.7673100843046022, "percentage": 76.73, "elapsed_time": "1 day, 2:18:19", "remaining_time": "7:58:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8329, "total_steps": 10853, "loss": 0.1288, "learning_rate": 7.036508103775199e-07, "epoch": 0.7674022204818722, "percentage": 76.74, "elapsed_time": "1 day, 2:18:29", "remaining_time": "7:58:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8330, "total_steps": 10853, "loss": 0.1177, "learning_rate": 7.031210844667066e-07, "epoch": 0.7674943566591422, "percentage": 76.75, "elapsed_time": "1 day, 2:18:40", "remaining_time": "7:58:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8331, "total_steps": 10853, "loss": 0.1194, "learning_rate": 7.025915253962934e-07, "epoch": 0.7675864928364122, "percentage": 76.76, "elapsed_time": "1 day, 2:18:51", "remaining_time": "7:57:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8332, "total_steps": 10853, "loss": 0.123, "learning_rate": 7.020621332154512e-07, "epoch": 0.7676786290136822, "percentage": 76.77, "elapsed_time": "1 day, 2:19:02", "remaining_time": "7:57:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8333, "total_steps": 10853, "loss": 0.104, "learning_rate": 7.015329079733327e-07, "epoch": 0.7677707651909522, "percentage": 76.78, "elapsed_time": "1 day, 2:19:12", "remaining_time": "7:57:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8334, "total_steps": 10853, "loss": 0.1159, "learning_rate": 7.010038497190774e-07, "epoch": 0.7678629013682222, "percentage": 76.79, "elapsed_time": "1 day, 2:19:24", "remaining_time": "7:57:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8335, "total_steps": 10853, "loss": 0.1274, "learning_rate": 7.004749585018089e-07, "epoch": 0.7679550375454922, "percentage": 76.8, "elapsed_time": "1 day, 2:19:34", "remaining_time": "7:57:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8336, "total_steps": 10853, "loss": 0.1261, "learning_rate": 6.999462343706339e-07, "epoch": 0.7680471737227622, "percentage": 76.81, "elapsed_time": "1 day, 2:19:45", "remaining_time": "7:56:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8337, "total_steps": 10853, "loss": 0.1127, "learning_rate": 6.994176773746445e-07, "epoch": 0.7681393099000322, "percentage": 76.82, "elapsed_time": "1 day, 2:19:56", "remaining_time": "7:56:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8338, "total_steps": 10853, "loss": 0.1123, "learning_rate": 6.988892875629172e-07, "epoch": 0.7682314460773022, "percentage": 76.83, "elapsed_time": "1 day, 2:20:08", "remaining_time": "7:56:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8339, "total_steps": 10853, "loss": 0.1266, "learning_rate": 6.983610649845136e-07, "epoch": 0.7683235822545723, "percentage": 76.84, "elapsed_time": "1 day, 2:20:17", "remaining_time": "7:56:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8340, "total_steps": 10853, "loss": 0.118, "learning_rate": 6.978330096884794e-07, "epoch": 0.7684157184318423, "percentage": 76.85, "elapsed_time": "1 day, 2:20:28", "remaining_time": "7:56:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8341, "total_steps": 10853, "loss": 0.1259, "learning_rate": 6.973051217238444e-07, "epoch": 0.7685078546091123, "percentage": 76.85, "elapsed_time": "1 day, 2:20:39", "remaining_time": "7:56:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8342, "total_steps": 10853, "loss": 0.1077, "learning_rate": 6.967774011396222e-07, "epoch": 0.7685999907863823, "percentage": 76.86, "elapsed_time": "1 day, 2:20:50", "remaining_time": "7:55:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8343, "total_steps": 10853, "loss": 0.1203, "learning_rate": 6.962498479848124e-07, "epoch": 0.7686921269636523, "percentage": 76.87, "elapsed_time": "1 day, 2:21:00", "remaining_time": "7:55:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8344, "total_steps": 10853, "loss": 0.1223, "learning_rate": 6.957224623083989e-07, "epoch": 0.7687842631409223, "percentage": 76.88, "elapsed_time": "1 day, 2:21:11", "remaining_time": "7:55:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8345, "total_steps": 10853, "loss": 0.1125, "learning_rate": 6.951952441593482e-07, "epoch": 0.7688763993181923, "percentage": 76.89, "elapsed_time": "1 day, 2:21:23", "remaining_time": "7:55:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8346, "total_steps": 10853, "loss": 0.1082, "learning_rate": 6.946681935866143e-07, "epoch": 0.7689685354954623, "percentage": 76.9, "elapsed_time": "1 day, 2:21:32", "remaining_time": "7:55:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8347, "total_steps": 10853, "loss": 0.128, "learning_rate": 6.941413106391321e-07, "epoch": 0.7690606716727323, "percentage": 76.91, "elapsed_time": "1 day, 2:21:43", "remaining_time": "7:54:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8348, "total_steps": 10853, "loss": 0.1194, "learning_rate": 6.936145953658233e-07, "epoch": 0.7691528078500023, "percentage": 76.92, "elapsed_time": "1 day, 2:21:54", "remaining_time": "7:54:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8349, "total_steps": 10853, "loss": 0.1198, "learning_rate": 6.930880478155946e-07, "epoch": 0.7692449440272723, "percentage": 76.93, "elapsed_time": "1 day, 2:22:05", "remaining_time": "7:54:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8350, "total_steps": 10853, "loss": 0.1165, "learning_rate": 6.925616680373346e-07, "epoch": 0.7693370802045423, "percentage": 76.94, "elapsed_time": "1 day, 2:22:16", "remaining_time": "7:54:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8351, "total_steps": 10853, "loss": 0.1176, "learning_rate": 6.920354560799189e-07, "epoch": 0.7694292163818123, "percentage": 76.95, "elapsed_time": "1 day, 2:22:27", "remaining_time": "7:54:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8352, "total_steps": 10853, "loss": 0.1333, "learning_rate": 6.915094119922048e-07, "epoch": 0.7695213525590823, "percentage": 76.96, "elapsed_time": "1 day, 2:22:38", "remaining_time": "7:53:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8353, "total_steps": 10853, "loss": 0.1208, "learning_rate": 6.909835358230372e-07, "epoch": 0.7696134887363524, "percentage": 76.96, "elapsed_time": "1 day, 2:22:50", "remaining_time": "7:53:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8354, "total_steps": 10853, "loss": 0.1298, "learning_rate": 6.904578276212423e-07, "epoch": 0.7697056249136224, "percentage": 76.97, "elapsed_time": "1 day, 2:23:01", "remaining_time": "7:53:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8355, "total_steps": 10853, "loss": 0.1303, "learning_rate": 6.899322874356329e-07, "epoch": 0.7697977610908924, "percentage": 76.98, "elapsed_time": "1 day, 2:23:12", "remaining_time": "7:53:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8356, "total_steps": 10853, "loss": 0.1253, "learning_rate": 6.89406915315006e-07, "epoch": 0.7698898972681624, "percentage": 76.99, "elapsed_time": "1 day, 2:23:24", "remaining_time": "7:53:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8357, "total_steps": 10853, "loss": 0.1262, "learning_rate": 6.888817113081419e-07, "epoch": 0.7699820334454324, "percentage": 77.0, "elapsed_time": "1 day, 2:23:35", "remaining_time": "7:52:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8358, "total_steps": 10853, "loss": 0.1318, "learning_rate": 6.883566754638052e-07, "epoch": 0.7700741696227024, "percentage": 77.01, "elapsed_time": "1 day, 2:23:46", "remaining_time": "7:52:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8359, "total_steps": 10853, "loss": 0.1122, "learning_rate": 6.878318078307461e-07, "epoch": 0.7701663057999724, "percentage": 77.02, "elapsed_time": "1 day, 2:23:57", "remaining_time": "7:52:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8360, "total_steps": 10853, "loss": 0.1169, "learning_rate": 6.873071084576985e-07, "epoch": 0.7702584419772424, "percentage": 77.03, "elapsed_time": "1 day, 2:24:07", "remaining_time": "7:52:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8361, "total_steps": 10853, "loss": 0.1277, "learning_rate": 6.86782577393382e-07, "epoch": 0.7703505781545124, "percentage": 77.04, "elapsed_time": "1 day, 2:24:17", "remaining_time": "7:52:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8362, "total_steps": 10853, "loss": 0.1244, "learning_rate": 6.862582146864982e-07, "epoch": 0.7704427143317824, "percentage": 77.05, "elapsed_time": "1 day, 2:24:27", "remaining_time": "7:52:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8363, "total_steps": 10853, "loss": 0.1117, "learning_rate": 6.857340203857335e-07, "epoch": 0.7705348505090523, "percentage": 77.06, "elapsed_time": "1 day, 2:24:38", "remaining_time": "7:51:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8364, "total_steps": 10853, "loss": 0.1195, "learning_rate": 6.852099945397603e-07, "epoch": 0.7706269866863223, "percentage": 77.07, "elapsed_time": "1 day, 2:24:49", "remaining_time": "7:51:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8365, "total_steps": 10853, "loss": 0.1244, "learning_rate": 6.846861371972355e-07, "epoch": 0.7707191228635923, "percentage": 77.08, "elapsed_time": "1 day, 2:25:00", "remaining_time": "7:51:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8366, "total_steps": 10853, "loss": 0.1309, "learning_rate": 6.841624484067971e-07, "epoch": 0.7708112590408623, "percentage": 77.08, "elapsed_time": "1 day, 2:25:10", "remaining_time": "7:51:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8367, "total_steps": 10853, "loss": 0.1127, "learning_rate": 6.836389282170716e-07, "epoch": 0.7709033952181324, "percentage": 77.09, "elapsed_time": "1 day, 2:25:21", "remaining_time": "7:51:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8368, "total_steps": 10853, "loss": 0.1336, "learning_rate": 6.831155766766665e-07, "epoch": 0.7709955313954024, "percentage": 77.1, "elapsed_time": "1 day, 2:25:34", "remaining_time": "7:50:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8369, "total_steps": 10853, "loss": 0.108, "learning_rate": 6.825923938341761e-07, "epoch": 0.7710876675726724, "percentage": 77.11, "elapsed_time": "1 day, 2:25:44", "remaining_time": "7:50:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8370, "total_steps": 10853, "loss": 0.1247, "learning_rate": 6.820693797381769e-07, "epoch": 0.7711798037499424, "percentage": 77.12, "elapsed_time": "1 day, 2:25:54", "remaining_time": "7:50:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8371, "total_steps": 10853, "loss": 0.1251, "learning_rate": 6.815465344372316e-07, "epoch": 0.7712719399272124, "percentage": 77.13, "elapsed_time": "1 day, 2:26:05", "remaining_time": "7:50:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8372, "total_steps": 10853, "loss": 0.1124, "learning_rate": 6.81023857979887e-07, "epoch": 0.7713640761044824, "percentage": 77.14, "elapsed_time": "1 day, 2:26:16", "remaining_time": "7:50:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8373, "total_steps": 10853, "loss": 0.1187, "learning_rate": 6.805013504146729e-07, "epoch": 0.7714562122817524, "percentage": 77.15, "elapsed_time": "1 day, 2:26:27", "remaining_time": "7:49:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8374, "total_steps": 10853, "loss": 0.1231, "learning_rate": 6.799790117901034e-07, "epoch": 0.7715483484590224, "percentage": 77.16, "elapsed_time": "1 day, 2:26:37", "remaining_time": "7:49:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8375, "total_steps": 10853, "loss": 0.1228, "learning_rate": 6.794568421546785e-07, "epoch": 0.7716404846362924, "percentage": 77.17, "elapsed_time": "1 day, 2:26:48", "remaining_time": "7:49:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8376, "total_steps": 10853, "loss": 0.1279, "learning_rate": 6.78934841556882e-07, "epoch": 0.7717326208135624, "percentage": 77.18, "elapsed_time": "1 day, 2:26:59", "remaining_time": "7:49:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8377, "total_steps": 10853, "loss": 0.1173, "learning_rate": 6.784130100451819e-07, "epoch": 0.7718247569908324, "percentage": 77.19, "elapsed_time": "1 day, 2:27:10", "remaining_time": "7:49:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8378, "total_steps": 10853, "loss": 0.1227, "learning_rate": 6.778913476680302e-07, "epoch": 0.7719168931681024, "percentage": 77.2, "elapsed_time": "1 day, 2:27:22", "remaining_time": "7:48:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8379, "total_steps": 10853, "loss": 0.1274, "learning_rate": 6.773698544738619e-07, "epoch": 0.7720090293453724, "percentage": 77.2, "elapsed_time": "1 day, 2:27:32", "remaining_time": "7:48:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8380, "total_steps": 10853, "loss": 0.1158, "learning_rate": 6.768485305110989e-07, "epoch": 0.7721011655226425, "percentage": 77.21, "elapsed_time": "1 day, 2:27:42", "remaining_time": "7:48:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8381, "total_steps": 10853, "loss": 0.1176, "learning_rate": 6.763273758281458e-07, "epoch": 0.7721933016999125, "percentage": 77.22, "elapsed_time": "1 day, 2:27:54", "remaining_time": "7:48:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8382, "total_steps": 10853, "loss": 0.1245, "learning_rate": 6.758063904733933e-07, "epoch": 0.7722854378771825, "percentage": 77.23, "elapsed_time": "1 day, 2:28:06", "remaining_time": "7:48:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8383, "total_steps": 10853, "loss": 0.1195, "learning_rate": 6.752855744952136e-07, "epoch": 0.7723775740544525, "percentage": 77.24, "elapsed_time": "1 day, 2:28:17", "remaining_time": "7:47:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8384, "total_steps": 10853, "loss": 0.1189, "learning_rate": 6.747649279419638e-07, "epoch": 0.7724697102317225, "percentage": 77.25, "elapsed_time": "1 day, 2:28:27", "remaining_time": "7:47:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8385, "total_steps": 10853, "loss": 0.1061, "learning_rate": 6.742444508619869e-07, "epoch": 0.7725618464089925, "percentage": 77.26, "elapsed_time": "1 day, 2:28:38", "remaining_time": "7:47:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8386, "total_steps": 10853, "loss": 0.1258, "learning_rate": 6.737241433036101e-07, "epoch": 0.7726539825862625, "percentage": 77.27, "elapsed_time": "1 day, 2:28:50", "remaining_time": "7:47:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8387, "total_steps": 10853, "loss": 0.1226, "learning_rate": 6.732040053151423e-07, "epoch": 0.7727461187635325, "percentage": 77.28, "elapsed_time": "1 day, 2:29:01", "remaining_time": "7:47:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8388, "total_steps": 10853, "loss": 0.1173, "learning_rate": 6.7268403694488e-07, "epoch": 0.7728382549408025, "percentage": 77.29, "elapsed_time": "1 day, 2:29:10", "remaining_time": "7:47:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8389, "total_steps": 10853, "loss": 0.1146, "learning_rate": 6.721642382411006e-07, "epoch": 0.7729303911180725, "percentage": 77.3, "elapsed_time": "1 day, 2:29:21", "remaining_time": "7:46:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8390, "total_steps": 10853, "loss": 0.1306, "learning_rate": 6.716446092520696e-07, "epoch": 0.7730225272953425, "percentage": 77.31, "elapsed_time": "1 day, 2:29:32", "remaining_time": "7:46:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8391, "total_steps": 10853, "loss": 0.1175, "learning_rate": 6.711251500260322e-07, "epoch": 0.7731146634726125, "percentage": 77.32, "elapsed_time": "1 day, 2:29:43", "remaining_time": "7:46:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8392, "total_steps": 10853, "loss": 0.1264, "learning_rate": 6.706058606112217e-07, "epoch": 0.7732067996498825, "percentage": 77.32, "elapsed_time": "1 day, 2:29:54", "remaining_time": "7:46:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8393, "total_steps": 10853, "loss": 0.1133, "learning_rate": 6.700867410558537e-07, "epoch": 0.7732989358271525, "percentage": 77.33, "elapsed_time": "1 day, 2:30:05", "remaining_time": "7:46:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8394, "total_steps": 10853, "loss": 0.1211, "learning_rate": 6.695677914081303e-07, "epoch": 0.7733910720044226, "percentage": 77.34, "elapsed_time": "1 day, 2:30:16", "remaining_time": "7:45:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8395, "total_steps": 10853, "loss": 0.1177, "learning_rate": 6.690490117162333e-07, "epoch": 0.7734832081816926, "percentage": 77.35, "elapsed_time": "1 day, 2:30:26", "remaining_time": "7:45:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8396, "total_steps": 10853, "loss": 0.1175, "learning_rate": 6.68530402028332e-07, "epoch": 0.7735753443589626, "percentage": 77.36, "elapsed_time": "1 day, 2:30:39", "remaining_time": "7:45:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8397, "total_steps": 10853, "loss": 0.1119, "learning_rate": 6.680119623925804e-07, "epoch": 0.7736674805362326, "percentage": 77.37, "elapsed_time": "1 day, 2:30:51", "remaining_time": "7:45:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8398, "total_steps": 10853, "loss": 0.1232, "learning_rate": 6.67493692857116e-07, "epoch": 0.7737596167135026, "percentage": 77.38, "elapsed_time": "1 day, 2:31:01", "remaining_time": "7:45:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8399, "total_steps": 10853, "loss": 0.1178, "learning_rate": 6.669755934700586e-07, "epoch": 0.7738517528907726, "percentage": 77.39, "elapsed_time": "1 day, 2:31:12", "remaining_time": "7:44:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8400, "total_steps": 10853, "loss": 0.1211, "learning_rate": 6.664576642795153e-07, "epoch": 0.7739438890680426, "percentage": 77.4, "elapsed_time": "1 day, 2:31:24", "remaining_time": "7:44:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8401, "total_steps": 10853, "loss": 0.1158, "learning_rate": 6.659399053335747e-07, "epoch": 0.7740360252453126, "percentage": 77.41, "elapsed_time": "1 day, 2:31:35", "remaining_time": "7:44:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8402, "total_steps": 10853, "loss": 0.118, "learning_rate": 6.654223166803117e-07, "epoch": 0.7741281614225826, "percentage": 77.42, "elapsed_time": "1 day, 2:31:45", "remaining_time": "7:44:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8403, "total_steps": 10853, "loss": 0.1139, "learning_rate": 6.649048983677834e-07, "epoch": 0.7742202975998526, "percentage": 77.43, "elapsed_time": "1 day, 2:31:55", "remaining_time": "7:44:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8404, "total_steps": 10853, "loss": 0.1165, "learning_rate": 6.643876504440327e-07, "epoch": 0.7743124337771226, "percentage": 77.43, "elapsed_time": "1 day, 2:32:06", "remaining_time": "7:43:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8405, "total_steps": 10853, "loss": 0.1256, "learning_rate": 6.638705729570871e-07, "epoch": 0.7744045699543926, "percentage": 77.44, "elapsed_time": "1 day, 2:32:15", "remaining_time": "7:43:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8406, "total_steps": 10853, "loss": 0.1117, "learning_rate": 6.633536659549558e-07, "epoch": 0.7744967061316625, "percentage": 77.45, "elapsed_time": "1 day, 2:32:27", "remaining_time": "7:43:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8407, "total_steps": 10853, "loss": 0.1152, "learning_rate": 6.628369294856349e-07, "epoch": 0.7745888423089327, "percentage": 77.46, "elapsed_time": "1 day, 2:32:37", "remaining_time": "7:43:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8408, "total_steps": 10853, "loss": 0.1324, "learning_rate": 6.623203635971018e-07, "epoch": 0.7746809784862027, "percentage": 77.47, "elapsed_time": "1 day, 2:32:48", "remaining_time": "7:43:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8409, "total_steps": 10853, "loss": 0.1121, "learning_rate": 6.618039683373209e-07, "epoch": 0.7747731146634727, "percentage": 77.48, "elapsed_time": "1 day, 2:32:59", "remaining_time": "7:42:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8410, "total_steps": 10853, "loss": 0.1175, "learning_rate": 6.612877437542403e-07, "epoch": 0.7748652508407426, "percentage": 77.49, "elapsed_time": "1 day, 2:33:10", "remaining_time": "7:42:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8411, "total_steps": 10853, "loss": 0.1134, "learning_rate": 6.607716898957903e-07, "epoch": 0.7749573870180126, "percentage": 77.5, "elapsed_time": "1 day, 2:33:19", "remaining_time": "7:42:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8412, "total_steps": 10853, "loss": 0.126, "learning_rate": 6.602558068098864e-07, "epoch": 0.7750495231952826, "percentage": 77.51, "elapsed_time": "1 day, 2:33:29", "remaining_time": "7:42:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8413, "total_steps": 10853, "loss": 0.1098, "learning_rate": 6.597400945444285e-07, "epoch": 0.7751416593725526, "percentage": 77.52, "elapsed_time": "1 day, 2:33:40", "remaining_time": "7:42:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8414, "total_steps": 10853, "loss": 0.1268, "learning_rate": 6.59224553147301e-07, "epoch": 0.7752337955498226, "percentage": 77.53, "elapsed_time": "1 day, 2:33:51", "remaining_time": "7:42:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8415, "total_steps": 10853, "loss": 0.1165, "learning_rate": 6.587091826663728e-07, "epoch": 0.7753259317270926, "percentage": 77.54, "elapsed_time": "1 day, 2:34:02", "remaining_time": "7:41:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8416, "total_steps": 10853, "loss": 0.1165, "learning_rate": 6.581939831494948e-07, "epoch": 0.7754180679043626, "percentage": 77.55, "elapsed_time": "1 day, 2:34:12", "remaining_time": "7:41:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8417, "total_steps": 10853, "loss": 0.1091, "learning_rate": 6.576789546445031e-07, "epoch": 0.7755102040816326, "percentage": 77.55, "elapsed_time": "1 day, 2:34:21", "remaining_time": "7:41:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8418, "total_steps": 10853, "loss": 0.1157, "learning_rate": 6.571640971992188e-07, "epoch": 0.7756023402589026, "percentage": 77.56, "elapsed_time": "1 day, 2:34:31", "remaining_time": "7:41:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8419, "total_steps": 10853, "loss": 0.1152, "learning_rate": 6.566494108614471e-07, "epoch": 0.7756944764361726, "percentage": 77.57, "elapsed_time": "1 day, 2:34:42", "remaining_time": "7:41:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8420, "total_steps": 10853, "loss": 0.1111, "learning_rate": 6.561348956789751e-07, "epoch": 0.7757866126134426, "percentage": 77.58, "elapsed_time": "1 day, 2:34:51", "remaining_time": "7:40:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8421, "total_steps": 10853, "loss": 0.1194, "learning_rate": 6.556205516995772e-07, "epoch": 0.7758787487907127, "percentage": 77.59, "elapsed_time": "1 day, 2:35:00", "remaining_time": "7:40:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8422, "total_steps": 10853, "loss": 0.1287, "learning_rate": 6.551063789710091e-07, "epoch": 0.7759708849679827, "percentage": 77.6, "elapsed_time": "1 day, 2:35:11", "remaining_time": "7:40:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8423, "total_steps": 10853, "loss": 0.1111, "learning_rate": 6.545923775410129e-07, "epoch": 0.7760630211452527, "percentage": 77.61, "elapsed_time": "1 day, 2:35:22", "remaining_time": "7:40:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8424, "total_steps": 10853, "loss": 0.1266, "learning_rate": 6.540785474573121e-07, "epoch": 0.7761551573225227, "percentage": 77.62, "elapsed_time": "1 day, 2:35:34", "remaining_time": "7:40:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8425, "total_steps": 10853, "loss": 0.1191, "learning_rate": 6.535648887676171e-07, "epoch": 0.7762472934997927, "percentage": 77.63, "elapsed_time": "1 day, 2:35:44", "remaining_time": "7:39:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8426, "total_steps": 10853, "loss": 0.1304, "learning_rate": 6.530514015196218e-07, "epoch": 0.7763394296770627, "percentage": 77.64, "elapsed_time": "1 day, 2:35:56", "remaining_time": "7:39:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8427, "total_steps": 10853, "loss": 0.1286, "learning_rate": 6.525380857610022e-07, "epoch": 0.7764315658543327, "percentage": 77.65, "elapsed_time": "1 day, 2:36:07", "remaining_time": "7:39:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8428, "total_steps": 10853, "loss": 0.1194, "learning_rate": 6.520249415394197e-07, "epoch": 0.7765237020316027, "percentage": 77.66, "elapsed_time": "1 day, 2:36:17", "remaining_time": "7:39:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8429, "total_steps": 10853, "loss": 0.1156, "learning_rate": 6.515119689025201e-07, "epoch": 0.7766158382088727, "percentage": 77.67, "elapsed_time": "1 day, 2:36:27", "remaining_time": "7:39:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8430, "total_steps": 10853, "loss": 0.1312, "learning_rate": 6.509991678979333e-07, "epoch": 0.7767079743861427, "percentage": 77.67, "elapsed_time": "1 day, 2:36:39", "remaining_time": "7:38:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8431, "total_steps": 10853, "loss": 0.1197, "learning_rate": 6.504865385732734e-07, "epoch": 0.7768001105634127, "percentage": 77.68, "elapsed_time": "1 day, 2:36:49", "remaining_time": "7:38:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8432, "total_steps": 10853, "loss": 0.1198, "learning_rate": 6.499740809761373e-07, "epoch": 0.7768922467406827, "percentage": 77.69, "elapsed_time": "1 day, 2:36:59", "remaining_time": "7:38:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8433, "total_steps": 10853, "loss": 0.1112, "learning_rate": 6.494617951541063e-07, "epoch": 0.7769843829179527, "percentage": 77.7, "elapsed_time": "1 day, 2:37:10", "remaining_time": "7:38:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8434, "total_steps": 10853, "loss": 0.1287, "learning_rate": 6.489496811547468e-07, "epoch": 0.7770765190952227, "percentage": 77.71, "elapsed_time": "1 day, 2:37:21", "remaining_time": "7:38:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8435, "total_steps": 10853, "loss": 0.1223, "learning_rate": 6.484377390256086e-07, "epoch": 0.7771686552724928, "percentage": 77.72, "elapsed_time": "1 day, 2:37:31", "remaining_time": "7:37:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8436, "total_steps": 10853, "loss": 0.1034, "learning_rate": 6.479259688142261e-07, "epoch": 0.7772607914497628, "percentage": 77.73, "elapsed_time": "1 day, 2:37:41", "remaining_time": "7:37:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8437, "total_steps": 10853, "loss": 0.113, "learning_rate": 6.474143705681171e-07, "epoch": 0.7773529276270328, "percentage": 77.74, "elapsed_time": "1 day, 2:37:51", "remaining_time": "7:37:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8438, "total_steps": 10853, "loss": 0.1095, "learning_rate": 6.469029443347821e-07, "epoch": 0.7774450638043028, "percentage": 77.75, "elapsed_time": "1 day, 2:38:02", "remaining_time": "7:37:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8439, "total_steps": 10853, "loss": 0.1255, "learning_rate": 6.463916901617084e-07, "epoch": 0.7775371999815728, "percentage": 77.76, "elapsed_time": "1 day, 2:38:15", "remaining_time": "7:37:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8440, "total_steps": 10853, "loss": 0.1217, "learning_rate": 6.458806080963664e-07, "epoch": 0.7776293361588428, "percentage": 77.77, "elapsed_time": "1 day, 2:38:25", "remaining_time": "7:36:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8441, "total_steps": 10853, "loss": 0.119, "learning_rate": 6.453696981862087e-07, "epoch": 0.7777214723361128, "percentage": 77.78, "elapsed_time": "1 day, 2:38:35", "remaining_time": "7:36:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8442, "total_steps": 10853, "loss": 0.1176, "learning_rate": 6.448589604786748e-07, "epoch": 0.7778136085133828, "percentage": 77.78, "elapsed_time": "1 day, 2:38:45", "remaining_time": "7:36:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8443, "total_steps": 10853, "loss": 0.1338, "learning_rate": 6.443483950211854e-07, "epoch": 0.7779057446906528, "percentage": 77.79, "elapsed_time": "1 day, 2:38:57", "remaining_time": "7:36:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8444, "total_steps": 10853, "loss": 0.1161, "learning_rate": 6.438380018611481e-07, "epoch": 0.7779978808679228, "percentage": 77.8, "elapsed_time": "1 day, 2:39:08", "remaining_time": "7:36:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8445, "total_steps": 10853, "loss": 0.126, "learning_rate": 6.433277810459512e-07, "epoch": 0.7780900170451928, "percentage": 77.81, "elapsed_time": "1 day, 2:39:19", "remaining_time": "7:36:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8446, "total_steps": 10853, "loss": 0.1196, "learning_rate": 6.428177326229698e-07, "epoch": 0.7781821532224628, "percentage": 77.82, "elapsed_time": "1 day, 2:39:30", "remaining_time": "7:35:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8447, "total_steps": 10853, "loss": 0.1278, "learning_rate": 6.423078566395624e-07, "epoch": 0.7782742893997328, "percentage": 77.83, "elapsed_time": "1 day, 2:39:42", "remaining_time": "7:35:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8448, "total_steps": 10853, "loss": 0.1195, "learning_rate": 6.417981531430705e-07, "epoch": 0.7783664255770029, "percentage": 77.84, "elapsed_time": "1 day, 2:39:53", "remaining_time": "7:35:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8449, "total_steps": 10853, "loss": 0.1217, "learning_rate": 6.412886221808193e-07, "epoch": 0.7784585617542729, "percentage": 77.85, "elapsed_time": "1 day, 2:40:03", "remaining_time": "7:35:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8450, "total_steps": 10853, "loss": 0.118, "learning_rate": 6.407792638001195e-07, "epoch": 0.7785506979315429, "percentage": 77.86, "elapsed_time": "1 day, 2:40:14", "remaining_time": "7:35:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8451, "total_steps": 10853, "loss": 0.1143, "learning_rate": 6.402700780482651e-07, "epoch": 0.7786428341088129, "percentage": 77.87, "elapsed_time": "1 day, 2:40:23", "remaining_time": "7:34:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8452, "total_steps": 10853, "loss": 0.1192, "learning_rate": 6.39761064972535e-07, "epoch": 0.7787349702860829, "percentage": 77.88, "elapsed_time": "1 day, 2:40:34", "remaining_time": "7:34:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8453, "total_steps": 10853, "loss": 0.1194, "learning_rate": 6.392522246201902e-07, "epoch": 0.7788271064633528, "percentage": 77.89, "elapsed_time": "1 day, 2:40:45", "remaining_time": "7:34:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8454, "total_steps": 10853, "loss": 0.1185, "learning_rate": 6.387435570384759e-07, "epoch": 0.7789192426406228, "percentage": 77.9, "elapsed_time": "1 day, 2:40:55", "remaining_time": "7:34:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8455, "total_steps": 10853, "loss": 0.1257, "learning_rate": 6.382350622746225e-07, "epoch": 0.7790113788178928, "percentage": 77.9, "elapsed_time": "1 day, 2:41:05", "remaining_time": "7:34:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8456, "total_steps": 10853, "loss": 0.1122, "learning_rate": 6.377267403758447e-07, "epoch": 0.7791035149951628, "percentage": 77.91, "elapsed_time": "1 day, 2:41:15", "remaining_time": "7:33:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8457, "total_steps": 10853, "loss": 0.1252, "learning_rate": 6.372185913893389e-07, "epoch": 0.7791956511724328, "percentage": 77.92, "elapsed_time": "1 day, 2:41:26", "remaining_time": "7:33:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8458, "total_steps": 10853, "loss": 0.1228, "learning_rate": 6.367106153622879e-07, "epoch": 0.7792877873497028, "percentage": 77.93, "elapsed_time": "1 day, 2:41:36", "remaining_time": "7:33:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8459, "total_steps": 10853, "loss": 0.1174, "learning_rate": 6.362028123418562e-07, "epoch": 0.7793799235269728, "percentage": 77.94, "elapsed_time": "1 day, 2:41:46", "remaining_time": "7:33:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8460, "total_steps": 10853, "loss": 0.1094, "learning_rate": 6.356951823751947e-07, "epoch": 0.7794720597042428, "percentage": 77.95, "elapsed_time": "1 day, 2:41:55", "remaining_time": "7:33:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8461, "total_steps": 10853, "loss": 0.1064, "learning_rate": 6.351877255094352e-07, "epoch": 0.7795641958815128, "percentage": 77.96, "elapsed_time": "1 day, 2:42:05", "remaining_time": "7:32:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8462, "total_steps": 10853, "loss": 0.1091, "learning_rate": 6.346804417916963e-07, "epoch": 0.7796563320587829, "percentage": 77.97, "elapsed_time": "1 day, 2:42:16", "remaining_time": "7:32:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8463, "total_steps": 10853, "loss": 0.1224, "learning_rate": 6.341733312690798e-07, "epoch": 0.7797484682360529, "percentage": 77.98, "elapsed_time": "1 day, 2:42:26", "remaining_time": "7:32:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8464, "total_steps": 10853, "loss": 0.1152, "learning_rate": 6.336663939886695e-07, "epoch": 0.7798406044133229, "percentage": 77.99, "elapsed_time": "1 day, 2:42:37", "remaining_time": "7:32:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8465, "total_steps": 10853, "loss": 0.1287, "learning_rate": 6.331596299975362e-07, "epoch": 0.7799327405905929, "percentage": 78.0, "elapsed_time": "1 day, 2:42:48", "remaining_time": "7:32:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8466, "total_steps": 10853, "loss": 0.1197, "learning_rate": 6.326530393427316e-07, "epoch": 0.7800248767678629, "percentage": 78.01, "elapsed_time": "1 day, 2:42:58", "remaining_time": "7:31:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8467, "total_steps": 10853, "loss": 0.1156, "learning_rate": 6.321466220712929e-07, "epoch": 0.7801170129451329, "percentage": 78.02, "elapsed_time": "1 day, 2:43:10", "remaining_time": "7:31:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8468, "total_steps": 10853, "loss": 0.113, "learning_rate": 6.316403782302416e-07, "epoch": 0.7802091491224029, "percentage": 78.02, "elapsed_time": "1 day, 2:43:18", "remaining_time": "7:31:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8469, "total_steps": 10853, "loss": 0.1289, "learning_rate": 6.311343078665835e-07, "epoch": 0.7803012852996729, "percentage": 78.03, "elapsed_time": "1 day, 2:43:29", "remaining_time": "7:31:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8470, "total_steps": 10853, "loss": 0.1248, "learning_rate": 6.306284110273047e-07, "epoch": 0.7803934214769429, "percentage": 78.04, "elapsed_time": "1 day, 2:43:40", "remaining_time": "7:31:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8471, "total_steps": 10853, "loss": 0.1162, "learning_rate": 6.301226877593794e-07, "epoch": 0.7804855576542129, "percentage": 78.05, "elapsed_time": "1 day, 2:43:51", "remaining_time": "7:30:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8472, "total_steps": 10853, "loss": 0.1259, "learning_rate": 6.296171381097635e-07, "epoch": 0.7805776938314829, "percentage": 78.06, "elapsed_time": "1 day, 2:44:01", "remaining_time": "7:30:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8473, "total_steps": 10853, "loss": 0.1188, "learning_rate": 6.291117621253984e-07, "epoch": 0.7806698300087529, "percentage": 78.07, "elapsed_time": "1 day, 2:44:13", "remaining_time": "7:30:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8474, "total_steps": 10853, "loss": 0.1215, "learning_rate": 6.286065598532065e-07, "epoch": 0.7807619661860229, "percentage": 78.08, "elapsed_time": "1 day, 2:44:23", "remaining_time": "7:30:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8475, "total_steps": 10853, "loss": 0.127, "learning_rate": 6.281015313400981e-07, "epoch": 0.780854102363293, "percentage": 78.09, "elapsed_time": "1 day, 2:44:32", "remaining_time": "7:30:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8476, "total_steps": 10853, "loss": 0.1233, "learning_rate": 6.27596676632963e-07, "epoch": 0.780946238540563, "percentage": 78.1, "elapsed_time": "1 day, 2:44:43", "remaining_time": "7:30:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8477, "total_steps": 10853, "loss": 0.1276, "learning_rate": 6.270919957786789e-07, "epoch": 0.781038374717833, "percentage": 78.11, "elapsed_time": "1 day, 2:44:54", "remaining_time": "7:29:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8478, "total_steps": 10853, "loss": 0.1148, "learning_rate": 6.265874888241035e-07, "epoch": 0.781130510895103, "percentage": 78.12, "elapsed_time": "1 day, 2:45:06", "remaining_time": "7:29:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8479, "total_steps": 10853, "loss": 0.1167, "learning_rate": 6.260831558160818e-07, "epoch": 0.781222647072373, "percentage": 78.13, "elapsed_time": "1 day, 2:45:17", "remaining_time": "7:29:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8480, "total_steps": 10853, "loss": 0.1319, "learning_rate": 6.255789968014411e-07, "epoch": 0.781314783249643, "percentage": 78.14, "elapsed_time": "1 day, 2:45:28", "remaining_time": "7:29:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8481, "total_steps": 10853, "loss": 0.1244, "learning_rate": 6.250750118269927e-07, "epoch": 0.781406919426913, "percentage": 78.14, "elapsed_time": "1 day, 2:45:38", "remaining_time": "7:29:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8482, "total_steps": 10853, "loss": 0.1134, "learning_rate": 6.245712009395303e-07, "epoch": 0.781499055604183, "percentage": 78.15, "elapsed_time": "1 day, 2:45:49", "remaining_time": "7:28:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8483, "total_steps": 10853, "loss": 0.1192, "learning_rate": 6.240675641858335e-07, "epoch": 0.781591191781453, "percentage": 78.16, "elapsed_time": "1 day, 2:46:01", "remaining_time": "7:28:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8484, "total_steps": 10853, "loss": 0.1166, "learning_rate": 6.235641016126653e-07, "epoch": 0.781683327958723, "percentage": 78.17, "elapsed_time": "1 day, 2:46:13", "remaining_time": "7:28:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8485, "total_steps": 10853, "loss": 0.1334, "learning_rate": 6.230608132667732e-07, "epoch": 0.781775464135993, "percentage": 78.18, "elapsed_time": "1 day, 2:46:22", "remaining_time": "7:28:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8486, "total_steps": 10853, "loss": 0.1149, "learning_rate": 6.225576991948865e-07, "epoch": 0.781867600313263, "percentage": 78.19, "elapsed_time": "1 day, 2:46:33", "remaining_time": "7:28:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8487, "total_steps": 10853, "loss": 0.1187, "learning_rate": 6.220547594437188e-07, "epoch": 0.781959736490533, "percentage": 78.2, "elapsed_time": "1 day, 2:46:43", "remaining_time": "7:27:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8488, "total_steps": 10853, "loss": 0.1317, "learning_rate": 6.215519940599687e-07, "epoch": 0.782051872667803, "percentage": 78.21, "elapsed_time": "1 day, 2:46:55", "remaining_time": "7:27:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8489, "total_steps": 10853, "loss": 0.1257, "learning_rate": 6.210494030903188e-07, "epoch": 0.7821440088450731, "percentage": 78.22, "elapsed_time": "1 day, 2:47:05", "remaining_time": "7:27:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8490, "total_steps": 10853, "loss": 0.1198, "learning_rate": 6.205469865814334e-07, "epoch": 0.7822361450223431, "percentage": 78.23, "elapsed_time": "1 day, 2:47:14", "remaining_time": "7:27:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8491, "total_steps": 10853, "loss": 0.1239, "learning_rate": 6.200447445799631e-07, "epoch": 0.7823282811996131, "percentage": 78.24, "elapsed_time": "1 day, 2:47:24", "remaining_time": "7:27:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8492, "total_steps": 10853, "loss": 0.1197, "learning_rate": 6.195426771325402e-07, "epoch": 0.7824204173768831, "percentage": 78.25, "elapsed_time": "1 day, 2:47:36", "remaining_time": "7:26:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8493, "total_steps": 10853, "loss": 0.109, "learning_rate": 6.190407842857818e-07, "epoch": 0.7825125535541531, "percentage": 78.25, "elapsed_time": "1 day, 2:47:48", "remaining_time": "7:26:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8494, "total_steps": 10853, "loss": 0.1144, "learning_rate": 6.1853906608629e-07, "epoch": 0.782604689731423, "percentage": 78.26, "elapsed_time": "1 day, 2:47:59", "remaining_time": "7:26:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8495, "total_steps": 10853, "loss": 0.1174, "learning_rate": 6.180375225806475e-07, "epoch": 0.782696825908693, "percentage": 78.27, "elapsed_time": "1 day, 2:48:10", "remaining_time": "7:26:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8496, "total_steps": 10853, "loss": 0.1078, "learning_rate": 6.175361538154243e-07, "epoch": 0.782788962085963, "percentage": 78.28, "elapsed_time": "1 day, 2:48:21", "remaining_time": "7:26:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8497, "total_steps": 10853, "loss": 0.1135, "learning_rate": 6.170349598371711e-07, "epoch": 0.782881098263233, "percentage": 78.29, "elapsed_time": "1 day, 2:48:33", "remaining_time": "7:26:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8498, "total_steps": 10853, "loss": 0.1284, "learning_rate": 6.165339406924253e-07, "epoch": 0.782973234440503, "percentage": 78.3, "elapsed_time": "1 day, 2:48:44", "remaining_time": "7:25:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8499, "total_steps": 10853, "loss": 0.1156, "learning_rate": 6.16033096427705e-07, "epoch": 0.783065370617773, "percentage": 78.31, "elapsed_time": "1 day, 2:48:54", "remaining_time": "7:25:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8500, "total_steps": 10853, "loss": 0.1259, "learning_rate": 6.155324270895144e-07, "epoch": 0.783157506795043, "percentage": 78.32, "elapsed_time": "1 day, 2:49:05", "remaining_time": "7:25:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8500, "total_steps": 10853, "eval_loss": 0.12055304646492004, "epoch": 0.783157506795043, "percentage": 78.32, "elapsed_time": "1 day, 2:54:04", "remaining_time": "7:26:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8501, "total_steps": 10853, "loss": 0.1266, "learning_rate": 6.150319327243417e-07, "epoch": 0.783249642972313, "percentage": 78.33, "elapsed_time": "1 day, 2:54:15", "remaining_time": "7:26:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8502, "total_steps": 10853, "loss": 0.1236, "learning_rate": 6.145316133786569e-07, "epoch": 0.783341779149583, "percentage": 78.34, "elapsed_time": "1 day, 2:54:27", "remaining_time": "7:26:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8503, "total_steps": 10853, "loss": 0.1201, "learning_rate": 6.140314690989138e-07, "epoch": 0.7834339153268531, "percentage": 78.35, "elapsed_time": "1 day, 2:54:37", "remaining_time": "7:26:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8504, "total_steps": 10853, "loss": 0.1188, "learning_rate": 6.135314999315517e-07, "epoch": 0.7835260515041231, "percentage": 78.36, "elapsed_time": "1 day, 2:54:47", "remaining_time": "7:26:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8505, "total_steps": 10853, "loss": 0.1112, "learning_rate": 6.130317059229932e-07, "epoch": 0.7836181876813931, "percentage": 78.37, "elapsed_time": "1 day, 2:54:56", "remaining_time": "7:25:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8506, "total_steps": 10853, "loss": 0.1215, "learning_rate": 6.125320871196445e-07, "epoch": 0.7837103238586631, "percentage": 78.37, "elapsed_time": "1 day, 2:55:08", "remaining_time": "7:25:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8507, "total_steps": 10853, "loss": 0.1204, "learning_rate": 6.120326435678945e-07, "epoch": 0.7838024600359331, "percentage": 78.38, "elapsed_time": "1 day, 2:55:19", "remaining_time": "7:25:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8508, "total_steps": 10853, "loss": 0.1267, "learning_rate": 6.115333753141159e-07, "epoch": 0.7838945962132031, "percentage": 78.39, "elapsed_time": "1 day, 2:55:31", "remaining_time": "7:25:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8509, "total_steps": 10853, "loss": 0.1191, "learning_rate": 6.110342824046667e-07, "epoch": 0.7839867323904731, "percentage": 78.4, "elapsed_time": "1 day, 2:55:41", "remaining_time": "7:25:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8510, "total_steps": 10853, "loss": 0.134, "learning_rate": 6.105353648858887e-07, "epoch": 0.7840788685677431, "percentage": 78.41, "elapsed_time": "1 day, 2:55:52", "remaining_time": "7:24:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8511, "total_steps": 10853, "loss": 0.1279, "learning_rate": 6.100366228041043e-07, "epoch": 0.7841710047450131, "percentage": 78.42, "elapsed_time": "1 day, 2:56:02", "remaining_time": "7:24:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8512, "total_steps": 10853, "loss": 0.128, "learning_rate": 6.095380562056238e-07, "epoch": 0.7842631409222831, "percentage": 78.43, "elapsed_time": "1 day, 2:56:13", "remaining_time": "7:24:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8513, "total_steps": 10853, "loss": 0.1217, "learning_rate": 6.090396651367375e-07, "epoch": 0.7843552770995531, "percentage": 78.44, "elapsed_time": "1 day, 2:56:24", "remaining_time": "7:24:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8514, "total_steps": 10853, "loss": 0.1314, "learning_rate": 6.085414496437226e-07, "epoch": 0.7844474132768231, "percentage": 78.45, "elapsed_time": "1 day, 2:56:35", "remaining_time": "7:24:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8515, "total_steps": 10853, "loss": 0.1304, "learning_rate": 6.080434097728368e-07, "epoch": 0.7845395494540931, "percentage": 78.46, "elapsed_time": "1 day, 2:56:47", "remaining_time": "7:23:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8516, "total_steps": 10853, "loss": 0.1086, "learning_rate": 6.075455455703242e-07, "epoch": 0.7846316856313632, "percentage": 78.47, "elapsed_time": "1 day, 2:56:56", "remaining_time": "7:23:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8517, "total_steps": 10853, "loss": 0.1289, "learning_rate": 6.070478570824118e-07, "epoch": 0.7847238218086332, "percentage": 78.48, "elapsed_time": "1 day, 2:57:07", "remaining_time": "7:23:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8518, "total_steps": 10853, "loss": 0.1077, "learning_rate": 6.065503443553097e-07, "epoch": 0.7848159579859032, "percentage": 78.49, "elapsed_time": "1 day, 2:57:18", "remaining_time": "7:23:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8519, "total_steps": 10853, "loss": 0.1263, "learning_rate": 6.060530074352114e-07, "epoch": 0.7849080941631732, "percentage": 78.49, "elapsed_time": "1 day, 2:57:28", "remaining_time": "7:23:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8520, "total_steps": 10853, "loss": 0.1178, "learning_rate": 6.055558463682948e-07, "epoch": 0.7850002303404432, "percentage": 78.5, "elapsed_time": "1 day, 2:57:40", "remaining_time": "7:22:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8521, "total_steps": 10853, "loss": 0.1191, "learning_rate": 6.050588612007221e-07, "epoch": 0.7850923665177132, "percentage": 78.51, "elapsed_time": "1 day, 2:57:50", "remaining_time": "7:22:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8522, "total_steps": 10853, "loss": 0.1155, "learning_rate": 6.045620519786386e-07, "epoch": 0.7851845026949832, "percentage": 78.52, "elapsed_time": "1 day, 2:57:59", "remaining_time": "7:22:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8523, "total_steps": 10853, "loss": 0.1172, "learning_rate": 6.040654187481726e-07, "epoch": 0.7852766388722532, "percentage": 78.53, "elapsed_time": "1 day, 2:58:09", "remaining_time": "7:22:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8524, "total_steps": 10853, "loss": 0.1212, "learning_rate": 6.035689615554358e-07, "epoch": 0.7853687750495232, "percentage": 78.54, "elapsed_time": "1 day, 2:58:18", "remaining_time": "7:22:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8525, "total_steps": 10853, "loss": 0.1116, "learning_rate": 6.030726804465251e-07, "epoch": 0.7854609112267932, "percentage": 78.55, "elapsed_time": "1 day, 2:58:29", "remaining_time": "7:21:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8526, "total_steps": 10853, "loss": 0.12, "learning_rate": 6.0257657546752e-07, "epoch": 0.7855530474040632, "percentage": 78.56, "elapsed_time": "1 day, 2:58:40", "remaining_time": "7:21:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8527, "total_steps": 10853, "loss": 0.1243, "learning_rate": 6.020806466644849e-07, "epoch": 0.7856451835813332, "percentage": 78.57, "elapsed_time": "1 day, 2:58:52", "remaining_time": "7:21:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8528, "total_steps": 10853, "loss": 0.1187, "learning_rate": 6.015848940834662e-07, "epoch": 0.7857373197586032, "percentage": 78.58, "elapsed_time": "1 day, 2:59:03", "remaining_time": "7:21:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8529, "total_steps": 10853, "loss": 0.1183, "learning_rate": 6.010893177704935e-07, "epoch": 0.7858294559358732, "percentage": 78.59, "elapsed_time": "1 day, 2:59:14", "remaining_time": "7:21:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8530, "total_steps": 10853, "loss": 0.128, "learning_rate": 6.00593917771582e-07, "epoch": 0.7859215921131433, "percentage": 78.6, "elapsed_time": "1 day, 2:59:24", "remaining_time": "7:21:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8531, "total_steps": 10853, "loss": 0.114, "learning_rate": 6.000986941327303e-07, "epoch": 0.7860137282904133, "percentage": 78.6, "elapsed_time": "1 day, 2:59:36", "remaining_time": "7:20:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8532, "total_steps": 10853, "loss": 0.1209, "learning_rate": 5.996036468999187e-07, "epoch": 0.7861058644676833, "percentage": 78.61, "elapsed_time": "1 day, 2:59:47", "remaining_time": "7:20:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8533, "total_steps": 10853, "loss": 0.1266, "learning_rate": 5.991087761191136e-07, "epoch": 0.7861980006449533, "percentage": 78.62, "elapsed_time": "1 day, 2:59:59", "remaining_time": "7:20:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8534, "total_steps": 10853, "loss": 0.1131, "learning_rate": 5.986140818362626e-07, "epoch": 0.7862901368222233, "percentage": 78.63, "elapsed_time": "1 day, 3:00:10", "remaining_time": "7:20:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8535, "total_steps": 10853, "loss": 0.1282, "learning_rate": 5.981195640972995e-07, "epoch": 0.7863822729994933, "percentage": 78.64, "elapsed_time": "1 day, 3:00:21", "remaining_time": "7:20:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8536, "total_steps": 10853, "loss": 0.124, "learning_rate": 5.976252229481385e-07, "epoch": 0.7864744091767633, "percentage": 78.65, "elapsed_time": "1 day, 3:00:32", "remaining_time": "7:19:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8537, "total_steps": 10853, "loss": 0.1148, "learning_rate": 5.971310584346807e-07, "epoch": 0.7865665453540333, "percentage": 78.66, "elapsed_time": "1 day, 3:00:42", "remaining_time": "7:19:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8538, "total_steps": 10853, "loss": 0.1145, "learning_rate": 5.966370706028094e-07, "epoch": 0.7866586815313032, "percentage": 78.67, "elapsed_time": "1 day, 3:00:53", "remaining_time": "7:19:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8539, "total_steps": 10853, "loss": 0.1266, "learning_rate": 5.96143259498391e-07, "epoch": 0.7867508177085732, "percentage": 78.68, "elapsed_time": "1 day, 3:01:04", "remaining_time": "7:19:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8540, "total_steps": 10853, "loss": 0.128, "learning_rate": 5.956496251672752e-07, "epoch": 0.7868429538858432, "percentage": 78.69, "elapsed_time": "1 day, 3:01:15", "remaining_time": "7:19:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8541, "total_steps": 10853, "loss": 0.1215, "learning_rate": 5.951561676552966e-07, "epoch": 0.7869350900631132, "percentage": 78.7, "elapsed_time": "1 day, 3:01:25", "remaining_time": "7:18:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8542, "total_steps": 10853, "loss": 0.123, "learning_rate": 5.946628870082729e-07, "epoch": 0.7870272262403832, "percentage": 78.71, "elapsed_time": "1 day, 3:01:35", "remaining_time": "7:18:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8543, "total_steps": 10853, "loss": 0.1325, "learning_rate": 5.941697832720058e-07, "epoch": 0.7871193624176533, "percentage": 78.72, "elapsed_time": "1 day, 3:01:47", "remaining_time": "7:18:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8544, "total_steps": 10853, "loss": 0.1203, "learning_rate": 5.936768564922796e-07, "epoch": 0.7872114985949233, "percentage": 78.72, "elapsed_time": "1 day, 3:01:57", "remaining_time": "7:18:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8545, "total_steps": 10853, "loss": 0.1176, "learning_rate": 5.931841067148616e-07, "epoch": 0.7873036347721933, "percentage": 78.73, "elapsed_time": "1 day, 3:02:07", "remaining_time": "7:18:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8546, "total_steps": 10853, "loss": 0.1213, "learning_rate": 5.926915339855044e-07, "epoch": 0.7873957709494633, "percentage": 78.74, "elapsed_time": "1 day, 3:02:19", "remaining_time": "7:17:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8547, "total_steps": 10853, "loss": 0.1156, "learning_rate": 5.921991383499445e-07, "epoch": 0.7874879071267333, "percentage": 78.75, "elapsed_time": "1 day, 3:02:28", "remaining_time": "7:17:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8548, "total_steps": 10853, "loss": 0.1103, "learning_rate": 5.917069198538991e-07, "epoch": 0.7875800433040033, "percentage": 78.76, "elapsed_time": "1 day, 3:02:38", "remaining_time": "7:17:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8549, "total_steps": 10853, "loss": 0.1023, "learning_rate": 5.912148785430713e-07, "epoch": 0.7876721794812733, "percentage": 78.77, "elapsed_time": "1 day, 3:02:49", "remaining_time": "7:17:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8550, "total_steps": 10853, "loss": 0.1245, "learning_rate": 5.907230144631485e-07, "epoch": 0.7877643156585433, "percentage": 78.78, "elapsed_time": "1 day, 3:02:59", "remaining_time": "7:17:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8551, "total_steps": 10853, "loss": 0.1112, "learning_rate": 5.902313276597984e-07, "epoch": 0.7878564518358133, "percentage": 78.79, "elapsed_time": "1 day, 3:03:11", "remaining_time": "7:16:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8552, "total_steps": 10853, "loss": 0.1145, "learning_rate": 5.89739818178676e-07, "epoch": 0.7879485880130833, "percentage": 78.8, "elapsed_time": "1 day, 3:03:21", "remaining_time": "7:16:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8553, "total_steps": 10853, "loss": 0.1374, "learning_rate": 5.892484860654163e-07, "epoch": 0.7880407241903533, "percentage": 78.81, "elapsed_time": "1 day, 3:03:32", "remaining_time": "7:16:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8554, "total_steps": 10853, "loss": 0.1309, "learning_rate": 5.8875733136564e-07, "epoch": 0.7881328603676233, "percentage": 78.82, "elapsed_time": "1 day, 3:03:43", "remaining_time": "7:16:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8555, "total_steps": 10853, "loss": 0.128, "learning_rate": 5.882663541249523e-07, "epoch": 0.7882249965448933, "percentage": 78.83, "elapsed_time": "1 day, 3:03:55", "remaining_time": "7:16:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8556, "total_steps": 10853, "loss": 0.1202, "learning_rate": 5.877755543889391e-07, "epoch": 0.7883171327221633, "percentage": 78.84, "elapsed_time": "1 day, 3:04:07", "remaining_time": "7:16:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8557, "total_steps": 10853, "loss": 0.1213, "learning_rate": 5.872849322031706e-07, "epoch": 0.7884092688994334, "percentage": 78.84, "elapsed_time": "1 day, 3:04:18", "remaining_time": "7:15:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8558, "total_steps": 10853, "loss": 0.1227, "learning_rate": 5.867944876132022e-07, "epoch": 0.7885014050767034, "percentage": 78.85, "elapsed_time": "1 day, 3:04:27", "remaining_time": "7:15:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8559, "total_steps": 10853, "loss": 0.1034, "learning_rate": 5.863042206645716e-07, "epoch": 0.7885935412539734, "percentage": 78.86, "elapsed_time": "1 day, 3:04:38", "remaining_time": "7:15:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8560, "total_steps": 10853, "loss": 0.1258, "learning_rate": 5.858141314028007e-07, "epoch": 0.7886856774312434, "percentage": 78.87, "elapsed_time": "1 day, 3:04:49", "remaining_time": "7:15:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8561, "total_steps": 10853, "loss": 0.1123, "learning_rate": 5.853242198733938e-07, "epoch": 0.7887778136085134, "percentage": 78.88, "elapsed_time": "1 day, 3:05:00", "remaining_time": "7:15:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8562, "total_steps": 10853, "loss": 0.1252, "learning_rate": 5.848344861218383e-07, "epoch": 0.7888699497857834, "percentage": 78.89, "elapsed_time": "1 day, 3:05:12", "remaining_time": "7:14:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8563, "total_steps": 10853, "loss": 0.1263, "learning_rate": 5.843449301936068e-07, "epoch": 0.7889620859630534, "percentage": 78.9, "elapsed_time": "1 day, 3:05:23", "remaining_time": "7:14:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8564, "total_steps": 10853, "loss": 0.1278, "learning_rate": 5.838555521341558e-07, "epoch": 0.7890542221403234, "percentage": 78.91, "elapsed_time": "1 day, 3:05:34", "remaining_time": "7:14:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8565, "total_steps": 10853, "loss": 0.1244, "learning_rate": 5.833663519889218e-07, "epoch": 0.7891463583175934, "percentage": 78.92, "elapsed_time": "1 day, 3:05:44", "remaining_time": "7:14:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8566, "total_steps": 10853, "loss": 0.1109, "learning_rate": 5.828773298033294e-07, "epoch": 0.7892384944948634, "percentage": 78.93, "elapsed_time": "1 day, 3:05:56", "remaining_time": "7:14:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8567, "total_steps": 10853, "loss": 0.1232, "learning_rate": 5.823884856227824e-07, "epoch": 0.7893306306721334, "percentage": 78.94, "elapsed_time": "1 day, 3:06:07", "remaining_time": "7:13:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8568, "total_steps": 10853, "loss": 0.13, "learning_rate": 5.818998194926714e-07, "epoch": 0.7894227668494034, "percentage": 78.95, "elapsed_time": "1 day, 3:06:19", "remaining_time": "7:13:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8569, "total_steps": 10853, "loss": 0.1206, "learning_rate": 5.81411331458368e-07, "epoch": 0.7895149030266734, "percentage": 78.96, "elapsed_time": "1 day, 3:06:30", "remaining_time": "7:13:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8570, "total_steps": 10853, "loss": 0.1077, "learning_rate": 5.809230215652292e-07, "epoch": 0.7896070392039435, "percentage": 78.96, "elapsed_time": "1 day, 3:06:40", "remaining_time": "7:13:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8571, "total_steps": 10853, "loss": 0.1171, "learning_rate": 5.804348898585949e-07, "epoch": 0.7896991753812135, "percentage": 78.97, "elapsed_time": "1 day, 3:06:51", "remaining_time": "7:13:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8572, "total_steps": 10853, "loss": 0.1248, "learning_rate": 5.799469363837876e-07, "epoch": 0.7897913115584835, "percentage": 78.98, "elapsed_time": "1 day, 3:07:04", "remaining_time": "7:12:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8573, "total_steps": 10853, "loss": 0.1208, "learning_rate": 5.794591611861134e-07, "epoch": 0.7898834477357535, "percentage": 78.99, "elapsed_time": "1 day, 3:07:15", "remaining_time": "7:12:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8574, "total_steps": 10853, "loss": 0.1139, "learning_rate": 5.789715643108623e-07, "epoch": 0.7899755839130235, "percentage": 79.0, "elapsed_time": "1 day, 3:07:25", "remaining_time": "7:12:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8575, "total_steps": 10853, "loss": 0.1215, "learning_rate": 5.784841458033086e-07, "epoch": 0.7900677200902935, "percentage": 79.01, "elapsed_time": "1 day, 3:07:38", "remaining_time": "7:12:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8576, "total_steps": 10853, "loss": 0.1176, "learning_rate": 5.779969057087095e-07, "epoch": 0.7901598562675635, "percentage": 79.02, "elapsed_time": "1 day, 3:07:49", "remaining_time": "7:12:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8577, "total_steps": 10853, "loss": 0.1222, "learning_rate": 5.775098440723042e-07, "epoch": 0.7902519924448335, "percentage": 79.03, "elapsed_time": "1 day, 3:08:00", "remaining_time": "7:12:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8578, "total_steps": 10853, "loss": 0.1129, "learning_rate": 5.770229609393166e-07, "epoch": 0.7903441286221035, "percentage": 79.04, "elapsed_time": "1 day, 3:08:11", "remaining_time": "7:11:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8579, "total_steps": 10853, "loss": 0.1278, "learning_rate": 5.765362563549537e-07, "epoch": 0.7904362647993735, "percentage": 79.05, "elapsed_time": "1 day, 3:08:21", "remaining_time": "7:11:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8580, "total_steps": 10853, "loss": 0.1103, "learning_rate": 5.760497303644063e-07, "epoch": 0.7905284009766435, "percentage": 79.06, "elapsed_time": "1 day, 3:08:32", "remaining_time": "7:11:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8581, "total_steps": 10853, "loss": 0.1257, "learning_rate": 5.755633830128493e-07, "epoch": 0.7906205371539134, "percentage": 79.07, "elapsed_time": "1 day, 3:08:43", "remaining_time": "7:11:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8582, "total_steps": 10853, "loss": 0.1261, "learning_rate": 5.750772143454395e-07, "epoch": 0.7907126733311834, "percentage": 79.07, "elapsed_time": "1 day, 3:08:53", "remaining_time": "7:11:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8583, "total_steps": 10853, "loss": 0.1067, "learning_rate": 5.745912244073166e-07, "epoch": 0.7908048095084534, "percentage": 79.08, "elapsed_time": "1 day, 3:09:04", "remaining_time": "7:10:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8584, "total_steps": 10853, "loss": 0.1311, "learning_rate": 5.741054132436058e-07, "epoch": 0.7908969456857236, "percentage": 79.09, "elapsed_time": "1 day, 3:09:15", "remaining_time": "7:10:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8585, "total_steps": 10853, "loss": 0.1168, "learning_rate": 5.736197808994151e-07, "epoch": 0.7909890818629935, "percentage": 79.1, "elapsed_time": "1 day, 3:09:26", "remaining_time": "7:10:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8586, "total_steps": 10853, "loss": 0.1181, "learning_rate": 5.731343274198348e-07, "epoch": 0.7910812180402635, "percentage": 79.11, "elapsed_time": "1 day, 3:09:37", "remaining_time": "7:10:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8587, "total_steps": 10853, "loss": 0.1241, "learning_rate": 5.726490528499398e-07, "epoch": 0.7911733542175335, "percentage": 79.12, "elapsed_time": "1 day, 3:09:49", "remaining_time": "7:10:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8588, "total_steps": 10853, "loss": 0.1298, "learning_rate": 5.721639572347873e-07, "epoch": 0.7912654903948035, "percentage": 79.13, "elapsed_time": "1 day, 3:10:00", "remaining_time": "7:09:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8589, "total_steps": 10853, "loss": 0.1155, "learning_rate": 5.716790406194195e-07, "epoch": 0.7913576265720735, "percentage": 79.14, "elapsed_time": "1 day, 3:10:11", "remaining_time": "7:09:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8590, "total_steps": 10853, "loss": 0.1208, "learning_rate": 5.711943030488595e-07, "epoch": 0.7914497627493435, "percentage": 79.15, "elapsed_time": "1 day, 3:10:22", "remaining_time": "7:09:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8591, "total_steps": 10853, "loss": 0.1156, "learning_rate": 5.707097445681162e-07, "epoch": 0.7915418989266135, "percentage": 79.16, "elapsed_time": "1 day, 3:10:34", "remaining_time": "7:09:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8592, "total_steps": 10853, "loss": 0.1209, "learning_rate": 5.702253652221815e-07, "epoch": 0.7916340351038835, "percentage": 79.17, "elapsed_time": "1 day, 3:10:43", "remaining_time": "7:09:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8593, "total_steps": 10853, "loss": 0.1093, "learning_rate": 5.697411650560292e-07, "epoch": 0.7917261712811535, "percentage": 79.18, "elapsed_time": "1 day, 3:10:54", "remaining_time": "7:08:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8594, "total_steps": 10853, "loss": 0.1137, "learning_rate": 5.692571441146167e-07, "epoch": 0.7918183074584235, "percentage": 79.19, "elapsed_time": "1 day, 3:11:05", "remaining_time": "7:08:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8595, "total_steps": 10853, "loss": 0.1251, "learning_rate": 5.68773302442886e-07, "epoch": 0.7919104436356935, "percentage": 79.19, "elapsed_time": "1 day, 3:11:16", "remaining_time": "7:08:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8596, "total_steps": 10853, "loss": 0.1328, "learning_rate": 5.682896400857623e-07, "epoch": 0.7920025798129635, "percentage": 79.2, "elapsed_time": "1 day, 3:11:28", "remaining_time": "7:08:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8597, "total_steps": 10853, "loss": 0.1175, "learning_rate": 5.678061570881541e-07, "epoch": 0.7920947159902335, "percentage": 79.21, "elapsed_time": "1 day, 3:11:38", "remaining_time": "7:08:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8598, "total_steps": 10853, "loss": 0.1126, "learning_rate": 5.673228534949521e-07, "epoch": 0.7921868521675036, "percentage": 79.22, "elapsed_time": "1 day, 3:11:48", "remaining_time": "7:07:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8599, "total_steps": 10853, "loss": 0.1095, "learning_rate": 5.668397293510303e-07, "epoch": 0.7922789883447736, "percentage": 79.23, "elapsed_time": "1 day, 3:11:59", "remaining_time": "7:07:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8600, "total_steps": 10853, "loss": 0.1139, "learning_rate": 5.66356784701248e-07, "epoch": 0.7923711245220436, "percentage": 79.24, "elapsed_time": "1 day, 3:12:10", "remaining_time": "7:07:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8601, "total_steps": 10853, "loss": 0.1224, "learning_rate": 5.658740195904466e-07, "epoch": 0.7924632606993136, "percentage": 79.25, "elapsed_time": "1 day, 3:12:21", "remaining_time": "7:07:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8602, "total_steps": 10853, "loss": 0.1183, "learning_rate": 5.653914340634504e-07, "epoch": 0.7925553968765836, "percentage": 79.26, "elapsed_time": "1 day, 3:12:31", "remaining_time": "7:07:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8603, "total_steps": 10853, "loss": 0.1234, "learning_rate": 5.649090281650682e-07, "epoch": 0.7926475330538536, "percentage": 79.27, "elapsed_time": "1 day, 3:12:40", "remaining_time": "7:07:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8604, "total_steps": 10853, "loss": 0.1118, "learning_rate": 5.644268019400903e-07, "epoch": 0.7927396692311236, "percentage": 79.28, "elapsed_time": "1 day, 3:12:52", "remaining_time": "7:06:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8605, "total_steps": 10853, "loss": 0.1296, "learning_rate": 5.639447554332928e-07, "epoch": 0.7928318054083936, "percentage": 79.29, "elapsed_time": "1 day, 3:13:02", "remaining_time": "7:06:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8606, "total_steps": 10853, "loss": 0.1084, "learning_rate": 5.634628886894324e-07, "epoch": 0.7929239415856636, "percentage": 79.3, "elapsed_time": "1 day, 3:13:13", "remaining_time": "7:06:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8607, "total_steps": 10853, "loss": 0.1208, "learning_rate": 5.629812017532515e-07, "epoch": 0.7930160777629336, "percentage": 79.31, "elapsed_time": "1 day, 3:13:24", "remaining_time": "7:06:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8608, "total_steps": 10853, "loss": 0.1269, "learning_rate": 5.62499694669475e-07, "epoch": 0.7931082139402036, "percentage": 79.31, "elapsed_time": "1 day, 3:13:35", "remaining_time": "7:06:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8609, "total_steps": 10853, "loss": 0.1304, "learning_rate": 5.620183674828094e-07, "epoch": 0.7932003501174736, "percentage": 79.32, "elapsed_time": "1 day, 3:13:46", "remaining_time": "7:05:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8610, "total_steps": 10853, "loss": 0.1208, "learning_rate": 5.615372202379482e-07, "epoch": 0.7932924862947436, "percentage": 79.33, "elapsed_time": "1 day, 3:13:56", "remaining_time": "7:05:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8611, "total_steps": 10853, "loss": 0.1101, "learning_rate": 5.610562529795635e-07, "epoch": 0.7933846224720137, "percentage": 79.34, "elapsed_time": "1 day, 3:14:07", "remaining_time": "7:05:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8612, "total_steps": 10853, "loss": 0.1253, "learning_rate": 5.605754657523147e-07, "epoch": 0.7934767586492837, "percentage": 79.35, "elapsed_time": "1 day, 3:14:16", "remaining_time": "7:05:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8613, "total_steps": 10853, "loss": 0.1208, "learning_rate": 5.600948586008432e-07, "epoch": 0.7935688948265537, "percentage": 79.36, "elapsed_time": "1 day, 3:14:27", "remaining_time": "7:05:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8614, "total_steps": 10853, "loss": 0.122, "learning_rate": 5.59614431569773e-07, "epoch": 0.7936610310038237, "percentage": 79.37, "elapsed_time": "1 day, 3:14:39", "remaining_time": "7:04:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8615, "total_steps": 10853, "loss": 0.1276, "learning_rate": 5.591341847037107e-07, "epoch": 0.7937531671810937, "percentage": 79.38, "elapsed_time": "1 day, 3:14:49", "remaining_time": "7:04:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8616, "total_steps": 10853, "loss": 0.1233, "learning_rate": 5.586541180472485e-07, "epoch": 0.7938453033583637, "percentage": 79.39, "elapsed_time": "1 day, 3:14:58", "remaining_time": "7:04:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8617, "total_steps": 10853, "loss": 0.1024, "learning_rate": 5.581742316449601e-07, "epoch": 0.7939374395356337, "percentage": 79.4, "elapsed_time": "1 day, 3:15:09", "remaining_time": "7:04:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8618, "total_steps": 10853, "loss": 0.128, "learning_rate": 5.57694525541404e-07, "epoch": 0.7940295757129037, "percentage": 79.41, "elapsed_time": "1 day, 3:15:21", "remaining_time": "7:04:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8619, "total_steps": 10853, "loss": 0.1172, "learning_rate": 5.572149997811205e-07, "epoch": 0.7941217118901737, "percentage": 79.42, "elapsed_time": "1 day, 3:15:32", "remaining_time": "7:03:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8620, "total_steps": 10853, "loss": 0.1236, "learning_rate": 5.567356544086325e-07, "epoch": 0.7942138480674437, "percentage": 79.43, "elapsed_time": "1 day, 3:15:44", "remaining_time": "7:03:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8621, "total_steps": 10853, "loss": 0.1204, "learning_rate": 5.56256489468448e-07, "epoch": 0.7943059842447137, "percentage": 79.43, "elapsed_time": "1 day, 3:15:55", "remaining_time": "7:03:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8622, "total_steps": 10853, "loss": 0.1267, "learning_rate": 5.557775050050584e-07, "epoch": 0.7943981204219837, "percentage": 79.44, "elapsed_time": "1 day, 3:16:07", "remaining_time": "7:03:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8623, "total_steps": 10853, "loss": 0.1062, "learning_rate": 5.552987010629363e-07, "epoch": 0.7944902565992537, "percentage": 79.45, "elapsed_time": "1 day, 3:16:17", "remaining_time": "7:03:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8624, "total_steps": 10853, "loss": 0.1191, "learning_rate": 5.54820077686539e-07, "epoch": 0.7945823927765236, "percentage": 79.46, "elapsed_time": "1 day, 3:16:28", "remaining_time": "7:02:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8625, "total_steps": 10853, "loss": 0.121, "learning_rate": 5.543416349203071e-07, "epoch": 0.7946745289537938, "percentage": 79.47, "elapsed_time": "1 day, 3:16:39", "remaining_time": "7:02:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8626, "total_steps": 10853, "loss": 0.1174, "learning_rate": 5.538633728086643e-07, "epoch": 0.7947666651310638, "percentage": 79.48, "elapsed_time": "1 day, 3:16:50", "remaining_time": "7:02:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8627, "total_steps": 10853, "loss": 0.1123, "learning_rate": 5.533852913960158e-07, "epoch": 0.7948588013083338, "percentage": 79.49, "elapsed_time": "1 day, 3:17:01", "remaining_time": "7:02:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8628, "total_steps": 10853, "loss": 0.1296, "learning_rate": 5.529073907267526e-07, "epoch": 0.7949509374856037, "percentage": 79.5, "elapsed_time": "1 day, 3:17:12", "remaining_time": "7:02:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8629, "total_steps": 10853, "loss": 0.1155, "learning_rate": 5.524296708452476e-07, "epoch": 0.7950430736628737, "percentage": 79.51, "elapsed_time": "1 day, 3:17:23", "remaining_time": "7:02:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8630, "total_steps": 10853, "loss": 0.1262, "learning_rate": 5.519521317958581e-07, "epoch": 0.7951352098401437, "percentage": 79.52, "elapsed_time": "1 day, 3:17:35", "remaining_time": "7:01:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8631, "total_steps": 10853, "loss": 0.1203, "learning_rate": 5.514747736229225e-07, "epoch": 0.7952273460174137, "percentage": 79.53, "elapsed_time": "1 day, 3:17:45", "remaining_time": "7:01:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8632, "total_steps": 10853, "loss": 0.1228, "learning_rate": 5.509975963707636e-07, "epoch": 0.7953194821946837, "percentage": 79.54, "elapsed_time": "1 day, 3:17:56", "remaining_time": "7:01:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8633, "total_steps": 10853, "loss": 0.1193, "learning_rate": 5.505206000836874e-07, "epoch": 0.7954116183719537, "percentage": 79.54, "elapsed_time": "1 day, 3:18:07", "remaining_time": "7:01:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8634, "total_steps": 10853, "loss": 0.122, "learning_rate": 5.500437848059842e-07, "epoch": 0.7955037545492237, "percentage": 79.55, "elapsed_time": "1 day, 3:18:18", "remaining_time": "7:01:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8635, "total_steps": 10853, "loss": 0.1182, "learning_rate": 5.495671505819244e-07, "epoch": 0.7955958907264937, "percentage": 79.56, "elapsed_time": "1 day, 3:18:28", "remaining_time": "7:00:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8636, "total_steps": 10853, "loss": 0.1212, "learning_rate": 5.490906974557655e-07, "epoch": 0.7956880269037637, "percentage": 79.57, "elapsed_time": "1 day, 3:18:39", "remaining_time": "7:00:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8637, "total_steps": 10853, "loss": 0.1258, "learning_rate": 5.486144254717446e-07, "epoch": 0.7957801630810337, "percentage": 79.58, "elapsed_time": "1 day, 3:18:50", "remaining_time": "7:00:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8638, "total_steps": 10853, "loss": 0.1163, "learning_rate": 5.481383346740843e-07, "epoch": 0.7958722992583038, "percentage": 79.59, "elapsed_time": "1 day, 3:19:01", "remaining_time": "7:00:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8639, "total_steps": 10853, "loss": 0.1226, "learning_rate": 5.476624251069904e-07, "epoch": 0.7959644354355738, "percentage": 79.6, "elapsed_time": "1 day, 3:19:12", "remaining_time": "7:00:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8640, "total_steps": 10853, "loss": 0.1128, "learning_rate": 5.471866968146497e-07, "epoch": 0.7960565716128438, "percentage": 79.61, "elapsed_time": "1 day, 3:19:23", "remaining_time": "6:59:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8641, "total_steps": 10853, "loss": 0.1306, "learning_rate": 5.46711149841235e-07, "epoch": 0.7961487077901138, "percentage": 79.62, "elapsed_time": "1 day, 3:19:35", "remaining_time": "6:59:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8642, "total_steps": 10853, "loss": 0.1194, "learning_rate": 5.462357842308997e-07, "epoch": 0.7962408439673838, "percentage": 79.63, "elapsed_time": "1 day, 3:19:45", "remaining_time": "6:59:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8643, "total_steps": 10853, "loss": 0.1155, "learning_rate": 5.457606000277826e-07, "epoch": 0.7963329801446538, "percentage": 79.64, "elapsed_time": "1 day, 3:19:55", "remaining_time": "6:59:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8644, "total_steps": 10853, "loss": 0.1126, "learning_rate": 5.452855972760035e-07, "epoch": 0.7964251163219238, "percentage": 79.65, "elapsed_time": "1 day, 3:20:06", "remaining_time": "6:59:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8645, "total_steps": 10853, "loss": 0.1086, "learning_rate": 5.448107760196672e-07, "epoch": 0.7965172524991938, "percentage": 79.66, "elapsed_time": "1 day, 3:20:16", "remaining_time": "6:58:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8646, "total_steps": 10853, "loss": 0.1196, "learning_rate": 5.443361363028612e-07, "epoch": 0.7966093886764638, "percentage": 79.66, "elapsed_time": "1 day, 3:20:27", "remaining_time": "6:58:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8647, "total_steps": 10853, "loss": 0.1292, "learning_rate": 5.438616781696557e-07, "epoch": 0.7967015248537338, "percentage": 79.67, "elapsed_time": "1 day, 3:20:39", "remaining_time": "6:58:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8648, "total_steps": 10853, "loss": 0.1288, "learning_rate": 5.43387401664103e-07, "epoch": 0.7967936610310038, "percentage": 79.68, "elapsed_time": "1 day, 3:20:50", "remaining_time": "6:58:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8649, "total_steps": 10853, "loss": 0.1161, "learning_rate": 5.429133068302405e-07, "epoch": 0.7968857972082738, "percentage": 79.69, "elapsed_time": "1 day, 3:21:00", "remaining_time": "6:58:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8650, "total_steps": 10853, "loss": 0.0994, "learning_rate": 5.424393937120884e-07, "epoch": 0.7969779333855438, "percentage": 79.7, "elapsed_time": "1 day, 3:21:12", "remaining_time": "6:57:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8651, "total_steps": 10853, "loss": 0.124, "learning_rate": 5.419656623536498e-07, "epoch": 0.7970700695628138, "percentage": 79.71, "elapsed_time": "1 day, 3:21:23", "remaining_time": "6:57:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8652, "total_steps": 10853, "loss": 0.1042, "learning_rate": 5.414921127989104e-07, "epoch": 0.7971622057400839, "percentage": 79.72, "elapsed_time": "1 day, 3:21:33", "remaining_time": "6:57:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8653, "total_steps": 10853, "loss": 0.1294, "learning_rate": 5.410187450918381e-07, "epoch": 0.7972543419173539, "percentage": 79.73, "elapsed_time": "1 day, 3:21:44", "remaining_time": "6:57:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8654, "total_steps": 10853, "loss": 0.1296, "learning_rate": 5.405455592763864e-07, "epoch": 0.7973464780946239, "percentage": 79.74, "elapsed_time": "1 day, 3:21:56", "remaining_time": "6:57:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8655, "total_steps": 10853, "loss": 0.1147, "learning_rate": 5.400725553964908e-07, "epoch": 0.7974386142718939, "percentage": 79.75, "elapsed_time": "1 day, 3:22:07", "remaining_time": "6:57:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8656, "total_steps": 10853, "loss": 0.1142, "learning_rate": 5.39599733496069e-07, "epoch": 0.7975307504491639, "percentage": 79.76, "elapsed_time": "1 day, 3:22:19", "remaining_time": "6:56:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8657, "total_steps": 10853, "loss": 0.1179, "learning_rate": 5.391270936190232e-07, "epoch": 0.7976228866264339, "percentage": 79.77, "elapsed_time": "1 day, 3:22:28", "remaining_time": "6:56:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8658, "total_steps": 10853, "loss": 0.112, "learning_rate": 5.386546358092376e-07, "epoch": 0.7977150228037039, "percentage": 79.78, "elapsed_time": "1 day, 3:22:39", "remaining_time": "6:56:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8659, "total_steps": 10853, "loss": 0.1172, "learning_rate": 5.381823601105804e-07, "epoch": 0.7978071589809739, "percentage": 79.78, "elapsed_time": "1 day, 3:22:50", "remaining_time": "6:56:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8660, "total_steps": 10853, "loss": 0.1094, "learning_rate": 5.377102665669018e-07, "epoch": 0.7978992951582439, "percentage": 79.79, "elapsed_time": "1 day, 3:23:01", "remaining_time": "6:56:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8661, "total_steps": 10853, "loss": 0.1221, "learning_rate": 5.372383552220358e-07, "epoch": 0.7979914313355139, "percentage": 79.8, "elapsed_time": "1 day, 3:23:13", "remaining_time": "6:55:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8662, "total_steps": 10853, "loss": 0.1191, "learning_rate": 5.36766626119801e-07, "epoch": 0.7980835675127839, "percentage": 79.81, "elapsed_time": "1 day, 3:23:24", "remaining_time": "6:55:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8663, "total_steps": 10853, "loss": 0.1222, "learning_rate": 5.362950793039959e-07, "epoch": 0.7981757036900539, "percentage": 79.82, "elapsed_time": "1 day, 3:23:35", "remaining_time": "6:55:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8664, "total_steps": 10853, "loss": 0.1258, "learning_rate": 5.358237148184034e-07, "epoch": 0.7982678398673239, "percentage": 79.83, "elapsed_time": "1 day, 3:23:47", "remaining_time": "6:55:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8665, "total_steps": 10853, "loss": 0.103, "learning_rate": 5.353525327067902e-07, "epoch": 0.7983599760445939, "percentage": 79.84, "elapsed_time": "1 day, 3:23:58", "remaining_time": "6:55:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8666, "total_steps": 10853, "loss": 0.1191, "learning_rate": 5.348815330129059e-07, "epoch": 0.798452112221864, "percentage": 79.85, "elapsed_time": "1 day, 3:24:08", "remaining_time": "6:54:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8667, "total_steps": 10853, "loss": 0.1198, "learning_rate": 5.344107157804834e-07, "epoch": 0.798544248399134, "percentage": 79.86, "elapsed_time": "1 day, 3:24:18", "remaining_time": "6:54:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8668, "total_steps": 10853, "loss": 0.1292, "learning_rate": 5.339400810532375e-07, "epoch": 0.798636384576404, "percentage": 79.87, "elapsed_time": "1 day, 3:24:30", "remaining_time": "6:54:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8669, "total_steps": 10853, "loss": 0.1162, "learning_rate": 5.334696288748661e-07, "epoch": 0.798728520753674, "percentage": 79.88, "elapsed_time": "1 day, 3:24:41", "remaining_time": "6:54:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8670, "total_steps": 10853, "loss": 0.1116, "learning_rate": 5.329993592890512e-07, "epoch": 0.798820656930944, "percentage": 79.89, "elapsed_time": "1 day, 3:24:51", "remaining_time": "6:54:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8671, "total_steps": 10853, "loss": 0.1155, "learning_rate": 5.325292723394573e-07, "epoch": 0.798912793108214, "percentage": 79.89, "elapsed_time": "1 day, 3:25:00", "remaining_time": "6:53:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8672, "total_steps": 10853, "loss": 0.1146, "learning_rate": 5.320593680697331e-07, "epoch": 0.799004929285484, "percentage": 79.9, "elapsed_time": "1 day, 3:25:11", "remaining_time": "6:53:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8673, "total_steps": 10853, "loss": 0.1254, "learning_rate": 5.315896465235084e-07, "epoch": 0.7990970654627539, "percentage": 79.91, "elapsed_time": "1 day, 3:25:23", "remaining_time": "6:53:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8674, "total_steps": 10853, "loss": 0.1063, "learning_rate": 5.311201077443961e-07, "epoch": 0.7991892016400239, "percentage": 79.92, "elapsed_time": "1 day, 3:25:34", "remaining_time": "6:53:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8675, "total_steps": 10853, "loss": 0.1186, "learning_rate": 5.306507517759937e-07, "epoch": 0.7992813378172939, "percentage": 79.93, "elapsed_time": "1 day, 3:25:44", "remaining_time": "6:53:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8676, "total_steps": 10853, "loss": 0.1227, "learning_rate": 5.301815786618816e-07, "epoch": 0.7993734739945639, "percentage": 79.94, "elapsed_time": "1 day, 3:25:54", "remaining_time": "6:52:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8677, "total_steps": 10853, "loss": 0.1161, "learning_rate": 5.297125884456214e-07, "epoch": 0.7994656101718339, "percentage": 79.95, "elapsed_time": "1 day, 3:26:04", "remaining_time": "6:52:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8678, "total_steps": 10853, "loss": 0.1262, "learning_rate": 5.292437811707599e-07, "epoch": 0.7995577463491039, "percentage": 79.96, "elapsed_time": "1 day, 3:26:15", "remaining_time": "6:52:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8679, "total_steps": 10853, "loss": 0.1186, "learning_rate": 5.287751568808247e-07, "epoch": 0.799649882526374, "percentage": 79.97, "elapsed_time": "1 day, 3:26:25", "remaining_time": "6:52:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8680, "total_steps": 10853, "loss": 0.1203, "learning_rate": 5.283067156193292e-07, "epoch": 0.799742018703644, "percentage": 79.98, "elapsed_time": "1 day, 3:26:35", "remaining_time": "6:52:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8681, "total_steps": 10853, "loss": 0.1234, "learning_rate": 5.278384574297665e-07, "epoch": 0.799834154880914, "percentage": 79.99, "elapsed_time": "1 day, 3:26:46", "remaining_time": "6:52:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8682, "total_steps": 10853, "loss": 0.1223, "learning_rate": 5.273703823556153e-07, "epoch": 0.799926291058184, "percentage": 80.0, "elapsed_time": "1 day, 3:26:58", "remaining_time": "6:51:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8683, "total_steps": 10853, "loss": 0.1134, "learning_rate": 5.269024904403372e-07, "epoch": 0.800018427235454, "percentage": 80.01, "elapsed_time": "1 day, 3:27:09", "remaining_time": "6:51:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8684, "total_steps": 10853, "loss": 0.1259, "learning_rate": 5.264347817273752e-07, "epoch": 0.800110563412724, "percentage": 80.01, "elapsed_time": "1 day, 3:27:20", "remaining_time": "6:51:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8685, "total_steps": 10853, "loss": 0.1121, "learning_rate": 5.259672562601553e-07, "epoch": 0.800202699589994, "percentage": 80.02, "elapsed_time": "1 day, 3:27:29", "remaining_time": "6:51:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8686, "total_steps": 10853, "loss": 0.1197, "learning_rate": 5.25499914082088e-07, "epoch": 0.800294835767264, "percentage": 80.03, "elapsed_time": "1 day, 3:27:40", "remaining_time": "6:51:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8687, "total_steps": 10853, "loss": 0.1215, "learning_rate": 5.250327552365664e-07, "epoch": 0.800386971944534, "percentage": 80.04, "elapsed_time": "1 day, 3:27:51", "remaining_time": "6:50:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8688, "total_steps": 10853, "loss": 0.1174, "learning_rate": 5.245657797669665e-07, "epoch": 0.800479108121804, "percentage": 80.05, "elapsed_time": "1 day, 3:28:02", "remaining_time": "6:50:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8689, "total_steps": 10853, "loss": 0.1147, "learning_rate": 5.24098987716647e-07, "epoch": 0.800571244299074, "percentage": 80.06, "elapsed_time": "1 day, 3:28:12", "remaining_time": "6:50:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8690, "total_steps": 10853, "loss": 0.12, "learning_rate": 5.236323791289479e-07, "epoch": 0.800663380476344, "percentage": 80.07, "elapsed_time": "1 day, 3:28:23", "remaining_time": "6:50:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8691, "total_steps": 10853, "loss": 0.1316, "learning_rate": 5.231659540471954e-07, "epoch": 0.800755516653614, "percentage": 80.08, "elapsed_time": "1 day, 3:28:35", "remaining_time": "6:50:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8692, "total_steps": 10853, "loss": 0.1253, "learning_rate": 5.226997125146973e-07, "epoch": 0.800847652830884, "percentage": 80.09, "elapsed_time": "1 day, 3:28:44", "remaining_time": "6:49:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8693, "total_steps": 10853, "loss": 0.1198, "learning_rate": 5.222336545747434e-07, "epoch": 0.8009397890081541, "percentage": 80.1, "elapsed_time": "1 day, 3:28:54", "remaining_time": "6:49:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8694, "total_steps": 10853, "loss": 0.1193, "learning_rate": 5.217677802706078e-07, "epoch": 0.8010319251854241, "percentage": 80.11, "elapsed_time": "1 day, 3:29:05", "remaining_time": "6:49:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8695, "total_steps": 10853, "loss": 0.1141, "learning_rate": 5.213020896455462e-07, "epoch": 0.8011240613626941, "percentage": 80.12, "elapsed_time": "1 day, 3:29:16", "remaining_time": "6:49:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8696, "total_steps": 10853, "loss": 0.1207, "learning_rate": 5.208365827427985e-07, "epoch": 0.8012161975399641, "percentage": 80.13, "elapsed_time": "1 day, 3:29:27", "remaining_time": "6:49:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8697, "total_steps": 10853, "loss": 0.127, "learning_rate": 5.203712596055876e-07, "epoch": 0.8013083337172341, "percentage": 80.13, "elapsed_time": "1 day, 3:29:39", "remaining_time": "6:48:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8698, "total_steps": 10853, "loss": 0.1216, "learning_rate": 5.19906120277118e-07, "epoch": 0.8014004698945041, "percentage": 80.14, "elapsed_time": "1 day, 3:29:50", "remaining_time": "6:48:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8699, "total_steps": 10853, "loss": 0.1112, "learning_rate": 5.194411648005778e-07, "epoch": 0.8014926060717741, "percentage": 80.15, "elapsed_time": "1 day, 3:30:03", "remaining_time": "6:48:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8700, "total_steps": 10853, "loss": 0.1264, "learning_rate": 5.189763932191396e-07, "epoch": 0.8015847422490441, "percentage": 80.16, "elapsed_time": "1 day, 3:30:15", "remaining_time": "6:48:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8701, "total_steps": 10853, "loss": 0.116, "learning_rate": 5.185118055759564e-07, "epoch": 0.8016768784263141, "percentage": 80.17, "elapsed_time": "1 day, 3:30:26", "remaining_time": "6:48:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8702, "total_steps": 10853, "loss": 0.1299, "learning_rate": 5.180474019141646e-07, "epoch": 0.8017690146035841, "percentage": 80.18, "elapsed_time": "1 day, 3:30:37", "remaining_time": "6:48:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8703, "total_steps": 10853, "loss": 0.1204, "learning_rate": 5.175831822768848e-07, "epoch": 0.8018611507808541, "percentage": 80.19, "elapsed_time": "1 day, 3:30:48", "remaining_time": "6:47:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8704, "total_steps": 10853, "loss": 0.1096, "learning_rate": 5.171191467072201e-07, "epoch": 0.8019532869581241, "percentage": 80.2, "elapsed_time": "1 day, 3:30:58", "remaining_time": "6:47:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8705, "total_steps": 10853, "loss": 0.1232, "learning_rate": 5.166552952482565e-07, "epoch": 0.8020454231353941, "percentage": 80.21, "elapsed_time": "1 day, 3:31:09", "remaining_time": "6:47:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8706, "total_steps": 10853, "loss": 0.1178, "learning_rate": 5.161916279430623e-07, "epoch": 0.8021375593126642, "percentage": 80.22, "elapsed_time": "1 day, 3:31:20", "remaining_time": "6:47:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8707, "total_steps": 10853, "loss": 0.1317, "learning_rate": 5.157281448346882e-07, "epoch": 0.8022296954899342, "percentage": 80.23, "elapsed_time": "1 day, 3:31:31", "remaining_time": "6:47:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8708, "total_steps": 10853, "loss": 0.1075, "learning_rate": 5.152648459661694e-07, "epoch": 0.8023218316672042, "percentage": 80.24, "elapsed_time": "1 day, 3:31:42", "remaining_time": "6:46:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8709, "total_steps": 10853, "loss": 0.1369, "learning_rate": 5.148017313805237e-07, "epoch": 0.8024139678444742, "percentage": 80.25, "elapsed_time": "1 day, 3:31:53", "remaining_time": "6:46:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8710, "total_steps": 10853, "loss": 0.1216, "learning_rate": 5.143388011207506e-07, "epoch": 0.8025061040217442, "percentage": 80.25, "elapsed_time": "1 day, 3:32:03", "remaining_time": "6:46:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8711, "total_steps": 10853, "loss": 0.1104, "learning_rate": 5.138760552298338e-07, "epoch": 0.8025982401990142, "percentage": 80.26, "elapsed_time": "1 day, 3:32:15", "remaining_time": "6:46:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8712, "total_steps": 10853, "loss": 0.1152, "learning_rate": 5.134134937507387e-07, "epoch": 0.8026903763762842, "percentage": 80.27, "elapsed_time": "1 day, 3:32:25", "remaining_time": "6:46:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8713, "total_steps": 10853, "loss": 0.1127, "learning_rate": 5.129511167264151e-07, "epoch": 0.8027825125535542, "percentage": 80.28, "elapsed_time": "1 day, 3:32:35", "remaining_time": "6:45:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8714, "total_steps": 10853, "loss": 0.1187, "learning_rate": 5.124889241997935e-07, "epoch": 0.8028746487308241, "percentage": 80.29, "elapsed_time": "1 day, 3:32:45", "remaining_time": "6:45:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8715, "total_steps": 10853, "loss": 0.1231, "learning_rate": 5.120269162137889e-07, "epoch": 0.8029667849080941, "percentage": 80.3, "elapsed_time": "1 day, 3:32:56", "remaining_time": "6:45:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8716, "total_steps": 10853, "loss": 0.1229, "learning_rate": 5.115650928113e-07, "epoch": 0.8030589210853641, "percentage": 80.31, "elapsed_time": "1 day, 3:33:07", "remaining_time": "6:45:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8717, "total_steps": 10853, "loss": 0.1245, "learning_rate": 5.111034540352064e-07, "epoch": 0.8031510572626341, "percentage": 80.32, "elapsed_time": "1 day, 3:33:18", "remaining_time": "6:45:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8718, "total_steps": 10853, "loss": 0.1279, "learning_rate": 5.106419999283702e-07, "epoch": 0.8032431934399041, "percentage": 80.33, "elapsed_time": "1 day, 3:33:29", "remaining_time": "6:44:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8719, "total_steps": 10853, "loss": 0.1339, "learning_rate": 5.101807305336385e-07, "epoch": 0.8033353296171741, "percentage": 80.34, "elapsed_time": "1 day, 3:33:40", "remaining_time": "6:44:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8720, "total_steps": 10853, "loss": 0.1218, "learning_rate": 5.0971964589384e-07, "epoch": 0.8034274657944442, "percentage": 80.35, "elapsed_time": "1 day, 3:33:50", "remaining_time": "6:44:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8721, "total_steps": 10853, "loss": 0.1239, "learning_rate": 5.092587460517873e-07, "epoch": 0.8035196019717142, "percentage": 80.36, "elapsed_time": "1 day, 3:34:01", "remaining_time": "6:44:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8722, "total_steps": 10853, "loss": 0.1182, "learning_rate": 5.087980310502743e-07, "epoch": 0.8036117381489842, "percentage": 80.36, "elapsed_time": "1 day, 3:34:12", "remaining_time": "6:44:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8723, "total_steps": 10853, "loss": 0.1129, "learning_rate": 5.083375009320779e-07, "epoch": 0.8037038743262542, "percentage": 80.37, "elapsed_time": "1 day, 3:34:23", "remaining_time": "6:43:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8724, "total_steps": 10853, "loss": 0.1242, "learning_rate": 5.078771557399586e-07, "epoch": 0.8037960105035242, "percentage": 80.38, "elapsed_time": "1 day, 3:34:34", "remaining_time": "6:43:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8725, "total_steps": 10853, "loss": 0.1107, "learning_rate": 5.0741699551666e-07, "epoch": 0.8038881466807942, "percentage": 80.39, "elapsed_time": "1 day, 3:34:44", "remaining_time": "6:43:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8726, "total_steps": 10853, "loss": 0.1124, "learning_rate": 5.069570203049085e-07, "epoch": 0.8039802828580642, "percentage": 80.4, "elapsed_time": "1 day, 3:34:53", "remaining_time": "6:43:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8727, "total_steps": 10853, "loss": 0.1179, "learning_rate": 5.06497230147412e-07, "epoch": 0.8040724190353342, "percentage": 80.41, "elapsed_time": "1 day, 3:35:04", "remaining_time": "6:43:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8728, "total_steps": 10853, "loss": 0.1192, "learning_rate": 5.060376250868615e-07, "epoch": 0.8041645552126042, "percentage": 80.42, "elapsed_time": "1 day, 3:35:15", "remaining_time": "6:43:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8729, "total_steps": 10853, "loss": 0.1268, "learning_rate": 5.055782051659322e-07, "epoch": 0.8042566913898742, "percentage": 80.43, "elapsed_time": "1 day, 3:35:25", "remaining_time": "6:42:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8730, "total_steps": 10853, "loss": 0.1179, "learning_rate": 5.051189704272819e-07, "epoch": 0.8043488275671442, "percentage": 80.44, "elapsed_time": "1 day, 3:35:36", "remaining_time": "6:42:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8731, "total_steps": 10853, "loss": 0.1243, "learning_rate": 5.046599209135492e-07, "epoch": 0.8044409637444142, "percentage": 80.45, "elapsed_time": "1 day, 3:35:47", "remaining_time": "6:42:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8732, "total_steps": 10853, "loss": 0.1159, "learning_rate": 5.042010566673583e-07, "epoch": 0.8045330999216842, "percentage": 80.46, "elapsed_time": "1 day, 3:35:59", "remaining_time": "6:42:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8733, "total_steps": 10853, "loss": 0.1032, "learning_rate": 5.037423777313132e-07, "epoch": 0.8046252360989542, "percentage": 80.47, "elapsed_time": "1 day, 3:36:10", "remaining_time": "6:42:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8734, "total_steps": 10853, "loss": 0.105, "learning_rate": 5.032838841480042e-07, "epoch": 0.8047173722762243, "percentage": 80.48, "elapsed_time": "1 day, 3:36:20", "remaining_time": "6:41:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8735, "total_steps": 10853, "loss": 0.1232, "learning_rate": 5.028255759600004e-07, "epoch": 0.8048095084534943, "percentage": 80.48, "elapsed_time": "1 day, 3:36:30", "remaining_time": "6:41:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8736, "total_steps": 10853, "loss": 0.1129, "learning_rate": 5.023674532098571e-07, "epoch": 0.8049016446307643, "percentage": 80.49, "elapsed_time": "1 day, 3:36:39", "remaining_time": "6:41:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8737, "total_steps": 10853, "loss": 0.1217, "learning_rate": 5.019095159401113e-07, "epoch": 0.8049937808080343, "percentage": 80.5, "elapsed_time": "1 day, 3:36:50", "remaining_time": "6:41:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8738, "total_steps": 10853, "loss": 0.1292, "learning_rate": 5.01451764193282e-07, "epoch": 0.8050859169853043, "percentage": 80.51, "elapsed_time": "1 day, 3:37:01", "remaining_time": "6:41:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8739, "total_steps": 10853, "loss": 0.1202, "learning_rate": 5.009941980118707e-07, "epoch": 0.8051780531625743, "percentage": 80.52, "elapsed_time": "1 day, 3:37:12", "remaining_time": "6:40:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8740, "total_steps": 10853, "loss": 0.1123, "learning_rate": 5.005368174383634e-07, "epoch": 0.8052701893398443, "percentage": 80.53, "elapsed_time": "1 day, 3:37:21", "remaining_time": "6:40:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8741, "total_steps": 10853, "loss": 0.1152, "learning_rate": 5.000796225152277e-07, "epoch": 0.8053623255171143, "percentage": 80.54, "elapsed_time": "1 day, 3:37:32", "remaining_time": "6:40:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8742, "total_steps": 10853, "loss": 0.1098, "learning_rate": 4.996226132849149e-07, "epoch": 0.8054544616943843, "percentage": 80.55, "elapsed_time": "1 day, 3:37:44", "remaining_time": "6:40:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8743, "total_steps": 10853, "loss": 0.1253, "learning_rate": 4.99165789789858e-07, "epoch": 0.8055465978716543, "percentage": 80.56, "elapsed_time": "1 day, 3:37:56", "remaining_time": "6:40:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8744, "total_steps": 10853, "loss": 0.1178, "learning_rate": 4.987091520724721e-07, "epoch": 0.8056387340489243, "percentage": 80.57, "elapsed_time": "1 day, 3:38:06", "remaining_time": "6:39:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8745, "total_steps": 10853, "loss": 0.1197, "learning_rate": 4.982527001751567e-07, "epoch": 0.8057308702261943, "percentage": 80.58, "elapsed_time": "1 day, 3:38:18", "remaining_time": "6:39:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8746, "total_steps": 10853, "loss": 0.1221, "learning_rate": 4.977964341402941e-07, "epoch": 0.8058230064034643, "percentage": 80.59, "elapsed_time": "1 day, 3:38:29", "remaining_time": "6:39:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8747, "total_steps": 10853, "loss": 0.1085, "learning_rate": 4.973403540102476e-07, "epoch": 0.8059151425807344, "percentage": 80.6, "elapsed_time": "1 day, 3:38:40", "remaining_time": "6:39:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8748, "total_steps": 10853, "loss": 0.1055, "learning_rate": 4.968844598273653e-07, "epoch": 0.8060072787580044, "percentage": 80.6, "elapsed_time": "1 day, 3:38:50", "remaining_time": "6:39:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8749, "total_steps": 10853, "loss": 0.111, "learning_rate": 4.964287516339758e-07, "epoch": 0.8060994149352744, "percentage": 80.61, "elapsed_time": "1 day, 3:39:00", "remaining_time": "6:38:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8750, "total_steps": 10853, "loss": 0.1192, "learning_rate": 4.959732294723932e-07, "epoch": 0.8061915511125444, "percentage": 80.62, "elapsed_time": "1 day, 3:39:10", "remaining_time": "6:38:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8751, "total_steps": 10853, "loss": 0.1178, "learning_rate": 4.955178933849111e-07, "epoch": 0.8062836872898144, "percentage": 80.63, "elapsed_time": "1 day, 3:39:21", "remaining_time": "6:38:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8752, "total_steps": 10853, "loss": 0.1223, "learning_rate": 4.950627434138083e-07, "epoch": 0.8063758234670844, "percentage": 80.64, "elapsed_time": "1 day, 3:39:31", "remaining_time": "6:38:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8753, "total_steps": 10853, "loss": 0.1138, "learning_rate": 4.946077796013462e-07, "epoch": 0.8064679596443544, "percentage": 80.65, "elapsed_time": "1 day, 3:39:42", "remaining_time": "6:38:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8754, "total_steps": 10853, "loss": 0.1214, "learning_rate": 4.941530019897669e-07, "epoch": 0.8065600958216244, "percentage": 80.66, "elapsed_time": "1 day, 3:39:54", "remaining_time": "6:38:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8755, "total_steps": 10853, "loss": 0.1144, "learning_rate": 4.93698410621298e-07, "epoch": 0.8066522319988944, "percentage": 80.67, "elapsed_time": "1 day, 3:40:04", "remaining_time": "6:37:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8756, "total_steps": 10853, "loss": 0.1187, "learning_rate": 4.932440055381471e-07, "epoch": 0.8067443681761644, "percentage": 80.68, "elapsed_time": "1 day, 3:40:15", "remaining_time": "6:37:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8757, "total_steps": 10853, "loss": 0.1384, "learning_rate": 4.92789786782506e-07, "epoch": 0.8068365043534343, "percentage": 80.69, "elapsed_time": "1 day, 3:40:27", "remaining_time": "6:37:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8758, "total_steps": 10853, "loss": 0.1064, "learning_rate": 4.923357543965498e-07, "epoch": 0.8069286405307043, "percentage": 80.7, "elapsed_time": "1 day, 3:40:37", "remaining_time": "6:37:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8759, "total_steps": 10853, "loss": 0.109, "learning_rate": 4.918819084224353e-07, "epoch": 0.8070207767079743, "percentage": 80.71, "elapsed_time": "1 day, 3:40:48", "remaining_time": "6:37:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8760, "total_steps": 10853, "loss": 0.1275, "learning_rate": 4.914282489023006e-07, "epoch": 0.8071129128852443, "percentage": 80.72, "elapsed_time": "1 day, 3:40:59", "remaining_time": "6:36:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8761, "total_steps": 10853, "loss": 0.1239, "learning_rate": 4.909747758782693e-07, "epoch": 0.8072050490625144, "percentage": 80.72, "elapsed_time": "1 day, 3:41:09", "remaining_time": "6:36:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8762, "total_steps": 10853, "loss": 0.1128, "learning_rate": 4.905214893924462e-07, "epoch": 0.8072971852397844, "percentage": 80.73, "elapsed_time": "1 day, 3:41:21", "remaining_time": "6:36:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8763, "total_steps": 10853, "loss": 0.1307, "learning_rate": 4.900683894869198e-07, "epoch": 0.8073893214170544, "percentage": 80.74, "elapsed_time": "1 day, 3:41:31", "remaining_time": "6:36:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8764, "total_steps": 10853, "loss": 0.1242, "learning_rate": 4.8961547620376e-07, "epoch": 0.8074814575943244, "percentage": 80.75, "elapsed_time": "1 day, 3:41:42", "remaining_time": "6:36:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8765, "total_steps": 10853, "loss": 0.1142, "learning_rate": 4.891627495850188e-07, "epoch": 0.8075735937715944, "percentage": 80.76, "elapsed_time": "1 day, 3:41:52", "remaining_time": "6:35:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8766, "total_steps": 10853, "loss": 0.1167, "learning_rate": 4.887102096727326e-07, "epoch": 0.8076657299488644, "percentage": 80.77, "elapsed_time": "1 day, 3:42:02", "remaining_time": "6:35:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8767, "total_steps": 10853, "loss": 0.1185, "learning_rate": 4.882578565089205e-07, "epoch": 0.8077578661261344, "percentage": 80.78, "elapsed_time": "1 day, 3:42:14", "remaining_time": "6:35:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8768, "total_steps": 10853, "loss": 0.1279, "learning_rate": 4.878056901355823e-07, "epoch": 0.8078500023034044, "percentage": 80.79, "elapsed_time": "1 day, 3:42:26", "remaining_time": "6:35:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8769, "total_steps": 10853, "loss": 0.1229, "learning_rate": 4.873537105947029e-07, "epoch": 0.8079421384806744, "percentage": 80.8, "elapsed_time": "1 day, 3:42:38", "remaining_time": "6:35:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8770, "total_steps": 10853, "loss": 0.1285, "learning_rate": 4.869019179282478e-07, "epoch": 0.8080342746579444, "percentage": 80.81, "elapsed_time": "1 day, 3:42:49", "remaining_time": "6:34:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8771, "total_steps": 10853, "loss": 0.1232, "learning_rate": 4.864503121781666e-07, "epoch": 0.8081264108352144, "percentage": 80.82, "elapsed_time": "1 day, 3:43:00", "remaining_time": "6:34:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8772, "total_steps": 10853, "loss": 0.1199, "learning_rate": 4.859988933863898e-07, "epoch": 0.8082185470124844, "percentage": 80.83, "elapsed_time": "1 day, 3:43:11", "remaining_time": "6:34:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8773, "total_steps": 10853, "loss": 0.1255, "learning_rate": 4.85547661594833e-07, "epoch": 0.8083106831897544, "percentage": 80.83, "elapsed_time": "1 day, 3:43:21", "remaining_time": "6:34:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8774, "total_steps": 10853, "loss": 0.1305, "learning_rate": 4.850966168453922e-07, "epoch": 0.8084028193670245, "percentage": 80.84, "elapsed_time": "1 day, 3:43:34", "remaining_time": "6:34:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8775, "total_steps": 10853, "loss": 0.1166, "learning_rate": 4.846457591799489e-07, "epoch": 0.8084949555442945, "percentage": 80.85, "elapsed_time": "1 day, 3:43:43", "remaining_time": "6:33:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8776, "total_steps": 10853, "loss": 0.1201, "learning_rate": 4.841950886403623e-07, "epoch": 0.8085870917215645, "percentage": 80.86, "elapsed_time": "1 day, 3:43:54", "remaining_time": "6:33:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8777, "total_steps": 10853, "loss": 0.1337, "learning_rate": 4.837446052684788e-07, "epoch": 0.8086792278988345, "percentage": 80.87, "elapsed_time": "1 day, 3:44:04", "remaining_time": "6:33:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8778, "total_steps": 10853, "loss": 0.1097, "learning_rate": 4.832943091061257e-07, "epoch": 0.8087713640761045, "percentage": 80.88, "elapsed_time": "1 day, 3:44:15", "remaining_time": "6:33:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8779, "total_steps": 10853, "loss": 0.112, "learning_rate": 4.828442001951136e-07, "epoch": 0.8088635002533745, "percentage": 80.89, "elapsed_time": "1 day, 3:44:25", "remaining_time": "6:33:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8780, "total_steps": 10853, "loss": 0.1071, "learning_rate": 4.82394278577234e-07, "epoch": 0.8089556364306445, "percentage": 80.9, "elapsed_time": "1 day, 3:44:36", "remaining_time": "6:33:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8781, "total_steps": 10853, "loss": 0.13, "learning_rate": 4.819445442942633e-07, "epoch": 0.8090477726079145, "percentage": 80.91, "elapsed_time": "1 day, 3:44:48", "remaining_time": "6:32:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8782, "total_steps": 10853, "loss": 0.1148, "learning_rate": 4.814949973879582e-07, "epoch": 0.8091399087851845, "percentage": 80.92, "elapsed_time": "1 day, 3:44:57", "remaining_time": "6:32:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8783, "total_steps": 10853, "loss": 0.1189, "learning_rate": 4.8104563790006e-07, "epoch": 0.8092320449624545, "percentage": 80.93, "elapsed_time": "1 day, 3:45:08", "remaining_time": "6:32:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8784, "total_steps": 10853, "loss": 0.1242, "learning_rate": 4.805964658722922e-07, "epoch": 0.8093241811397245, "percentage": 80.94, "elapsed_time": "1 day, 3:45:19", "remaining_time": "6:32:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8785, "total_steps": 10853, "loss": 0.1259, "learning_rate": 4.801474813463591e-07, "epoch": 0.8094163173169945, "percentage": 80.95, "elapsed_time": "1 day, 3:45:29", "remaining_time": "6:32:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8786, "total_steps": 10853, "loss": 0.1269, "learning_rate": 4.796986843639506e-07, "epoch": 0.8095084534942645, "percentage": 80.95, "elapsed_time": "1 day, 3:45:40", "remaining_time": "6:31:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8787, "total_steps": 10853, "loss": 0.1225, "learning_rate": 4.792500749667359e-07, "epoch": 0.8096005896715345, "percentage": 80.96, "elapsed_time": "1 day, 3:45:52", "remaining_time": "6:31:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8788, "total_steps": 10853, "loss": 0.1164, "learning_rate": 4.788016531963699e-07, "epoch": 0.8096927258488046, "percentage": 80.97, "elapsed_time": "1 day, 3:46:03", "remaining_time": "6:31:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8789, "total_steps": 10853, "loss": 0.1176, "learning_rate": 4.783534190944872e-07, "epoch": 0.8097848620260746, "percentage": 80.98, "elapsed_time": "1 day, 3:46:13", "remaining_time": "6:31:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8790, "total_steps": 10853, "loss": 0.118, "learning_rate": 4.779053727027072e-07, "epoch": 0.8098769982033446, "percentage": 80.99, "elapsed_time": "1 day, 3:46:25", "remaining_time": "6:31:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8791, "total_steps": 10853, "loss": 0.1167, "learning_rate": 4.774575140626317e-07, "epoch": 0.8099691343806146, "percentage": 81.0, "elapsed_time": "1 day, 3:46:37", "remaining_time": "6:30:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8792, "total_steps": 10853, "loss": 0.1186, "learning_rate": 4.770098432158434e-07, "epoch": 0.8100612705578846, "percentage": 81.01, "elapsed_time": "1 day, 3:46:48", "remaining_time": "6:30:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8793, "total_steps": 10853, "loss": 0.1261, "learning_rate": 4.765623602039085e-07, "epoch": 0.8101534067351546, "percentage": 81.02, "elapsed_time": "1 day, 3:46:59", "remaining_time": "6:30:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8794, "total_steps": 10853, "loss": 0.1143, "learning_rate": 4.76115065068376e-07, "epoch": 0.8102455429124246, "percentage": 81.03, "elapsed_time": "1 day, 3:47:10", "remaining_time": "6:30:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8795, "total_steps": 10853, "loss": 0.1198, "learning_rate": 4.756679578507778e-07, "epoch": 0.8103376790896946, "percentage": 81.04, "elapsed_time": "1 day, 3:47:20", "remaining_time": "6:30:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8796, "total_steps": 10853, "loss": 0.1246, "learning_rate": 4.7522103859262813e-07, "epoch": 0.8104298152669646, "percentage": 81.05, "elapsed_time": "1 day, 3:47:31", "remaining_time": "6:29:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8797, "total_steps": 10853, "loss": 0.1088, "learning_rate": 4.7477430733542273e-07, "epoch": 0.8105219514442346, "percentage": 81.06, "elapsed_time": "1 day, 3:47:42", "remaining_time": "6:29:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8798, "total_steps": 10853, "loss": 0.1164, "learning_rate": 4.7432776412064034e-07, "epoch": 0.8106140876215046, "percentage": 81.07, "elapsed_time": "1 day, 3:47:54", "remaining_time": "6:29:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8799, "total_steps": 10853, "loss": 0.1118, "learning_rate": 4.738814089897431e-07, "epoch": 0.8107062237987746, "percentage": 81.07, "elapsed_time": "1 day, 3:48:04", "remaining_time": "6:29:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8800, "total_steps": 10853, "loss": 0.1128, "learning_rate": 4.734352419841756e-07, "epoch": 0.8107983599760445, "percentage": 81.08, "elapsed_time": "1 day, 3:48:14", "remaining_time": "6:29:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8801, "total_steps": 10853, "loss": 0.1121, "learning_rate": 4.7298926314536364e-07, "epoch": 0.8108904961533145, "percentage": 81.09, "elapsed_time": "1 day, 3:48:26", "remaining_time": "6:29:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8802, "total_steps": 10853, "loss": 0.1154, "learning_rate": 4.725434725147171e-07, "epoch": 0.8109826323305847, "percentage": 81.1, "elapsed_time": "1 day, 3:48:37", "remaining_time": "6:28:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8803, "total_steps": 10853, "loss": 0.1266, "learning_rate": 4.720978701336268e-07, "epoch": 0.8110747685078546, "percentage": 81.11, "elapsed_time": "1 day, 3:48:48", "remaining_time": "6:28:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8804, "total_steps": 10853, "loss": 0.1339, "learning_rate": 4.716524560434679e-07, "epoch": 0.8111669046851246, "percentage": 81.12, "elapsed_time": "1 day, 3:48:59", "remaining_time": "6:28:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8805, "total_steps": 10853, "loss": 0.1199, "learning_rate": 4.7120723028559633e-07, "epoch": 0.8112590408623946, "percentage": 81.13, "elapsed_time": "1 day, 3:49:11", "remaining_time": "6:28:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8806, "total_steps": 10853, "loss": 0.1225, "learning_rate": 4.70762192901352e-07, "epoch": 0.8113511770396646, "percentage": 81.14, "elapsed_time": "1 day, 3:49:23", "remaining_time": "6:28:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8807, "total_steps": 10853, "loss": 0.1239, "learning_rate": 4.7031734393205683e-07, "epoch": 0.8114433132169346, "percentage": 81.15, "elapsed_time": "1 day, 3:49:33", "remaining_time": "6:27:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8808, "total_steps": 10853, "loss": 0.1179, "learning_rate": 4.6987268341901455e-07, "epoch": 0.8115354493942046, "percentage": 81.16, "elapsed_time": "1 day, 3:49:44", "remaining_time": "6:27:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8809, "total_steps": 10853, "loss": 0.1174, "learning_rate": 4.6942821140351174e-07, "epoch": 0.8116275855714746, "percentage": 81.17, "elapsed_time": "1 day, 3:49:54", "remaining_time": "6:27:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8810, "total_steps": 10853, "loss": 0.1187, "learning_rate": 4.6898392792681796e-07, "epoch": 0.8117197217487446, "percentage": 81.18, "elapsed_time": "1 day, 3:50:04", "remaining_time": "6:27:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8811, "total_steps": 10853, "loss": 0.1206, "learning_rate": 4.6853983303018493e-07, "epoch": 0.8118118579260146, "percentage": 81.18, "elapsed_time": "1 day, 3:50:15", "remaining_time": "6:27:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8812, "total_steps": 10853, "loss": 0.1181, "learning_rate": 4.680959267548479e-07, "epoch": 0.8119039941032846, "percentage": 81.19, "elapsed_time": "1 day, 3:50:26", "remaining_time": "6:26:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8813, "total_steps": 10853, "loss": 0.1295, "learning_rate": 4.676522091420227e-07, "epoch": 0.8119961302805546, "percentage": 81.2, "elapsed_time": "1 day, 3:50:37", "remaining_time": "6:26:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8814, "total_steps": 10853, "loss": 0.1106, "learning_rate": 4.672086802329079e-07, "epoch": 0.8120882664578246, "percentage": 81.21, "elapsed_time": "1 day, 3:50:49", "remaining_time": "6:26:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8815, "total_steps": 10853, "loss": 0.1226, "learning_rate": 4.667653400686858e-07, "epoch": 0.8121804026350947, "percentage": 81.22, "elapsed_time": "1 day, 3:51:00", "remaining_time": "6:26:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8816, "total_steps": 10853, "loss": 0.1046, "learning_rate": 4.6632218869052085e-07, "epoch": 0.8122725388123647, "percentage": 81.23, "elapsed_time": "1 day, 3:51:10", "remaining_time": "6:26:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8817, "total_steps": 10853, "loss": 0.1274, "learning_rate": 4.6587922613956005e-07, "epoch": 0.8123646749896347, "percentage": 81.24, "elapsed_time": "1 day, 3:51:21", "remaining_time": "6:25:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8818, "total_steps": 10853, "loss": 0.1234, "learning_rate": 4.6543645245693215e-07, "epoch": 0.8124568111669047, "percentage": 81.25, "elapsed_time": "1 day, 3:51:32", "remaining_time": "6:25:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8819, "total_steps": 10853, "loss": 0.1283, "learning_rate": 4.649938676837479e-07, "epoch": 0.8125489473441747, "percentage": 81.26, "elapsed_time": "1 day, 3:51:43", "remaining_time": "6:25:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8820, "total_steps": 10853, "loss": 0.1253, "learning_rate": 4.6455147186110217e-07, "epoch": 0.8126410835214447, "percentage": 81.27, "elapsed_time": "1 day, 3:51:54", "remaining_time": "6:25:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8821, "total_steps": 10853, "loss": 0.1121, "learning_rate": 4.6410926503007187e-07, "epoch": 0.8127332196987147, "percentage": 81.28, "elapsed_time": "1 day, 3:52:05", "remaining_time": "6:25:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8822, "total_steps": 10853, "loss": 0.1219, "learning_rate": 4.636672472317147e-07, "epoch": 0.8128253558759847, "percentage": 81.29, "elapsed_time": "1 day, 3:52:17", "remaining_time": "6:24:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8823, "total_steps": 10853, "loss": 0.1179, "learning_rate": 4.6322541850707336e-07, "epoch": 0.8129174920532547, "percentage": 81.3, "elapsed_time": "1 day, 3:52:27", "remaining_time": "6:24:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8824, "total_steps": 10853, "loss": 0.1201, "learning_rate": 4.6278377889717064e-07, "epoch": 0.8130096282305247, "percentage": 81.3, "elapsed_time": "1 day, 3:52:37", "remaining_time": "6:24:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8825, "total_steps": 10853, "loss": 0.1073, "learning_rate": 4.62342328443014e-07, "epoch": 0.8131017644077947, "percentage": 81.31, "elapsed_time": "1 day, 3:52:49", "remaining_time": "6:24:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8826, "total_steps": 10853, "loss": 0.1228, "learning_rate": 4.6190106718559056e-07, "epoch": 0.8131939005850647, "percentage": 81.32, "elapsed_time": "1 day, 3:52:59", "remaining_time": "6:24:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8827, "total_steps": 10853, "loss": 0.1136, "learning_rate": 4.614599951658727e-07, "epoch": 0.8132860367623347, "percentage": 81.33, "elapsed_time": "1 day, 3:53:10", "remaining_time": "6:24:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8828, "total_steps": 10853, "loss": 0.1072, "learning_rate": 4.6101911242481396e-07, "epoch": 0.8133781729396047, "percentage": 81.34, "elapsed_time": "1 day, 3:53:20", "remaining_time": "6:23:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8829, "total_steps": 10853, "loss": 0.1195, "learning_rate": 4.605784190033502e-07, "epoch": 0.8134703091168748, "percentage": 81.35, "elapsed_time": "1 day, 3:53:32", "remaining_time": "6:23:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8830, "total_steps": 10853, "loss": 0.1129, "learning_rate": 4.6013791494239927e-07, "epoch": 0.8135624452941448, "percentage": 81.36, "elapsed_time": "1 day, 3:53:44", "remaining_time": "6:23:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8831, "total_steps": 10853, "loss": 0.1193, "learning_rate": 4.5969760028286236e-07, "epoch": 0.8136545814714148, "percentage": 81.37, "elapsed_time": "1 day, 3:53:55", "remaining_time": "6:23:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8832, "total_steps": 10853, "loss": 0.1192, "learning_rate": 4.5925747506562287e-07, "epoch": 0.8137467176486848, "percentage": 81.38, "elapsed_time": "1 day, 3:54:06", "remaining_time": "6:23:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8833, "total_steps": 10853, "loss": 0.1143, "learning_rate": 4.5881753933154695e-07, "epoch": 0.8138388538259548, "percentage": 81.39, "elapsed_time": "1 day, 3:54:18", "remaining_time": "6:22:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8834, "total_steps": 10853, "loss": 0.1279, "learning_rate": 4.5837779312148225e-07, "epoch": 0.8139309900032248, "percentage": 81.4, "elapsed_time": "1 day, 3:54:30", "remaining_time": "6:22:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8835, "total_steps": 10853, "loss": 0.129, "learning_rate": 4.5793823647625856e-07, "epoch": 0.8140231261804948, "percentage": 81.41, "elapsed_time": "1 day, 3:54:40", "remaining_time": "6:22:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8836, "total_steps": 10853, "loss": 0.1237, "learning_rate": 4.574988694366894e-07, "epoch": 0.8141152623577648, "percentage": 81.42, "elapsed_time": "1 day, 3:54:52", "remaining_time": "6:22:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8837, "total_steps": 10853, "loss": 0.1119, "learning_rate": 4.570596920435708e-07, "epoch": 0.8142073985350348, "percentage": 81.42, "elapsed_time": "1 day, 3:55:03", "remaining_time": "6:22:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8838, "total_steps": 10853, "loss": 0.1114, "learning_rate": 4.566207043376789e-07, "epoch": 0.8142995347123048, "percentage": 81.43, "elapsed_time": "1 day, 3:55:14", "remaining_time": "6:21:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8839, "total_steps": 10853, "loss": 0.123, "learning_rate": 4.56181906359775e-07, "epoch": 0.8143916708895748, "percentage": 81.44, "elapsed_time": "1 day, 3:55:25", "remaining_time": "6:21:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8840, "total_steps": 10853, "loss": 0.1217, "learning_rate": 4.557432981506005e-07, "epoch": 0.8144838070668448, "percentage": 81.45, "elapsed_time": "1 day, 3:55:35", "remaining_time": "6:21:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8841, "total_steps": 10853, "loss": 0.1194, "learning_rate": 4.5530487975088076e-07, "epoch": 0.8145759432441148, "percentage": 81.46, "elapsed_time": "1 day, 3:55:45", "remaining_time": "6:21:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8842, "total_steps": 10853, "loss": 0.1219, "learning_rate": 4.548666512013236e-07, "epoch": 0.8146680794213849, "percentage": 81.47, "elapsed_time": "1 day, 3:55:56", "remaining_time": "6:21:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8843, "total_steps": 10853, "loss": 0.1186, "learning_rate": 4.5442861254261753e-07, "epoch": 0.8147602155986549, "percentage": 81.48, "elapsed_time": "1 day, 3:56:06", "remaining_time": "6:20:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8844, "total_steps": 10853, "loss": 0.1192, "learning_rate": 4.5399076381543536e-07, "epoch": 0.8148523517759249, "percentage": 81.49, "elapsed_time": "1 day, 3:56:17", "remaining_time": "6:20:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8845, "total_steps": 10853, "loss": 0.112, "learning_rate": 4.5355310506043053e-07, "epoch": 0.8149444879531949, "percentage": 81.5, "elapsed_time": "1 day, 3:56:27", "remaining_time": "6:20:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8846, "total_steps": 10853, "loss": 0.1112, "learning_rate": 4.531156363182407e-07, "epoch": 0.8150366241304648, "percentage": 81.51, "elapsed_time": "1 day, 3:56:37", "remaining_time": "6:20:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8847, "total_steps": 10853, "loss": 0.1274, "learning_rate": 4.526783576294835e-07, "epoch": 0.8151287603077348, "percentage": 81.52, "elapsed_time": "1 day, 3:56:49", "remaining_time": "6:20:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8848, "total_steps": 10853, "loss": 0.1144, "learning_rate": 4.5224126903476136e-07, "epoch": 0.8152208964850048, "percentage": 81.53, "elapsed_time": "1 day, 3:56:59", "remaining_time": "6:20:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8849, "total_steps": 10853, "loss": 0.121, "learning_rate": 4.518043705746578e-07, "epoch": 0.8153130326622748, "percentage": 81.54, "elapsed_time": "1 day, 3:57:10", "remaining_time": "6:19:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8850, "total_steps": 10853, "loss": 0.1259, "learning_rate": 4.5136766228974005e-07, "epoch": 0.8154051688395448, "percentage": 81.54, "elapsed_time": "1 day, 3:57:21", "remaining_time": "6:19:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8851, "total_steps": 10853, "loss": 0.1128, "learning_rate": 4.509311442205538e-07, "epoch": 0.8154973050168148, "percentage": 81.55, "elapsed_time": "1 day, 3:57:31", "remaining_time": "6:19:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8852, "total_steps": 10853, "loss": 0.1173, "learning_rate": 4.504948164076317e-07, "epoch": 0.8155894411940848, "percentage": 81.56, "elapsed_time": "1 day, 3:57:41", "remaining_time": "6:19:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8853, "total_steps": 10853, "loss": 0.108, "learning_rate": 4.5005867889148626e-07, "epoch": 0.8156815773713548, "percentage": 81.57, "elapsed_time": "1 day, 3:57:51", "remaining_time": "6:19:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8854, "total_steps": 10853, "loss": 0.1177, "learning_rate": 4.4962273171261393e-07, "epoch": 0.8157737135486248, "percentage": 81.58, "elapsed_time": "1 day, 3:58:03", "remaining_time": "6:18:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8855, "total_steps": 10853, "loss": 0.1016, "learning_rate": 4.491869749114908e-07, "epoch": 0.8158658497258948, "percentage": 81.59, "elapsed_time": "1 day, 3:58:14", "remaining_time": "6:18:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8856, "total_steps": 10853, "loss": 0.1213, "learning_rate": 4.4875140852857854e-07, "epoch": 0.8159579859031649, "percentage": 81.6, "elapsed_time": "1 day, 3:58:24", "remaining_time": "6:18:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8857, "total_steps": 10853, "loss": 0.1307, "learning_rate": 4.4831603260431787e-07, "epoch": 0.8160501220804349, "percentage": 81.61, "elapsed_time": "1 day, 3:58:36", "remaining_time": "6:18:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8858, "total_steps": 10853, "loss": 0.1084, "learning_rate": 4.478808471791354e-07, "epoch": 0.8161422582577049, "percentage": 81.62, "elapsed_time": "1 day, 3:58:47", "remaining_time": "6:18:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8859, "total_steps": 10853, "loss": 0.1268, "learning_rate": 4.474458522934361e-07, "epoch": 0.8162343944349749, "percentage": 81.63, "elapsed_time": "1 day, 3:58:58", "remaining_time": "6:17:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8860, "total_steps": 10853, "loss": 0.1232, "learning_rate": 4.470110479876105e-07, "epoch": 0.8163265306122449, "percentage": 81.64, "elapsed_time": "1 day, 3:59:10", "remaining_time": "6:17:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8861, "total_steps": 10853, "loss": 0.1086, "learning_rate": 4.4657643430203067e-07, "epoch": 0.8164186667895149, "percentage": 81.65, "elapsed_time": "1 day, 3:59:22", "remaining_time": "6:17:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8862, "total_steps": 10853, "loss": 0.1232, "learning_rate": 4.461420112770501e-07, "epoch": 0.8165108029667849, "percentage": 81.65, "elapsed_time": "1 day, 3:59:32", "remaining_time": "6:17:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8863, "total_steps": 10853, "loss": 0.1166, "learning_rate": 4.45707778953004e-07, "epoch": 0.8166029391440549, "percentage": 81.66, "elapsed_time": "1 day, 3:59:43", "remaining_time": "6:17:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8864, "total_steps": 10853, "loss": 0.1229, "learning_rate": 4.452737373702115e-07, "epoch": 0.8166950753213249, "percentage": 81.67, "elapsed_time": "1 day, 3:59:53", "remaining_time": "6:16:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8865, "total_steps": 10853, "loss": 0.1105, "learning_rate": 4.44839886568974e-07, "epoch": 0.8167872114985949, "percentage": 81.68, "elapsed_time": "1 day, 4:00:05", "remaining_time": "6:16:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8866, "total_steps": 10853, "loss": 0.1207, "learning_rate": 4.444062265895746e-07, "epoch": 0.8168793476758649, "percentage": 81.69, "elapsed_time": "1 day, 4:00:14", "remaining_time": "6:16:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8867, "total_steps": 10853, "loss": 0.1159, "learning_rate": 4.439727574722783e-07, "epoch": 0.8169714838531349, "percentage": 81.7, "elapsed_time": "1 day, 4:00:26", "remaining_time": "6:16:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8868, "total_steps": 10853, "loss": 0.114, "learning_rate": 4.435394792573322e-07, "epoch": 0.8170636200304049, "percentage": 81.71, "elapsed_time": "1 day, 4:00:37", "remaining_time": "6:16:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8869, "total_steps": 10853, "loss": 0.1171, "learning_rate": 4.431063919849668e-07, "epoch": 0.8171557562076749, "percentage": 81.72, "elapsed_time": "1 day, 4:00:48", "remaining_time": "6:15:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8870, "total_steps": 10853, "loss": 0.114, "learning_rate": 4.4267349569539404e-07, "epoch": 0.817247892384945, "percentage": 81.73, "elapsed_time": "1 day, 4:00:58", "remaining_time": "6:15:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8871, "total_steps": 10853, "loss": 0.1259, "learning_rate": 4.422407904288095e-07, "epoch": 0.817340028562215, "percentage": 81.74, "elapsed_time": "1 day, 4:01:09", "remaining_time": "6:15:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8872, "total_steps": 10853, "loss": 0.1072, "learning_rate": 4.418082762253889e-07, "epoch": 0.817432164739485, "percentage": 81.75, "elapsed_time": "1 day, 4:01:19", "remaining_time": "6:15:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8873, "total_steps": 10853, "loss": 0.1004, "learning_rate": 4.4137595312529066e-07, "epoch": 0.817524300916755, "percentage": 81.76, "elapsed_time": "1 day, 4:01:30", "remaining_time": "6:15:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8874, "total_steps": 10853, "loss": 0.1161, "learning_rate": 4.4094382116865704e-07, "epoch": 0.817616437094025, "percentage": 81.77, "elapsed_time": "1 day, 4:01:42", "remaining_time": "6:15:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8875, "total_steps": 10853, "loss": 0.1294, "learning_rate": 4.4051188039561156e-07, "epoch": 0.817708573271295, "percentage": 81.77, "elapsed_time": "1 day, 4:01:53", "remaining_time": "6:14:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8876, "total_steps": 10853, "loss": 0.1223, "learning_rate": 4.400801308462591e-07, "epoch": 0.817800709448565, "percentage": 81.78, "elapsed_time": "1 day, 4:02:04", "remaining_time": "6:14:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8877, "total_steps": 10853, "loss": 0.1133, "learning_rate": 4.396485725606886e-07, "epoch": 0.817892845625835, "percentage": 81.79, "elapsed_time": "1 day, 4:02:16", "remaining_time": "6:14:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8878, "total_steps": 10853, "loss": 0.1228, "learning_rate": 4.3921720557896953e-07, "epoch": 0.817984981803105, "percentage": 81.8, "elapsed_time": "1 day, 4:02:28", "remaining_time": "6:14:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8879, "total_steps": 10853, "loss": 0.1203, "learning_rate": 4.387860299411553e-07, "epoch": 0.818077117980375, "percentage": 81.81, "elapsed_time": "1 day, 4:02:39", "remaining_time": "6:14:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8880, "total_steps": 10853, "loss": 0.1145, "learning_rate": 4.383550456872793e-07, "epoch": 0.818169254157645, "percentage": 81.82, "elapsed_time": "1 day, 4:02:50", "remaining_time": "6:13:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8881, "total_steps": 10853, "loss": 0.1277, "learning_rate": 4.3792425285735935e-07, "epoch": 0.818261390334915, "percentage": 81.83, "elapsed_time": "1 day, 4:03:00", "remaining_time": "6:13:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8882, "total_steps": 10853, "loss": 0.1229, "learning_rate": 4.3749365149139493e-07, "epoch": 0.818353526512185, "percentage": 81.84, "elapsed_time": "1 day, 4:03:12", "remaining_time": "6:13:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8883, "total_steps": 10853, "loss": 0.1073, "learning_rate": 4.3706324162936684e-07, "epoch": 0.8184456626894551, "percentage": 81.85, "elapsed_time": "1 day, 4:03:22", "remaining_time": "6:13:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8884, "total_steps": 10853, "loss": 0.119, "learning_rate": 4.3663302331123815e-07, "epoch": 0.8185377988667251, "percentage": 81.86, "elapsed_time": "1 day, 4:03:33", "remaining_time": "6:13:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8885, "total_steps": 10853, "loss": 0.1149, "learning_rate": 4.362029965769554e-07, "epoch": 0.8186299350439951, "percentage": 81.87, "elapsed_time": "1 day, 4:03:45", "remaining_time": "6:12:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8886, "total_steps": 10853, "loss": 0.1249, "learning_rate": 4.3577316146644677e-07, "epoch": 0.8187220712212651, "percentage": 81.88, "elapsed_time": "1 day, 4:03:56", "remaining_time": "6:12:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8887, "total_steps": 10853, "loss": 0.1158, "learning_rate": 4.353435180196225e-07, "epoch": 0.818814207398535, "percentage": 81.89, "elapsed_time": "1 day, 4:04:07", "remaining_time": "6:12:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8888, "total_steps": 10853, "loss": 0.118, "learning_rate": 4.349140662763751e-07, "epoch": 0.818906343575805, "percentage": 81.89, "elapsed_time": "1 day, 4:04:18", "remaining_time": "6:12:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8889, "total_steps": 10853, "loss": 0.1262, "learning_rate": 4.3448480627657804e-07, "epoch": 0.818998479753075, "percentage": 81.9, "elapsed_time": "1 day, 4:04:30", "remaining_time": "6:12:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8890, "total_steps": 10853, "loss": 0.1236, "learning_rate": 4.3405573806008905e-07, "epoch": 0.819090615930345, "percentage": 81.91, "elapsed_time": "1 day, 4:04:42", "remaining_time": "6:11:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8891, "total_steps": 10853, "loss": 0.1198, "learning_rate": 4.336268616667477e-07, "epoch": 0.819182752107615, "percentage": 81.92, "elapsed_time": "1 day, 4:04:51", "remaining_time": "6:11:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8892, "total_steps": 10853, "loss": 0.1159, "learning_rate": 4.3319817713637415e-07, "epoch": 0.819274888284885, "percentage": 81.93, "elapsed_time": "1 day, 4:05:02", "remaining_time": "6:11:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8893, "total_steps": 10853, "loss": 0.1145, "learning_rate": 4.327696845087728e-07, "epoch": 0.819367024462155, "percentage": 81.94, "elapsed_time": "1 day, 4:05:13", "remaining_time": "6:11:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8894, "total_steps": 10853, "loss": 0.1148, "learning_rate": 4.323413838237281e-07, "epoch": 0.819459160639425, "percentage": 81.95, "elapsed_time": "1 day, 4:05:23", "remaining_time": "6:11:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8895, "total_steps": 10853, "loss": 0.1044, "learning_rate": 4.319132751210084e-07, "epoch": 0.819551296816695, "percentage": 81.96, "elapsed_time": "1 day, 4:05:34", "remaining_time": "6:11:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8896, "total_steps": 10853, "loss": 0.1277, "learning_rate": 4.3148535844036444e-07, "epoch": 0.819643432993965, "percentage": 81.97, "elapsed_time": "1 day, 4:05:45", "remaining_time": "6:10:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8897, "total_steps": 10853, "loss": 0.1042, "learning_rate": 4.310576338215269e-07, "epoch": 0.8197355691712351, "percentage": 81.98, "elapsed_time": "1 day, 4:05:56", "remaining_time": "6:10:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8898, "total_steps": 10853, "loss": 0.1137, "learning_rate": 4.3063010130421133e-07, "epoch": 0.8198277053485051, "percentage": 81.99, "elapsed_time": "1 day, 4:06:07", "remaining_time": "6:10:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8899, "total_steps": 10853, "loss": 0.1196, "learning_rate": 4.302027609281129e-07, "epoch": 0.8199198415257751, "percentage": 82.0, "elapsed_time": "1 day, 4:06:19", "remaining_time": "6:10:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8900, "total_steps": 10853, "loss": 0.1255, "learning_rate": 4.2977561273291166e-07, "epoch": 0.8200119777030451, "percentage": 82.0, "elapsed_time": "1 day, 4:06:30", "remaining_time": "6:10:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8901, "total_steps": 10853, "loss": 0.1116, "learning_rate": 4.2934865675826666e-07, "epoch": 0.8201041138803151, "percentage": 82.01, "elapsed_time": "1 day, 4:06:40", "remaining_time": "6:09:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8902, "total_steps": 10853, "loss": 0.1194, "learning_rate": 4.289218930438219e-07, "epoch": 0.8201962500575851, "percentage": 82.02, "elapsed_time": "1 day, 4:06:51", "remaining_time": "6:09:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8903, "total_steps": 10853, "loss": 0.1276, "learning_rate": 4.284953216292029e-07, "epoch": 0.8202883862348551, "percentage": 82.03, "elapsed_time": "1 day, 4:07:02", "remaining_time": "6:09:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8904, "total_steps": 10853, "loss": 0.1178, "learning_rate": 4.280689425540163e-07, "epoch": 0.8203805224121251, "percentage": 82.04, "elapsed_time": "1 day, 4:07:13", "remaining_time": "6:09:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8905, "total_steps": 10853, "loss": 0.1096, "learning_rate": 4.2764275585785054e-07, "epoch": 0.8204726585893951, "percentage": 82.05, "elapsed_time": "1 day, 4:07:23", "remaining_time": "6:09:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8906, "total_steps": 10853, "loss": 0.1183, "learning_rate": 4.27216761580278e-07, "epoch": 0.8205647947666651, "percentage": 82.06, "elapsed_time": "1 day, 4:07:34", "remaining_time": "6:08:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8907, "total_steps": 10853, "loss": 0.1202, "learning_rate": 4.2679095976085217e-07, "epoch": 0.8206569309439351, "percentage": 82.07, "elapsed_time": "1 day, 4:07:45", "remaining_time": "6:08:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8908, "total_steps": 10853, "loss": 0.1181, "learning_rate": 4.2636535043910965e-07, "epoch": 0.8207490671212051, "percentage": 82.08, "elapsed_time": "1 day, 4:07:55", "remaining_time": "6:08:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8909, "total_steps": 10853, "loss": 0.1126, "learning_rate": 4.2593993365456746e-07, "epoch": 0.8208412032984751, "percentage": 82.09, "elapsed_time": "1 day, 4:08:05", "remaining_time": "6:08:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8910, "total_steps": 10853, "loss": 0.1177, "learning_rate": 4.255147094467249e-07, "epoch": 0.8209333394757452, "percentage": 82.1, "elapsed_time": "1 day, 4:08:18", "remaining_time": "6:08:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8911, "total_steps": 10853, "loss": 0.1262, "learning_rate": 4.250896778550648e-07, "epoch": 0.8210254756530152, "percentage": 82.11, "elapsed_time": "1 day, 4:08:29", "remaining_time": "6:07:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8912, "total_steps": 10853, "loss": 0.1115, "learning_rate": 4.246648389190522e-07, "epoch": 0.8211176118302852, "percentage": 82.12, "elapsed_time": "1 day, 4:08:38", "remaining_time": "6:07:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8913, "total_steps": 10853, "loss": 0.1262, "learning_rate": 4.24240192678132e-07, "epoch": 0.8212097480075552, "percentage": 82.12, "elapsed_time": "1 day, 4:08:49", "remaining_time": "6:07:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8914, "total_steps": 10853, "loss": 0.115, "learning_rate": 4.23815739171734e-07, "epoch": 0.8213018841848252, "percentage": 82.13, "elapsed_time": "1 day, 4:08:58", "remaining_time": "6:07:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8915, "total_steps": 10853, "loss": 0.1298, "learning_rate": 4.233914784392673e-07, "epoch": 0.8213940203620952, "percentage": 82.14, "elapsed_time": "1 day, 4:09:09", "remaining_time": "6:07:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8916, "total_steps": 10853, "loss": 0.1166, "learning_rate": 4.229674105201259e-07, "epoch": 0.8214861565393652, "percentage": 82.15, "elapsed_time": "1 day, 4:09:19", "remaining_time": "6:07:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8917, "total_steps": 10853, "loss": 0.116, "learning_rate": 4.225435354536833e-07, "epoch": 0.8215782927166352, "percentage": 82.16, "elapsed_time": "1 day, 4:09:30", "remaining_time": "6:06:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8918, "total_steps": 10853, "loss": 0.1141, "learning_rate": 4.221198532792972e-07, "epoch": 0.8216704288939052, "percentage": 82.17, "elapsed_time": "1 day, 4:09:38", "remaining_time": "6:06:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8919, "total_steps": 10853, "loss": 0.1184, "learning_rate": 4.2169636403630697e-07, "epoch": 0.8217625650711752, "percentage": 82.18, "elapsed_time": "1 day, 4:09:48", "remaining_time": "6:06:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8920, "total_steps": 10853, "loss": 0.1157, "learning_rate": 4.212730677640328e-07, "epoch": 0.8218547012484452, "percentage": 82.19, "elapsed_time": "1 day, 4:09:59", "remaining_time": "6:06:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8921, "total_steps": 10853, "loss": 0.12, "learning_rate": 4.2084996450177744e-07, "epoch": 0.8219468374257152, "percentage": 82.2, "elapsed_time": "1 day, 4:10:10", "remaining_time": "6:06:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8922, "total_steps": 10853, "loss": 0.1286, "learning_rate": 4.20427054288827e-07, "epoch": 0.8220389736029852, "percentage": 82.21, "elapsed_time": "1 day, 4:10:21", "remaining_time": "6:05:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8923, "total_steps": 10853, "loss": 0.1252, "learning_rate": 4.20004337164448e-07, "epoch": 0.8221311097802552, "percentage": 82.22, "elapsed_time": "1 day, 4:10:32", "remaining_time": "6:05:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8924, "total_steps": 10853, "loss": 0.1116, "learning_rate": 4.1958181316789084e-07, "epoch": 0.8222232459575253, "percentage": 82.23, "elapsed_time": "1 day, 4:10:41", "remaining_time": "6:05:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8925, "total_steps": 10853, "loss": 0.1131, "learning_rate": 4.1915948233838625e-07, "epoch": 0.8223153821347953, "percentage": 82.24, "elapsed_time": "1 day, 4:10:54", "remaining_time": "6:05:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8926, "total_steps": 10853, "loss": 0.119, "learning_rate": 4.1873734471514685e-07, "epoch": 0.8224075183120653, "percentage": 82.24, "elapsed_time": "1 day, 4:11:04", "remaining_time": "6:05:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8927, "total_steps": 10853, "loss": 0.1098, "learning_rate": 4.1831540033736935e-07, "epoch": 0.8224996544893353, "percentage": 82.25, "elapsed_time": "1 day, 4:11:14", "remaining_time": "6:04:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8928, "total_steps": 10853, "loss": 0.1201, "learning_rate": 4.1789364924423067e-07, "epoch": 0.8225917906666053, "percentage": 82.26, "elapsed_time": "1 day, 4:11:25", "remaining_time": "6:04:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8929, "total_steps": 10853, "loss": 0.1212, "learning_rate": 4.174720914748914e-07, "epoch": 0.8226839268438753, "percentage": 82.27, "elapsed_time": "1 day, 4:11:36", "remaining_time": "6:04:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8930, "total_steps": 10853, "loss": 0.1146, "learning_rate": 4.1705072706849287e-07, "epoch": 0.8227760630211453, "percentage": 82.28, "elapsed_time": "1 day, 4:11:47", "remaining_time": "6:04:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8931, "total_steps": 10853, "loss": 0.1214, "learning_rate": 4.166295560641576e-07, "epoch": 0.8228681991984153, "percentage": 82.29, "elapsed_time": "1 day, 4:11:59", "remaining_time": "6:04:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8932, "total_steps": 10853, "loss": 0.1155, "learning_rate": 4.1620857850099227e-07, "epoch": 0.8229603353756852, "percentage": 82.3, "elapsed_time": "1 day, 4:12:10", "remaining_time": "6:03:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8933, "total_steps": 10853, "loss": 0.1293, "learning_rate": 4.157877944180852e-07, "epoch": 0.8230524715529552, "percentage": 82.31, "elapsed_time": "1 day, 4:12:19", "remaining_time": "6:03:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8934, "total_steps": 10853, "loss": 0.128, "learning_rate": 4.153672038545054e-07, "epoch": 0.8231446077302252, "percentage": 82.32, "elapsed_time": "1 day, 4:12:30", "remaining_time": "6:03:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8935, "total_steps": 10853, "loss": 0.1413, "learning_rate": 4.1494680684930485e-07, "epoch": 0.8232367439074952, "percentage": 82.33, "elapsed_time": "1 day, 4:12:41", "remaining_time": "6:03:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8936, "total_steps": 10853, "loss": 0.1247, "learning_rate": 4.1452660344151826e-07, "epoch": 0.8233288800847652, "percentage": 82.34, "elapsed_time": "1 day, 4:12:51", "remaining_time": "6:03:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8937, "total_steps": 10853, "loss": 0.1045, "learning_rate": 4.141065936701613e-07, "epoch": 0.8234210162620353, "percentage": 82.35, "elapsed_time": "1 day, 4:13:02", "remaining_time": "6:02:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8938, "total_steps": 10853, "loss": 0.1285, "learning_rate": 4.1368677757423064e-07, "epoch": 0.8235131524393053, "percentage": 82.36, "elapsed_time": "1 day, 4:13:14", "remaining_time": "6:02:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8939, "total_steps": 10853, "loss": 0.1302, "learning_rate": 4.1326715519270725e-07, "epoch": 0.8236052886165753, "percentage": 82.36, "elapsed_time": "1 day, 4:13:25", "remaining_time": "6:02:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8940, "total_steps": 10853, "loss": 0.1276, "learning_rate": 4.1284772656455334e-07, "epoch": 0.8236974247938453, "percentage": 82.37, "elapsed_time": "1 day, 4:13:36", "remaining_time": "6:02:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8941, "total_steps": 10853, "loss": 0.1341, "learning_rate": 4.12428491728713e-07, "epoch": 0.8237895609711153, "percentage": 82.38, "elapsed_time": "1 day, 4:13:47", "remaining_time": "6:02:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8942, "total_steps": 10853, "loss": 0.121, "learning_rate": 4.1200945072411207e-07, "epoch": 0.8238816971483853, "percentage": 82.39, "elapsed_time": "1 day, 4:13:57", "remaining_time": "6:02:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8943, "total_steps": 10853, "loss": 0.1326, "learning_rate": 4.1159060358965745e-07, "epoch": 0.8239738333256553, "percentage": 82.4, "elapsed_time": "1 day, 4:14:09", "remaining_time": "6:01:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8944, "total_steps": 10853, "loss": 0.1183, "learning_rate": 4.111719503642403e-07, "epoch": 0.8240659695029253, "percentage": 82.41, "elapsed_time": "1 day, 4:14:19", "remaining_time": "6:01:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8945, "total_steps": 10853, "loss": 0.1355, "learning_rate": 4.1075349108673306e-07, "epoch": 0.8241581056801953, "percentage": 82.42, "elapsed_time": "1 day, 4:14:28", "remaining_time": "6:01:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8946, "total_steps": 10853, "loss": 0.1413, "learning_rate": 4.1033522579598804e-07, "epoch": 0.8242502418574653, "percentage": 82.43, "elapsed_time": "1 day, 4:14:38", "remaining_time": "6:01:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8947, "total_steps": 10853, "loss": 0.1146, "learning_rate": 4.0991715453084307e-07, "epoch": 0.8243423780347353, "percentage": 82.44, "elapsed_time": "1 day, 4:14:48", "remaining_time": "6:01:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8948, "total_steps": 10853, "loss": 0.1172, "learning_rate": 4.0949927733011455e-07, "epoch": 0.8244345142120053, "percentage": 82.45, "elapsed_time": "1 day, 4:14:59", "remaining_time": "6:00:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8949, "total_steps": 10853, "loss": 0.1142, "learning_rate": 4.0908159423260374e-07, "epoch": 0.8245266503892753, "percentage": 82.46, "elapsed_time": "1 day, 4:15:10", "remaining_time": "6:00:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8950, "total_steps": 10853, "loss": 0.1162, "learning_rate": 4.086641052770915e-07, "epoch": 0.8246187865665453, "percentage": 82.47, "elapsed_time": "1 day, 4:15:22", "remaining_time": "6:00:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8951, "total_steps": 10853, "loss": 0.1209, "learning_rate": 4.082468105023418e-07, "epoch": 0.8247109227438154, "percentage": 82.47, "elapsed_time": "1 day, 4:15:33", "remaining_time": "6:00:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8952, "total_steps": 10853, "loss": 0.1143, "learning_rate": 4.078297099471018e-07, "epoch": 0.8248030589210854, "percentage": 82.48, "elapsed_time": "1 day, 4:15:43", "remaining_time": "6:00:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8953, "total_steps": 10853, "loss": 0.1254, "learning_rate": 4.0741280365009765e-07, "epoch": 0.8248951950983554, "percentage": 82.49, "elapsed_time": "1 day, 4:15:54", "remaining_time": "5:59:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8954, "total_steps": 10853, "loss": 0.118, "learning_rate": 4.069960916500404e-07, "epoch": 0.8249873312756254, "percentage": 82.5, "elapsed_time": "1 day, 4:16:05", "remaining_time": "5:59:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8955, "total_steps": 10853, "loss": 0.1236, "learning_rate": 4.065795739856207e-07, "epoch": 0.8250794674528954, "percentage": 82.51, "elapsed_time": "1 day, 4:16:16", "remaining_time": "5:59:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8956, "total_steps": 10853, "loss": 0.1026, "learning_rate": 4.0616325069551296e-07, "epoch": 0.8251716036301654, "percentage": 82.52, "elapsed_time": "1 day, 4:16:26", "remaining_time": "5:59:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8957, "total_steps": 10853, "loss": 0.1185, "learning_rate": 4.057471218183734e-07, "epoch": 0.8252637398074354, "percentage": 82.53, "elapsed_time": "1 day, 4:16:36", "remaining_time": "5:59:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8958, "total_steps": 10853, "loss": 0.1287, "learning_rate": 4.0533118739283864e-07, "epoch": 0.8253558759847054, "percentage": 82.54, "elapsed_time": "1 day, 4:16:46", "remaining_time": "5:58:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8959, "total_steps": 10853, "loss": 0.1096, "learning_rate": 4.049154474575284e-07, "epoch": 0.8254480121619754, "percentage": 82.55, "elapsed_time": "1 day, 4:16:56", "remaining_time": "5:58:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8960, "total_steps": 10853, "loss": 0.1254, "learning_rate": 4.04499902051044e-07, "epoch": 0.8255401483392454, "percentage": 82.56, "elapsed_time": "1 day, 4:17:06", "remaining_time": "5:58:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8961, "total_steps": 10853, "loss": 0.1216, "learning_rate": 4.0408455121196957e-07, "epoch": 0.8256322845165154, "percentage": 82.57, "elapsed_time": "1 day, 4:17:16", "remaining_time": "5:58:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8962, "total_steps": 10853, "loss": 0.1069, "learning_rate": 4.0366939497887033e-07, "epoch": 0.8257244206937854, "percentage": 82.58, "elapsed_time": "1 day, 4:17:25", "remaining_time": "5:58:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8963, "total_steps": 10853, "loss": 0.1267, "learning_rate": 4.032544333902935e-07, "epoch": 0.8258165568710554, "percentage": 82.59, "elapsed_time": "1 day, 4:17:35", "remaining_time": "5:57:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8964, "total_steps": 10853, "loss": 0.1182, "learning_rate": 4.028396664847678e-07, "epoch": 0.8259086930483254, "percentage": 82.59, "elapsed_time": "1 day, 4:17:46", "remaining_time": "5:57:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8965, "total_steps": 10853, "loss": 0.1126, "learning_rate": 4.0242509430080456e-07, "epoch": 0.8260008292255955, "percentage": 82.6, "elapsed_time": "1 day, 4:17:57", "remaining_time": "5:57:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8966, "total_steps": 10853, "loss": 0.1324, "learning_rate": 4.0201071687689746e-07, "epoch": 0.8260929654028655, "percentage": 82.61, "elapsed_time": "1 day, 4:18:09", "remaining_time": "5:57:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8967, "total_steps": 10853, "loss": 0.1165, "learning_rate": 4.0159653425152074e-07, "epoch": 0.8261851015801355, "percentage": 82.62, "elapsed_time": "1 day, 4:18:20", "remaining_time": "5:57:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8968, "total_steps": 10853, "loss": 0.1046, "learning_rate": 4.011825464631322e-07, "epoch": 0.8262772377574055, "percentage": 82.63, "elapsed_time": "1 day, 4:18:30", "remaining_time": "5:57:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8969, "total_steps": 10853, "loss": 0.113, "learning_rate": 4.0076875355016975e-07, "epoch": 0.8263693739346755, "percentage": 82.64, "elapsed_time": "1 day, 4:18:40", "remaining_time": "5:56:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8970, "total_steps": 10853, "loss": 0.1175, "learning_rate": 4.003551555510549e-07, "epoch": 0.8264615101119455, "percentage": 82.65, "elapsed_time": "1 day, 4:18:50", "remaining_time": "5:56:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8971, "total_steps": 10853, "loss": 0.1273, "learning_rate": 3.99941752504189e-07, "epoch": 0.8265536462892155, "percentage": 82.66, "elapsed_time": "1 day, 4:19:01", "remaining_time": "5:56:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8972, "total_steps": 10853, "loss": 0.1277, "learning_rate": 3.995285444479574e-07, "epoch": 0.8266457824664855, "percentage": 82.67, "elapsed_time": "1 day, 4:19:12", "remaining_time": "5:56:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8973, "total_steps": 10853, "loss": 0.1156, "learning_rate": 3.9911553142072733e-07, "epoch": 0.8267379186437555, "percentage": 82.68, "elapsed_time": "1 day, 4:19:22", "remaining_time": "5:56:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8974, "total_steps": 10853, "loss": 0.1268, "learning_rate": 3.987027134608462e-07, "epoch": 0.8268300548210255, "percentage": 82.69, "elapsed_time": "1 day, 4:19:35", "remaining_time": "5:55:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8975, "total_steps": 10853, "loss": 0.1246, "learning_rate": 3.9829009060664363e-07, "epoch": 0.8269221909982954, "percentage": 82.7, "elapsed_time": "1 day, 4:19:45", "remaining_time": "5:55:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8976, "total_steps": 10853, "loss": 0.1066, "learning_rate": 3.9787766289643233e-07, "epoch": 0.8270143271755654, "percentage": 82.71, "elapsed_time": "1 day, 4:19:56", "remaining_time": "5:55:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8977, "total_steps": 10853, "loss": 0.1135, "learning_rate": 3.974654303685063e-07, "epoch": 0.8271064633528354, "percentage": 82.71, "elapsed_time": "1 day, 4:20:08", "remaining_time": "5:55:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8978, "total_steps": 10853, "loss": 0.111, "learning_rate": 3.97053393061142e-07, "epoch": 0.8271985995301055, "percentage": 82.72, "elapsed_time": "1 day, 4:20:17", "remaining_time": "5:55:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8979, "total_steps": 10853, "loss": 0.1093, "learning_rate": 3.966415510125965e-07, "epoch": 0.8272907357073755, "percentage": 82.73, "elapsed_time": "1 day, 4:20:28", "remaining_time": "5:54:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8980, "total_steps": 10853, "loss": 0.1204, "learning_rate": 3.9622990426110867e-07, "epoch": 0.8273828718846455, "percentage": 82.74, "elapsed_time": "1 day, 4:20:38", "remaining_time": "5:54:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8981, "total_steps": 10853, "loss": 0.1204, "learning_rate": 3.958184528449005e-07, "epoch": 0.8274750080619155, "percentage": 82.75, "elapsed_time": "1 day, 4:20:48", "remaining_time": "5:54:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8982, "total_steps": 10853, "loss": 0.127, "learning_rate": 3.954071968021755e-07, "epoch": 0.8275671442391855, "percentage": 82.76, "elapsed_time": "1 day, 4:21:00", "remaining_time": "5:54:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8983, "total_steps": 10853, "loss": 0.1071, "learning_rate": 3.9499613617111965e-07, "epoch": 0.8276592804164555, "percentage": 82.77, "elapsed_time": "1 day, 4:21:10", "remaining_time": "5:54:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8984, "total_steps": 10853, "loss": 0.1233, "learning_rate": 3.945852709898987e-07, "epoch": 0.8277514165937255, "percentage": 82.78, "elapsed_time": "1 day, 4:21:21", "remaining_time": "5:53:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8985, "total_steps": 10853, "loss": 0.1155, "learning_rate": 3.941746012966616e-07, "epoch": 0.8278435527709955, "percentage": 82.79, "elapsed_time": "1 day, 4:21:33", "remaining_time": "5:53:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8986, "total_steps": 10853, "loss": 0.1245, "learning_rate": 3.937641271295392e-07, "epoch": 0.8279356889482655, "percentage": 82.8, "elapsed_time": "1 day, 4:21:44", "remaining_time": "5:53:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8987, "total_steps": 10853, "loss": 0.1329, "learning_rate": 3.93353848526645e-07, "epoch": 0.8280278251255355, "percentage": 82.81, "elapsed_time": "1 day, 4:21:55", "remaining_time": "5:53:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8988, "total_steps": 10853, "loss": 0.1149, "learning_rate": 3.9294376552607233e-07, "epoch": 0.8281199613028055, "percentage": 82.82, "elapsed_time": "1 day, 4:22:05", "remaining_time": "5:53:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8989, "total_steps": 10853, "loss": 0.1091, "learning_rate": 3.92533878165898e-07, "epoch": 0.8282120974800755, "percentage": 82.83, "elapsed_time": "1 day, 4:22:16", "remaining_time": "5:52:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8990, "total_steps": 10853, "loss": 0.1123, "learning_rate": 3.921241864841793e-07, "epoch": 0.8283042336573455, "percentage": 82.83, "elapsed_time": "1 day, 4:22:25", "remaining_time": "5:52:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8991, "total_steps": 10853, "loss": 0.1122, "learning_rate": 3.917146905189576e-07, "epoch": 0.8283963698346155, "percentage": 82.84, "elapsed_time": "1 day, 4:22:36", "remaining_time": "5:52:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8992, "total_steps": 10853, "loss": 0.1155, "learning_rate": 3.913053903082531e-07, "epoch": 0.8284885060118856, "percentage": 82.85, "elapsed_time": "1 day, 4:22:45", "remaining_time": "5:52:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8993, "total_steps": 10853, "loss": 0.1204, "learning_rate": 3.9089628589007e-07, "epoch": 0.8285806421891556, "percentage": 82.86, "elapsed_time": "1 day, 4:22:56", "remaining_time": "5:52:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8994, "total_steps": 10853, "loss": 0.1287, "learning_rate": 3.9048737730239427e-07, "epoch": 0.8286727783664256, "percentage": 82.87, "elapsed_time": "1 day, 4:23:07", "remaining_time": "5:52:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8995, "total_steps": 10853, "loss": 0.1032, "learning_rate": 3.9007866458319275e-07, "epoch": 0.8287649145436956, "percentage": 82.88, "elapsed_time": "1 day, 4:23:16", "remaining_time": "5:51:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8996, "total_steps": 10853, "loss": 0.1183, "learning_rate": 3.8967014777041344e-07, "epoch": 0.8288570507209656, "percentage": 82.89, "elapsed_time": "1 day, 4:23:27", "remaining_time": "5:51:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8997, "total_steps": 10853, "loss": 0.12, "learning_rate": 3.892618269019882e-07, "epoch": 0.8289491868982356, "percentage": 82.9, "elapsed_time": "1 day, 4:23:37", "remaining_time": "5:51:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8998, "total_steps": 10853, "loss": 0.1162, "learning_rate": 3.888537020158295e-07, "epoch": 0.8290413230755056, "percentage": 82.91, "elapsed_time": "1 day, 4:23:48", "remaining_time": "5:51:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8999, "total_steps": 10853, "loss": 0.1206, "learning_rate": 3.8844577314983254e-07, "epoch": 0.8291334592527756, "percentage": 82.92, "elapsed_time": "1 day, 4:23:59", "remaining_time": "5:51:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9000, "total_steps": 10853, "loss": 0.1147, "learning_rate": 3.8803804034187235e-07, "epoch": 0.8292255954300456, "percentage": 82.93, "elapsed_time": "1 day, 4:24:10", "remaining_time": "5:50:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9000, "total_steps": 10853, "eval_loss": 0.11866238713264465, "epoch": 0.8292255954300456, "percentage": 82.93, "elapsed_time": "1 day, 4:29:09", "remaining_time": "5:51:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9001, "total_steps": 10853, "loss": 0.1019, "learning_rate": 3.8763050362980723e-07, "epoch": 0.8293177316073156, "percentage": 82.94, "elapsed_time": "1 day, 4:29:20", "remaining_time": "5:51:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9002, "total_steps": 10853, "loss": 0.1274, "learning_rate": 3.8722316305147693e-07, "epoch": 0.8294098677845856, "percentage": 82.94, "elapsed_time": "1 day, 4:29:31", "remaining_time": "5:51:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9003, "total_steps": 10853, "loss": 0.1017, "learning_rate": 3.8681601864470396e-07, "epoch": 0.8295020039618556, "percentage": 82.95, "elapsed_time": "1 day, 4:29:42", "remaining_time": "5:51:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9004, "total_steps": 10853, "loss": 0.1246, "learning_rate": 3.864090704472906e-07, "epoch": 0.8295941401391256, "percentage": 82.96, "elapsed_time": "1 day, 4:29:54", "remaining_time": "5:51:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9005, "total_steps": 10853, "loss": 0.118, "learning_rate": 3.86002318497023e-07, "epoch": 0.8296862763163957, "percentage": 82.97, "elapsed_time": "1 day, 4:30:05", "remaining_time": "5:50:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9006, "total_steps": 10853, "loss": 0.1339, "learning_rate": 3.855957628316673e-07, "epoch": 0.8297784124936657, "percentage": 82.98, "elapsed_time": "1 day, 4:30:16", "remaining_time": "5:50:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9007, "total_steps": 10853, "loss": 0.1323, "learning_rate": 3.8518940348897277e-07, "epoch": 0.8298705486709357, "percentage": 82.99, "elapsed_time": "1 day, 4:30:28", "remaining_time": "5:50:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9008, "total_steps": 10853, "loss": 0.1181, "learning_rate": 3.8478324050666926e-07, "epoch": 0.8299626848482057, "percentage": 83.0, "elapsed_time": "1 day, 4:30:38", "remaining_time": "5:50:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9009, "total_steps": 10853, "loss": 0.1142, "learning_rate": 3.8437727392246966e-07, "epoch": 0.8300548210254757, "percentage": 83.01, "elapsed_time": "1 day, 4:30:48", "remaining_time": "5:50:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9010, "total_steps": 10853, "loss": 0.1252, "learning_rate": 3.839715037740677e-07, "epoch": 0.8301469572027457, "percentage": 83.02, "elapsed_time": "1 day, 4:30:59", "remaining_time": "5:49:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9011, "total_steps": 10853, "loss": 0.1252, "learning_rate": 3.835659300991401e-07, "epoch": 0.8302390933800157, "percentage": 83.03, "elapsed_time": "1 day, 4:31:10", "remaining_time": "5:49:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9012, "total_steps": 10853, "loss": 0.1179, "learning_rate": 3.8316055293534353e-07, "epoch": 0.8303312295572857, "percentage": 83.04, "elapsed_time": "1 day, 4:31:20", "remaining_time": "5:49:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9013, "total_steps": 10853, "loss": 0.1157, "learning_rate": 3.82755372320317e-07, "epoch": 0.8304233657345557, "percentage": 83.05, "elapsed_time": "1 day, 4:31:29", "remaining_time": "5:49:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9014, "total_steps": 10853, "loss": 0.1145, "learning_rate": 3.823503882916818e-07, "epoch": 0.8305155019118257, "percentage": 83.06, "elapsed_time": "1 day, 4:31:40", "remaining_time": "5:49:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9015, "total_steps": 10853, "loss": 0.1112, "learning_rate": 3.819456008870412e-07, "epoch": 0.8306076380890957, "percentage": 83.06, "elapsed_time": "1 day, 4:31:51", "remaining_time": "5:49:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9016, "total_steps": 10853, "loss": 0.124, "learning_rate": 3.815410101439798e-07, "epoch": 0.8306997742663657, "percentage": 83.07, "elapsed_time": "1 day, 4:32:02", "remaining_time": "5:48:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9017, "total_steps": 10853, "loss": 0.108, "learning_rate": 3.8113661610006375e-07, "epoch": 0.8307919104436357, "percentage": 83.08, "elapsed_time": "1 day, 4:32:12", "remaining_time": "5:48:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9018, "total_steps": 10853, "loss": 0.125, "learning_rate": 3.8073241879284045e-07, "epoch": 0.8308840466209056, "percentage": 83.09, "elapsed_time": "1 day, 4:32:22", "remaining_time": "5:48:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9019, "total_steps": 10853, "loss": 0.111, "learning_rate": 3.803284182598399e-07, "epoch": 0.8309761827981758, "percentage": 83.1, "elapsed_time": "1 day, 4:32:33", "remaining_time": "5:48:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9020, "total_steps": 10853, "loss": 0.1183, "learning_rate": 3.799246145385746e-07, "epoch": 0.8310683189754458, "percentage": 83.11, "elapsed_time": "1 day, 4:32:43", "remaining_time": "5:48:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9021, "total_steps": 10853, "loss": 0.1062, "learning_rate": 3.795210076665362e-07, "epoch": 0.8311604551527157, "percentage": 83.12, "elapsed_time": "1 day, 4:32:54", "remaining_time": "5:47:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9022, "total_steps": 10853, "loss": 0.1121, "learning_rate": 3.791175976812014e-07, "epoch": 0.8312525913299857, "percentage": 83.13, "elapsed_time": "1 day, 4:33:06", "remaining_time": "5:47:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9023, "total_steps": 10853, "loss": 0.1291, "learning_rate": 3.78714384620025e-07, "epoch": 0.8313447275072557, "percentage": 83.14, "elapsed_time": "1 day, 4:33:17", "remaining_time": "5:47:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9024, "total_steps": 10853, "loss": 0.1217, "learning_rate": 3.7831136852044705e-07, "epoch": 0.8314368636845257, "percentage": 83.15, "elapsed_time": "1 day, 4:33:28", "remaining_time": "5:47:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9025, "total_steps": 10853, "loss": 0.1077, "learning_rate": 3.7790854941988615e-07, "epoch": 0.8315289998617957, "percentage": 83.16, "elapsed_time": "1 day, 4:33:39", "remaining_time": "5:47:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9026, "total_steps": 10853, "loss": 0.1153, "learning_rate": 3.7750592735574494e-07, "epoch": 0.8316211360390657, "percentage": 83.17, "elapsed_time": "1 day, 4:33:50", "remaining_time": "5:46:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9027, "total_steps": 10853, "loss": 0.1163, "learning_rate": 3.7710350236540737e-07, "epoch": 0.8317132722163357, "percentage": 83.18, "elapsed_time": "1 day, 4:34:01", "remaining_time": "5:46:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9028, "total_steps": 10853, "loss": 0.1261, "learning_rate": 3.7670127448623804e-07, "epoch": 0.8318054083936057, "percentage": 83.18, "elapsed_time": "1 day, 4:34:13", "remaining_time": "5:46:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9029, "total_steps": 10853, "loss": 0.1142, "learning_rate": 3.7629924375558347e-07, "epoch": 0.8318975445708757, "percentage": 83.19, "elapsed_time": "1 day, 4:34:23", "remaining_time": "5:46:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9030, "total_steps": 10853, "loss": 0.1193, "learning_rate": 3.7589741021077234e-07, "epoch": 0.8319896807481457, "percentage": 83.2, "elapsed_time": "1 day, 4:34:35", "remaining_time": "5:46:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9031, "total_steps": 10853, "loss": 0.1123, "learning_rate": 3.7549577388911546e-07, "epoch": 0.8320818169254157, "percentage": 83.21, "elapsed_time": "1 day, 4:34:45", "remaining_time": "5:45:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9032, "total_steps": 10853, "loss": 0.11, "learning_rate": 3.7509433482790515e-07, "epoch": 0.8321739531026857, "percentage": 83.22, "elapsed_time": "1 day, 4:34:56", "remaining_time": "5:45:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9033, "total_steps": 10853, "loss": 0.1089, "learning_rate": 3.7469309306441466e-07, "epoch": 0.8322660892799558, "percentage": 83.23, "elapsed_time": "1 day, 4:35:06", "remaining_time": "5:45:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9034, "total_steps": 10853, "loss": 0.1325, "learning_rate": 3.742920486358986e-07, "epoch": 0.8323582254572258, "percentage": 83.24, "elapsed_time": "1 day, 4:35:19", "remaining_time": "5:45:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9035, "total_steps": 10853, "loss": 0.1124, "learning_rate": 3.738912015795945e-07, "epoch": 0.8324503616344958, "percentage": 83.25, "elapsed_time": "1 day, 4:35:29", "remaining_time": "5:45:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9036, "total_steps": 10853, "loss": 0.1197, "learning_rate": 3.734905519327217e-07, "epoch": 0.8325424978117658, "percentage": 83.26, "elapsed_time": "1 day, 4:35:39", "remaining_time": "5:44:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9037, "total_steps": 10853, "loss": 0.1235, "learning_rate": 3.7309009973247963e-07, "epoch": 0.8326346339890358, "percentage": 83.27, "elapsed_time": "1 day, 4:35:50", "remaining_time": "5:44:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9038, "total_steps": 10853, "loss": 0.1057, "learning_rate": 3.72689845016051e-07, "epoch": 0.8327267701663058, "percentage": 83.28, "elapsed_time": "1 day, 4:36:01", "remaining_time": "5:44:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9039, "total_steps": 10853, "loss": 0.1238, "learning_rate": 3.722897878205989e-07, "epoch": 0.8328189063435758, "percentage": 83.29, "elapsed_time": "1 day, 4:36:12", "remaining_time": "5:44:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9040, "total_steps": 10853, "loss": 0.1158, "learning_rate": 3.718899281832686e-07, "epoch": 0.8329110425208458, "percentage": 83.29, "elapsed_time": "1 day, 4:36:22", "remaining_time": "5:44:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9041, "total_steps": 10853, "loss": 0.1161, "learning_rate": 3.7149026614118844e-07, "epoch": 0.8330031786981158, "percentage": 83.3, "elapsed_time": "1 day, 4:36:35", "remaining_time": "5:44:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9042, "total_steps": 10853, "loss": 0.1125, "learning_rate": 3.7109080173146543e-07, "epoch": 0.8330953148753858, "percentage": 83.31, "elapsed_time": "1 day, 4:36:45", "remaining_time": "5:43:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9043, "total_steps": 10853, "loss": 0.1229, "learning_rate": 3.7069153499119134e-07, "epoch": 0.8331874510526558, "percentage": 83.32, "elapsed_time": "1 day, 4:36:56", "remaining_time": "5:43:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9044, "total_steps": 10853, "loss": 0.1178, "learning_rate": 3.7029246595743666e-07, "epoch": 0.8332795872299258, "percentage": 83.33, "elapsed_time": "1 day, 4:37:07", "remaining_time": "5:43:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9045, "total_steps": 10853, "loss": 0.109, "learning_rate": 3.6989359466725603e-07, "epoch": 0.8333717234071958, "percentage": 83.34, "elapsed_time": "1 day, 4:37:17", "remaining_time": "5:43:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9046, "total_steps": 10853, "loss": 0.1136, "learning_rate": 3.6949492115768425e-07, "epoch": 0.8334638595844659, "percentage": 83.35, "elapsed_time": "1 day, 4:37:27", "remaining_time": "5:43:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9047, "total_steps": 10853, "loss": 0.1124, "learning_rate": 3.6909644546573806e-07, "epoch": 0.8335559957617359, "percentage": 83.36, "elapsed_time": "1 day, 4:37:39", "remaining_time": "5:42:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9048, "total_steps": 10853, "loss": 0.1116, "learning_rate": 3.686981676284171e-07, "epoch": 0.8336481319390059, "percentage": 83.37, "elapsed_time": "1 day, 4:37:49", "remaining_time": "5:42:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9049, "total_steps": 10853, "loss": 0.1274, "learning_rate": 3.6830008768270033e-07, "epoch": 0.8337402681162759, "percentage": 83.38, "elapsed_time": "1 day, 4:38:00", "remaining_time": "5:42:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9050, "total_steps": 10853, "loss": 0.115, "learning_rate": 3.679022056655493e-07, "epoch": 0.8338324042935459, "percentage": 83.39, "elapsed_time": "1 day, 4:38:12", "remaining_time": "5:42:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9051, "total_steps": 10853, "loss": 0.1113, "learning_rate": 3.675045216139081e-07, "epoch": 0.8339245404708159, "percentage": 83.4, "elapsed_time": "1 day, 4:38:22", "remaining_time": "5:42:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9052, "total_steps": 10853, "loss": 0.1242, "learning_rate": 3.6710703556470136e-07, "epoch": 0.8340166766480859, "percentage": 83.41, "elapsed_time": "1 day, 4:38:34", "remaining_time": "5:41:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9053, "total_steps": 10853, "loss": 0.1243, "learning_rate": 3.667097475548367e-07, "epoch": 0.8341088128253559, "percentage": 83.41, "elapsed_time": "1 day, 4:38:46", "remaining_time": "5:41:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9054, "total_steps": 10853, "loss": 0.1226, "learning_rate": 3.663126576212014e-07, "epoch": 0.8342009490026259, "percentage": 83.42, "elapsed_time": "1 day, 4:38:56", "remaining_time": "5:41:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9055, "total_steps": 10853, "loss": 0.1171, "learning_rate": 3.659157658006651e-07, "epoch": 0.8342930851798959, "percentage": 83.43, "elapsed_time": "1 day, 4:39:06", "remaining_time": "5:41:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9056, "total_steps": 10853, "loss": 0.1175, "learning_rate": 3.655190721300794e-07, "epoch": 0.8343852213571659, "percentage": 83.44, "elapsed_time": "1 day, 4:39:17", "remaining_time": "5:41:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9057, "total_steps": 10853, "loss": 0.1133, "learning_rate": 3.651225766462782e-07, "epoch": 0.8344773575344359, "percentage": 83.45, "elapsed_time": "1 day, 4:39:28", "remaining_time": "5:40:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9058, "total_steps": 10853, "loss": 0.1168, "learning_rate": 3.647262793860751e-07, "epoch": 0.8345694937117059, "percentage": 83.46, "elapsed_time": "1 day, 4:39:39", "remaining_time": "5:40:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9059, "total_steps": 10853, "loss": 0.1251, "learning_rate": 3.643301803862673e-07, "epoch": 0.8346616298889759, "percentage": 83.47, "elapsed_time": "1 day, 4:39:50", "remaining_time": "5:40:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9060, "total_steps": 10853, "loss": 0.1249, "learning_rate": 3.639342796836312e-07, "epoch": 0.834753766066246, "percentage": 83.48, "elapsed_time": "1 day, 4:40:01", "remaining_time": "5:40:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9061, "total_steps": 10853, "loss": 0.1167, "learning_rate": 3.63538577314928e-07, "epoch": 0.834845902243516, "percentage": 83.49, "elapsed_time": "1 day, 4:40:11", "remaining_time": "5:40:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9062, "total_steps": 10853, "loss": 0.1089, "learning_rate": 3.6314307331689725e-07, "epoch": 0.834938038420786, "percentage": 83.5, "elapsed_time": "1 day, 4:40:21", "remaining_time": "5:40:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9063, "total_steps": 10853, "loss": 0.1173, "learning_rate": 3.6274776772626197e-07, "epoch": 0.835030174598056, "percentage": 83.51, "elapsed_time": "1 day, 4:40:31", "remaining_time": "5:39:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9064, "total_steps": 10853, "loss": 0.1236, "learning_rate": 3.6235266057972727e-07, "epoch": 0.835122310775326, "percentage": 83.52, "elapsed_time": "1 day, 4:40:42", "remaining_time": "5:39:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9065, "total_steps": 10853, "loss": 0.1312, "learning_rate": 3.6195775191397776e-07, "epoch": 0.835214446952596, "percentage": 83.53, "elapsed_time": "1 day, 4:40:52", "remaining_time": "5:39:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9066, "total_steps": 10853, "loss": 0.1333, "learning_rate": 3.615630417656807e-07, "epoch": 0.8353065831298659, "percentage": 83.53, "elapsed_time": "1 day, 4:41:03", "remaining_time": "5:39:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9067, "total_steps": 10853, "loss": 0.1159, "learning_rate": 3.611685301714854e-07, "epoch": 0.8353987193071359, "percentage": 83.54, "elapsed_time": "1 day, 4:41:15", "remaining_time": "5:39:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9068, "total_steps": 10853, "loss": 0.1156, "learning_rate": 3.607742171680223e-07, "epoch": 0.8354908554844059, "percentage": 83.55, "elapsed_time": "1 day, 4:41:26", "remaining_time": "5:38:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9069, "total_steps": 10853, "loss": 0.136, "learning_rate": 3.6038010279190376e-07, "epoch": 0.8355829916616759, "percentage": 83.56, "elapsed_time": "1 day, 4:41:37", "remaining_time": "5:38:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9070, "total_steps": 10853, "loss": 0.1076, "learning_rate": 3.5998618707972303e-07, "epoch": 0.8356751278389459, "percentage": 83.57, "elapsed_time": "1 day, 4:41:48", "remaining_time": "5:38:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9071, "total_steps": 10853, "loss": 0.1148, "learning_rate": 3.5959247006805446e-07, "epoch": 0.8357672640162159, "percentage": 83.58, "elapsed_time": "1 day, 4:42:00", "remaining_time": "5:38:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9072, "total_steps": 10853, "loss": 0.1193, "learning_rate": 3.5919895179345546e-07, "epoch": 0.8358594001934859, "percentage": 83.59, "elapsed_time": "1 day, 4:42:10", "remaining_time": "5:38:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9073, "total_steps": 10853, "loss": 0.1248, "learning_rate": 3.5880563229246434e-07, "epoch": 0.835951536370756, "percentage": 83.6, "elapsed_time": "1 day, 4:42:21", "remaining_time": "5:37:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9074, "total_steps": 10853, "loss": 0.1213, "learning_rate": 3.58412511601601e-07, "epoch": 0.836043672548026, "percentage": 83.61, "elapsed_time": "1 day, 4:42:32", "remaining_time": "5:37:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9075, "total_steps": 10853, "loss": 0.1158, "learning_rate": 3.5801958975736653e-07, "epoch": 0.836135808725296, "percentage": 83.62, "elapsed_time": "1 day, 4:42:41", "remaining_time": "5:37:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9076, "total_steps": 10853, "loss": 0.1121, "learning_rate": 3.576268667962432e-07, "epoch": 0.836227944902566, "percentage": 83.63, "elapsed_time": "1 day, 4:42:50", "remaining_time": "5:37:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9077, "total_steps": 10853, "loss": 0.1185, "learning_rate": 3.5723434275469593e-07, "epoch": 0.836320081079836, "percentage": 83.64, "elapsed_time": "1 day, 4:43:01", "remaining_time": "5:37:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9078, "total_steps": 10853, "loss": 0.1203, "learning_rate": 3.5684201766917087e-07, "epoch": 0.836412217257106, "percentage": 83.65, "elapsed_time": "1 day, 4:43:13", "remaining_time": "5:36:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9079, "total_steps": 10853, "loss": 0.1246, "learning_rate": 3.564498915760947e-07, "epoch": 0.836504353434376, "percentage": 83.65, "elapsed_time": "1 day, 4:43:25", "remaining_time": "5:36:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9080, "total_steps": 10853, "loss": 0.1123, "learning_rate": 3.560579645118775e-07, "epoch": 0.836596489611646, "percentage": 83.66, "elapsed_time": "1 day, 4:43:34", "remaining_time": "5:36:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9081, "total_steps": 10853, "loss": 0.1242, "learning_rate": 3.556662365129082e-07, "epoch": 0.836688625788916, "percentage": 83.67, "elapsed_time": "1 day, 4:43:47", "remaining_time": "5:36:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9082, "total_steps": 10853, "loss": 0.1313, "learning_rate": 3.5527470761556024e-07, "epoch": 0.836780761966186, "percentage": 83.68, "elapsed_time": "1 day, 4:43:58", "remaining_time": "5:36:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9083, "total_steps": 10853, "loss": 0.1277, "learning_rate": 3.5488337785618607e-07, "epoch": 0.836872898143456, "percentage": 83.69, "elapsed_time": "1 day, 4:44:08", "remaining_time": "5:35:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9084, "total_steps": 10853, "loss": 0.1239, "learning_rate": 3.5449224727112094e-07, "epoch": 0.836965034320726, "percentage": 83.7, "elapsed_time": "1 day, 4:44:19", "remaining_time": "5:35:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9085, "total_steps": 10853, "loss": 0.1185, "learning_rate": 3.541013158966816e-07, "epoch": 0.837057170497996, "percentage": 83.71, "elapsed_time": "1 day, 4:44:30", "remaining_time": "5:35:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9086, "total_steps": 10853, "loss": 0.1136, "learning_rate": 3.5371058376916733e-07, "epoch": 0.837149306675266, "percentage": 83.72, "elapsed_time": "1 day, 4:44:40", "remaining_time": "5:35:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9087, "total_steps": 10853, "loss": 0.1196, "learning_rate": 3.5332005092485496e-07, "epoch": 0.8372414428525361, "percentage": 83.73, "elapsed_time": "1 day, 4:44:51", "remaining_time": "5:35:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9088, "total_steps": 10853, "loss": 0.1114, "learning_rate": 3.529297174000071e-07, "epoch": 0.8373335790298061, "percentage": 83.74, "elapsed_time": "1 day, 4:45:02", "remaining_time": "5:35:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9089, "total_steps": 10853, "loss": 0.114, "learning_rate": 3.525395832308659e-07, "epoch": 0.8374257152070761, "percentage": 83.75, "elapsed_time": "1 day, 4:45:12", "remaining_time": "5:34:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9090, "total_steps": 10853, "loss": 0.117, "learning_rate": 3.52149648453656e-07, "epoch": 0.8375178513843461, "percentage": 83.76, "elapsed_time": "1 day, 4:45:22", "remaining_time": "5:34:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9091, "total_steps": 10853, "loss": 0.1179, "learning_rate": 3.5175991310458207e-07, "epoch": 0.8376099875616161, "percentage": 83.76, "elapsed_time": "1 day, 4:45:33", "remaining_time": "5:34:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9092, "total_steps": 10853, "loss": 0.1279, "learning_rate": 3.513703772198318e-07, "epoch": 0.8377021237388861, "percentage": 83.77, "elapsed_time": "1 day, 4:45:44", "remaining_time": "5:34:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9093, "total_steps": 10853, "loss": 0.1223, "learning_rate": 3.5098104083557264e-07, "epoch": 0.8377942599161561, "percentage": 83.78, "elapsed_time": "1 day, 4:45:55", "remaining_time": "5:34:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9094, "total_steps": 10853, "loss": 0.1046, "learning_rate": 3.5059190398795603e-07, "epoch": 0.8378863960934261, "percentage": 83.79, "elapsed_time": "1 day, 4:46:06", "remaining_time": "5:33:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9095, "total_steps": 10853, "loss": 0.1206, "learning_rate": 3.5020296671311154e-07, "epoch": 0.8379785322706961, "percentage": 83.8, "elapsed_time": "1 day, 4:46:15", "remaining_time": "5:33:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9096, "total_steps": 10853, "loss": 0.113, "learning_rate": 3.498142290471529e-07, "epoch": 0.8380706684479661, "percentage": 83.81, "elapsed_time": "1 day, 4:46:26", "remaining_time": "5:33:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9097, "total_steps": 10853, "loss": 0.1135, "learning_rate": 3.4942569102617534e-07, "epoch": 0.8381628046252361, "percentage": 83.82, "elapsed_time": "1 day, 4:46:35", "remaining_time": "5:33:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9098, "total_steps": 10853, "loss": 0.1017, "learning_rate": 3.490373526862531e-07, "epoch": 0.8382549408025061, "percentage": 83.83, "elapsed_time": "1 day, 4:46:46", "remaining_time": "5:33:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9099, "total_steps": 10853, "loss": 0.1135, "learning_rate": 3.4864921406344483e-07, "epoch": 0.8383470769797761, "percentage": 83.84, "elapsed_time": "1 day, 4:46:57", "remaining_time": "5:32:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9100, "total_steps": 10853, "loss": 0.1116, "learning_rate": 3.482612751937878e-07, "epoch": 0.8384392131570461, "percentage": 83.85, "elapsed_time": "1 day, 4:47:09", "remaining_time": "5:32:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9101, "total_steps": 10853, "loss": 0.1188, "learning_rate": 3.4787353611330317e-07, "epoch": 0.8385313493343162, "percentage": 83.86, "elapsed_time": "1 day, 4:47:20", "remaining_time": "5:32:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9102, "total_steps": 10853, "loss": 0.1167, "learning_rate": 3.4748599685799274e-07, "epoch": 0.8386234855115862, "percentage": 83.87, "elapsed_time": "1 day, 4:47:30", "remaining_time": "5:32:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9103, "total_steps": 10853, "loss": 0.1087, "learning_rate": 3.470986574638391e-07, "epoch": 0.8387156216888562, "percentage": 83.88, "elapsed_time": "1 day, 4:47:41", "remaining_time": "5:32:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9104, "total_steps": 10853, "loss": 0.1325, "learning_rate": 3.4671151796680654e-07, "epoch": 0.8388077578661262, "percentage": 83.88, "elapsed_time": "1 day, 4:47:53", "remaining_time": "5:31:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9105, "total_steps": 10853, "loss": 0.1305, "learning_rate": 3.46324578402841e-07, "epoch": 0.8388998940433962, "percentage": 83.89, "elapsed_time": "1 day, 4:48:04", "remaining_time": "5:31:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9106, "total_steps": 10853, "loss": 0.1225, "learning_rate": 3.459378388078702e-07, "epoch": 0.8389920302206662, "percentage": 83.9, "elapsed_time": "1 day, 4:48:13", "remaining_time": "5:31:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9107, "total_steps": 10853, "loss": 0.117, "learning_rate": 3.4555129921780337e-07, "epoch": 0.8390841663979361, "percentage": 83.91, "elapsed_time": "1 day, 4:48:25", "remaining_time": "5:31:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9108, "total_steps": 10853, "loss": 0.1177, "learning_rate": 3.4516495966853054e-07, "epoch": 0.8391763025752061, "percentage": 83.92, "elapsed_time": "1 day, 4:48:36", "remaining_time": "5:31:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9109, "total_steps": 10853, "loss": 0.1247, "learning_rate": 3.447788201959223e-07, "epoch": 0.8392684387524761, "percentage": 83.93, "elapsed_time": "1 day, 4:48:47", "remaining_time": "5:30:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9110, "total_steps": 10853, "loss": 0.1367, "learning_rate": 3.443928808358327e-07, "epoch": 0.8393605749297461, "percentage": 83.94, "elapsed_time": "1 day, 4:48:57", "remaining_time": "5:30:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9111, "total_steps": 10853, "loss": 0.1182, "learning_rate": 3.4400714162409644e-07, "epoch": 0.8394527111070161, "percentage": 83.95, "elapsed_time": "1 day, 4:49:08", "remaining_time": "5:30:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9112, "total_steps": 10853, "loss": 0.109, "learning_rate": 3.4362160259652887e-07, "epoch": 0.8395448472842861, "percentage": 83.96, "elapsed_time": "1 day, 4:49:19", "remaining_time": "5:30:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9113, "total_steps": 10853, "loss": 0.1369, "learning_rate": 3.4323626378892775e-07, "epoch": 0.8396369834615561, "percentage": 83.97, "elapsed_time": "1 day, 4:49:30", "remaining_time": "5:30:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9114, "total_steps": 10853, "loss": 0.1153, "learning_rate": 3.4285112523707143e-07, "epoch": 0.8397291196388262, "percentage": 83.98, "elapsed_time": "1 day, 4:49:41", "remaining_time": "5:30:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9115, "total_steps": 10853, "loss": 0.1089, "learning_rate": 3.424661869767207e-07, "epoch": 0.8398212558160962, "percentage": 83.99, "elapsed_time": "1 day, 4:49:53", "remaining_time": "5:29:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9116, "total_steps": 10853, "loss": 0.1121, "learning_rate": 3.4208144904361613e-07, "epoch": 0.8399133919933662, "percentage": 84.0, "elapsed_time": "1 day, 4:50:04", "remaining_time": "5:29:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9117, "total_steps": 10853, "loss": 0.1259, "learning_rate": 3.4169691147348137e-07, "epoch": 0.8400055281706362, "percentage": 84.0, "elapsed_time": "1 day, 4:50:15", "remaining_time": "5:29:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9118, "total_steps": 10853, "loss": 0.1266, "learning_rate": 3.4131257430202124e-07, "epoch": 0.8400976643479062, "percentage": 84.01, "elapsed_time": "1 day, 4:50:25", "remaining_time": "5:29:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9119, "total_steps": 10853, "loss": 0.1256, "learning_rate": 3.4092843756492075e-07, "epoch": 0.8401898005251762, "percentage": 84.02, "elapsed_time": "1 day, 4:50:37", "remaining_time": "5:29:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9120, "total_steps": 10853, "loss": 0.1343, "learning_rate": 3.405445012978467e-07, "epoch": 0.8402819367024462, "percentage": 84.03, "elapsed_time": "1 day, 4:50:47", "remaining_time": "5:28:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9121, "total_steps": 10853, "loss": 0.1311, "learning_rate": 3.4016076553644806e-07, "epoch": 0.8403740728797162, "percentage": 84.04, "elapsed_time": "1 day, 4:50:58", "remaining_time": "5:28:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9122, "total_steps": 10853, "loss": 0.1291, "learning_rate": 3.397772303163549e-07, "epoch": 0.8404662090569862, "percentage": 84.05, "elapsed_time": "1 day, 4:51:09", "remaining_time": "5:28:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9123, "total_steps": 10853, "loss": 0.1196, "learning_rate": 3.3939389567317876e-07, "epoch": 0.8405583452342562, "percentage": 84.06, "elapsed_time": "1 day, 4:51:19", "remaining_time": "5:28:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9124, "total_steps": 10853, "loss": 0.1328, "learning_rate": 3.39010761642512e-07, "epoch": 0.8406504814115262, "percentage": 84.07, "elapsed_time": "1 day, 4:51:29", "remaining_time": "5:28:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9125, "total_steps": 10853, "loss": 0.1244, "learning_rate": 3.386278282599281e-07, "epoch": 0.8407426175887962, "percentage": 84.08, "elapsed_time": "1 day, 4:51:40", "remaining_time": "5:27:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9126, "total_steps": 10853, "loss": 0.1117, "learning_rate": 3.3824509556098314e-07, "epoch": 0.8408347537660662, "percentage": 84.09, "elapsed_time": "1 day, 4:51:51", "remaining_time": "5:27:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9127, "total_steps": 10853, "loss": 0.1171, "learning_rate": 3.3786256358121327e-07, "epoch": 0.8409268899433362, "percentage": 84.1, "elapsed_time": "1 day, 4:52:01", "remaining_time": "5:27:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9128, "total_steps": 10853, "loss": 0.1185, "learning_rate": 3.37480232356138e-07, "epoch": 0.8410190261206063, "percentage": 84.11, "elapsed_time": "1 day, 4:52:13", "remaining_time": "5:27:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9129, "total_steps": 10853, "loss": 0.1124, "learning_rate": 3.3709810192125576e-07, "epoch": 0.8411111622978763, "percentage": 84.11, "elapsed_time": "1 day, 4:52:23", "remaining_time": "5:27:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9130, "total_steps": 10853, "loss": 0.1231, "learning_rate": 3.3671617231204683e-07, "epoch": 0.8412032984751463, "percentage": 84.12, "elapsed_time": "1 day, 4:52:34", "remaining_time": "5:26:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9131, "total_steps": 10853, "loss": 0.1145, "learning_rate": 3.3633444356397425e-07, "epoch": 0.8412954346524163, "percentage": 84.13, "elapsed_time": "1 day, 4:52:44", "remaining_time": "5:26:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9132, "total_steps": 10853, "loss": 0.1174, "learning_rate": 3.3595291571248216e-07, "epoch": 0.8413875708296863, "percentage": 84.14, "elapsed_time": "1 day, 4:52:56", "remaining_time": "5:26:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9133, "total_steps": 10853, "loss": 0.1235, "learning_rate": 3.355715887929939e-07, "epoch": 0.8414797070069563, "percentage": 84.15, "elapsed_time": "1 day, 4:53:08", "remaining_time": "5:26:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9134, "total_steps": 10853, "loss": 0.1113, "learning_rate": 3.351904628409172e-07, "epoch": 0.8415718431842263, "percentage": 84.16, "elapsed_time": "1 day, 4:53:19", "remaining_time": "5:26:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9135, "total_steps": 10853, "loss": 0.1195, "learning_rate": 3.348095378916386e-07, "epoch": 0.8416639793614963, "percentage": 84.17, "elapsed_time": "1 day, 4:53:32", "remaining_time": "5:26:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9136, "total_steps": 10853, "loss": 0.1163, "learning_rate": 3.34428813980528e-07, "epoch": 0.8417561155387663, "percentage": 84.18, "elapsed_time": "1 day, 4:53:44", "remaining_time": "5:25:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9137, "total_steps": 10853, "loss": 0.1051, "learning_rate": 3.3404829114293437e-07, "epoch": 0.8418482517160363, "percentage": 84.19, "elapsed_time": "1 day, 4:53:54", "remaining_time": "5:25:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9138, "total_steps": 10853, "loss": 0.1023, "learning_rate": 3.336679694141898e-07, "epoch": 0.8419403878933063, "percentage": 84.2, "elapsed_time": "1 day, 4:54:04", "remaining_time": "5:25:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9139, "total_steps": 10853, "loss": 0.1073, "learning_rate": 3.3328784882960817e-07, "epoch": 0.8420325240705763, "percentage": 84.21, "elapsed_time": "1 day, 4:54:14", "remaining_time": "5:25:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9140, "total_steps": 10853, "loss": 0.1217, "learning_rate": 3.3290792942448303e-07, "epoch": 0.8421246602478463, "percentage": 84.22, "elapsed_time": "1 day, 4:54:25", "remaining_time": "5:25:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9141, "total_steps": 10853, "loss": 0.1176, "learning_rate": 3.325282112340894e-07, "epoch": 0.8422167964251164, "percentage": 84.23, "elapsed_time": "1 day, 4:54:35", "remaining_time": "5:24:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9142, "total_steps": 10853, "loss": 0.123, "learning_rate": 3.321486942936844e-07, "epoch": 0.8423089326023864, "percentage": 84.23, "elapsed_time": "1 day, 4:54:46", "remaining_time": "5:24:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9143, "total_steps": 10853, "loss": 0.1099, "learning_rate": 3.317693786385065e-07, "epoch": 0.8424010687796564, "percentage": 84.24, "elapsed_time": "1 day, 4:54:55", "remaining_time": "5:24:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9144, "total_steps": 10853, "loss": 0.1144, "learning_rate": 3.3139026430377583e-07, "epoch": 0.8424932049569264, "percentage": 84.25, "elapsed_time": "1 day, 4:55:06", "remaining_time": "5:24:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9145, "total_steps": 10853, "loss": 0.1102, "learning_rate": 3.3101135132469237e-07, "epoch": 0.8425853411341964, "percentage": 84.26, "elapsed_time": "1 day, 4:55:16", "remaining_time": "5:24:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9146, "total_steps": 10853, "loss": 0.1203, "learning_rate": 3.306326397364379e-07, "epoch": 0.8426774773114664, "percentage": 84.27, "elapsed_time": "1 day, 4:55:25", "remaining_time": "5:23:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9147, "total_steps": 10853, "loss": 0.1287, "learning_rate": 3.3025412957417624e-07, "epoch": 0.8427696134887364, "percentage": 84.28, "elapsed_time": "1 day, 4:55:37", "remaining_time": "5:23:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9148, "total_steps": 10853, "loss": 0.1219, "learning_rate": 3.298758208730529e-07, "epoch": 0.8428617496660064, "percentage": 84.29, "elapsed_time": "1 day, 4:55:47", "remaining_time": "5:23:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9149, "total_steps": 10853, "loss": 0.1287, "learning_rate": 3.294977136681923e-07, "epoch": 0.8429538858432764, "percentage": 84.3, "elapsed_time": "1 day, 4:56:00", "remaining_time": "5:23:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9150, "total_steps": 10853, "loss": 0.1199, "learning_rate": 3.291198079947033e-07, "epoch": 0.8430460220205463, "percentage": 84.31, "elapsed_time": "1 day, 4:56:12", "remaining_time": "5:23:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9151, "total_steps": 10853, "loss": 0.1208, "learning_rate": 3.2874210388767313e-07, "epoch": 0.8431381581978163, "percentage": 84.32, "elapsed_time": "1 day, 4:56:22", "remaining_time": "5:22:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9152, "total_steps": 10853, "loss": 0.1169, "learning_rate": 3.2836460138217287e-07, "epoch": 0.8432302943750863, "percentage": 84.33, "elapsed_time": "1 day, 4:56:32", "remaining_time": "5:22:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9153, "total_steps": 10853, "loss": 0.1298, "learning_rate": 3.279873005132525e-07, "epoch": 0.8433224305523563, "percentage": 84.34, "elapsed_time": "1 day, 4:56:42", "remaining_time": "5:22:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9154, "total_steps": 10853, "loss": 0.1129, "learning_rate": 3.276102013159452e-07, "epoch": 0.8434145667296263, "percentage": 84.35, "elapsed_time": "1 day, 4:56:53", "remaining_time": "5:22:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9155, "total_steps": 10853, "loss": 0.1152, "learning_rate": 3.272333038252648e-07, "epoch": 0.8435067029068964, "percentage": 84.35, "elapsed_time": "1 day, 4:57:03", "remaining_time": "5:22:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9156, "total_steps": 10853, "loss": 0.122, "learning_rate": 3.2685660807620563e-07, "epoch": 0.8435988390841664, "percentage": 84.36, "elapsed_time": "1 day, 4:57:14", "remaining_time": "5:21:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9157, "total_steps": 10853, "loss": 0.1273, "learning_rate": 3.2648011410374463e-07, "epoch": 0.8436909752614364, "percentage": 84.37, "elapsed_time": "1 day, 4:57:25", "remaining_time": "5:21:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9158, "total_steps": 10853, "loss": 0.115, "learning_rate": 3.2610382194283865e-07, "epoch": 0.8437831114387064, "percentage": 84.38, "elapsed_time": "1 day, 4:57:36", "remaining_time": "5:21:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9159, "total_steps": 10853, "loss": 0.1175, "learning_rate": 3.257277316284266e-07, "epoch": 0.8438752476159764, "percentage": 84.39, "elapsed_time": "1 day, 4:57:48", "remaining_time": "5:21:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9160, "total_steps": 10853, "loss": 0.1144, "learning_rate": 3.253518431954286e-07, "epoch": 0.8439673837932464, "percentage": 84.4, "elapsed_time": "1 day, 4:57:57", "remaining_time": "5:21:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9161, "total_steps": 10853, "loss": 0.1138, "learning_rate": 3.249761566787474e-07, "epoch": 0.8440595199705164, "percentage": 84.41, "elapsed_time": "1 day, 4:58:08", "remaining_time": "5:21:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9162, "total_steps": 10853, "loss": 0.1183, "learning_rate": 3.2460067211326274e-07, "epoch": 0.8441516561477864, "percentage": 84.42, "elapsed_time": "1 day, 4:58:19", "remaining_time": "5:20:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9163, "total_steps": 10853, "loss": 0.1125, "learning_rate": 3.2422538953383986e-07, "epoch": 0.8442437923250564, "percentage": 84.43, "elapsed_time": "1 day, 4:58:31", "remaining_time": "5:20:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9164, "total_steps": 10853, "loss": 0.1214, "learning_rate": 3.2385030897532364e-07, "epoch": 0.8443359285023264, "percentage": 84.44, "elapsed_time": "1 day, 4:58:42", "remaining_time": "5:20:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9165, "total_steps": 10853, "loss": 0.1172, "learning_rate": 3.234754304725413e-07, "epoch": 0.8444280646795964, "percentage": 84.45, "elapsed_time": "1 day, 4:58:53", "remaining_time": "5:20:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9166, "total_steps": 10853, "loss": 0.1084, "learning_rate": 3.2310075406029875e-07, "epoch": 0.8445202008568664, "percentage": 84.46, "elapsed_time": "1 day, 4:59:04", "remaining_time": "5:20:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9167, "total_steps": 10853, "loss": 0.1329, "learning_rate": 3.22726279773386e-07, "epoch": 0.8446123370341364, "percentage": 84.47, "elapsed_time": "1 day, 4:59:15", "remaining_time": "5:19:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9168, "total_steps": 10853, "loss": 0.1116, "learning_rate": 3.223520076465719e-07, "epoch": 0.8447044732114064, "percentage": 84.47, "elapsed_time": "1 day, 4:59:25", "remaining_time": "5:19:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9169, "total_steps": 10853, "loss": 0.1112, "learning_rate": 3.219779377146087e-07, "epoch": 0.8447966093886765, "percentage": 84.48, "elapsed_time": "1 day, 4:59:35", "remaining_time": "5:19:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9170, "total_steps": 10853, "loss": 0.1319, "learning_rate": 3.2160407001222805e-07, "epoch": 0.8448887455659465, "percentage": 84.49, "elapsed_time": "1 day, 4:59:47", "remaining_time": "5:19:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9171, "total_steps": 10853, "loss": 0.1196, "learning_rate": 3.2123040457414377e-07, "epoch": 0.8449808817432165, "percentage": 84.5, "elapsed_time": "1 day, 4:59:57", "remaining_time": "5:19:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9172, "total_steps": 10853, "loss": 0.1205, "learning_rate": 3.208569414350515e-07, "epoch": 0.8450730179204865, "percentage": 84.51, "elapsed_time": "1 day, 5:00:08", "remaining_time": "5:18:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9173, "total_steps": 10853, "loss": 0.1247, "learning_rate": 3.204836806296269e-07, "epoch": 0.8451651540977565, "percentage": 84.52, "elapsed_time": "1 day, 5:00:20", "remaining_time": "5:18:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9174, "total_steps": 10853, "loss": 0.1333, "learning_rate": 3.201106221925265e-07, "epoch": 0.8452572902750265, "percentage": 84.53, "elapsed_time": "1 day, 5:00:30", "remaining_time": "5:18:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9175, "total_steps": 10853, "loss": 0.1047, "learning_rate": 3.197377661583892e-07, "epoch": 0.8453494264522965, "percentage": 84.54, "elapsed_time": "1 day, 5:00:40", "remaining_time": "5:18:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9176, "total_steps": 10853, "loss": 0.108, "learning_rate": 3.1936511256183524e-07, "epoch": 0.8454415626295665, "percentage": 84.55, "elapsed_time": "1 day, 5:00:52", "remaining_time": "5:18:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9177, "total_steps": 10853, "loss": 0.119, "learning_rate": 3.1899266143746556e-07, "epoch": 0.8455336988068365, "percentage": 84.56, "elapsed_time": "1 day, 5:01:02", "remaining_time": "5:17:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9178, "total_steps": 10853, "loss": 0.1151, "learning_rate": 3.1862041281986224e-07, "epoch": 0.8456258349841065, "percentage": 84.57, "elapsed_time": "1 day, 5:01:13", "remaining_time": "5:17:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9179, "total_steps": 10853, "loss": 0.1141, "learning_rate": 3.182483667435876e-07, "epoch": 0.8457179711613765, "percentage": 84.58, "elapsed_time": "1 day, 5:01:22", "remaining_time": "5:17:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9180, "total_steps": 10853, "loss": 0.107, "learning_rate": 3.1787652324318715e-07, "epoch": 0.8458101073386465, "percentage": 84.58, "elapsed_time": "1 day, 5:01:32", "remaining_time": "5:17:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9181, "total_steps": 10853, "loss": 0.1229, "learning_rate": 3.1750488235318675e-07, "epoch": 0.8459022435159165, "percentage": 84.59, "elapsed_time": "1 day, 5:01:43", "remaining_time": "5:17:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9182, "total_steps": 10853, "loss": 0.124, "learning_rate": 3.171334441080923e-07, "epoch": 0.8459943796931866, "percentage": 84.6, "elapsed_time": "1 day, 5:01:55", "remaining_time": "5:17:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9183, "total_steps": 10853, "loss": 0.1179, "learning_rate": 3.1676220854239326e-07, "epoch": 0.8460865158704566, "percentage": 84.61, "elapsed_time": "1 day, 5:02:06", "remaining_time": "5:16:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9184, "total_steps": 10853, "loss": 0.1211, "learning_rate": 3.1639117569055744e-07, "epoch": 0.8461786520477266, "percentage": 84.62, "elapsed_time": "1 day, 5:02:17", "remaining_time": "5:16:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9185, "total_steps": 10853, "loss": 0.115, "learning_rate": 3.160203455870359e-07, "epoch": 0.8462707882249966, "percentage": 84.63, "elapsed_time": "1 day, 5:02:27", "remaining_time": "5:16:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9186, "total_steps": 10853, "loss": 0.1096, "learning_rate": 3.156497182662607e-07, "epoch": 0.8463629244022666, "percentage": 84.64, "elapsed_time": "1 day, 5:02:37", "remaining_time": "5:16:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9187, "total_steps": 10853, "loss": 0.1346, "learning_rate": 3.1527929376264393e-07, "epoch": 0.8464550605795366, "percentage": 84.65, "elapsed_time": "1 day, 5:02:49", "remaining_time": "5:16:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9188, "total_steps": 10853, "loss": 0.1204, "learning_rate": 3.149090721105805e-07, "epoch": 0.8465471967568066, "percentage": 84.66, "elapsed_time": "1 day, 5:02:59", "remaining_time": "5:15:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9189, "total_steps": 10853, "loss": 0.1205, "learning_rate": 3.145390533444442e-07, "epoch": 0.8466393329340766, "percentage": 84.67, "elapsed_time": "1 day, 5:03:10", "remaining_time": "5:15:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9190, "total_steps": 10853, "loss": 0.124, "learning_rate": 3.1416923749859244e-07, "epoch": 0.8467314691113466, "percentage": 84.68, "elapsed_time": "1 day, 5:03:22", "remaining_time": "5:15:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9191, "total_steps": 10853, "loss": 0.118, "learning_rate": 3.1379962460736183e-07, "epoch": 0.8468236052886166, "percentage": 84.69, "elapsed_time": "1 day, 5:03:33", "remaining_time": "5:15:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9192, "total_steps": 10853, "loss": 0.1262, "learning_rate": 3.1343021470507134e-07, "epoch": 0.8469157414658866, "percentage": 84.7, "elapsed_time": "1 day, 5:03:45", "remaining_time": "5:15:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9193, "total_steps": 10853, "loss": 0.1217, "learning_rate": 3.1306100782602126e-07, "epoch": 0.8470078776431565, "percentage": 84.7, "elapsed_time": "1 day, 5:03:56", "remaining_time": "5:14:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9194, "total_steps": 10853, "loss": 0.1292, "learning_rate": 3.12692004004492e-07, "epoch": 0.8471000138204265, "percentage": 84.71, "elapsed_time": "1 day, 5:04:09", "remaining_time": "5:14:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9195, "total_steps": 10853, "loss": 0.111, "learning_rate": 3.1232320327474504e-07, "epoch": 0.8471921499976965, "percentage": 84.72, "elapsed_time": "1 day, 5:04:20", "remaining_time": "5:14:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9196, "total_steps": 10853, "loss": 0.1091, "learning_rate": 3.11954605671024e-07, "epoch": 0.8472842861749666, "percentage": 84.73, "elapsed_time": "1 day, 5:04:31", "remaining_time": "5:14:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9197, "total_steps": 10853, "loss": 0.1209, "learning_rate": 3.1158621122755336e-07, "epoch": 0.8473764223522366, "percentage": 84.74, "elapsed_time": "1 day, 5:04:43", "remaining_time": "5:14:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9198, "total_steps": 10853, "loss": 0.1186, "learning_rate": 3.112180199785389e-07, "epoch": 0.8474685585295066, "percentage": 84.75, "elapsed_time": "1 day, 5:04:53", "remaining_time": "5:13:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9199, "total_steps": 10853, "loss": 0.1168, "learning_rate": 3.1085003195816697e-07, "epoch": 0.8475606947067766, "percentage": 84.76, "elapsed_time": "1 day, 5:05:06", "remaining_time": "5:13:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9200, "total_steps": 10853, "loss": 0.1167, "learning_rate": 3.1048224720060473e-07, "epoch": 0.8476528308840466, "percentage": 84.77, "elapsed_time": "1 day, 5:05:16", "remaining_time": "5:13:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9201, "total_steps": 10853, "loss": 0.1063, "learning_rate": 3.1011466574000144e-07, "epoch": 0.8477449670613166, "percentage": 84.78, "elapsed_time": "1 day, 5:05:27", "remaining_time": "5:13:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9202, "total_steps": 10853, "loss": 0.1141, "learning_rate": 3.097472876104876e-07, "epoch": 0.8478371032385866, "percentage": 84.79, "elapsed_time": "1 day, 5:05:37", "remaining_time": "5:13:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9203, "total_steps": 10853, "loss": 0.1119, "learning_rate": 3.093801128461735e-07, "epoch": 0.8479292394158566, "percentage": 84.8, "elapsed_time": "1 day, 5:05:48", "remaining_time": "5:13:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9204, "total_steps": 10853, "loss": 0.1122, "learning_rate": 3.0901314148115203e-07, "epoch": 0.8480213755931266, "percentage": 84.81, "elapsed_time": "1 day, 5:06:00", "remaining_time": "5:12:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9205, "total_steps": 10853, "loss": 0.1162, "learning_rate": 3.0864637354949545e-07, "epoch": 0.8481135117703966, "percentage": 84.82, "elapsed_time": "1 day, 5:06:10", "remaining_time": "5:12:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9206, "total_steps": 10853, "loss": 0.1159, "learning_rate": 3.082798090852596e-07, "epoch": 0.8482056479476666, "percentage": 84.82, "elapsed_time": "1 day, 5:06:21", "remaining_time": "5:12:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9207, "total_steps": 10853, "loss": 0.1139, "learning_rate": 3.079134481224788e-07, "epoch": 0.8482977841249366, "percentage": 84.83, "elapsed_time": "1 day, 5:06:31", "remaining_time": "5:12:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9208, "total_steps": 10853, "loss": 0.1213, "learning_rate": 3.075472906951704e-07, "epoch": 0.8483899203022066, "percentage": 84.84, "elapsed_time": "1 day, 5:06:42", "remaining_time": "5:12:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9209, "total_steps": 10853, "loss": 0.1308, "learning_rate": 3.0718133683733247e-07, "epoch": 0.8484820564794767, "percentage": 84.85, "elapsed_time": "1 day, 5:06:55", "remaining_time": "5:11:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9210, "total_steps": 10853, "loss": 0.114, "learning_rate": 3.0681558658294334e-07, "epoch": 0.8485741926567467, "percentage": 84.86, "elapsed_time": "1 day, 5:07:05", "remaining_time": "5:11:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9211, "total_steps": 10853, "loss": 0.1167, "learning_rate": 3.0645003996596254e-07, "epoch": 0.8486663288340167, "percentage": 84.87, "elapsed_time": "1 day, 5:07:15", "remaining_time": "5:11:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9212, "total_steps": 10853, "loss": 0.1199, "learning_rate": 3.0608469702033185e-07, "epoch": 0.8487584650112867, "percentage": 84.88, "elapsed_time": "1 day, 5:07:27", "remaining_time": "5:11:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9213, "total_steps": 10853, "loss": 0.1144, "learning_rate": 3.057195577799729e-07, "epoch": 0.8488506011885567, "percentage": 84.89, "elapsed_time": "1 day, 5:07:37", "remaining_time": "5:11:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9214, "total_steps": 10853, "loss": 0.1234, "learning_rate": 3.053546222787895e-07, "epoch": 0.8489427373658267, "percentage": 84.9, "elapsed_time": "1 day, 5:07:49", "remaining_time": "5:10:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9215, "total_steps": 10853, "loss": 0.1122, "learning_rate": 3.0498989055066597e-07, "epoch": 0.8490348735430967, "percentage": 84.91, "elapsed_time": "1 day, 5:07:58", "remaining_time": "5:10:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9216, "total_steps": 10853, "loss": 0.1278, "learning_rate": 3.046253626294665e-07, "epoch": 0.8491270097203667, "percentage": 84.92, "elapsed_time": "1 day, 5:08:09", "remaining_time": "5:10:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9217, "total_steps": 10853, "loss": 0.1021, "learning_rate": 3.0426103854903856e-07, "epoch": 0.8492191458976367, "percentage": 84.93, "elapsed_time": "1 day, 5:08:20", "remaining_time": "5:10:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9218, "total_steps": 10853, "loss": 0.1133, "learning_rate": 3.0389691834320944e-07, "epoch": 0.8493112820749067, "percentage": 84.94, "elapsed_time": "1 day, 5:08:32", "remaining_time": "5:10:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9219, "total_steps": 10853, "loss": 0.1102, "learning_rate": 3.0353300204578854e-07, "epoch": 0.8494034182521767, "percentage": 84.94, "elapsed_time": "1 day, 5:08:43", "remaining_time": "5:09:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9220, "total_steps": 10853, "loss": 0.1097, "learning_rate": 3.031692896905644e-07, "epoch": 0.8494955544294467, "percentage": 84.95, "elapsed_time": "1 day, 5:08:54", "remaining_time": "5:09:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9221, "total_steps": 10853, "loss": 0.1198, "learning_rate": 3.0280578131130805e-07, "epoch": 0.8495876906067167, "percentage": 84.96, "elapsed_time": "1 day, 5:09:04", "remaining_time": "5:09:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9222, "total_steps": 10853, "loss": 0.1018, "learning_rate": 3.024424769417711e-07, "epoch": 0.8496798267839867, "percentage": 84.97, "elapsed_time": "1 day, 5:09:14", "remaining_time": "5:09:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9223, "total_steps": 10853, "loss": 0.1181, "learning_rate": 3.020793766156871e-07, "epoch": 0.8497719629612568, "percentage": 84.98, "elapsed_time": "1 day, 5:09:24", "remaining_time": "5:09:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9224, "total_steps": 10853, "loss": 0.1215, "learning_rate": 3.017164803667691e-07, "epoch": 0.8498640991385268, "percentage": 84.99, "elapsed_time": "1 day, 5:09:35", "remaining_time": "5:08:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9225, "total_steps": 10853, "loss": 0.1153, "learning_rate": 3.013537882287132e-07, "epoch": 0.8499562353157968, "percentage": 85.0, "elapsed_time": "1 day, 5:09:47", "remaining_time": "5:08:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9226, "total_steps": 10853, "loss": 0.1153, "learning_rate": 3.0099130023519384e-07, "epoch": 0.8500483714930668, "percentage": 85.01, "elapsed_time": "1 day, 5:09:57", "remaining_time": "5:08:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9227, "total_steps": 10853, "loss": 0.1125, "learning_rate": 3.0062901641986967e-07, "epoch": 0.8501405076703368, "percentage": 85.02, "elapsed_time": "1 day, 5:10:08", "remaining_time": "5:08:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9228, "total_steps": 10853, "loss": 0.1192, "learning_rate": 3.002669368163774e-07, "epoch": 0.8502326438476068, "percentage": 85.03, "elapsed_time": "1 day, 5:10:19", "remaining_time": "5:08:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9229, "total_steps": 10853, "loss": 0.1319, "learning_rate": 2.999050614583368e-07, "epoch": 0.8503247800248768, "percentage": 85.04, "elapsed_time": "1 day, 5:10:30", "remaining_time": "5:08:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9230, "total_steps": 10853, "loss": 0.1178, "learning_rate": 2.995433903793485e-07, "epoch": 0.8504169162021468, "percentage": 85.05, "elapsed_time": "1 day, 5:10:40", "remaining_time": "5:07:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9231, "total_steps": 10853, "loss": 0.1113, "learning_rate": 2.9918192361299335e-07, "epoch": 0.8505090523794168, "percentage": 85.05, "elapsed_time": "1 day, 5:10:51", "remaining_time": "5:07:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9232, "total_steps": 10853, "loss": 0.1157, "learning_rate": 2.988206611928329e-07, "epoch": 0.8506011885566868, "percentage": 85.06, "elapsed_time": "1 day, 5:11:03", "remaining_time": "5:07:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9233, "total_steps": 10853, "loss": 0.1199, "learning_rate": 2.984596031524109e-07, "epoch": 0.8506933247339568, "percentage": 85.07, "elapsed_time": "1 day, 5:11:13", "remaining_time": "5:07:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9234, "total_steps": 10853, "loss": 0.0979, "learning_rate": 2.980987495252516e-07, "epoch": 0.8507854609112268, "percentage": 85.08, "elapsed_time": "1 day, 5:11:23", "remaining_time": "5:07:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9235, "total_steps": 10853, "loss": 0.128, "learning_rate": 2.9773810034486095e-07, "epoch": 0.8508775970884968, "percentage": 85.09, "elapsed_time": "1 day, 5:11:33", "remaining_time": "5:06:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9236, "total_steps": 10853, "loss": 0.117, "learning_rate": 2.973776556447247e-07, "epoch": 0.8509697332657667, "percentage": 85.1, "elapsed_time": "1 day, 5:11:43", "remaining_time": "5:06:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9237, "total_steps": 10853, "loss": 0.1349, "learning_rate": 2.970174154583097e-07, "epoch": 0.8510618694430369, "percentage": 85.11, "elapsed_time": "1 day, 5:11:55", "remaining_time": "5:06:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9238, "total_steps": 10853, "loss": 0.1157, "learning_rate": 2.9665737981906475e-07, "epoch": 0.8511540056203069, "percentage": 85.12, "elapsed_time": "1 day, 5:12:06", "remaining_time": "5:06:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9239, "total_steps": 10853, "loss": 0.1131, "learning_rate": 2.962975487604197e-07, "epoch": 0.8512461417975768, "percentage": 85.13, "elapsed_time": "1 day, 5:12:17", "remaining_time": "5:06:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9240, "total_steps": 10853, "loss": 0.1091, "learning_rate": 2.9593792231578407e-07, "epoch": 0.8513382779748468, "percentage": 85.14, "elapsed_time": "1 day, 5:12:29", "remaining_time": "5:05:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9241, "total_steps": 10853, "loss": 0.1133, "learning_rate": 2.9557850051854935e-07, "epoch": 0.8514304141521168, "percentage": 85.15, "elapsed_time": "1 day, 5:12:39", "remaining_time": "5:05:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9242, "total_steps": 10853, "loss": 0.1073, "learning_rate": 2.9521928340208867e-07, "epoch": 0.8515225503293868, "percentage": 85.16, "elapsed_time": "1 day, 5:12:49", "remaining_time": "5:05:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9243, "total_steps": 10853, "loss": 0.1111, "learning_rate": 2.9486027099975416e-07, "epoch": 0.8516146865066568, "percentage": 85.17, "elapsed_time": "1 day, 5:13:00", "remaining_time": "5:05:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9244, "total_steps": 10853, "loss": 0.1238, "learning_rate": 2.9450146334488144e-07, "epoch": 0.8517068226839268, "percentage": 85.17, "elapsed_time": "1 day, 5:13:11", "remaining_time": "5:05:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9245, "total_steps": 10853, "loss": 0.1185, "learning_rate": 2.9414286047078495e-07, "epoch": 0.8517989588611968, "percentage": 85.18, "elapsed_time": "1 day, 5:13:21", "remaining_time": "5:04:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9246, "total_steps": 10853, "loss": 0.1249, "learning_rate": 2.937844624107608e-07, "epoch": 0.8518910950384668, "percentage": 85.19, "elapsed_time": "1 day, 5:13:31", "remaining_time": "5:04:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9247, "total_steps": 10853, "loss": 0.1271, "learning_rate": 2.934262691980877e-07, "epoch": 0.8519832312157368, "percentage": 85.2, "elapsed_time": "1 day, 5:13:43", "remaining_time": "5:04:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9248, "total_steps": 10853, "loss": 0.1238, "learning_rate": 2.930682808660226e-07, "epoch": 0.8520753673930068, "percentage": 85.21, "elapsed_time": "1 day, 5:13:54", "remaining_time": "5:04:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9249, "total_steps": 10853, "loss": 0.112, "learning_rate": 2.927104974478048e-07, "epoch": 0.8521675035702768, "percentage": 85.22, "elapsed_time": "1 day, 5:14:04", "remaining_time": "5:04:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9250, "total_steps": 10853, "loss": 0.1095, "learning_rate": 2.9235291897665497e-07, "epoch": 0.8522596397475469, "percentage": 85.23, "elapsed_time": "1 day, 5:14:14", "remaining_time": "5:04:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9251, "total_steps": 10853, "loss": 0.123, "learning_rate": 2.91995545485774e-07, "epoch": 0.8523517759248169, "percentage": 85.24, "elapsed_time": "1 day, 5:14:27", "remaining_time": "5:03:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9252, "total_steps": 10853, "loss": 0.1111, "learning_rate": 2.9163837700834473e-07, "epoch": 0.8524439121020869, "percentage": 85.25, "elapsed_time": "1 day, 5:14:38", "remaining_time": "5:03:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9253, "total_steps": 10853, "loss": 0.1201, "learning_rate": 2.912814135775299e-07, "epoch": 0.8525360482793569, "percentage": 85.26, "elapsed_time": "1 day, 5:14:50", "remaining_time": "5:03:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9254, "total_steps": 10853, "loss": 0.1185, "learning_rate": 2.909246552264733e-07, "epoch": 0.8526281844566269, "percentage": 85.27, "elapsed_time": "1 day, 5:15:00", "remaining_time": "5:03:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9255, "total_steps": 10853, "loss": 0.1233, "learning_rate": 2.905681019882997e-07, "epoch": 0.8527203206338969, "percentage": 85.28, "elapsed_time": "1 day, 5:15:10", "remaining_time": "5:03:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9256, "total_steps": 10853, "loss": 0.1089, "learning_rate": 2.902117538961166e-07, "epoch": 0.8528124568111669, "percentage": 85.29, "elapsed_time": "1 day, 5:15:21", "remaining_time": "5:02:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9257, "total_steps": 10853, "loss": 0.1232, "learning_rate": 2.898556109830092e-07, "epoch": 0.8529045929884369, "percentage": 85.29, "elapsed_time": "1 day, 5:15:32", "remaining_time": "5:02:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9258, "total_steps": 10853, "loss": 0.1198, "learning_rate": 2.894996732820468e-07, "epoch": 0.8529967291657069, "percentage": 85.3, "elapsed_time": "1 day, 5:15:44", "remaining_time": "5:02:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9259, "total_steps": 10853, "loss": 0.1308, "learning_rate": 2.8914394082627694e-07, "epoch": 0.8530888653429769, "percentage": 85.31, "elapsed_time": "1 day, 5:15:56", "remaining_time": "5:02:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9260, "total_steps": 10853, "loss": 0.108, "learning_rate": 2.8878841364873067e-07, "epoch": 0.8531810015202469, "percentage": 85.32, "elapsed_time": "1 day, 5:16:08", "remaining_time": "5:02:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9261, "total_steps": 10853, "loss": 0.1229, "learning_rate": 2.8843309178241766e-07, "epoch": 0.8532731376975169, "percentage": 85.33, "elapsed_time": "1 day, 5:16:19", "remaining_time": "5:01:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9262, "total_steps": 10853, "loss": 0.117, "learning_rate": 2.880779752603302e-07, "epoch": 0.8533652738747869, "percentage": 85.34, "elapsed_time": "1 day, 5:16:30", "remaining_time": "5:01:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9263, "total_steps": 10853, "loss": 0.1109, "learning_rate": 2.877230641154413e-07, "epoch": 0.8534574100520569, "percentage": 85.35, "elapsed_time": "1 day, 5:16:41", "remaining_time": "5:01:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9264, "total_steps": 10853, "loss": 0.1217, "learning_rate": 2.873683583807038e-07, "epoch": 0.853549546229327, "percentage": 85.36, "elapsed_time": "1 day, 5:16:52", "remaining_time": "5:01:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9265, "total_steps": 10853, "loss": 0.1217, "learning_rate": 2.8701385808905217e-07, "epoch": 0.853641682406597, "percentage": 85.37, "elapsed_time": "1 day, 5:17:03", "remaining_time": "5:01:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9266, "total_steps": 10853, "loss": 0.1176, "learning_rate": 2.8665956327340175e-07, "epoch": 0.853733818583867, "percentage": 85.38, "elapsed_time": "1 day, 5:17:13", "remaining_time": "5:00:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9267, "total_steps": 10853, "loss": 0.1179, "learning_rate": 2.8630547396664905e-07, "epoch": 0.853825954761137, "percentage": 85.39, "elapsed_time": "1 day, 5:17:24", "remaining_time": "5:00:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9268, "total_steps": 10853, "loss": 0.1261, "learning_rate": 2.8595159020167186e-07, "epoch": 0.853918090938407, "percentage": 85.4, "elapsed_time": "1 day, 5:17:35", "remaining_time": "5:00:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9269, "total_steps": 10853, "loss": 0.1234, "learning_rate": 2.855979120113278e-07, "epoch": 0.854010227115677, "percentage": 85.4, "elapsed_time": "1 day, 5:17:45", "remaining_time": "5:00:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9270, "total_steps": 10853, "loss": 0.1259, "learning_rate": 2.8524443942845567e-07, "epoch": 0.854102363292947, "percentage": 85.41, "elapsed_time": "1 day, 5:17:55", "remaining_time": "5:00:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9271, "total_steps": 10853, "loss": 0.1159, "learning_rate": 2.848911724858755e-07, "epoch": 0.854194499470217, "percentage": 85.42, "elapsed_time": "1 day, 5:18:07", "remaining_time": "5:00:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9272, "total_steps": 10853, "loss": 0.1004, "learning_rate": 2.8453811121638834e-07, "epoch": 0.854286635647487, "percentage": 85.43, "elapsed_time": "1 day, 5:18:17", "remaining_time": "4:59:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9273, "total_steps": 10853, "loss": 0.1227, "learning_rate": 2.841852556527763e-07, "epoch": 0.854378771824757, "percentage": 85.44, "elapsed_time": "1 day, 5:18:29", "remaining_time": "4:59:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9274, "total_steps": 10853, "loss": 0.1102, "learning_rate": 2.8383260582780206e-07, "epoch": 0.854470908002027, "percentage": 85.45, "elapsed_time": "1 day, 5:18:40", "remaining_time": "4:59:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9275, "total_steps": 10853, "loss": 0.1181, "learning_rate": 2.8348016177420833e-07, "epoch": 0.854563044179297, "percentage": 85.46, "elapsed_time": "1 day, 5:18:50", "remaining_time": "4:59:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9276, "total_steps": 10853, "loss": 0.1146, "learning_rate": 2.8312792352472003e-07, "epoch": 0.854655180356567, "percentage": 85.47, "elapsed_time": "1 day, 5:19:02", "remaining_time": "4:59:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9277, "total_steps": 10853, "loss": 0.1052, "learning_rate": 2.8277589111204315e-07, "epoch": 0.8547473165338371, "percentage": 85.48, "elapsed_time": "1 day, 5:19:11", "remaining_time": "4:58:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9278, "total_steps": 10853, "loss": 0.1172, "learning_rate": 2.824240645688628e-07, "epoch": 0.8548394527111071, "percentage": 85.49, "elapsed_time": "1 day, 5:19:23", "remaining_time": "4:58:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9279, "total_steps": 10853, "loss": 0.1088, "learning_rate": 2.8207244392784715e-07, "epoch": 0.8549315888883771, "percentage": 85.5, "elapsed_time": "1 day, 5:19:32", "remaining_time": "4:58:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9280, "total_steps": 10853, "loss": 0.1206, "learning_rate": 2.817210292216435e-07, "epoch": 0.8550237250656471, "percentage": 85.51, "elapsed_time": "1 day, 5:19:43", "remaining_time": "4:58:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9281, "total_steps": 10853, "loss": 0.1142, "learning_rate": 2.813698204828816e-07, "epoch": 0.855115861242917, "percentage": 85.52, "elapsed_time": "1 day, 5:19:53", "remaining_time": "4:58:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9282, "total_steps": 10853, "loss": 0.1293, "learning_rate": 2.8101881774416975e-07, "epoch": 0.855207997420187, "percentage": 85.52, "elapsed_time": "1 day, 5:20:04", "remaining_time": "4:57:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9283, "total_steps": 10853, "loss": 0.116, "learning_rate": 2.806680210380999e-07, "epoch": 0.855300133597457, "percentage": 85.53, "elapsed_time": "1 day, 5:20:16", "remaining_time": "4:57:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9284, "total_steps": 10853, "loss": 0.1172, "learning_rate": 2.8031743039724337e-07, "epoch": 0.855392269774727, "percentage": 85.54, "elapsed_time": "1 day, 5:20:28", "remaining_time": "4:57:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9285, "total_steps": 10853, "loss": 0.1127, "learning_rate": 2.7996704585415227e-07, "epoch": 0.855484405951997, "percentage": 85.55, "elapsed_time": "1 day, 5:20:41", "remaining_time": "4:57:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9286, "total_steps": 10853, "loss": 0.1091, "learning_rate": 2.796168674413596e-07, "epoch": 0.855576542129267, "percentage": 85.56, "elapsed_time": "1 day, 5:20:51", "remaining_time": "4:57:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9287, "total_steps": 10853, "loss": 0.1069, "learning_rate": 2.7926689519137963e-07, "epoch": 0.855668678306537, "percentage": 85.57, "elapsed_time": "1 day, 5:21:02", "remaining_time": "4:56:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9288, "total_steps": 10853, "loss": 0.127, "learning_rate": 2.7891712913670765e-07, "epoch": 0.855760814483807, "percentage": 85.58, "elapsed_time": "1 day, 5:21:14", "remaining_time": "4:56:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9289, "total_steps": 10853, "loss": 0.1174, "learning_rate": 2.785675693098194e-07, "epoch": 0.855852950661077, "percentage": 85.59, "elapsed_time": "1 day, 5:21:23", "remaining_time": "4:56:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9290, "total_steps": 10853, "loss": 0.1122, "learning_rate": 2.782182157431718e-07, "epoch": 0.855945086838347, "percentage": 85.6, "elapsed_time": "1 day, 5:21:34", "remaining_time": "4:56:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9291, "total_steps": 10853, "loss": 0.1131, "learning_rate": 2.778690684692012e-07, "epoch": 0.8560372230156171, "percentage": 85.61, "elapsed_time": "1 day, 5:21:47", "remaining_time": "4:56:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9292, "total_steps": 10853, "loss": 0.1357, "learning_rate": 2.7752012752032683e-07, "epoch": 0.8561293591928871, "percentage": 85.62, "elapsed_time": "1 day, 5:21:59", "remaining_time": "4:56:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9293, "total_steps": 10853, "loss": 0.1097, "learning_rate": 2.7717139292894824e-07, "epoch": 0.8562214953701571, "percentage": 85.63, "elapsed_time": "1 day, 5:22:08", "remaining_time": "4:55:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9294, "total_steps": 10853, "loss": 0.1174, "learning_rate": 2.768228647274446e-07, "epoch": 0.8563136315474271, "percentage": 85.64, "elapsed_time": "1 day, 5:22:19", "remaining_time": "4:55:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9295, "total_steps": 10853, "loss": 0.1146, "learning_rate": 2.7647454294817773e-07, "epoch": 0.8564057677246971, "percentage": 85.64, "elapsed_time": "1 day, 5:22:31", "remaining_time": "4:55:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9296, "total_steps": 10853, "loss": 0.1086, "learning_rate": 2.7612642762348844e-07, "epoch": 0.8564979039019671, "percentage": 85.65, "elapsed_time": "1 day, 5:22:40", "remaining_time": "4:55:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9297, "total_steps": 10853, "loss": 0.1143, "learning_rate": 2.757785187857001e-07, "epoch": 0.8565900400792371, "percentage": 85.66, "elapsed_time": "1 day, 5:22:51", "remaining_time": "4:55:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9298, "total_steps": 10853, "loss": 0.1122, "learning_rate": 2.7543081646711487e-07, "epoch": 0.8566821762565071, "percentage": 85.67, "elapsed_time": "1 day, 5:23:02", "remaining_time": "4:54:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9299, "total_steps": 10853, "loss": 0.1133, "learning_rate": 2.7508332070001807e-07, "epoch": 0.8567743124337771, "percentage": 85.68, "elapsed_time": "1 day, 5:23:13", "remaining_time": "4:54:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9300, "total_steps": 10853, "loss": 0.1231, "learning_rate": 2.74736031516675e-07, "epoch": 0.8568664486110471, "percentage": 85.69, "elapsed_time": "1 day, 5:23:24", "remaining_time": "4:54:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9301, "total_steps": 10853, "loss": 0.125, "learning_rate": 2.7438894894933013e-07, "epoch": 0.8569585847883171, "percentage": 85.7, "elapsed_time": "1 day, 5:23:36", "remaining_time": "4:54:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9302, "total_steps": 10853, "loss": 0.1151, "learning_rate": 2.7404207303021153e-07, "epoch": 0.8570507209655871, "percentage": 85.71, "elapsed_time": "1 day, 5:23:46", "remaining_time": "4:54:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9303, "total_steps": 10853, "loss": 0.1224, "learning_rate": 2.736954037915254e-07, "epoch": 0.8571428571428571, "percentage": 85.72, "elapsed_time": "1 day, 5:23:56", "remaining_time": "4:53:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9304, "total_steps": 10853, "loss": 0.1293, "learning_rate": 2.733489412654608e-07, "epoch": 0.8572349933201272, "percentage": 85.73, "elapsed_time": "1 day, 5:24:07", "remaining_time": "4:53:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9305, "total_steps": 10853, "loss": 0.1279, "learning_rate": 2.730026854841869e-07, "epoch": 0.8573271294973972, "percentage": 85.74, "elapsed_time": "1 day, 5:24:18", "remaining_time": "4:53:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9306, "total_steps": 10853, "loss": 0.127, "learning_rate": 2.7265663647985357e-07, "epoch": 0.8574192656746672, "percentage": 85.75, "elapsed_time": "1 day, 5:24:29", "remaining_time": "4:53:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9307, "total_steps": 10853, "loss": 0.1252, "learning_rate": 2.723107942845907e-07, "epoch": 0.8575114018519372, "percentage": 85.76, "elapsed_time": "1 day, 5:24:40", "remaining_time": "4:53:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9308, "total_steps": 10853, "loss": 0.1186, "learning_rate": 2.7196515893051003e-07, "epoch": 0.8576035380292072, "percentage": 85.76, "elapsed_time": "1 day, 5:24:51", "remaining_time": "4:52:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9309, "total_steps": 10853, "loss": 0.1247, "learning_rate": 2.7161973044970453e-07, "epoch": 0.8576956742064772, "percentage": 85.77, "elapsed_time": "1 day, 5:25:01", "remaining_time": "4:52:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9310, "total_steps": 10853, "loss": 0.1087, "learning_rate": 2.712745088742472e-07, "epoch": 0.8577878103837472, "percentage": 85.78, "elapsed_time": "1 day, 5:25:13", "remaining_time": "4:52:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9311, "total_steps": 10853, "loss": 0.1201, "learning_rate": 2.7092949423619145e-07, "epoch": 0.8578799465610172, "percentage": 85.79, "elapsed_time": "1 day, 5:25:23", "remaining_time": "4:52:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9312, "total_steps": 10853, "loss": 0.1166, "learning_rate": 2.7058468656757183e-07, "epoch": 0.8579720827382872, "percentage": 85.8, "elapsed_time": "1 day, 5:25:33", "remaining_time": "4:52:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9313, "total_steps": 10853, "loss": 0.108, "learning_rate": 2.702400859004037e-07, "epoch": 0.8580642189155572, "percentage": 85.81, "elapsed_time": "1 day, 5:25:42", "remaining_time": "4:51:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9314, "total_steps": 10853, "loss": 0.1199, "learning_rate": 2.698956922666843e-07, "epoch": 0.8581563550928272, "percentage": 85.82, "elapsed_time": "1 day, 5:25:54", "remaining_time": "4:51:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9315, "total_steps": 10853, "loss": 0.116, "learning_rate": 2.695515056983894e-07, "epoch": 0.8582484912700972, "percentage": 85.83, "elapsed_time": "1 day, 5:26:04", "remaining_time": "4:51:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9316, "total_steps": 10853, "loss": 0.1138, "learning_rate": 2.692075262274771e-07, "epoch": 0.8583406274473672, "percentage": 85.84, "elapsed_time": "1 day, 5:26:16", "remaining_time": "4:51:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9317, "total_steps": 10853, "loss": 0.125, "learning_rate": 2.6886375388588656e-07, "epoch": 0.8584327636246372, "percentage": 85.85, "elapsed_time": "1 day, 5:26:27", "remaining_time": "4:51:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9318, "total_steps": 10853, "loss": 0.1359, "learning_rate": 2.6852018870553664e-07, "epoch": 0.8585248998019073, "percentage": 85.86, "elapsed_time": "1 day, 5:26:39", "remaining_time": "4:51:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9319, "total_steps": 10853, "loss": 0.1345, "learning_rate": 2.6817683071832687e-07, "epoch": 0.8586170359791773, "percentage": 85.87, "elapsed_time": "1 day, 5:26:50", "remaining_time": "4:50:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9320, "total_steps": 10853, "loss": 0.1088, "learning_rate": 2.6783367995613846e-07, "epoch": 0.8587091721564473, "percentage": 85.87, "elapsed_time": "1 day, 5:27:00", "remaining_time": "4:50:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9321, "total_steps": 10853, "loss": 0.1125, "learning_rate": 2.6749073645083333e-07, "epoch": 0.8588013083337173, "percentage": 85.88, "elapsed_time": "1 day, 5:27:10", "remaining_time": "4:50:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9322, "total_steps": 10853, "loss": 0.1189, "learning_rate": 2.6714800023425385e-07, "epoch": 0.8588934445109873, "percentage": 85.89, "elapsed_time": "1 day, 5:27:22", "remaining_time": "4:50:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9323, "total_steps": 10853, "loss": 0.1195, "learning_rate": 2.668054713382229e-07, "epoch": 0.8589855806882573, "percentage": 85.9, "elapsed_time": "1 day, 5:27:33", "remaining_time": "4:50:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9324, "total_steps": 10853, "loss": 0.1161, "learning_rate": 2.6646314979454386e-07, "epoch": 0.8590777168655273, "percentage": 85.91, "elapsed_time": "1 day, 5:27:46", "remaining_time": "4:49:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9325, "total_steps": 10853, "loss": 0.1269, "learning_rate": 2.6612103563500165e-07, "epoch": 0.8591698530427972, "percentage": 85.92, "elapsed_time": "1 day, 5:27:56", "remaining_time": "4:49:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9326, "total_steps": 10853, "loss": 0.1229, "learning_rate": 2.657791288913622e-07, "epoch": 0.8592619892200672, "percentage": 85.93, "elapsed_time": "1 day, 5:28:08", "remaining_time": "4:49:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9327, "total_steps": 10853, "loss": 0.1115, "learning_rate": 2.6543742959537074e-07, "epoch": 0.8593541253973372, "percentage": 85.94, "elapsed_time": "1 day, 5:28:20", "remaining_time": "4:49:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9328, "total_steps": 10853, "loss": 0.1084, "learning_rate": 2.650959377787549e-07, "epoch": 0.8594462615746072, "percentage": 85.95, "elapsed_time": "1 day, 5:28:31", "remaining_time": "4:49:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9329, "total_steps": 10853, "loss": 0.1102, "learning_rate": 2.647546534732209e-07, "epoch": 0.8595383977518772, "percentage": 85.96, "elapsed_time": "1 day, 5:28:42", "remaining_time": "4:48:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9330, "total_steps": 10853, "loss": 0.1158, "learning_rate": 2.6441357671045833e-07, "epoch": 0.8596305339291472, "percentage": 85.97, "elapsed_time": "1 day, 5:28:52", "remaining_time": "4:48:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9331, "total_steps": 10853, "loss": 0.1164, "learning_rate": 2.640727075221361e-07, "epoch": 0.8597226701064172, "percentage": 85.98, "elapsed_time": "1 day, 5:29:02", "remaining_time": "4:48:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9332, "total_steps": 10853, "loss": 0.1201, "learning_rate": 2.637320459399031e-07, "epoch": 0.8598148062836873, "percentage": 85.99, "elapsed_time": "1 day, 5:29:12", "remaining_time": "4:48:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9333, "total_steps": 10853, "loss": 0.1084, "learning_rate": 2.6339159199539085e-07, "epoch": 0.8599069424609573, "percentage": 85.99, "elapsed_time": "1 day, 5:29:22", "remaining_time": "4:48:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9334, "total_steps": 10853, "loss": 0.1143, "learning_rate": 2.6305134572020943e-07, "epoch": 0.8599990786382273, "percentage": 86.0, "elapsed_time": "1 day, 5:29:32", "remaining_time": "4:47:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9335, "total_steps": 10853, "loss": 0.1144, "learning_rate": 2.6271130714595164e-07, "epoch": 0.8600912148154973, "percentage": 86.01, "elapsed_time": "1 day, 5:29:43", "remaining_time": "4:47:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9336, "total_steps": 10853, "loss": 0.1077, "learning_rate": 2.623714763041896e-07, "epoch": 0.8601833509927673, "percentage": 86.02, "elapsed_time": "1 day, 5:29:54", "remaining_time": "4:47:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9337, "total_steps": 10853, "loss": 0.1173, "learning_rate": 2.620318532264765e-07, "epoch": 0.8602754871700373, "percentage": 86.03, "elapsed_time": "1 day, 5:30:06", "remaining_time": "4:47:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9338, "total_steps": 10853, "loss": 0.1242, "learning_rate": 2.6169243794434725e-07, "epoch": 0.8603676233473073, "percentage": 86.04, "elapsed_time": "1 day, 5:30:17", "remaining_time": "4:47:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9339, "total_steps": 10853, "loss": 0.1232, "learning_rate": 2.613532304893163e-07, "epoch": 0.8604597595245773, "percentage": 86.05, "elapsed_time": "1 day, 5:30:28", "remaining_time": "4:47:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9340, "total_steps": 10853, "loss": 0.1135, "learning_rate": 2.610142308928779e-07, "epoch": 0.8605518957018473, "percentage": 86.06, "elapsed_time": "1 day, 5:30:37", "remaining_time": "4:46:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9341, "total_steps": 10853, "loss": 0.1242, "learning_rate": 2.6067543918650935e-07, "epoch": 0.8606440318791173, "percentage": 86.07, "elapsed_time": "1 day, 5:30:49", "remaining_time": "4:46:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9342, "total_steps": 10853, "loss": 0.1129, "learning_rate": 2.603368554016672e-07, "epoch": 0.8607361680563873, "percentage": 86.08, "elapsed_time": "1 day, 5:31:00", "remaining_time": "4:46:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9343, "total_steps": 10853, "loss": 0.1158, "learning_rate": 2.5999847956978963e-07, "epoch": 0.8608283042336573, "percentage": 86.09, "elapsed_time": "1 day, 5:31:11", "remaining_time": "4:46:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9344, "total_steps": 10853, "loss": 0.1109, "learning_rate": 2.5966031172229427e-07, "epoch": 0.8609204404109273, "percentage": 86.1, "elapsed_time": "1 day, 5:31:22", "remaining_time": "4:46:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9345, "total_steps": 10853, "loss": 0.1157, "learning_rate": 2.593223518905796e-07, "epoch": 0.8610125765881974, "percentage": 86.11, "elapsed_time": "1 day, 5:31:33", "remaining_time": "4:45:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9346, "total_steps": 10853, "loss": 0.1084, "learning_rate": 2.589846001060259e-07, "epoch": 0.8611047127654674, "percentage": 86.11, "elapsed_time": "1 day, 5:31:44", "remaining_time": "4:45:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9347, "total_steps": 10853, "loss": 0.1254, "learning_rate": 2.586470563999935e-07, "epoch": 0.8611968489427374, "percentage": 86.12, "elapsed_time": "1 day, 5:31:54", "remaining_time": "4:45:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9348, "total_steps": 10853, "loss": 0.1179, "learning_rate": 2.5830972080382265e-07, "epoch": 0.8612889851200074, "percentage": 86.13, "elapsed_time": "1 day, 5:32:05", "remaining_time": "4:45:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9349, "total_steps": 10853, "loss": 0.1269, "learning_rate": 2.5797259334883613e-07, "epoch": 0.8613811212972774, "percentage": 86.14, "elapsed_time": "1 day, 5:32:15", "remaining_time": "4:45:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9350, "total_steps": 10853, "loss": 0.1274, "learning_rate": 2.5763567406633496e-07, "epoch": 0.8614732574745474, "percentage": 86.15, "elapsed_time": "1 day, 5:32:28", "remaining_time": "4:44:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9351, "total_steps": 10853, "loss": 0.1256, "learning_rate": 2.5729896298760325e-07, "epoch": 0.8615653936518174, "percentage": 86.16, "elapsed_time": "1 day, 5:32:39", "remaining_time": "4:44:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9352, "total_steps": 10853, "loss": 0.1186, "learning_rate": 2.569624601439039e-07, "epoch": 0.8616575298290874, "percentage": 86.17, "elapsed_time": "1 day, 5:32:50", "remaining_time": "4:44:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9353, "total_steps": 10853, "loss": 0.113, "learning_rate": 2.566261655664812e-07, "epoch": 0.8617496660063574, "percentage": 86.18, "elapsed_time": "1 day, 5:33:01", "remaining_time": "4:44:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9354, "total_steps": 10853, "loss": 0.1014, "learning_rate": 2.562900792865611e-07, "epoch": 0.8618418021836274, "percentage": 86.19, "elapsed_time": "1 day, 5:33:12", "remaining_time": "4:44:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9355, "total_steps": 10853, "loss": 0.1127, "learning_rate": 2.5595420133534887e-07, "epoch": 0.8619339383608974, "percentage": 86.2, "elapsed_time": "1 day, 5:33:22", "remaining_time": "4:43:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9356, "total_steps": 10853, "loss": 0.1104, "learning_rate": 2.5561853174402964e-07, "epoch": 0.8620260745381674, "percentage": 86.21, "elapsed_time": "1 day, 5:33:33", "remaining_time": "4:43:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9357, "total_steps": 10853, "loss": 0.1077, "learning_rate": 2.5528307054377145e-07, "epoch": 0.8621182107154374, "percentage": 86.22, "elapsed_time": "1 day, 5:33:44", "remaining_time": "4:43:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9358, "total_steps": 10853, "loss": 0.1051, "learning_rate": 2.549478177657219e-07, "epoch": 0.8622103468927074, "percentage": 86.23, "elapsed_time": "1 day, 5:33:54", "remaining_time": "4:43:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9359, "total_steps": 10853, "loss": 0.1252, "learning_rate": 2.546127734410095e-07, "epoch": 0.8623024830699775, "percentage": 86.23, "elapsed_time": "1 day, 5:34:04", "remaining_time": "4:43:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9360, "total_steps": 10853, "loss": 0.119, "learning_rate": 2.542779376007426e-07, "epoch": 0.8623946192472475, "percentage": 86.24, "elapsed_time": "1 day, 5:34:17", "remaining_time": "4:43:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9361, "total_steps": 10853, "loss": 0.1024, "learning_rate": 2.5394331027601056e-07, "epoch": 0.8624867554245175, "percentage": 86.25, "elapsed_time": "1 day, 5:34:28", "remaining_time": "4:42:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9362, "total_steps": 10853, "loss": 0.1241, "learning_rate": 2.5360889149788375e-07, "epoch": 0.8625788916017875, "percentage": 86.26, "elapsed_time": "1 day, 5:34:38", "remaining_time": "4:42:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9363, "total_steps": 10853, "loss": 0.114, "learning_rate": 2.532746812974132e-07, "epoch": 0.8626710277790575, "percentage": 86.27, "elapsed_time": "1 day, 5:34:49", "remaining_time": "4:42:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9364, "total_steps": 10853, "loss": 0.1213, "learning_rate": 2.529406797056305e-07, "epoch": 0.8627631639563275, "percentage": 86.28, "elapsed_time": "1 day, 5:35:01", "remaining_time": "4:42:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9365, "total_steps": 10853, "loss": 0.1229, "learning_rate": 2.5260688675354806e-07, "epoch": 0.8628553001335975, "percentage": 86.29, "elapsed_time": "1 day, 5:35:14", "remaining_time": "4:42:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9366, "total_steps": 10853, "loss": 0.1208, "learning_rate": 2.5227330247215716e-07, "epoch": 0.8629474363108675, "percentage": 86.3, "elapsed_time": "1 day, 5:35:25", "remaining_time": "4:41:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9367, "total_steps": 10853, "loss": 0.1139, "learning_rate": 2.519399268924322e-07, "epoch": 0.8630395724881375, "percentage": 86.31, "elapsed_time": "1 day, 5:35:35", "remaining_time": "4:41:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9368, "total_steps": 10853, "loss": 0.1034, "learning_rate": 2.516067600453273e-07, "epoch": 0.8631317086654074, "percentage": 86.32, "elapsed_time": "1 day, 5:35:45", "remaining_time": "4:41:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9369, "total_steps": 10853, "loss": 0.1284, "learning_rate": 2.5127380196177634e-07, "epoch": 0.8632238448426774, "percentage": 86.33, "elapsed_time": "1 day, 5:35:55", "remaining_time": "4:41:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9370, "total_steps": 10853, "loss": 0.1095, "learning_rate": 2.509410526726952e-07, "epoch": 0.8633159810199474, "percentage": 86.34, "elapsed_time": "1 day, 5:36:07", "remaining_time": "4:41:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9371, "total_steps": 10853, "loss": 0.1001, "learning_rate": 2.5060851220897906e-07, "epoch": 0.8634081171972174, "percentage": 86.34, "elapsed_time": "1 day, 5:36:17", "remaining_time": "4:40:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9372, "total_steps": 10853, "loss": 0.1185, "learning_rate": 2.5027618060150526e-07, "epoch": 0.8635002533744875, "percentage": 86.35, "elapsed_time": "1 day, 5:36:28", "remaining_time": "4:40:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9373, "total_steps": 10853, "loss": 0.1218, "learning_rate": 2.4994405788112933e-07, "epoch": 0.8635923895517575, "percentage": 86.36, "elapsed_time": "1 day, 5:36:40", "remaining_time": "4:40:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9374, "total_steps": 10853, "loss": 0.1081, "learning_rate": 2.4961214407869e-07, "epoch": 0.8636845257290275, "percentage": 86.37, "elapsed_time": "1 day, 5:36:50", "remaining_time": "4:40:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9375, "total_steps": 10853, "loss": 0.1181, "learning_rate": 2.492804392250059e-07, "epoch": 0.8637766619062975, "percentage": 86.38, "elapsed_time": "1 day, 5:37:01", "remaining_time": "4:40:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9376, "total_steps": 10853, "loss": 0.1295, "learning_rate": 2.489489433508752e-07, "epoch": 0.8638687980835675, "percentage": 86.39, "elapsed_time": "1 day, 5:37:12", "remaining_time": "4:39:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9377, "total_steps": 10853, "loss": 0.1197, "learning_rate": 2.486176564870768e-07, "epoch": 0.8639609342608375, "percentage": 86.4, "elapsed_time": "1 day, 5:37:22", "remaining_time": "4:39:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9378, "total_steps": 10853, "loss": 0.1371, "learning_rate": 2.4828657866437123e-07, "epoch": 0.8640530704381075, "percentage": 86.41, "elapsed_time": "1 day, 5:37:33", "remaining_time": "4:39:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9379, "total_steps": 10853, "loss": 0.1164, "learning_rate": 2.479557099134991e-07, "epoch": 0.8641452066153775, "percentage": 86.42, "elapsed_time": "1 day, 5:37:44", "remaining_time": "4:39:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9380, "total_steps": 10853, "loss": 0.1094, "learning_rate": 2.4762505026518224e-07, "epoch": 0.8642373427926475, "percentage": 86.43, "elapsed_time": "1 day, 5:37:55", "remaining_time": "4:39:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9381, "total_steps": 10853, "loss": 0.1158, "learning_rate": 2.4729459975012194e-07, "epoch": 0.8643294789699175, "percentage": 86.44, "elapsed_time": "1 day, 5:38:05", "remaining_time": "4:39:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9382, "total_steps": 10853, "loss": 0.1136, "learning_rate": 2.46964358399e-07, "epoch": 0.8644216151471875, "percentage": 86.45, "elapsed_time": "1 day, 5:38:15", "remaining_time": "4:38:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9383, "total_steps": 10853, "loss": 0.1124, "learning_rate": 2.4663432624247975e-07, "epoch": 0.8645137513244575, "percentage": 86.46, "elapsed_time": "1 day, 5:38:25", "remaining_time": "4:38:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9384, "total_steps": 10853, "loss": 0.1108, "learning_rate": 2.4630450331120547e-07, "epoch": 0.8646058875017275, "percentage": 86.46, "elapsed_time": "1 day, 5:38:36", "remaining_time": "4:38:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9385, "total_steps": 10853, "loss": 0.1162, "learning_rate": 2.4597488963579995e-07, "epoch": 0.8646980236789975, "percentage": 86.47, "elapsed_time": "1 day, 5:38:45", "remaining_time": "4:38:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9386, "total_steps": 10853, "loss": 0.1106, "learning_rate": 2.4564548524686925e-07, "epoch": 0.8647901598562676, "percentage": 86.48, "elapsed_time": "1 day, 5:38:57", "remaining_time": "4:38:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9387, "total_steps": 10853, "loss": 0.1097, "learning_rate": 2.4531629017499724e-07, "epoch": 0.8648822960335376, "percentage": 86.49, "elapsed_time": "1 day, 5:39:08", "remaining_time": "4:37:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9388, "total_steps": 10853, "loss": 0.1241, "learning_rate": 2.449873044507503e-07, "epoch": 0.8649744322108076, "percentage": 86.5, "elapsed_time": "1 day, 5:39:19", "remaining_time": "4:37:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9389, "total_steps": 10853, "loss": 0.1127, "learning_rate": 2.446585281046751e-07, "epoch": 0.8650665683880776, "percentage": 86.51, "elapsed_time": "1 day, 5:39:30", "remaining_time": "4:37:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9390, "total_steps": 10853, "loss": 0.1269, "learning_rate": 2.443299611672981e-07, "epoch": 0.8651587045653476, "percentage": 86.52, "elapsed_time": "1 day, 5:39:40", "remaining_time": "4:37:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9391, "total_steps": 10853, "loss": 0.119, "learning_rate": 2.44001603669127e-07, "epoch": 0.8652508407426176, "percentage": 86.53, "elapsed_time": "1 day, 5:39:52", "remaining_time": "4:37:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9392, "total_steps": 10853, "loss": 0.1097, "learning_rate": 2.4367345564065003e-07, "epoch": 0.8653429769198876, "percentage": 86.54, "elapsed_time": "1 day, 5:40:03", "remaining_time": "4:36:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9393, "total_steps": 10853, "loss": 0.1069, "learning_rate": 2.433455171123356e-07, "epoch": 0.8654351130971576, "percentage": 86.55, "elapsed_time": "1 day, 5:40:13", "remaining_time": "4:36:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9394, "total_steps": 10853, "loss": 0.1077, "learning_rate": 2.4301778811463255e-07, "epoch": 0.8655272492744276, "percentage": 86.56, "elapsed_time": "1 day, 5:40:24", "remaining_time": "4:36:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9395, "total_steps": 10853, "loss": 0.1186, "learning_rate": 2.426902686779706e-07, "epoch": 0.8656193854516976, "percentage": 86.57, "elapsed_time": "1 day, 5:40:34", "remaining_time": "4:36:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9396, "total_steps": 10853, "loss": 0.1208, "learning_rate": 2.4236295883276e-07, "epoch": 0.8657115216289676, "percentage": 86.58, "elapsed_time": "1 day, 5:40:45", "remaining_time": "4:36:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9397, "total_steps": 10853, "loss": 0.1047, "learning_rate": 2.420358586093921e-07, "epoch": 0.8658036578062376, "percentage": 86.58, "elapsed_time": "1 day, 5:40:56", "remaining_time": "4:35:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9398, "total_steps": 10853, "loss": 0.1115, "learning_rate": 2.4170896803823785e-07, "epoch": 0.8658957939835076, "percentage": 86.59, "elapsed_time": "1 day, 5:41:06", "remaining_time": "4:35:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9399, "total_steps": 10853, "loss": 0.1091, "learning_rate": 2.4138228714964853e-07, "epoch": 0.8659879301607776, "percentage": 86.6, "elapsed_time": "1 day, 5:41:18", "remaining_time": "4:35:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9400, "total_steps": 10853, "loss": 0.1232, "learning_rate": 2.4105581597395705e-07, "epoch": 0.8660800663380477, "percentage": 86.61, "elapsed_time": "1 day, 5:41:28", "remaining_time": "4:35:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9401, "total_steps": 10853, "loss": 0.1203, "learning_rate": 2.4072955454147643e-07, "epoch": 0.8661722025153177, "percentage": 86.62, "elapsed_time": "1 day, 5:41:40", "remaining_time": "4:35:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9402, "total_steps": 10853, "loss": 0.1242, "learning_rate": 2.4040350288249944e-07, "epoch": 0.8662643386925877, "percentage": 86.63, "elapsed_time": "1 day, 5:41:51", "remaining_time": "4:34:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9403, "total_steps": 10853, "loss": 0.1155, "learning_rate": 2.400776610273006e-07, "epoch": 0.8663564748698577, "percentage": 86.64, "elapsed_time": "1 day, 5:42:02", "remaining_time": "4:34:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9404, "total_steps": 10853, "loss": 0.1121, "learning_rate": 2.397520290061339e-07, "epoch": 0.8664486110471277, "percentage": 86.65, "elapsed_time": "1 day, 5:42:12", "remaining_time": "4:34:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9405, "total_steps": 10853, "loss": 0.1171, "learning_rate": 2.394266068492351e-07, "epoch": 0.8665407472243977, "percentage": 86.66, "elapsed_time": "1 day, 5:42:23", "remaining_time": "4:34:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9406, "total_steps": 10853, "loss": 0.0941, "learning_rate": 2.391013945868187e-07, "epoch": 0.8666328834016677, "percentage": 86.67, "elapsed_time": "1 day, 5:42:33", "remaining_time": "4:34:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9407, "total_steps": 10853, "loss": 0.1126, "learning_rate": 2.38776392249081e-07, "epoch": 0.8667250195789377, "percentage": 86.68, "elapsed_time": "1 day, 5:42:44", "remaining_time": "4:34:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9408, "total_steps": 10853, "loss": 0.1272, "learning_rate": 2.38451599866199e-07, "epoch": 0.8668171557562077, "percentage": 86.69, "elapsed_time": "1 day, 5:42:54", "remaining_time": "4:33:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9409, "total_steps": 10853, "loss": 0.1321, "learning_rate": 2.381270174683295e-07, "epoch": 0.8669092919334777, "percentage": 86.69, "elapsed_time": "1 day, 5:43:05", "remaining_time": "4:33:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9410, "total_steps": 10853, "loss": 0.1165, "learning_rate": 2.3780264508560942e-07, "epoch": 0.8670014281107477, "percentage": 86.7, "elapsed_time": "1 day, 5:43:15", "remaining_time": "4:33:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9411, "total_steps": 10853, "loss": 0.1198, "learning_rate": 2.3747848274815716e-07, "epoch": 0.8670935642880176, "percentage": 86.71, "elapsed_time": "1 day, 5:43:25", "remaining_time": "4:33:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9412, "total_steps": 10853, "loss": 0.1263, "learning_rate": 2.3715453048607118e-07, "epoch": 0.8671857004652876, "percentage": 86.72, "elapsed_time": "1 day, 5:43:37", "remaining_time": "4:33:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9413, "total_steps": 10853, "loss": 0.1116, "learning_rate": 2.368307883294313e-07, "epoch": 0.8672778366425578, "percentage": 86.73, "elapsed_time": "1 day, 5:43:47", "remaining_time": "4:32:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9414, "total_steps": 10853, "loss": 0.1236, "learning_rate": 2.3650725630829598e-07, "epoch": 0.8673699728198278, "percentage": 86.74, "elapsed_time": "1 day, 5:43:58", "remaining_time": "4:32:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9415, "total_steps": 10853, "loss": 0.1241, "learning_rate": 2.3618393445270504e-07, "epoch": 0.8674621089970977, "percentage": 86.75, "elapsed_time": "1 day, 5:44:08", "remaining_time": "4:32:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9416, "total_steps": 10853, "loss": 0.1042, "learning_rate": 2.3586082279267952e-07, "epoch": 0.8675542451743677, "percentage": 86.76, "elapsed_time": "1 day, 5:44:19", "remaining_time": "4:32:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9417, "total_steps": 10853, "loss": 0.121, "learning_rate": 2.355379213582204e-07, "epoch": 0.8676463813516377, "percentage": 86.77, "elapsed_time": "1 day, 5:44:29", "remaining_time": "4:32:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9418, "total_steps": 10853, "loss": 0.1124, "learning_rate": 2.3521523017930954e-07, "epoch": 0.8677385175289077, "percentage": 86.78, "elapsed_time": "1 day, 5:44:40", "remaining_time": "4:31:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9419, "total_steps": 10853, "loss": 0.1225, "learning_rate": 2.3489274928590795e-07, "epoch": 0.8678306537061777, "percentage": 86.79, "elapsed_time": "1 day, 5:44:50", "remaining_time": "4:31:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9420, "total_steps": 10853, "loss": 0.1151, "learning_rate": 2.3457047870795808e-07, "epoch": 0.8679227898834477, "percentage": 86.8, "elapsed_time": "1 day, 5:44:59", "remaining_time": "4:31:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9421, "total_steps": 10853, "loss": 0.1168, "learning_rate": 2.3424841847538292e-07, "epoch": 0.8680149260607177, "percentage": 86.81, "elapsed_time": "1 day, 5:45:11", "remaining_time": "4:31:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9422, "total_steps": 10853, "loss": 0.1193, "learning_rate": 2.3392656861808666e-07, "epoch": 0.8681070622379877, "percentage": 86.81, "elapsed_time": "1 day, 5:45:22", "remaining_time": "4:31:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9423, "total_steps": 10853, "loss": 0.1207, "learning_rate": 2.3360492916595174e-07, "epoch": 0.8681991984152577, "percentage": 86.82, "elapsed_time": "1 day, 5:45:33", "remaining_time": "4:30:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9424, "total_steps": 10853, "loss": 0.1091, "learning_rate": 2.332835001488437e-07, "epoch": 0.8682913345925277, "percentage": 86.83, "elapsed_time": "1 day, 5:45:43", "remaining_time": "4:30:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9425, "total_steps": 10853, "loss": 0.125, "learning_rate": 2.3296228159660594e-07, "epoch": 0.8683834707697977, "percentage": 86.84, "elapsed_time": "1 day, 5:45:53", "remaining_time": "4:30:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9426, "total_steps": 10853, "loss": 0.1147, "learning_rate": 2.3264127353906485e-07, "epoch": 0.8684756069470677, "percentage": 86.85, "elapsed_time": "1 day, 5:46:03", "remaining_time": "4:30:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9427, "total_steps": 10853, "loss": 0.1096, "learning_rate": 2.323204760060252e-07, "epoch": 0.8685677431243378, "percentage": 86.86, "elapsed_time": "1 day, 5:46:15", "remaining_time": "4:30:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9428, "total_steps": 10853, "loss": 0.1005, "learning_rate": 2.3199988902727317e-07, "epoch": 0.8686598793016078, "percentage": 86.87, "elapsed_time": "1 day, 5:46:27", "remaining_time": "4:30:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9429, "total_steps": 10853, "loss": 0.1304, "learning_rate": 2.3167951263257633e-07, "epoch": 0.8687520154788778, "percentage": 86.88, "elapsed_time": "1 day, 5:46:37", "remaining_time": "4:29:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9430, "total_steps": 10853, "loss": 0.1127, "learning_rate": 2.313593468516806e-07, "epoch": 0.8688441516561478, "percentage": 86.89, "elapsed_time": "1 day, 5:46:48", "remaining_time": "4:29:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9431, "total_steps": 10853, "loss": 0.1247, "learning_rate": 2.3103939171431305e-07, "epoch": 0.8689362878334178, "percentage": 86.9, "elapsed_time": "1 day, 5:46:58", "remaining_time": "4:29:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9432, "total_steps": 10853, "loss": 0.1306, "learning_rate": 2.307196472501824e-07, "epoch": 0.8690284240106878, "percentage": 86.91, "elapsed_time": "1 day, 5:47:10", "remaining_time": "4:29:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9433, "total_steps": 10853, "loss": 0.1105, "learning_rate": 2.3040011348897689e-07, "epoch": 0.8691205601879578, "percentage": 86.92, "elapsed_time": "1 day, 5:47:21", "remaining_time": "4:29:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9434, "total_steps": 10853, "loss": 0.115, "learning_rate": 2.3008079046036525e-07, "epoch": 0.8692126963652278, "percentage": 86.93, "elapsed_time": "1 day, 5:47:31", "remaining_time": "4:28:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9435, "total_steps": 10853, "loss": 0.1076, "learning_rate": 2.2976167819399652e-07, "epoch": 0.8693048325424978, "percentage": 86.93, "elapsed_time": "1 day, 5:47:43", "remaining_time": "4:28:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9436, "total_steps": 10853, "loss": 0.1058, "learning_rate": 2.294427767195001e-07, "epoch": 0.8693969687197678, "percentage": 86.94, "elapsed_time": "1 day, 5:47:55", "remaining_time": "4:28:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9437, "total_steps": 10853, "loss": 0.1161, "learning_rate": 2.291240860664859e-07, "epoch": 0.8694891048970378, "percentage": 86.95, "elapsed_time": "1 day, 5:48:05", "remaining_time": "4:28:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9438, "total_steps": 10853, "loss": 0.1101, "learning_rate": 2.288056062645455e-07, "epoch": 0.8695812410743078, "percentage": 86.96, "elapsed_time": "1 day, 5:48:17", "remaining_time": "4:28:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9439, "total_steps": 10853, "loss": 0.1008, "learning_rate": 2.2848733734324835e-07, "epoch": 0.8696733772515778, "percentage": 86.97, "elapsed_time": "1 day, 5:48:29", "remaining_time": "4:27:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9440, "total_steps": 10853, "loss": 0.1293, "learning_rate": 2.281692793321469e-07, "epoch": 0.8697655134288479, "percentage": 86.98, "elapsed_time": "1 day, 5:48:40", "remaining_time": "4:27:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9441, "total_steps": 10853, "loss": 0.1233, "learning_rate": 2.2785143226077166e-07, "epoch": 0.8698576496061179, "percentage": 86.99, "elapsed_time": "1 day, 5:48:52", "remaining_time": "4:27:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9442, "total_steps": 10853, "loss": 0.1296, "learning_rate": 2.2753379615863575e-07, "epoch": 0.8699497857833879, "percentage": 87.0, "elapsed_time": "1 day, 5:49:03", "remaining_time": "4:27:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9443, "total_steps": 10853, "loss": 0.1169, "learning_rate": 2.2721637105523193e-07, "epoch": 0.8700419219606579, "percentage": 87.01, "elapsed_time": "1 day, 5:49:15", "remaining_time": "4:27:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9444, "total_steps": 10853, "loss": 0.1167, "learning_rate": 2.268991569800319e-07, "epoch": 0.8701340581379279, "percentage": 87.02, "elapsed_time": "1 day, 5:49:25", "remaining_time": "4:26:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9445, "total_steps": 10853, "loss": 0.1224, "learning_rate": 2.2658215396249046e-07, "epoch": 0.8702261943151979, "percentage": 87.03, "elapsed_time": "1 day, 5:49:36", "remaining_time": "4:26:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9446, "total_steps": 10853, "loss": 0.1238, "learning_rate": 2.2626536203204014e-07, "epoch": 0.8703183304924679, "percentage": 87.04, "elapsed_time": "1 day, 5:49:47", "remaining_time": "4:26:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9447, "total_steps": 10853, "loss": 0.1181, "learning_rate": 2.2594878121809633e-07, "epoch": 0.8704104666697379, "percentage": 87.05, "elapsed_time": "1 day, 5:49:57", "remaining_time": "4:26:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9448, "total_steps": 10853, "loss": 0.1227, "learning_rate": 2.2563241155005216e-07, "epoch": 0.8705026028470079, "percentage": 87.05, "elapsed_time": "1 day, 5:50:08", "remaining_time": "4:26:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9449, "total_steps": 10853, "loss": 0.1176, "learning_rate": 2.2531625305728362e-07, "epoch": 0.8705947390242779, "percentage": 87.06, "elapsed_time": "1 day, 5:50:19", "remaining_time": "4:26:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9450, "total_steps": 10853, "loss": 0.1041, "learning_rate": 2.2500030576914606e-07, "epoch": 0.8706868752015479, "percentage": 87.07, "elapsed_time": "1 day, 5:50:31", "remaining_time": "4:25:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9451, "total_steps": 10853, "loss": 0.1215, "learning_rate": 2.2468456971497493e-07, "epoch": 0.8707790113788179, "percentage": 87.08, "elapsed_time": "1 day, 5:50:42", "remaining_time": "4:25:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9452, "total_steps": 10853, "loss": 0.1197, "learning_rate": 2.2436904492408596e-07, "epoch": 0.8708711475560879, "percentage": 87.09, "elapsed_time": "1 day, 5:50:53", "remaining_time": "4:25:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9453, "total_steps": 10853, "loss": 0.1261, "learning_rate": 2.2405373142577597e-07, "epoch": 0.8709632837333579, "percentage": 87.1, "elapsed_time": "1 day, 5:51:05", "remaining_time": "4:25:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9454, "total_steps": 10853, "loss": 0.127, "learning_rate": 2.237386292493221e-07, "epoch": 0.871055419910628, "percentage": 87.11, "elapsed_time": "1 day, 5:51:17", "remaining_time": "4:25:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9455, "total_steps": 10853, "loss": 0.122, "learning_rate": 2.2342373842398208e-07, "epoch": 0.871147556087898, "percentage": 87.12, "elapsed_time": "1 day, 5:51:27", "remaining_time": "4:24:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9456, "total_steps": 10853, "loss": 0.117, "learning_rate": 2.2310905897899275e-07, "epoch": 0.871239692265168, "percentage": 87.13, "elapsed_time": "1 day, 5:51:39", "remaining_time": "4:24:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9457, "total_steps": 10853, "loss": 0.1128, "learning_rate": 2.227945909435719e-07, "epoch": 0.871331828442438, "percentage": 87.14, "elapsed_time": "1 day, 5:51:50", "remaining_time": "4:24:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9458, "total_steps": 10853, "loss": 0.1213, "learning_rate": 2.224803343469184e-07, "epoch": 0.871423964619708, "percentage": 87.15, "elapsed_time": "1 day, 5:52:00", "remaining_time": "4:24:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9459, "total_steps": 10853, "loss": 0.1114, "learning_rate": 2.2216628921821138e-07, "epoch": 0.8715161007969779, "percentage": 87.16, "elapsed_time": "1 day, 5:52:11", "remaining_time": "4:24:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9460, "total_steps": 10853, "loss": 0.1113, "learning_rate": 2.2185245558660918e-07, "epoch": 0.8716082369742479, "percentage": 87.16, "elapsed_time": "1 day, 5:52:23", "remaining_time": "4:23:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9461, "total_steps": 10853, "loss": 0.1237, "learning_rate": 2.215388334812521e-07, "epoch": 0.8717003731515179, "percentage": 87.17, "elapsed_time": "1 day, 5:52:33", "remaining_time": "4:23:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9462, "total_steps": 10853, "loss": 0.1051, "learning_rate": 2.2122542293125883e-07, "epoch": 0.8717925093287879, "percentage": 87.18, "elapsed_time": "1 day, 5:52:44", "remaining_time": "4:23:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9463, "total_steps": 10853, "loss": 0.105, "learning_rate": 2.2091222396573104e-07, "epoch": 0.8718846455060579, "percentage": 87.19, "elapsed_time": "1 day, 5:52:55", "remaining_time": "4:23:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9464, "total_steps": 10853, "loss": 0.1051, "learning_rate": 2.20599236613748e-07, "epoch": 0.8719767816833279, "percentage": 87.2, "elapsed_time": "1 day, 5:53:05", "remaining_time": "4:23:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9465, "total_steps": 10853, "loss": 0.1156, "learning_rate": 2.2028646090437117e-07, "epoch": 0.8720689178605979, "percentage": 87.21, "elapsed_time": "1 day, 5:53:15", "remaining_time": "4:22:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9466, "total_steps": 10853, "loss": 0.1137, "learning_rate": 2.199738968666418e-07, "epoch": 0.8721610540378679, "percentage": 87.22, "elapsed_time": "1 day, 5:53:26", "remaining_time": "4:22:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9467, "total_steps": 10853, "loss": 0.1247, "learning_rate": 2.1966154452958216e-07, "epoch": 0.8722531902151379, "percentage": 87.23, "elapsed_time": "1 day, 5:53:37", "remaining_time": "4:22:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9468, "total_steps": 10853, "loss": 0.1066, "learning_rate": 2.1934940392219272e-07, "epoch": 0.872345326392408, "percentage": 87.24, "elapsed_time": "1 day, 5:53:47", "remaining_time": "4:22:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9469, "total_steps": 10853, "loss": 0.1197, "learning_rate": 2.190374750734567e-07, "epoch": 0.872437462569678, "percentage": 87.25, "elapsed_time": "1 day, 5:53:59", "remaining_time": "4:22:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9470, "total_steps": 10853, "loss": 0.1091, "learning_rate": 2.187257580123367e-07, "epoch": 0.872529598746948, "percentage": 87.26, "elapsed_time": "1 day, 5:54:08", "remaining_time": "4:22:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9471, "total_steps": 10853, "loss": 0.1204, "learning_rate": 2.1841425276777544e-07, "epoch": 0.872621734924218, "percentage": 87.27, "elapsed_time": "1 day, 5:54:20", "remaining_time": "4:21:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9472, "total_steps": 10853, "loss": 0.1285, "learning_rate": 2.1810295936869675e-07, "epoch": 0.872713871101488, "percentage": 87.28, "elapsed_time": "1 day, 5:54:31", "remaining_time": "4:21:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9473, "total_steps": 10853, "loss": 0.1288, "learning_rate": 2.1779187784400385e-07, "epoch": 0.872806007278758, "percentage": 87.28, "elapsed_time": "1 day, 5:54:41", "remaining_time": "4:21:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9474, "total_steps": 10853, "loss": 0.1141, "learning_rate": 2.1748100822258034e-07, "epoch": 0.872898143456028, "percentage": 87.29, "elapsed_time": "1 day, 5:54:51", "remaining_time": "4:21:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9475, "total_steps": 10853, "loss": 0.108, "learning_rate": 2.171703505332909e-07, "epoch": 0.872990279633298, "percentage": 87.3, "elapsed_time": "1 day, 5:55:00", "remaining_time": "4:21:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9476, "total_steps": 10853, "loss": 0.126, "learning_rate": 2.1685990480498048e-07, "epoch": 0.873082415810568, "percentage": 87.31, "elapsed_time": "1 day, 5:55:12", "remaining_time": "4:20:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9477, "total_steps": 10853, "loss": 0.1134, "learning_rate": 2.1654967106647328e-07, "epoch": 0.873174551987838, "percentage": 87.32, "elapsed_time": "1 day, 5:55:23", "remaining_time": "4:20:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9478, "total_steps": 10853, "loss": 0.1207, "learning_rate": 2.1623964934657516e-07, "epoch": 0.873266688165108, "percentage": 87.33, "elapsed_time": "1 day, 5:55:34", "remaining_time": "4:20:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9479, "total_steps": 10853, "loss": 0.1184, "learning_rate": 2.159298396740711e-07, "epoch": 0.873358824342378, "percentage": 87.34, "elapsed_time": "1 day, 5:55:45", "remaining_time": "4:20:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9480, "total_steps": 10853, "loss": 0.1221, "learning_rate": 2.1562024207772758e-07, "epoch": 0.873450960519648, "percentage": 87.35, "elapsed_time": "1 day, 5:55:56", "remaining_time": "4:20:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9481, "total_steps": 10853, "loss": 0.1073, "learning_rate": 2.1531085658628992e-07, "epoch": 0.8735430966969181, "percentage": 87.36, "elapsed_time": "1 day, 5:56:07", "remaining_time": "4:19:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9482, "total_steps": 10853, "loss": 0.1219, "learning_rate": 2.1500168322848515e-07, "epoch": 0.8736352328741881, "percentage": 87.37, "elapsed_time": "1 day, 5:56:18", "remaining_time": "4:19:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9483, "total_steps": 10853, "loss": 0.1207, "learning_rate": 2.1469272203302055e-07, "epoch": 0.8737273690514581, "percentage": 87.38, "elapsed_time": "1 day, 5:56:29", "remaining_time": "4:19:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9484, "total_steps": 10853, "loss": 0.1136, "learning_rate": 2.143839730285824e-07, "epoch": 0.8738195052287281, "percentage": 87.39, "elapsed_time": "1 day, 5:56:39", "remaining_time": "4:19:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9485, "total_steps": 10853, "loss": 0.1162, "learning_rate": 2.1407543624383798e-07, "epoch": 0.8739116414059981, "percentage": 87.4, "elapsed_time": "1 day, 5:56:50", "remaining_time": "4:19:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9486, "total_steps": 10853, "loss": 0.1213, "learning_rate": 2.1376711170743553e-07, "epoch": 0.8740037775832681, "percentage": 87.4, "elapsed_time": "1 day, 5:57:01", "remaining_time": "4:18:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9487, "total_steps": 10853, "loss": 0.1139, "learning_rate": 2.134589994480027e-07, "epoch": 0.8740959137605381, "percentage": 87.41, "elapsed_time": "1 day, 5:57:12", "remaining_time": "4:18:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9488, "total_steps": 10853, "loss": 0.1191, "learning_rate": 2.1315109949414824e-07, "epoch": 0.8741880499378081, "percentage": 87.42, "elapsed_time": "1 day, 5:57:24", "remaining_time": "4:18:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9489, "total_steps": 10853, "loss": 0.1219, "learning_rate": 2.1284341187446046e-07, "epoch": 0.8742801861150781, "percentage": 87.43, "elapsed_time": "1 day, 5:57:33", "remaining_time": "4:18:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9490, "total_steps": 10853, "loss": 0.1052, "learning_rate": 2.1253593661750727e-07, "epoch": 0.8743723222923481, "percentage": 87.44, "elapsed_time": "1 day, 5:57:44", "remaining_time": "4:18:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9491, "total_steps": 10853, "loss": 0.1236, "learning_rate": 2.1222867375183893e-07, "epoch": 0.8744644584696181, "percentage": 87.45, "elapsed_time": "1 day, 5:57:56", "remaining_time": "4:18:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9492, "total_steps": 10853, "loss": 0.1145, "learning_rate": 2.1192162330598453e-07, "epoch": 0.8745565946468881, "percentage": 87.46, "elapsed_time": "1 day, 5:58:07", "remaining_time": "4:17:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9493, "total_steps": 10853, "loss": 0.1095, "learning_rate": 2.1161478530845353e-07, "epoch": 0.8746487308241581, "percentage": 87.47, "elapsed_time": "1 day, 5:58:18", "remaining_time": "4:17:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9494, "total_steps": 10853, "loss": 0.1261, "learning_rate": 2.1130815978773616e-07, "epoch": 0.8747408670014281, "percentage": 87.48, "elapsed_time": "1 day, 5:58:31", "remaining_time": "4:17:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9495, "total_steps": 10853, "loss": 0.1235, "learning_rate": 2.1100174677230217e-07, "epoch": 0.8748330031786982, "percentage": 87.49, "elapsed_time": "1 day, 5:58:42", "remaining_time": "4:17:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9496, "total_steps": 10853, "loss": 0.1102, "learning_rate": 2.1069554629060297e-07, "epoch": 0.8749251393559682, "percentage": 87.5, "elapsed_time": "1 day, 5:58:54", "remaining_time": "4:17:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9497, "total_steps": 10853, "loss": 0.1151, "learning_rate": 2.10389558371068e-07, "epoch": 0.8750172755332382, "percentage": 87.51, "elapsed_time": "1 day, 5:59:05", "remaining_time": "4:16:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9498, "total_steps": 10853, "loss": 0.1251, "learning_rate": 2.1008378304210876e-07, "epoch": 0.8751094117105082, "percentage": 87.51, "elapsed_time": "1 day, 5:59:17", "remaining_time": "4:16:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9499, "total_steps": 10853, "loss": 0.1164, "learning_rate": 2.0977822033211748e-07, "epoch": 0.8752015478877782, "percentage": 87.52, "elapsed_time": "1 day, 5:59:27", "remaining_time": "4:16:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9500, "total_steps": 10853, "loss": 0.1175, "learning_rate": 2.0947287026946428e-07, "epoch": 0.8752936840650481, "percentage": 87.53, "elapsed_time": "1 day, 5:59:38", "remaining_time": "4:16:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9500, "total_steps": 10853, "eval_loss": 0.1174582913517952, "epoch": 0.8752936840650481, "percentage": 87.53, "elapsed_time": "1 day, 6:04:37", "remaining_time": "4:17:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9501, "total_steps": 10853, "loss": 0.1057, "learning_rate": 2.091677328825023e-07, "epoch": 0.8753858202423181, "percentage": 87.54, "elapsed_time": "1 day, 6:04:48", "remaining_time": "4:16:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9502, "total_steps": 10853, "loss": 0.1122, "learning_rate": 2.0886280819956223e-07, "epoch": 0.8754779564195881, "percentage": 87.55, "elapsed_time": "1 day, 6:05:00", "remaining_time": "4:16:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9503, "total_steps": 10853, "loss": 0.1268, "learning_rate": 2.0855809624895694e-07, "epoch": 0.8755700925968581, "percentage": 87.56, "elapsed_time": "1 day, 6:05:10", "remaining_time": "4:16:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9504, "total_steps": 10853, "loss": 0.1225, "learning_rate": 2.082535970589794e-07, "epoch": 0.8756622287741281, "percentage": 87.57, "elapsed_time": "1 day, 6:05:20", "remaining_time": "4:16:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9505, "total_steps": 10853, "loss": 0.1134, "learning_rate": 2.0794931065790226e-07, "epoch": 0.8757543649513981, "percentage": 87.58, "elapsed_time": "1 day, 6:05:30", "remaining_time": "4:16:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9506, "total_steps": 10853, "loss": 0.1185, "learning_rate": 2.076452370739776e-07, "epoch": 0.8758465011286681, "percentage": 87.59, "elapsed_time": "1 day, 6:05:40", "remaining_time": "4:15:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9507, "total_steps": 10853, "loss": 0.1309, "learning_rate": 2.0734137633543954e-07, "epoch": 0.8759386373059381, "percentage": 87.6, "elapsed_time": "1 day, 6:05:52", "remaining_time": "4:15:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9508, "total_steps": 10853, "loss": 0.1102, "learning_rate": 2.0703772847050136e-07, "epoch": 0.8760307734832082, "percentage": 87.61, "elapsed_time": "1 day, 6:06:02", "remaining_time": "4:15:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9509, "total_steps": 10853, "loss": 0.1214, "learning_rate": 2.0673429350735742e-07, "epoch": 0.8761229096604782, "percentage": 87.62, "elapsed_time": "1 day, 6:06:13", "remaining_time": "4:15:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9510, "total_steps": 10853, "loss": 0.1051, "learning_rate": 2.06431071474181e-07, "epoch": 0.8762150458377482, "percentage": 87.63, "elapsed_time": "1 day, 6:06:24", "remaining_time": "4:15:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9511, "total_steps": 10853, "loss": 0.1133, "learning_rate": 2.0612806239912602e-07, "epoch": 0.8763071820150182, "percentage": 87.63, "elapsed_time": "1 day, 6:06:34", "remaining_time": "4:14:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9512, "total_steps": 10853, "loss": 0.1122, "learning_rate": 2.0582526631032745e-07, "epoch": 0.8763993181922882, "percentage": 87.64, "elapsed_time": "1 day, 6:06:44", "remaining_time": "4:14:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9513, "total_steps": 10853, "loss": 0.1183, "learning_rate": 2.0552268323590002e-07, "epoch": 0.8764914543695582, "percentage": 87.65, "elapsed_time": "1 day, 6:06:54", "remaining_time": "4:14:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9514, "total_steps": 10853, "loss": 0.1233, "learning_rate": 2.052203132039382e-07, "epoch": 0.8765835905468282, "percentage": 87.66, "elapsed_time": "1 day, 6:07:04", "remaining_time": "4:14:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9515, "total_steps": 10853, "loss": 0.1184, "learning_rate": 2.0491815624251733e-07, "epoch": 0.8766757267240982, "percentage": 87.67, "elapsed_time": "1 day, 6:07:15", "remaining_time": "4:14:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9516, "total_steps": 10853, "loss": 0.1145, "learning_rate": 2.046162123796927e-07, "epoch": 0.8767678629013682, "percentage": 87.68, "elapsed_time": "1 day, 6:07:26", "remaining_time": "4:13:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9517, "total_steps": 10853, "loss": 0.1326, "learning_rate": 2.043144816434997e-07, "epoch": 0.8768599990786382, "percentage": 87.69, "elapsed_time": "1 day, 6:07:38", "remaining_time": "4:13:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9518, "total_steps": 10853, "loss": 0.1136, "learning_rate": 2.0401296406195426e-07, "epoch": 0.8769521352559082, "percentage": 87.7, "elapsed_time": "1 day, 6:07:50", "remaining_time": "4:13:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9519, "total_steps": 10853, "loss": 0.1127, "learning_rate": 2.0371165966305173e-07, "epoch": 0.8770442714331782, "percentage": 87.71, "elapsed_time": "1 day, 6:08:00", "remaining_time": "4:13:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9520, "total_steps": 10853, "loss": 0.1084, "learning_rate": 2.0341056847476947e-07, "epoch": 0.8771364076104482, "percentage": 87.72, "elapsed_time": "1 day, 6:08:09", "remaining_time": "4:13:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9521, "total_steps": 10853, "loss": 0.1112, "learning_rate": 2.031096905250629e-07, "epoch": 0.8772285437877182, "percentage": 87.73, "elapsed_time": "1 day, 6:08:21", "remaining_time": "4:12:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9522, "total_steps": 10853, "loss": 0.1172, "learning_rate": 2.0280902584186828e-07, "epoch": 0.8773206799649883, "percentage": 87.74, "elapsed_time": "1 day, 6:08:32", "remaining_time": "4:12:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9523, "total_steps": 10853, "loss": 0.1247, "learning_rate": 2.02508574453103e-07, "epoch": 0.8774128161422583, "percentage": 87.75, "elapsed_time": "1 day, 6:08:43", "remaining_time": "4:12:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9524, "total_steps": 10853, "loss": 0.1203, "learning_rate": 2.0220833638666393e-07, "epoch": 0.8775049523195283, "percentage": 87.75, "elapsed_time": "1 day, 6:08:54", "remaining_time": "4:12:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9525, "total_steps": 10853, "loss": 0.1152, "learning_rate": 2.0190831167042846e-07, "epoch": 0.8775970884967983, "percentage": 87.76, "elapsed_time": "1 day, 6:09:04", "remaining_time": "4:12:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9526, "total_steps": 10853, "loss": 0.1214, "learning_rate": 2.016085003322535e-07, "epoch": 0.8776892246740683, "percentage": 87.77, "elapsed_time": "1 day, 6:09:14", "remaining_time": "4:12:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9527, "total_steps": 10853, "loss": 0.1146, "learning_rate": 2.013089023999762e-07, "epoch": 0.8777813608513383, "percentage": 87.78, "elapsed_time": "1 day, 6:09:25", "remaining_time": "4:11:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9528, "total_steps": 10853, "loss": 0.1116, "learning_rate": 2.010095179014146e-07, "epoch": 0.8778734970286083, "percentage": 87.79, "elapsed_time": "1 day, 6:09:37", "remaining_time": "4:11:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9529, "total_steps": 10853, "loss": 0.1279, "learning_rate": 2.00710346864367e-07, "epoch": 0.8779656332058783, "percentage": 87.8, "elapsed_time": "1 day, 6:09:47", "remaining_time": "4:11:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9530, "total_steps": 10853, "loss": 0.1249, "learning_rate": 2.0041138931661124e-07, "epoch": 0.8780577693831483, "percentage": 87.81, "elapsed_time": "1 day, 6:09:59", "remaining_time": "4:11:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9531, "total_steps": 10853, "loss": 0.1194, "learning_rate": 2.0011264528590562e-07, "epoch": 0.8781499055604183, "percentage": 87.82, "elapsed_time": "1 day, 6:10:08", "remaining_time": "4:11:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9532, "total_steps": 10853, "loss": 0.1085, "learning_rate": 1.9981411479998798e-07, "epoch": 0.8782420417376883, "percentage": 87.83, "elapsed_time": "1 day, 6:10:18", "remaining_time": "4:10:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9533, "total_steps": 10853, "loss": 0.1102, "learning_rate": 1.9951579788657748e-07, "epoch": 0.8783341779149583, "percentage": 87.84, "elapsed_time": "1 day, 6:10:28", "remaining_time": "4:10:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9534, "total_steps": 10853, "loss": 0.1242, "learning_rate": 1.9921769457337286e-07, "epoch": 0.8784263140922283, "percentage": 87.85, "elapsed_time": "1 day, 6:10:39", "remaining_time": "4:10:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9535, "total_steps": 10853, "loss": 0.114, "learning_rate": 1.9891980488805278e-07, "epoch": 0.8785184502694983, "percentage": 87.86, "elapsed_time": "1 day, 6:10:50", "remaining_time": "4:10:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9536, "total_steps": 10853, "loss": 0.1306, "learning_rate": 1.986221288582768e-07, "epoch": 0.8786105864467684, "percentage": 87.87, "elapsed_time": "1 day, 6:11:02", "remaining_time": "4:10:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9537, "total_steps": 10853, "loss": 0.1214, "learning_rate": 1.9832466651168337e-07, "epoch": 0.8787027226240384, "percentage": 87.87, "elapsed_time": "1 day, 6:11:11", "remaining_time": "4:09:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9538, "total_steps": 10853, "loss": 0.1056, "learning_rate": 1.9802741787589258e-07, "epoch": 0.8787948588013084, "percentage": 87.88, "elapsed_time": "1 day, 6:11:23", "remaining_time": "4:09:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9539, "total_steps": 10853, "loss": 0.116, "learning_rate": 1.977303829785035e-07, "epoch": 0.8788869949785784, "percentage": 87.89, "elapsed_time": "1 day, 6:11:34", "remaining_time": "4:09:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9540, "total_steps": 10853, "loss": 0.1243, "learning_rate": 1.9743356184709628e-07, "epoch": 0.8789791311558484, "percentage": 87.9, "elapsed_time": "1 day, 6:11:45", "remaining_time": "4:09:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9541, "total_steps": 10853, "loss": 0.129, "learning_rate": 1.9713695450923054e-07, "epoch": 0.8790712673331184, "percentage": 87.91, "elapsed_time": "1 day, 6:11:56", "remaining_time": "4:09:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9542, "total_steps": 10853, "loss": 0.1198, "learning_rate": 1.968405609924473e-07, "epoch": 0.8791634035103884, "percentage": 87.92, "elapsed_time": "1 day, 6:12:08", "remaining_time": "4:08:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9543, "total_steps": 10853, "loss": 0.1231, "learning_rate": 1.9654438132426485e-07, "epoch": 0.8792555396876583, "percentage": 87.93, "elapsed_time": "1 day, 6:12:19", "remaining_time": "4:08:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9544, "total_steps": 10853, "loss": 0.1083, "learning_rate": 1.9624841553218476e-07, "epoch": 0.8793476758649283, "percentage": 87.94, "elapsed_time": "1 day, 6:12:29", "remaining_time": "4:08:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9545, "total_steps": 10853, "loss": 0.1317, "learning_rate": 1.9595266364368705e-07, "epoch": 0.8794398120421983, "percentage": 87.95, "elapsed_time": "1 day, 6:12:40", "remaining_time": "4:08:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9546, "total_steps": 10853, "loss": 0.1113, "learning_rate": 1.9565712568623274e-07, "epoch": 0.8795319482194683, "percentage": 87.96, "elapsed_time": "1 day, 6:12:50", "remaining_time": "4:08:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9547, "total_steps": 10853, "loss": 0.1127, "learning_rate": 1.9536180168726214e-07, "epoch": 0.8796240843967383, "percentage": 87.97, "elapsed_time": "1 day, 6:13:01", "remaining_time": "4:08:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9548, "total_steps": 10853, "loss": 0.119, "learning_rate": 1.9506669167419667e-07, "epoch": 0.8797162205740083, "percentage": 87.98, "elapsed_time": "1 day, 6:13:11", "remaining_time": "4:07:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9549, "total_steps": 10853, "loss": 0.1274, "learning_rate": 1.9477179567443632e-07, "epoch": 0.8798083567512784, "percentage": 87.98, "elapsed_time": "1 day, 6:13:23", "remaining_time": "4:07:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9550, "total_steps": 10853, "loss": 0.1202, "learning_rate": 1.9447711371536365e-07, "epoch": 0.8799004929285484, "percentage": 87.99, "elapsed_time": "1 day, 6:13:35", "remaining_time": "4:07:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9551, "total_steps": 10853, "loss": 0.1171, "learning_rate": 1.9418264582433844e-07, "epoch": 0.8799926291058184, "percentage": 88.0, "elapsed_time": "1 day, 6:13:46", "remaining_time": "4:07:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9552, "total_steps": 10853, "loss": 0.1167, "learning_rate": 1.9388839202870268e-07, "epoch": 0.8800847652830884, "percentage": 88.01, "elapsed_time": "1 day, 6:13:56", "remaining_time": "4:07:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9553, "total_steps": 10853, "loss": 0.1042, "learning_rate": 1.9359435235577818e-07, "epoch": 0.8801769014603584, "percentage": 88.02, "elapsed_time": "1 day, 6:14:07", "remaining_time": "4:06:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9554, "total_steps": 10853, "loss": 0.1253, "learning_rate": 1.9330052683286666e-07, "epoch": 0.8802690376376284, "percentage": 88.03, "elapsed_time": "1 day, 6:14:18", "remaining_time": "4:06:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9555, "total_steps": 10853, "loss": 0.1134, "learning_rate": 1.930069154872488e-07, "epoch": 0.8803611738148984, "percentage": 88.04, "elapsed_time": "1 day, 6:14:29", "remaining_time": "4:06:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9556, "total_steps": 10853, "loss": 0.1213, "learning_rate": 1.92713518346187e-07, "epoch": 0.8804533099921684, "percentage": 88.05, "elapsed_time": "1 day, 6:14:39", "remaining_time": "4:06:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9557, "total_steps": 10853, "loss": 0.1185, "learning_rate": 1.9242033543692362e-07, "epoch": 0.8805454461694384, "percentage": 88.06, "elapsed_time": "1 day, 6:14:49", "remaining_time": "4:06:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9558, "total_steps": 10853, "loss": 0.1214, "learning_rate": 1.9212736678668075e-07, "epoch": 0.8806375823467084, "percentage": 88.07, "elapsed_time": "1 day, 6:15:01", "remaining_time": "4:05:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9559, "total_steps": 10853, "loss": 0.1142, "learning_rate": 1.9183461242266027e-07, "epoch": 0.8807297185239784, "percentage": 88.08, "elapsed_time": "1 day, 6:15:11", "remaining_time": "4:05:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9560, "total_steps": 10853, "loss": 0.1147, "learning_rate": 1.9154207237204403e-07, "epoch": 0.8808218547012484, "percentage": 88.09, "elapsed_time": "1 day, 6:15:20", "remaining_time": "4:05:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9561, "total_steps": 10853, "loss": 0.1299, "learning_rate": 1.9124974666199476e-07, "epoch": 0.8809139908785184, "percentage": 88.1, "elapsed_time": "1 day, 6:15:30", "remaining_time": "4:05:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9562, "total_steps": 10853, "loss": 0.1131, "learning_rate": 1.909576353196549e-07, "epoch": 0.8810061270557884, "percentage": 88.1, "elapsed_time": "1 day, 6:15:41", "remaining_time": "4:05:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9563, "total_steps": 10853, "loss": 0.113, "learning_rate": 1.9066573837214773e-07, "epoch": 0.8810982632330585, "percentage": 88.11, "elapsed_time": "1 day, 6:15:50", "remaining_time": "4:04:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9564, "total_steps": 10853, "loss": 0.117, "learning_rate": 1.90374055846575e-07, "epoch": 0.8811903994103285, "percentage": 88.12, "elapsed_time": "1 day, 6:16:01", "remaining_time": "4:04:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9565, "total_steps": 10853, "loss": 0.1208, "learning_rate": 1.9008258777001963e-07, "epoch": 0.8812825355875985, "percentage": 88.13, "elapsed_time": "1 day, 6:16:11", "remaining_time": "4:04:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9566, "total_steps": 10853, "loss": 0.1116, "learning_rate": 1.8979133416954453e-07, "epoch": 0.8813746717648685, "percentage": 88.14, "elapsed_time": "1 day, 6:16:21", "remaining_time": "4:04:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9567, "total_steps": 10853, "loss": 0.1252, "learning_rate": 1.8950029507219302e-07, "epoch": 0.8814668079421385, "percentage": 88.15, "elapsed_time": "1 day, 6:16:32", "remaining_time": "4:04:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9568, "total_steps": 10853, "loss": 0.1207, "learning_rate": 1.8920947050498711e-07, "epoch": 0.8815589441194085, "percentage": 88.16, "elapsed_time": "1 day, 6:16:43", "remaining_time": "4:03:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9569, "total_steps": 10853, "loss": 0.1293, "learning_rate": 1.889188604949313e-07, "epoch": 0.8816510802966785, "percentage": 88.17, "elapsed_time": "1 day, 6:16:53", "remaining_time": "4:03:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9570, "total_steps": 10853, "loss": 0.1005, "learning_rate": 1.8862846506900762e-07, "epoch": 0.8817432164739485, "percentage": 88.18, "elapsed_time": "1 day, 6:17:04", "remaining_time": "4:03:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9571, "total_steps": 10853, "loss": 0.1113, "learning_rate": 1.8833828425418006e-07, "epoch": 0.8818353526512185, "percentage": 88.19, "elapsed_time": "1 day, 6:17:14", "remaining_time": "4:03:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9572, "total_steps": 10853, "loss": 0.1122, "learning_rate": 1.8804831807739094e-07, "epoch": 0.8819274888284885, "percentage": 88.2, "elapsed_time": "1 day, 6:17:24", "remaining_time": "4:03:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9573, "total_steps": 10853, "loss": 0.118, "learning_rate": 1.8775856656556458e-07, "epoch": 0.8820196250057585, "percentage": 88.21, "elapsed_time": "1 day, 6:17:35", "remaining_time": "4:03:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9574, "total_steps": 10853, "loss": 0.1242, "learning_rate": 1.8746902974560443e-07, "epoch": 0.8821117611830285, "percentage": 88.22, "elapsed_time": "1 day, 6:17:45", "remaining_time": "4:02:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9575, "total_steps": 10853, "loss": 0.123, "learning_rate": 1.8717970764439374e-07, "epoch": 0.8822038973602985, "percentage": 88.22, "elapsed_time": "1 day, 6:17:57", "remaining_time": "4:02:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9576, "total_steps": 10853, "loss": 0.1278, "learning_rate": 1.8689060028879602e-07, "epoch": 0.8822960335375686, "percentage": 88.23, "elapsed_time": "1 day, 6:18:08", "remaining_time": "4:02:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9577, "total_steps": 10853, "loss": 0.1193, "learning_rate": 1.866017077056545e-07, "epoch": 0.8823881697148386, "percentage": 88.24, "elapsed_time": "1 day, 6:18:19", "remaining_time": "4:02:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9578, "total_steps": 10853, "loss": 0.1184, "learning_rate": 1.8631302992179383e-07, "epoch": 0.8824803058921086, "percentage": 88.25, "elapsed_time": "1 day, 6:18:29", "remaining_time": "4:02:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9579, "total_steps": 10853, "loss": 0.1092, "learning_rate": 1.860245669640176e-07, "epoch": 0.8825724420693786, "percentage": 88.26, "elapsed_time": "1 day, 6:18:39", "remaining_time": "4:01:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9580, "total_steps": 10853, "loss": 0.1111, "learning_rate": 1.857363188591091e-07, "epoch": 0.8826645782466486, "percentage": 88.27, "elapsed_time": "1 day, 6:18:50", "remaining_time": "4:01:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9581, "total_steps": 10853, "loss": 0.1079, "learning_rate": 1.8544828563383243e-07, "epoch": 0.8827567144239186, "percentage": 88.28, "elapsed_time": "1 day, 6:19:00", "remaining_time": "4:01:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9582, "total_steps": 10853, "loss": 0.1275, "learning_rate": 1.8516046731493127e-07, "epoch": 0.8828488506011886, "percentage": 88.29, "elapsed_time": "1 day, 6:19:11", "remaining_time": "4:01:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9583, "total_steps": 10853, "loss": 0.1096, "learning_rate": 1.848728639291303e-07, "epoch": 0.8829409867784586, "percentage": 88.3, "elapsed_time": "1 day, 6:19:21", "remaining_time": "4:01:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9584, "total_steps": 10853, "loss": 0.1191, "learning_rate": 1.8458547550313287e-07, "epoch": 0.8830331229557286, "percentage": 88.31, "elapsed_time": "1 day, 6:19:32", "remaining_time": "4:00:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9585, "total_steps": 10853, "loss": 0.1137, "learning_rate": 1.8429830206362325e-07, "epoch": 0.8831252591329986, "percentage": 88.32, "elapsed_time": "1 day, 6:19:43", "remaining_time": "4:00:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9586, "total_steps": 10853, "loss": 0.1138, "learning_rate": 1.8401134363726536e-07, "epoch": 0.8832173953102685, "percentage": 88.33, "elapsed_time": "1 day, 6:19:53", "remaining_time": "4:00:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9587, "total_steps": 10853, "loss": 0.1152, "learning_rate": 1.8372460025070343e-07, "epoch": 0.8833095314875385, "percentage": 88.34, "elapsed_time": "1 day, 6:20:03", "remaining_time": "4:00:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9588, "total_steps": 10853, "loss": 0.1113, "learning_rate": 1.8343807193056201e-07, "epoch": 0.8834016676648085, "percentage": 88.34, "elapsed_time": "1 day, 6:20:13", "remaining_time": "4:00:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9589, "total_steps": 10853, "loss": 0.1149, "learning_rate": 1.8315175870344455e-07, "epoch": 0.8834938038420785, "percentage": 88.35, "elapsed_time": "1 day, 6:20:24", "remaining_time": "3:59:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9590, "total_steps": 10853, "loss": 0.1154, "learning_rate": 1.8286566059593615e-07, "epoch": 0.8835859400193486, "percentage": 88.36, "elapsed_time": "1 day, 6:20:34", "remaining_time": "3:59:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9591, "total_steps": 10853, "loss": 0.1185, "learning_rate": 1.825797776346e-07, "epoch": 0.8836780761966186, "percentage": 88.37, "elapsed_time": "1 day, 6:20:45", "remaining_time": "3:59:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9592, "total_steps": 10853, "loss": 0.1243, "learning_rate": 1.8229410984598128e-07, "epoch": 0.8837702123738886, "percentage": 88.38, "elapsed_time": "1 day, 6:20:57", "remaining_time": "3:59:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9593, "total_steps": 10853, "loss": 0.1225, "learning_rate": 1.820086572566035e-07, "epoch": 0.8838623485511586, "percentage": 88.39, "elapsed_time": "1 day, 6:21:07", "remaining_time": "3:59:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9594, "total_steps": 10853, "loss": 0.1082, "learning_rate": 1.8172341989297154e-07, "epoch": 0.8839544847284286, "percentage": 88.4, "elapsed_time": "1 day, 6:21:19", "remaining_time": "3:59:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9595, "total_steps": 10853, "loss": 0.1082, "learning_rate": 1.814383977815698e-07, "epoch": 0.8840466209056986, "percentage": 88.41, "elapsed_time": "1 day, 6:21:28", "remaining_time": "3:58:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9596, "total_steps": 10853, "loss": 0.1237, "learning_rate": 1.8115359094886238e-07, "epoch": 0.8841387570829686, "percentage": 88.42, "elapsed_time": "1 day, 6:21:39", "remaining_time": "3:58:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9597, "total_steps": 10853, "loss": 0.1181, "learning_rate": 1.808689994212931e-07, "epoch": 0.8842308932602386, "percentage": 88.43, "elapsed_time": "1 day, 6:21:50", "remaining_time": "3:58:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9598, "total_steps": 10853, "loss": 0.1093, "learning_rate": 1.8058462322528698e-07, "epoch": 0.8843230294375086, "percentage": 88.44, "elapsed_time": "1 day, 6:22:00", "remaining_time": "3:58:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9599, "total_steps": 10853, "loss": 0.1191, "learning_rate": 1.8030046238724814e-07, "epoch": 0.8844151656147786, "percentage": 88.45, "elapsed_time": "1 day, 6:22:11", "remaining_time": "3:58:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9600, "total_steps": 10853, "loss": 0.1228, "learning_rate": 1.8001651693356131e-07, "epoch": 0.8845073017920486, "percentage": 88.45, "elapsed_time": "1 day, 6:22:22", "remaining_time": "3:57:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9601, "total_steps": 10853, "loss": 0.0991, "learning_rate": 1.797327868905907e-07, "epoch": 0.8845994379693186, "percentage": 88.46, "elapsed_time": "1 day, 6:22:33", "remaining_time": "3:57:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9602, "total_steps": 10853, "loss": 0.1168, "learning_rate": 1.7944927228467995e-07, "epoch": 0.8846915741465886, "percentage": 88.47, "elapsed_time": "1 day, 6:22:43", "remaining_time": "3:57:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9603, "total_steps": 10853, "loss": 0.1077, "learning_rate": 1.791659731421541e-07, "epoch": 0.8847837103238586, "percentage": 88.48, "elapsed_time": "1 day, 6:22:54", "remaining_time": "3:57:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9604, "total_steps": 10853, "loss": 0.1165, "learning_rate": 1.7888288948931799e-07, "epoch": 0.8848758465011287, "percentage": 88.49, "elapsed_time": "1 day, 6:23:03", "remaining_time": "3:57:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9605, "total_steps": 10853, "loss": 0.1154, "learning_rate": 1.786000213524547e-07, "epoch": 0.8849679826783987, "percentage": 88.5, "elapsed_time": "1 day, 6:23:14", "remaining_time": "3:56:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9606, "total_steps": 10853, "loss": 0.1077, "learning_rate": 1.783173687578299e-07, "epoch": 0.8850601188556687, "percentage": 88.51, "elapsed_time": "1 day, 6:23:25", "remaining_time": "3:56:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9607, "total_steps": 10853, "loss": 0.1249, "learning_rate": 1.7803493173168679e-07, "epoch": 0.8851522550329387, "percentage": 88.52, "elapsed_time": "1 day, 6:23:37", "remaining_time": "3:56:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9608, "total_steps": 10853, "loss": 0.1197, "learning_rate": 1.777527103002505e-07, "epoch": 0.8852443912102087, "percentage": 88.53, "elapsed_time": "1 day, 6:23:47", "remaining_time": "3:56:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9609, "total_steps": 10853, "loss": 0.1178, "learning_rate": 1.7747070448972475e-07, "epoch": 0.8853365273874787, "percentage": 88.54, "elapsed_time": "1 day, 6:23:57", "remaining_time": "3:56:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9610, "total_steps": 10853, "loss": 0.1295, "learning_rate": 1.7718891432629392e-07, "epoch": 0.8854286635647487, "percentage": 88.55, "elapsed_time": "1 day, 6:24:08", "remaining_time": "3:55:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9611, "total_steps": 10853, "loss": 0.1169, "learning_rate": 1.769073398361229e-07, "epoch": 0.8855207997420187, "percentage": 88.56, "elapsed_time": "1 day, 6:24:18", "remaining_time": "3:55:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9612, "total_steps": 10853, "loss": 0.1211, "learning_rate": 1.7662598104535522e-07, "epoch": 0.8856129359192887, "percentage": 88.57, "elapsed_time": "1 day, 6:24:28", "remaining_time": "3:55:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9613, "total_steps": 10853, "loss": 0.1217, "learning_rate": 1.7634483798011498e-07, "epoch": 0.8857050720965587, "percentage": 88.57, "elapsed_time": "1 day, 6:24:39", "remaining_time": "3:55:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9614, "total_steps": 10853, "loss": 0.1138, "learning_rate": 1.760639106665063e-07, "epoch": 0.8857972082738287, "percentage": 88.58, "elapsed_time": "1 day, 6:24:49", "remaining_time": "3:55:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9615, "total_steps": 10853, "loss": 0.1135, "learning_rate": 1.7578319913061387e-07, "epoch": 0.8858893444510987, "percentage": 88.59, "elapsed_time": "1 day, 6:24:59", "remaining_time": "3:54:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9616, "total_steps": 10853, "loss": 0.108, "learning_rate": 1.7550270339850212e-07, "epoch": 0.8859814806283687, "percentage": 88.6, "elapsed_time": "1 day, 6:25:10", "remaining_time": "3:54:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9617, "total_steps": 10853, "loss": 0.1213, "learning_rate": 1.7522242349621438e-07, "epoch": 0.8860736168056388, "percentage": 88.61, "elapsed_time": "1 day, 6:25:19", "remaining_time": "3:54:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9618, "total_steps": 10853, "loss": 0.1252, "learning_rate": 1.7494235944977427e-07, "epoch": 0.8861657529829088, "percentage": 88.62, "elapsed_time": "1 day, 6:25:31", "remaining_time": "3:54:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9619, "total_steps": 10853, "loss": 0.1088, "learning_rate": 1.7466251128518629e-07, "epoch": 0.8862578891601788, "percentage": 88.63, "elapsed_time": "1 day, 6:25:41", "remaining_time": "3:54:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9620, "total_steps": 10853, "loss": 0.1051, "learning_rate": 1.7438287902843465e-07, "epoch": 0.8863500253374488, "percentage": 88.64, "elapsed_time": "1 day, 6:25:50", "remaining_time": "3:54:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9621, "total_steps": 10853, "loss": 0.1175, "learning_rate": 1.7410346270548328e-07, "epoch": 0.8864421615147188, "percentage": 88.65, "elapsed_time": "1 day, 6:26:01", "remaining_time": "3:53:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9622, "total_steps": 10853, "loss": 0.1309, "learning_rate": 1.7382426234227562e-07, "epoch": 0.8865342976919888, "percentage": 88.66, "elapsed_time": "1 day, 6:26:13", "remaining_time": "3:53:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9623, "total_steps": 10853, "loss": 0.1191, "learning_rate": 1.735452779647351e-07, "epoch": 0.8866264338692588, "percentage": 88.67, "elapsed_time": "1 day, 6:26:25", "remaining_time": "3:53:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9624, "total_steps": 10853, "loss": 0.1308, "learning_rate": 1.7326650959876595e-07, "epoch": 0.8867185700465288, "percentage": 88.68, "elapsed_time": "1 day, 6:26:35", "remaining_time": "3:53:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9625, "total_steps": 10853, "loss": 0.1118, "learning_rate": 1.7298795727025226e-07, "epoch": 0.8868107062237988, "percentage": 88.69, "elapsed_time": "1 day, 6:26:46", "remaining_time": "3:53:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9626, "total_steps": 10853, "loss": 0.1202, "learning_rate": 1.7270962100505688e-07, "epoch": 0.8869028424010688, "percentage": 88.69, "elapsed_time": "1 day, 6:26:58", "remaining_time": "3:52:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9627, "total_steps": 10853, "loss": 0.1208, "learning_rate": 1.724315008290234e-07, "epoch": 0.8869949785783388, "percentage": 88.7, "elapsed_time": "1 day, 6:27:10", "remaining_time": "3:52:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9628, "total_steps": 10853, "loss": 0.1204, "learning_rate": 1.7215359676797604e-07, "epoch": 0.8870871147556088, "percentage": 88.71, "elapsed_time": "1 day, 6:27:21", "remaining_time": "3:52:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9629, "total_steps": 10853, "loss": 0.1137, "learning_rate": 1.7187590884771789e-07, "epoch": 0.8871792509328787, "percentage": 88.72, "elapsed_time": "1 day, 6:27:32", "remaining_time": "3:52:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9630, "total_steps": 10853, "loss": 0.1184, "learning_rate": 1.7159843709403156e-07, "epoch": 0.8872713871101487, "percentage": 88.73, "elapsed_time": "1 day, 6:27:43", "remaining_time": "3:52:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9631, "total_steps": 10853, "loss": 0.1182, "learning_rate": 1.7132118153268097e-07, "epoch": 0.8873635232874189, "percentage": 88.74, "elapsed_time": "1 day, 6:27:54", "remaining_time": "3:51:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9632, "total_steps": 10853, "loss": 0.1161, "learning_rate": 1.7104414218940934e-07, "epoch": 0.8874556594646889, "percentage": 88.75, "elapsed_time": "1 day, 6:28:05", "remaining_time": "3:51:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9633, "total_steps": 10853, "loss": 0.1063, "learning_rate": 1.7076731908994032e-07, "epoch": 0.8875477956419588, "percentage": 88.76, "elapsed_time": "1 day, 6:28:16", "remaining_time": "3:51:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9634, "total_steps": 10853, "loss": 0.1297, "learning_rate": 1.704907122599761e-07, "epoch": 0.8876399318192288, "percentage": 88.77, "elapsed_time": "1 day, 6:28:27", "remaining_time": "3:51:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9635, "total_steps": 10853, "loss": 0.1123, "learning_rate": 1.7021432172519974e-07, "epoch": 0.8877320679964988, "percentage": 88.78, "elapsed_time": "1 day, 6:28:37", "remaining_time": "3:51:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9636, "total_steps": 10853, "loss": 0.115, "learning_rate": 1.6993814751127435e-07, "epoch": 0.8878242041737688, "percentage": 88.79, "elapsed_time": "1 day, 6:28:49", "remaining_time": "3:50:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9637, "total_steps": 10853, "loss": 0.103, "learning_rate": 1.69662189643843e-07, "epoch": 0.8879163403510388, "percentage": 88.8, "elapsed_time": "1 day, 6:28:58", "remaining_time": "3:50:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9638, "total_steps": 10853, "loss": 0.1093, "learning_rate": 1.69386448148528e-07, "epoch": 0.8880084765283088, "percentage": 88.8, "elapsed_time": "1 day, 6:29:07", "remaining_time": "3:50:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9639, "total_steps": 10853, "loss": 0.1155, "learning_rate": 1.691109230509322e-07, "epoch": 0.8881006127055788, "percentage": 88.81, "elapsed_time": "1 day, 6:29:16", "remaining_time": "3:50:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9640, "total_steps": 10853, "loss": 0.1164, "learning_rate": 1.6883561437663788e-07, "epoch": 0.8881927488828488, "percentage": 88.82, "elapsed_time": "1 day, 6:29:26", "remaining_time": "3:50:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9641, "total_steps": 10853, "loss": 0.1115, "learning_rate": 1.6856052215120794e-07, "epoch": 0.8882848850601188, "percentage": 88.83, "elapsed_time": "1 day, 6:29:37", "remaining_time": "3:50:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9642, "total_steps": 10853, "loss": 0.1166, "learning_rate": 1.682856464001839e-07, "epoch": 0.8883770212373888, "percentage": 88.84, "elapsed_time": "1 day, 6:29:47", "remaining_time": "3:49:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9643, "total_steps": 10853, "loss": 0.1115, "learning_rate": 1.680109871490887e-07, "epoch": 0.8884691574146588, "percentage": 88.85, "elapsed_time": "1 day, 6:29:56", "remaining_time": "3:49:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9644, "total_steps": 10853, "loss": 0.1105, "learning_rate": 1.6773654442342468e-07, "epoch": 0.8885612935919289, "percentage": 88.86, "elapsed_time": "1 day, 6:30:07", "remaining_time": "3:49:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9645, "total_steps": 10853, "loss": 0.1284, "learning_rate": 1.6746231824867316e-07, "epoch": 0.8886534297691989, "percentage": 88.87, "elapsed_time": "1 day, 6:30:19", "remaining_time": "3:49:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9646, "total_steps": 10853, "loss": 0.1139, "learning_rate": 1.671883086502968e-07, "epoch": 0.8887455659464689, "percentage": 88.88, "elapsed_time": "1 day, 6:30:29", "remaining_time": "3:49:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9647, "total_steps": 10853, "loss": 0.1339, "learning_rate": 1.669145156537366e-07, "epoch": 0.8888377021237389, "percentage": 88.89, "elapsed_time": "1 day, 6:30:41", "remaining_time": "3:48:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9648, "total_steps": 10853, "loss": 0.1203, "learning_rate": 1.6664093928441456e-07, "epoch": 0.8889298383010089, "percentage": 88.9, "elapsed_time": "1 day, 6:30:51", "remaining_time": "3:48:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9649, "total_steps": 10853, "loss": 0.12, "learning_rate": 1.6636757956773302e-07, "epoch": 0.8890219744782789, "percentage": 88.91, "elapsed_time": "1 day, 6:31:02", "remaining_time": "3:48:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9650, "total_steps": 10853, "loss": 0.1227, "learning_rate": 1.6609443652907287e-07, "epoch": 0.8891141106555489, "percentage": 88.92, "elapsed_time": "1 day, 6:31:12", "remaining_time": "3:48:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9651, "total_steps": 10853, "loss": 0.1299, "learning_rate": 1.6582151019379517e-07, "epoch": 0.8892062468328189, "percentage": 88.92, "elapsed_time": "1 day, 6:31:22", "remaining_time": "3:48:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9652, "total_steps": 10853, "loss": 0.1126, "learning_rate": 1.655488005872413e-07, "epoch": 0.8892983830100889, "percentage": 88.93, "elapsed_time": "1 day, 6:31:32", "remaining_time": "3:47:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9653, "total_steps": 10853, "loss": 0.1178, "learning_rate": 1.6527630773473248e-07, "epoch": 0.8893905191873589, "percentage": 88.94, "elapsed_time": "1 day, 6:31:43", "remaining_time": "3:47:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9654, "total_steps": 10853, "loss": 0.1246, "learning_rate": 1.650040316615703e-07, "epoch": 0.8894826553646289, "percentage": 88.95, "elapsed_time": "1 day, 6:31:54", "remaining_time": "3:47:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9655, "total_steps": 10853, "loss": 0.124, "learning_rate": 1.647319723930349e-07, "epoch": 0.8895747915418989, "percentage": 88.96, "elapsed_time": "1 day, 6:32:05", "remaining_time": "3:47:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9656, "total_steps": 10853, "loss": 0.1252, "learning_rate": 1.6446012995438688e-07, "epoch": 0.8896669277191689, "percentage": 88.97, "elapsed_time": "1 day, 6:32:15", "remaining_time": "3:47:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9657, "total_steps": 10853, "loss": 0.1311, "learning_rate": 1.6418850437086715e-07, "epoch": 0.8897590638964389, "percentage": 88.98, "elapsed_time": "1 day, 6:32:27", "remaining_time": "3:46:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9658, "total_steps": 10853, "loss": 0.1232, "learning_rate": 1.6391709566769664e-07, "epoch": 0.889851200073709, "percentage": 88.99, "elapsed_time": "1 day, 6:32:37", "remaining_time": "3:46:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9659, "total_steps": 10853, "loss": 0.1053, "learning_rate": 1.6364590387007468e-07, "epoch": 0.889943336250979, "percentage": 89.0, "elapsed_time": "1 day, 6:32:48", "remaining_time": "3:46:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9660, "total_steps": 10853, "loss": 0.1118, "learning_rate": 1.6337492900318246e-07, "epoch": 0.890035472428249, "percentage": 89.01, "elapsed_time": "1 day, 6:33:00", "remaining_time": "3:46:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9661, "total_steps": 10853, "loss": 0.11, "learning_rate": 1.6310417109217906e-07, "epoch": 0.890127608605519, "percentage": 89.02, "elapsed_time": "1 day, 6:33:11", "remaining_time": "3:46:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9662, "total_steps": 10853, "loss": 0.1077, "learning_rate": 1.6283363016220548e-07, "epoch": 0.890219744782789, "percentage": 89.03, "elapsed_time": "1 day, 6:33:21", "remaining_time": "3:45:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9663, "total_steps": 10853, "loss": 0.126, "learning_rate": 1.6256330623838024e-07, "epoch": 0.890311880960059, "percentage": 89.04, "elapsed_time": "1 day, 6:33:32", "remaining_time": "3:45:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9664, "total_steps": 10853, "loss": 0.108, "learning_rate": 1.6229319934580378e-07, "epoch": 0.890404017137329, "percentage": 89.04, "elapsed_time": "1 day, 6:33:44", "remaining_time": "3:45:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9665, "total_steps": 10853, "loss": 0.1216, "learning_rate": 1.6202330950955552e-07, "epoch": 0.890496153314599, "percentage": 89.05, "elapsed_time": "1 day, 6:33:55", "remaining_time": "3:45:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9666, "total_steps": 10853, "loss": 0.1239, "learning_rate": 1.6175363675469485e-07, "epoch": 0.890588289491869, "percentage": 89.06, "elapsed_time": "1 day, 6:34:05", "remaining_time": "3:45:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9667, "total_steps": 10853, "loss": 0.1171, "learning_rate": 1.6148418110626008e-07, "epoch": 0.890680425669139, "percentage": 89.07, "elapsed_time": "1 day, 6:34:16", "remaining_time": "3:45:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9668, "total_steps": 10853, "loss": 0.1137, "learning_rate": 1.612149425892709e-07, "epoch": 0.890772561846409, "percentage": 89.08, "elapsed_time": "1 day, 6:34:27", "remaining_time": "3:44:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9669, "total_steps": 10853, "loss": 0.1142, "learning_rate": 1.6094592122872594e-07, "epoch": 0.890864698023679, "percentage": 89.09, "elapsed_time": "1 day, 6:34:37", "remaining_time": "3:44:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9670, "total_steps": 10853, "loss": 0.1146, "learning_rate": 1.6067711704960408e-07, "epoch": 0.890956834200949, "percentage": 89.1, "elapsed_time": "1 day, 6:34:48", "remaining_time": "3:44:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9671, "total_steps": 10853, "loss": 0.1258, "learning_rate": 1.60408530076864e-07, "epoch": 0.8910489703782191, "percentage": 89.11, "elapsed_time": "1 day, 6:34:59", "remaining_time": "3:44:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9672, "total_steps": 10853, "loss": 0.1125, "learning_rate": 1.6014016033544329e-07, "epoch": 0.8911411065554891, "percentage": 89.12, "elapsed_time": "1 day, 6:35:11", "remaining_time": "3:44:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9673, "total_steps": 10853, "loss": 0.1134, "learning_rate": 1.5987200785026024e-07, "epoch": 0.8912332427327591, "percentage": 89.13, "elapsed_time": "1 day, 6:35:21", "remaining_time": "3:43:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9674, "total_steps": 10853, "loss": 0.1234, "learning_rate": 1.5960407264621335e-07, "epoch": 0.891325378910029, "percentage": 89.14, "elapsed_time": "1 day, 6:35:33", "remaining_time": "3:43:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9675, "total_steps": 10853, "loss": 0.1207, "learning_rate": 1.5933635474818048e-07, "epoch": 0.891417515087299, "percentage": 89.15, "elapsed_time": "1 day, 6:35:44", "remaining_time": "3:43:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9676, "total_steps": 10853, "loss": 0.1169, "learning_rate": 1.5906885418101897e-07, "epoch": 0.891509651264569, "percentage": 89.16, "elapsed_time": "1 day, 6:35:54", "remaining_time": "3:43:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9677, "total_steps": 10853, "loss": 0.1155, "learning_rate": 1.588015709695659e-07, "epoch": 0.891601787441839, "percentage": 89.16, "elapsed_time": "1 day, 6:36:05", "remaining_time": "3:43:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9678, "total_steps": 10853, "loss": 0.112, "learning_rate": 1.5853450513863887e-07, "epoch": 0.891693923619109, "percentage": 89.17, "elapsed_time": "1 day, 6:36:17", "remaining_time": "3:42:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9679, "total_steps": 10853, "loss": 0.1149, "learning_rate": 1.582676567130356e-07, "epoch": 0.891786059796379, "percentage": 89.18, "elapsed_time": "1 day, 6:36:27", "remaining_time": "3:42:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9680, "total_steps": 10853, "loss": 0.1197, "learning_rate": 1.5800102571753185e-07, "epoch": 0.891878195973649, "percentage": 89.19, "elapsed_time": "1 day, 6:36:38", "remaining_time": "3:42:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9681, "total_steps": 10853, "loss": 0.118, "learning_rate": 1.5773461217688552e-07, "epoch": 0.891970332150919, "percentage": 89.2, "elapsed_time": "1 day, 6:36:49", "remaining_time": "3:42:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9682, "total_steps": 10853, "loss": 0.1155, "learning_rate": 1.5746841611583185e-07, "epoch": 0.892062468328189, "percentage": 89.21, "elapsed_time": "1 day, 6:37:01", "remaining_time": "3:42:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9683, "total_steps": 10853, "loss": 0.1078, "learning_rate": 1.572024375590883e-07, "epoch": 0.892154604505459, "percentage": 89.22, "elapsed_time": "1 day, 6:37:12", "remaining_time": "3:41:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9684, "total_steps": 10853, "loss": 0.1154, "learning_rate": 1.5693667653135043e-07, "epoch": 0.892246740682729, "percentage": 89.23, "elapsed_time": "1 day, 6:37:22", "remaining_time": "3:41:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9685, "total_steps": 10853, "loss": 0.1133, "learning_rate": 1.56671133057294e-07, "epoch": 0.8923388768599991, "percentage": 89.24, "elapsed_time": "1 day, 6:37:34", "remaining_time": "3:41:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9686, "total_steps": 10853, "loss": 0.1101, "learning_rate": 1.5640580716157566e-07, "epoch": 0.8924310130372691, "percentage": 89.25, "elapsed_time": "1 day, 6:37:45", "remaining_time": "3:41:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9687, "total_steps": 10853, "loss": 0.1093, "learning_rate": 1.5614069886883021e-07, "epoch": 0.8925231492145391, "percentage": 89.26, "elapsed_time": "1 day, 6:37:55", "remaining_time": "3:41:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9688, "total_steps": 10853, "loss": 0.1294, "learning_rate": 1.5587580820367294e-07, "epoch": 0.8926152853918091, "percentage": 89.27, "elapsed_time": "1 day, 6:38:08", "remaining_time": "3:41:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9689, "total_steps": 10853, "loss": 0.1232, "learning_rate": 1.5561113519069887e-07, "epoch": 0.8927074215690791, "percentage": 89.27, "elapsed_time": "1 day, 6:38:19", "remaining_time": "3:40:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9690, "total_steps": 10853, "loss": 0.1154, "learning_rate": 1.5534667985448336e-07, "epoch": 0.8927995577463491, "percentage": 89.28, "elapsed_time": "1 day, 6:38:29", "remaining_time": "3:40:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9691, "total_steps": 10853, "loss": 0.1114, "learning_rate": 1.5508244221958125e-07, "epoch": 0.8928916939236191, "percentage": 89.29, "elapsed_time": "1 day, 6:38:41", "remaining_time": "3:40:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9692, "total_steps": 10853, "loss": 0.1236, "learning_rate": 1.5481842231052702e-07, "epoch": 0.8929838301008891, "percentage": 89.3, "elapsed_time": "1 day, 6:38:52", "remaining_time": "3:40:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9693, "total_steps": 10853, "loss": 0.0956, "learning_rate": 1.5455462015183388e-07, "epoch": 0.8930759662781591, "percentage": 89.31, "elapsed_time": "1 day, 6:39:01", "remaining_time": "3:40:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9694, "total_steps": 10853, "loss": 0.1096, "learning_rate": 1.5429103576799692e-07, "epoch": 0.8931681024554291, "percentage": 89.32, "elapsed_time": "1 day, 6:39:13", "remaining_time": "3:39:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9695, "total_steps": 10853, "loss": 0.1274, "learning_rate": 1.540276691834902e-07, "epoch": 0.8932602386326991, "percentage": 89.33, "elapsed_time": "1 day, 6:39:25", "remaining_time": "3:39:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9696, "total_steps": 10853, "loss": 0.1311, "learning_rate": 1.537645204227664e-07, "epoch": 0.8933523748099691, "percentage": 89.34, "elapsed_time": "1 day, 6:39:36", "remaining_time": "3:39:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9697, "total_steps": 10853, "loss": 0.1183, "learning_rate": 1.5350158951025957e-07, "epoch": 0.8934445109872391, "percentage": 89.35, "elapsed_time": "1 day, 6:39:47", "remaining_time": "3:39:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9698, "total_steps": 10853, "loss": 0.1249, "learning_rate": 1.5323887647038266e-07, "epoch": 0.8935366471645091, "percentage": 89.36, "elapsed_time": "1 day, 6:39:58", "remaining_time": "3:39:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9699, "total_steps": 10853, "loss": 0.1138, "learning_rate": 1.5297638132752867e-07, "epoch": 0.8936287833417792, "percentage": 89.37, "elapsed_time": "1 day, 6:40:07", "remaining_time": "3:38:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9700, "total_steps": 10853, "loss": 0.1103, "learning_rate": 1.5271410410607008e-07, "epoch": 0.8937209195190492, "percentage": 89.38, "elapsed_time": "1 day, 6:40:19", "remaining_time": "3:38:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9701, "total_steps": 10853, "loss": 0.1194, "learning_rate": 1.5245204483035958e-07, "epoch": 0.8938130556963192, "percentage": 89.39, "elapsed_time": "1 day, 6:40:29", "remaining_time": "3:38:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9702, "total_steps": 10853, "loss": 0.1208, "learning_rate": 1.5219020352472914e-07, "epoch": 0.8939051918735892, "percentage": 89.39, "elapsed_time": "1 day, 6:40:39", "remaining_time": "3:38:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9703, "total_steps": 10853, "loss": 0.113, "learning_rate": 1.519285802134915e-07, "epoch": 0.8939973280508592, "percentage": 89.4, "elapsed_time": "1 day, 6:40:51", "remaining_time": "3:38:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9704, "total_steps": 10853, "loss": 0.1217, "learning_rate": 1.5166717492093808e-07, "epoch": 0.8940894642281292, "percentage": 89.41, "elapsed_time": "1 day, 6:41:01", "remaining_time": "3:37:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9705, "total_steps": 10853, "loss": 0.1104, "learning_rate": 1.5140598767133947e-07, "epoch": 0.8941816004053992, "percentage": 89.42, "elapsed_time": "1 day, 6:41:13", "remaining_time": "3:37:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9706, "total_steps": 10853, "loss": 0.1129, "learning_rate": 1.5114501848894792e-07, "epoch": 0.8942737365826692, "percentage": 89.43, "elapsed_time": "1 day, 6:41:24", "remaining_time": "3:37:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9707, "total_steps": 10853, "loss": 0.1195, "learning_rate": 1.5088426739799405e-07, "epoch": 0.8943658727599392, "percentage": 89.44, "elapsed_time": "1 day, 6:41:35", "remaining_time": "3:37:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9708, "total_steps": 10853, "loss": 0.1222, "learning_rate": 1.5062373442268908e-07, "epoch": 0.8944580089372092, "percentage": 89.45, "elapsed_time": "1 day, 6:41:46", "remaining_time": "3:37:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9709, "total_steps": 10853, "loss": 0.1151, "learning_rate": 1.5036341958722334e-07, "epoch": 0.8945501451144792, "percentage": 89.46, "elapsed_time": "1 day, 6:41:57", "remaining_time": "3:37:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9710, "total_steps": 10853, "loss": 0.1205, "learning_rate": 1.501033229157667e-07, "epoch": 0.8946422812917492, "percentage": 89.47, "elapsed_time": "1 day, 6:42:08", "remaining_time": "3:36:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9711, "total_steps": 10853, "loss": 0.1126, "learning_rate": 1.4984344443246924e-07, "epoch": 0.8947344174690192, "percentage": 89.48, "elapsed_time": "1 day, 6:42:18", "remaining_time": "3:36:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9712, "total_steps": 10853, "loss": 0.0968, "learning_rate": 1.495837841614614e-07, "epoch": 0.8948265536462893, "percentage": 89.49, "elapsed_time": "1 day, 6:42:28", "remaining_time": "3:36:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9713, "total_steps": 10853, "loss": 0.1116, "learning_rate": 1.493243421268517e-07, "epoch": 0.8949186898235593, "percentage": 89.5, "elapsed_time": "1 day, 6:42:38", "remaining_time": "3:36:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9714, "total_steps": 10853, "loss": 0.1048, "learning_rate": 1.4906511835273003e-07, "epoch": 0.8950108260008293, "percentage": 89.51, "elapsed_time": "1 day, 6:42:49", "remaining_time": "3:36:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9715, "total_steps": 10853, "loss": 0.122, "learning_rate": 1.4880611286316487e-07, "epoch": 0.8951029621780993, "percentage": 89.51, "elapsed_time": "1 day, 6:43:00", "remaining_time": "3:35:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9716, "total_steps": 10853, "loss": 0.1316, "learning_rate": 1.4854732568220566e-07, "epoch": 0.8951950983553693, "percentage": 89.52, "elapsed_time": "1 day, 6:43:10", "remaining_time": "3:35:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9717, "total_steps": 10853, "loss": 0.1169, "learning_rate": 1.4828875683387977e-07, "epoch": 0.8952872345326393, "percentage": 89.53, "elapsed_time": "1 day, 6:43:20", "remaining_time": "3:35:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9718, "total_steps": 10853, "loss": 0.1094, "learning_rate": 1.4803040634219612e-07, "epoch": 0.8953793707099093, "percentage": 89.54, "elapsed_time": "1 day, 6:43:31", "remaining_time": "3:35:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9719, "total_steps": 10853, "loss": 0.12, "learning_rate": 1.4777227423114271e-07, "epoch": 0.8954715068871792, "percentage": 89.55, "elapsed_time": "1 day, 6:43:42", "remaining_time": "3:35:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9720, "total_steps": 10853, "loss": 0.1258, "learning_rate": 1.4751436052468677e-07, "epoch": 0.8955636430644492, "percentage": 89.56, "elapsed_time": "1 day, 6:43:50", "remaining_time": "3:34:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9721, "total_steps": 10853, "loss": 0.1086, "learning_rate": 1.4725666524677496e-07, "epoch": 0.8956557792417192, "percentage": 89.57, "elapsed_time": "1 day, 6:44:01", "remaining_time": "3:34:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9722, "total_steps": 10853, "loss": 0.1211, "learning_rate": 1.4699918842133536e-07, "epoch": 0.8957479154189892, "percentage": 89.58, "elapsed_time": "1 day, 6:44:11", "remaining_time": "3:34:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9723, "total_steps": 10853, "loss": 0.1035, "learning_rate": 1.4674193007227416e-07, "epoch": 0.8958400515962592, "percentage": 89.59, "elapsed_time": "1 day, 6:44:22", "remaining_time": "3:34:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9724, "total_steps": 10853, "loss": 0.1188, "learning_rate": 1.464848902234786e-07, "epoch": 0.8959321877735292, "percentage": 89.6, "elapsed_time": "1 day, 6:44:32", "remaining_time": "3:34:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9725, "total_steps": 10853, "loss": 0.1209, "learning_rate": 1.4622806889881407e-07, "epoch": 0.8960243239507992, "percentage": 89.61, "elapsed_time": "1 day, 6:44:43", "remaining_time": "3:33:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9726, "total_steps": 10853, "loss": 0.1165, "learning_rate": 1.4597146612212622e-07, "epoch": 0.8961164601280693, "percentage": 89.62, "elapsed_time": "1 day, 6:44:54", "remaining_time": "3:33:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9727, "total_steps": 10853, "loss": 0.123, "learning_rate": 1.457150819172412e-07, "epoch": 0.8962085963053393, "percentage": 89.62, "elapsed_time": "1 day, 6:45:05", "remaining_time": "3:33:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9728, "total_steps": 10853, "loss": 0.1088, "learning_rate": 1.454589163079645e-07, "epoch": 0.8963007324826093, "percentage": 89.63, "elapsed_time": "1 day, 6:45:16", "remaining_time": "3:33:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9729, "total_steps": 10853, "loss": 0.112, "learning_rate": 1.4520296931808064e-07, "epoch": 0.8963928686598793, "percentage": 89.64, "elapsed_time": "1 day, 6:45:26", "remaining_time": "3:33:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9730, "total_steps": 10853, "loss": 0.1236, "learning_rate": 1.449472409713548e-07, "epoch": 0.8964850048371493, "percentage": 89.65, "elapsed_time": "1 day, 6:45:37", "remaining_time": "3:33:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9731, "total_steps": 10853, "loss": 0.1181, "learning_rate": 1.4469173129153052e-07, "epoch": 0.8965771410144193, "percentage": 89.66, "elapsed_time": "1 day, 6:45:47", "remaining_time": "3:32:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9732, "total_steps": 10853, "loss": 0.1305, "learning_rate": 1.4443644030233268e-07, "epoch": 0.8966692771916893, "percentage": 89.67, "elapsed_time": "1 day, 6:45:59", "remaining_time": "3:32:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9733, "total_steps": 10853, "loss": 0.1068, "learning_rate": 1.4418136802746507e-07, "epoch": 0.8967614133689593, "percentage": 89.68, "elapsed_time": "1 day, 6:46:10", "remaining_time": "3:32:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9734, "total_steps": 10853, "loss": 0.1221, "learning_rate": 1.4392651449061075e-07, "epoch": 0.8968535495462293, "percentage": 89.69, "elapsed_time": "1 day, 6:46:20", "remaining_time": "3:32:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9735, "total_steps": 10853, "loss": 0.1085, "learning_rate": 1.4367187971543352e-07, "epoch": 0.8969456857234993, "percentage": 89.7, "elapsed_time": "1 day, 6:46:31", "remaining_time": "3:32:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9736, "total_steps": 10853, "loss": 0.0992, "learning_rate": 1.434174637255753e-07, "epoch": 0.8970378219007693, "percentage": 89.71, "elapsed_time": "1 day, 6:46:42", "remaining_time": "3:31:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9737, "total_steps": 10853, "loss": 0.128, "learning_rate": 1.4316326654465972e-07, "epoch": 0.8971299580780393, "percentage": 89.72, "elapsed_time": "1 day, 6:46:53", "remaining_time": "3:31:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9738, "total_steps": 10853, "loss": 0.1228, "learning_rate": 1.429092881962882e-07, "epoch": 0.8972220942553093, "percentage": 89.73, "elapsed_time": "1 day, 6:47:04", "remaining_time": "3:31:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9739, "total_steps": 10853, "loss": 0.1189, "learning_rate": 1.4265552870404265e-07, "epoch": 0.8973142304325794, "percentage": 89.74, "elapsed_time": "1 day, 6:47:16", "remaining_time": "3:31:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9740, "total_steps": 10853, "loss": 0.1261, "learning_rate": 1.4240198809148537e-07, "epoch": 0.8974063666098494, "percentage": 89.74, "elapsed_time": "1 day, 6:47:26", "remaining_time": "3:31:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9741, "total_steps": 10853, "loss": 0.1085, "learning_rate": 1.421486663821575e-07, "epoch": 0.8974985027871194, "percentage": 89.75, "elapsed_time": "1 day, 6:47:36", "remaining_time": "3:30:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9742, "total_steps": 10853, "loss": 0.1145, "learning_rate": 1.4189556359957917e-07, "epoch": 0.8975906389643894, "percentage": 89.76, "elapsed_time": "1 day, 6:47:46", "remaining_time": "3:30:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9743, "total_steps": 10853, "loss": 0.1196, "learning_rate": 1.4164267976725154e-07, "epoch": 0.8976827751416594, "percentage": 89.77, "elapsed_time": "1 day, 6:47:57", "remaining_time": "3:30:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9744, "total_steps": 10853, "loss": 0.1232, "learning_rate": 1.41390014908655e-07, "epoch": 0.8977749113189294, "percentage": 89.78, "elapsed_time": "1 day, 6:48:08", "remaining_time": "3:30:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9745, "total_steps": 10853, "loss": 0.1113, "learning_rate": 1.4113756904724967e-07, "epoch": 0.8978670474961994, "percentage": 89.79, "elapsed_time": "1 day, 6:48:17", "remaining_time": "3:30:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9746, "total_steps": 10853, "loss": 0.124, "learning_rate": 1.4088534220647487e-07, "epoch": 0.8979591836734694, "percentage": 89.8, "elapsed_time": "1 day, 6:48:28", "remaining_time": "3:29:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9747, "total_steps": 10853, "loss": 0.1108, "learning_rate": 1.4063333440974963e-07, "epoch": 0.8980513198507394, "percentage": 89.81, "elapsed_time": "1 day, 6:48:41", "remaining_time": "3:29:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9748, "total_steps": 10853, "loss": 0.1071, "learning_rate": 1.403815456804733e-07, "epoch": 0.8981434560280094, "percentage": 89.82, "elapsed_time": "1 day, 6:48:51", "remaining_time": "3:29:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9749, "total_steps": 10853, "loss": 0.1143, "learning_rate": 1.4012997604202466e-07, "epoch": 0.8982355922052794, "percentage": 89.83, "elapsed_time": "1 day, 6:49:02", "remaining_time": "3:29:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9750, "total_steps": 10853, "loss": 0.1079, "learning_rate": 1.3987862551776143e-07, "epoch": 0.8983277283825494, "percentage": 89.84, "elapsed_time": "1 day, 6:49:12", "remaining_time": "3:29:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9751, "total_steps": 10853, "loss": 0.1136, "learning_rate": 1.3962749413102216e-07, "epoch": 0.8984198645598194, "percentage": 89.85, "elapsed_time": "1 day, 6:49:22", "remaining_time": "3:29:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9752, "total_steps": 10853, "loss": 0.1209, "learning_rate": 1.3937658190512377e-07, "epoch": 0.8985120007370894, "percentage": 89.86, "elapsed_time": "1 day, 6:49:32", "remaining_time": "3:28:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9753, "total_steps": 10853, "loss": 0.114, "learning_rate": 1.3912588886336397e-07, "epoch": 0.8986041369143595, "percentage": 89.86, "elapsed_time": "1 day, 6:49:44", "remaining_time": "3:28:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9754, "total_steps": 10853, "loss": 0.1234, "learning_rate": 1.388754150290192e-07, "epoch": 0.8986962730916295, "percentage": 89.87, "elapsed_time": "1 day, 6:49:55", "remaining_time": "3:28:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9755, "total_steps": 10853, "loss": 0.1042, "learning_rate": 1.3862516042534634e-07, "epoch": 0.8987884092688995, "percentage": 89.88, "elapsed_time": "1 day, 6:50:05", "remaining_time": "3:28:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9756, "total_steps": 10853, "loss": 0.1192, "learning_rate": 1.3837512507558188e-07, "epoch": 0.8988805454461695, "percentage": 89.89, "elapsed_time": "1 day, 6:50:16", "remaining_time": "3:28:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9757, "total_steps": 10853, "loss": 0.1131, "learning_rate": 1.3812530900294107e-07, "epoch": 0.8989726816234395, "percentage": 89.9, "elapsed_time": "1 day, 6:50:27", "remaining_time": "3:27:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9758, "total_steps": 10853, "loss": 0.1141, "learning_rate": 1.37875712230619e-07, "epoch": 0.8990648178007095, "percentage": 89.91, "elapsed_time": "1 day, 6:50:38", "remaining_time": "3:27:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9759, "total_steps": 10853, "loss": 0.1255, "learning_rate": 1.376263347817916e-07, "epoch": 0.8991569539779795, "percentage": 89.92, "elapsed_time": "1 day, 6:50:49", "remaining_time": "3:27:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9760, "total_steps": 10853, "loss": 0.1206, "learning_rate": 1.3737717667961308e-07, "epoch": 0.8992490901552495, "percentage": 89.93, "elapsed_time": "1 day, 6:50:59", "remaining_time": "3:27:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9761, "total_steps": 10853, "loss": 0.1116, "learning_rate": 1.371282379472183e-07, "epoch": 0.8993412263325195, "percentage": 89.94, "elapsed_time": "1 day, 6:51:10", "remaining_time": "3:27:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9762, "total_steps": 10853, "loss": 0.1131, "learning_rate": 1.3687951860772098e-07, "epoch": 0.8994333625097894, "percentage": 89.95, "elapsed_time": "1 day, 6:51:20", "remaining_time": "3:26:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9763, "total_steps": 10853, "loss": 0.1157, "learning_rate": 1.366310186842143e-07, "epoch": 0.8995254986870594, "percentage": 89.96, "elapsed_time": "1 day, 6:51:31", "remaining_time": "3:26:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9764, "total_steps": 10853, "loss": 0.1205, "learning_rate": 1.3638273819977205e-07, "epoch": 0.8996176348643294, "percentage": 89.97, "elapsed_time": "1 day, 6:51:42", "remaining_time": "3:26:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9765, "total_steps": 10853, "loss": 0.1234, "learning_rate": 1.3613467717744661e-07, "epoch": 0.8997097710415994, "percentage": 89.98, "elapsed_time": "1 day, 6:51:52", "remaining_time": "3:26:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9766, "total_steps": 10853, "loss": 0.122, "learning_rate": 1.358868356402715e-07, "epoch": 0.8998019072188694, "percentage": 89.98, "elapsed_time": "1 day, 6:52:02", "remaining_time": "3:26:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9767, "total_steps": 10853, "loss": 0.1273, "learning_rate": 1.3563921361125804e-07, "epoch": 0.8998940433961395, "percentage": 89.99, "elapsed_time": "1 day, 6:52:12", "remaining_time": "3:25:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9768, "total_steps": 10853, "loss": 0.1182, "learning_rate": 1.3539181111339754e-07, "epoch": 0.8999861795734095, "percentage": 90.0, "elapsed_time": "1 day, 6:52:22", "remaining_time": "3:25:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9769, "total_steps": 10853, "loss": 0.106, "learning_rate": 1.3514462816966195e-07, "epoch": 0.9000783157506795, "percentage": 90.01, "elapsed_time": "1 day, 6:52:34", "remaining_time": "3:25:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9770, "total_steps": 10853, "loss": 0.1252, "learning_rate": 1.3489766480300232e-07, "epoch": 0.9001704519279495, "percentage": 90.02, "elapsed_time": "1 day, 6:52:45", "remaining_time": "3:25:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9771, "total_steps": 10853, "loss": 0.1209, "learning_rate": 1.3465092103634892e-07, "epoch": 0.9002625881052195, "percentage": 90.03, "elapsed_time": "1 day, 6:52:55", "remaining_time": "3:25:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9772, "total_steps": 10853, "loss": 0.1249, "learning_rate": 1.3440439689261232e-07, "epoch": 0.9003547242824895, "percentage": 90.04, "elapsed_time": "1 day, 6:53:05", "remaining_time": "3:24:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9773, "total_steps": 10853, "loss": 0.1133, "learning_rate": 1.3415809239468198e-07, "epoch": 0.9004468604597595, "percentage": 90.05, "elapsed_time": "1 day, 6:53:15", "remaining_time": "3:24:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9774, "total_steps": 10853, "loss": 0.1198, "learning_rate": 1.3391200756542738e-07, "epoch": 0.9005389966370295, "percentage": 90.06, "elapsed_time": "1 day, 6:53:25", "remaining_time": "3:24:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9775, "total_steps": 10853, "loss": 0.1186, "learning_rate": 1.336661424276972e-07, "epoch": 0.9006311328142995, "percentage": 90.07, "elapsed_time": "1 day, 6:53:36", "remaining_time": "3:24:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9776, "total_steps": 10853, "loss": 0.112, "learning_rate": 1.334204970043204e-07, "epoch": 0.9007232689915695, "percentage": 90.08, "elapsed_time": "1 day, 6:53:47", "remaining_time": "3:24:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9777, "total_steps": 10853, "loss": 0.1186, "learning_rate": 1.331750713181054e-07, "epoch": 0.9008154051688395, "percentage": 90.09, "elapsed_time": "1 day, 6:53:58", "remaining_time": "3:24:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9778, "total_steps": 10853, "loss": 0.1217, "learning_rate": 1.3292986539184011e-07, "epoch": 0.9009075413461095, "percentage": 90.09, "elapsed_time": "1 day, 6:54:08", "remaining_time": "3:23:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9779, "total_steps": 10853, "loss": 0.1181, "learning_rate": 1.32684879248291e-07, "epoch": 0.9009996775233795, "percentage": 90.1, "elapsed_time": "1 day, 6:54:20", "remaining_time": "3:23:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9780, "total_steps": 10853, "loss": 0.113, "learning_rate": 1.324401129102057e-07, "epoch": 0.9010918137006496, "percentage": 90.11, "elapsed_time": "1 day, 6:54:31", "remaining_time": "3:23:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9781, "total_steps": 10853, "loss": 0.1229, "learning_rate": 1.321955664003105e-07, "epoch": 0.9011839498779196, "percentage": 90.12, "elapsed_time": "1 day, 6:54:41", "remaining_time": "3:23:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9782, "total_steps": 10853, "loss": 0.109, "learning_rate": 1.3195123974131252e-07, "epoch": 0.9012760860551896, "percentage": 90.13, "elapsed_time": "1 day, 6:54:51", "remaining_time": "3:23:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9783, "total_steps": 10853, "loss": 0.1244, "learning_rate": 1.317071329558961e-07, "epoch": 0.9013682222324596, "percentage": 90.14, "elapsed_time": "1 day, 6:55:02", "remaining_time": "3:22:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9784, "total_steps": 10853, "loss": 0.1171, "learning_rate": 1.3146324606672754e-07, "epoch": 0.9014603584097296, "percentage": 90.15, "elapsed_time": "1 day, 6:55:11", "remaining_time": "3:22:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9785, "total_steps": 10853, "loss": 0.1112, "learning_rate": 1.3121957909645155e-07, "epoch": 0.9015524945869996, "percentage": 90.16, "elapsed_time": "1 day, 6:55:22", "remaining_time": "3:22:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9786, "total_steps": 10853, "loss": 0.1296, "learning_rate": 1.309761320676925e-07, "epoch": 0.9016446307642696, "percentage": 90.17, "elapsed_time": "1 day, 6:55:34", "remaining_time": "3:22:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9787, "total_steps": 10853, "loss": 0.1211, "learning_rate": 1.3073290500305452e-07, "epoch": 0.9017367669415396, "percentage": 90.18, "elapsed_time": "1 day, 6:55:46", "remaining_time": "3:22:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9788, "total_steps": 10853, "loss": 0.1165, "learning_rate": 1.3048989792512096e-07, "epoch": 0.9018289031188096, "percentage": 90.19, "elapsed_time": "1 day, 6:55:57", "remaining_time": "3:21:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9789, "total_steps": 10853, "loss": 0.1174, "learning_rate": 1.3024711085645597e-07, "epoch": 0.9019210392960796, "percentage": 90.2, "elapsed_time": "1 day, 6:56:08", "remaining_time": "3:21:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9790, "total_steps": 10853, "loss": 0.1151, "learning_rate": 1.3000454381960127e-07, "epoch": 0.9020131754733496, "percentage": 90.21, "elapsed_time": "1 day, 6:56:19", "remaining_time": "3:21:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9791, "total_steps": 10853, "loss": 0.113, "learning_rate": 1.297621968370802e-07, "epoch": 0.9021053116506196, "percentage": 90.21, "elapsed_time": "1 day, 6:56:30", "remaining_time": "3:21:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9792, "total_steps": 10853, "loss": 0.13, "learning_rate": 1.2952006993139393e-07, "epoch": 0.9021974478278896, "percentage": 90.22, "elapsed_time": "1 day, 6:56:41", "remaining_time": "3:21:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9793, "total_steps": 10853, "loss": 0.1248, "learning_rate": 1.2927816312502422e-07, "epoch": 0.9022895840051596, "percentage": 90.23, "elapsed_time": "1 day, 6:56:53", "remaining_time": "3:20:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9794, "total_steps": 10853, "loss": 0.121, "learning_rate": 1.2903647644043254e-07, "epoch": 0.9023817201824297, "percentage": 90.24, "elapsed_time": "1 day, 6:57:03", "remaining_time": "3:20:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9795, "total_steps": 10853, "loss": 0.1118, "learning_rate": 1.2879500990005926e-07, "epoch": 0.9024738563596997, "percentage": 90.25, "elapsed_time": "1 day, 6:57:14", "remaining_time": "3:20:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9796, "total_steps": 10853, "loss": 0.1199, "learning_rate": 1.2855376352632427e-07, "epoch": 0.9025659925369697, "percentage": 90.26, "elapsed_time": "1 day, 6:57:25", "remaining_time": "3:20:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9797, "total_steps": 10853, "loss": 0.1116, "learning_rate": 1.2831273734162736e-07, "epoch": 0.9026581287142397, "percentage": 90.27, "elapsed_time": "1 day, 6:57:35", "remaining_time": "3:20:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9798, "total_steps": 10853, "loss": 0.127, "learning_rate": 1.280719313683479e-07, "epoch": 0.9027502648915097, "percentage": 90.28, "elapsed_time": "1 day, 6:57:46", "remaining_time": "3:20:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9799, "total_steps": 10853, "loss": 0.1309, "learning_rate": 1.2783134562884547e-07, "epoch": 0.9028424010687797, "percentage": 90.29, "elapsed_time": "1 day, 6:57:57", "remaining_time": "3:19:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9800, "total_steps": 10853, "loss": 0.1242, "learning_rate": 1.275909801454578e-07, "epoch": 0.9029345372460497, "percentage": 90.3, "elapsed_time": "1 day, 6:58:08", "remaining_time": "3:19:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9801, "total_steps": 10853, "loss": 0.1172, "learning_rate": 1.2735083494050255e-07, "epoch": 0.9030266734233197, "percentage": 90.31, "elapsed_time": "1 day, 6:58:20", "remaining_time": "3:19:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9802, "total_steps": 10853, "loss": 0.1197, "learning_rate": 1.2711091003627773e-07, "epoch": 0.9031188096005897, "percentage": 90.32, "elapsed_time": "1 day, 6:58:30", "remaining_time": "3:19:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9803, "total_steps": 10853, "loss": 0.1187, "learning_rate": 1.2687120545506054e-07, "epoch": 0.9032109457778597, "percentage": 90.33, "elapsed_time": "1 day, 6:58:42", "remaining_time": "3:19:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9804, "total_steps": 10853, "loss": 0.1189, "learning_rate": 1.2663172121910705e-07, "epoch": 0.9033030819551296, "percentage": 90.33, "elapsed_time": "1 day, 6:58:51", "remaining_time": "3:18:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9805, "total_steps": 10853, "loss": 0.1092, "learning_rate": 1.263924573506542e-07, "epoch": 0.9033952181323996, "percentage": 90.34, "elapsed_time": "1 day, 6:59:02", "remaining_time": "3:18:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9806, "total_steps": 10853, "loss": 0.1253, "learning_rate": 1.2615341387191644e-07, "epoch": 0.9034873543096696, "percentage": 90.35, "elapsed_time": "1 day, 6:59:12", "remaining_time": "3:18:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9807, "total_steps": 10853, "loss": 0.1108, "learning_rate": 1.2591459080509017e-07, "epoch": 0.9035794904869398, "percentage": 90.36, "elapsed_time": "1 day, 6:59:22", "remaining_time": "3:18:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9808, "total_steps": 10853, "loss": 0.1146, "learning_rate": 1.2567598817234932e-07, "epoch": 0.9036716266642097, "percentage": 90.37, "elapsed_time": "1 day, 6:59:33", "remaining_time": "3:18:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9809, "total_steps": 10853, "loss": 0.1208, "learning_rate": 1.2543760599584842e-07, "epoch": 0.9037637628414797, "percentage": 90.38, "elapsed_time": "1 day, 6:59:45", "remaining_time": "3:17:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9810, "total_steps": 10853, "loss": 0.1109, "learning_rate": 1.2519944429772168e-07, "epoch": 0.9038558990187497, "percentage": 90.39, "elapsed_time": "1 day, 6:59:56", "remaining_time": "3:17:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9811, "total_steps": 10853, "loss": 0.1333, "learning_rate": 1.2496150310008226e-07, "epoch": 0.9039480351960197, "percentage": 90.4, "elapsed_time": "1 day, 7:00:08", "remaining_time": "3:17:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9812, "total_steps": 10853, "loss": 0.1166, "learning_rate": 1.2472378242502247e-07, "epoch": 0.9040401713732897, "percentage": 90.41, "elapsed_time": "1 day, 7:00:18", "remaining_time": "3:17:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9813, "total_steps": 10853, "loss": 0.1123, "learning_rate": 1.2448628229461522e-07, "epoch": 0.9041323075505597, "percentage": 90.42, "elapsed_time": "1 day, 7:00:29", "remaining_time": "3:17:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9814, "total_steps": 10853, "loss": 0.1059, "learning_rate": 1.2424900273091206e-07, "epoch": 0.9042244437278297, "percentage": 90.43, "elapsed_time": "1 day, 7:00:39", "remaining_time": "3:16:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9815, "total_steps": 10853, "loss": 0.1171, "learning_rate": 1.2401194375594532e-07, "epoch": 0.9043165799050997, "percentage": 90.44, "elapsed_time": "1 day, 7:00:50", "remaining_time": "3:16:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9816, "total_steps": 10853, "loss": 0.1137, "learning_rate": 1.237751053917252e-07, "epoch": 0.9044087160823697, "percentage": 90.45, "elapsed_time": "1 day, 7:01:00", "remaining_time": "3:16:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9817, "total_steps": 10853, "loss": 0.1166, "learning_rate": 1.235384876602419e-07, "epoch": 0.9045008522596397, "percentage": 90.45, "elapsed_time": "1 day, 7:01:11", "remaining_time": "3:16:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9818, "total_steps": 10853, "loss": 0.1109, "learning_rate": 1.233020905834656e-07, "epoch": 0.9045929884369097, "percentage": 90.46, "elapsed_time": "1 day, 7:01:24", "remaining_time": "3:16:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9819, "total_steps": 10853, "loss": 0.1236, "learning_rate": 1.2306591418334624e-07, "epoch": 0.9046851246141797, "percentage": 90.47, "elapsed_time": "1 day, 7:01:36", "remaining_time": "3:16:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9820, "total_steps": 10853, "loss": 0.1238, "learning_rate": 1.2282995848181267e-07, "epoch": 0.9047772607914497, "percentage": 90.48, "elapsed_time": "1 day, 7:01:47", "remaining_time": "3:15:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9821, "total_steps": 10853, "loss": 0.1026, "learning_rate": 1.2259422350077348e-07, "epoch": 0.9048693969687198, "percentage": 90.49, "elapsed_time": "1 day, 7:01:57", "remaining_time": "3:15:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9822, "total_steps": 10853, "loss": 0.1147, "learning_rate": 1.223587092621162e-07, "epoch": 0.9049615331459898, "percentage": 90.5, "elapsed_time": "1 day, 7:02:09", "remaining_time": "3:15:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9823, "total_steps": 10853, "loss": 0.1168, "learning_rate": 1.2212341578770854e-07, "epoch": 0.9050536693232598, "percentage": 90.51, "elapsed_time": "1 day, 7:02:19", "remaining_time": "3:15:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9824, "total_steps": 10853, "loss": 0.1158, "learning_rate": 1.2188834309939806e-07, "epoch": 0.9051458055005298, "percentage": 90.52, "elapsed_time": "1 day, 7:02:32", "remaining_time": "3:15:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9825, "total_steps": 10853, "loss": 0.1126, "learning_rate": 1.2165349121901037e-07, "epoch": 0.9052379416777998, "percentage": 90.53, "elapsed_time": "1 day, 7:02:43", "remaining_time": "3:14:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9826, "total_steps": 10853, "loss": 0.1137, "learning_rate": 1.2141886016835246e-07, "epoch": 0.9053300778550698, "percentage": 90.54, "elapsed_time": "1 day, 7:02:55", "remaining_time": "3:14:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9827, "total_steps": 10853, "loss": 0.1172, "learning_rate": 1.2118444996920887e-07, "epoch": 0.9054222140323398, "percentage": 90.55, "elapsed_time": "1 day, 7:03:06", "remaining_time": "3:14:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9828, "total_steps": 10853, "loss": 0.1186, "learning_rate": 1.2095026064334548e-07, "epoch": 0.9055143502096098, "percentage": 90.56, "elapsed_time": "1 day, 7:03:17", "remaining_time": "3:14:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9829, "total_steps": 10853, "loss": 0.1197, "learning_rate": 1.207162922125063e-07, "epoch": 0.9056064863868798, "percentage": 90.56, "elapsed_time": "1 day, 7:03:29", "remaining_time": "3:14:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9830, "total_steps": 10853, "loss": 0.1071, "learning_rate": 1.2048254469841508e-07, "epoch": 0.9056986225641498, "percentage": 90.57, "elapsed_time": "1 day, 7:03:39", "remaining_time": "3:13:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9831, "total_steps": 10853, "loss": 0.1223, "learning_rate": 1.2024901812277639e-07, "epoch": 0.9057907587414198, "percentage": 90.58, "elapsed_time": "1 day, 7:03:49", "remaining_time": "3:13:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9832, "total_steps": 10853, "loss": 0.1132, "learning_rate": 1.2001571250727233e-07, "epoch": 0.9058828949186898, "percentage": 90.59, "elapsed_time": "1 day, 7:04:00", "remaining_time": "3:13:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9833, "total_steps": 10853, "loss": 0.1131, "learning_rate": 1.1978262787356504e-07, "epoch": 0.9059750310959598, "percentage": 90.6, "elapsed_time": "1 day, 7:04:11", "remaining_time": "3:13:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9834, "total_steps": 10853, "loss": 0.114, "learning_rate": 1.1954976424329716e-07, "epoch": 0.9060671672732298, "percentage": 90.61, "elapsed_time": "1 day, 7:04:20", "remaining_time": "3:13:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9835, "total_steps": 10853, "loss": 0.1168, "learning_rate": 1.193171216380895e-07, "epoch": 0.9061593034504999, "percentage": 90.62, "elapsed_time": "1 day, 7:04:31", "remaining_time": "3:12:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9836, "total_steps": 10853, "loss": 0.1175, "learning_rate": 1.1908470007954392e-07, "epoch": 0.9062514396277699, "percentage": 90.63, "elapsed_time": "1 day, 7:04:42", "remaining_time": "3:12:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9837, "total_steps": 10853, "loss": 0.1165, "learning_rate": 1.188524995892401e-07, "epoch": 0.9063435758050399, "percentage": 90.64, "elapsed_time": "1 day, 7:04:53", "remaining_time": "3:12:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9838, "total_steps": 10853, "loss": 0.1181, "learning_rate": 1.1862052018873777e-07, "epoch": 0.9064357119823099, "percentage": 90.65, "elapsed_time": "1 day, 7:05:03", "remaining_time": "3:12:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9839, "total_steps": 10853, "loss": 0.1342, "learning_rate": 1.1838876189957632e-07, "epoch": 0.9065278481595799, "percentage": 90.66, "elapsed_time": "1 day, 7:05:15", "remaining_time": "3:12:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9840, "total_steps": 10853, "loss": 0.1159, "learning_rate": 1.1815722474327495e-07, "epoch": 0.9066199843368499, "percentage": 90.67, "elapsed_time": "1 day, 7:05:25", "remaining_time": "3:12:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9841, "total_steps": 10853, "loss": 0.115, "learning_rate": 1.1792590874133119e-07, "epoch": 0.9067121205141199, "percentage": 90.68, "elapsed_time": "1 day, 7:05:33", "remaining_time": "3:11:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9842, "total_steps": 10853, "loss": 0.1225, "learning_rate": 1.176948139152237e-07, "epoch": 0.9068042566913899, "percentage": 90.68, "elapsed_time": "1 day, 7:05:44", "remaining_time": "3:11:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9843, "total_steps": 10853, "loss": 0.1236, "learning_rate": 1.1746394028640862e-07, "epoch": 0.9068963928686599, "percentage": 90.69, "elapsed_time": "1 day, 7:05:55", "remaining_time": "3:11:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9844, "total_steps": 10853, "loss": 0.119, "learning_rate": 1.1723328787632354e-07, "epoch": 0.9069885290459299, "percentage": 90.7, "elapsed_time": "1 day, 7:06:07", "remaining_time": "3:11:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9845, "total_steps": 10853, "loss": 0.1105, "learning_rate": 1.1700285670638356e-07, "epoch": 0.9070806652231999, "percentage": 90.71, "elapsed_time": "1 day, 7:06:17", "remaining_time": "3:11:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9846, "total_steps": 10853, "loss": 0.1135, "learning_rate": 1.1677264679798489e-07, "epoch": 0.9071728014004699, "percentage": 90.72, "elapsed_time": "1 day, 7:06:28", "remaining_time": "3:10:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9847, "total_steps": 10853, "loss": 0.0993, "learning_rate": 1.1654265817250294e-07, "epoch": 0.9072649375777398, "percentage": 90.73, "elapsed_time": "1 day, 7:06:37", "remaining_time": "3:10:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9848, "total_steps": 10853, "loss": 0.1209, "learning_rate": 1.1631289085129143e-07, "epoch": 0.90735707375501, "percentage": 90.74, "elapsed_time": "1 day, 7:06:49", "remaining_time": "3:10:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9849, "total_steps": 10853, "loss": 0.1099, "learning_rate": 1.1608334485568446e-07, "epoch": 0.90744920993228, "percentage": 90.75, "elapsed_time": "1 day, 7:06:58", "remaining_time": "3:10:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9850, "total_steps": 10853, "loss": 0.1128, "learning_rate": 1.1585402020699548e-07, "epoch": 0.90754134610955, "percentage": 90.76, "elapsed_time": "1 day, 7:07:09", "remaining_time": "3:10:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9851, "total_steps": 10853, "loss": 0.1223, "learning_rate": 1.1562491692651723e-07, "epoch": 0.90763348228682, "percentage": 90.77, "elapsed_time": "1 day, 7:07:19", "remaining_time": "3:09:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9852, "total_steps": 10853, "loss": 0.124, "learning_rate": 1.153960350355221e-07, "epoch": 0.90772561846409, "percentage": 90.78, "elapsed_time": "1 day, 7:07:31", "remaining_time": "3:09:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9853, "total_steps": 10853, "loss": 0.1159, "learning_rate": 1.1516737455526228e-07, "epoch": 0.9078177546413599, "percentage": 90.79, "elapsed_time": "1 day, 7:07:42", "remaining_time": "3:09:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9854, "total_steps": 10853, "loss": 0.1184, "learning_rate": 1.14938935506968e-07, "epoch": 0.9079098908186299, "percentage": 90.8, "elapsed_time": "1 day, 7:07:54", "remaining_time": "3:09:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9855, "total_steps": 10853, "loss": 0.1362, "learning_rate": 1.1471071791185007e-07, "epoch": 0.9080020269958999, "percentage": 90.8, "elapsed_time": "1 day, 7:08:04", "remaining_time": "3:09:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9856, "total_steps": 10853, "loss": 0.1233, "learning_rate": 1.1448272179109848e-07, "epoch": 0.9080941631731699, "percentage": 90.81, "elapsed_time": "1 day, 7:08:16", "remaining_time": "3:08:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9857, "total_steps": 10853, "loss": 0.1238, "learning_rate": 1.1425494716588353e-07, "epoch": 0.9081862993504399, "percentage": 90.82, "elapsed_time": "1 day, 7:08:28", "remaining_time": "3:08:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9858, "total_steps": 10853, "loss": 0.1067, "learning_rate": 1.1402739405735303e-07, "epoch": 0.9082784355277099, "percentage": 90.83, "elapsed_time": "1 day, 7:08:39", "remaining_time": "3:08:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9859, "total_steps": 10853, "loss": 0.1212, "learning_rate": 1.1380006248663616e-07, "epoch": 0.9083705717049799, "percentage": 90.84, "elapsed_time": "1 day, 7:08:50", "remaining_time": "3:08:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9860, "total_steps": 10853, "loss": 0.1184, "learning_rate": 1.1357295247483997e-07, "epoch": 0.9084627078822499, "percentage": 90.85, "elapsed_time": "1 day, 7:09:00", "remaining_time": "3:08:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9861, "total_steps": 10853, "loss": 0.1253, "learning_rate": 1.1334606404305226e-07, "epoch": 0.9085548440595199, "percentage": 90.86, "elapsed_time": "1 day, 7:09:12", "remaining_time": "3:08:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9862, "total_steps": 10853, "loss": 0.1063, "learning_rate": 1.13119397212339e-07, "epoch": 0.90864698023679, "percentage": 90.87, "elapsed_time": "1 day, 7:09:22", "remaining_time": "3:07:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9863, "total_steps": 10853, "loss": 0.1021, "learning_rate": 1.1289295200374667e-07, "epoch": 0.90873911641406, "percentage": 90.88, "elapsed_time": "1 day, 7:09:33", "remaining_time": "3:07:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9864, "total_steps": 10853, "loss": 0.1124, "learning_rate": 1.1266672843830095e-07, "epoch": 0.90883125259133, "percentage": 90.89, "elapsed_time": "1 day, 7:09:44", "remaining_time": "3:07:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9865, "total_steps": 10853, "loss": 0.1071, "learning_rate": 1.1244072653700644e-07, "epoch": 0.9089233887686, "percentage": 90.9, "elapsed_time": "1 day, 7:09:55", "remaining_time": "3:07:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9866, "total_steps": 10853, "loss": 0.1143, "learning_rate": 1.122149463208469e-07, "epoch": 0.90901552494587, "percentage": 90.91, "elapsed_time": "1 day, 7:10:05", "remaining_time": "3:07:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9867, "total_steps": 10853, "loss": 0.1183, "learning_rate": 1.1198938781078694e-07, "epoch": 0.90910766112314, "percentage": 90.91, "elapsed_time": "1 day, 7:10:15", "remaining_time": "3:06:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9868, "total_steps": 10853, "loss": 0.1078, "learning_rate": 1.1176405102776899e-07, "epoch": 0.90919979730041, "percentage": 90.92, "elapsed_time": "1 day, 7:10:24", "remaining_time": "3:06:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9869, "total_steps": 10853, "loss": 0.1149, "learning_rate": 1.1153893599271631e-07, "epoch": 0.90929193347768, "percentage": 90.93, "elapsed_time": "1 day, 7:10:35", "remaining_time": "3:06:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9870, "total_steps": 10853, "loss": 0.1122, "learning_rate": 1.1131404272653051e-07, "epoch": 0.90938406965495, "percentage": 90.94, "elapsed_time": "1 day, 7:10:46", "remaining_time": "3:06:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9871, "total_steps": 10853, "loss": 0.1212, "learning_rate": 1.1108937125009266e-07, "epoch": 0.90947620583222, "percentage": 90.95, "elapsed_time": "1 day, 7:10:57", "remaining_time": "3:06:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9872, "total_steps": 10853, "loss": 0.1276, "learning_rate": 1.1086492158426387e-07, "epoch": 0.90956834200949, "percentage": 90.96, "elapsed_time": "1 day, 7:11:08", "remaining_time": "3:05:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9873, "total_steps": 10853, "loss": 0.117, "learning_rate": 1.106406937498844e-07, "epoch": 0.90966047818676, "percentage": 90.97, "elapsed_time": "1 day, 7:11:17", "remaining_time": "3:05:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9874, "total_steps": 10853, "loss": 0.1188, "learning_rate": 1.1041668776777342e-07, "epoch": 0.90975261436403, "percentage": 90.98, "elapsed_time": "1 day, 7:11:28", "remaining_time": "3:05:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9875, "total_steps": 10853, "loss": 0.1167, "learning_rate": 1.1019290365873042e-07, "epoch": 0.9098447505413001, "percentage": 90.99, "elapsed_time": "1 day, 7:11:39", "remaining_time": "3:05:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9876, "total_steps": 10853, "loss": 0.1238, "learning_rate": 1.0996934144353322e-07, "epoch": 0.9099368867185701, "percentage": 91.0, "elapsed_time": "1 day, 7:11:50", "remaining_time": "3:05:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9877, "total_steps": 10853, "loss": 0.131, "learning_rate": 1.0974600114293993e-07, "epoch": 0.9100290228958401, "percentage": 91.01, "elapsed_time": "1 day, 7:12:02", "remaining_time": "3:04:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9878, "total_steps": 10853, "loss": 0.1243, "learning_rate": 1.0952288277768786e-07, "epoch": 0.9101211590731101, "percentage": 91.02, "elapsed_time": "1 day, 7:12:14", "remaining_time": "3:04:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9879, "total_steps": 10853, "loss": 0.1114, "learning_rate": 1.0929998636849321e-07, "epoch": 0.9102132952503801, "percentage": 91.03, "elapsed_time": "1 day, 7:12:23", "remaining_time": "3:04:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9880, "total_steps": 10853, "loss": 0.1047, "learning_rate": 1.090773119360522e-07, "epoch": 0.9103054314276501, "percentage": 91.03, "elapsed_time": "1 day, 7:12:33", "remaining_time": "3:04:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9881, "total_steps": 10853, "loss": 0.115, "learning_rate": 1.0885485950103997e-07, "epoch": 0.9103975676049201, "percentage": 91.04, "elapsed_time": "1 day, 7:12:44", "remaining_time": "3:04:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9882, "total_steps": 10853, "loss": 0.1102, "learning_rate": 1.0863262908411165e-07, "epoch": 0.9104897037821901, "percentage": 91.05, "elapsed_time": "1 day, 7:12:54", "remaining_time": "3:04:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9883, "total_steps": 10853, "loss": 0.1195, "learning_rate": 1.0841062070590074e-07, "epoch": 0.9105818399594601, "percentage": 91.06, "elapsed_time": "1 day, 7:13:08", "remaining_time": "3:03:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9884, "total_steps": 10853, "loss": 0.107, "learning_rate": 1.0818883438702105e-07, "epoch": 0.9106739761367301, "percentage": 91.07, "elapsed_time": "1 day, 7:13:18", "remaining_time": "3:03:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9885, "total_steps": 10853, "loss": 0.1209, "learning_rate": 1.0796727014806607e-07, "epoch": 0.9107661123140001, "percentage": 91.08, "elapsed_time": "1 day, 7:13:29", "remaining_time": "3:03:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9886, "total_steps": 10853, "loss": 0.119, "learning_rate": 1.0774592800960715e-07, "epoch": 0.9108582484912701, "percentage": 91.09, "elapsed_time": "1 day, 7:13:40", "remaining_time": "3:03:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9887, "total_steps": 10853, "loss": 0.117, "learning_rate": 1.0752480799219616e-07, "epoch": 0.9109503846685401, "percentage": 91.1, "elapsed_time": "1 day, 7:13:51", "remaining_time": "3:03:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9888, "total_steps": 10853, "loss": 0.1242, "learning_rate": 1.073039101163642e-07, "epoch": 0.91104252084581, "percentage": 91.11, "elapsed_time": "1 day, 7:14:03", "remaining_time": "3:02:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9889, "total_steps": 10853, "loss": 0.103, "learning_rate": 1.0708323440262153e-07, "epoch": 0.9111346570230802, "percentage": 91.12, "elapsed_time": "1 day, 7:14:13", "remaining_time": "3:02:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9890, "total_steps": 10853, "loss": 0.1183, "learning_rate": 1.0686278087145868e-07, "epoch": 0.9112267932003502, "percentage": 91.13, "elapsed_time": "1 day, 7:14:23", "remaining_time": "3:02:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9891, "total_steps": 10853, "loss": 0.112, "learning_rate": 1.0664254954334402e-07, "epoch": 0.9113189293776202, "percentage": 91.14, "elapsed_time": "1 day, 7:14:36", "remaining_time": "3:02:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9892, "total_steps": 10853, "loss": 0.1163, "learning_rate": 1.064225404387259e-07, "epoch": 0.9114110655548902, "percentage": 91.15, "elapsed_time": "1 day, 7:14:47", "remaining_time": "3:02:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9893, "total_steps": 10853, "loss": 0.1219, "learning_rate": 1.0620275357803244e-07, "epoch": 0.9115032017321602, "percentage": 91.15, "elapsed_time": "1 day, 7:14:58", "remaining_time": "3:01:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9894, "total_steps": 10853, "loss": 0.1149, "learning_rate": 1.059831889816712e-07, "epoch": 0.9115953379094301, "percentage": 91.16, "elapsed_time": "1 day, 7:15:09", "remaining_time": "3:01:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9895, "total_steps": 10853, "loss": 0.1091, "learning_rate": 1.0576384667002837e-07, "epoch": 0.9116874740867001, "percentage": 91.17, "elapsed_time": "1 day, 7:15:20", "remaining_time": "3:01:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9896, "total_steps": 10853, "loss": 0.1245, "learning_rate": 1.0554472666347043e-07, "epoch": 0.9117796102639701, "percentage": 91.18, "elapsed_time": "1 day, 7:15:30", "remaining_time": "3:01:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9897, "total_steps": 10853, "loss": 0.1224, "learning_rate": 1.0532582898234167e-07, "epoch": 0.9118717464412401, "percentage": 91.19, "elapsed_time": "1 day, 7:15:41", "remaining_time": "3:01:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9898, "total_steps": 10853, "loss": 0.1278, "learning_rate": 1.0510715364696806e-07, "epoch": 0.9119638826185101, "percentage": 91.2, "elapsed_time": "1 day, 7:15:52", "remaining_time": "3:00:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9899, "total_steps": 10853, "loss": 0.1071, "learning_rate": 1.048887006776525e-07, "epoch": 0.9120560187957801, "percentage": 91.21, "elapsed_time": "1 day, 7:16:02", "remaining_time": "3:00:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9900, "total_steps": 10853, "loss": 0.1179, "learning_rate": 1.0467047009467878e-07, "epoch": 0.9121481549730501, "percentage": 91.22, "elapsed_time": "1 day, 7:16:13", "remaining_time": "3:00:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9901, "total_steps": 10853, "loss": 0.1222, "learning_rate": 1.0445246191831015e-07, "epoch": 0.9122402911503201, "percentage": 91.23, "elapsed_time": "1 day, 7:16:24", "remaining_time": "3:00:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9902, "total_steps": 10853, "loss": 0.1223, "learning_rate": 1.0423467616878819e-07, "epoch": 0.9123324273275901, "percentage": 91.24, "elapsed_time": "1 day, 7:16:34", "remaining_time": "3:00:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9903, "total_steps": 10853, "loss": 0.1113, "learning_rate": 1.040171128663342e-07, "epoch": 0.9124245635048602, "percentage": 91.25, "elapsed_time": "1 day, 7:16:45", "remaining_time": "3:00:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9904, "total_steps": 10853, "loss": 0.1258, "learning_rate": 1.03799772031149e-07, "epoch": 0.9125166996821302, "percentage": 91.26, "elapsed_time": "1 day, 7:16:55", "remaining_time": "2:59:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9905, "total_steps": 10853, "loss": 0.1107, "learning_rate": 1.035826536834128e-07, "epoch": 0.9126088358594002, "percentage": 91.27, "elapsed_time": "1 day, 7:17:05", "remaining_time": "2:59:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9906, "total_steps": 10853, "loss": 0.1129, "learning_rate": 1.0336575784328534e-07, "epoch": 0.9127009720366702, "percentage": 91.27, "elapsed_time": "1 day, 7:17:16", "remaining_time": "2:59:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9907, "total_steps": 10853, "loss": 0.1155, "learning_rate": 1.031490845309055e-07, "epoch": 0.9127931082139402, "percentage": 91.28, "elapsed_time": "1 day, 7:17:26", "remaining_time": "2:59:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9908, "total_steps": 10853, "loss": 0.1136, "learning_rate": 1.029326337663905e-07, "epoch": 0.9128852443912102, "percentage": 91.29, "elapsed_time": "1 day, 7:17:38", "remaining_time": "2:59:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9909, "total_steps": 10853, "loss": 0.1117, "learning_rate": 1.0271640556983875e-07, "epoch": 0.9129773805684802, "percentage": 91.3, "elapsed_time": "1 day, 7:17:47", "remaining_time": "2:58:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9910, "total_steps": 10853, "loss": 0.1191, "learning_rate": 1.0250039996132637e-07, "epoch": 0.9130695167457502, "percentage": 91.31, "elapsed_time": "1 day, 7:17:59", "remaining_time": "2:58:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9911, "total_steps": 10853, "loss": 0.116, "learning_rate": 1.0228461696091041e-07, "epoch": 0.9131616529230202, "percentage": 91.32, "elapsed_time": "1 day, 7:18:09", "remaining_time": "2:58:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9912, "total_steps": 10853, "loss": 0.1203, "learning_rate": 1.0206905658862592e-07, "epoch": 0.9132537891002902, "percentage": 91.33, "elapsed_time": "1 day, 7:18:19", "remaining_time": "2:58:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9913, "total_steps": 10853, "loss": 0.1039, "learning_rate": 1.0185371886448719e-07, "epoch": 0.9133459252775602, "percentage": 91.34, "elapsed_time": "1 day, 7:18:29", "remaining_time": "2:58:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9914, "total_steps": 10853, "loss": 0.1293, "learning_rate": 1.016386038084885e-07, "epoch": 0.9134380614548302, "percentage": 91.35, "elapsed_time": "1 day, 7:18:41", "remaining_time": "2:57:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9915, "total_steps": 10853, "loss": 0.1026, "learning_rate": 1.0142371144060414e-07, "epoch": 0.9135301976321002, "percentage": 91.36, "elapsed_time": "1 day, 7:18:52", "remaining_time": "2:57:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9916, "total_steps": 10853, "loss": 0.1125, "learning_rate": 1.0120904178078594e-07, "epoch": 0.9136223338093703, "percentage": 91.37, "elapsed_time": "1 day, 7:19:02", "remaining_time": "2:57:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9917, "total_steps": 10853, "loss": 0.1161, "learning_rate": 1.0099459484896684e-07, "epoch": 0.9137144699866403, "percentage": 91.38, "elapsed_time": "1 day, 7:19:14", "remaining_time": "2:57:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9918, "total_steps": 10853, "loss": 0.1201, "learning_rate": 1.007803706650573e-07, "epoch": 0.9138066061639103, "percentage": 91.38, "elapsed_time": "1 day, 7:19:25", "remaining_time": "2:57:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9919, "total_steps": 10853, "loss": 0.1082, "learning_rate": 1.0056636924894864e-07, "epoch": 0.9138987423411803, "percentage": 91.39, "elapsed_time": "1 day, 7:19:36", "remaining_time": "2:56:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9920, "total_steps": 10853, "loss": 0.111, "learning_rate": 1.0035259062051079e-07, "epoch": 0.9139908785184503, "percentage": 91.4, "elapsed_time": "1 day, 7:19:46", "remaining_time": "2:56:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9921, "total_steps": 10853, "loss": 0.1107, "learning_rate": 1.0013903479959313e-07, "epoch": 0.9140830146957203, "percentage": 91.41, "elapsed_time": "1 day, 7:19:58", "remaining_time": "2:56:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9922, "total_steps": 10853, "loss": 0.1183, "learning_rate": 9.992570180602484e-08, "epoch": 0.9141751508729903, "percentage": 91.42, "elapsed_time": "1 day, 7:20:10", "remaining_time": "2:56:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9923, "total_steps": 10853, "loss": 0.1186, "learning_rate": 9.971259165961312e-08, "epoch": 0.9142672870502603, "percentage": 91.43, "elapsed_time": "1 day, 7:20:19", "remaining_time": "2:56:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9924, "total_steps": 10853, "loss": 0.1103, "learning_rate": 9.949970438014544e-08, "epoch": 0.9143594232275303, "percentage": 91.44, "elapsed_time": "1 day, 7:20:30", "remaining_time": "2:56:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9925, "total_steps": 10853, "loss": 0.1068, "learning_rate": 9.928703998738853e-08, "epoch": 0.9144515594048003, "percentage": 91.45, "elapsed_time": "1 day, 7:20:41", "remaining_time": "2:55:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9926, "total_steps": 10853, "loss": 0.1131, "learning_rate": 9.907459850108824e-08, "epoch": 0.9145436955820703, "percentage": 91.46, "elapsed_time": "1 day, 7:20:52", "remaining_time": "2:55:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9927, "total_steps": 10853, "loss": 0.1147, "learning_rate": 9.886237994097048e-08, "epoch": 0.9146358317593403, "percentage": 91.47, "elapsed_time": "1 day, 7:21:04", "remaining_time": "2:55:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9928, "total_steps": 10853, "loss": 0.115, "learning_rate": 9.86503843267389e-08, "epoch": 0.9147279679366103, "percentage": 91.48, "elapsed_time": "1 day, 7:21:14", "remaining_time": "2:55:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9929, "total_steps": 10853, "loss": 0.1271, "learning_rate": 9.843861167807722e-08, "epoch": 0.9148201041138803, "percentage": 91.49, "elapsed_time": "1 day, 7:21:25", "remaining_time": "2:55:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9930, "total_steps": 10853, "loss": 0.1077, "learning_rate": 9.822706201464915e-08, "epoch": 0.9149122402911504, "percentage": 91.5, "elapsed_time": "1 day, 7:21:34", "remaining_time": "2:54:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9931, "total_steps": 10853, "loss": 0.1187, "learning_rate": 9.801573535609677e-08, "epoch": 0.9150043764684204, "percentage": 91.5, "elapsed_time": "1 day, 7:21:45", "remaining_time": "2:54:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9932, "total_steps": 10853, "loss": 0.122, "learning_rate": 9.780463172204186e-08, "epoch": 0.9150965126456904, "percentage": 91.51, "elapsed_time": "1 day, 7:21:58", "remaining_time": "2:54:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9933, "total_steps": 10853, "loss": 0.1159, "learning_rate": 9.759375113208541e-08, "epoch": 0.9151886488229604, "percentage": 91.52, "elapsed_time": "1 day, 7:22:09", "remaining_time": "2:54:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9934, "total_steps": 10853, "loss": 0.1297, "learning_rate": 9.738309360580789e-08, "epoch": 0.9152807850002304, "percentage": 91.53, "elapsed_time": "1 day, 7:22:20", "remaining_time": "2:54:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9935, "total_steps": 10853, "loss": 0.1173, "learning_rate": 9.717265916276863e-08, "epoch": 0.9153729211775004, "percentage": 91.54, "elapsed_time": "1 day, 7:22:30", "remaining_time": "2:53:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9936, "total_steps": 10853, "loss": 0.1032, "learning_rate": 9.696244782250675e-08, "epoch": 0.9154650573547704, "percentage": 91.55, "elapsed_time": "1 day, 7:22:41", "remaining_time": "2:53:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9937, "total_steps": 10853, "loss": 0.1208, "learning_rate": 9.675245960453966e-08, "epoch": 0.9155571935320403, "percentage": 91.56, "elapsed_time": "1 day, 7:22:53", "remaining_time": "2:53:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9938, "total_steps": 10853, "loss": 0.1273, "learning_rate": 9.654269452836567e-08, "epoch": 0.9156493297093103, "percentage": 91.57, "elapsed_time": "1 day, 7:23:04", "remaining_time": "2:53:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9939, "total_steps": 10853, "loss": 0.1111, "learning_rate": 9.633315261346115e-08, "epoch": 0.9157414658865803, "percentage": 91.58, "elapsed_time": "1 day, 7:23:16", "remaining_time": "2:53:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9940, "total_steps": 10853, "loss": 0.1238, "learning_rate": 9.612383387928248e-08, "epoch": 0.9158336020638503, "percentage": 91.59, "elapsed_time": "1 day, 7:23:28", "remaining_time": "2:52:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9941, "total_steps": 10853, "loss": 0.1171, "learning_rate": 9.59147383452641e-08, "epoch": 0.9159257382411203, "percentage": 91.6, "elapsed_time": "1 day, 7:23:37", "remaining_time": "2:52:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9942, "total_steps": 10853, "loss": 0.1187, "learning_rate": 9.570586603082078e-08, "epoch": 0.9160178744183903, "percentage": 91.61, "elapsed_time": "1 day, 7:23:48", "remaining_time": "2:52:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9943, "total_steps": 10853, "loss": 0.1153, "learning_rate": 9.549721695534669e-08, "epoch": 0.9161100105956604, "percentage": 91.62, "elapsed_time": "1 day, 7:23:58", "remaining_time": "2:52:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9944, "total_steps": 10853, "loss": 0.1151, "learning_rate": 9.528879113821526e-08, "epoch": 0.9162021467729304, "percentage": 91.62, "elapsed_time": "1 day, 7:24:08", "remaining_time": "2:52:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9945, "total_steps": 10853, "loss": 0.1149, "learning_rate": 9.508058859877794e-08, "epoch": 0.9162942829502004, "percentage": 91.63, "elapsed_time": "1 day, 7:24:20", "remaining_time": "2:52:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9946, "total_steps": 10853, "loss": 0.1153, "learning_rate": 9.487260935636678e-08, "epoch": 0.9163864191274704, "percentage": 91.64, "elapsed_time": "1 day, 7:24:32", "remaining_time": "2:51:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9947, "total_steps": 10853, "loss": 0.109, "learning_rate": 9.466485343029269e-08, "epoch": 0.9164785553047404, "percentage": 91.65, "elapsed_time": "1 day, 7:24:42", "remaining_time": "2:51:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9948, "total_steps": 10853, "loss": 0.1125, "learning_rate": 9.44573208398461e-08, "epoch": 0.9165706914820104, "percentage": 91.66, "elapsed_time": "1 day, 7:24:53", "remaining_time": "2:51:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9949, "total_steps": 10853, "loss": 0.1159, "learning_rate": 9.425001160429603e-08, "epoch": 0.9166628276592804, "percentage": 91.67, "elapsed_time": "1 day, 7:25:03", "remaining_time": "2:51:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9950, "total_steps": 10853, "loss": 0.1183, "learning_rate": 9.404292574289126e-08, "epoch": 0.9167549638365504, "percentage": 91.68, "elapsed_time": "1 day, 7:25:14", "remaining_time": "2:51:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9951, "total_steps": 10853, "loss": 0.1044, "learning_rate": 9.383606327485973e-08, "epoch": 0.9168471000138204, "percentage": 91.69, "elapsed_time": "1 day, 7:25:24", "remaining_time": "2:50:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9952, "total_steps": 10853, "loss": 0.1214, "learning_rate": 9.362942421940885e-08, "epoch": 0.9169392361910904, "percentage": 91.7, "elapsed_time": "1 day, 7:25:36", "remaining_time": "2:50:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9953, "total_steps": 10853, "loss": 0.1217, "learning_rate": 9.342300859572467e-08, "epoch": 0.9170313723683604, "percentage": 91.71, "elapsed_time": "1 day, 7:25:46", "remaining_time": "2:50:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9954, "total_steps": 10853, "loss": 0.1228, "learning_rate": 9.321681642297298e-08, "epoch": 0.9171235085456304, "percentage": 91.72, "elapsed_time": "1 day, 7:25:57", "remaining_time": "2:50:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9955, "total_steps": 10853, "loss": 0.1061, "learning_rate": 9.301084772029928e-08, "epoch": 0.9172156447229004, "percentage": 91.73, "elapsed_time": "1 day, 7:26:08", "remaining_time": "2:50:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9956, "total_steps": 10853, "loss": 0.123, "learning_rate": 9.280510250682745e-08, "epoch": 0.9173077809001704, "percentage": 91.74, "elapsed_time": "1 day, 7:26:19", "remaining_time": "2:49:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9957, "total_steps": 10853, "loss": 0.1017, "learning_rate": 9.259958080166081e-08, "epoch": 0.9173999170774405, "percentage": 91.74, "elapsed_time": "1 day, 7:26:29", "remaining_time": "2:49:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9958, "total_steps": 10853, "loss": 0.1098, "learning_rate": 9.23942826238819e-08, "epoch": 0.9174920532547105, "percentage": 91.75, "elapsed_time": "1 day, 7:26:40", "remaining_time": "2:49:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9959, "total_steps": 10853, "loss": 0.1111, "learning_rate": 9.218920799255293e-08, "epoch": 0.9175841894319805, "percentage": 91.76, "elapsed_time": "1 day, 7:26:52", "remaining_time": "2:49:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9960, "total_steps": 10853, "loss": 0.1157, "learning_rate": 9.198435692671565e-08, "epoch": 0.9176763256092505, "percentage": 91.77, "elapsed_time": "1 day, 7:27:04", "remaining_time": "2:49:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9961, "total_steps": 10853, "loss": 0.1131, "learning_rate": 9.177972944538982e-08, "epoch": 0.9177684617865205, "percentage": 91.78, "elapsed_time": "1 day, 7:27:15", "remaining_time": "2:49:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9962, "total_steps": 10853, "loss": 0.1171, "learning_rate": 9.157532556757526e-08, "epoch": 0.9178605979637905, "percentage": 91.79, "elapsed_time": "1 day, 7:27:26", "remaining_time": "2:48:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9963, "total_steps": 10853, "loss": 0.115, "learning_rate": 9.137114531225066e-08, "epoch": 0.9179527341410605, "percentage": 91.8, "elapsed_time": "1 day, 7:27:37", "remaining_time": "2:48:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9964, "total_steps": 10853, "loss": 0.1291, "learning_rate": 9.116718869837449e-08, "epoch": 0.9180448703183305, "percentage": 91.81, "elapsed_time": "1 day, 7:27:48", "remaining_time": "2:48:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9965, "total_steps": 10853, "loss": 0.1164, "learning_rate": 9.096345574488435e-08, "epoch": 0.9181370064956005, "percentage": 91.82, "elapsed_time": "1 day, 7:27:58", "remaining_time": "2:48:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9966, "total_steps": 10853, "loss": 0.1134, "learning_rate": 9.075994647069653e-08, "epoch": 0.9182291426728705, "percentage": 91.83, "elapsed_time": "1 day, 7:28:10", "remaining_time": "2:48:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9967, "total_steps": 10853, "loss": 0.1246, "learning_rate": 9.0556660894707e-08, "epoch": 0.9183212788501405, "percentage": 91.84, "elapsed_time": "1 day, 7:28:22", "remaining_time": "2:47:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9968, "total_steps": 10853, "loss": 0.1085, "learning_rate": 9.035359903579039e-08, "epoch": 0.9184134150274105, "percentage": 91.85, "elapsed_time": "1 day, 7:28:33", "remaining_time": "2:47:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9969, "total_steps": 10853, "loss": 0.116, "learning_rate": 9.015076091280189e-08, "epoch": 0.9185055512046805, "percentage": 91.85, "elapsed_time": "1 day, 7:28:43", "remaining_time": "2:47:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9970, "total_steps": 10853, "loss": 0.1085, "learning_rate": 8.994814654457451e-08, "epoch": 0.9185976873819506, "percentage": 91.86, "elapsed_time": "1 day, 7:28:54", "remaining_time": "2:47:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9971, "total_steps": 10853, "loss": 0.1122, "learning_rate": 8.974575594992124e-08, "epoch": 0.9186898235592206, "percentage": 91.87, "elapsed_time": "1 day, 7:29:04", "remaining_time": "2:47:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9972, "total_steps": 10853, "loss": 0.11, "learning_rate": 8.954358914763373e-08, "epoch": 0.9187819597364906, "percentage": 91.88, "elapsed_time": "1 day, 7:29:15", "remaining_time": "2:46:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9973, "total_steps": 10853, "loss": 0.1037, "learning_rate": 8.934164615648333e-08, "epoch": 0.9188740959137606, "percentage": 91.89, "elapsed_time": "1 day, 7:29:26", "remaining_time": "2:46:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9974, "total_steps": 10853, "loss": 0.1063, "learning_rate": 8.913992699522062e-08, "epoch": 0.9189662320910306, "percentage": 91.9, "elapsed_time": "1 day, 7:29:37", "remaining_time": "2:46:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9975, "total_steps": 10853, "loss": 0.115, "learning_rate": 8.893843168257504e-08, "epoch": 0.9190583682683006, "percentage": 91.91, "elapsed_time": "1 day, 7:29:47", "remaining_time": "2:46:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9976, "total_steps": 10853, "loss": 0.105, "learning_rate": 8.873716023725581e-08, "epoch": 0.9191505044455706, "percentage": 91.92, "elapsed_time": "1 day, 7:29:58", "remaining_time": "2:46:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9977, "total_steps": 10853, "loss": 0.1249, "learning_rate": 8.853611267795076e-08, "epoch": 0.9192426406228406, "percentage": 91.93, "elapsed_time": "1 day, 7:30:08", "remaining_time": "2:45:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9978, "total_steps": 10853, "loss": 0.0996, "learning_rate": 8.833528902332688e-08, "epoch": 0.9193347768001106, "percentage": 91.94, "elapsed_time": "1 day, 7:30:19", "remaining_time": "2:45:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9979, "total_steps": 10853, "loss": 0.1141, "learning_rate": 8.813468929203095e-08, "epoch": 0.9194269129773806, "percentage": 91.95, "elapsed_time": "1 day, 7:30:30", "remaining_time": "2:45:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9980, "total_steps": 10853, "loss": 0.1184, "learning_rate": 8.793431350268861e-08, "epoch": 0.9195190491546505, "percentage": 91.96, "elapsed_time": "1 day, 7:30:42", "remaining_time": "2:45:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9981, "total_steps": 10853, "loss": 0.1151, "learning_rate": 8.773416167390525e-08, "epoch": 0.9196111853319205, "percentage": 91.97, "elapsed_time": "1 day, 7:30:53", "remaining_time": "2:45:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9982, "total_steps": 10853, "loss": 0.1048, "learning_rate": 8.753423382426463e-08, "epoch": 0.9197033215091905, "percentage": 91.97, "elapsed_time": "1 day, 7:31:04", "remaining_time": "2:45:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9983, "total_steps": 10853, "loss": 0.1165, "learning_rate": 8.733452997232967e-08, "epoch": 0.9197954576864605, "percentage": 91.98, "elapsed_time": "1 day, 7:31:15", "remaining_time": "2:44:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9984, "total_steps": 10853, "loss": 0.1319, "learning_rate": 8.713505013664303e-08, "epoch": 0.9198875938637306, "percentage": 91.99, "elapsed_time": "1 day, 7:31:27", "remaining_time": "2:44:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9985, "total_steps": 10853, "loss": 0.1245, "learning_rate": 8.693579433572741e-08, "epoch": 0.9199797300410006, "percentage": 92.0, "elapsed_time": "1 day, 7:31:38", "remaining_time": "2:44:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9986, "total_steps": 10853, "loss": 0.1272, "learning_rate": 8.673676258808244e-08, "epoch": 0.9200718662182706, "percentage": 92.01, "elapsed_time": "1 day, 7:31:48", "remaining_time": "2:44:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9987, "total_steps": 10853, "loss": 0.105, "learning_rate": 8.653795491218891e-08, "epoch": 0.9201640023955406, "percentage": 92.02, "elapsed_time": "1 day, 7:31:59", "remaining_time": "2:44:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9988, "total_steps": 10853, "loss": 0.1134, "learning_rate": 8.633937132650593e-08, "epoch": 0.9202561385728106, "percentage": 92.03, "elapsed_time": "1 day, 7:32:12", "remaining_time": "2:43:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9989, "total_steps": 10853, "loss": 0.1193, "learning_rate": 8.614101184947238e-08, "epoch": 0.9203482747500806, "percentage": 92.04, "elapsed_time": "1 day, 7:32:23", "remaining_time": "2:43:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9990, "total_steps": 10853, "loss": 0.1097, "learning_rate": 8.594287649950544e-08, "epoch": 0.9204404109273506, "percentage": 92.05, "elapsed_time": "1 day, 7:32:34", "remaining_time": "2:43:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9991, "total_steps": 10853, "loss": 0.1103, "learning_rate": 8.574496529500209e-08, "epoch": 0.9205325471046206, "percentage": 92.06, "elapsed_time": "1 day, 7:32:45", "remaining_time": "2:43:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9992, "total_steps": 10853, "loss": 0.1192, "learning_rate": 8.554727825433872e-08, "epoch": 0.9206246832818906, "percentage": 92.07, "elapsed_time": "1 day, 7:32:56", "remaining_time": "2:43:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9993, "total_steps": 10853, "loss": 0.1158, "learning_rate": 8.53498153958704e-08, "epoch": 0.9207168194591606, "percentage": 92.08, "elapsed_time": "1 day, 7:33:07", "remaining_time": "2:42:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9994, "total_steps": 10853, "loss": 0.1144, "learning_rate": 8.515257673793159e-08, "epoch": 0.9208089556364306, "percentage": 92.09, "elapsed_time": "1 day, 7:33:19", "remaining_time": "2:42:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9995, "total_steps": 10853, "loss": 0.1202, "learning_rate": 8.4955562298836e-08, "epoch": 0.9209010918137006, "percentage": 92.09, "elapsed_time": "1 day, 7:33:30", "remaining_time": "2:42:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9996, "total_steps": 10853, "loss": 0.1071, "learning_rate": 8.475877209687594e-08, "epoch": 0.9209932279909706, "percentage": 92.1, "elapsed_time": "1 day, 7:33:42", "remaining_time": "2:42:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9997, "total_steps": 10853, "loss": 0.1209, "learning_rate": 8.456220615032429e-08, "epoch": 0.9210853641682406, "percentage": 92.11, "elapsed_time": "1 day, 7:33:53", "remaining_time": "2:42:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9998, "total_steps": 10853, "loss": 0.1226, "learning_rate": 8.436586447743172e-08, "epoch": 0.9211775003455107, "percentage": 92.12, "elapsed_time": "1 day, 7:34:05", "remaining_time": "2:41:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9999, "total_steps": 10853, "loss": 0.1157, "learning_rate": 8.416974709642839e-08, "epoch": 0.9212696365227807, "percentage": 92.13, "elapsed_time": "1 day, 7:34:15", "remaining_time": "2:41:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10000, "total_steps": 10853, "loss": 0.1117, "learning_rate": 8.397385402552415e-08, "epoch": 0.9213617727000507, "percentage": 92.14, "elapsed_time": "1 day, 7:34:24", "remaining_time": "2:41:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10000, "total_steps": 10853, "eval_loss": 0.11681114137172699, "epoch": 0.9213617727000507, "percentage": 92.14, "elapsed_time": "1 day, 7:39:25", "remaining_time": "2:42:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10001, "total_steps": 10853, "loss": 0.1116, "learning_rate": 8.377818528290754e-08, "epoch": 0.9214539088773207, "percentage": 92.15, "elapsed_time": "1 day, 7:39:35", "remaining_time": "2:41:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10002, "total_steps": 10853, "loss": 0.1208, "learning_rate": 8.358274088674651e-08, "epoch": 0.9215460450545907, "percentage": 92.16, "elapsed_time": "1 day, 7:39:46", "remaining_time": "2:41:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10003, "total_steps": 10853, "loss": 0.1114, "learning_rate": 8.338752085518819e-08, "epoch": 0.9216381812318607, "percentage": 92.17, "elapsed_time": "1 day, 7:39:57", "remaining_time": "2:41:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10004, "total_steps": 10853, "loss": 0.1073, "learning_rate": 8.31925252063584e-08, "epoch": 0.9217303174091307, "percentage": 92.18, "elapsed_time": "1 day, 7:40:08", "remaining_time": "2:41:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10005, "total_steps": 10853, "loss": 0.1133, "learning_rate": 8.299775395836262e-08, "epoch": 0.9218224535864007, "percentage": 92.19, "elapsed_time": "1 day, 7:40:20", "remaining_time": "2:41:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10006, "total_steps": 10853, "loss": 0.1163, "learning_rate": 8.280320712928585e-08, "epoch": 0.9219145897636707, "percentage": 92.2, "elapsed_time": "1 day, 7:40:32", "remaining_time": "2:40:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10007, "total_steps": 10853, "loss": 0.1158, "learning_rate": 8.260888473719114e-08, "epoch": 0.9220067259409407, "percentage": 92.2, "elapsed_time": "1 day, 7:40:42", "remaining_time": "2:40:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10008, "total_steps": 10853, "loss": 0.116, "learning_rate": 8.241478680012183e-08, "epoch": 0.9220988621182107, "percentage": 92.21, "elapsed_time": "1 day, 7:40:53", "remaining_time": "2:40:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10009, "total_steps": 10853, "loss": 0.1193, "learning_rate": 8.222091333609989e-08, "epoch": 0.9221909982954807, "percentage": 92.22, "elapsed_time": "1 day, 7:41:03", "remaining_time": "2:40:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10010, "total_steps": 10853, "loss": 0.1092, "learning_rate": 8.202726436312619e-08, "epoch": 0.9222831344727507, "percentage": 92.23, "elapsed_time": "1 day, 7:41:13", "remaining_time": "2:40:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10011, "total_steps": 10853, "loss": 0.1194, "learning_rate": 8.183383989918109e-08, "epoch": 0.9223752706500208, "percentage": 92.24, "elapsed_time": "1 day, 7:41:23", "remaining_time": "2:39:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10012, "total_steps": 10853, "loss": 0.12, "learning_rate": 8.164063996222438e-08, "epoch": 0.9224674068272908, "percentage": 92.25, "elapsed_time": "1 day, 7:41:35", "remaining_time": "2:39:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10013, "total_steps": 10853, "loss": 0.1137, "learning_rate": 8.14476645701942e-08, "epoch": 0.9225595430045608, "percentage": 92.26, "elapsed_time": "1 day, 7:41:46", "remaining_time": "2:39:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10014, "total_steps": 10853, "loss": 0.1155, "learning_rate": 8.125491374100902e-08, "epoch": 0.9226516791818308, "percentage": 92.27, "elapsed_time": "1 day, 7:41:56", "remaining_time": "2:39:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10015, "total_steps": 10853, "loss": 0.1185, "learning_rate": 8.106238749256562e-08, "epoch": 0.9227438153591008, "percentage": 92.28, "elapsed_time": "1 day, 7:42:06", "remaining_time": "2:39:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10016, "total_steps": 10853, "loss": 0.1193, "learning_rate": 8.087008584273942e-08, "epoch": 0.9228359515363708, "percentage": 92.29, "elapsed_time": "1 day, 7:42:16", "remaining_time": "2:38:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10017, "total_steps": 10853, "loss": 0.1079, "learning_rate": 8.067800880938615e-08, "epoch": 0.9229280877136408, "percentage": 92.3, "elapsed_time": "1 day, 7:42:28", "remaining_time": "2:38:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10018, "total_steps": 10853, "loss": 0.1118, "learning_rate": 8.048615641034013e-08, "epoch": 0.9230202238909108, "percentage": 92.31, "elapsed_time": "1 day, 7:42:37", "remaining_time": "2:38:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10019, "total_steps": 10853, "loss": 0.1182, "learning_rate": 8.029452866341492e-08, "epoch": 0.9231123600681808, "percentage": 92.32, "elapsed_time": "1 day, 7:42:49", "remaining_time": "2:38:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10020, "total_steps": 10853, "loss": 0.1062, "learning_rate": 8.010312558640348e-08, "epoch": 0.9232044962454508, "percentage": 92.32, "elapsed_time": "1 day, 7:43:01", "remaining_time": "2:38:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10021, "total_steps": 10853, "loss": 0.1207, "learning_rate": 7.991194719707663e-08, "epoch": 0.9232966324227208, "percentage": 92.33, "elapsed_time": "1 day, 7:43:12", "remaining_time": "2:38:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10022, "total_steps": 10853, "loss": 0.1263, "learning_rate": 7.972099351318624e-08, "epoch": 0.9233887685999908, "percentage": 92.34, "elapsed_time": "1 day, 7:43:22", "remaining_time": "2:37:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10023, "total_steps": 10853, "loss": 0.1171, "learning_rate": 7.953026455246233e-08, "epoch": 0.9234809047772607, "percentage": 92.35, "elapsed_time": "1 day, 7:43:33", "remaining_time": "2:37:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10024, "total_steps": 10853, "loss": 0.1118, "learning_rate": 7.933976033261348e-08, "epoch": 0.9235730409545307, "percentage": 92.36, "elapsed_time": "1 day, 7:43:43", "remaining_time": "2:37:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10025, "total_steps": 10853, "loss": 0.1221, "learning_rate": 7.914948087132862e-08, "epoch": 0.9236651771318009, "percentage": 92.37, "elapsed_time": "1 day, 7:43:54", "remaining_time": "2:37:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10026, "total_steps": 10853, "loss": 0.1164, "learning_rate": 7.895942618627472e-08, "epoch": 0.9237573133090708, "percentage": 92.38, "elapsed_time": "1 day, 7:44:04", "remaining_time": "2:37:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10027, "total_steps": 10853, "loss": 0.1168, "learning_rate": 7.876959629509907e-08, "epoch": 0.9238494494863408, "percentage": 92.39, "elapsed_time": "1 day, 7:44:14", "remaining_time": "2:36:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10028, "total_steps": 10853, "loss": 0.1153, "learning_rate": 7.85799912154267e-08, "epoch": 0.9239415856636108, "percentage": 92.4, "elapsed_time": "1 day, 7:44:25", "remaining_time": "2:36:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10029, "total_steps": 10853, "loss": 0.1043, "learning_rate": 7.839061096486273e-08, "epoch": 0.9240337218408808, "percentage": 92.41, "elapsed_time": "1 day, 7:44:36", "remaining_time": "2:36:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10030, "total_steps": 10853, "loss": 0.1252, "learning_rate": 7.82014555609914e-08, "epoch": 0.9241258580181508, "percentage": 92.42, "elapsed_time": "1 day, 7:44:47", "remaining_time": "2:36:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10031, "total_steps": 10853, "loss": 0.1076, "learning_rate": 7.801252502137535e-08, "epoch": 0.9242179941954208, "percentage": 92.43, "elapsed_time": "1 day, 7:44:58", "remaining_time": "2:36:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10032, "total_steps": 10853, "loss": 0.1244, "learning_rate": 7.782381936355693e-08, "epoch": 0.9243101303726908, "percentage": 92.44, "elapsed_time": "1 day, 7:45:09", "remaining_time": "2:35:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10033, "total_steps": 10853, "loss": 0.1219, "learning_rate": 7.763533860505767e-08, "epoch": 0.9244022665499608, "percentage": 92.44, "elapsed_time": "1 day, 7:45:19", "remaining_time": "2:35:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10034, "total_steps": 10853, "loss": 0.1115, "learning_rate": 7.744708276337776e-08, "epoch": 0.9244944027272308, "percentage": 92.45, "elapsed_time": "1 day, 7:45:29", "remaining_time": "2:35:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10035, "total_steps": 10853, "loss": 0.111, "learning_rate": 7.725905185599735e-08, "epoch": 0.9245865389045008, "percentage": 92.46, "elapsed_time": "1 day, 7:45:40", "remaining_time": "2:35:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10036, "total_steps": 10853, "loss": 0.1079, "learning_rate": 7.707124590037445e-08, "epoch": 0.9246786750817708, "percentage": 92.47, "elapsed_time": "1 day, 7:45:52", "remaining_time": "2:35:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10037, "total_steps": 10853, "loss": 0.1057, "learning_rate": 7.688366491394706e-08, "epoch": 0.9247708112590408, "percentage": 92.48, "elapsed_time": "1 day, 7:46:01", "remaining_time": "2:34:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10038, "total_steps": 10853, "loss": 0.1076, "learning_rate": 7.669630891413204e-08, "epoch": 0.9248629474363109, "percentage": 92.49, "elapsed_time": "1 day, 7:46:13", "remaining_time": "2:34:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10039, "total_steps": 10853, "loss": 0.108, "learning_rate": 7.650917791832608e-08, "epoch": 0.9249550836135809, "percentage": 92.5, "elapsed_time": "1 day, 7:46:25", "remaining_time": "2:34:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10040, "total_steps": 10853, "loss": 0.1187, "learning_rate": 7.632227194390301e-08, "epoch": 0.9250472197908509, "percentage": 92.51, "elapsed_time": "1 day, 7:46:34", "remaining_time": "2:34:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10041, "total_steps": 10853, "loss": 0.1087, "learning_rate": 7.613559100821843e-08, "epoch": 0.9251393559681209, "percentage": 92.52, "elapsed_time": "1 day, 7:46:45", "remaining_time": "2:34:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10042, "total_steps": 10853, "loss": 0.1131, "learning_rate": 7.594913512860485e-08, "epoch": 0.9252314921453909, "percentage": 92.53, "elapsed_time": "1 day, 7:46:56", "remaining_time": "2:34:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10043, "total_steps": 10853, "loss": 0.1129, "learning_rate": 7.57629043223751e-08, "epoch": 0.9253236283226609, "percentage": 92.54, "elapsed_time": "1 day, 7:47:07", "remaining_time": "2:33:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10044, "total_steps": 10853, "loss": 0.1123, "learning_rate": 7.557689860682032e-08, "epoch": 0.9254157644999309, "percentage": 92.55, "elapsed_time": "1 day, 7:47:18", "remaining_time": "2:33:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10045, "total_steps": 10853, "loss": 0.1235, "learning_rate": 7.539111799921145e-08, "epoch": 0.9255079006772009, "percentage": 92.56, "elapsed_time": "1 day, 7:47:29", "remaining_time": "2:33:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10046, "total_steps": 10853, "loss": 0.1157, "learning_rate": 7.520556251679856e-08, "epoch": 0.9256000368544709, "percentage": 92.56, "elapsed_time": "1 day, 7:47:40", "remaining_time": "2:33:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10047, "total_steps": 10853, "loss": 0.114, "learning_rate": 7.502023217680982e-08, "epoch": 0.9256921730317409, "percentage": 92.57, "elapsed_time": "1 day, 7:47:51", "remaining_time": "2:33:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10048, "total_steps": 10853, "loss": 0.1203, "learning_rate": 7.483512699645368e-08, "epoch": 0.9257843092090109, "percentage": 92.58, "elapsed_time": "1 day, 7:48:04", "remaining_time": "2:32:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10049, "total_steps": 10853, "loss": 0.1253, "learning_rate": 7.465024699291696e-08, "epoch": 0.9258764453862809, "percentage": 92.59, "elapsed_time": "1 day, 7:48:15", "remaining_time": "2:32:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10050, "total_steps": 10853, "loss": 0.1269, "learning_rate": 7.446559218336563e-08, "epoch": 0.9259685815635509, "percentage": 92.6, "elapsed_time": "1 day, 7:48:26", "remaining_time": "2:32:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10051, "total_steps": 10853, "loss": 0.1184, "learning_rate": 7.428116258494545e-08, "epoch": 0.9260607177408209, "percentage": 92.61, "elapsed_time": "1 day, 7:48:39", "remaining_time": "2:32:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10052, "total_steps": 10853, "loss": 0.117, "learning_rate": 7.409695821478046e-08, "epoch": 0.926152853918091, "percentage": 92.62, "elapsed_time": "1 day, 7:48:49", "remaining_time": "2:32:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10053, "total_steps": 10853, "loss": 0.117, "learning_rate": 7.391297908997341e-08, "epoch": 0.926244990095361, "percentage": 92.63, "elapsed_time": "1 day, 7:49:00", "remaining_time": "2:31:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10054, "total_steps": 10853, "loss": 0.1085, "learning_rate": 7.372922522760755e-08, "epoch": 0.926337126272631, "percentage": 92.64, "elapsed_time": "1 day, 7:49:11", "remaining_time": "2:31:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10055, "total_steps": 10853, "loss": 0.1202, "learning_rate": 7.354569664474426e-08, "epoch": 0.926429262449901, "percentage": 92.65, "elapsed_time": "1 day, 7:49:21", "remaining_time": "2:31:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10056, "total_steps": 10853, "loss": 0.1233, "learning_rate": 7.33623933584246e-08, "epoch": 0.926521398627171, "percentage": 92.66, "elapsed_time": "1 day, 7:49:32", "remaining_time": "2:31:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10057, "total_steps": 10853, "loss": 0.1249, "learning_rate": 7.317931538566747e-08, "epoch": 0.926613534804441, "percentage": 92.67, "elapsed_time": "1 day, 7:49:44", "remaining_time": "2:31:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10058, "total_steps": 10853, "loss": 0.1226, "learning_rate": 7.299646274347205e-08, "epoch": 0.926705670981711, "percentage": 92.67, "elapsed_time": "1 day, 7:49:55", "remaining_time": "2:30:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10059, "total_steps": 10853, "loss": 0.1245, "learning_rate": 7.281383544881642e-08, "epoch": 0.926797807158981, "percentage": 92.68, "elapsed_time": "1 day, 7:50:06", "remaining_time": "2:30:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10060, "total_steps": 10853, "loss": 0.1312, "learning_rate": 7.263143351865759e-08, "epoch": 0.926889943336251, "percentage": 92.69, "elapsed_time": "1 day, 7:50:18", "remaining_time": "2:30:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10061, "total_steps": 10853, "loss": 0.1208, "learning_rate": 7.244925696993088e-08, "epoch": 0.926982079513521, "percentage": 92.7, "elapsed_time": "1 day, 7:50:29", "remaining_time": "2:30:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10062, "total_steps": 10853, "loss": 0.1289, "learning_rate": 7.226730581955249e-08, "epoch": 0.927074215690791, "percentage": 92.71, "elapsed_time": "1 day, 7:50:40", "remaining_time": "2:30:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10063, "total_steps": 10853, "loss": 0.1232, "learning_rate": 7.208558008441557e-08, "epoch": 0.927166351868061, "percentage": 92.72, "elapsed_time": "1 day, 7:50:52", "remaining_time": "2:30:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10064, "total_steps": 10853, "loss": 0.1098, "learning_rate": 7.190407978139413e-08, "epoch": 0.927258488045331, "percentage": 92.73, "elapsed_time": "1 day, 7:51:02", "remaining_time": "2:29:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10065, "total_steps": 10853, "loss": 0.1188, "learning_rate": 7.172280492733996e-08, "epoch": 0.927350624222601, "percentage": 92.74, "elapsed_time": "1 day, 7:51:13", "remaining_time": "2:29:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10066, "total_steps": 10853, "loss": 0.1243, "learning_rate": 7.15417555390846e-08, "epoch": 0.9274427603998711, "percentage": 92.75, "elapsed_time": "1 day, 7:51:23", "remaining_time": "2:29:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10067, "total_steps": 10853, "loss": 0.1197, "learning_rate": 7.136093163343877e-08, "epoch": 0.927534896577141, "percentage": 92.76, "elapsed_time": "1 day, 7:51:35", "remaining_time": "2:29:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10068, "total_steps": 10853, "loss": 0.1086, "learning_rate": 7.118033322719209e-08, "epoch": 0.927627032754411, "percentage": 92.77, "elapsed_time": "1 day, 7:51:45", "remaining_time": "2:29:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10069, "total_steps": 10853, "loss": 0.1215, "learning_rate": 7.099996033711254e-08, "epoch": 0.927719168931681, "percentage": 92.78, "elapsed_time": "1 day, 7:51:57", "remaining_time": "2:28:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10070, "total_steps": 10853, "loss": 0.1098, "learning_rate": 7.081981297994784e-08, "epoch": 0.927811305108951, "percentage": 92.79, "elapsed_time": "1 day, 7:52:06", "remaining_time": "2:28:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10071, "total_steps": 10853, "loss": 0.1197, "learning_rate": 7.063989117242514e-08, "epoch": 0.927903441286221, "percentage": 92.79, "elapsed_time": "1 day, 7:52:16", "remaining_time": "2:28:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10072, "total_steps": 10853, "loss": 0.1078, "learning_rate": 7.046019493125028e-08, "epoch": 0.927995577463491, "percentage": 92.8, "elapsed_time": "1 day, 7:52:26", "remaining_time": "2:28:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10073, "total_steps": 10853, "loss": 0.1216, "learning_rate": 7.028072427310767e-08, "epoch": 0.928087713640761, "percentage": 92.81, "elapsed_time": "1 day, 7:52:36", "remaining_time": "2:28:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10074, "total_steps": 10853, "loss": 0.1143, "learning_rate": 7.010147921466121e-08, "epoch": 0.928179849818031, "percentage": 92.82, "elapsed_time": "1 day, 7:52:47", "remaining_time": "2:27:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10075, "total_steps": 10853, "loss": 0.1201, "learning_rate": 6.992245977255369e-08, "epoch": 0.928271985995301, "percentage": 92.83, "elapsed_time": "1 day, 7:53:00", "remaining_time": "2:27:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10076, "total_steps": 10853, "loss": 0.1263, "learning_rate": 6.974366596340765e-08, "epoch": 0.928364122172571, "percentage": 92.84, "elapsed_time": "1 day, 7:53:11", "remaining_time": "2:27:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10077, "total_steps": 10853, "loss": 0.1206, "learning_rate": 6.95650978038237e-08, "epoch": 0.928456258349841, "percentage": 92.85, "elapsed_time": "1 day, 7:53:22", "remaining_time": "2:27:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10078, "total_steps": 10853, "loss": 0.1152, "learning_rate": 6.93867553103822e-08, "epoch": 0.928548394527111, "percentage": 92.86, "elapsed_time": "1 day, 7:53:33", "remaining_time": "2:27:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10079, "total_steps": 10853, "loss": 0.1242, "learning_rate": 6.920863849964154e-08, "epoch": 0.9286405307043811, "percentage": 92.87, "elapsed_time": "1 day, 7:53:45", "remaining_time": "2:26:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10080, "total_steps": 10853, "loss": 0.1256, "learning_rate": 6.903074738814047e-08, "epoch": 0.9287326668816511, "percentage": 92.88, "elapsed_time": "1 day, 7:53:56", "remaining_time": "2:26:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10081, "total_steps": 10853, "loss": 0.1183, "learning_rate": 6.88530819923966e-08, "epoch": 0.9288248030589211, "percentage": 92.89, "elapsed_time": "1 day, 7:54:05", "remaining_time": "2:26:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10082, "total_steps": 10853, "loss": 0.1297, "learning_rate": 6.867564232890534e-08, "epoch": 0.9289169392361911, "percentage": 92.9, "elapsed_time": "1 day, 7:54:18", "remaining_time": "2:26:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10083, "total_steps": 10853, "loss": 0.1128, "learning_rate": 6.849842841414239e-08, "epoch": 0.9290090754134611, "percentage": 92.91, "elapsed_time": "1 day, 7:54:28", "remaining_time": "2:26:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10084, "total_steps": 10853, "loss": 0.1116, "learning_rate": 6.832144026456211e-08, "epoch": 0.9291012115907311, "percentage": 92.91, "elapsed_time": "1 day, 7:54:40", "remaining_time": "2:26:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10085, "total_steps": 10853, "loss": 0.118, "learning_rate": 6.8144677896598e-08, "epoch": 0.9291933477680011, "percentage": 92.92, "elapsed_time": "1 day, 7:54:51", "remaining_time": "2:25:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10086, "total_steps": 10853, "loss": 0.1133, "learning_rate": 6.796814132666196e-08, "epoch": 0.9292854839452711, "percentage": 92.93, "elapsed_time": "1 day, 7:55:01", "remaining_time": "2:25:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10087, "total_steps": 10853, "loss": 0.1161, "learning_rate": 6.779183057114585e-08, "epoch": 0.9293776201225411, "percentage": 92.94, "elapsed_time": "1 day, 7:55:10", "remaining_time": "2:25:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10088, "total_steps": 10853, "loss": 0.1207, "learning_rate": 6.761574564641993e-08, "epoch": 0.9294697562998111, "percentage": 92.95, "elapsed_time": "1 day, 7:55:22", "remaining_time": "2:25:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10089, "total_steps": 10853, "loss": 0.1209, "learning_rate": 6.743988656883388e-08, "epoch": 0.9295618924770811, "percentage": 92.96, "elapsed_time": "1 day, 7:55:33", "remaining_time": "2:25:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10090, "total_steps": 10853, "loss": 0.1173, "learning_rate": 6.726425335471632e-08, "epoch": 0.9296540286543511, "percentage": 92.97, "elapsed_time": "1 day, 7:55:45", "remaining_time": "2:24:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10091, "total_steps": 10853, "loss": 0.1112, "learning_rate": 6.708884602037446e-08, "epoch": 0.9297461648316211, "percentage": 92.98, "elapsed_time": "1 day, 7:55:55", "remaining_time": "2:24:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10092, "total_steps": 10853, "loss": 0.1244, "learning_rate": 6.691366458209503e-08, "epoch": 0.9298383010088911, "percentage": 92.99, "elapsed_time": "1 day, 7:56:06", "remaining_time": "2:24:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10093, "total_steps": 10853, "loss": 0.1152, "learning_rate": 6.673870905614387e-08, "epoch": 0.9299304371861612, "percentage": 93.0, "elapsed_time": "1 day, 7:56:17", "remaining_time": "2:24:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10094, "total_steps": 10853, "loss": 0.1192, "learning_rate": 6.656397945876525e-08, "epoch": 0.9300225733634312, "percentage": 93.01, "elapsed_time": "1 day, 7:56:25", "remaining_time": "2:24:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10095, "total_steps": 10853, "loss": 0.1152, "learning_rate": 6.638947580618338e-08, "epoch": 0.9301147095407012, "percentage": 93.02, "elapsed_time": "1 day, 7:56:37", "remaining_time": "2:23:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10096, "total_steps": 10853, "loss": 0.1184, "learning_rate": 6.621519811460003e-08, "epoch": 0.9302068457179712, "percentage": 93.02, "elapsed_time": "1 day, 7:56:47", "remaining_time": "2:23:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10097, "total_steps": 10853, "loss": 0.1102, "learning_rate": 6.60411464001981e-08, "epoch": 0.9302989818952412, "percentage": 93.03, "elapsed_time": "1 day, 7:56:58", "remaining_time": "2:23:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10098, "total_steps": 10853, "loss": 0.1119, "learning_rate": 6.586732067913715e-08, "epoch": 0.9303911180725112, "percentage": 93.04, "elapsed_time": "1 day, 7:57:08", "remaining_time": "2:23:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10099, "total_steps": 10853, "loss": 0.1234, "learning_rate": 6.56937209675576e-08, "epoch": 0.9304832542497812, "percentage": 93.05, "elapsed_time": "1 day, 7:57:20", "remaining_time": "2:23:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10100, "total_steps": 10853, "loss": 0.1198, "learning_rate": 6.552034728157824e-08, "epoch": 0.9305753904270512, "percentage": 93.06, "elapsed_time": "1 day, 7:57:30", "remaining_time": "2:22:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10101, "total_steps": 10853, "loss": 0.1124, "learning_rate": 6.534719963729646e-08, "epoch": 0.9306675266043212, "percentage": 93.07, "elapsed_time": "1 day, 7:57:40", "remaining_time": "2:22:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10102, "total_steps": 10853, "loss": 0.1198, "learning_rate": 6.517427805078913e-08, "epoch": 0.9307596627815912, "percentage": 93.08, "elapsed_time": "1 day, 7:57:51", "remaining_time": "2:22:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10103, "total_steps": 10853, "loss": 0.0994, "learning_rate": 6.500158253811228e-08, "epoch": 0.9308517989588612, "percentage": 93.09, "elapsed_time": "1 day, 7:58:02", "remaining_time": "2:22:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10104, "total_steps": 10853, "loss": 0.1136, "learning_rate": 6.482911311530033e-08, "epoch": 0.9309439351361312, "percentage": 93.1, "elapsed_time": "1 day, 7:58:12", "remaining_time": "2:22:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10105, "total_steps": 10853, "loss": 0.1036, "learning_rate": 6.465686979836766e-08, "epoch": 0.9310360713134012, "percentage": 93.11, "elapsed_time": "1 day, 7:58:22", "remaining_time": "2:22:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10106, "total_steps": 10853, "loss": 0.1159, "learning_rate": 6.44848526033065e-08, "epoch": 0.9311282074906713, "percentage": 93.12, "elapsed_time": "1 day, 7:58:33", "remaining_time": "2:21:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10107, "total_steps": 10853, "loss": 0.1105, "learning_rate": 6.43130615460888e-08, "epoch": 0.9312203436679413, "percentage": 93.13, "elapsed_time": "1 day, 7:58:43", "remaining_time": "2:21:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10108, "total_steps": 10853, "loss": 0.1284, "learning_rate": 6.41414966426654e-08, "epoch": 0.9313124798452113, "percentage": 93.14, "elapsed_time": "1 day, 7:58:54", "remaining_time": "2:21:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10109, "total_steps": 10853, "loss": 0.1205, "learning_rate": 6.397015790896633e-08, "epoch": 0.9314046160224813, "percentage": 93.14, "elapsed_time": "1 day, 7:59:04", "remaining_time": "2:21:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10110, "total_steps": 10853, "loss": 0.1076, "learning_rate": 6.379904536090053e-08, "epoch": 0.9314967521997513, "percentage": 93.15, "elapsed_time": "1 day, 7:59:15", "remaining_time": "2:21:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10111, "total_steps": 10853, "loss": 0.1098, "learning_rate": 6.362815901435532e-08, "epoch": 0.9315888883770213, "percentage": 93.16, "elapsed_time": "1 day, 7:59:26", "remaining_time": "2:20:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10112, "total_steps": 10853, "loss": 0.1224, "learning_rate": 6.34574988851977e-08, "epoch": 0.9316810245542912, "percentage": 93.17, "elapsed_time": "1 day, 7:59:38", "remaining_time": "2:20:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10113, "total_steps": 10853, "loss": 0.117, "learning_rate": 6.328706498927361e-08, "epoch": 0.9317731607315612, "percentage": 93.18, "elapsed_time": "1 day, 7:59:47", "remaining_time": "2:20:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10114, "total_steps": 10853, "loss": 0.1074, "learning_rate": 6.311685734240791e-08, "epoch": 0.9318652969088312, "percentage": 93.19, "elapsed_time": "1 day, 7:59:58", "remaining_time": "2:20:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10115, "total_steps": 10853, "loss": 0.119, "learning_rate": 6.294687596040406e-08, "epoch": 0.9319574330861012, "percentage": 93.2, "elapsed_time": "1 day, 8:00:08", "remaining_time": "2:20:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10116, "total_steps": 10853, "loss": 0.1014, "learning_rate": 6.277712085904524e-08, "epoch": 0.9320495692633712, "percentage": 93.21, "elapsed_time": "1 day, 8:00:18", "remaining_time": "2:19:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10117, "total_steps": 10853, "loss": 0.134, "learning_rate": 6.260759205409278e-08, "epoch": 0.9321417054406412, "percentage": 93.22, "elapsed_time": "1 day, 8:00:30", "remaining_time": "2:19:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10118, "total_steps": 10853, "loss": 0.1008, "learning_rate": 6.243828956128794e-08, "epoch": 0.9322338416179112, "percentage": 93.23, "elapsed_time": "1 day, 8:00:41", "remaining_time": "2:19:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10119, "total_steps": 10853, "loss": 0.1025, "learning_rate": 6.226921339635012e-08, "epoch": 0.9323259777951812, "percentage": 93.24, "elapsed_time": "1 day, 8:00:52", "remaining_time": "2:19:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10120, "total_steps": 10853, "loss": 0.1259, "learning_rate": 6.210036357497811e-08, "epoch": 0.9324181139724513, "percentage": 93.25, "elapsed_time": "1 day, 8:01:03", "remaining_time": "2:19:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10121, "total_steps": 10853, "loss": 0.1199, "learning_rate": 6.193174011284997e-08, "epoch": 0.9325102501497213, "percentage": 93.26, "elapsed_time": "1 day, 8:01:12", "remaining_time": "2:18:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10122, "total_steps": 10853, "loss": 0.1029, "learning_rate": 6.176334302562204e-08, "epoch": 0.9326023863269913, "percentage": 93.26, "elapsed_time": "1 day, 8:01:23", "remaining_time": "2:18:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10123, "total_steps": 10853, "loss": 0.121, "learning_rate": 6.159517232893014e-08, "epoch": 0.9326945225042613, "percentage": 93.27, "elapsed_time": "1 day, 8:01:35", "remaining_time": "2:18:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10124, "total_steps": 10853, "loss": 0.124, "learning_rate": 6.142722803838874e-08, "epoch": 0.9327866586815313, "percentage": 93.28, "elapsed_time": "1 day, 8:01:46", "remaining_time": "2:18:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10125, "total_steps": 10853, "loss": 0.1247, "learning_rate": 6.125951016959175e-08, "epoch": 0.9328787948588013, "percentage": 93.29, "elapsed_time": "1 day, 8:01:56", "remaining_time": "2:18:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10126, "total_steps": 10853, "loss": 0.1254, "learning_rate": 6.109201873811171e-08, "epoch": 0.9329709310360713, "percentage": 93.3, "elapsed_time": "1 day, 8:02:07", "remaining_time": "2:17:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10127, "total_steps": 10853, "loss": 0.1058, "learning_rate": 6.092475375950035e-08, "epoch": 0.9330630672133413, "percentage": 93.31, "elapsed_time": "1 day, 8:02:17", "remaining_time": "2:17:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10128, "total_steps": 10853, "loss": 0.1118, "learning_rate": 6.075771524928804e-08, "epoch": 0.9331552033906113, "percentage": 93.32, "elapsed_time": "1 day, 8:02:28", "remaining_time": "2:17:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10129, "total_steps": 10853, "loss": 0.1099, "learning_rate": 6.0590903222984e-08, "epoch": 0.9332473395678813, "percentage": 93.33, "elapsed_time": "1 day, 8:02:39", "remaining_time": "2:17:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10130, "total_steps": 10853, "loss": 0.0987, "learning_rate": 6.042431769607782e-08, "epoch": 0.9333394757451513, "percentage": 93.34, "elapsed_time": "1 day, 8:02:49", "remaining_time": "2:17:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10131, "total_steps": 10853, "loss": 0.1221, "learning_rate": 6.025795868403573e-08, "epoch": 0.9334316119224213, "percentage": 93.35, "elapsed_time": "1 day, 8:03:00", "remaining_time": "2:17:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10132, "total_steps": 10853, "loss": 0.1153, "learning_rate": 6.009182620230508e-08, "epoch": 0.9335237480996913, "percentage": 93.36, "elapsed_time": "1 day, 8:03:10", "remaining_time": "2:16:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10133, "total_steps": 10853, "loss": 0.1064, "learning_rate": 5.992592026631078e-08, "epoch": 0.9336158842769613, "percentage": 93.37, "elapsed_time": "1 day, 8:03:21", "remaining_time": "2:16:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10134, "total_steps": 10853, "loss": 0.1137, "learning_rate": 5.976024089145715e-08, "epoch": 0.9337080204542314, "percentage": 93.38, "elapsed_time": "1 day, 8:03:33", "remaining_time": "2:16:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10135, "total_steps": 10853, "loss": 0.118, "learning_rate": 5.95947880931283e-08, "epoch": 0.9338001566315014, "percentage": 93.38, "elapsed_time": "1 day, 8:03:43", "remaining_time": "2:16:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10136, "total_steps": 10853, "loss": 0.1296, "learning_rate": 5.942956188668553e-08, "epoch": 0.9338922928087714, "percentage": 93.39, "elapsed_time": "1 day, 8:03:54", "remaining_time": "2:16:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10137, "total_steps": 10853, "loss": 0.1276, "learning_rate": 5.926456228747102e-08, "epoch": 0.9339844289860414, "percentage": 93.4, "elapsed_time": "1 day, 8:04:04", "remaining_time": "2:15:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10138, "total_steps": 10853, "loss": 0.1115, "learning_rate": 5.909978931080418e-08, "epoch": 0.9340765651633114, "percentage": 93.41, "elapsed_time": "1 day, 8:04:15", "remaining_time": "2:15:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10139, "total_steps": 10853, "loss": 0.1173, "learning_rate": 5.8935242971984993e-08, "epoch": 0.9341687013405814, "percentage": 93.42, "elapsed_time": "1 day, 8:04:26", "remaining_time": "2:15:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10140, "total_steps": 10853, "loss": 0.1201, "learning_rate": 5.877092328629097e-08, "epoch": 0.9342608375178514, "percentage": 93.43, "elapsed_time": "1 day, 8:04:37", "remaining_time": "2:15:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10141, "total_steps": 10853, "loss": 0.1115, "learning_rate": 5.8606830268979344e-08, "epoch": 0.9343529736951214, "percentage": 93.44, "elapsed_time": "1 day, 8:04:49", "remaining_time": "2:15:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10142, "total_steps": 10853, "loss": 0.1194, "learning_rate": 5.8442963935286535e-08, "epoch": 0.9344451098723914, "percentage": 93.45, "elapsed_time": "1 day, 8:05:00", "remaining_time": "2:14:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10143, "total_steps": 10853, "loss": 0.1087, "learning_rate": 5.827932430042732e-08, "epoch": 0.9345372460496614, "percentage": 93.46, "elapsed_time": "1 day, 8:05:09", "remaining_time": "2:14:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10144, "total_steps": 10853, "loss": 0.1187, "learning_rate": 5.811591137959538e-08, "epoch": 0.9346293822269314, "percentage": 93.47, "elapsed_time": "1 day, 8:05:19", "remaining_time": "2:14:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10145, "total_steps": 10853, "loss": 0.1108, "learning_rate": 5.7952725187963855e-08, "epoch": 0.9347215184042014, "percentage": 93.48, "elapsed_time": "1 day, 8:05:29", "remaining_time": "2:14:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10146, "total_steps": 10853, "loss": 0.1212, "learning_rate": 5.778976574068451e-08, "epoch": 0.9348136545814714, "percentage": 93.49, "elapsed_time": "1 day, 8:05:38", "remaining_time": "2:14:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10147, "total_steps": 10853, "loss": 0.1154, "learning_rate": 5.762703305288858e-08, "epoch": 0.9349057907587415, "percentage": 93.49, "elapsed_time": "1 day, 8:05:50", "remaining_time": "2:13:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10148, "total_steps": 10853, "loss": 0.1232, "learning_rate": 5.746452713968564e-08, "epoch": 0.9349979269360115, "percentage": 93.5, "elapsed_time": "1 day, 8:06:01", "remaining_time": "2:13:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10149, "total_steps": 10853, "loss": 0.1175, "learning_rate": 5.730224801616391e-08, "epoch": 0.9350900631132815, "percentage": 93.51, "elapsed_time": "1 day, 8:06:12", "remaining_time": "2:13:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10150, "total_steps": 10853, "loss": 0.1115, "learning_rate": 5.714019569739132e-08, "epoch": 0.9351821992905515, "percentage": 93.52, "elapsed_time": "1 day, 8:06:22", "remaining_time": "2:13:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10151, "total_steps": 10853, "loss": 0.125, "learning_rate": 5.697837019841446e-08, "epoch": 0.9352743354678215, "percentage": 93.53, "elapsed_time": "1 day, 8:06:32", "remaining_time": "2:13:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10152, "total_steps": 10853, "loss": 0.1196, "learning_rate": 5.6816771534258794e-08, "epoch": 0.9353664716450915, "percentage": 93.54, "elapsed_time": "1 day, 8:06:43", "remaining_time": "2:13:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10153, "total_steps": 10853, "loss": 0.1149, "learning_rate": 5.6655399719929286e-08, "epoch": 0.9354586078223615, "percentage": 93.55, "elapsed_time": "1 day, 8:06:55", "remaining_time": "2:12:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10154, "total_steps": 10853, "loss": 0.1107, "learning_rate": 5.649425477040837e-08, "epoch": 0.9355507439996315, "percentage": 93.56, "elapsed_time": "1 day, 8:07:06", "remaining_time": "2:12:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10155, "total_steps": 10853, "loss": 0.1259, "learning_rate": 5.63333367006591e-08, "epoch": 0.9356428801769014, "percentage": 93.57, "elapsed_time": "1 day, 8:07:17", "remaining_time": "2:12:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10156, "total_steps": 10853, "loss": 0.1262, "learning_rate": 5.617264552562229e-08, "epoch": 0.9357350163541714, "percentage": 93.58, "elapsed_time": "1 day, 8:07:29", "remaining_time": "2:12:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10157, "total_steps": 10853, "loss": 0.1219, "learning_rate": 5.6012181260218514e-08, "epoch": 0.9358271525314414, "percentage": 93.59, "elapsed_time": "1 day, 8:07:39", "remaining_time": "2:12:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10158, "total_steps": 10853, "loss": 0.1155, "learning_rate": 5.5851943919346394e-08, "epoch": 0.9359192887087114, "percentage": 93.6, "elapsed_time": "1 day, 8:07:49", "remaining_time": "2:11:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10159, "total_steps": 10853, "loss": 0.1258, "learning_rate": 5.569193351788516e-08, "epoch": 0.9360114248859814, "percentage": 93.61, "elapsed_time": "1 day, 8:07:59", "remaining_time": "2:11:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10160, "total_steps": 10853, "loss": 0.1144, "learning_rate": 5.5532150070690404e-08, "epoch": 0.9361035610632514, "percentage": 93.61, "elapsed_time": "1 day, 8:08:11", "remaining_time": "2:11:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10161, "total_steps": 10853, "loss": 0.1239, "learning_rate": 5.5372593592598333e-08, "epoch": 0.9361956972405215, "percentage": 93.62, "elapsed_time": "1 day, 8:08:22", "remaining_time": "2:11:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10162, "total_steps": 10853, "loss": 0.1072, "learning_rate": 5.521326409842431e-08, "epoch": 0.9362878334177915, "percentage": 93.63, "elapsed_time": "1 day, 8:08:34", "remaining_time": "2:11:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10163, "total_steps": 10853, "loss": 0.1128, "learning_rate": 5.5054161602961786e-08, "epoch": 0.9363799695950615, "percentage": 93.64, "elapsed_time": "1 day, 8:08:44", "remaining_time": "2:10:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10164, "total_steps": 10853, "loss": 0.1104, "learning_rate": 5.489528612098366e-08, "epoch": 0.9364721057723315, "percentage": 93.65, "elapsed_time": "1 day, 8:08:53", "remaining_time": "2:10:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10165, "total_steps": 10853, "loss": 0.1188, "learning_rate": 5.4736637667241465e-08, "epoch": 0.9365642419496015, "percentage": 93.66, "elapsed_time": "1 day, 8:09:05", "remaining_time": "2:10:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10166, "total_steps": 10853, "loss": 0.121, "learning_rate": 5.457821625646537e-08, "epoch": 0.9366563781268715, "percentage": 93.67, "elapsed_time": "1 day, 8:09:16", "remaining_time": "2:10:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10167, "total_steps": 10853, "loss": 0.1255, "learning_rate": 5.442002190336498e-08, "epoch": 0.9367485143041415, "percentage": 93.68, "elapsed_time": "1 day, 8:09:28", "remaining_time": "2:10:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10168, "total_steps": 10853, "loss": 0.1363, "learning_rate": 5.426205462262884e-08, "epoch": 0.9368406504814115, "percentage": 93.69, "elapsed_time": "1 day, 8:09:40", "remaining_time": "2:09:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10169, "total_steps": 10853, "loss": 0.1318, "learning_rate": 5.410431442892411e-08, "epoch": 0.9369327866586815, "percentage": 93.7, "elapsed_time": "1 day, 8:09:52", "remaining_time": "2:09:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10170, "total_steps": 10853, "loss": 0.1152, "learning_rate": 5.3946801336897395e-08, "epoch": 0.9370249228359515, "percentage": 93.71, "elapsed_time": "1 day, 8:10:02", "remaining_time": "2:09:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10171, "total_steps": 10853, "loss": 0.1161, "learning_rate": 5.37895153611731e-08, "epoch": 0.9371170590132215, "percentage": 93.72, "elapsed_time": "1 day, 8:10:14", "remaining_time": "2:09:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10172, "total_steps": 10853, "loss": 0.1163, "learning_rate": 5.363245651635568e-08, "epoch": 0.9372091951904915, "percentage": 93.73, "elapsed_time": "1 day, 8:10:25", "remaining_time": "2:09:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10173, "total_steps": 10853, "loss": 0.1221, "learning_rate": 5.3475624817027614e-08, "epoch": 0.9373013313677615, "percentage": 93.73, "elapsed_time": "1 day, 8:10:35", "remaining_time": "2:09:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10174, "total_steps": 10853, "loss": 0.1226, "learning_rate": 5.331902027775143e-08, "epoch": 0.9373934675450316, "percentage": 93.74, "elapsed_time": "1 day, 8:10:46", "remaining_time": "2:08:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10175, "total_steps": 10853, "loss": 0.1171, "learning_rate": 5.316264291306744e-08, "epoch": 0.9374856037223016, "percentage": 93.75, "elapsed_time": "1 day, 8:10:57", "remaining_time": "2:08:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10176, "total_steps": 10853, "loss": 0.1196, "learning_rate": 5.300649273749542e-08, "epoch": 0.9375777398995716, "percentage": 93.76, "elapsed_time": "1 day, 8:11:08", "remaining_time": "2:08:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10177, "total_steps": 10853, "loss": 0.1175, "learning_rate": 5.2850569765533766e-08, "epoch": 0.9376698760768416, "percentage": 93.77, "elapsed_time": "1 day, 8:11:19", "remaining_time": "2:08:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10178, "total_steps": 10853, "loss": 0.1195, "learning_rate": 5.2694874011660066e-08, "epoch": 0.9377620122541116, "percentage": 93.78, "elapsed_time": "1 day, 8:11:30", "remaining_time": "2:08:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10179, "total_steps": 10853, "loss": 0.1064, "learning_rate": 5.253940549033082e-08, "epoch": 0.9378541484313816, "percentage": 93.79, "elapsed_time": "1 day, 8:11:40", "remaining_time": "2:07:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10180, "total_steps": 10853, "loss": 0.1188, "learning_rate": 5.238416421598142e-08, "epoch": 0.9379462846086516, "percentage": 93.8, "elapsed_time": "1 day, 8:11:52", "remaining_time": "2:07:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10181, "total_steps": 10853, "loss": 0.117, "learning_rate": 5.2229150203025604e-08, "epoch": 0.9380384207859216, "percentage": 93.81, "elapsed_time": "1 day, 8:12:02", "remaining_time": "2:07:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10182, "total_steps": 10853, "loss": 0.1138, "learning_rate": 5.2074363465856316e-08, "epoch": 0.9381305569631916, "percentage": 93.82, "elapsed_time": "1 day, 8:12:13", "remaining_time": "2:07:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10183, "total_steps": 10853, "loss": 0.1181, "learning_rate": 5.191980401884594e-08, "epoch": 0.9382226931404616, "percentage": 93.83, "elapsed_time": "1 day, 8:12:23", "remaining_time": "2:07:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10184, "total_steps": 10853, "loss": 0.1173, "learning_rate": 5.176547187634551e-08, "epoch": 0.9383148293177316, "percentage": 93.84, "elapsed_time": "1 day, 8:12:36", "remaining_time": "2:06:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10185, "total_steps": 10853, "loss": 0.1197, "learning_rate": 5.161136705268438e-08, "epoch": 0.9384069654950016, "percentage": 93.85, "elapsed_time": "1 day, 8:12:47", "remaining_time": "2:06:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10186, "total_steps": 10853, "loss": 0.1186, "learning_rate": 5.145748956217139e-08, "epoch": 0.9384991016722716, "percentage": 93.85, "elapsed_time": "1 day, 8:12:58", "remaining_time": "2:06:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10187, "total_steps": 10853, "loss": 0.1077, "learning_rate": 5.130383941909372e-08, "epoch": 0.9385912378495416, "percentage": 93.86, "elapsed_time": "1 day, 8:13:12", "remaining_time": "2:06:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10188, "total_steps": 10853, "loss": 0.1071, "learning_rate": 5.1150416637718306e-08, "epoch": 0.9386833740268117, "percentage": 93.87, "elapsed_time": "1 day, 8:13:23", "remaining_time": "2:06:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10189, "total_steps": 10853, "loss": 0.1182, "learning_rate": 5.0997221232290115e-08, "epoch": 0.9387755102040817, "percentage": 93.88, "elapsed_time": "1 day, 8:13:34", "remaining_time": "2:06:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10190, "total_steps": 10853, "loss": 0.1253, "learning_rate": 5.0844253217033624e-08, "epoch": 0.9388676463813517, "percentage": 93.89, "elapsed_time": "1 day, 8:13:45", "remaining_time": "2:05:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10191, "total_steps": 10853, "loss": 0.1107, "learning_rate": 5.06915126061519e-08, "epoch": 0.9389597825586217, "percentage": 93.9, "elapsed_time": "1 day, 8:13:56", "remaining_time": "2:05:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10192, "total_steps": 10853, "loss": 0.1178, "learning_rate": 5.0538999413826393e-08, "epoch": 0.9390519187358917, "percentage": 93.91, "elapsed_time": "1 day, 8:14:08", "remaining_time": "2:05:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10193, "total_steps": 10853, "loss": 0.1308, "learning_rate": 5.0386713654218825e-08, "epoch": 0.9391440549131617, "percentage": 93.92, "elapsed_time": "1 day, 8:14:19", "remaining_time": "2:05:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10194, "total_steps": 10853, "loss": 0.1214, "learning_rate": 5.023465534146843e-08, "epoch": 0.9392361910904317, "percentage": 93.93, "elapsed_time": "1 day, 8:14:32", "remaining_time": "2:05:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10195, "total_steps": 10853, "loss": 0.1084, "learning_rate": 5.008282448969393e-08, "epoch": 0.9393283272677017, "percentage": 93.94, "elapsed_time": "1 day, 8:14:42", "remaining_time": "2:04:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10196, "total_steps": 10853, "loss": 0.1198, "learning_rate": 4.9931221112992924e-08, "epoch": 0.9394204634449717, "percentage": 93.95, "elapsed_time": "1 day, 8:14:54", "remaining_time": "2:04:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10197, "total_steps": 10853, "loss": 0.1091, "learning_rate": 4.977984522544166e-08, "epoch": 0.9395125996222417, "percentage": 93.96, "elapsed_time": "1 day, 8:15:05", "remaining_time": "2:04:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10198, "total_steps": 10853, "loss": 0.1097, "learning_rate": 4.962869684109528e-08, "epoch": 0.9396047357995116, "percentage": 93.96, "elapsed_time": "1 day, 8:15:15", "remaining_time": "2:04:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10199, "total_steps": 10853, "loss": 0.1145, "learning_rate": 4.947777597398812e-08, "epoch": 0.9396968719767816, "percentage": 93.97, "elapsed_time": "1 day, 8:15:26", "remaining_time": "2:04:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10200, "total_steps": 10853, "loss": 0.1114, "learning_rate": 4.932708263813341e-08, "epoch": 0.9397890081540516, "percentage": 93.98, "elapsed_time": "1 day, 8:15:38", "remaining_time": "2:03:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10201, "total_steps": 10853, "loss": 0.1214, "learning_rate": 4.917661684752273e-08, "epoch": 0.9398811443313216, "percentage": 93.99, "elapsed_time": "1 day, 8:15:48", "remaining_time": "2:03:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10202, "total_steps": 10853, "loss": 0.118, "learning_rate": 4.9026378616127133e-08, "epoch": 0.9399732805085917, "percentage": 94.0, "elapsed_time": "1 day, 8:16:00", "remaining_time": "2:03:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10203, "total_steps": 10853, "loss": 0.1084, "learning_rate": 4.8876367957895744e-08, "epoch": 0.9400654166858617, "percentage": 94.01, "elapsed_time": "1 day, 8:16:10", "remaining_time": "2:03:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10204, "total_steps": 10853, "loss": 0.1127, "learning_rate": 4.872658488675741e-08, "epoch": 0.9401575528631317, "percentage": 94.02, "elapsed_time": "1 day, 8:16:22", "remaining_time": "2:03:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10205, "total_steps": 10853, "loss": 0.1131, "learning_rate": 4.8577029416619625e-08, "epoch": 0.9402496890404017, "percentage": 94.03, "elapsed_time": "1 day, 8:16:34", "remaining_time": "2:02:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10206, "total_steps": 10853, "loss": 0.1083, "learning_rate": 4.84277015613685e-08, "epoch": 0.9403418252176717, "percentage": 94.04, "elapsed_time": "1 day, 8:16:44", "remaining_time": "2:02:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10207, "total_steps": 10853, "loss": 0.1192, "learning_rate": 4.8278601334869056e-08, "epoch": 0.9404339613949417, "percentage": 94.05, "elapsed_time": "1 day, 8:16:56", "remaining_time": "2:02:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10208, "total_steps": 10853, "loss": 0.1128, "learning_rate": 4.8129728750965224e-08, "epoch": 0.9405260975722117, "percentage": 94.06, "elapsed_time": "1 day, 8:17:07", "remaining_time": "2:02:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10209, "total_steps": 10853, "loss": 0.1303, "learning_rate": 4.79810838234801e-08, "epoch": 0.9406182337494817, "percentage": 94.07, "elapsed_time": "1 day, 8:17:18", "remaining_time": "2:02:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10210, "total_steps": 10853, "loss": 0.0994, "learning_rate": 4.7832666566215156e-08, "epoch": 0.9407103699267517, "percentage": 94.08, "elapsed_time": "1 day, 8:17:31", "remaining_time": "2:02:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10211, "total_steps": 10853, "loss": 0.1122, "learning_rate": 4.7684476992951033e-08, "epoch": 0.9408025061040217, "percentage": 94.08, "elapsed_time": "1 day, 8:17:41", "remaining_time": "2:01:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10212, "total_steps": 10853, "loss": 0.1072, "learning_rate": 4.753651511744728e-08, "epoch": 0.9408946422812917, "percentage": 94.09, "elapsed_time": "1 day, 8:17:53", "remaining_time": "2:01:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10213, "total_steps": 10853, "loss": 0.1167, "learning_rate": 4.738878095344207e-08, "epoch": 0.9409867784585617, "percentage": 94.1, "elapsed_time": "1 day, 8:18:03", "remaining_time": "2:01:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10214, "total_steps": 10853, "loss": 0.114, "learning_rate": 4.7241274514652217e-08, "epoch": 0.9410789146358317, "percentage": 94.11, "elapsed_time": "1 day, 8:18:14", "remaining_time": "2:01:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10215, "total_steps": 10853, "loss": 0.1234, "learning_rate": 4.7093995814773975e-08, "epoch": 0.9411710508131018, "percentage": 94.12, "elapsed_time": "1 day, 8:18:25", "remaining_time": "2:01:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10216, "total_steps": 10853, "loss": 0.1163, "learning_rate": 4.694694486748225e-08, "epoch": 0.9412631869903718, "percentage": 94.13, "elapsed_time": "1 day, 8:18:34", "remaining_time": "2:00:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10217, "total_steps": 10853, "loss": 0.1156, "learning_rate": 4.680012168643111e-08, "epoch": 0.9413553231676418, "percentage": 94.14, "elapsed_time": "1 day, 8:18:46", "remaining_time": "2:00:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10218, "total_steps": 10853, "loss": 0.1186, "learning_rate": 4.6653526285252437e-08, "epoch": 0.9414474593449118, "percentage": 94.15, "elapsed_time": "1 day, 8:18:58", "remaining_time": "2:00:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10219, "total_steps": 10853, "loss": 0.1124, "learning_rate": 4.650715867755784e-08, "epoch": 0.9415395955221818, "percentage": 94.16, "elapsed_time": "1 day, 8:19:09", "remaining_time": "2:00:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10220, "total_steps": 10853, "loss": 0.1156, "learning_rate": 4.636101887693756e-08, "epoch": 0.9416317316994518, "percentage": 94.17, "elapsed_time": "1 day, 8:19:19", "remaining_time": "2:00:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10221, "total_steps": 10853, "loss": 0.1234, "learning_rate": 4.621510689696046e-08, "epoch": 0.9417238678767218, "percentage": 94.18, "elapsed_time": "1 day, 8:19:31", "remaining_time": "1:59:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10222, "total_steps": 10853, "loss": 0.1082, "learning_rate": 4.606942275117543e-08, "epoch": 0.9418160040539918, "percentage": 94.19, "elapsed_time": "1 day, 8:19:41", "remaining_time": "1:59:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10223, "total_steps": 10853, "loss": 0.1154, "learning_rate": 4.5923966453108315e-08, "epoch": 0.9419081402312618, "percentage": 94.2, "elapsed_time": "1 day, 8:19:51", "remaining_time": "1:59:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10224, "total_steps": 10853, "loss": 0.1105, "learning_rate": 4.57787380162647e-08, "epoch": 0.9420002764085318, "percentage": 94.2, "elapsed_time": "1 day, 8:20:03", "remaining_time": "1:59:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10225, "total_steps": 10853, "loss": 0.1222, "learning_rate": 4.5633737454129636e-08, "epoch": 0.9420924125858018, "percentage": 94.21, "elapsed_time": "1 day, 8:20:13", "remaining_time": "1:59:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10226, "total_steps": 10853, "loss": 0.1213, "learning_rate": 4.548896478016651e-08, "epoch": 0.9421845487630718, "percentage": 94.22, "elapsed_time": "1 day, 8:20:25", "remaining_time": "1:58:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10227, "total_steps": 10853, "loss": 0.1125, "learning_rate": 4.5344420007816526e-08, "epoch": 0.9422766849403418, "percentage": 94.23, "elapsed_time": "1 day, 8:20:36", "remaining_time": "1:58:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10228, "total_steps": 10853, "loss": 0.1132, "learning_rate": 4.5200103150501996e-08, "epoch": 0.9423688211176118, "percentage": 94.24, "elapsed_time": "1 day, 8:20:47", "remaining_time": "1:58:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10229, "total_steps": 10853, "loss": 0.1106, "learning_rate": 4.5056014221621645e-08, "epoch": 0.9424609572948819, "percentage": 94.25, "elapsed_time": "1 day, 8:20:57", "remaining_time": "1:58:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10230, "total_steps": 10853, "loss": 0.1163, "learning_rate": 4.4912153234554777e-08, "epoch": 0.9425530934721519, "percentage": 94.26, "elapsed_time": "1 day, 8:21:08", "remaining_time": "1:58:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10231, "total_steps": 10853, "loss": 0.1036, "learning_rate": 4.4768520202658484e-08, "epoch": 0.9426452296494219, "percentage": 94.27, "elapsed_time": "1 day, 8:21:19", "remaining_time": "1:58:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10232, "total_steps": 10853, "loss": 0.1237, "learning_rate": 4.4625115139269314e-08, "epoch": 0.9427373658266919, "percentage": 94.28, "elapsed_time": "1 day, 8:21:31", "remaining_time": "1:57:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10233, "total_steps": 10853, "loss": 0.1118, "learning_rate": 4.448193805770273e-08, "epoch": 0.9428295020039619, "percentage": 94.29, "elapsed_time": "1 day, 8:21:42", "remaining_time": "1:57:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10234, "total_steps": 10853, "loss": 0.1255, "learning_rate": 4.4338988971252275e-08, "epoch": 0.9429216381812319, "percentage": 94.3, "elapsed_time": "1 day, 8:21:52", "remaining_time": "1:57:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10235, "total_steps": 10853, "loss": 0.1181, "learning_rate": 4.4196267893190926e-08, "epoch": 0.9430137743585019, "percentage": 94.31, "elapsed_time": "1 day, 8:22:03", "remaining_time": "1:57:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10236, "total_steps": 10853, "loss": 0.1235, "learning_rate": 4.4053774836770315e-08, "epoch": 0.9431059105357719, "percentage": 94.31, "elapsed_time": "1 day, 8:22:13", "remaining_time": "1:57:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10237, "total_steps": 10853, "loss": 0.1065, "learning_rate": 4.3911509815221244e-08, "epoch": 0.9431980467130419, "percentage": 94.32, "elapsed_time": "1 day, 8:22:24", "remaining_time": "1:56:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10238, "total_steps": 10853, "loss": 0.1147, "learning_rate": 4.3769472841752866e-08, "epoch": 0.9432901828903119, "percentage": 94.33, "elapsed_time": "1 day, 8:22:35", "remaining_time": "1:56:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10239, "total_steps": 10853, "loss": 0.1158, "learning_rate": 4.362766392955325e-08, "epoch": 0.9433823190675819, "percentage": 94.34, "elapsed_time": "1 day, 8:22:47", "remaining_time": "1:56:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10240, "total_steps": 10853, "loss": 0.1229, "learning_rate": 4.348608309178909e-08, "epoch": 0.9434744552448519, "percentage": 94.35, "elapsed_time": "1 day, 8:22:57", "remaining_time": "1:56:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10241, "total_steps": 10853, "loss": 0.1156, "learning_rate": 4.33447303416068e-08, "epoch": 0.9435665914221218, "percentage": 94.36, "elapsed_time": "1 day, 8:23:07", "remaining_time": "1:56:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10242, "total_steps": 10853, "loss": 0.1123, "learning_rate": 4.320360569213061e-08, "epoch": 0.943658727599392, "percentage": 94.37, "elapsed_time": "1 day, 8:23:18", "remaining_time": "1:55:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10243, "total_steps": 10853, "loss": 0.1157, "learning_rate": 4.3062709156463936e-08, "epoch": 0.943750863776662, "percentage": 94.38, "elapsed_time": "1 day, 8:23:29", "remaining_time": "1:55:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10244, "total_steps": 10853, "loss": 0.1169, "learning_rate": 4.292204074768908e-08, "epoch": 0.943842999953932, "percentage": 94.39, "elapsed_time": "1 day, 8:23:39", "remaining_time": "1:55:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10245, "total_steps": 10853, "loss": 0.1266, "learning_rate": 4.278160047886753e-08, "epoch": 0.943935136131202, "percentage": 94.4, "elapsed_time": "1 day, 8:23:50", "remaining_time": "1:55:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10246, "total_steps": 10853, "loss": 0.1203, "learning_rate": 4.264138836303861e-08, "epoch": 0.9440272723084719, "percentage": 94.41, "elapsed_time": "1 day, 8:24:00", "remaining_time": "1:55:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10247, "total_steps": 10853, "loss": 0.1272, "learning_rate": 4.250140441322131e-08, "epoch": 0.9441194084857419, "percentage": 94.42, "elapsed_time": "1 day, 8:24:11", "remaining_time": "1:54:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10248, "total_steps": 10853, "loss": 0.1184, "learning_rate": 4.236164864241277e-08, "epoch": 0.9442115446630119, "percentage": 94.43, "elapsed_time": "1 day, 8:24:24", "remaining_time": "1:54:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10249, "total_steps": 10853, "loss": 0.1153, "learning_rate": 4.22221210635898e-08, "epoch": 0.9443036808402819, "percentage": 94.43, "elapsed_time": "1 day, 8:24:35", "remaining_time": "1:54:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10250, "total_steps": 10853, "loss": 0.1173, "learning_rate": 4.208282168970762e-08, "epoch": 0.9443958170175519, "percentage": 94.44, "elapsed_time": "1 day, 8:24:46", "remaining_time": "1:54:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10251, "total_steps": 10853, "loss": 0.1264, "learning_rate": 4.1943750533700036e-08, "epoch": 0.9444879531948219, "percentage": 94.45, "elapsed_time": "1 day, 8:24:56", "remaining_time": "1:54:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10252, "total_steps": 10853, "loss": 0.1312, "learning_rate": 4.1804907608479494e-08, "epoch": 0.9445800893720919, "percentage": 94.46, "elapsed_time": "1 day, 8:25:06", "remaining_time": "1:54:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10253, "total_steps": 10853, "loss": 0.1095, "learning_rate": 4.166629292693791e-08, "epoch": 0.9446722255493619, "percentage": 94.47, "elapsed_time": "1 day, 8:25:17", "remaining_time": "1:53:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10254, "total_steps": 10853, "loss": 0.1136, "learning_rate": 4.1527906501945547e-08, "epoch": 0.9447643617266319, "percentage": 94.48, "elapsed_time": "1 day, 8:25:27", "remaining_time": "1:53:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10255, "total_steps": 10853, "loss": 0.123, "learning_rate": 4.138974834635157e-08, "epoch": 0.9448564979039019, "percentage": 94.49, "elapsed_time": "1 day, 8:25:39", "remaining_time": "1:53:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10256, "total_steps": 10853, "loss": 0.1184, "learning_rate": 4.1251818472984315e-08, "epoch": 0.944948634081172, "percentage": 94.5, "elapsed_time": "1 day, 8:25:50", "remaining_time": "1:53:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10257, "total_steps": 10853, "loss": 0.1161, "learning_rate": 4.1114116894650225e-08, "epoch": 0.945040770258442, "percentage": 94.51, "elapsed_time": "1 day, 8:26:01", "remaining_time": "1:53:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10258, "total_steps": 10853, "loss": 0.114, "learning_rate": 4.0976643624134896e-08, "epoch": 0.945132906435712, "percentage": 94.52, "elapsed_time": "1 day, 8:26:11", "remaining_time": "1:52:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10259, "total_steps": 10853, "loss": 0.1172, "learning_rate": 4.0839398674203114e-08, "epoch": 0.945225042612982, "percentage": 94.53, "elapsed_time": "1 day, 8:26:21", "remaining_time": "1:52:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10260, "total_steps": 10853, "loss": 0.1085, "learning_rate": 4.0702382057597465e-08, "epoch": 0.945317178790252, "percentage": 94.54, "elapsed_time": "1 day, 8:26:33", "remaining_time": "1:52:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10261, "total_steps": 10853, "loss": 0.1229, "learning_rate": 4.0565593787040555e-08, "epoch": 0.945409314967522, "percentage": 94.55, "elapsed_time": "1 day, 8:26:43", "remaining_time": "1:52:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10262, "total_steps": 10853, "loss": 0.1133, "learning_rate": 4.042903387523278e-08, "epoch": 0.945501451144792, "percentage": 94.55, "elapsed_time": "1 day, 8:26:55", "remaining_time": "1:52:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10263, "total_steps": 10853, "loss": 0.1178, "learning_rate": 4.029270233485427e-08, "epoch": 0.945593587322062, "percentage": 94.56, "elapsed_time": "1 day, 8:27:05", "remaining_time": "1:51:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10264, "total_steps": 10853, "loss": 0.1157, "learning_rate": 4.0156599178562686e-08, "epoch": 0.945685723499332, "percentage": 94.57, "elapsed_time": "1 day, 8:27:17", "remaining_time": "1:51:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10265, "total_steps": 10853, "loss": 0.1299, "learning_rate": 4.002072441899568e-08, "epoch": 0.945777859676602, "percentage": 94.58, "elapsed_time": "1 day, 8:27:28", "remaining_time": "1:51:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10266, "total_steps": 10853, "loss": 0.1099, "learning_rate": 3.988507806876929e-08, "epoch": 0.945869995853872, "percentage": 94.59, "elapsed_time": "1 day, 8:27:38", "remaining_time": "1:51:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10267, "total_steps": 10853, "loss": 0.1083, "learning_rate": 3.974966014047815e-08, "epoch": 0.945962132031142, "percentage": 94.6, "elapsed_time": "1 day, 8:27:48", "remaining_time": "1:51:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10268, "total_steps": 10853, "loss": 0.1077, "learning_rate": 3.961447064669582e-08, "epoch": 0.946054268208412, "percentage": 94.61, "elapsed_time": "1 day, 8:27:59", "remaining_time": "1:50:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10269, "total_steps": 10853, "loss": 0.1205, "learning_rate": 3.9479509599974486e-08, "epoch": 0.946146404385682, "percentage": 94.62, "elapsed_time": "1 day, 8:28:10", "remaining_time": "1:50:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10270, "total_steps": 10853, "loss": 0.1142, "learning_rate": 3.9344777012845504e-08, "epoch": 0.9462385405629521, "percentage": 94.63, "elapsed_time": "1 day, 8:28:20", "remaining_time": "1:50:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10271, "total_steps": 10853, "loss": 0.1286, "learning_rate": 3.921027289781915e-08, "epoch": 0.9463306767402221, "percentage": 94.64, "elapsed_time": "1 day, 8:28:31", "remaining_time": "1:50:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10272, "total_steps": 10853, "loss": 0.1214, "learning_rate": 3.907599726738348e-08, "epoch": 0.9464228129174921, "percentage": 94.65, "elapsed_time": "1 day, 8:28:41", "remaining_time": "1:50:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10273, "total_steps": 10853, "loss": 0.1087, "learning_rate": 3.894195013400631e-08, "epoch": 0.9465149490947621, "percentage": 94.66, "elapsed_time": "1 day, 8:28:50", "remaining_time": "1:50:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10274, "total_steps": 10853, "loss": 0.1263, "learning_rate": 3.8808131510134074e-08, "epoch": 0.9466070852720321, "percentage": 94.67, "elapsed_time": "1 day, 8:29:00", "remaining_time": "1:49:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10275, "total_steps": 10853, "loss": 0.1213, "learning_rate": 3.8674541408191824e-08, "epoch": 0.9466992214493021, "percentage": 94.67, "elapsed_time": "1 day, 8:29:10", "remaining_time": "1:49:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10276, "total_steps": 10853, "loss": 0.1212, "learning_rate": 3.854117984058298e-08, "epoch": 0.9467913576265721, "percentage": 94.68, "elapsed_time": "1 day, 8:29:21", "remaining_time": "1:49:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10277, "total_steps": 10853, "loss": 0.1067, "learning_rate": 3.840804681969068e-08, "epoch": 0.9468834938038421, "percentage": 94.69, "elapsed_time": "1 day, 8:29:32", "remaining_time": "1:49:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10278, "total_steps": 10853, "loss": 0.1217, "learning_rate": 3.827514235787616e-08, "epoch": 0.9469756299811121, "percentage": 94.7, "elapsed_time": "1 day, 8:29:43", "remaining_time": "1:49:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10279, "total_steps": 10853, "loss": 0.1105, "learning_rate": 3.8142466467479265e-08, "epoch": 0.9470677661583821, "percentage": 94.71, "elapsed_time": "1 day, 8:29:54", "remaining_time": "1:48:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10280, "total_steps": 10853, "loss": 0.1158, "learning_rate": 3.801001916081987e-08, "epoch": 0.9471599023356521, "percentage": 94.72, "elapsed_time": "1 day, 8:30:05", "remaining_time": "1:48:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10281, "total_steps": 10853, "loss": 0.119, "learning_rate": 3.787780045019479e-08, "epoch": 0.9472520385129221, "percentage": 94.73, "elapsed_time": "1 day, 8:30:16", "remaining_time": "1:48:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10282, "total_steps": 10853, "loss": 0.1135, "learning_rate": 3.774581034788116e-08, "epoch": 0.947344174690192, "percentage": 94.74, "elapsed_time": "1 day, 8:30:27", "remaining_time": "1:48:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10283, "total_steps": 10853, "loss": 0.1173, "learning_rate": 3.7614048866133624e-08, "epoch": 0.9474363108674622, "percentage": 94.75, "elapsed_time": "1 day, 8:30:36", "remaining_time": "1:48:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10284, "total_steps": 10853, "loss": 0.1223, "learning_rate": 3.748251601718711e-08, "epoch": 0.9475284470447322, "percentage": 94.76, "elapsed_time": "1 day, 8:30:48", "remaining_time": "1:47:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10285, "total_steps": 10853, "loss": 0.1196, "learning_rate": 3.7351211813253795e-08, "epoch": 0.9476205832220022, "percentage": 94.77, "elapsed_time": "1 day, 8:30:59", "remaining_time": "1:47:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10286, "total_steps": 10853, "loss": 0.1178, "learning_rate": 3.722013626652532e-08, "epoch": 0.9477127193992722, "percentage": 94.78, "elapsed_time": "1 day, 8:31:10", "remaining_time": "1:47:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10287, "total_steps": 10853, "loss": 0.1016, "learning_rate": 3.70892893891725e-08, "epoch": 0.9478048555765421, "percentage": 94.78, "elapsed_time": "1 day, 8:31:21", "remaining_time": "1:47:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10288, "total_steps": 10853, "loss": 0.1173, "learning_rate": 3.695867119334423e-08, "epoch": 0.9478969917538121, "percentage": 94.79, "elapsed_time": "1 day, 8:31:32", "remaining_time": "1:47:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10289, "total_steps": 10853, "loss": 0.1272, "learning_rate": 3.682828169116831e-08, "epoch": 0.9479891279310821, "percentage": 94.8, "elapsed_time": "1 day, 8:31:43", "remaining_time": "1:46:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10290, "total_steps": 10853, "loss": 0.1161, "learning_rate": 3.669812089475144e-08, "epoch": 0.9480812641083521, "percentage": 94.81, "elapsed_time": "1 day, 8:31:54", "remaining_time": "1:46:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10291, "total_steps": 10853, "loss": 0.1204, "learning_rate": 3.656818881617924e-08, "epoch": 0.9481734002856221, "percentage": 94.82, "elapsed_time": "1 day, 8:32:05", "remaining_time": "1:46:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10292, "total_steps": 10853, "loss": 0.1015, "learning_rate": 3.6438485467515935e-08, "epoch": 0.9482655364628921, "percentage": 94.83, "elapsed_time": "1 day, 8:32:16", "remaining_time": "1:46:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10293, "total_steps": 10853, "loss": 0.1283, "learning_rate": 3.630901086080441e-08, "epoch": 0.9483576726401621, "percentage": 94.84, "elapsed_time": "1 day, 8:32:26", "remaining_time": "1:46:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10294, "total_steps": 10853, "loss": 0.117, "learning_rate": 3.6179765008066134e-08, "epoch": 0.9484498088174321, "percentage": 94.85, "elapsed_time": "1 day, 8:32:35", "remaining_time": "1:46:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10295, "total_steps": 10853, "loss": 0.1089, "learning_rate": 3.605074792130181e-08, "epoch": 0.9485419449947021, "percentage": 94.86, "elapsed_time": "1 day, 8:32:46", "remaining_time": "1:45:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10296, "total_steps": 10853, "loss": 0.1118, "learning_rate": 3.5921959612491006e-08, "epoch": 0.9486340811719721, "percentage": 94.87, "elapsed_time": "1 day, 8:32:55", "remaining_time": "1:45:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10297, "total_steps": 10853, "loss": 0.1092, "learning_rate": 3.5793400093591394e-08, "epoch": 0.9487262173492422, "percentage": 94.88, "elapsed_time": "1 day, 8:33:07", "remaining_time": "1:45:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10298, "total_steps": 10853, "loss": 0.1276, "learning_rate": 3.5665069376539796e-08, "epoch": 0.9488183535265122, "percentage": 94.89, "elapsed_time": "1 day, 8:33:19", "remaining_time": "1:45:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10299, "total_steps": 10853, "loss": 0.1125, "learning_rate": 3.553696747325142e-08, "epoch": 0.9489104897037822, "percentage": 94.9, "elapsed_time": "1 day, 8:33:29", "remaining_time": "1:45:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10300, "total_steps": 10853, "loss": 0.1186, "learning_rate": 3.540909439562118e-08, "epoch": 0.9490026258810522, "percentage": 94.9, "elapsed_time": "1 day, 8:33:40", "remaining_time": "1:44:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10301, "total_steps": 10853, "loss": 0.1309, "learning_rate": 3.528145015552154e-08, "epoch": 0.9490947620583222, "percentage": 94.91, "elapsed_time": "1 day, 8:33:51", "remaining_time": "1:44:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10302, "total_steps": 10853, "loss": 0.1118, "learning_rate": 3.515403476480439e-08, "epoch": 0.9491868982355922, "percentage": 94.92, "elapsed_time": "1 day, 8:34:01", "remaining_time": "1:44:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10303, "total_steps": 10853, "loss": 0.11, "learning_rate": 3.5026848235300834e-08, "epoch": 0.9492790344128622, "percentage": 94.93, "elapsed_time": "1 day, 8:34:12", "remaining_time": "1:44:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10304, "total_steps": 10853, "loss": 0.1133, "learning_rate": 3.489989057881948e-08, "epoch": 0.9493711705901322, "percentage": 94.94, "elapsed_time": "1 day, 8:34:23", "remaining_time": "1:44:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10305, "total_steps": 10853, "loss": 0.1243, "learning_rate": 3.47731618071484e-08, "epoch": 0.9494633067674022, "percentage": 94.95, "elapsed_time": "1 day, 8:34:33", "remaining_time": "1:43:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10306, "total_steps": 10853, "loss": 0.1175, "learning_rate": 3.4646661932054846e-08, "epoch": 0.9495554429446722, "percentage": 94.96, "elapsed_time": "1 day, 8:34:43", "remaining_time": "1:43:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10307, "total_steps": 10853, "loss": 0.1169, "learning_rate": 3.452039096528359e-08, "epoch": 0.9496475791219422, "percentage": 94.97, "elapsed_time": "1 day, 8:34:53", "remaining_time": "1:43:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10308, "total_steps": 10853, "loss": 0.1117, "learning_rate": 3.439434891855997e-08, "epoch": 0.9497397152992122, "percentage": 94.98, "elapsed_time": "1 day, 8:35:03", "remaining_time": "1:43:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10309, "total_steps": 10853, "loss": 0.117, "learning_rate": 3.42685358035863e-08, "epoch": 0.9498318514764822, "percentage": 94.99, "elapsed_time": "1 day, 8:35:14", "remaining_time": "1:43:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10310, "total_steps": 10853, "loss": 0.1161, "learning_rate": 3.4142951632044065e-08, "epoch": 0.9499239876537523, "percentage": 95.0, "elapsed_time": "1 day, 8:35:25", "remaining_time": "1:42:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10311, "total_steps": 10853, "loss": 0.1268, "learning_rate": 3.401759641559449e-08, "epoch": 0.9500161238310223, "percentage": 95.01, "elapsed_time": "1 day, 8:35:36", "remaining_time": "1:42:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10312, "total_steps": 10853, "loss": 0.1143, "learning_rate": 3.3892470165876045e-08, "epoch": 0.9501082600082923, "percentage": 95.02, "elapsed_time": "1 day, 8:35:47", "remaining_time": "1:42:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10313, "total_steps": 10853, "loss": 0.1156, "learning_rate": 3.376757289450777e-08, "epoch": 0.9502003961855623, "percentage": 95.02, "elapsed_time": "1 day, 8:35:57", "remaining_time": "1:42:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10314, "total_steps": 10853, "loss": 0.1117, "learning_rate": 3.3642904613085393e-08, "epoch": 0.9502925323628323, "percentage": 95.03, "elapsed_time": "1 day, 8:36:07", "remaining_time": "1:42:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10315, "total_steps": 10853, "loss": 0.1192, "learning_rate": 3.3518465333184925e-08, "epoch": 0.9503846685401023, "percentage": 95.04, "elapsed_time": "1 day, 8:36:18", "remaining_time": "1:42:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10316, "total_steps": 10853, "loss": 0.1054, "learning_rate": 3.339425506636018e-08, "epoch": 0.9504768047173723, "percentage": 95.05, "elapsed_time": "1 day, 8:36:29", "remaining_time": "1:41:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10317, "total_steps": 10853, "loss": 0.1131, "learning_rate": 3.327027382414444e-08, "epoch": 0.9505689408946423, "percentage": 95.06, "elapsed_time": "1 day, 8:36:40", "remaining_time": "1:41:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10318, "total_steps": 10853, "loss": 0.1161, "learning_rate": 3.314652161804932e-08, "epoch": 0.9506610770719123, "percentage": 95.07, "elapsed_time": "1 day, 8:36:51", "remaining_time": "1:41:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10319, "total_steps": 10853, "loss": 0.1201, "learning_rate": 3.30229984595648e-08, "epoch": 0.9507532132491823, "percentage": 95.08, "elapsed_time": "1 day, 8:37:02", "remaining_time": "1:41:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10320, "total_steps": 10853, "loss": 0.1221, "learning_rate": 3.289970436016088e-08, "epoch": 0.9508453494264523, "percentage": 95.09, "elapsed_time": "1 day, 8:37:12", "remaining_time": "1:41:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10321, "total_steps": 10853, "loss": 0.1144, "learning_rate": 3.2776639331284774e-08, "epoch": 0.9509374856037223, "percentage": 95.1, "elapsed_time": "1 day, 8:37:23", "remaining_time": "1:40:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10322, "total_steps": 10853, "loss": 0.1181, "learning_rate": 3.2653803384362914e-08, "epoch": 0.9510296217809923, "percentage": 95.11, "elapsed_time": "1 day, 8:37:35", "remaining_time": "1:40:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10323, "total_steps": 10853, "loss": 0.1223, "learning_rate": 3.253119653080117e-08, "epoch": 0.9511217579582623, "percentage": 95.12, "elapsed_time": "1 day, 8:37:46", "remaining_time": "1:40:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10324, "total_steps": 10853, "loss": 0.1185, "learning_rate": 3.240881878198349e-08, "epoch": 0.9512138941355324, "percentage": 95.13, "elapsed_time": "1 day, 8:37:58", "remaining_time": "1:40:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10325, "total_steps": 10853, "loss": 0.1042, "learning_rate": 3.228667014927245e-08, "epoch": 0.9513060303128024, "percentage": 95.13, "elapsed_time": "1 day, 8:38:08", "remaining_time": "1:40:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10326, "total_steps": 10853, "loss": 0.1217, "learning_rate": 3.2164750644009814e-08, "epoch": 0.9513981664900724, "percentage": 95.14, "elapsed_time": "1 day, 8:38:20", "remaining_time": "1:39:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10327, "total_steps": 10853, "loss": 0.1116, "learning_rate": 3.204306027751541e-08, "epoch": 0.9514903026673424, "percentage": 95.15, "elapsed_time": "1 day, 8:38:29", "remaining_time": "1:39:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10328, "total_steps": 10853, "loss": 0.1249, "learning_rate": 3.1921599061088546e-08, "epoch": 0.9515824388446124, "percentage": 95.16, "elapsed_time": "1 day, 8:38:39", "remaining_time": "1:39:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10329, "total_steps": 10853, "loss": 0.1114, "learning_rate": 3.180036700600686e-08, "epoch": 0.9516745750218824, "percentage": 95.17, "elapsed_time": "1 day, 8:38:49", "remaining_time": "1:39:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10330, "total_steps": 10853, "loss": 0.1187, "learning_rate": 3.1679364123526625e-08, "epoch": 0.9517667111991523, "percentage": 95.18, "elapsed_time": "1 day, 8:39:00", "remaining_time": "1:39:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10331, "total_steps": 10853, "loss": 0.1276, "learning_rate": 3.1558590424883294e-08, "epoch": 0.9518588473764223, "percentage": 95.19, "elapsed_time": "1 day, 8:39:12", "remaining_time": "1:38:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10332, "total_steps": 10853, "loss": 0.124, "learning_rate": 3.1438045921290404e-08, "epoch": 0.9519509835536923, "percentage": 95.2, "elapsed_time": "1 day, 8:39:24", "remaining_time": "1:38:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10333, "total_steps": 10853, "loss": 0.1033, "learning_rate": 3.1317730623940665e-08, "epoch": 0.9520431197309623, "percentage": 95.21, "elapsed_time": "1 day, 8:39:35", "remaining_time": "1:38:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10334, "total_steps": 10853, "loss": 0.1218, "learning_rate": 3.119764454400515e-08, "epoch": 0.9521352559082323, "percentage": 95.22, "elapsed_time": "1 day, 8:39:46", "remaining_time": "1:38:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10335, "total_steps": 10853, "loss": 0.121, "learning_rate": 3.1077787692634085e-08, "epoch": 0.9522273920855023, "percentage": 95.23, "elapsed_time": "1 day, 8:39:57", "remaining_time": "1:38:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10336, "total_steps": 10853, "loss": 0.1149, "learning_rate": 3.095816008095637e-08, "epoch": 0.9523195282627723, "percentage": 95.24, "elapsed_time": "1 day, 8:40:08", "remaining_time": "1:38:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10337, "total_steps": 10853, "loss": 0.122, "learning_rate": 3.083876172007894e-08, "epoch": 0.9524116644400424, "percentage": 95.25, "elapsed_time": "1 day, 8:40:19", "remaining_time": "1:37:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10338, "total_steps": 10853, "loss": 0.1063, "learning_rate": 3.071959262108848e-08, "epoch": 0.9525038006173124, "percentage": 95.25, "elapsed_time": "1 day, 8:40:28", "remaining_time": "1:37:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10339, "total_steps": 10853, "loss": 0.112, "learning_rate": 3.0600652795049204e-08, "epoch": 0.9525959367945824, "percentage": 95.26, "elapsed_time": "1 day, 8:40:38", "remaining_time": "1:37:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10340, "total_steps": 10853, "loss": 0.112, "learning_rate": 3.048194225300532e-08, "epoch": 0.9526880729718524, "percentage": 95.27, "elapsed_time": "1 day, 8:40:48", "remaining_time": "1:37:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10341, "total_steps": 10853, "loss": 0.1103, "learning_rate": 3.0363461005978865e-08, "epoch": 0.9527802091491224, "percentage": 95.28, "elapsed_time": "1 day, 8:41:00", "remaining_time": "1:37:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10342, "total_steps": 10853, "loss": 0.1088, "learning_rate": 3.024520906497103e-08, "epoch": 0.9528723453263924, "percentage": 95.29, "elapsed_time": "1 day, 8:41:11", "remaining_time": "1:36:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10343, "total_steps": 10853, "loss": 0.116, "learning_rate": 3.012718644096107e-08, "epoch": 0.9529644815036624, "percentage": 95.3, "elapsed_time": "1 day, 8:41:21", "remaining_time": "1:36:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10344, "total_steps": 10853, "loss": 0.1025, "learning_rate": 3.0009393144907475e-08, "epoch": 0.9530566176809324, "percentage": 95.31, "elapsed_time": "1 day, 8:41:31", "remaining_time": "1:36:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10345, "total_steps": 10853, "loss": 0.1208, "learning_rate": 2.989182918774786e-08, "epoch": 0.9531487538582024, "percentage": 95.32, "elapsed_time": "1 day, 8:41:41", "remaining_time": "1:36:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10346, "total_steps": 10853, "loss": 0.1339, "learning_rate": 2.977449458039766e-08, "epoch": 0.9532408900354724, "percentage": 95.33, "elapsed_time": "1 day, 8:41:51", "remaining_time": "1:36:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10347, "total_steps": 10853, "loss": 0.1154, "learning_rate": 2.9657389333751784e-08, "epoch": 0.9533330262127424, "percentage": 95.34, "elapsed_time": "1 day, 8:42:01", "remaining_time": "1:35:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10348, "total_steps": 10853, "loss": 0.1031, "learning_rate": 2.954051345868264e-08, "epoch": 0.9534251623900124, "percentage": 95.35, "elapsed_time": "1 day, 8:42:10", "remaining_time": "1:35:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10349, "total_steps": 10853, "loss": 0.1116, "learning_rate": 2.9423866966042935e-08, "epoch": 0.9535172985672824, "percentage": 95.36, "elapsed_time": "1 day, 8:42:21", "remaining_time": "1:35:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10350, "total_steps": 10853, "loss": 0.1174, "learning_rate": 2.9307449866663174e-08, "epoch": 0.9536094347445524, "percentage": 95.37, "elapsed_time": "1 day, 8:42:32", "remaining_time": "1:35:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10351, "total_steps": 10853, "loss": 0.1111, "learning_rate": 2.9191262171352486e-08, "epoch": 0.9537015709218225, "percentage": 95.37, "elapsed_time": "1 day, 8:42:42", "remaining_time": "1:35:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10352, "total_steps": 10853, "loss": 0.1282, "learning_rate": 2.9075303890899187e-08, "epoch": 0.9537937070990925, "percentage": 95.38, "elapsed_time": "1 day, 8:42:52", "remaining_time": "1:34:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10353, "total_steps": 10853, "loss": 0.1274, "learning_rate": 2.895957503606939e-08, "epoch": 0.9538858432763625, "percentage": 95.39, "elapsed_time": "1 day, 8:43:03", "remaining_time": "1:34:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10354, "total_steps": 10853, "loss": 0.1105, "learning_rate": 2.8844075617609492e-08, "epoch": 0.9539779794536325, "percentage": 95.4, "elapsed_time": "1 day, 8:43:14", "remaining_time": "1:34:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10355, "total_steps": 10853, "loss": 0.1128, "learning_rate": 2.8728805646242863e-08, "epoch": 0.9540701156309025, "percentage": 95.41, "elapsed_time": "1 day, 8:43:25", "remaining_time": "1:34:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10356, "total_steps": 10853, "loss": 0.1128, "learning_rate": 2.8613765132672612e-08, "epoch": 0.9541622518081725, "percentage": 95.42, "elapsed_time": "1 day, 8:43:34", "remaining_time": "1:34:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10357, "total_steps": 10853, "loss": 0.0943, "learning_rate": 2.8498954087580187e-08, "epoch": 0.9542543879854425, "percentage": 95.43, "elapsed_time": "1 day, 8:43:44", "remaining_time": "1:34:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10358, "total_steps": 10853, "loss": 0.1172, "learning_rate": 2.8384372521626236e-08, "epoch": 0.9543465241627125, "percentage": 95.44, "elapsed_time": "1 day, 8:43:55", "remaining_time": "1:33:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10359, "total_steps": 10853, "loss": 0.1148, "learning_rate": 2.827002044544891e-08, "epoch": 0.9544386603399825, "percentage": 95.45, "elapsed_time": "1 day, 8:44:06", "remaining_time": "1:33:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10360, "total_steps": 10853, "loss": 0.1206, "learning_rate": 2.8155897869666105e-08, "epoch": 0.9545307965172525, "percentage": 95.46, "elapsed_time": "1 day, 8:44:17", "remaining_time": "1:33:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10361, "total_steps": 10853, "loss": 0.1116, "learning_rate": 2.8042004804874346e-08, "epoch": 0.9546229326945225, "percentage": 95.47, "elapsed_time": "1 day, 8:44:28", "remaining_time": "1:33:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10362, "total_steps": 10853, "loss": 0.1018, "learning_rate": 2.7928341261648507e-08, "epoch": 0.9547150688717925, "percentage": 95.48, "elapsed_time": "1 day, 8:44:39", "remaining_time": "1:33:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10363, "total_steps": 10853, "loss": 0.1133, "learning_rate": 2.7814907250542368e-08, "epoch": 0.9548072050490625, "percentage": 95.49, "elapsed_time": "1 day, 8:44:51", "remaining_time": "1:32:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10364, "total_steps": 10853, "loss": 0.1211, "learning_rate": 2.770170278208806e-08, "epoch": 0.9548993412263325, "percentage": 95.49, "elapsed_time": "1 day, 8:45:02", "remaining_time": "1:32:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10365, "total_steps": 10853, "loss": 0.1193, "learning_rate": 2.7588727866796617e-08, "epoch": 0.9549914774036026, "percentage": 95.5, "elapsed_time": "1 day, 8:45:13", "remaining_time": "1:32:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10366, "total_steps": 10853, "loss": 0.108, "learning_rate": 2.7475982515157986e-08, "epoch": 0.9550836135808726, "percentage": 95.51, "elapsed_time": "1 day, 8:45:23", "remaining_time": "1:32:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10367, "total_steps": 10853, "loss": 0.1126, "learning_rate": 2.7363466737640453e-08, "epoch": 0.9551757497581426, "percentage": 95.52, "elapsed_time": "1 day, 8:45:33", "remaining_time": "1:32:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10368, "total_steps": 10853, "loss": 0.1166, "learning_rate": 2.7251180544691225e-08, "epoch": 0.9552678859354126, "percentage": 95.53, "elapsed_time": "1 day, 8:45:44", "remaining_time": "1:31:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10369, "total_steps": 10853, "loss": 0.1229, "learning_rate": 2.7139123946735847e-08, "epoch": 0.9553600221126826, "percentage": 95.54, "elapsed_time": "1 day, 8:45:56", "remaining_time": "1:31:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10370, "total_steps": 10853, "loss": 0.1169, "learning_rate": 2.7027296954178773e-08, "epoch": 0.9554521582899526, "percentage": 95.55, "elapsed_time": "1 day, 8:46:07", "remaining_time": "1:31:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10371, "total_steps": 10853, "loss": 0.1119, "learning_rate": 2.6915699577403644e-08, "epoch": 0.9555442944672226, "percentage": 95.56, "elapsed_time": "1 day, 8:46:19", "remaining_time": "1:31:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10372, "total_steps": 10853, "loss": 0.1151, "learning_rate": 2.680433182677189e-08, "epoch": 0.9556364306444926, "percentage": 95.57, "elapsed_time": "1 day, 8:46:30", "remaining_time": "1:31:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10373, "total_steps": 10853, "loss": 0.1183, "learning_rate": 2.6693193712624133e-08, "epoch": 0.9557285668217625, "percentage": 95.58, "elapsed_time": "1 day, 8:46:41", "remaining_time": "1:31:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10374, "total_steps": 10853, "loss": 0.1121, "learning_rate": 2.6582285245279338e-08, "epoch": 0.9558207029990325, "percentage": 95.59, "elapsed_time": "1 day, 8:46:52", "remaining_time": "1:30:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10375, "total_steps": 10853, "loss": 0.1075, "learning_rate": 2.6471606435035934e-08, "epoch": 0.9559128391763025, "percentage": 95.6, "elapsed_time": "1 day, 8:47:03", "remaining_time": "1:30:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10376, "total_steps": 10853, "loss": 0.1195, "learning_rate": 2.6361157292169593e-08, "epoch": 0.9560049753535725, "percentage": 95.6, "elapsed_time": "1 day, 8:47:12", "remaining_time": "1:30:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10377, "total_steps": 10853, "loss": 0.12, "learning_rate": 2.6250937826936274e-08, "epoch": 0.9560971115308425, "percentage": 95.61, "elapsed_time": "1 day, 8:47:22", "remaining_time": "1:30:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10378, "total_steps": 10853, "loss": 0.111, "learning_rate": 2.6140948049569737e-08, "epoch": 0.9561892477081126, "percentage": 95.62, "elapsed_time": "1 day, 8:47:32", "remaining_time": "1:30:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10379, "total_steps": 10853, "loss": 0.1256, "learning_rate": 2.603118797028209e-08, "epoch": 0.9562813838853826, "percentage": 95.63, "elapsed_time": "1 day, 8:47:42", "remaining_time": "1:29:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10380, "total_steps": 10853, "loss": 0.1157, "learning_rate": 2.592165759926518e-08, "epoch": 0.9563735200626526, "percentage": 95.64, "elapsed_time": "1 day, 8:47:53", "remaining_time": "1:29:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10381, "total_steps": 10853, "loss": 0.1102, "learning_rate": 2.5812356946688376e-08, "epoch": 0.9564656562399226, "percentage": 95.65, "elapsed_time": "1 day, 8:48:03", "remaining_time": "1:29:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10382, "total_steps": 10853, "loss": 0.1209, "learning_rate": 2.5703286022700503e-08, "epoch": 0.9565577924171926, "percentage": 95.66, "elapsed_time": "1 day, 8:48:14", "remaining_time": "1:29:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10383, "total_steps": 10853, "loss": 0.122, "learning_rate": 2.559444483742901e-08, "epoch": 0.9566499285944626, "percentage": 95.67, "elapsed_time": "1 day, 8:48:25", "remaining_time": "1:29:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10384, "total_steps": 10853, "loss": 0.1099, "learning_rate": 2.548583340097971e-08, "epoch": 0.9567420647717326, "percentage": 95.68, "elapsed_time": "1 day, 8:48:37", "remaining_time": "1:28:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10385, "total_steps": 10853, "loss": 0.1122, "learning_rate": 2.5377451723436753e-08, "epoch": 0.9568342009490026, "percentage": 95.69, "elapsed_time": "1 day, 8:48:48", "remaining_time": "1:28:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10386, "total_steps": 10853, "loss": 0.125, "learning_rate": 2.5269299814863756e-08, "epoch": 0.9569263371262726, "percentage": 95.7, "elapsed_time": "1 day, 8:49:00", "remaining_time": "1:28:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10387, "total_steps": 10853, "loss": 0.1283, "learning_rate": 2.5161377685302968e-08, "epoch": 0.9570184733035426, "percentage": 95.71, "elapsed_time": "1 day, 8:49:11", "remaining_time": "1:28:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10388, "total_steps": 10853, "loss": 0.1199, "learning_rate": 2.505368534477415e-08, "epoch": 0.9571106094808126, "percentage": 95.72, "elapsed_time": "1 day, 8:49:22", "remaining_time": "1:28:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10389, "total_steps": 10853, "loss": 0.0986, "learning_rate": 2.4946222803277354e-08, "epoch": 0.9572027456580826, "percentage": 95.72, "elapsed_time": "1 day, 8:49:33", "remaining_time": "1:27:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10390, "total_steps": 10853, "loss": 0.1306, "learning_rate": 2.483899007078988e-08, "epoch": 0.9572948818353526, "percentage": 95.73, "elapsed_time": "1 day, 8:49:44", "remaining_time": "1:27:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10391, "total_steps": 10853, "loss": 0.1247, "learning_rate": 2.4731987157268768e-08, "epoch": 0.9573870180126226, "percentage": 95.74, "elapsed_time": "1 day, 8:49:55", "remaining_time": "1:27:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10392, "total_steps": 10853, "loss": 0.1122, "learning_rate": 2.462521407264912e-08, "epoch": 0.9574791541898927, "percentage": 95.75, "elapsed_time": "1 day, 8:50:07", "remaining_time": "1:27:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10393, "total_steps": 10853, "loss": 0.1129, "learning_rate": 2.4518670826844393e-08, "epoch": 0.9575712903671627, "percentage": 95.76, "elapsed_time": "1 day, 8:50:17", "remaining_time": "1:27:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10394, "total_steps": 10853, "loss": 0.1156, "learning_rate": 2.4412357429747514e-08, "epoch": 0.9576634265444327, "percentage": 95.77, "elapsed_time": "1 day, 8:50:27", "remaining_time": "1:27:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10395, "total_steps": 10853, "loss": 0.1104, "learning_rate": 2.4306273891230025e-08, "epoch": 0.9577555627217027, "percentage": 95.78, "elapsed_time": "1 day, 8:50:38", "remaining_time": "1:26:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10396, "total_steps": 10853, "loss": 0.1333, "learning_rate": 2.4200420221141274e-08, "epoch": 0.9578476988989727, "percentage": 95.79, "elapsed_time": "1 day, 8:50:49", "remaining_time": "1:26:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10397, "total_steps": 10853, "loss": 0.1398, "learning_rate": 2.4094796429310063e-08, "epoch": 0.9579398350762427, "percentage": 95.8, "elapsed_time": "1 day, 8:51:00", "remaining_time": "1:26:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10398, "total_steps": 10853, "loss": 0.1067, "learning_rate": 2.398940252554327e-08, "epoch": 0.9580319712535127, "percentage": 95.81, "elapsed_time": "1 day, 8:51:11", "remaining_time": "1:26:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10399, "total_steps": 10853, "loss": 0.1124, "learning_rate": 2.3884238519626957e-08, "epoch": 0.9581241074307827, "percentage": 95.82, "elapsed_time": "1 day, 8:51:21", "remaining_time": "1:26:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10400, "total_steps": 10853, "loss": 0.1116, "learning_rate": 2.3779304421325532e-08, "epoch": 0.9582162436080527, "percentage": 95.83, "elapsed_time": "1 day, 8:51:32", "remaining_time": "1:25:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10401, "total_steps": 10853, "loss": 0.1218, "learning_rate": 2.3674600240382594e-08, "epoch": 0.9583083797853227, "percentage": 95.84, "elapsed_time": "1 day, 8:51:43", "remaining_time": "1:25:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10402, "total_steps": 10853, "loss": 0.1234, "learning_rate": 2.3570125986518977e-08, "epoch": 0.9584005159625927, "percentage": 95.84, "elapsed_time": "1 day, 8:51:53", "remaining_time": "1:25:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10403, "total_steps": 10853, "loss": 0.115, "learning_rate": 2.346588166943581e-08, "epoch": 0.9584926521398627, "percentage": 95.85, "elapsed_time": "1 day, 8:52:03", "remaining_time": "1:25:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10404, "total_steps": 10853, "loss": 0.1194, "learning_rate": 2.336186729881229e-08, "epoch": 0.9585847883171327, "percentage": 95.86, "elapsed_time": "1 day, 8:52:13", "remaining_time": "1:25:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10405, "total_steps": 10853, "loss": 0.1186, "learning_rate": 2.32580828843057e-08, "epoch": 0.9586769244944028, "percentage": 95.87, "elapsed_time": "1 day, 8:52:24", "remaining_time": "1:24:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10406, "total_steps": 10853, "loss": 0.1092, "learning_rate": 2.3154528435553046e-08, "epoch": 0.9587690606716728, "percentage": 95.88, "elapsed_time": "1 day, 8:52:35", "remaining_time": "1:24:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10407, "total_steps": 10853, "loss": 0.0984, "learning_rate": 2.3051203962168588e-08, "epoch": 0.9588611968489428, "percentage": 95.89, "elapsed_time": "1 day, 8:52:45", "remaining_time": "1:24:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10408, "total_steps": 10853, "loss": 0.1201, "learning_rate": 2.2948109473746593e-08, "epoch": 0.9589533330262128, "percentage": 95.9, "elapsed_time": "1 day, 8:52:55", "remaining_time": "1:24:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10409, "total_steps": 10853, "loss": 0.1207, "learning_rate": 2.2845244979859127e-08, "epoch": 0.9590454692034828, "percentage": 95.91, "elapsed_time": "1 day, 8:53:07", "remaining_time": "1:24:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10410, "total_steps": 10853, "loss": 0.1243, "learning_rate": 2.274261049005716e-08, "epoch": 0.9591376053807528, "percentage": 95.92, "elapsed_time": "1 day, 8:53:17", "remaining_time": "1:23:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10411, "total_steps": 10853, "loss": 0.1186, "learning_rate": 2.264020601387057e-08, "epoch": 0.9592297415580228, "percentage": 95.93, "elapsed_time": "1 day, 8:53:29", "remaining_time": "1:23:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10412, "total_steps": 10853, "loss": 0.1362, "learning_rate": 2.2538031560807584e-08, "epoch": 0.9593218777352928, "percentage": 95.94, "elapsed_time": "1 day, 8:53:40", "remaining_time": "1:23:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10413, "total_steps": 10853, "loss": 0.1276, "learning_rate": 2.243608714035478e-08, "epoch": 0.9594140139125628, "percentage": 95.95, "elapsed_time": "1 day, 8:53:50", "remaining_time": "1:23:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10414, "total_steps": 10853, "loss": 0.1123, "learning_rate": 2.2334372761977918e-08, "epoch": 0.9595061500898328, "percentage": 95.96, "elapsed_time": "1 day, 8:54:01", "remaining_time": "1:23:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10415, "total_steps": 10853, "loss": 0.1082, "learning_rate": 2.2232888435121115e-08, "epoch": 0.9595982862671028, "percentage": 95.96, "elapsed_time": "1 day, 8:54:12", "remaining_time": "1:23:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10416, "total_steps": 10853, "loss": 0.1001, "learning_rate": 2.213163416920766e-08, "epoch": 0.9596904224443727, "percentage": 95.97, "elapsed_time": "1 day, 8:54:24", "remaining_time": "1:22:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10417, "total_steps": 10853, "loss": 0.1357, "learning_rate": 2.203060997363837e-08, "epoch": 0.9597825586216427, "percentage": 95.98, "elapsed_time": "1 day, 8:54:35", "remaining_time": "1:22:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10418, "total_steps": 10853, "loss": 0.1232, "learning_rate": 2.1929815857793802e-08, "epoch": 0.9598746947989127, "percentage": 95.99, "elapsed_time": "1 day, 8:54:46", "remaining_time": "1:22:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10419, "total_steps": 10853, "loss": 0.1048, "learning_rate": 2.1829251831032293e-08, "epoch": 0.9599668309761828, "percentage": 96.0, "elapsed_time": "1 day, 8:54:57", "remaining_time": "1:22:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10420, "total_steps": 10853, "loss": 0.1191, "learning_rate": 2.172891790269166e-08, "epoch": 0.9600589671534528, "percentage": 96.01, "elapsed_time": "1 day, 8:55:08", "remaining_time": "1:22:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10421, "total_steps": 10853, "loss": 0.1059, "learning_rate": 2.1628814082087503e-08, "epoch": 0.9601511033307228, "percentage": 96.02, "elapsed_time": "1 day, 8:55:19", "remaining_time": "1:21:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10422, "total_steps": 10853, "loss": 0.1162, "learning_rate": 2.1528940378514885e-08, "epoch": 0.9602432395079928, "percentage": 96.03, "elapsed_time": "1 day, 8:55:31", "remaining_time": "1:21:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10423, "total_steps": 10853, "loss": 0.1193, "learning_rate": 2.142929680124667e-08, "epoch": 0.9603353756852628, "percentage": 96.04, "elapsed_time": "1 day, 8:55:43", "remaining_time": "1:21:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10424, "total_steps": 10853, "loss": 0.1224, "learning_rate": 2.1329883359535174e-08, "epoch": 0.9604275118625328, "percentage": 96.05, "elapsed_time": "1 day, 8:55:54", "remaining_time": "1:21:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10425, "total_steps": 10853, "loss": 0.1116, "learning_rate": 2.12307000626108e-08, "epoch": 0.9605196480398028, "percentage": 96.06, "elapsed_time": "1 day, 8:56:04", "remaining_time": "1:21:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10426, "total_steps": 10853, "loss": 0.1222, "learning_rate": 2.113174691968256e-08, "epoch": 0.9606117842170728, "percentage": 96.07, "elapsed_time": "1 day, 8:56:15", "remaining_time": "1:20:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10427, "total_steps": 10853, "loss": 0.1215, "learning_rate": 2.103302393993867e-08, "epoch": 0.9607039203943428, "percentage": 96.07, "elapsed_time": "1 day, 8:56:27", "remaining_time": "1:20:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10428, "total_steps": 10853, "loss": 0.1119, "learning_rate": 2.0934531132544845e-08, "epoch": 0.9607960565716128, "percentage": 96.08, "elapsed_time": "1 day, 8:56:39", "remaining_time": "1:20:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10429, "total_steps": 10853, "loss": 0.1159, "learning_rate": 2.0836268506647108e-08, "epoch": 0.9608881927488828, "percentage": 96.09, "elapsed_time": "1 day, 8:56:50", "remaining_time": "1:20:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10430, "total_steps": 10853, "loss": 0.1267, "learning_rate": 2.0738236071368157e-08, "epoch": 0.9609803289261528, "percentage": 96.1, "elapsed_time": "1 day, 8:57:01", "remaining_time": "1:20:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10431, "total_steps": 10853, "loss": 0.124, "learning_rate": 2.0640433835810992e-08, "epoch": 0.9610724651034228, "percentage": 96.11, "elapsed_time": "1 day, 8:57:13", "remaining_time": "1:19:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10432, "total_steps": 10853, "loss": 0.1195, "learning_rate": 2.0542861809056403e-08, "epoch": 0.9611646012806928, "percentage": 96.12, "elapsed_time": "1 day, 8:57:24", "remaining_time": "1:19:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10433, "total_steps": 10853, "loss": 0.1221, "learning_rate": 2.044552000016409e-08, "epoch": 0.9612567374579629, "percentage": 96.13, "elapsed_time": "1 day, 8:57:36", "remaining_time": "1:19:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10434, "total_steps": 10853, "loss": 0.1264, "learning_rate": 2.0348408418172095e-08, "epoch": 0.9613488736352329, "percentage": 96.14, "elapsed_time": "1 day, 8:57:47", "remaining_time": "1:19:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10435, "total_steps": 10853, "loss": 0.1254, "learning_rate": 2.025152707209682e-08, "epoch": 0.9614410098125029, "percentage": 96.15, "elapsed_time": "1 day, 8:57:58", "remaining_time": "1:19:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10436, "total_steps": 10853, "loss": 0.1203, "learning_rate": 2.0154875970934406e-08, "epoch": 0.9615331459897729, "percentage": 96.16, "elapsed_time": "1 day, 8:58:10", "remaining_time": "1:19:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10437, "total_steps": 10853, "loss": 0.1034, "learning_rate": 2.0058455123658783e-08, "epoch": 0.9616252821670429, "percentage": 96.17, "elapsed_time": "1 day, 8:58:22", "remaining_time": "1:18:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10438, "total_steps": 10853, "loss": 0.1133, "learning_rate": 1.996226453922251e-08, "epoch": 0.9617174183443129, "percentage": 96.18, "elapsed_time": "1 day, 8:58:32", "remaining_time": "1:18:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10439, "total_steps": 10853, "loss": 0.122, "learning_rate": 1.98663042265565e-08, "epoch": 0.9618095545215829, "percentage": 96.19, "elapsed_time": "1 day, 8:58:43", "remaining_time": "1:18:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10440, "total_steps": 10853, "loss": 0.1164, "learning_rate": 1.97705741945714e-08, "epoch": 0.9619016906988529, "percentage": 96.19, "elapsed_time": "1 day, 8:58:54", "remaining_time": "1:18:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10441, "total_steps": 10853, "loss": 0.122, "learning_rate": 1.9675074452155385e-08, "epoch": 0.9619938268761229, "percentage": 96.2, "elapsed_time": "1 day, 8:59:06", "remaining_time": "1:18:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10442, "total_steps": 10853, "loss": 0.1125, "learning_rate": 1.9579805008175524e-08, "epoch": 0.9620859630533929, "percentage": 96.21, "elapsed_time": "1 day, 8:59:17", "remaining_time": "1:17:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10443, "total_steps": 10853, "loss": 0.124, "learning_rate": 1.9484765871477795e-08, "epoch": 0.9621780992306629, "percentage": 96.22, "elapsed_time": "1 day, 8:59:29", "remaining_time": "1:17:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10444, "total_steps": 10853, "loss": 0.1299, "learning_rate": 1.9389957050886255e-08, "epoch": 0.9622702354079329, "percentage": 96.23, "elapsed_time": "1 day, 8:59:40", "remaining_time": "1:17:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10445, "total_steps": 10853, "loss": 0.1108, "learning_rate": 1.9295378555204692e-08, "epoch": 0.9623623715852029, "percentage": 96.24, "elapsed_time": "1 day, 8:59:50", "remaining_time": "1:17:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10446, "total_steps": 10853, "loss": 0.1038, "learning_rate": 1.920103039321386e-08, "epoch": 0.962454507762473, "percentage": 96.25, "elapsed_time": "1 day, 9:00:01", "remaining_time": "1:17:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10447, "total_steps": 10853, "loss": 0.1185, "learning_rate": 1.910691257367425e-08, "epoch": 0.962546643939743, "percentage": 96.26, "elapsed_time": "1 day, 9:00:12", "remaining_time": "1:16:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10448, "total_steps": 10853, "loss": 0.1156, "learning_rate": 1.9013025105324988e-08, "epoch": 0.962638780117013, "percentage": 96.27, "elapsed_time": "1 day, 9:00:23", "remaining_time": "1:16:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10449, "total_steps": 10853, "loss": 0.1358, "learning_rate": 1.8919367996883263e-08, "epoch": 0.962730916294283, "percentage": 96.28, "elapsed_time": "1 day, 9:00:33", "remaining_time": "1:16:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10450, "total_steps": 10853, "loss": 0.1215, "learning_rate": 1.8825941257045178e-08, "epoch": 0.962823052471553, "percentage": 96.29, "elapsed_time": "1 day, 9:00:45", "remaining_time": "1:16:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10451, "total_steps": 10853, "loss": 0.1147, "learning_rate": 1.8732744894485732e-08, "epoch": 0.962915188648823, "percentage": 96.3, "elapsed_time": "1 day, 9:00:57", "remaining_time": "1:16:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10452, "total_steps": 10853, "loss": 0.1154, "learning_rate": 1.8639778917857732e-08, "epoch": 0.963007324826093, "percentage": 96.31, "elapsed_time": "1 day, 9:01:08", "remaining_time": "1:16:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10453, "total_steps": 10853, "loss": 0.1207, "learning_rate": 1.8547043335793435e-08, "epoch": 0.963099461003363, "percentage": 96.31, "elapsed_time": "1 day, 9:01:20", "remaining_time": "1:15:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10454, "total_steps": 10853, "loss": 0.1165, "learning_rate": 1.845453815690318e-08, "epoch": 0.963191597180633, "percentage": 96.32, "elapsed_time": "1 day, 9:01:30", "remaining_time": "1:15:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10455, "total_steps": 10853, "loss": 0.1158, "learning_rate": 1.8362263389775926e-08, "epoch": 0.963283733357903, "percentage": 96.33, "elapsed_time": "1 day, 9:01:41", "remaining_time": "1:15:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10456, "total_steps": 10853, "loss": 0.1068, "learning_rate": 1.827021904297982e-08, "epoch": 0.963375869535173, "percentage": 96.34, "elapsed_time": "1 day, 9:01:53", "remaining_time": "1:15:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10457, "total_steps": 10853, "loss": 0.1254, "learning_rate": 1.8178405125060804e-08, "epoch": 0.963468005712443, "percentage": 96.35, "elapsed_time": "1 day, 9:02:04", "remaining_time": "1:15:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10458, "total_steps": 10853, "loss": 0.1093, "learning_rate": 1.8086821644544283e-08, "epoch": 0.963560141889713, "percentage": 96.36, "elapsed_time": "1 day, 9:02:14", "remaining_time": "1:14:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10459, "total_steps": 10853, "loss": 0.1197, "learning_rate": 1.7995468609933176e-08, "epoch": 0.963652278066983, "percentage": 96.37, "elapsed_time": "1 day, 9:02:25", "remaining_time": "1:14:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10460, "total_steps": 10853, "loss": 0.1174, "learning_rate": 1.790434602971014e-08, "epoch": 0.9637444142442531, "percentage": 96.38, "elapsed_time": "1 day, 9:02:36", "remaining_time": "1:14:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10461, "total_steps": 10853, "loss": 0.1207, "learning_rate": 1.7813453912335354e-08, "epoch": 0.963836550421523, "percentage": 96.39, "elapsed_time": "1 day, 9:02:47", "remaining_time": "1:14:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10462, "total_steps": 10853, "loss": 0.1189, "learning_rate": 1.772279226624901e-08, "epoch": 0.963928686598793, "percentage": 96.4, "elapsed_time": "1 day, 9:02:58", "remaining_time": "1:14:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10463, "total_steps": 10853, "loss": 0.1148, "learning_rate": 1.7632361099867988e-08, "epoch": 0.964020822776063, "percentage": 96.41, "elapsed_time": "1 day, 9:03:08", "remaining_time": "1:13:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10464, "total_steps": 10853, "loss": 0.1204, "learning_rate": 1.7542160421590017e-08, "epoch": 0.964112958953333, "percentage": 96.42, "elapsed_time": "1 day, 9:03:19", "remaining_time": "1:13:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10465, "total_steps": 10853, "loss": 0.1125, "learning_rate": 1.7452190239789225e-08, "epoch": 0.964205095130603, "percentage": 96.42, "elapsed_time": "1 day, 9:03:30", "remaining_time": "1:13:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10466, "total_steps": 10853, "loss": 0.1112, "learning_rate": 1.7362450562819765e-08, "epoch": 0.964297231307873, "percentage": 96.43, "elapsed_time": "1 day, 9:03:41", "remaining_time": "1:13:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10467, "total_steps": 10853, "loss": 0.1203, "learning_rate": 1.7272941399013865e-08, "epoch": 0.964389367485143, "percentage": 96.44, "elapsed_time": "1 day, 9:03:51", "remaining_time": "1:13:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10468, "total_steps": 10853, "loss": 0.1135, "learning_rate": 1.718366275668265e-08, "epoch": 0.964481503662413, "percentage": 96.45, "elapsed_time": "1 day, 9:04:03", "remaining_time": "1:12:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10469, "total_steps": 10853, "loss": 0.1202, "learning_rate": 1.7094614644115605e-08, "epoch": 0.964573639839683, "percentage": 96.46, "elapsed_time": "1 day, 9:04:14", "remaining_time": "1:12:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10470, "total_steps": 10853, "loss": 0.1116, "learning_rate": 1.700579706958083e-08, "epoch": 0.964665776016953, "percentage": 96.47, "elapsed_time": "1 day, 9:04:25", "remaining_time": "1:12:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10471, "total_steps": 10853, "loss": 0.1239, "learning_rate": 1.6917210041325073e-08, "epoch": 0.964757912194223, "percentage": 96.48, "elapsed_time": "1 day, 9:04:36", "remaining_time": "1:12:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10472, "total_steps": 10853, "loss": 0.1103, "learning_rate": 1.6828853567573413e-08, "epoch": 0.964850048371493, "percentage": 96.49, "elapsed_time": "1 day, 9:04:46", "remaining_time": "1:12:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10473, "total_steps": 10853, "loss": 0.1229, "learning_rate": 1.6740727656529844e-08, "epoch": 0.9649421845487631, "percentage": 96.5, "elapsed_time": "1 day, 9:04:57", "remaining_time": "1:12:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10474, "total_steps": 10853, "loss": 0.1136, "learning_rate": 1.6652832316377264e-08, "epoch": 0.9650343207260331, "percentage": 96.51, "elapsed_time": "1 day, 9:05:08", "remaining_time": "1:11:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10475, "total_steps": 10853, "loss": 0.108, "learning_rate": 1.6565167555276373e-08, "epoch": 0.9651264569033031, "percentage": 96.52, "elapsed_time": "1 day, 9:05:19", "remaining_time": "1:11:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10476, "total_steps": 10853, "loss": 0.1172, "learning_rate": 1.6477733381367043e-08, "epoch": 0.9652185930805731, "percentage": 96.53, "elapsed_time": "1 day, 9:05:31", "remaining_time": "1:11:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10477, "total_steps": 10853, "loss": 0.1171, "learning_rate": 1.639052980276723e-08, "epoch": 0.9653107292578431, "percentage": 96.54, "elapsed_time": "1 day, 9:05:42", "remaining_time": "1:11:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10478, "total_steps": 10853, "loss": 0.1103, "learning_rate": 1.6303556827574062e-08, "epoch": 0.9654028654351131, "percentage": 96.54, "elapsed_time": "1 day, 9:05:52", "remaining_time": "1:11:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10479, "total_steps": 10853, "loss": 0.1112, "learning_rate": 1.6216814463863028e-08, "epoch": 0.9654950016123831, "percentage": 96.55, "elapsed_time": "1 day, 9:06:03", "remaining_time": "1:10:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10480, "total_steps": 10853, "loss": 0.1148, "learning_rate": 1.6130302719687962e-08, "epoch": 0.9655871377896531, "percentage": 96.56, "elapsed_time": "1 day, 9:06:15", "remaining_time": "1:10:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10481, "total_steps": 10853, "loss": 0.1188, "learning_rate": 1.6044021603081607e-08, "epoch": 0.9656792739669231, "percentage": 96.57, "elapsed_time": "1 day, 9:06:26", "remaining_time": "1:10:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10482, "total_steps": 10853, "loss": 0.1224, "learning_rate": 1.5957971122055327e-08, "epoch": 0.9657714101441931, "percentage": 96.58, "elapsed_time": "1 day, 9:06:36", "remaining_time": "1:10:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10483, "total_steps": 10853, "loss": 0.1106, "learning_rate": 1.5872151284598848e-08, "epoch": 0.9658635463214631, "percentage": 96.59, "elapsed_time": "1 day, 9:06:47", "remaining_time": "1:10:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10484, "total_steps": 10853, "loss": 0.1217, "learning_rate": 1.5786562098680235e-08, "epoch": 0.9659556824987331, "percentage": 96.6, "elapsed_time": "1 day, 9:06:57", "remaining_time": "1:09:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10485, "total_steps": 10853, "loss": 0.1133, "learning_rate": 1.570120357224647e-08, "epoch": 0.9660478186760031, "percentage": 96.61, "elapsed_time": "1 day, 9:07:08", "remaining_time": "1:09:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10486, "total_steps": 10853, "loss": 0.1093, "learning_rate": 1.561607571322371e-08, "epoch": 0.9661399548532731, "percentage": 96.62, "elapsed_time": "1 day, 9:07:19", "remaining_time": "1:09:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10487, "total_steps": 10853, "loss": 0.1097, "learning_rate": 1.5531178529515635e-08, "epoch": 0.9662320910305432, "percentage": 96.63, "elapsed_time": "1 day, 9:07:29", "remaining_time": "1:09:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10488, "total_steps": 10853, "loss": 0.1054, "learning_rate": 1.54465120290051e-08, "epoch": 0.9663242272078132, "percentage": 96.64, "elapsed_time": "1 day, 9:07:39", "remaining_time": "1:09:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10489, "total_steps": 10853, "loss": 0.1167, "learning_rate": 1.5362076219553048e-08, "epoch": 0.9664163633850832, "percentage": 96.65, "elapsed_time": "1 day, 9:07:51", "remaining_time": "1:08:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10490, "total_steps": 10853, "loss": 0.1196, "learning_rate": 1.5277871108999586e-08, "epoch": 0.9665084995623532, "percentage": 96.66, "elapsed_time": "1 day, 9:08:02", "remaining_time": "1:08:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10491, "total_steps": 10853, "loss": 0.1264, "learning_rate": 1.519389670516347e-08, "epoch": 0.9666006357396232, "percentage": 96.66, "elapsed_time": "1 day, 9:08:12", "remaining_time": "1:08:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10492, "total_steps": 10853, "loss": 0.1155, "learning_rate": 1.511015301584151e-08, "epoch": 0.9666927719168932, "percentage": 96.67, "elapsed_time": "1 day, 9:08:23", "remaining_time": "1:08:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10493, "total_steps": 10853, "loss": 0.1104, "learning_rate": 1.502664004880888e-08, "epoch": 0.9667849080941632, "percentage": 96.68, "elapsed_time": "1 day, 9:08:34", "remaining_time": "1:08:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10494, "total_steps": 10853, "loss": 0.1179, "learning_rate": 1.4943357811820492e-08, "epoch": 0.9668770442714332, "percentage": 96.69, "elapsed_time": "1 day, 9:08:45", "remaining_time": "1:08:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10495, "total_steps": 10853, "loss": 0.1246, "learning_rate": 1.4860306312608762e-08, "epoch": 0.9669691804487032, "percentage": 96.7, "elapsed_time": "1 day, 9:08:56", "remaining_time": "1:07:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10496, "total_steps": 10853, "loss": 0.1193, "learning_rate": 1.4777485558884753e-08, "epoch": 0.9670613166259732, "percentage": 96.71, "elapsed_time": "1 day, 9:09:07", "remaining_time": "1:07:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10497, "total_steps": 10853, "loss": 0.1222, "learning_rate": 1.4694895558338972e-08, "epoch": 0.9671534528032432, "percentage": 96.72, "elapsed_time": "1 day, 9:09:17", "remaining_time": "1:07:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10498, "total_steps": 10853, "loss": 0.1188, "learning_rate": 1.4612536318639459e-08, "epoch": 0.9672455889805132, "percentage": 96.73, "elapsed_time": "1 day, 9:09:28", "remaining_time": "1:07:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10499, "total_steps": 10853, "loss": 0.1288, "learning_rate": 1.4530407847433702e-08, "epoch": 0.9673377251577832, "percentage": 96.74, "elapsed_time": "1 day, 9:09:39", "remaining_time": "1:07:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10500, "total_steps": 10853, "loss": 0.1133, "learning_rate": 1.4448510152346717e-08, "epoch": 0.9674298613350532, "percentage": 96.75, "elapsed_time": "1 day, 9:09:50", "remaining_time": "1:06:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10500, "total_steps": 10853, "eval_loss": 0.11658257246017456, "epoch": 0.9674298613350532, "percentage": 96.75, "elapsed_time": "1 day, 9:14:51", "remaining_time": "1:07:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10501, "total_steps": 10853, "loss": 0.1149, "learning_rate": 1.4366843240982975e-08, "epoch": 0.9675219975123233, "percentage": 96.76, "elapsed_time": "1 day, 9:15:03", "remaining_time": "1:06:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10502, "total_steps": 10853, "loss": 0.1203, "learning_rate": 1.4285407120925854e-08, "epoch": 0.9676141336895933, "percentage": 96.77, "elapsed_time": "1 day, 9:15:14", "remaining_time": "1:06:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10503, "total_steps": 10853, "loss": 0.1048, "learning_rate": 1.4204201799735973e-08, "epoch": 0.9677062698668633, "percentage": 96.78, "elapsed_time": "1 day, 9:15:23", "remaining_time": "1:06:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10504, "total_steps": 10853, "loss": 0.1076, "learning_rate": 1.412322728495341e-08, "epoch": 0.9677984060441333, "percentage": 96.78, "elapsed_time": "1 day, 9:15:34", "remaining_time": "1:06:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10505, "total_steps": 10853, "loss": 0.1125, "learning_rate": 1.40424835840966e-08, "epoch": 0.9678905422214032, "percentage": 96.79, "elapsed_time": "1 day, 9:15:46", "remaining_time": "1:06:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10506, "total_steps": 10853, "loss": 0.1061, "learning_rate": 1.3961970704662875e-08, "epoch": 0.9679826783986732, "percentage": 96.8, "elapsed_time": "1 day, 9:15:57", "remaining_time": "1:05:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10507, "total_steps": 10853, "loss": 0.1051, "learning_rate": 1.3881688654127645e-08, "epoch": 0.9680748145759432, "percentage": 96.81, "elapsed_time": "1 day, 9:16:08", "remaining_time": "1:05:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10508, "total_steps": 10853, "loss": 0.1203, "learning_rate": 1.3801637439945225e-08, "epoch": 0.9681669507532132, "percentage": 96.82, "elapsed_time": "1 day, 9:16:19", "remaining_time": "1:05:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10509, "total_steps": 10853, "loss": 0.1178, "learning_rate": 1.3721817069548282e-08, "epoch": 0.9682590869304832, "percentage": 96.83, "elapsed_time": "1 day, 9:16:29", "remaining_time": "1:05:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10510, "total_steps": 10853, "loss": 0.1199, "learning_rate": 1.3642227550348387e-08, "epoch": 0.9683512231077532, "percentage": 96.84, "elapsed_time": "1 day, 9:16:39", "remaining_time": "1:05:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10511, "total_steps": 10853, "loss": 0.104, "learning_rate": 1.3562868889735182e-08, "epoch": 0.9684433592850232, "percentage": 96.85, "elapsed_time": "1 day, 9:16:51", "remaining_time": "1:04:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10512, "total_steps": 10853, "loss": 0.1223, "learning_rate": 1.348374109507694e-08, "epoch": 0.9685354954622932, "percentage": 96.86, "elapsed_time": "1 day, 9:17:01", "remaining_time": "1:04:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10513, "total_steps": 10853, "loss": 0.1183, "learning_rate": 1.3404844173721398e-08, "epoch": 0.9686276316395632, "percentage": 96.87, "elapsed_time": "1 day, 9:17:13", "remaining_time": "1:04:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10514, "total_steps": 10853, "loss": 0.1234, "learning_rate": 1.332617813299325e-08, "epoch": 0.9687197678168333, "percentage": 96.88, "elapsed_time": "1 day, 9:17:23", "remaining_time": "1:04:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10515, "total_steps": 10853, "loss": 0.1115, "learning_rate": 1.324774298019721e-08, "epoch": 0.9688119039941033, "percentage": 96.89, "elapsed_time": "1 day, 9:17:34", "remaining_time": "1:04:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10516, "total_steps": 10853, "loss": 0.1205, "learning_rate": 1.316953872261606e-08, "epoch": 0.9689040401713733, "percentage": 96.89, "elapsed_time": "1 day, 9:17:44", "remaining_time": "1:04:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10517, "total_steps": 10853, "loss": 0.1111, "learning_rate": 1.3091565367510661e-08, "epoch": 0.9689961763486433, "percentage": 96.9, "elapsed_time": "1 day, 9:17:55", "remaining_time": "1:03:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10518, "total_steps": 10853, "loss": 0.1164, "learning_rate": 1.3013822922121332e-08, "epoch": 0.9690883125259133, "percentage": 96.91, "elapsed_time": "1 day, 9:18:06", "remaining_time": "1:03:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10519, "total_steps": 10853, "loss": 0.1154, "learning_rate": 1.2936311393665912e-08, "epoch": 0.9691804487031833, "percentage": 96.92, "elapsed_time": "1 day, 9:18:16", "remaining_time": "1:03:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10520, "total_steps": 10853, "loss": 0.1109, "learning_rate": 1.2859030789341698e-08, "epoch": 0.9692725848804533, "percentage": 96.93, "elapsed_time": "1 day, 9:18:26", "remaining_time": "1:03:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10521, "total_steps": 10853, "loss": 0.1073, "learning_rate": 1.278198111632406e-08, "epoch": 0.9693647210577233, "percentage": 96.94, "elapsed_time": "1 day, 9:18:36", "remaining_time": "1:03:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10522, "total_steps": 10853, "loss": 0.1166, "learning_rate": 1.2705162381767277e-08, "epoch": 0.9694568572349933, "percentage": 96.95, "elapsed_time": "1 day, 9:18:47", "remaining_time": "1:02:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10523, "total_steps": 10853, "loss": 0.1131, "learning_rate": 1.2628574592803977e-08, "epoch": 0.9695489934122633, "percentage": 96.96, "elapsed_time": "1 day, 9:18:58", "remaining_time": "1:02:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10524, "total_steps": 10853, "loss": 0.1115, "learning_rate": 1.2552217756545137e-08, "epoch": 0.9696411295895333, "percentage": 96.97, "elapsed_time": "1 day, 9:19:10", "remaining_time": "1:02:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10525, "total_steps": 10853, "loss": 0.1189, "learning_rate": 1.2476091880080366e-08, "epoch": 0.9697332657668033, "percentage": 96.98, "elapsed_time": "1 day, 9:19:20", "remaining_time": "1:02:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10526, "total_steps": 10853, "loss": 0.1234, "learning_rate": 1.240019697047845e-08, "epoch": 0.9698254019440733, "percentage": 96.99, "elapsed_time": "1 day, 9:19:30", "remaining_time": "1:02:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10527, "total_steps": 10853, "loss": 0.1086, "learning_rate": 1.2324533034785702e-08, "epoch": 0.9699175381213433, "percentage": 97.0, "elapsed_time": "1 day, 9:19:40", "remaining_time": "1:01:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10528, "total_steps": 10853, "loss": 0.1089, "learning_rate": 1.2249100080028164e-08, "epoch": 0.9700096742986134, "percentage": 97.01, "elapsed_time": "1 day, 9:19:51", "remaining_time": "1:01:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10529, "total_steps": 10853, "loss": 0.1191, "learning_rate": 1.2173898113209126e-08, "epoch": 0.9701018104758834, "percentage": 97.01, "elapsed_time": "1 day, 9:20:02", "remaining_time": "1:01:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10530, "total_steps": 10853, "loss": 0.1188, "learning_rate": 1.2098927141311333e-08, "epoch": 0.9701939466531534, "percentage": 97.02, "elapsed_time": "1 day, 9:20:13", "remaining_time": "1:01:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10531, "total_steps": 10853, "loss": 0.1207, "learning_rate": 1.2024187171296165e-08, "epoch": 0.9702860828304234, "percentage": 97.03, "elapsed_time": "1 day, 9:20:24", "remaining_time": "1:01:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10532, "total_steps": 10853, "loss": 0.1141, "learning_rate": 1.1949678210102788e-08, "epoch": 0.9703782190076934, "percentage": 97.04, "elapsed_time": "1 day, 9:20:34", "remaining_time": "1:00:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10533, "total_steps": 10853, "loss": 0.1137, "learning_rate": 1.1875400264649562e-08, "epoch": 0.9704703551849634, "percentage": 97.05, "elapsed_time": "1 day, 9:20:46", "remaining_time": "1:00:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10534, "total_steps": 10853, "loss": 0.1106, "learning_rate": 1.1801353341833466e-08, "epoch": 0.9705624913622334, "percentage": 97.06, "elapsed_time": "1 day, 9:20:57", "remaining_time": "1:00:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10535, "total_steps": 10853, "loss": 0.1079, "learning_rate": 1.1727537448529003e-08, "epoch": 0.9706546275395034, "percentage": 97.07, "elapsed_time": "1 day, 9:21:07", "remaining_time": "1:00:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10536, "total_steps": 10853, "loss": 0.1169, "learning_rate": 1.1653952591590967e-08, "epoch": 0.9707467637167734, "percentage": 97.08, "elapsed_time": "1 day, 9:21:17", "remaining_time": "1:00:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10537, "total_steps": 10853, "loss": 0.1115, "learning_rate": 1.1580598777850837e-08, "epoch": 0.9708388998940434, "percentage": 97.09, "elapsed_time": "1 day, 9:21:28", "remaining_time": "1:00:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10538, "total_steps": 10853, "loss": 0.1081, "learning_rate": 1.1507476014120112e-08, "epoch": 0.9709310360713134, "percentage": 97.1, "elapsed_time": "1 day, 9:21:39", "remaining_time": "0:59:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10539, "total_steps": 10853, "loss": 0.12, "learning_rate": 1.143458430718808e-08, "epoch": 0.9710231722485834, "percentage": 97.11, "elapsed_time": "1 day, 9:21:49", "remaining_time": "0:59:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10540, "total_steps": 10853, "loss": 0.1229, "learning_rate": 1.136192366382266e-08, "epoch": 0.9711153084258534, "percentage": 97.12, "elapsed_time": "1 day, 9:22:01", "remaining_time": "0:59:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10541, "total_steps": 10853, "loss": 0.1144, "learning_rate": 1.128949409077068e-08, "epoch": 0.9712074446031235, "percentage": 97.13, "elapsed_time": "1 day, 9:22:12", "remaining_time": "0:59:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10542, "total_steps": 10853, "loss": 0.118, "learning_rate": 1.121729559475676e-08, "epoch": 0.9712995807803935, "percentage": 97.13, "elapsed_time": "1 day, 9:22:22", "remaining_time": "0:59:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10543, "total_steps": 10853, "loss": 0.1097, "learning_rate": 1.1145328182484706e-08, "epoch": 0.9713917169576635, "percentage": 97.14, "elapsed_time": "1 day, 9:22:33", "remaining_time": "0:58:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10544, "total_steps": 10853, "loss": 0.1156, "learning_rate": 1.1073591860636946e-08, "epoch": 0.9714838531349335, "percentage": 97.15, "elapsed_time": "1 day, 9:22:45", "remaining_time": "0:58:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10545, "total_steps": 10853, "loss": 0.1241, "learning_rate": 1.1002086635873987e-08, "epoch": 0.9715759893122035, "percentage": 97.16, "elapsed_time": "1 day, 9:22:55", "remaining_time": "0:58:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10546, "total_steps": 10853, "loss": 0.1213, "learning_rate": 1.0930812514835243e-08, "epoch": 0.9716681254894735, "percentage": 97.17, "elapsed_time": "1 day, 9:23:05", "remaining_time": "0:58:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10547, "total_steps": 10853, "loss": 0.1083, "learning_rate": 1.0859769504138196e-08, "epoch": 0.9717602616667435, "percentage": 97.18, "elapsed_time": "1 day, 9:23:17", "remaining_time": "0:58:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10548, "total_steps": 10853, "loss": 0.1113, "learning_rate": 1.0788957610379791e-08, "epoch": 0.9718523978440134, "percentage": 97.19, "elapsed_time": "1 day, 9:23:27", "remaining_time": "0:57:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10549, "total_steps": 10853, "loss": 0.1117, "learning_rate": 1.0718376840134214e-08, "epoch": 0.9719445340212834, "percentage": 97.2, "elapsed_time": "1 day, 9:23:38", "remaining_time": "0:57:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10550, "total_steps": 10853, "loss": 0.1214, "learning_rate": 1.0648027199955391e-08, "epoch": 0.9720366701985534, "percentage": 97.21, "elapsed_time": "1 day, 9:23:49", "remaining_time": "0:57:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10551, "total_steps": 10853, "loss": 0.1165, "learning_rate": 1.0577908696375316e-08, "epoch": 0.9721288063758234, "percentage": 97.22, "elapsed_time": "1 day, 9:24:01", "remaining_time": "0:57:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10552, "total_steps": 10853, "loss": 0.1156, "learning_rate": 1.0508021335904061e-08, "epoch": 0.9722209425530934, "percentage": 97.23, "elapsed_time": "1 day, 9:24:11", "remaining_time": "0:57:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10553, "total_steps": 10853, "loss": 0.1192, "learning_rate": 1.0438365125031158e-08, "epoch": 0.9723130787303634, "percentage": 97.24, "elapsed_time": "1 day, 9:24:22", "remaining_time": "0:56:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10554, "total_steps": 10853, "loss": 0.1135, "learning_rate": 1.0368940070223932e-08, "epoch": 0.9724052149076334, "percentage": 97.25, "elapsed_time": "1 day, 9:24:33", "remaining_time": "0:56:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10555, "total_steps": 10853, "loss": 0.1158, "learning_rate": 1.0299746177928338e-08, "epoch": 0.9724973510849035, "percentage": 97.25, "elapsed_time": "1 day, 9:24:44", "remaining_time": "0:56:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10556, "total_steps": 10853, "loss": 0.1143, "learning_rate": 1.0230783454569515e-08, "epoch": 0.9725894872621735, "percentage": 97.26, "elapsed_time": "1 day, 9:24:53", "remaining_time": "0:56:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10557, "total_steps": 10853, "loss": 0.1136, "learning_rate": 1.0162051906550397e-08, "epoch": 0.9726816234394435, "percentage": 97.27, "elapsed_time": "1 day, 9:25:03", "remaining_time": "0:56:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10558, "total_steps": 10853, "loss": 0.1071, "learning_rate": 1.0093551540252822e-08, "epoch": 0.9727737596167135, "percentage": 97.28, "elapsed_time": "1 day, 9:25:12", "remaining_time": "0:56:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10559, "total_steps": 10853, "loss": 0.1206, "learning_rate": 1.0025282362036704e-08, "epoch": 0.9728658957939835, "percentage": 97.29, "elapsed_time": "1 day, 9:25:25", "remaining_time": "0:55:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10560, "total_steps": 10853, "loss": 0.1101, "learning_rate": 9.957244378241138e-09, "epoch": 0.9729580319712535, "percentage": 97.3, "elapsed_time": "1 day, 9:25:35", "remaining_time": "0:55:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10561, "total_steps": 10853, "loss": 0.1244, "learning_rate": 9.889437595183293e-09, "epoch": 0.9730501681485235, "percentage": 97.31, "elapsed_time": "1 day, 9:25:44", "remaining_time": "0:55:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10562, "total_steps": 10853, "loss": 0.1231, "learning_rate": 9.821862019159522e-09, "epoch": 0.9731423043257935, "percentage": 97.32, "elapsed_time": "1 day, 9:25:55", "remaining_time": "0:55:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10563, "total_steps": 10853, "loss": 0.1221, "learning_rate": 9.754517656443697e-09, "epoch": 0.9732344405030635, "percentage": 97.33, "elapsed_time": "1 day, 9:26:07", "remaining_time": "0:55:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10564, "total_steps": 10853, "loss": 0.1171, "learning_rate": 9.68740451328859e-09, "epoch": 0.9733265766803335, "percentage": 97.34, "elapsed_time": "1 day, 9:26:18", "remaining_time": "0:54:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10565, "total_steps": 10853, "loss": 0.1243, "learning_rate": 9.62052259592644e-09, "epoch": 0.9734187128576035, "percentage": 97.35, "elapsed_time": "1 day, 9:26:27", "remaining_time": "0:54:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10566, "total_steps": 10853, "loss": 0.1239, "learning_rate": 9.553871910566448e-09, "epoch": 0.9735108490348735, "percentage": 97.36, "elapsed_time": "1 day, 9:26:40", "remaining_time": "0:54:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10567, "total_steps": 10853, "loss": 0.1033, "learning_rate": 9.487452463397828e-09, "epoch": 0.9736029852121435, "percentage": 97.36, "elapsed_time": "1 day, 9:26:50", "remaining_time": "0:54:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10568, "total_steps": 10853, "loss": 0.1191, "learning_rate": 9.421264260587038e-09, "epoch": 0.9736951213894135, "percentage": 97.37, "elapsed_time": "1 day, 9:27:01", "remaining_time": "0:54:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10569, "total_steps": 10853, "loss": 0.1246, "learning_rate": 9.355307308279992e-09, "epoch": 0.9737872575666836, "percentage": 97.38, "elapsed_time": "1 day, 9:27:11", "remaining_time": "0:53:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10570, "total_steps": 10853, "loss": 0.1194, "learning_rate": 9.289581612600684e-09, "epoch": 0.9738793937439536, "percentage": 97.39, "elapsed_time": "1 day, 9:27:22", "remaining_time": "0:53:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10571, "total_steps": 10853, "loss": 0.1099, "learning_rate": 9.224087179651731e-09, "epoch": 0.9739715299212236, "percentage": 97.4, "elapsed_time": "1 day, 9:27:32", "remaining_time": "0:53:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10572, "total_steps": 10853, "loss": 0.1174, "learning_rate": 9.158824015514378e-09, "epoch": 0.9740636660984936, "percentage": 97.41, "elapsed_time": "1 day, 9:27:44", "remaining_time": "0:53:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10573, "total_steps": 10853, "loss": 0.1177, "learning_rate": 9.093792126248224e-09, "epoch": 0.9741558022757636, "percentage": 97.42, "elapsed_time": "1 day, 9:27:55", "remaining_time": "0:53:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10574, "total_steps": 10853, "loss": 0.119, "learning_rate": 9.028991517891495e-09, "epoch": 0.9742479384530336, "percentage": 97.43, "elapsed_time": "1 day, 9:28:06", "remaining_time": "0:52:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10575, "total_steps": 10853, "loss": 0.1296, "learning_rate": 8.964422196461042e-09, "epoch": 0.9743400746303036, "percentage": 97.44, "elapsed_time": "1 day, 9:28:17", "remaining_time": "0:52:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10576, "total_steps": 10853, "loss": 0.1066, "learning_rate": 8.900084167952072e-09, "epoch": 0.9744322108075736, "percentage": 97.45, "elapsed_time": "1 day, 9:28:29", "remaining_time": "0:52:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10577, "total_steps": 10853, "loss": 0.114, "learning_rate": 8.835977438338417e-09, "epoch": 0.9745243469848436, "percentage": 97.46, "elapsed_time": "1 day, 9:28:40", "remaining_time": "0:52:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10578, "total_steps": 10853, "loss": 0.1093, "learning_rate": 8.772102013572537e-09, "epoch": 0.9746164831621136, "percentage": 97.47, "elapsed_time": "1 day, 9:28:51", "remaining_time": "0:52:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10579, "total_steps": 10853, "loss": 0.1128, "learning_rate": 8.708457899584965e-09, "epoch": 0.9747086193393836, "percentage": 97.48, "elapsed_time": "1 day, 9:29:02", "remaining_time": "0:52:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10580, "total_steps": 10853, "loss": 0.1171, "learning_rate": 8.645045102285143e-09, "epoch": 0.9748007555166536, "percentage": 97.48, "elapsed_time": "1 day, 9:29:13", "remaining_time": "0:51:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10581, "total_steps": 10853, "loss": 0.1186, "learning_rate": 8.58186362756086e-09, "epoch": 0.9748928916939236, "percentage": 97.49, "elapsed_time": "1 day, 9:29:24", "remaining_time": "0:51:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10582, "total_steps": 10853, "loss": 0.1214, "learning_rate": 8.518913481278812e-09, "epoch": 0.9749850278711937, "percentage": 97.5, "elapsed_time": "1 day, 9:29:35", "remaining_time": "0:51:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10583, "total_steps": 10853, "loss": 0.1277, "learning_rate": 8.456194669284046e-09, "epoch": 0.9750771640484637, "percentage": 97.51, "elapsed_time": "1 day, 9:29:45", "remaining_time": "0:51:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10584, "total_steps": 10853, "loss": 0.1194, "learning_rate": 8.393707197399404e-09, "epoch": 0.9751693002257337, "percentage": 97.52, "elapsed_time": "1 day, 9:29:56", "remaining_time": "0:51:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10585, "total_steps": 10853, "loss": 0.1154, "learning_rate": 8.331451071427188e-09, "epoch": 0.9752614364030037, "percentage": 97.53, "elapsed_time": "1 day, 9:30:07", "remaining_time": "0:50:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10586, "total_steps": 10853, "loss": 0.1093, "learning_rate": 8.269426297148053e-09, "epoch": 0.9753535725802737, "percentage": 97.54, "elapsed_time": "1 day, 9:30:18", "remaining_time": "0:50:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10587, "total_steps": 10853, "loss": 0.1089, "learning_rate": 8.207632880320727e-09, "epoch": 0.9754457087575437, "percentage": 97.55, "elapsed_time": "1 day, 9:30:29", "remaining_time": "0:50:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10588, "total_steps": 10853, "loss": 0.1195, "learning_rate": 8.146070826683116e-09, "epoch": 0.9755378449348137, "percentage": 97.56, "elapsed_time": "1 day, 9:30:39", "remaining_time": "0:50:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10589, "total_steps": 10853, "loss": 0.1236, "learning_rate": 8.084740141950653e-09, "epoch": 0.9756299811120837, "percentage": 97.57, "elapsed_time": "1 day, 9:30:49", "remaining_time": "0:50:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10590, "total_steps": 10853, "loss": 0.1095, "learning_rate": 8.023640831818502e-09, "epoch": 0.9757221172893537, "percentage": 97.58, "elapsed_time": "1 day, 9:31:00", "remaining_time": "0:49:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10591, "total_steps": 10853, "loss": 0.112, "learning_rate": 7.962772901959348e-09, "epoch": 0.9758142534666236, "percentage": 97.59, "elapsed_time": "1 day, 9:31:11", "remaining_time": "0:49:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10592, "total_steps": 10853, "loss": 0.1138, "learning_rate": 7.902136358025058e-09, "epoch": 0.9759063896438936, "percentage": 97.6, "elapsed_time": "1 day, 9:31:23", "remaining_time": "0:49:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10593, "total_steps": 10853, "loss": 0.124, "learning_rate": 7.841731205645576e-09, "epoch": 0.9759985258211636, "percentage": 97.6, "elapsed_time": "1 day, 9:31:33", "remaining_time": "0:49:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10594, "total_steps": 10853, "loss": 0.1009, "learning_rate": 7.781557450429467e-09, "epoch": 0.9760906619984336, "percentage": 97.61, "elapsed_time": "1 day, 9:31:44", "remaining_time": "0:49:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10595, "total_steps": 10853, "loss": 0.1119, "learning_rate": 7.72161509796393e-09, "epoch": 0.9761827981757036, "percentage": 97.62, "elapsed_time": "1 day, 9:31:54", "remaining_time": "0:48:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10596, "total_steps": 10853, "loss": 0.1133, "learning_rate": 7.661904153814793e-09, "epoch": 0.9762749343529737, "percentage": 97.63, "elapsed_time": "1 day, 9:32:05", "remaining_time": "0:48:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10597, "total_steps": 10853, "loss": 0.1228, "learning_rate": 7.60242462352595e-09, "epoch": 0.9763670705302437, "percentage": 97.64, "elapsed_time": "1 day, 9:32:17", "remaining_time": "0:48:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10598, "total_steps": 10853, "loss": 0.1168, "learning_rate": 7.543176512620487e-09, "epoch": 0.9764592067075137, "percentage": 97.65, "elapsed_time": "1 day, 9:32:29", "remaining_time": "0:48:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10599, "total_steps": 10853, "loss": 0.1176, "learning_rate": 7.484159826599002e-09, "epoch": 0.9765513428847837, "percentage": 97.66, "elapsed_time": "1 day, 9:32:39", "remaining_time": "0:48:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10600, "total_steps": 10853, "loss": 0.1141, "learning_rate": 7.425374570941557e-09, "epoch": 0.9766434790620537, "percentage": 97.67, "elapsed_time": "1 day, 9:32:50", "remaining_time": "0:48:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10601, "total_steps": 10853, "loss": 0.1142, "learning_rate": 7.366820751106562e-09, "epoch": 0.9767356152393237, "percentage": 97.68, "elapsed_time": "1 day, 9:33:02", "remaining_time": "0:47:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10602, "total_steps": 10853, "loss": 0.1259, "learning_rate": 7.308498372530226e-09, "epoch": 0.9768277514165937, "percentage": 97.69, "elapsed_time": "1 day, 9:33:13", "remaining_time": "0:47:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10603, "total_steps": 10853, "loss": 0.1234, "learning_rate": 7.250407440628493e-09, "epoch": 0.9769198875938637, "percentage": 97.7, "elapsed_time": "1 day, 9:33:22", "remaining_time": "0:47:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10604, "total_steps": 10853, "loss": 0.1217, "learning_rate": 7.192547960794549e-09, "epoch": 0.9770120237711337, "percentage": 97.71, "elapsed_time": "1 day, 9:33:33", "remaining_time": "0:47:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10605, "total_steps": 10853, "loss": 0.1178, "learning_rate": 7.134919938400486e-09, "epoch": 0.9771041599484037, "percentage": 97.71, "elapsed_time": "1 day, 9:33:43", "remaining_time": "0:47:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10606, "total_steps": 10853, "loss": 0.1136, "learning_rate": 7.077523378797579e-09, "epoch": 0.9771962961256737, "percentage": 97.72, "elapsed_time": "1 day, 9:33:53", "remaining_time": "0:46:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10607, "total_steps": 10853, "loss": 0.106, "learning_rate": 7.0203582873151764e-09, "epoch": 0.9772884323029437, "percentage": 97.73, "elapsed_time": "1 day, 9:34:05", "remaining_time": "0:46:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10608, "total_steps": 10853, "loss": 0.1176, "learning_rate": 6.963424669260421e-09, "epoch": 0.9773805684802137, "percentage": 97.74, "elapsed_time": "1 day, 9:34:15", "remaining_time": "0:46:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10609, "total_steps": 10853, "loss": 0.1233, "learning_rate": 6.906722529920196e-09, "epoch": 0.9774727046574838, "percentage": 97.75, "elapsed_time": "1 day, 9:34:26", "remaining_time": "0:46:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10610, "total_steps": 10853, "loss": 0.1128, "learning_rate": 6.850251874559177e-09, "epoch": 0.9775648408347538, "percentage": 97.76, "elapsed_time": "1 day, 9:34:36", "remaining_time": "0:46:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10611, "total_steps": 10853, "loss": 0.1125, "learning_rate": 6.7940127084203945e-09, "epoch": 0.9776569770120238, "percentage": 97.77, "elapsed_time": "1 day, 9:34:48", "remaining_time": "0:45:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10612, "total_steps": 10853, "loss": 0.1082, "learning_rate": 6.738005036726059e-09, "epoch": 0.9777491131892938, "percentage": 97.78, "elapsed_time": "1 day, 9:34:59", "remaining_time": "0:45:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10613, "total_steps": 10853, "loss": 0.117, "learning_rate": 6.682228864675899e-09, "epoch": 0.9778412493665638, "percentage": 97.79, "elapsed_time": "1 day, 9:35:09", "remaining_time": "0:45:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10614, "total_steps": 10853, "loss": 0.1073, "learning_rate": 6.626684197449384e-09, "epoch": 0.9779333855438338, "percentage": 97.8, "elapsed_time": "1 day, 9:35:20", "remaining_time": "0:45:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10615, "total_steps": 10853, "loss": 0.111, "learning_rate": 6.5713710402037775e-09, "epoch": 0.9780255217211038, "percentage": 97.81, "elapsed_time": "1 day, 9:35:32", "remaining_time": "0:45:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10616, "total_steps": 10853, "loss": 0.1272, "learning_rate": 6.516289398074416e-09, "epoch": 0.9781176578983738, "percentage": 97.82, "elapsed_time": "1 day, 9:35:43", "remaining_time": "0:45:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10617, "total_steps": 10853, "loss": 0.1156, "learning_rate": 6.461439276176096e-09, "epoch": 0.9782097940756438, "percentage": 97.83, "elapsed_time": "1 day, 9:35:54", "remaining_time": "0:44:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10618, "total_steps": 10853, "loss": 0.1257, "learning_rate": 6.406820679601411e-09, "epoch": 0.9783019302529138, "percentage": 97.83, "elapsed_time": "1 day, 9:36:05", "remaining_time": "0:44:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10619, "total_steps": 10853, "loss": 0.1294, "learning_rate": 6.35243361342186e-09, "epoch": 0.9783940664301838, "percentage": 97.84, "elapsed_time": "1 day, 9:36:16", "remaining_time": "0:44:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10620, "total_steps": 10853, "loss": 0.1229, "learning_rate": 6.298278082687015e-09, "epoch": 0.9784862026074538, "percentage": 97.85, "elapsed_time": "1 day, 9:36:27", "remaining_time": "0:44:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10621, "total_steps": 10853, "loss": 0.1092, "learning_rate": 6.244354092425631e-09, "epoch": 0.9785783387847238, "percentage": 97.86, "elapsed_time": "1 day, 9:36:39", "remaining_time": "0:44:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10622, "total_steps": 10853, "loss": 0.0974, "learning_rate": 6.190661647644259e-09, "epoch": 0.9786704749619938, "percentage": 97.87, "elapsed_time": "1 day, 9:36:48", "remaining_time": "0:43:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10623, "total_steps": 10853, "loss": 0.1078, "learning_rate": 6.137200753328354e-09, "epoch": 0.9787626111392639, "percentage": 97.88, "elapsed_time": "1 day, 9:36:59", "remaining_time": "0:43:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10624, "total_steps": 10853, "loss": 0.1059, "learning_rate": 6.083971414442003e-09, "epoch": 0.9788547473165339, "percentage": 97.89, "elapsed_time": "1 day, 9:37:09", "remaining_time": "0:43:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10625, "total_steps": 10853, "loss": 0.1196, "learning_rate": 6.030973635926807e-09, "epoch": 0.9789468834938039, "percentage": 97.9, "elapsed_time": "1 day, 9:37:20", "remaining_time": "0:43:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10626, "total_steps": 10853, "loss": 0.1106, "learning_rate": 5.9782074227046625e-09, "epoch": 0.9790390196710739, "percentage": 97.91, "elapsed_time": "1 day, 9:37:31", "remaining_time": "0:43:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10627, "total_steps": 10853, "loss": 0.13, "learning_rate": 5.925672779673875e-09, "epoch": 0.9791311558483439, "percentage": 97.92, "elapsed_time": "1 day, 9:37:42", "remaining_time": "0:42:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10628, "total_steps": 10853, "loss": 0.1117, "learning_rate": 5.87336971171304e-09, "epoch": 0.9792232920256139, "percentage": 97.93, "elapsed_time": "1 day, 9:37:52", "remaining_time": "0:42:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10629, "total_steps": 10853, "loss": 0.1152, "learning_rate": 5.821298223678274e-09, "epoch": 0.9793154282028839, "percentage": 97.94, "elapsed_time": "1 day, 9:38:04", "remaining_time": "0:42:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10630, "total_steps": 10853, "loss": 0.1227, "learning_rate": 5.76945832040432e-09, "epoch": 0.9794075643801539, "percentage": 97.95, "elapsed_time": "1 day, 9:38:14", "remaining_time": "0:42:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10631, "total_steps": 10853, "loss": 0.1071, "learning_rate": 5.717850006704551e-09, "epoch": 0.9794997005574239, "percentage": 97.95, "elapsed_time": "1 day, 9:38:22", "remaining_time": "0:42:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10632, "total_steps": 10853, "loss": 0.1245, "learning_rate": 5.666473287370966e-09, "epoch": 0.9795918367346939, "percentage": 97.96, "elapsed_time": "1 day, 9:38:34", "remaining_time": "0:41:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10633, "total_steps": 10853, "loss": 0.1178, "learning_rate": 5.615328167173639e-09, "epoch": 0.9796839729119639, "percentage": 97.97, "elapsed_time": "1 day, 9:38:44", "remaining_time": "0:41:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10634, "total_steps": 10853, "loss": 0.1154, "learning_rate": 5.564414650861549e-09, "epoch": 0.9797761090892338, "percentage": 97.98, "elapsed_time": "1 day, 9:38:55", "remaining_time": "0:41:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10635, "total_steps": 10853, "loss": 0.1063, "learning_rate": 5.513732743162303e-09, "epoch": 0.9798682452665038, "percentage": 97.99, "elapsed_time": "1 day, 9:39:06", "remaining_time": "0:41:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10636, "total_steps": 10853, "loss": 0.1048, "learning_rate": 5.463282448781027e-09, "epoch": 0.9799603814437738, "percentage": 98.0, "elapsed_time": "1 day, 9:39:18", "remaining_time": "0:41:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10637, "total_steps": 10853, "loss": 0.1111, "learning_rate": 5.41306377240286e-09, "epoch": 0.980052517621044, "percentage": 98.01, "elapsed_time": "1 day, 9:39:27", "remaining_time": "0:41:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10638, "total_steps": 10853, "loss": 0.1257, "learning_rate": 5.363076718689908e-09, "epoch": 0.980144653798314, "percentage": 98.02, "elapsed_time": "1 day, 9:39:37", "remaining_time": "0:40:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10639, "total_steps": 10853, "loss": 0.1118, "learning_rate": 5.313321292283735e-09, "epoch": 0.9802367899755839, "percentage": 98.03, "elapsed_time": "1 day, 9:39:49", "remaining_time": "0:40:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10640, "total_steps": 10853, "loss": 0.1202, "learning_rate": 5.263797497804257e-09, "epoch": 0.9803289261528539, "percentage": 98.04, "elapsed_time": "1 day, 9:40:00", "remaining_time": "0:40:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10641, "total_steps": 10853, "loss": 0.113, "learning_rate": 5.2145053398494626e-09, "epoch": 0.9804210623301239, "percentage": 98.05, "elapsed_time": "1 day, 9:40:10", "remaining_time": "0:40:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10642, "total_steps": 10853, "loss": 0.1096, "learning_rate": 5.165444822996801e-09, "epoch": 0.9805131985073939, "percentage": 98.06, "elapsed_time": "1 day, 9:40:20", "remaining_time": "0:40:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10643, "total_steps": 10853, "loss": 0.1138, "learning_rate": 5.116615951800685e-09, "epoch": 0.9806053346846639, "percentage": 98.07, "elapsed_time": "1 day, 9:40:32", "remaining_time": "0:39:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10644, "total_steps": 10853, "loss": 0.1278, "learning_rate": 5.068018730795543e-09, "epoch": 0.9806974708619339, "percentage": 98.07, "elapsed_time": "1 day, 9:40:42", "remaining_time": "0:39:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10645, "total_steps": 10853, "loss": 0.1126, "learning_rate": 5.019653164493044e-09, "epoch": 0.9807896070392039, "percentage": 98.08, "elapsed_time": "1 day, 9:40:54", "remaining_time": "0:39:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10646, "total_steps": 10853, "loss": 0.1164, "learning_rate": 4.971519257384316e-09, "epoch": 0.9808817432164739, "percentage": 98.09, "elapsed_time": "1 day, 9:41:04", "remaining_time": "0:39:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10647, "total_steps": 10853, "loss": 0.1181, "learning_rate": 4.9236170139388415e-09, "epoch": 0.9809738793937439, "percentage": 98.1, "elapsed_time": "1 day, 9:41:15", "remaining_time": "0:39:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10648, "total_steps": 10853, "loss": 0.1192, "learning_rate": 4.875946438603896e-09, "epoch": 0.9810660155710139, "percentage": 98.11, "elapsed_time": "1 day, 9:41:26", "remaining_time": "0:38:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10649, "total_steps": 10853, "loss": 0.1155, "learning_rate": 4.828507535805937e-09, "epoch": 0.9811581517482839, "percentage": 98.12, "elapsed_time": "1 day, 9:41:36", "remaining_time": "0:38:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10650, "total_steps": 10853, "loss": 0.122, "learning_rate": 4.781300309949221e-09, "epoch": 0.981250287925554, "percentage": 98.13, "elapsed_time": "1 day, 9:41:46", "remaining_time": "0:38:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10651, "total_steps": 10853, "loss": 0.1081, "learning_rate": 4.734324765417741e-09, "epoch": 0.981342424102824, "percentage": 98.14, "elapsed_time": "1 day, 9:41:56", "remaining_time": "0:38:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10652, "total_steps": 10853, "loss": 0.1197, "learning_rate": 4.687580906572453e-09, "epoch": 0.981434560280094, "percentage": 98.15, "elapsed_time": "1 day, 9:42:08", "remaining_time": "0:38:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10653, "total_steps": 10853, "loss": 0.1154, "learning_rate": 4.6410687377540505e-09, "epoch": 0.981526696457364, "percentage": 98.16, "elapsed_time": "1 day, 9:42:17", "remaining_time": "0:37:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10654, "total_steps": 10853, "loss": 0.1083, "learning_rate": 4.5947882632810244e-09, "epoch": 0.981618832634634, "percentage": 98.17, "elapsed_time": "1 day, 9:42:28", "remaining_time": "0:37:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10655, "total_steps": 10853, "loss": 0.105, "learning_rate": 4.5487394874502155e-09, "epoch": 0.981710968811904, "percentage": 98.18, "elapsed_time": "1 day, 9:42:38", "remaining_time": "0:37:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10656, "total_steps": 10853, "loss": 0.1162, "learning_rate": 4.502922414537647e-09, "epoch": 0.981803104989174, "percentage": 98.18, "elapsed_time": "1 day, 9:42:49", "remaining_time": "0:37:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10657, "total_steps": 10853, "loss": 0.112, "learning_rate": 4.457337048797139e-09, "epoch": 0.981895241166444, "percentage": 98.19, "elapsed_time": "1 day, 9:43:01", "remaining_time": "0:37:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10658, "total_steps": 10853, "loss": 0.1213, "learning_rate": 4.411983394461694e-09, "epoch": 0.981987377343714, "percentage": 98.2, "elapsed_time": "1 day, 9:43:12", "remaining_time": "0:37:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10659, "total_steps": 10853, "loss": 0.1136, "learning_rate": 4.366861455742111e-09, "epoch": 0.982079513520984, "percentage": 98.21, "elapsed_time": "1 day, 9:43:23", "remaining_time": "0:36:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10660, "total_steps": 10853, "loss": 0.1124, "learning_rate": 4.321971236827815e-09, "epoch": 0.982171649698254, "percentage": 98.22, "elapsed_time": "1 day, 9:43:34", "remaining_time": "0:36:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10661, "total_steps": 10853, "loss": 0.1162, "learning_rate": 4.277312741887418e-09, "epoch": 0.982263785875524, "percentage": 98.23, "elapsed_time": "1 day, 9:43:45", "remaining_time": "0:36:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10662, "total_steps": 10853, "loss": 0.1073, "learning_rate": 4.232885975066769e-09, "epoch": 0.982355922052794, "percentage": 98.24, "elapsed_time": "1 day, 9:43:56", "remaining_time": "0:36:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10663, "total_steps": 10853, "loss": 0.1221, "learning_rate": 4.188690940491457e-09, "epoch": 0.982448058230064, "percentage": 98.25, "elapsed_time": "1 day, 9:44:06", "remaining_time": "0:36:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10664, "total_steps": 10853, "loss": 0.1033, "learning_rate": 4.144727642264867e-09, "epoch": 0.9825401944073341, "percentage": 98.26, "elapsed_time": "1 day, 9:44:18", "remaining_time": "0:35:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10665, "total_steps": 10853, "loss": 0.1169, "learning_rate": 4.100996084468734e-09, "epoch": 0.9826323305846041, "percentage": 98.27, "elapsed_time": "1 day, 9:44:29", "remaining_time": "0:35:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10666, "total_steps": 10853, "loss": 0.1186, "learning_rate": 4.057496271163974e-09, "epoch": 0.9827244667618741, "percentage": 98.28, "elapsed_time": "1 day, 9:44:40", "remaining_time": "0:35:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10667, "total_steps": 10853, "loss": 0.1189, "learning_rate": 4.014228206389026e-09, "epoch": 0.9828166029391441, "percentage": 98.29, "elapsed_time": "1 day, 9:44:53", "remaining_time": "0:35:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10668, "total_steps": 10853, "loss": 0.1147, "learning_rate": 3.971191894161785e-09, "epoch": 0.9829087391164141, "percentage": 98.3, "elapsed_time": "1 day, 9:45:05", "remaining_time": "0:35:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10669, "total_steps": 10853, "loss": 0.1111, "learning_rate": 3.9283873384779455e-09, "epoch": 0.9830008752936841, "percentage": 98.3, "elapsed_time": "1 day, 9:45:16", "remaining_time": "0:34:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10670, "total_steps": 10853, "loss": 0.1149, "learning_rate": 3.8858145433118275e-09, "epoch": 0.9830930114709541, "percentage": 98.31, "elapsed_time": "1 day, 9:45:26", "remaining_time": "0:34:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10671, "total_steps": 10853, "loss": 0.1233, "learning_rate": 3.843473512616658e-09, "epoch": 0.9831851476482241, "percentage": 98.32, "elapsed_time": "1 day, 9:45:35", "remaining_time": "0:34:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10672, "total_steps": 10853, "loss": 0.1204, "learning_rate": 3.801364250323458e-09, "epoch": 0.9832772838254941, "percentage": 98.33, "elapsed_time": "1 day, 9:45:46", "remaining_time": "0:34:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10673, "total_steps": 10853, "loss": 0.1131, "learning_rate": 3.759486760342435e-09, "epoch": 0.9833694200027641, "percentage": 98.34, "elapsed_time": "1 day, 9:45:56", "remaining_time": "0:34:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10674, "total_steps": 10853, "loss": 0.1074, "learning_rate": 3.7178410465615876e-09, "epoch": 0.9834615561800341, "percentage": 98.35, "elapsed_time": "1 day, 9:46:06", "remaining_time": "0:33:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10675, "total_steps": 10853, "loss": 0.108, "learning_rate": 3.676427112848102e-09, "epoch": 0.983553692357304, "percentage": 98.36, "elapsed_time": "1 day, 9:46:18", "remaining_time": "0:33:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10676, "total_steps": 10853, "loss": 0.1303, "learning_rate": 3.63524496304668e-09, "epoch": 0.983645828534574, "percentage": 98.37, "elapsed_time": "1 day, 9:46:30", "remaining_time": "0:33:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10677, "total_steps": 10853, "loss": 0.1222, "learning_rate": 3.5942946009814848e-09, "epoch": 0.9837379647118442, "percentage": 98.38, "elapsed_time": "1 day, 9:46:43", "remaining_time": "0:33:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10678, "total_steps": 10853, "loss": 0.1105, "learning_rate": 3.553576030454753e-09, "epoch": 0.9838301008891142, "percentage": 98.39, "elapsed_time": "1 day, 9:46:53", "remaining_time": "0:33:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10679, "total_steps": 10853, "loss": 0.122, "learning_rate": 3.5130892552473485e-09, "epoch": 0.9839222370663842, "percentage": 98.4, "elapsed_time": "1 day, 9:47:03", "remaining_time": "0:33:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10680, "total_steps": 10853, "loss": 0.1105, "learning_rate": 3.4728342791179313e-09, "epoch": 0.9840143732436542, "percentage": 98.41, "elapsed_time": "1 day, 9:47:14", "remaining_time": "0:32:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10681, "total_steps": 10853, "loss": 0.118, "learning_rate": 3.432811105804623e-09, "epoch": 0.9841065094209241, "percentage": 98.42, "elapsed_time": "1 day, 9:47:22", "remaining_time": "0:32:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10682, "total_steps": 10853, "loss": 0.114, "learning_rate": 3.3930197390236175e-09, "epoch": 0.9841986455981941, "percentage": 98.42, "elapsed_time": "1 day, 9:47:32", "remaining_time": "0:32:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10683, "total_steps": 10853, "loss": 0.1243, "learning_rate": 3.353460182469459e-09, "epoch": 0.9842907817754641, "percentage": 98.43, "elapsed_time": "1 day, 9:47:45", "remaining_time": "0:32:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10684, "total_steps": 10853, "loss": 0.1231, "learning_rate": 3.3141324398150434e-09, "epoch": 0.9843829179527341, "percentage": 98.44, "elapsed_time": "1 day, 9:47:57", "remaining_time": "0:32:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10685, "total_steps": 10853, "loss": 0.1181, "learning_rate": 3.275036514712171e-09, "epoch": 0.9844750541300041, "percentage": 98.45, "elapsed_time": "1 day, 9:48:08", "remaining_time": "0:31:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10686, "total_steps": 10853, "loss": 0.1243, "learning_rate": 3.236172410790994e-09, "epoch": 0.9845671903072741, "percentage": 98.46, "elapsed_time": "1 day, 9:48:20", "remaining_time": "0:31:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10687, "total_steps": 10853, "loss": 0.1114, "learning_rate": 3.1975401316597376e-09, "epoch": 0.9846593264845441, "percentage": 98.47, "elapsed_time": "1 day, 9:48:29", "remaining_time": "0:31:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10688, "total_steps": 10853, "loss": 0.1126, "learning_rate": 3.1591396809055317e-09, "epoch": 0.9847514626618141, "percentage": 98.48, "elapsed_time": "1 day, 9:48:41", "remaining_time": "0:31:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10689, "total_steps": 10853, "loss": 0.1243, "learning_rate": 3.120971062094136e-09, "epoch": 0.9848435988390841, "percentage": 98.49, "elapsed_time": "1 day, 9:48:52", "remaining_time": "0:31:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10690, "total_steps": 10853, "loss": 0.116, "learning_rate": 3.0830342787693814e-09, "epoch": 0.9849357350163541, "percentage": 98.5, "elapsed_time": "1 day, 9:49:04", "remaining_time": "0:30:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10691, "total_steps": 10853, "loss": 0.1134, "learning_rate": 3.0453293344534507e-09, "epoch": 0.9850278711936242, "percentage": 98.51, "elapsed_time": "1 day, 9:49:15", "remaining_time": "0:30:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10692, "total_steps": 10853, "loss": 0.1128, "learning_rate": 3.007856232647155e-09, "epoch": 0.9851200073708942, "percentage": 98.52, "elapsed_time": "1 day, 9:49:26", "remaining_time": "0:30:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10693, "total_steps": 10853, "loss": 0.1182, "learning_rate": 2.970614976830488e-09, "epoch": 0.9852121435481642, "percentage": 98.53, "elapsed_time": "1 day, 9:49:36", "remaining_time": "0:30:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10694, "total_steps": 10853, "loss": 0.1059, "learning_rate": 2.933605570460962e-09, "epoch": 0.9853042797254342, "percentage": 98.53, "elapsed_time": "1 day, 9:49:47", "remaining_time": "0:30:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10695, "total_steps": 10853, "loss": 0.1197, "learning_rate": 2.8968280169747177e-09, "epoch": 0.9853964159027042, "percentage": 98.54, "elapsed_time": "1 day, 9:49:58", "remaining_time": "0:29:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10696, "total_steps": 10853, "loss": 0.1093, "learning_rate": 2.8602823197868e-09, "epoch": 0.9854885520799742, "percentage": 98.55, "elapsed_time": "1 day, 9:50:08", "remaining_time": "0:29:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10697, "total_steps": 10853, "loss": 0.1253, "learning_rate": 2.823968482290329e-09, "epoch": 0.9855806882572442, "percentage": 98.56, "elapsed_time": "1 day, 9:50:20", "remaining_time": "0:29:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10698, "total_steps": 10853, "loss": 0.1129, "learning_rate": 2.787886507857329e-09, "epoch": 0.9856728244345142, "percentage": 98.57, "elapsed_time": "1 day, 9:50:31", "remaining_time": "0:29:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10699, "total_steps": 10853, "loss": 0.1153, "learning_rate": 2.7520363998376208e-09, "epoch": 0.9857649606117842, "percentage": 98.58, "elapsed_time": "1 day, 9:50:40", "remaining_time": "0:29:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10700, "total_steps": 10853, "loss": 0.1153, "learning_rate": 2.716418161560208e-09, "epoch": 0.9858570967890542, "percentage": 98.59, "elapsed_time": "1 day, 9:50:51", "remaining_time": "0:29:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10701, "total_steps": 10853, "loss": 0.116, "learning_rate": 2.6810317963321674e-09, "epoch": 0.9859492329663242, "percentage": 98.6, "elapsed_time": "1 day, 9:51:01", "remaining_time": "0:28:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10702, "total_steps": 10853, "loss": 0.1128, "learning_rate": 2.6458773074389266e-09, "epoch": 0.9860413691435942, "percentage": 98.61, "elapsed_time": "1 day, 9:51:13", "remaining_time": "0:28:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10703, "total_steps": 10853, "loss": 0.1231, "learning_rate": 2.610954698145096e-09, "epoch": 0.9861335053208642, "percentage": 98.62, "elapsed_time": "1 day, 9:51:23", "remaining_time": "0:28:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10704, "total_steps": 10853, "loss": 0.1164, "learning_rate": 2.5762639716925274e-09, "epoch": 0.9862256414981343, "percentage": 98.63, "elapsed_time": "1 day, 9:51:34", "remaining_time": "0:28:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10705, "total_steps": 10853, "loss": 0.116, "learning_rate": 2.5418051313028102e-09, "epoch": 0.9863177776754043, "percentage": 98.64, "elapsed_time": "1 day, 9:51:44", "remaining_time": "0:28:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10706, "total_steps": 10853, "loss": 0.1059, "learning_rate": 2.507578180175052e-09, "epoch": 0.9864099138526743, "percentage": 98.65, "elapsed_time": "1 day, 9:51:55", "remaining_time": "0:27:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10707, "total_steps": 10853, "loss": 0.1191, "learning_rate": 2.473583121487544e-09, "epoch": 0.9865020500299443, "percentage": 98.65, "elapsed_time": "1 day, 9:52:05", "remaining_time": "0:27:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10708, "total_steps": 10853, "loss": 0.1145, "learning_rate": 2.43981995839665e-09, "epoch": 0.9865941862072143, "percentage": 98.66, "elapsed_time": "1 day, 9:52:18", "remaining_time": "0:27:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10709, "total_steps": 10853, "loss": 0.1206, "learning_rate": 2.406288694037362e-09, "epoch": 0.9866863223844843, "percentage": 98.67, "elapsed_time": "1 day, 9:52:28", "remaining_time": "0:27:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10710, "total_steps": 10853, "loss": 0.1151, "learning_rate": 2.3729893315230234e-09, "epoch": 0.9867784585617543, "percentage": 98.68, "elapsed_time": "1 day, 9:52:40", "remaining_time": "0:27:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10711, "total_steps": 10853, "loss": 0.1192, "learning_rate": 2.339921873945328e-09, "epoch": 0.9868705947390243, "percentage": 98.69, "elapsed_time": "1 day, 9:52:51", "remaining_time": "0:26:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10712, "total_steps": 10853, "loss": 0.1197, "learning_rate": 2.3070863243745967e-09, "epoch": 0.9869627309162943, "percentage": 98.7, "elapsed_time": "1 day, 9:53:02", "remaining_time": "0:26:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10713, "total_steps": 10853, "loss": 0.1159, "learning_rate": 2.2744826858597803e-09, "epoch": 0.9870548670935643, "percentage": 98.71, "elapsed_time": "1 day, 9:53:13", "remaining_time": "0:26:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10714, "total_steps": 10853, "loss": 0.1123, "learning_rate": 2.2421109614279015e-09, "epoch": 0.9871470032708343, "percentage": 98.72, "elapsed_time": "1 day, 9:53:24", "remaining_time": "0:26:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10715, "total_steps": 10853, "loss": 0.129, "learning_rate": 2.209971154084889e-09, "epoch": 0.9872391394481043, "percentage": 98.73, "elapsed_time": "1 day, 9:53:36", "remaining_time": "0:26:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10716, "total_steps": 10853, "loss": 0.1192, "learning_rate": 2.1780632668150226e-09, "epoch": 0.9873312756253743, "percentage": 98.74, "elapsed_time": "1 day, 9:53:46", "remaining_time": "0:26:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10717, "total_steps": 10853, "loss": 0.13, "learning_rate": 2.1463873025806547e-09, "epoch": 0.9874234118026443, "percentage": 98.75, "elapsed_time": "1 day, 9:53:57", "remaining_time": "0:25:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10718, "total_steps": 10853, "loss": 0.1015, "learning_rate": 2.1149432643233213e-09, "epoch": 0.9875155479799144, "percentage": 98.76, "elapsed_time": "1 day, 9:54:06", "remaining_time": "0:25:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10719, "total_steps": 10853, "loss": 0.1105, "learning_rate": 2.0837311549620763e-09, "epoch": 0.9876076841571844, "percentage": 98.77, "elapsed_time": "1 day, 9:54:17", "remaining_time": "0:25:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10720, "total_steps": 10853, "loss": 0.1109, "learning_rate": 2.052750977395157e-09, "epoch": 0.9876998203344544, "percentage": 98.77, "elapsed_time": "1 day, 9:54:28", "remaining_time": "0:25:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10721, "total_steps": 10853, "loss": 0.1063, "learning_rate": 2.0220027344994285e-09, "epoch": 0.9877919565117244, "percentage": 98.78, "elapsed_time": "1 day, 9:54:39", "remaining_time": "0:25:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10722, "total_steps": 10853, "loss": 0.1135, "learning_rate": 1.9914864291292747e-09, "epoch": 0.9878840926889944, "percentage": 98.79, "elapsed_time": "1 day, 9:54:49", "remaining_time": "0:24:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10723, "total_steps": 10853, "loss": 0.1222, "learning_rate": 1.961202064118539e-09, "epoch": 0.9879762288662643, "percentage": 98.8, "elapsed_time": "1 day, 9:55:00", "remaining_time": "0:24:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10724, "total_steps": 10853, "loss": 0.1183, "learning_rate": 1.9311496422791398e-09, "epoch": 0.9880683650435343, "percentage": 98.81, "elapsed_time": "1 day, 9:55:11", "remaining_time": "0:24:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10725, "total_steps": 10853, "loss": 0.1247, "learning_rate": 1.9013291664013445e-09, "epoch": 0.9881605012208043, "percentage": 98.82, "elapsed_time": "1 day, 9:55:22", "remaining_time": "0:24:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10726, "total_steps": 10853, "loss": 0.1032, "learning_rate": 1.8717406392537718e-09, "epoch": 0.9882526373980743, "percentage": 98.83, "elapsed_time": "1 day, 9:55:33", "remaining_time": "0:24:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10727, "total_steps": 10853, "loss": 0.1255, "learning_rate": 1.8423840635842237e-09, "epoch": 0.9883447735753443, "percentage": 98.84, "elapsed_time": "1 day, 9:55:45", "remaining_time": "0:23:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10728, "total_steps": 10853, "loss": 0.1166, "learning_rate": 1.8132594421180206e-09, "epoch": 0.9884369097526143, "percentage": 98.85, "elapsed_time": "1 day, 9:55:55", "remaining_time": "0:23:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10729, "total_steps": 10853, "loss": 0.111, "learning_rate": 1.7843667775593875e-09, "epoch": 0.9885290459298843, "percentage": 98.86, "elapsed_time": "1 day, 9:56:07", "remaining_time": "0:23:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10730, "total_steps": 10853, "loss": 0.0993, "learning_rate": 1.7557060725914566e-09, "epoch": 0.9886211821071543, "percentage": 98.87, "elapsed_time": "1 day, 9:56:18", "remaining_time": "0:23:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10731, "total_steps": 10853, "loss": 0.1258, "learning_rate": 1.7272773298748769e-09, "epoch": 0.9887133182844243, "percentage": 98.88, "elapsed_time": "1 day, 9:56:30", "remaining_time": "0:23:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10732, "total_steps": 10853, "loss": 0.1135, "learning_rate": 1.6990805520494813e-09, "epoch": 0.9888054544616944, "percentage": 98.89, "elapsed_time": "1 day, 9:56:41", "remaining_time": "0:22:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10733, "total_steps": 10853, "loss": 0.1169, "learning_rate": 1.6711157417334533e-09, "epoch": 0.9888975906389644, "percentage": 98.89, "elapsed_time": "1 day, 9:56:52", "remaining_time": "0:22:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10734, "total_steps": 10853, "loss": 0.1135, "learning_rate": 1.6433829015230497e-09, "epoch": 0.9889897268162344, "percentage": 98.9, "elapsed_time": "1 day, 9:57:02", "remaining_time": "0:22:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10735, "total_steps": 10853, "loss": 0.1076, "learning_rate": 1.6158820339937098e-09, "epoch": 0.9890818629935044, "percentage": 98.91, "elapsed_time": "1 day, 9:57:13", "remaining_time": "0:22:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10736, "total_steps": 10853, "loss": 0.1036, "learning_rate": 1.5886131416981144e-09, "epoch": 0.9891739991707744, "percentage": 98.92, "elapsed_time": "1 day, 9:57:24", "remaining_time": "0:22:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10737, "total_steps": 10853, "loss": 0.1257, "learning_rate": 1.5615762271689593e-09, "epoch": 0.9892661353480444, "percentage": 98.93, "elapsed_time": "1 day, 9:57:36", "remaining_time": "0:22:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10738, "total_steps": 10853, "loss": 0.1243, "learning_rate": 1.5347712929164594e-09, "epoch": 0.9893582715253144, "percentage": 98.94, "elapsed_time": "1 day, 9:57:46", "remaining_time": "0:21:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10739, "total_steps": 10853, "loss": 0.1245, "learning_rate": 1.508198341429179e-09, "epoch": 0.9894504077025844, "percentage": 98.95, "elapsed_time": "1 day, 9:57:57", "remaining_time": "0:21:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10740, "total_steps": 10853, "loss": 0.1245, "learning_rate": 1.481857375174589e-09, "epoch": 0.9895425438798544, "percentage": 98.96, "elapsed_time": "1 day, 9:58:08", "remaining_time": "0:21:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10741, "total_steps": 10853, "loss": 0.1217, "learning_rate": 1.4557483965985109e-09, "epoch": 0.9896346800571244, "percentage": 98.97, "elapsed_time": "1 day, 9:58:17", "remaining_time": "0:21:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10742, "total_steps": 10853, "loss": 0.1154, "learning_rate": 1.4298714081248389e-09, "epoch": 0.9897268162343944, "percentage": 98.98, "elapsed_time": "1 day, 9:58:28", "remaining_time": "0:21:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10743, "total_steps": 10853, "loss": 0.1159, "learning_rate": 1.4042264121566507e-09, "epoch": 0.9898189524116644, "percentage": 98.99, "elapsed_time": "1 day, 9:58:39", "remaining_time": "0:20:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10744, "total_steps": 10853, "loss": 0.1162, "learning_rate": 1.3788134110750972e-09, "epoch": 0.9899110885889344, "percentage": 99.0, "elapsed_time": "1 day, 9:58:51", "remaining_time": "0:20:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10745, "total_steps": 10853, "loss": 0.1217, "learning_rate": 1.3536324072394026e-09, "epoch": 0.9900032247662045, "percentage": 99.0, "elapsed_time": "1 day, 9:59:02", "remaining_time": "0:20:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10746, "total_steps": 10853, "loss": 0.1193, "learning_rate": 1.3286834029879735e-09, "epoch": 0.9900953609434745, "percentage": 99.01, "elapsed_time": "1 day, 9:59:12", "remaining_time": "0:20:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10747, "total_steps": 10853, "loss": 0.1153, "learning_rate": 1.303966400637291e-09, "epoch": 0.9901874971207445, "percentage": 99.02, "elapsed_time": "1 day, 9:59:23", "remaining_time": "0:20:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10748, "total_steps": 10853, "loss": 0.1095, "learning_rate": 1.279481402481908e-09, "epoch": 0.9902796332980145, "percentage": 99.03, "elapsed_time": "1 day, 9:59:34", "remaining_time": "0:19:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10749, "total_steps": 10853, "loss": 0.1132, "learning_rate": 1.255228410795839e-09, "epoch": 0.9903717694752845, "percentage": 99.04, "elapsed_time": "1 day, 9:59:45", "remaining_time": "0:19:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10750, "total_steps": 10853, "loss": 0.1053, "learning_rate": 1.2312074278308939e-09, "epoch": 0.9904639056525545, "percentage": 99.05, "elapsed_time": "1 day, 9:59:54", "remaining_time": "0:19:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10751, "total_steps": 10853, "loss": 0.1238, "learning_rate": 1.2074184558169554e-09, "epoch": 0.9905560418298245, "percentage": 99.06, "elapsed_time": "1 day, 10:00:05", "remaining_time": "0:19:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10752, "total_steps": 10853, "loss": 0.134, "learning_rate": 1.1838614969633678e-09, "epoch": 0.9906481780070945, "percentage": 99.07, "elapsed_time": "1 day, 10:00:15", "remaining_time": "0:19:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10753, "total_steps": 10853, "loss": 0.1165, "learning_rate": 1.1605365534569922e-09, "epoch": 0.9907403141843645, "percentage": 99.08, "elapsed_time": "1 day, 10:00:25", "remaining_time": "0:18:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10754, "total_steps": 10853, "loss": 0.1207, "learning_rate": 1.1374436274635968e-09, "epoch": 0.9908324503616345, "percentage": 99.09, "elapsed_time": "1 day, 10:00:37", "remaining_time": "0:18:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10755, "total_steps": 10853, "loss": 0.1191, "learning_rate": 1.1145827211278548e-09, "epoch": 0.9909245865389045, "percentage": 99.1, "elapsed_time": "1 day, 10:00:48", "remaining_time": "0:18:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10756, "total_steps": 10853, "loss": 0.1095, "learning_rate": 1.0919538365716797e-09, "epoch": 0.9910167227161745, "percentage": 99.11, "elapsed_time": "1 day, 10:00:59", "remaining_time": "0:18:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10757, "total_steps": 10853, "loss": 0.1164, "learning_rate": 1.069556975896724e-09, "epoch": 0.9911088588934445, "percentage": 99.12, "elapsed_time": "1 day, 10:01:10", "remaining_time": "0:18:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10758, "total_steps": 10853, "loss": 0.1157, "learning_rate": 1.047392141182435e-09, "epoch": 0.9912009950707145, "percentage": 99.12, "elapsed_time": "1 day, 10:01:21", "remaining_time": "0:18:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10759, "total_steps": 10853, "loss": 0.1156, "learning_rate": 1.0254593344866115e-09, "epoch": 0.9912931312479846, "percentage": 99.13, "elapsed_time": "1 day, 10:01:31", "remaining_time": "0:17:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10760, "total_steps": 10853, "loss": 0.1161, "learning_rate": 1.00375855784568e-09, "epoch": 0.9913852674252546, "percentage": 99.14, "elapsed_time": "1 day, 10:01:41", "remaining_time": "0:17:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10761, "total_steps": 10853, "loss": 0.1127, "learning_rate": 9.822898132749726e-10, "epoch": 0.9914774036025246, "percentage": 99.15, "elapsed_time": "1 day, 10:01:53", "remaining_time": "0:17:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10762, "total_steps": 10853, "loss": 0.1099, "learning_rate": 9.610531027673398e-10, "epoch": 0.9915695397797946, "percentage": 99.16, "elapsed_time": "1 day, 10:02:03", "remaining_time": "0:17:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10763, "total_steps": 10853, "loss": 0.1116, "learning_rate": 9.400484282950928e-10, "epoch": 0.9916616759570646, "percentage": 99.17, "elapsed_time": "1 day, 10:02:15", "remaining_time": "0:17:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10764, "total_steps": 10853, "loss": 0.1247, "learning_rate": 9.192757918083383e-10, "epoch": 0.9917538121343346, "percentage": 99.18, "elapsed_time": "1 day, 10:02:27", "remaining_time": "0:16:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10765, "total_steps": 10853, "loss": 0.1188, "learning_rate": 8.987351952355338e-10, "epoch": 0.9918459483116046, "percentage": 99.19, "elapsed_time": "1 day, 10:02:37", "remaining_time": "0:16:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10766, "total_steps": 10853, "loss": 0.1232, "learning_rate": 8.7842664048432e-10, "epoch": 0.9919380844888745, "percentage": 99.2, "elapsed_time": "1 day, 10:02:49", "remaining_time": "0:16:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10767, "total_steps": 10853, "loss": 0.123, "learning_rate": 8.58350129440133e-10, "epoch": 0.9920302206661445, "percentage": 99.21, "elapsed_time": "1 day, 10:02:59", "remaining_time": "0:16:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10768, "total_steps": 10853, "loss": 0.1104, "learning_rate": 8.385056639670375e-10, "epoch": 0.9921223568434145, "percentage": 99.22, "elapsed_time": "1 day, 10:03:11", "remaining_time": "0:16:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10769, "total_steps": 10853, "loss": 0.1148, "learning_rate": 8.188932459077259e-10, "epoch": 0.9922144930206845, "percentage": 99.23, "elapsed_time": "1 day, 10:03:22", "remaining_time": "0:15:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10770, "total_steps": 10853, "loss": 0.1229, "learning_rate": 7.995128770829641e-10, "epoch": 0.9923066291979545, "percentage": 99.24, "elapsed_time": "1 day, 10:03:33", "remaining_time": "0:15:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10771, "total_steps": 10853, "loss": 0.1261, "learning_rate": 7.803645592927012e-10, "epoch": 0.9923987653752245, "percentage": 99.24, "elapsed_time": "1 day, 10:03:44", "remaining_time": "0:15:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10772, "total_steps": 10853, "loss": 0.1078, "learning_rate": 7.614482943144041e-10, "epoch": 0.9924909015524946, "percentage": 99.25, "elapsed_time": "1 day, 10:03:55", "remaining_time": "0:15:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10773, "total_steps": 10853, "loss": 0.1165, "learning_rate": 7.427640839044458e-10, "epoch": 0.9925830377297646, "percentage": 99.26, "elapsed_time": "1 day, 10:04:06", "remaining_time": "0:15:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10774, "total_steps": 10853, "loss": 0.1301, "learning_rate": 7.243119297981049e-10, "epoch": 0.9926751739070346, "percentage": 99.27, "elapsed_time": "1 day, 10:04:16", "remaining_time": "0:14:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10775, "total_steps": 10853, "loss": 0.1298, "learning_rate": 7.060918337081779e-10, "epoch": 0.9927673100843046, "percentage": 99.28, "elapsed_time": "1 day, 10:04:27", "remaining_time": "0:14:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10776, "total_steps": 10853, "loss": 0.1085, "learning_rate": 6.881037973266447e-10, "epoch": 0.9928594462615746, "percentage": 99.29, "elapsed_time": "1 day, 10:04:38", "remaining_time": "0:14:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10777, "total_steps": 10853, "loss": 0.1183, "learning_rate": 6.703478223235582e-10, "epoch": 0.9929515824388446, "percentage": 99.3, "elapsed_time": "1 day, 10:04:48", "remaining_time": "0:14:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10778, "total_steps": 10853, "loss": 0.1207, "learning_rate": 6.528239103478773e-10, "epoch": 0.9930437186161146, "percentage": 99.31, "elapsed_time": "1 day, 10:04:58", "remaining_time": "0:14:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10779, "total_steps": 10853, "loss": 0.108, "learning_rate": 6.355320630263561e-10, "epoch": 0.9931358547933846, "percentage": 99.32, "elapsed_time": "1 day, 10:05:09", "remaining_time": "0:14:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10780, "total_steps": 10853, "loss": 0.1075, "learning_rate": 6.184722819646549e-10, "epoch": 0.9932279909706546, "percentage": 99.33, "elapsed_time": "1 day, 10:05:20", "remaining_time": "0:13:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10781, "total_steps": 10853, "loss": 0.1195, "learning_rate": 6.016445687467842e-10, "epoch": 0.9933201271479246, "percentage": 99.34, "elapsed_time": "1 day, 10:05:31", "remaining_time": "0:13:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10782, "total_steps": 10853, "loss": 0.1316, "learning_rate": 5.850489249351054e-10, "epoch": 0.9934122633251946, "percentage": 99.35, "elapsed_time": "1 day, 10:05:43", "remaining_time": "0:13:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10783, "total_steps": 10853, "loss": 0.1036, "learning_rate": 5.686853520708857e-10, "epoch": 0.9935043995024646, "percentage": 99.36, "elapsed_time": "1 day, 10:05:53", "remaining_time": "0:13:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10784, "total_steps": 10853, "loss": 0.1088, "learning_rate": 5.525538516729101e-10, "epoch": 0.9935965356797346, "percentage": 99.36, "elapsed_time": "1 day, 10:06:04", "remaining_time": "0:13:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10785, "total_steps": 10853, "loss": 0.1181, "learning_rate": 5.366544252397021e-10, "epoch": 0.9936886718570046, "percentage": 99.37, "elapsed_time": "1 day, 10:06:14", "remaining_time": "0:12:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10786, "total_steps": 10853, "loss": 0.1192, "learning_rate": 5.209870742467482e-10, "epoch": 0.9937808080342747, "percentage": 99.38, "elapsed_time": "1 day, 10:06:25", "remaining_time": "0:12:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10787, "total_steps": 10853, "loss": 0.1158, "learning_rate": 5.055518001492731e-10, "epoch": 0.9938729442115447, "percentage": 99.39, "elapsed_time": "1 day, 10:06:36", "remaining_time": "0:12:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10788, "total_steps": 10853, "loss": 0.1205, "learning_rate": 4.903486043802974e-10, "epoch": 0.9939650803888147, "percentage": 99.4, "elapsed_time": "1 day, 10:06:48", "remaining_time": "0:12:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10789, "total_steps": 10853, "loss": 0.1172, "learning_rate": 4.75377488351747e-10, "epoch": 0.9940572165660847, "percentage": 99.41, "elapsed_time": "1 day, 10:06:58", "remaining_time": "0:12:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10790, "total_steps": 10853, "loss": 0.1096, "learning_rate": 4.6063845345306613e-10, "epoch": 0.9941493527433547, "percentage": 99.42, "elapsed_time": "1 day, 10:07:08", "remaining_time": "0:11:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10791, "total_steps": 10853, "loss": 0.1159, "learning_rate": 4.4613150105315974e-10, "epoch": 0.9942414889206247, "percentage": 99.43, "elapsed_time": "1 day, 10:07:18", "remaining_time": "0:11:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10792, "total_steps": 10853, "loss": 0.1151, "learning_rate": 4.3185663249900587e-10, "epoch": 0.9943336250978947, "percentage": 99.44, "elapsed_time": "1 day, 10:07:29", "remaining_time": "0:11:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10793, "total_steps": 10853, "loss": 0.1106, "learning_rate": 4.1781384911593336e-10, "epoch": 0.9944257612751647, "percentage": 99.45, "elapsed_time": "1 day, 10:07:39", "remaining_time": "0:11:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10794, "total_steps": 10853, "loss": 0.1155, "learning_rate": 4.040031522078991e-10, "epoch": 0.9945178974524347, "percentage": 99.46, "elapsed_time": "1 day, 10:07:48", "remaining_time": "0:11:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10795, "total_steps": 10853, "loss": 0.1182, "learning_rate": 3.904245430569331e-10, "epoch": 0.9946100336297047, "percentage": 99.47, "elapsed_time": "1 day, 10:08:00", "remaining_time": "0:11:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10796, "total_steps": 10853, "loss": 0.1068, "learning_rate": 3.7707802292424877e-10, "epoch": 0.9947021698069747, "percentage": 99.47, "elapsed_time": "1 day, 10:08:10", "remaining_time": "0:10:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10797, "total_steps": 10853, "loss": 0.1169, "learning_rate": 3.639635930491325e-10, "epoch": 0.9947943059842447, "percentage": 99.48, "elapsed_time": "1 day, 10:08:20", "remaining_time": "0:10:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10798, "total_steps": 10853, "loss": 0.1149, "learning_rate": 3.5108125464866636e-10, "epoch": 0.9948864421615147, "percentage": 99.49, "elapsed_time": "1 day, 10:08:32", "remaining_time": "0:10:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10799, "total_steps": 10853, "loss": 0.118, "learning_rate": 3.3843100891939316e-10, "epoch": 0.9949785783387847, "percentage": 99.5, "elapsed_time": "1 day, 10:08:44", "remaining_time": "0:10:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10800, "total_steps": 10853, "loss": 0.1164, "learning_rate": 3.260128570359289e-10, "epoch": 0.9950707145160548, "percentage": 99.51, "elapsed_time": "1 day, 10:08:55", "remaining_time": "0:10:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10801, "total_steps": 10853, "loss": 0.1222, "learning_rate": 3.138268001509626e-10, "epoch": 0.9951628506933248, "percentage": 99.52, "elapsed_time": "1 day, 10:09:04", "remaining_time": "0:09:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10802, "total_steps": 10853, "loss": 0.1253, "learning_rate": 3.018728393963666e-10, "epoch": 0.9952549868705948, "percentage": 99.53, "elapsed_time": "1 day, 10:09:15", "remaining_time": "0:09:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10803, "total_steps": 10853, "loss": 0.1206, "learning_rate": 2.901509758820864e-10, "epoch": 0.9953471230478648, "percentage": 99.54, "elapsed_time": "1 day, 10:09:26", "remaining_time": "0:09:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10804, "total_steps": 10853, "loss": 0.11, "learning_rate": 2.786612106961406e-10, "epoch": 0.9954392592251348, "percentage": 99.55, "elapsed_time": "1 day, 10:09:36", "remaining_time": "0:09:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10805, "total_steps": 10853, "loss": 0.114, "learning_rate": 2.674035449054535e-10, "epoch": 0.9955313954024048, "percentage": 99.56, "elapsed_time": "1 day, 10:09:46", "remaining_time": "0:09:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10806, "total_steps": 10853, "loss": 0.1223, "learning_rate": 2.563779795553001e-10, "epoch": 0.9956235315796748, "percentage": 99.57, "elapsed_time": "1 day, 10:09:58", "remaining_time": "0:08:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10807, "total_steps": 10853, "loss": 0.1231, "learning_rate": 2.455845156695835e-10, "epoch": 0.9957156677569448, "percentage": 99.58, "elapsed_time": "1 day, 10:10:08", "remaining_time": "0:08:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10808, "total_steps": 10853, "loss": 0.0981, "learning_rate": 2.350231542502801e-10, "epoch": 0.9958078039342148, "percentage": 99.59, "elapsed_time": "1 day, 10:10:18", "remaining_time": "0:08:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10809, "total_steps": 10853, "loss": 0.1242, "learning_rate": 2.2469389627827188e-10, "epoch": 0.9958999401114847, "percentage": 99.59, "elapsed_time": "1 day, 10:10:29", "remaining_time": "0:08:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10810, "total_steps": 10853, "loss": 0.1179, "learning_rate": 2.1459674271251397e-10, "epoch": 0.9959920762887547, "percentage": 99.6, "elapsed_time": "1 day, 10:10:41", "remaining_time": "0:08:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10811, "total_steps": 10853, "loss": 0.1181, "learning_rate": 2.0473169449031217e-10, "epoch": 0.9960842124660247, "percentage": 99.61, "elapsed_time": "1 day, 10:10:53", "remaining_time": "0:07:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10812, "total_steps": 10853, "loss": 0.1071, "learning_rate": 1.9509875252787803e-10, "epoch": 0.9961763486432947, "percentage": 99.62, "elapsed_time": "1 day, 10:11:04", "remaining_time": "0:07:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10813, "total_steps": 10853, "loss": 0.1127, "learning_rate": 1.856979177194962e-10, "epoch": 0.9962684848205648, "percentage": 99.63, "elapsed_time": "1 day, 10:11:15", "remaining_time": "0:07:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10814, "total_steps": 10853, "loss": 0.1084, "learning_rate": 1.7652919093807952e-10, "epoch": 0.9963606209978348, "percentage": 99.64, "elapsed_time": "1 day, 10:11:26", "remaining_time": "0:07:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10815, "total_steps": 10853, "loss": 0.1181, "learning_rate": 1.675925730348915e-10, "epoch": 0.9964527571751048, "percentage": 99.65, "elapsed_time": "1 day, 10:11:36", "remaining_time": "0:07:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10816, "total_steps": 10853, "loss": 0.1092, "learning_rate": 1.5888806484010143e-10, "epoch": 0.9965448933523748, "percentage": 99.66, "elapsed_time": "1 day, 10:11:47", "remaining_time": "0:07:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10817, "total_steps": 10853, "loss": 0.1152, "learning_rate": 1.5041566716139656e-10, "epoch": 0.9966370295296448, "percentage": 99.67, "elapsed_time": "1 day, 10:11:58", "remaining_time": "0:06:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10818, "total_steps": 10853, "loss": 0.121, "learning_rate": 1.4217538078536985e-10, "epoch": 0.9967291657069148, "percentage": 99.68, "elapsed_time": "1 day, 10:12:08", "remaining_time": "0:06:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10819, "total_steps": 10853, "loss": 0.1254, "learning_rate": 1.3416720647779768e-10, "epoch": 0.9968213018841848, "percentage": 99.69, "elapsed_time": "1 day, 10:12:19", "remaining_time": "0:06:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10820, "total_steps": 10853, "loss": 0.1228, "learning_rate": 1.263911449816968e-10, "epoch": 0.9969134380614548, "percentage": 99.7, "elapsed_time": "1 day, 10:12:30", "remaining_time": "0:06:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10821, "total_steps": 10853, "loss": 0.1175, "learning_rate": 1.1884719701926727e-10, "epoch": 0.9970055742387248, "percentage": 99.71, "elapsed_time": "1 day, 10:12:40", "remaining_time": "0:06:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10822, "total_steps": 10853, "loss": 0.1171, "learning_rate": 1.1153536329078229e-10, "epoch": 0.9970977104159948, "percentage": 99.71, "elapsed_time": "1 day, 10:12:49", "remaining_time": "0:05:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10823, "total_steps": 10853, "loss": 0.1192, "learning_rate": 1.0445564447542078e-10, "epoch": 0.9971898465932648, "percentage": 99.72, "elapsed_time": "1 day, 10:12:59", "remaining_time": "0:05:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10824, "total_steps": 10853, "loss": 0.1141, "learning_rate": 9.760804123015721e-11, "epoch": 0.9972819827705348, "percentage": 99.73, "elapsed_time": "1 day, 10:13:09", "remaining_time": "0:05:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10825, "total_steps": 10853, "loss": 0.1177, "learning_rate": 9.099255419114938e-11, "epoch": 0.9973741189478048, "percentage": 99.74, "elapsed_time": "1 day, 10:13:19", "remaining_time": "0:05:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10826, "total_steps": 10853, "loss": 0.1128, "learning_rate": 8.460918397262818e-11, "epoch": 0.9974662551250748, "percentage": 99.75, "elapsed_time": "1 day, 10:13:30", "remaining_time": "0:05:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10827, "total_steps": 10853, "loss": 0.1134, "learning_rate": 7.845793116717515e-11, "epoch": 0.9975583913023449, "percentage": 99.76, "elapsed_time": "1 day, 10:13:42", "remaining_time": "0:04:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10828, "total_steps": 10853, "loss": 0.1238, "learning_rate": 7.253879634600003e-11, "epoch": 0.9976505274796149, "percentage": 99.77, "elapsed_time": "1 day, 10:13:54", "remaining_time": "0:04:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10829, "total_steps": 10853, "loss": 0.1114, "learning_rate": 6.685178005838567e-11, "epoch": 0.9977426636568849, "percentage": 99.78, "elapsed_time": "1 day, 10:14:06", "remaining_time": "0:04:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10830, "total_steps": 10853, "loss": 0.1272, "learning_rate": 6.139688283279821e-11, "epoch": 0.9978347998341549, "percentage": 99.79, "elapsed_time": "1 day, 10:14:17", "remaining_time": "0:04:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10831, "total_steps": 10853, "loss": 0.1112, "learning_rate": 5.617410517549937e-11, "epoch": 0.9979269360114249, "percentage": 99.8, "elapsed_time": "1 day, 10:14:28", "remaining_time": "0:04:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10832, "total_steps": 10853, "loss": 0.1272, "learning_rate": 5.118344757165661e-11, "epoch": 0.9980190721886949, "percentage": 99.81, "elapsed_time": "1 day, 10:14:38", "remaining_time": "0:03:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10833, "total_steps": 10853, "loss": 0.1351, "learning_rate": 4.6424910484232924e-11, "epoch": 0.9981112083659649, "percentage": 99.82, "elapsed_time": "1 day, 10:14:51", "remaining_time": "0:03:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10834, "total_steps": 10853, "loss": 0.1033, "learning_rate": 4.189849435565219e-11, "epoch": 0.9982033445432349, "percentage": 99.82, "elapsed_time": "1 day, 10:15:00", "remaining_time": "0:03:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10835, "total_steps": 10853, "loss": 0.1195, "learning_rate": 3.7604199605578705e-11, "epoch": 0.9982954807205049, "percentage": 99.83, "elapsed_time": "1 day, 10:15:12", "remaining_time": "0:03:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10836, "total_steps": 10853, "loss": 0.1267, "learning_rate": 3.35420266328601e-11, "epoch": 0.9983876168977749, "percentage": 99.84, "elapsed_time": "1 day, 10:15:24", "remaining_time": "0:03:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10837, "total_steps": 10853, "loss": 0.1205, "learning_rate": 2.9711975814972205e-11, "epoch": 0.9984797530750449, "percentage": 99.85, "elapsed_time": "1 day, 10:15:35", "remaining_time": "0:03:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10838, "total_steps": 10853, "loss": 0.1177, "learning_rate": 2.6114047507463936e-11, "epoch": 0.9985718892523149, "percentage": 99.86, "elapsed_time": "1 day, 10:15:46", "remaining_time": "0:02:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10839, "total_steps": 10853, "loss": 0.1155, "learning_rate": 2.2748242044234868e-11, "epoch": 0.9986640254295849, "percentage": 99.87, "elapsed_time": "1 day, 10:15:56", "remaining_time": "0:02:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10840, "total_steps": 10853, "loss": 0.1206, "learning_rate": 1.9614559738090345e-11, "epoch": 0.998756161606855, "percentage": 99.88, "elapsed_time": "1 day, 10:16:07", "remaining_time": "0:02:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10841, "total_steps": 10853, "loss": 0.1137, "learning_rate": 1.671300087935368e-11, "epoch": 0.998848297784125, "percentage": 99.89, "elapsed_time": "1 day, 10:16:18", "remaining_time": "0:02:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10842, "total_steps": 10853, "loss": 0.112, "learning_rate": 1.4043565738364184e-11, "epoch": 0.998940433961395, "percentage": 99.9, "elapsed_time": "1 day, 10:16:30", "remaining_time": "0:02:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10843, "total_steps": 10853, "loss": 0.1132, "learning_rate": 1.1606254562146479e-11, "epoch": 0.999032570138665, "percentage": 99.91, "elapsed_time": "1 day, 10:16:41", "remaining_time": "0:01:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10844, "total_steps": 10853, "loss": 0.1083, "learning_rate": 9.401067577463618e-12, "epoch": 0.999124706315935, "percentage": 99.92, "elapsed_time": "1 day, 10:16:51", "remaining_time": "0:01:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10845, "total_steps": 10853, "loss": 0.1201, "learning_rate": 7.428004988874194e-12, "epoch": 0.999216842493205, "percentage": 99.93, "elapsed_time": "1 day, 10:17:02", "remaining_time": "0:01:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10846, "total_steps": 10853, "loss": 0.1133, "learning_rate": 5.687066979565003e-12, "epoch": 0.999308978670475, "percentage": 99.94, "elapsed_time": "1 day, 10:17:13", "remaining_time": "0:01:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10847, "total_steps": 10853, "loss": 0.1123, "learning_rate": 4.178253711351054e-12, "epoch": 0.999401114847745, "percentage": 99.94, "elapsed_time": "1 day, 10:17:23", "remaining_time": "0:01:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10848, "total_steps": 10853, "loss": 0.1194, "learning_rate": 2.9015653243980034e-12, "epoch": 0.999493251025015, "percentage": 99.95, "elapsed_time": "1 day, 10:17:35", "remaining_time": "0:00:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10849, "total_steps": 10853, "loss": 0.1209, "learning_rate": 1.8570019369446025e-12, "epoch": 0.999585387202285, "percentage": 99.96, "elapsed_time": "1 day, 10:17:47", "remaining_time": "0:00:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10850, "total_steps": 10853, "loss": 0.1213, "learning_rate": 1.044563646135366e-12, "epoch": 0.999677523379555, "percentage": 99.97, "elapsed_time": "1 day, 10:17:58", "remaining_time": "0:00:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10851, "total_steps": 10853, "loss": 0.1109, "learning_rate": 4.642505274654596e-13, "epoch": 0.999769659556825, "percentage": 99.98, "elapsed_time": "1 day, 10:18:08", "remaining_time": "0:00:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10852, "total_steps": 10853, "loss": 0.1163, "learning_rate": 1.1606263450314458e-13, "epoch": 0.999861795734095, "percentage": 99.99, "elapsed_time": "1 day, 10:18:19", "remaining_time": "0:00:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10853, "total_steps": 10853, "loss": 0.1287, "learning_rate": 0.0, "epoch": 0.999953931911365, "percentage": 100.0, "elapsed_time": "1 day, 10:18:30", "remaining_time": "0:00:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10853, "total_steps": 10853, "epoch": 0.999953931911365, "percentage": 100.0, "elapsed_time": "1 day, 10:18:30", "remaining_time": "0:00:00", "throughput": "0.00", "total_tokens": 0}