{"current_steps": 1, "total_steps": 1025, "loss": 0.3691, "learning_rate": 9.615384615384617e-08, "epoch": 0.0009754907938056335, "percentage": 0.1, "elapsed_time": "0:00:48", "remaining_time": "13:48:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2, "total_steps": 1025, "loss": 0.3804, "learning_rate": 1.9230769230769234e-07, "epoch": 0.001950981587611267, "percentage": 0.2, "elapsed_time": "0:01:33", "remaining_time": "13:18:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3, "total_steps": 1025, "loss": 0.3682, "learning_rate": 2.884615384615385e-07, "epoch": 0.0029264723814169005, "percentage": 0.29, "elapsed_time": "0:02:20", "remaining_time": "13:16:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4, "total_steps": 1025, "loss": 0.3567, "learning_rate": 3.846153846153847e-07, "epoch": 0.003901963175222534, "percentage": 0.39, "elapsed_time": "0:03:06", "remaining_time": "13:13:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5, "total_steps": 1025, "loss": 0.3773, "learning_rate": 4.807692307692308e-07, "epoch": 0.004877453969028167, "percentage": 0.49, "elapsed_time": "0:03:51", "remaining_time": "13:08:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6, "total_steps": 1025, "loss": 0.3502, "learning_rate": 5.76923076923077e-07, "epoch": 0.005852944762833801, "percentage": 0.59, "elapsed_time": "0:04:42", "remaining_time": "13:20:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7, "total_steps": 1025, "loss": 0.3614, "learning_rate": 6.730769230769231e-07, "epoch": 0.006828435556639434, "percentage": 0.68, "elapsed_time": "0:05:30", "remaining_time": "13:21:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8, "total_steps": 1025, "loss": 0.3463, "learning_rate": 7.692307692307694e-07, "epoch": 0.007803926350445068, "percentage": 0.78, "elapsed_time": "0:06:13", "remaining_time": "13:11:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9, "total_steps": 1025, "loss": 0.3582, "learning_rate": 8.653846153846154e-07, "epoch": 0.008779417144250701, "percentage": 0.88, "elapsed_time": "0:06:58", "remaining_time": "13:07:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10, "total_steps": 1025, "loss": 0.3277, "learning_rate": 9.615384615384617e-07, "epoch": 0.009754907938056334, "percentage": 0.98, "elapsed_time": "0:07:42", "remaining_time": "13:02:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11, "total_steps": 1025, "loss": 0.3411, "learning_rate": 1.0576923076923078e-06, "epoch": 0.010730398731861967, "percentage": 1.07, "elapsed_time": "0:08:30", "remaining_time": "13:04:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12, "total_steps": 1025, "loss": 0.3323, "learning_rate": 1.153846153846154e-06, "epoch": 0.011705889525667602, "percentage": 1.17, "elapsed_time": "0:09:14", "remaining_time": "13:00:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13, "total_steps": 1025, "loss": 0.3201, "learning_rate": 1.25e-06, "epoch": 0.012681380319473235, "percentage": 1.27, "elapsed_time": "0:09:59", "remaining_time": "12:57:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14, "total_steps": 1025, "loss": 0.3458, "learning_rate": 1.3461538461538462e-06, "epoch": 0.013656871113278868, "percentage": 1.37, "elapsed_time": "0:10:44", "remaining_time": "12:55:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15, "total_steps": 1025, "loss": 0.3057, "learning_rate": 1.4423076923076922e-06, "epoch": 0.014632361907084501, "percentage": 1.46, "elapsed_time": "0:11:34", "remaining_time": "12:59:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16, "total_steps": 1025, "loss": 0.2974, "learning_rate": 1.5384615384615387e-06, "epoch": 0.015607852700890136, "percentage": 1.56, "elapsed_time": "0:12:21", "remaining_time": "12:59:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17, "total_steps": 1025, "loss": 0.2738, "learning_rate": 1.6346153846153848e-06, "epoch": 0.016583343494695767, "percentage": 1.66, "elapsed_time": "0:13:09", "remaining_time": "13:00:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18, "total_steps": 1025, "loss": 0.268, "learning_rate": 1.7307692307692308e-06, "epoch": 0.017558834288501402, "percentage": 1.76, "elapsed_time": "0:14:00", "remaining_time": "13:03:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19, "total_steps": 1025, "loss": 0.2851, "learning_rate": 1.826923076923077e-06, "epoch": 0.018534325082307037, "percentage": 1.85, "elapsed_time": "0:14:47", "remaining_time": "13:02:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20, "total_steps": 1025, "loss": 0.2773, "learning_rate": 1.9230769230769234e-06, "epoch": 0.01950981587611267, "percentage": 1.95, "elapsed_time": "0:15:37", "remaining_time": "13:04:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21, "total_steps": 1025, "loss": 0.279, "learning_rate": 2.0192307692307692e-06, "epoch": 0.020485306669918303, "percentage": 2.05, "elapsed_time": "0:16:26", "remaining_time": "13:05:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22, "total_steps": 1025, "loss": 0.2743, "learning_rate": 2.1153846153846155e-06, "epoch": 0.021460797463723934, "percentage": 2.15, "elapsed_time": "0:17:13", "remaining_time": "13:05:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23, "total_steps": 1025, "loss": 0.2694, "learning_rate": 2.211538461538462e-06, "epoch": 0.02243628825752957, "percentage": 2.24, "elapsed_time": "0:18:00", "remaining_time": "13:04:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24, "total_steps": 1025, "loss": 0.2644, "learning_rate": 2.307692307692308e-06, "epoch": 0.023411779051335204, "percentage": 2.34, "elapsed_time": "0:18:45", "remaining_time": "13:02:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 25, "total_steps": 1025, "loss": 0.2419, "learning_rate": 2.403846153846154e-06, "epoch": 0.024387269845140835, "percentage": 2.44, "elapsed_time": "0:19:32", "remaining_time": "13:01:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 26, "total_steps": 1025, "loss": 0.2544, "learning_rate": 2.5e-06, "epoch": 0.02536276063894647, "percentage": 2.54, "elapsed_time": "0:20:16", "remaining_time": "12:59:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 27, "total_steps": 1025, "loss": 0.223, "learning_rate": 2.5961538461538465e-06, "epoch": 0.026338251432752105, "percentage": 2.63, "elapsed_time": "0:21:01", "remaining_time": "12:57:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 28, "total_steps": 1025, "loss": 0.2456, "learning_rate": 2.6923076923076923e-06, "epoch": 0.027313742226557736, "percentage": 2.73, "elapsed_time": "0:21:43", "remaining_time": "12:53:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 29, "total_steps": 1025, "loss": 0.2516, "learning_rate": 2.7884615384615386e-06, "epoch": 0.02828923302036337, "percentage": 2.83, "elapsed_time": "0:22:30", "remaining_time": "12:53:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 30, "total_steps": 1025, "loss": 0.2416, "learning_rate": 2.8846153846153845e-06, "epoch": 0.029264723814169002, "percentage": 2.93, "elapsed_time": "0:23:17", "remaining_time": "12:52:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 31, "total_steps": 1025, "loss": 0.2329, "learning_rate": 2.980769230769231e-06, "epoch": 0.030240214607974637, "percentage": 3.02, "elapsed_time": "0:24:05", "remaining_time": "12:52:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 32, "total_steps": 1025, "loss": 0.2217, "learning_rate": 3.0769230769230774e-06, "epoch": 0.031215705401780272, "percentage": 3.12, "elapsed_time": "0:24:46", "remaining_time": "12:49:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 33, "total_steps": 1025, "loss": 0.2309, "learning_rate": 3.1730769230769233e-06, "epoch": 0.03219119619558591, "percentage": 3.22, "elapsed_time": "0:25:32", "remaining_time": "12:47:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 34, "total_steps": 1025, "loss": 0.2217, "learning_rate": 3.2692307692307696e-06, "epoch": 0.033166686989391535, "percentage": 3.32, "elapsed_time": "0:26:19", "remaining_time": "12:47:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 35, "total_steps": 1025, "loss": 0.2338, "learning_rate": 3.365384615384616e-06, "epoch": 0.03414217778319717, "percentage": 3.41, "elapsed_time": "0:27:05", "remaining_time": "12:46:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 36, "total_steps": 1025, "loss": 0.2137, "learning_rate": 3.4615384615384617e-06, "epoch": 0.035117668577002804, "percentage": 3.51, "elapsed_time": "0:27:51", "remaining_time": "12:45:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 37, "total_steps": 1025, "loss": 0.2162, "learning_rate": 3.557692307692308e-06, "epoch": 0.03609315937080844, "percentage": 3.61, "elapsed_time": "0:28:32", "remaining_time": "12:42:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 38, "total_steps": 1025, "loss": 0.228, "learning_rate": 3.653846153846154e-06, "epoch": 0.037068650164614074, "percentage": 3.71, "elapsed_time": "0:29:21", "remaining_time": "12:42:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 39, "total_steps": 1025, "loss": 0.2106, "learning_rate": 3.7500000000000005e-06, "epoch": 0.0380441409584197, "percentage": 3.8, "elapsed_time": "0:30:04", "remaining_time": "12:40:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 40, "total_steps": 1025, "loss": 0.218, "learning_rate": 3.846153846153847e-06, "epoch": 0.03901963175222534, "percentage": 3.9, "elapsed_time": "0:30:51", "remaining_time": "12:39:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 41, "total_steps": 1025, "loss": 0.2032, "learning_rate": 3.942307692307692e-06, "epoch": 0.03999512254603097, "percentage": 4.0, "elapsed_time": "0:31:37", "remaining_time": "12:39:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 42, "total_steps": 1025, "loss": 0.217, "learning_rate": 4.0384615384615385e-06, "epoch": 0.040970613339836606, "percentage": 4.1, "elapsed_time": "0:32:23", "remaining_time": "12:38:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 43, "total_steps": 1025, "loss": 0.2215, "learning_rate": 4.134615384615385e-06, "epoch": 0.04194610413364224, "percentage": 4.2, "elapsed_time": "0:33:07", "remaining_time": "12:36:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 44, "total_steps": 1025, "loss": 0.2138, "learning_rate": 4.230769230769231e-06, "epoch": 0.04292159492744787, "percentage": 4.29, "elapsed_time": "0:33:59", "remaining_time": "12:37:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 45, "total_steps": 1025, "loss": 0.2113, "learning_rate": 4.326923076923077e-06, "epoch": 0.043897085721253504, "percentage": 4.39, "elapsed_time": "0:34:45", "remaining_time": "12:37:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 46, "total_steps": 1025, "loss": 0.2106, "learning_rate": 4.423076923076924e-06, "epoch": 0.04487257651505914, "percentage": 4.49, "elapsed_time": "0:35:35", "remaining_time": "12:37:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 47, "total_steps": 1025, "loss": 0.2104, "learning_rate": 4.51923076923077e-06, "epoch": 0.04584806730886477, "percentage": 4.59, "elapsed_time": "0:36:22", "remaining_time": "12:36:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 48, "total_steps": 1025, "loss": 0.1981, "learning_rate": 4.615384615384616e-06, "epoch": 0.04682355810267041, "percentage": 4.68, "elapsed_time": "0:37:10", "remaining_time": "12:36:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 49, "total_steps": 1025, "loss": 0.2014, "learning_rate": 4.711538461538462e-06, "epoch": 0.04779904889647604, "percentage": 4.78, "elapsed_time": "0:37:55", "remaining_time": "12:35:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 50, "total_steps": 1025, "loss": 0.1996, "learning_rate": 4.807692307692308e-06, "epoch": 0.04877453969028167, "percentage": 4.88, "elapsed_time": "0:38:36", "remaining_time": "12:32:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 51, "total_steps": 1025, "loss": 0.2052, "learning_rate": 4.903846153846154e-06, "epoch": 0.049750030484087306, "percentage": 4.98, "elapsed_time": "0:39:19", "remaining_time": "12:31:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 52, "total_steps": 1025, "loss": 0.2168, "learning_rate": 5e-06, "epoch": 0.05072552127789294, "percentage": 5.07, "elapsed_time": "0:40:08", "remaining_time": "12:31:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 53, "total_steps": 1025, "loss": 0.2099, "learning_rate": 4.9999869688212956e-06, "epoch": 0.051701012071698575, "percentage": 5.17, "elapsed_time": "0:40:55", "remaining_time": "12:30:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 54, "total_steps": 1025, "loss": 0.1978, "learning_rate": 4.999947875421032e-06, "epoch": 0.05267650286550421, "percentage": 5.27, "elapsed_time": "0:41:46", "remaining_time": "12:31:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 55, "total_steps": 1025, "loss": 0.1934, "learning_rate": 4.999882720206755e-06, "epoch": 0.05365199365930984, "percentage": 5.37, "elapsed_time": "0:42:35", "remaining_time": "12:31:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 56, "total_steps": 1025, "loss": 0.2019, "learning_rate": 4.999791503857704e-06, "epoch": 0.05462748445311547, "percentage": 5.46, "elapsed_time": "0:43:22", "remaining_time": "12:30:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 57, "total_steps": 1025, "loss": 0.2044, "learning_rate": 4.999674227324805e-06, "epoch": 0.05560297524692111, "percentage": 5.56, "elapsed_time": "0:44:02", "remaining_time": "12:27:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 58, "total_steps": 1025, "loss": 0.1972, "learning_rate": 4.9995308918306595e-06, "epoch": 0.05657846604072674, "percentage": 5.66, "elapsed_time": "0:44:50", "remaining_time": "12:27:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 59, "total_steps": 1025, "loss": 0.19, "learning_rate": 4.99936149886953e-06, "epoch": 0.05755395683453238, "percentage": 5.76, "elapsed_time": "0:45:38", "remaining_time": "12:27:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 60, "total_steps": 1025, "loss": 0.1838, "learning_rate": 4.999166050207331e-06, "epoch": 0.058529447628338005, "percentage": 5.85, "elapsed_time": "0:46:24", "remaining_time": "12:26:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 61, "total_steps": 1025, "loss": 0.1906, "learning_rate": 4.9989445478816e-06, "epoch": 0.05950493842214364, "percentage": 5.95, "elapsed_time": "0:47:10", "remaining_time": "12:25:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 62, "total_steps": 1025, "loss": 0.1949, "learning_rate": 4.99869699420149e-06, "epoch": 0.060480429215949275, "percentage": 6.05, "elapsed_time": "0:47:54", "remaining_time": "12:24:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 63, "total_steps": 1025, "loss": 0.1869, "learning_rate": 4.998423391747731e-06, "epoch": 0.06145592000975491, "percentage": 6.15, "elapsed_time": "0:48:40", "remaining_time": "12:23:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 64, "total_steps": 1025, "loss": 0.1832, "learning_rate": 4.998123743372615e-06, "epoch": 0.062431410803560544, "percentage": 6.24, "elapsed_time": "0:49:25", "remaining_time": "12:22:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 65, "total_steps": 1025, "loss": 0.2011, "learning_rate": 4.997798052199959e-06, "epoch": 0.06340690159736617, "percentage": 6.34, "elapsed_time": "0:50:13", "remaining_time": "12:21:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 66, "total_steps": 1025, "loss": 0.1851, "learning_rate": 4.9974463216250735e-06, "epoch": 0.06438239239117181, "percentage": 6.44, "elapsed_time": "0:51:00", "remaining_time": "12:21:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 67, "total_steps": 1025, "loss": 0.1959, "learning_rate": 4.9970685553147316e-06, "epoch": 0.06535788318497744, "percentage": 6.54, "elapsed_time": "0:51:42", "remaining_time": "12:19:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 68, "total_steps": 1025, "loss": 0.1948, "learning_rate": 4.996664757207124e-06, "epoch": 0.06633337397878307, "percentage": 6.63, "elapsed_time": "0:52:31", "remaining_time": "12:19:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 69, "total_steps": 1025, "loss": 0.1959, "learning_rate": 4.996234931511823e-06, "epoch": 0.06730886477258871, "percentage": 6.73, "elapsed_time": "0:53:15", "remaining_time": "12:17:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 70, "total_steps": 1025, "loss": 0.1962, "learning_rate": 4.995779082709739e-06, "epoch": 0.06828435556639434, "percentage": 6.83, "elapsed_time": "0:54:01", "remaining_time": "12:17:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 71, "total_steps": 1025, "loss": 0.1806, "learning_rate": 4.995297215553067e-06, "epoch": 0.06925984636019998, "percentage": 6.93, "elapsed_time": "0:54:48", "remaining_time": "12:16:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 72, "total_steps": 1025, "loss": 0.2044, "learning_rate": 4.994789335065245e-06, "epoch": 0.07023533715400561, "percentage": 7.02, "elapsed_time": "0:55:37", "remaining_time": "12:16:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 73, "total_steps": 1025, "loss": 0.1934, "learning_rate": 4.9942554465409e-06, "epoch": 0.07121082794781124, "percentage": 7.12, "elapsed_time": "0:56:23", "remaining_time": "12:15:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 74, "total_steps": 1025, "loss": 0.1905, "learning_rate": 4.993695555545789e-06, "epoch": 0.07218631874161688, "percentage": 7.22, "elapsed_time": "0:57:07", "remaining_time": "12:14:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 75, "total_steps": 1025, "loss": 0.193, "learning_rate": 4.993109667916742e-06, "epoch": 0.0731618095354225, "percentage": 7.32, "elapsed_time": "0:57:52", "remaining_time": "12:13:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 76, "total_steps": 1025, "loss": 0.1793, "learning_rate": 4.992497789761606e-06, "epoch": 0.07413730032922815, "percentage": 7.41, "elapsed_time": "0:58:40", "remaining_time": "12:12:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 77, "total_steps": 1025, "loss": 0.2023, "learning_rate": 4.991859927459174e-06, "epoch": 0.07511279112303378, "percentage": 7.51, "elapsed_time": "0:59:28", "remaining_time": "12:12:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 78, "total_steps": 1025, "loss": 0.1858, "learning_rate": 4.991196087659125e-06, "epoch": 0.0760882819168394, "percentage": 7.61, "elapsed_time": "1:00:15", "remaining_time": "12:11:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 79, "total_steps": 1025, "loss": 0.1843, "learning_rate": 4.990506277281952e-06, "epoch": 0.07706377271064505, "percentage": 7.71, "elapsed_time": "1:00:57", "remaining_time": "12:09:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 80, "total_steps": 1025, "loss": 0.1775, "learning_rate": 4.989790503518888e-06, "epoch": 0.07803926350445067, "percentage": 7.8, "elapsed_time": "1:01:36", "remaining_time": "12:07:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 81, "total_steps": 1025, "loss": 0.1879, "learning_rate": 4.989048773831834e-06, "epoch": 0.07901475429825632, "percentage": 7.9, "elapsed_time": "1:02:24", "remaining_time": "12:07:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 82, "total_steps": 1025, "loss": 0.1712, "learning_rate": 4.988281095953279e-06, "epoch": 0.07999024509206194, "percentage": 8.0, "elapsed_time": "1:03:15", "remaining_time": "12:07:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 83, "total_steps": 1025, "loss": 0.1806, "learning_rate": 4.987487477886221e-06, "epoch": 0.08096573588586757, "percentage": 8.1, "elapsed_time": "1:04:03", "remaining_time": "12:06:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 84, "total_steps": 1025, "loss": 0.172, "learning_rate": 4.986667927904084e-06, "epoch": 0.08194122667967321, "percentage": 8.2, "elapsed_time": "1:04:47", "remaining_time": "12:05:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 85, "total_steps": 1025, "loss": 0.1775, "learning_rate": 4.985822454550629e-06, "epoch": 0.08291671747347884, "percentage": 8.29, "elapsed_time": "1:05:31", "remaining_time": "12:04:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 86, "total_steps": 1025, "loss": 0.1872, "learning_rate": 4.984951066639869e-06, "epoch": 0.08389220826728448, "percentage": 8.39, "elapsed_time": "1:06:15", "remaining_time": "12:03:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 87, "total_steps": 1025, "loss": 0.1848, "learning_rate": 4.984053773255971e-06, "epoch": 0.08486769906109011, "percentage": 8.49, "elapsed_time": "1:07:00", "remaining_time": "12:02:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 88, "total_steps": 1025, "loss": 0.1789, "learning_rate": 4.9831305837531684e-06, "epoch": 0.08584318985489574, "percentage": 8.59, "elapsed_time": "1:07:44", "remaining_time": "12:01:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 89, "total_steps": 1025, "loss": 0.1763, "learning_rate": 4.98218150775566e-06, "epoch": 0.08681868064870138, "percentage": 8.68, "elapsed_time": "1:08:31", "remaining_time": "12:00:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 90, "total_steps": 1025, "loss": 0.1746, "learning_rate": 4.9812065551575075e-06, "epoch": 0.08779417144250701, "percentage": 8.78, "elapsed_time": "1:09:20", "remaining_time": "12:00:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 91, "total_steps": 1025, "loss": 0.2019, "learning_rate": 4.9802057361225375e-06, "epoch": 0.08876966223631265, "percentage": 8.88, "elapsed_time": "1:10:07", "remaining_time": "11:59:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 92, "total_steps": 1025, "loss": 0.1725, "learning_rate": 4.97917906108423e-06, "epoch": 0.08974515303011828, "percentage": 8.98, "elapsed_time": "1:10:55", "remaining_time": "11:59:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 93, "total_steps": 1025, "loss": 0.1804, "learning_rate": 4.978126540745615e-06, "epoch": 0.0907206438239239, "percentage": 9.07, "elapsed_time": "1:11:42", "remaining_time": "11:58:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 94, "total_steps": 1025, "loss": 0.2011, "learning_rate": 4.977048186079155e-06, "epoch": 0.09169613461772955, "percentage": 9.17, "elapsed_time": "1:12:27", "remaining_time": "11:57:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 95, "total_steps": 1025, "loss": 0.1835, "learning_rate": 4.975944008326638e-06, "epoch": 0.09267162541153517, "percentage": 9.27, "elapsed_time": "1:13:13", "remaining_time": "11:56:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 96, "total_steps": 1025, "loss": 0.1824, "learning_rate": 4.974814018999053e-06, "epoch": 0.09364711620534082, "percentage": 9.37, "elapsed_time": "1:14:00", "remaining_time": "11:56:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 97, "total_steps": 1025, "loss": 0.189, "learning_rate": 4.973658229876476e-06, "epoch": 0.09462260699914644, "percentage": 9.46, "elapsed_time": "1:14:44", "remaining_time": "11:55:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 98, "total_steps": 1025, "loss": 0.1832, "learning_rate": 4.97247665300794e-06, "epoch": 0.09559809779295209, "percentage": 9.56, "elapsed_time": "1:15:32", "remaining_time": "11:54:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 99, "total_steps": 1025, "loss": 0.1766, "learning_rate": 4.971269300711318e-06, "epoch": 0.09657358858675771, "percentage": 9.66, "elapsed_time": "1:16:19", "remaining_time": "11:53:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 100, "total_steps": 1025, "loss": 0.1805, "learning_rate": 4.970036185573189e-06, "epoch": 0.09754907938056334, "percentage": 9.76, "elapsed_time": "1:17:04", "remaining_time": "11:52:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 101, "total_steps": 1025, "loss": 0.1836, "learning_rate": 4.968777320448707e-06, "epoch": 0.09852457017436898, "percentage": 9.85, "elapsed_time": "1:17:51", "remaining_time": "11:52:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 102, "total_steps": 1025, "loss": 0.1767, "learning_rate": 4.96749271846147e-06, "epoch": 0.09950006096817461, "percentage": 9.95, "elapsed_time": "1:18:36", "remaining_time": "11:51:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 103, "total_steps": 1025, "loss": 0.1912, "learning_rate": 4.96618239300338e-06, "epoch": 0.10047555176198025, "percentage": 10.05, "elapsed_time": "1:19:20", "remaining_time": "11:50:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 104, "total_steps": 1025, "loss": 0.1726, "learning_rate": 4.964846357734505e-06, "epoch": 0.10145104255578588, "percentage": 10.15, "elapsed_time": "1:20:07", "remaining_time": "11:49:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 105, "total_steps": 1025, "loss": 0.1787, "learning_rate": 4.963484626582937e-06, "epoch": 0.10242653334959151, "percentage": 10.24, "elapsed_time": "1:20:51", "remaining_time": "11:48:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 106, "total_steps": 1025, "loss": 0.179, "learning_rate": 4.9620972137446456e-06, "epoch": 0.10340202414339715, "percentage": 10.34, "elapsed_time": "1:21:34", "remaining_time": "11:47:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 107, "total_steps": 1025, "loss": 0.1765, "learning_rate": 4.96068413368333e-06, "epoch": 0.10437751493720278, "percentage": 10.44, "elapsed_time": "1:22:21", "remaining_time": "11:46:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 108, "total_steps": 1025, "loss": 0.172, "learning_rate": 4.959245401130269e-06, "epoch": 0.10535300573100842, "percentage": 10.54, "elapsed_time": "1:23:08", "remaining_time": "11:45:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 109, "total_steps": 1025, "loss": 0.1805, "learning_rate": 4.957781031084169e-06, "epoch": 0.10632849652481405, "percentage": 10.63, "elapsed_time": "1:23:54", "remaining_time": "11:45:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 110, "total_steps": 1025, "loss": 0.1853, "learning_rate": 4.956291038811003e-06, "epoch": 0.10730398731861968, "percentage": 10.73, "elapsed_time": "1:24:41", "remaining_time": "11:44:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 111, "total_steps": 1025, "loss": 0.1873, "learning_rate": 4.954775439843855e-06, "epoch": 0.10827947811242532, "percentage": 10.83, "elapsed_time": "1:25:28", "remaining_time": "11:43:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 112, "total_steps": 1025, "loss": 0.185, "learning_rate": 4.9532342499827584e-06, "epoch": 0.10925496890623095, "percentage": 10.93, "elapsed_time": "1:26:17", "remaining_time": "11:43:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 113, "total_steps": 1025, "loss": 0.1892, "learning_rate": 4.95166748529453e-06, "epoch": 0.11023045970003659, "percentage": 11.02, "elapsed_time": "1:27:02", "remaining_time": "11:42:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 114, "total_steps": 1025, "loss": 0.1735, "learning_rate": 4.950075162112602e-06, "epoch": 0.11120595049384221, "percentage": 11.12, "elapsed_time": "1:27:46", "remaining_time": "11:41:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 115, "total_steps": 1025, "loss": 0.1838, "learning_rate": 4.9484572970368516e-06, "epoch": 0.11218144128764784, "percentage": 11.22, "elapsed_time": "1:28:31", "remaining_time": "11:40:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 116, "total_steps": 1025, "loss": 0.1874, "learning_rate": 4.946813906933432e-06, "epoch": 0.11315693208145348, "percentage": 11.32, "elapsed_time": "1:29:15", "remaining_time": "11:39:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 117, "total_steps": 1025, "loss": 0.1738, "learning_rate": 4.94514500893459e-06, "epoch": 0.11413242287525911, "percentage": 11.41, "elapsed_time": "1:29:59", "remaining_time": "11:38:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 118, "total_steps": 1025, "loss": 0.1752, "learning_rate": 4.943450620438491e-06, "epoch": 0.11510791366906475, "percentage": 11.51, "elapsed_time": "1:30:47", "remaining_time": "11:37:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 119, "total_steps": 1025, "loss": 0.1818, "learning_rate": 4.941730759109041e-06, "epoch": 0.11608340446287038, "percentage": 11.61, "elapsed_time": "1:31:33", "remaining_time": "11:37:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 120, "total_steps": 1025, "loss": 0.1799, "learning_rate": 4.939985442875695e-06, "epoch": 0.11705889525667601, "percentage": 11.71, "elapsed_time": "1:32:21", "remaining_time": "11:36:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 121, "total_steps": 1025, "loss": 0.1735, "learning_rate": 4.938214689933276e-06, "epoch": 0.11803438605048165, "percentage": 11.8, "elapsed_time": "1:33:06", "remaining_time": "11:35:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 122, "total_steps": 1025, "loss": 0.1868, "learning_rate": 4.93641851874178e-06, "epoch": 0.11900987684428728, "percentage": 11.9, "elapsed_time": "1:33:50", "remaining_time": "11:34:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 123, "total_steps": 1025, "loss": 0.1829, "learning_rate": 4.9345969480261925e-06, "epoch": 0.11998536763809292, "percentage": 12.0, "elapsed_time": "1:34:36", "remaining_time": "11:33:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 124, "total_steps": 1025, "loss": 0.1731, "learning_rate": 4.932749996776282e-06, "epoch": 0.12096085843189855, "percentage": 12.1, "elapsed_time": "1:35:21", "remaining_time": "11:32:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 125, "total_steps": 1025, "loss": 0.1886, "learning_rate": 4.93087768424641e-06, "epoch": 0.12193634922570418, "percentage": 12.2, "elapsed_time": "1:36:09", "remaining_time": "11:32:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 126, "total_steps": 1025, "loss": 0.1821, "learning_rate": 4.928980029955329e-06, "epoch": 0.12291184001950982, "percentage": 12.29, "elapsed_time": "1:36:53", "remaining_time": "11:31:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 127, "total_steps": 1025, "loss": 0.1801, "learning_rate": 4.927057053685975e-06, "epoch": 0.12388733081331545, "percentage": 12.39, "elapsed_time": "1:37:38", "remaining_time": "11:30:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 128, "total_steps": 1025, "loss": 0.1796, "learning_rate": 4.925108775485269e-06, "epoch": 0.12486282160712109, "percentage": 12.49, "elapsed_time": "1:38:24", "remaining_time": "11:29:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 129, "total_steps": 1025, "loss": 0.1654, "learning_rate": 4.923135215663897e-06, "epoch": 0.12583831240092672, "percentage": 12.59, "elapsed_time": "1:39:07", "remaining_time": "11:28:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 130, "total_steps": 1025, "loss": 0.1803, "learning_rate": 4.921136394796109e-06, "epoch": 0.12681380319473234, "percentage": 12.68, "elapsed_time": "1:39:50", "remaining_time": "11:27:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 131, "total_steps": 1025, "loss": 0.1878, "learning_rate": 4.919112333719498e-06, "epoch": 0.12778929398853797, "percentage": 12.78, "elapsed_time": "1:40:34", "remaining_time": "11:26:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 132, "total_steps": 1025, "loss": 0.1771, "learning_rate": 4.9170630535347866e-06, "epoch": 0.12876478478234363, "percentage": 12.88, "elapsed_time": "1:41:19", "remaining_time": "11:25:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 133, "total_steps": 1025, "loss": 0.1893, "learning_rate": 4.914988575605602e-06, "epoch": 0.12974027557614926, "percentage": 12.98, "elapsed_time": "1:42:04", "remaining_time": "11:24:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 134, "total_steps": 1025, "loss": 0.1728, "learning_rate": 4.91288892155826e-06, "epoch": 0.13071576636995488, "percentage": 13.07, "elapsed_time": "1:42:47", "remaining_time": "11:23:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 135, "total_steps": 1025, "loss": 0.1836, "learning_rate": 4.910764113281533e-06, "epoch": 0.1316912571637605, "percentage": 13.17, "elapsed_time": "1:43:32", "remaining_time": "11:22:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 136, "total_steps": 1025, "loss": 0.1757, "learning_rate": 4.908614172926426e-06, "epoch": 0.13266674795756614, "percentage": 13.27, "elapsed_time": "1:44:15", "remaining_time": "11:21:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 137, "total_steps": 1025, "loss": 0.161, "learning_rate": 4.906439122905946e-06, "epoch": 0.1336422387513718, "percentage": 13.37, "elapsed_time": "1:45:01", "remaining_time": "11:20:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 138, "total_steps": 1025, "loss": 0.1644, "learning_rate": 4.904238985894864e-06, "epoch": 0.13461772954517742, "percentage": 13.46, "elapsed_time": "1:45:49", "remaining_time": "11:20:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 139, "total_steps": 1025, "loss": 0.1541, "learning_rate": 4.902013784829483e-06, "epoch": 0.13559322033898305, "percentage": 13.56, "elapsed_time": "1:46:34", "remaining_time": "11:19:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 140, "total_steps": 1025, "loss": 0.1689, "learning_rate": 4.899763542907399e-06, "epoch": 0.13656871113278868, "percentage": 13.66, "elapsed_time": "1:47:23", "remaining_time": "11:18:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 141, "total_steps": 1025, "loss": 0.1764, "learning_rate": 4.897488283587253e-06, "epoch": 0.1375442019265943, "percentage": 13.76, "elapsed_time": "1:48:09", "remaining_time": "11:18:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 142, "total_steps": 1025, "loss": 0.1671, "learning_rate": 4.895188030588495e-06, "epoch": 0.13851969272039996, "percentage": 13.85, "elapsed_time": "1:48:56", "remaining_time": "11:17:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 143, "total_steps": 1025, "loss": 0.1723, "learning_rate": 4.892862807891131e-06, "epoch": 0.1394951835142056, "percentage": 13.95, "elapsed_time": "1:49:43", "remaining_time": "11:16:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 144, "total_steps": 1025, "loss": 0.1585, "learning_rate": 4.890512639735475e-06, "epoch": 0.14047067430801122, "percentage": 14.05, "elapsed_time": "1:50:26", "remaining_time": "11:15:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 145, "total_steps": 1025, "loss": 0.1667, "learning_rate": 4.888137550621897e-06, "epoch": 0.14144616510181685, "percentage": 14.15, "elapsed_time": "1:51:11", "remaining_time": "11:14:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 146, "total_steps": 1025, "loss": 0.1748, "learning_rate": 4.885737565310565e-06, "epoch": 0.14242165589562247, "percentage": 14.24, "elapsed_time": "1:51:57", "remaining_time": "11:14:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 147, "total_steps": 1025, "loss": 0.172, "learning_rate": 4.883312708821188e-06, "epoch": 0.14339714668942813, "percentage": 14.34, "elapsed_time": "1:52:43", "remaining_time": "11:13:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 148, "total_steps": 1025, "loss": 0.1704, "learning_rate": 4.880863006432758e-06, "epoch": 0.14437263748323376, "percentage": 14.44, "elapsed_time": "1:53:24", "remaining_time": "11:11:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 149, "total_steps": 1025, "loss": 0.1779, "learning_rate": 4.878388483683281e-06, "epoch": 0.14534812827703938, "percentage": 14.54, "elapsed_time": "1:54:06", "remaining_time": "11:10:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 150, "total_steps": 1025, "loss": 0.1733, "learning_rate": 4.8758891663695165e-06, "epoch": 0.146323619070845, "percentage": 14.63, "elapsed_time": "1:54:51", "remaining_time": "11:10:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 151, "total_steps": 1025, "loss": 0.1883, "learning_rate": 4.873365080546706e-06, "epoch": 0.14729910986465064, "percentage": 14.73, "elapsed_time": "1:55:38", "remaining_time": "11:09:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 152, "total_steps": 1025, "loss": 0.1725, "learning_rate": 4.870816252528298e-06, "epoch": 0.1482746006584563, "percentage": 14.83, "elapsed_time": "1:56:24", "remaining_time": "11:08:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 153, "total_steps": 1025, "loss": 0.1855, "learning_rate": 4.868242708885681e-06, "epoch": 0.14925009145226192, "percentage": 14.93, "elapsed_time": "1:57:10", "remaining_time": "11:07:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 154, "total_steps": 1025, "loss": 0.1815, "learning_rate": 4.8656444764479005e-06, "epoch": 0.15022558224606755, "percentage": 15.02, "elapsed_time": "1:57:57", "remaining_time": "11:07:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 155, "total_steps": 1025, "loss": 0.171, "learning_rate": 4.863021582301381e-06, "epoch": 0.15120107303987318, "percentage": 15.12, "elapsed_time": "1:58:42", "remaining_time": "11:06:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 156, "total_steps": 1025, "loss": 0.1703, "learning_rate": 4.860374053789643e-06, "epoch": 0.1521765638336788, "percentage": 15.22, "elapsed_time": "1:59:27", "remaining_time": "11:05:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 157, "total_steps": 1025, "loss": 0.1762, "learning_rate": 4.857701918513023e-06, "epoch": 0.15315205462748446, "percentage": 15.32, "elapsed_time": "2:00:17", "remaining_time": "11:05:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 158, "total_steps": 1025, "loss": 0.159, "learning_rate": 4.855005204328378e-06, "epoch": 0.1541275454212901, "percentage": 15.41, "elapsed_time": "2:01:04", "remaining_time": "11:04:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 159, "total_steps": 1025, "loss": 0.1701, "learning_rate": 4.8522839393487976e-06, "epoch": 0.15510303621509572, "percentage": 15.51, "elapsed_time": "2:01:48", "remaining_time": "11:03:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 160, "total_steps": 1025, "loss": 0.1742, "learning_rate": 4.849538151943316e-06, "epoch": 0.15607852700890135, "percentage": 15.61, "elapsed_time": "2:02:34", "remaining_time": "11:02:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 161, "total_steps": 1025, "loss": 0.173, "learning_rate": 4.84676787073661e-06, "epoch": 0.15705401780270697, "percentage": 15.71, "elapsed_time": "2:03:23", "remaining_time": "11:02:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 162, "total_steps": 1025, "loss": 0.1732, "learning_rate": 4.843973124608703e-06, "epoch": 0.15802950859651263, "percentage": 15.8, "elapsed_time": "2:04:10", "remaining_time": "11:01:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 163, "total_steps": 1025, "loss": 0.1665, "learning_rate": 4.841153942694664e-06, "epoch": 0.15900499939031826, "percentage": 15.9, "elapsed_time": "2:05:01", "remaining_time": "11:01:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 164, "total_steps": 1025, "loss": 0.1684, "learning_rate": 4.838310354384304e-06, "epoch": 0.15998049018412389, "percentage": 16.0, "elapsed_time": "2:05:46", "remaining_time": "11:00:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 165, "total_steps": 1025, "loss": 0.1692, "learning_rate": 4.835442389321867e-06, "epoch": 0.1609559809779295, "percentage": 16.1, "elapsed_time": "2:06:32", "remaining_time": "10:59:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 166, "total_steps": 1025, "loss": 0.1563, "learning_rate": 4.832550077405727e-06, "epoch": 0.16193147177173514, "percentage": 16.2, "elapsed_time": "2:07:21", "remaining_time": "10:59:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 167, "total_steps": 1025, "loss": 0.1796, "learning_rate": 4.829633448788072e-06, "epoch": 0.1629069625655408, "percentage": 16.29, "elapsed_time": "2:08:09", "remaining_time": "10:58:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 168, "total_steps": 1025, "loss": 0.1736, "learning_rate": 4.826692533874586e-06, "epoch": 0.16388245335934642, "percentage": 16.39, "elapsed_time": "2:08:56", "remaining_time": "10:57:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 169, "total_steps": 1025, "loss": 0.1763, "learning_rate": 4.823727363324142e-06, "epoch": 0.16485794415315205, "percentage": 16.49, "elapsed_time": "2:09:47", "remaining_time": "10:57:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 170, "total_steps": 1025, "loss": 0.1735, "learning_rate": 4.820737968048471e-06, "epoch": 0.16583343494695768, "percentage": 16.59, "elapsed_time": "2:10:32", "remaining_time": "10:56:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 171, "total_steps": 1025, "loss": 0.1843, "learning_rate": 4.8177243792118515e-06, "epoch": 0.1668089257407633, "percentage": 16.68, "elapsed_time": "2:11:21", "remaining_time": "10:56:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 172, "total_steps": 1025, "loss": 0.1719, "learning_rate": 4.8146866282307725e-06, "epoch": 0.16778441653456896, "percentage": 16.78, "elapsed_time": "2:12:07", "remaining_time": "10:55:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 173, "total_steps": 1025, "loss": 0.1597, "learning_rate": 4.811624746773616e-06, "epoch": 0.1687599073283746, "percentage": 16.88, "elapsed_time": "2:12:53", "remaining_time": "10:54:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 174, "total_steps": 1025, "loss": 0.1539, "learning_rate": 4.808538766760321e-06, "epoch": 0.16973539812218022, "percentage": 16.98, "elapsed_time": "2:13:42", "remaining_time": "10:53:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 175, "total_steps": 1025, "loss": 0.1682, "learning_rate": 4.805428720362054e-06, "epoch": 0.17071088891598585, "percentage": 17.07, "elapsed_time": "2:14:29", "remaining_time": "10:53:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 176, "total_steps": 1025, "loss": 0.1687, "learning_rate": 4.8022946400008705e-06, "epoch": 0.17168637970979148, "percentage": 17.17, "elapsed_time": "2:15:12", "remaining_time": "10:52:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 177, "total_steps": 1025, "loss": 0.1812, "learning_rate": 4.79913655834938e-06, "epoch": 0.17266187050359713, "percentage": 17.27, "elapsed_time": "2:16:01", "remaining_time": "10:51:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 178, "total_steps": 1025, "loss": 0.1721, "learning_rate": 4.795954508330403e-06, "epoch": 0.17363736129740276, "percentage": 17.37, "elapsed_time": "2:16:46", "remaining_time": "10:50:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 179, "total_steps": 1025, "loss": 0.1708, "learning_rate": 4.79274852311663e-06, "epoch": 0.1746128520912084, "percentage": 17.46, "elapsed_time": "2:17:33", "remaining_time": "10:50:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 180, "total_steps": 1025, "loss": 0.1639, "learning_rate": 4.7895186361302736e-06, "epoch": 0.17558834288501401, "percentage": 17.56, "elapsed_time": "2:18:20", "remaining_time": "10:49:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 181, "total_steps": 1025, "loss": 0.1544, "learning_rate": 4.786264881042722e-06, "epoch": 0.17656383367881964, "percentage": 17.66, "elapsed_time": "2:19:11", "remaining_time": "10:49:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 182, "total_steps": 1025, "loss": 0.1586, "learning_rate": 4.782987291774186e-06, "epoch": 0.1775393244726253, "percentage": 17.76, "elapsed_time": "2:19:58", "remaining_time": "10:48:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 183, "total_steps": 1025, "loss": 0.1703, "learning_rate": 4.779685902493346e-06, "epoch": 0.17851481526643093, "percentage": 17.85, "elapsed_time": "2:20:46", "remaining_time": "10:47:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 184, "total_steps": 1025, "loss": 0.1536, "learning_rate": 4.776360747616999e-06, "epoch": 0.17949030606023655, "percentage": 17.95, "elapsed_time": "2:21:31", "remaining_time": "10:46:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 185, "total_steps": 1025, "loss": 0.1729, "learning_rate": 4.773011861809694e-06, "epoch": 0.18046579685404218, "percentage": 18.05, "elapsed_time": "2:22:20", "remaining_time": "10:46:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 186, "total_steps": 1025, "loss": 0.1745, "learning_rate": 4.769639279983372e-06, "epoch": 0.1814412876478478, "percentage": 18.15, "elapsed_time": "2:23:07", "remaining_time": "10:45:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 187, "total_steps": 1025, "loss": 0.1651, "learning_rate": 4.76624303729701e-06, "epoch": 0.18241677844165347, "percentage": 18.24, "elapsed_time": "2:23:55", "remaining_time": "10:44:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 188, "total_steps": 1025, "loss": 0.1642, "learning_rate": 4.762823169156242e-06, "epoch": 0.1833922692354591, "percentage": 18.34, "elapsed_time": "2:24:44", "remaining_time": "10:44:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 189, "total_steps": 1025, "loss": 0.1701, "learning_rate": 4.7593797112129995e-06, "epoch": 0.18436776002926472, "percentage": 18.44, "elapsed_time": "2:25:32", "remaining_time": "10:43:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 190, "total_steps": 1025, "loss": 0.1619, "learning_rate": 4.755912699365135e-06, "epoch": 0.18534325082307035, "percentage": 18.54, "elapsed_time": "2:26:18", "remaining_time": "10:42:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 191, "total_steps": 1025, "loss": 0.1541, "learning_rate": 4.752422169756048e-06, "epoch": 0.18631874161687598, "percentage": 18.63, "elapsed_time": "2:27:05", "remaining_time": "10:42:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 192, "total_steps": 1025, "loss": 0.1583, "learning_rate": 4.748908158774312e-06, "epoch": 0.18729423241068163, "percentage": 18.73, "elapsed_time": "2:27:56", "remaining_time": "10:41:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 193, "total_steps": 1025, "loss": 0.1685, "learning_rate": 4.745370703053291e-06, "epoch": 0.18826972320448726, "percentage": 18.83, "elapsed_time": "2:28:40", "remaining_time": "10:40:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 194, "total_steps": 1025, "loss": 0.1624, "learning_rate": 4.741809839470758e-06, "epoch": 0.1892452139982929, "percentage": 18.93, "elapsed_time": "2:29:26", "remaining_time": "10:40:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 195, "total_steps": 1025, "loss": 0.171, "learning_rate": 4.738225605148514e-06, "epoch": 0.19022070479209852, "percentage": 19.02, "elapsed_time": "2:30:14", "remaining_time": "10:39:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 196, "total_steps": 1025, "loss": 0.1677, "learning_rate": 4.734618037451997e-06, "epoch": 0.19119619558590417, "percentage": 19.12, "elapsed_time": "2:30:56", "remaining_time": "10:38:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 197, "total_steps": 1025, "loss": 0.1654, "learning_rate": 4.730987173989894e-06, "epoch": 0.1921716863797098, "percentage": 19.22, "elapsed_time": "2:31:44", "remaining_time": "10:37:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 198, "total_steps": 1025, "loss": 0.1689, "learning_rate": 4.727333052613749e-06, "epoch": 0.19314717717351543, "percentage": 19.32, "elapsed_time": "2:32:29", "remaining_time": "10:36:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 199, "total_steps": 1025, "loss": 0.153, "learning_rate": 4.7236557114175705e-06, "epoch": 0.19412266796732106, "percentage": 19.41, "elapsed_time": "2:33:15", "remaining_time": "10:36:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 200, "total_steps": 1025, "loss": 0.1738, "learning_rate": 4.71995518873743e-06, "epoch": 0.19509815876112668, "percentage": 19.51, "elapsed_time": "2:34:00", "remaining_time": "10:35:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 201, "total_steps": 1025, "loss": 0.1621, "learning_rate": 4.716231523151065e-06, "epoch": 0.19607364955493234, "percentage": 19.61, "elapsed_time": "2:34:45", "remaining_time": "10:34:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 202, "total_steps": 1025, "loss": 0.1608, "learning_rate": 4.712484753477478e-06, "epoch": 0.19704914034873797, "percentage": 19.71, "elapsed_time": "2:35:35", "remaining_time": "10:33:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 203, "total_steps": 1025, "loss": 0.1712, "learning_rate": 4.708714918776527e-06, "epoch": 0.1980246311425436, "percentage": 19.8, "elapsed_time": "2:36:19", "remaining_time": "10:32:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 204, "total_steps": 1025, "loss": 0.1586, "learning_rate": 4.704922058348526e-06, "epoch": 0.19900012193634922, "percentage": 19.9, "elapsed_time": "2:37:06", "remaining_time": "10:32:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 205, "total_steps": 1025, "loss": 0.1633, "learning_rate": 4.701106211733827e-06, "epoch": 0.19997561273015485, "percentage": 20.0, "elapsed_time": "2:37:55", "remaining_time": "10:31:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 206, "total_steps": 1025, "loss": 0.1682, "learning_rate": 4.697267418712415e-06, "epoch": 0.2009511035239605, "percentage": 20.1, "elapsed_time": "2:38:44", "remaining_time": "10:31:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 207, "total_steps": 1025, "loss": 0.158, "learning_rate": 4.693405719303487e-06, "epoch": 0.20192659431776613, "percentage": 20.2, "elapsed_time": "2:39:33", "remaining_time": "10:30:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 208, "total_steps": 1025, "loss": 0.1585, "learning_rate": 4.689521153765039e-06, "epoch": 0.20290208511157176, "percentage": 20.29, "elapsed_time": "2:40:19", "remaining_time": "10:29:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 209, "total_steps": 1025, "loss": 0.1664, "learning_rate": 4.685613762593446e-06, "epoch": 0.2038775759053774, "percentage": 20.39, "elapsed_time": "2:41:07", "remaining_time": "10:29:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 210, "total_steps": 1025, "loss": 0.1678, "learning_rate": 4.681683586523037e-06, "epoch": 0.20485306669918302, "percentage": 20.49, "elapsed_time": "2:41:52", "remaining_time": "10:28:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 211, "total_steps": 1025, "loss": 0.1661, "learning_rate": 4.677730666525675e-06, "epoch": 0.20582855749298867, "percentage": 20.59, "elapsed_time": "2:42:36", "remaining_time": "10:27:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 212, "total_steps": 1025, "loss": 0.1629, "learning_rate": 4.673755043810324e-06, "epoch": 0.2068040482867943, "percentage": 20.68, "elapsed_time": "2:43:22", "remaining_time": "10:26:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 213, "total_steps": 1025, "loss": 0.1641, "learning_rate": 4.669756759822625e-06, "epoch": 0.20777953908059993, "percentage": 20.78, "elapsed_time": "2:44:08", "remaining_time": "10:25:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 214, "total_steps": 1025, "loss": 0.1689, "learning_rate": 4.66573585624446e-06, "epoch": 0.20875502987440556, "percentage": 20.88, "elapsed_time": "2:44:57", "remaining_time": "10:25:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 215, "total_steps": 1025, "loss": 0.1624, "learning_rate": 4.661692374993519e-06, "epoch": 0.20973052066821118, "percentage": 20.98, "elapsed_time": "2:45:43", "remaining_time": "10:24:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 216, "total_steps": 1025, "loss": 0.1756, "learning_rate": 4.657626358222864e-06, "epoch": 0.21070601146201684, "percentage": 21.07, "elapsed_time": "2:46:30", "remaining_time": "10:23:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 217, "total_steps": 1025, "loss": 0.1602, "learning_rate": 4.653537848320488e-06, "epoch": 0.21168150225582247, "percentage": 21.17, "elapsed_time": "2:47:15", "remaining_time": "10:22:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 218, "total_steps": 1025, "loss": 0.161, "learning_rate": 4.6494268879088745e-06, "epoch": 0.2126569930496281, "percentage": 21.27, "elapsed_time": "2:48:04", "remaining_time": "10:22:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 219, "total_steps": 1025, "loss": 0.169, "learning_rate": 4.6452935198445496e-06, "epoch": 0.21363248384343372, "percentage": 21.37, "elapsed_time": "2:48:47", "remaining_time": "10:21:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 220, "total_steps": 1025, "loss": 0.1686, "learning_rate": 4.64113778721764e-06, "epoch": 0.21460797463723935, "percentage": 21.46, "elapsed_time": "2:49:31", "remaining_time": "10:20:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 221, "total_steps": 1025, "loss": 0.1581, "learning_rate": 4.636959733351422e-06, "epoch": 0.215583465431045, "percentage": 21.56, "elapsed_time": "2:50:16", "remaining_time": "10:19:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 222, "total_steps": 1025, "loss": 0.1592, "learning_rate": 4.632759401801869e-06, "epoch": 0.21655895622485064, "percentage": 21.66, "elapsed_time": "2:51:02", "remaining_time": "10:18:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 223, "total_steps": 1025, "loss": 0.166, "learning_rate": 4.628536836357196e-06, "epoch": 0.21753444701865626, "percentage": 21.76, "elapsed_time": "2:51:46", "remaining_time": "10:17:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 224, "total_steps": 1025, "loss": 0.1542, "learning_rate": 4.6242920810374095e-06, "epoch": 0.2185099378124619, "percentage": 21.85, "elapsed_time": "2:52:32", "remaining_time": "10:17:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 225, "total_steps": 1025, "loss": 0.1725, "learning_rate": 4.62002518009384e-06, "epoch": 0.21948542860626752, "percentage": 21.95, "elapsed_time": "2:53:20", "remaining_time": "10:16:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 226, "total_steps": 1025, "loss": 0.1566, "learning_rate": 4.615736178008687e-06, "epoch": 0.22046091940007317, "percentage": 22.05, "elapsed_time": "2:54:05", "remaining_time": "10:15:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 227, "total_steps": 1025, "loss": 0.158, "learning_rate": 4.611425119494552e-06, "epoch": 0.2214364101938788, "percentage": 22.15, "elapsed_time": "2:54:50", "remaining_time": "10:14:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 228, "total_steps": 1025, "loss": 0.1633, "learning_rate": 4.607092049493973e-06, "epoch": 0.22241190098768443, "percentage": 22.24, "elapsed_time": "2:55:36", "remaining_time": "10:13:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 229, "total_steps": 1025, "loss": 0.1622, "learning_rate": 4.6027370131789614e-06, "epoch": 0.22338739178149006, "percentage": 22.34, "elapsed_time": "2:56:20", "remaining_time": "10:12:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 230, "total_steps": 1025, "loss": 0.1596, "learning_rate": 4.5983600559505196e-06, "epoch": 0.22436288257529569, "percentage": 22.44, "elapsed_time": "2:57:02", "remaining_time": "10:11:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 231, "total_steps": 1025, "loss": 0.1707, "learning_rate": 4.593961223438177e-06, "epoch": 0.22533837336910134, "percentage": 22.54, "elapsed_time": "2:57:49", "remaining_time": "10:11:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 232, "total_steps": 1025, "loss": 0.149, "learning_rate": 4.589540561499512e-06, "epoch": 0.22631386416290697, "percentage": 22.63, "elapsed_time": "2:58:34", "remaining_time": "10:10:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 233, "total_steps": 1025, "loss": 0.1666, "learning_rate": 4.585098116219674e-06, "epoch": 0.2272893549567126, "percentage": 22.73, "elapsed_time": "2:59:22", "remaining_time": "10:09:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 234, "total_steps": 1025, "loss": 0.1582, "learning_rate": 4.580633933910901e-06, "epoch": 0.22826484575051822, "percentage": 22.83, "elapsed_time": "3:00:04", "remaining_time": "10:08:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 235, "total_steps": 1025, "loss": 0.1798, "learning_rate": 4.576148061112039e-06, "epoch": 0.22924033654432385, "percentage": 22.93, "elapsed_time": "3:00:50", "remaining_time": "10:07:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 236, "total_steps": 1025, "loss": 0.1568, "learning_rate": 4.571640544588056e-06, "epoch": 0.2302158273381295, "percentage": 23.02, "elapsed_time": "3:01:39", "remaining_time": "10:07:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 237, "total_steps": 1025, "loss": 0.1556, "learning_rate": 4.567111431329555e-06, "epoch": 0.23119131813193514, "percentage": 23.12, "elapsed_time": "3:02:23", "remaining_time": "10:06:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 238, "total_steps": 1025, "loss": 0.1603, "learning_rate": 4.562560768552283e-06, "epoch": 0.23216680892574076, "percentage": 23.22, "elapsed_time": "3:03:07", "remaining_time": "10:05:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 239, "total_steps": 1025, "loss": 0.1458, "learning_rate": 4.55798860369664e-06, "epoch": 0.2331422997195464, "percentage": 23.32, "elapsed_time": "3:03:52", "remaining_time": "10:04:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 240, "total_steps": 1025, "loss": 0.1621, "learning_rate": 4.553394984427184e-06, "epoch": 0.23411779051335202, "percentage": 23.41, "elapsed_time": "3:04:40", "remaining_time": "10:04:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 241, "total_steps": 1025, "loss": 0.1568, "learning_rate": 4.548779958632134e-06, "epoch": 0.23509328130715768, "percentage": 23.51, "elapsed_time": "3:05:22", "remaining_time": "10:03:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 242, "total_steps": 1025, "loss": 0.1408, "learning_rate": 4.54414357442287e-06, "epoch": 0.2360687721009633, "percentage": 23.61, "elapsed_time": "3:06:06", "remaining_time": "10:02:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 243, "total_steps": 1025, "loss": 0.1609, "learning_rate": 4.539485880133433e-06, "epoch": 0.23704426289476893, "percentage": 23.71, "elapsed_time": "3:06:52", "remaining_time": "10:01:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 244, "total_steps": 1025, "loss": 0.1528, "learning_rate": 4.534806924320021e-06, "epoch": 0.23801975368857456, "percentage": 23.8, "elapsed_time": "3:07:40", "remaining_time": "10:00:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 245, "total_steps": 1025, "loss": 0.1607, "learning_rate": 4.5301067557604815e-06, "epoch": 0.2389952444823802, "percentage": 23.9, "elapsed_time": "3:08:24", "remaining_time": "9:59:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 246, "total_steps": 1025, "loss": 0.1621, "learning_rate": 4.525385423453803e-06, "epoch": 0.23997073527618584, "percentage": 24.0, "elapsed_time": "3:09:07", "remaining_time": "9:58:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 247, "total_steps": 1025, "loss": 0.1562, "learning_rate": 4.520642976619607e-06, "epoch": 0.24094622606999147, "percentage": 24.1, "elapsed_time": "3:09:52", "remaining_time": "9:58:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 248, "total_steps": 1025, "loss": 0.1524, "learning_rate": 4.515879464697629e-06, "epoch": 0.2419217168637971, "percentage": 24.2, "elapsed_time": "3:10:36", "remaining_time": "9:57:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 249, "total_steps": 1025, "loss": 0.1589, "learning_rate": 4.51109493734721e-06, "epoch": 0.24289720765760273, "percentage": 24.29, "elapsed_time": "3:11:24", "remaining_time": "9:56:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 250, "total_steps": 1025, "loss": 0.1661, "learning_rate": 4.506289444446775e-06, "epoch": 0.24387269845140835, "percentage": 24.39, "elapsed_time": "3:12:10", "remaining_time": "9:55:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 251, "total_steps": 1025, "loss": 0.1525, "learning_rate": 4.5014630360933136e-06, "epoch": 0.244848189245214, "percentage": 24.49, "elapsed_time": "3:12:56", "remaining_time": "9:54:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 252, "total_steps": 1025, "loss": 0.1553, "learning_rate": 4.496615762601857e-06, "epoch": 0.24582368003901964, "percentage": 24.59, "elapsed_time": "3:13:45", "remaining_time": "9:54:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 253, "total_steps": 1025, "loss": 0.1613, "learning_rate": 4.491747674504956e-06, "epoch": 0.24679917083282527, "percentage": 24.68, "elapsed_time": "3:14:34", "remaining_time": "9:53:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 254, "total_steps": 1025, "loss": 0.1561, "learning_rate": 4.48685882255215e-06, "epoch": 0.2477746616266309, "percentage": 24.78, "elapsed_time": "3:15:19", "remaining_time": "9:52:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 255, "total_steps": 1025, "loss": 0.1581, "learning_rate": 4.481949257709442e-06, "epoch": 0.24875015242043652, "percentage": 24.88, "elapsed_time": "3:16:03", "remaining_time": "9:52:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 256, "total_steps": 1025, "loss": 0.1635, "learning_rate": 4.477019031158767e-06, "epoch": 0.24972564321424218, "percentage": 24.98, "elapsed_time": "3:16:50", "remaining_time": "9:51:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 257, "total_steps": 1025, "loss": 0.1535, "learning_rate": 4.472068194297453e-06, "epoch": 0.2507011340080478, "percentage": 25.07, "elapsed_time": "3:17:35", "remaining_time": "9:50:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 258, "total_steps": 1025, "loss": 0.1419, "learning_rate": 4.467096798737694e-06, "epoch": 0.25167662480185343, "percentage": 25.17, "elapsed_time": "3:18:20", "remaining_time": "9:49:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 259, "total_steps": 1025, "loss": 0.1509, "learning_rate": 4.462104896306004e-06, "epoch": 0.2526521155956591, "percentage": 25.27, "elapsed_time": "3:19:05", "remaining_time": "9:48:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 260, "total_steps": 1025, "loss": 0.1503, "learning_rate": 4.457092539042682e-06, "epoch": 0.2536276063894647, "percentage": 25.37, "elapsed_time": "3:19:48", "remaining_time": "9:47:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 261, "total_steps": 1025, "loss": 0.1524, "learning_rate": 4.452059779201267e-06, "epoch": 0.25460309718327034, "percentage": 25.46, "elapsed_time": "3:20:37", "remaining_time": "9:47:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 262, "total_steps": 1025, "loss": 0.1599, "learning_rate": 4.44700666924799e-06, "epoch": 0.25557858797707594, "percentage": 25.56, "elapsed_time": "3:21:23", "remaining_time": "9:46:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 263, "total_steps": 1025, "loss": 0.1603, "learning_rate": 4.441933261861239e-06, "epoch": 0.2565540787708816, "percentage": 25.66, "elapsed_time": "3:22:12", "remaining_time": "9:45:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 264, "total_steps": 1025, "loss": 0.166, "learning_rate": 4.436839609930992e-06, "epoch": 0.25752956956468726, "percentage": 25.76, "elapsed_time": "3:23:00", "remaining_time": "9:45:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 265, "total_steps": 1025, "loss": 0.1592, "learning_rate": 4.431725766558284e-06, "epoch": 0.25850506035849286, "percentage": 25.85, "elapsed_time": "3:23:49", "remaining_time": "9:44:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 266, "total_steps": 1025, "loss": 0.1692, "learning_rate": 4.426591785054637e-06, "epoch": 0.2594805511522985, "percentage": 25.95, "elapsed_time": "3:24:36", "remaining_time": "9:43:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 267, "total_steps": 1025, "loss": 0.1546, "learning_rate": 4.421437718941517e-06, "epoch": 0.2604560419461041, "percentage": 26.05, "elapsed_time": "3:25:23", "remaining_time": "9:43:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 268, "total_steps": 1025, "loss": 0.158, "learning_rate": 4.416263621949769e-06, "epoch": 0.26143153273990977, "percentage": 26.15, "elapsed_time": "3:26:10", "remaining_time": "9:42:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 269, "total_steps": 1025, "loss": 0.1549, "learning_rate": 4.41106954801906e-06, "epoch": 0.2624070235337154, "percentage": 26.24, "elapsed_time": "3:26:56", "remaining_time": "9:41:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 270, "total_steps": 1025, "loss": 0.1526, "learning_rate": 4.4058555512973135e-06, "epoch": 0.263382514327521, "percentage": 26.34, "elapsed_time": "3:27:42", "remaining_time": "9:40:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 271, "total_steps": 1025, "loss": 0.1507, "learning_rate": 4.4006216861401475e-06, "epoch": 0.2643580051213267, "percentage": 26.44, "elapsed_time": "3:28:29", "remaining_time": "9:40:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 272, "total_steps": 1025, "loss": 0.1609, "learning_rate": 4.395368007110307e-06, "epoch": 0.2653334959151323, "percentage": 26.54, "elapsed_time": "3:29:13", "remaining_time": "9:39:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 273, "total_steps": 1025, "loss": 0.1517, "learning_rate": 4.390094568977099e-06, "epoch": 0.26630898670893793, "percentage": 26.63, "elapsed_time": "3:29:57", "remaining_time": "9:38:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 274, "total_steps": 1025, "loss": 0.1509, "learning_rate": 4.384801426715814e-06, "epoch": 0.2672844775027436, "percentage": 26.73, "elapsed_time": "3:30:41", "remaining_time": "9:37:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 275, "total_steps": 1025, "loss": 0.1479, "learning_rate": 4.379488635507157e-06, "epoch": 0.2682599682965492, "percentage": 26.83, "elapsed_time": "3:31:25", "remaining_time": "9:36:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 276, "total_steps": 1025, "loss": 0.1532, "learning_rate": 4.3741562507366754e-06, "epoch": 0.26923545909035485, "percentage": 26.93, "elapsed_time": "3:32:13", "remaining_time": "9:35:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 277, "total_steps": 1025, "loss": 0.1579, "learning_rate": 4.368804327994174e-06, "epoch": 0.27021094988416045, "percentage": 27.02, "elapsed_time": "3:33:01", "remaining_time": "9:35:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 278, "total_steps": 1025, "loss": 0.1543, "learning_rate": 4.363432923073144e-06, "epoch": 0.2711864406779661, "percentage": 27.12, "elapsed_time": "3:33:47", "remaining_time": "9:34:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 279, "total_steps": 1025, "loss": 0.1584, "learning_rate": 4.3580420919701745e-06, "epoch": 0.27216193147177176, "percentage": 27.22, "elapsed_time": "3:34:31", "remaining_time": "9:33:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 280, "total_steps": 1025, "loss": 0.1547, "learning_rate": 4.352631890884373e-06, "epoch": 0.27313742226557736, "percentage": 27.32, "elapsed_time": "3:35:14", "remaining_time": "9:32:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 281, "total_steps": 1025, "loss": 0.1648, "learning_rate": 4.347202376216775e-06, "epoch": 0.274112913059383, "percentage": 27.41, "elapsed_time": "3:36:03", "remaining_time": "9:32:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 282, "total_steps": 1025, "loss": 0.1488, "learning_rate": 4.341753604569764e-06, "epoch": 0.2750884038531886, "percentage": 27.51, "elapsed_time": "3:36:52", "remaining_time": "9:31:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 283, "total_steps": 1025, "loss": 0.155, "learning_rate": 4.336285632746472e-06, "epoch": 0.27606389464699427, "percentage": 27.61, "elapsed_time": "3:37:37", "remaining_time": "9:30:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 284, "total_steps": 1025, "loss": 0.138, "learning_rate": 4.330798517750194e-06, "epoch": 0.2770393854407999, "percentage": 27.71, "elapsed_time": "3:38:21", "remaining_time": "9:29:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 285, "total_steps": 1025, "loss": 0.1533, "learning_rate": 4.3252923167837905e-06, "epoch": 0.2780148762346055, "percentage": 27.8, "elapsed_time": "3:39:04", "remaining_time": "9:28:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 286, "total_steps": 1025, "loss": 0.1588, "learning_rate": 4.319767087249094e-06, "epoch": 0.2789903670284112, "percentage": 27.9, "elapsed_time": "3:39:51", "remaining_time": "9:28:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 287, "total_steps": 1025, "loss": 0.1546, "learning_rate": 4.314222886746304e-06, "epoch": 0.2799658578222168, "percentage": 28.0, "elapsed_time": "3:40:39", "remaining_time": "9:27:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 288, "total_steps": 1025, "loss": 0.1677, "learning_rate": 4.308659773073398e-06, "epoch": 0.28094134861602243, "percentage": 28.1, "elapsed_time": "3:41:22", "remaining_time": "9:26:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 289, "total_steps": 1025, "loss": 0.1626, "learning_rate": 4.303077804225517e-06, "epoch": 0.2819168394098281, "percentage": 28.2, "elapsed_time": "3:42:11", "remaining_time": "9:25:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 290, "total_steps": 1025, "loss": 0.1675, "learning_rate": 4.297477038394368e-06, "epoch": 0.2828923302036337, "percentage": 28.29, "elapsed_time": "3:42:59", "remaining_time": "9:25:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 291, "total_steps": 1025, "loss": 0.1574, "learning_rate": 4.291857533967616e-06, "epoch": 0.28386782099743935, "percentage": 28.39, "elapsed_time": "3:43:47", "remaining_time": "9:24:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 292, "total_steps": 1025, "loss": 0.1557, "learning_rate": 4.286219349528274e-06, "epoch": 0.28484331179124495, "percentage": 28.49, "elapsed_time": "3:44:29", "remaining_time": "9:23:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 293, "total_steps": 1025, "loss": 0.1645, "learning_rate": 4.280562543854091e-06, "epoch": 0.2858188025850506, "percentage": 28.59, "elapsed_time": "3:45:16", "remaining_time": "9:22:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 294, "total_steps": 1025, "loss": 0.1567, "learning_rate": 4.274887175916946e-06, "epoch": 0.28679429337885626, "percentage": 28.68, "elapsed_time": "3:46:01", "remaining_time": "9:21:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 295, "total_steps": 1025, "loss": 0.16, "learning_rate": 4.269193304882226e-06, "epoch": 0.28776978417266186, "percentage": 28.78, "elapsed_time": "3:46:52", "remaining_time": "9:21:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 296, "total_steps": 1025, "loss": 0.1578, "learning_rate": 4.263480990108212e-06, "epoch": 0.2887452749664675, "percentage": 28.88, "elapsed_time": "3:47:37", "remaining_time": "9:20:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 297, "total_steps": 1025, "loss": 0.1594, "learning_rate": 4.257750291145457e-06, "epoch": 0.2897207657602731, "percentage": 28.98, "elapsed_time": "3:48:21", "remaining_time": "9:19:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 298, "total_steps": 1025, "loss": 0.1555, "learning_rate": 4.252001267736174e-06, "epoch": 0.29069625655407877, "percentage": 29.07, "elapsed_time": "3:49:06", "remaining_time": "9:18:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 299, "total_steps": 1025, "loss": 0.1603, "learning_rate": 4.246233979813602e-06, "epoch": 0.2916717473478844, "percentage": 29.17, "elapsed_time": "3:49:51", "remaining_time": "9:18:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 300, "total_steps": 1025, "loss": 0.1491, "learning_rate": 4.24044848750139e-06, "epoch": 0.29264723814169, "percentage": 29.27, "elapsed_time": "3:50:32", "remaining_time": "9:17:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 301, "total_steps": 1025, "loss": 0.1607, "learning_rate": 4.234644851112965e-06, "epoch": 0.2936227289354957, "percentage": 29.37, "elapsed_time": "3:51:18", "remaining_time": "9:16:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 302, "total_steps": 1025, "loss": 0.1521, "learning_rate": 4.228823131150904e-06, "epoch": 0.2945982197293013, "percentage": 29.46, "elapsed_time": "3:52:04", "remaining_time": "9:15:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 303, "total_steps": 1025, "loss": 0.1616, "learning_rate": 4.222983388306308e-06, "epoch": 0.29557371052310694, "percentage": 29.56, "elapsed_time": "3:52:50", "remaining_time": "9:14:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 304, "total_steps": 1025, "loss": 0.1581, "learning_rate": 4.217125683458162e-06, "epoch": 0.2965492013169126, "percentage": 29.66, "elapsed_time": "3:53:37", "remaining_time": "9:14:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 305, "total_steps": 1025, "loss": 0.1492, "learning_rate": 4.211250077672704e-06, "epoch": 0.2975246921107182, "percentage": 29.76, "elapsed_time": "3:54:24", "remaining_time": "9:13:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 306, "total_steps": 1025, "loss": 0.1587, "learning_rate": 4.20535663220279e-06, "epoch": 0.29850018290452385, "percentage": 29.85, "elapsed_time": "3:55:11", "remaining_time": "9:12:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 307, "total_steps": 1025, "loss": 0.1593, "learning_rate": 4.199445408487253e-06, "epoch": 0.29947567369832945, "percentage": 29.95, "elapsed_time": "3:55:56", "remaining_time": "9:11:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 308, "total_steps": 1025, "loss": 0.151, "learning_rate": 4.1935164681502626e-06, "epoch": 0.3004511644921351, "percentage": 30.05, "elapsed_time": "3:56:43", "remaining_time": "9:11:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 309, "total_steps": 1025, "loss": 0.1629, "learning_rate": 4.187569873000684e-06, "epoch": 0.30142665528594076, "percentage": 30.15, "elapsed_time": "3:57:31", "remaining_time": "9:10:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 310, "total_steps": 1025, "loss": 0.1734, "learning_rate": 4.181605685031433e-06, "epoch": 0.30240214607974636, "percentage": 30.24, "elapsed_time": "3:58:20", "remaining_time": "9:09:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 311, "total_steps": 1025, "loss": 0.1509, "learning_rate": 4.1756239664188275e-06, "epoch": 0.303377636873552, "percentage": 30.34, "elapsed_time": "3:59:08", "remaining_time": "9:09:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 312, "total_steps": 1025, "loss": 0.1571, "learning_rate": 4.169624779521944e-06, "epoch": 0.3043531276673576, "percentage": 30.44, "elapsed_time": "3:59:55", "remaining_time": "9:08:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 313, "total_steps": 1025, "loss": 0.1628, "learning_rate": 4.163608186881964e-06, "epoch": 0.30532861846116327, "percentage": 30.54, "elapsed_time": "4:00:40", "remaining_time": "9:07:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 314, "total_steps": 1025, "loss": 0.1595, "learning_rate": 4.157574251221522e-06, "epoch": 0.3063041092549689, "percentage": 30.63, "elapsed_time": "4:01:25", "remaining_time": "9:06:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 315, "total_steps": 1025, "loss": 0.1524, "learning_rate": 4.1515230354440526e-06, "epoch": 0.3072796000487745, "percentage": 30.73, "elapsed_time": "4:02:09", "remaining_time": "9:05:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 316, "total_steps": 1025, "loss": 0.1619, "learning_rate": 4.145454602633137e-06, "epoch": 0.3082550908425802, "percentage": 30.83, "elapsed_time": "4:02:52", "remaining_time": "9:04:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 317, "total_steps": 1025, "loss": 0.1603, "learning_rate": 4.139369016051838e-06, "epoch": 0.3092305816363858, "percentage": 30.93, "elapsed_time": "4:03:38", "remaining_time": "9:04:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 318, "total_steps": 1025, "loss": 0.1604, "learning_rate": 4.1332663391420515e-06, "epoch": 0.31020607243019144, "percentage": 31.02, "elapsed_time": "4:04:24", "remaining_time": "9:03:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 319, "total_steps": 1025, "loss": 0.1437, "learning_rate": 4.127146635523835e-06, "epoch": 0.3111815632239971, "percentage": 31.12, "elapsed_time": "4:05:11", "remaining_time": "9:02:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 320, "total_steps": 1025, "loss": 0.1506, "learning_rate": 4.121009968994751e-06, "epoch": 0.3121570540178027, "percentage": 31.22, "elapsed_time": "4:06:00", "remaining_time": "9:01:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 321, "total_steps": 1025, "loss": 0.1463, "learning_rate": 4.114856403529196e-06, "epoch": 0.31313254481160835, "percentage": 31.32, "elapsed_time": "4:06:46", "remaining_time": "9:01:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 322, "total_steps": 1025, "loss": 0.1615, "learning_rate": 4.10868600327774e-06, "epoch": 0.31410803560541395, "percentage": 31.41, "elapsed_time": "4:07:33", "remaining_time": "9:00:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 323, "total_steps": 1025, "loss": 0.1537, "learning_rate": 4.102498832566454e-06, "epoch": 0.3150835263992196, "percentage": 31.51, "elapsed_time": "4:08:19", "remaining_time": "8:59:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 324, "total_steps": 1025, "loss": 0.1611, "learning_rate": 4.096294955896239e-06, "epoch": 0.31605901719302526, "percentage": 31.61, "elapsed_time": "4:09:08", "remaining_time": "8:59:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 325, "total_steps": 1025, "loss": 0.1533, "learning_rate": 4.090074437942155e-06, "epoch": 0.31703450798683086, "percentage": 31.71, "elapsed_time": "4:09:49", "remaining_time": "8:58:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 326, "total_steps": 1025, "loss": 0.1493, "learning_rate": 4.083837343552749e-06, "epoch": 0.3180099987806365, "percentage": 31.8, "elapsed_time": "4:10:33", "remaining_time": "8:57:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 327, "total_steps": 1025, "loss": 0.1424, "learning_rate": 4.077583737749373e-06, "epoch": 0.3189854895744421, "percentage": 31.9, "elapsed_time": "4:11:22", "remaining_time": "8:56:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 328, "total_steps": 1025, "loss": 0.1523, "learning_rate": 4.07131368572551e-06, "epoch": 0.31996098036824777, "percentage": 32.0, "elapsed_time": "4:12:09", "remaining_time": "8:55:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 329, "total_steps": 1025, "loss": 0.1539, "learning_rate": 4.0650272528460955e-06, "epoch": 0.3209364711620534, "percentage": 32.1, "elapsed_time": "4:12:52", "remaining_time": "8:54:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 330, "total_steps": 1025, "loss": 0.1377, "learning_rate": 4.058724504646834e-06, "epoch": 0.321911961955859, "percentage": 32.2, "elapsed_time": "4:13:33", "remaining_time": "8:54:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 331, "total_steps": 1025, "loss": 0.1534, "learning_rate": 4.052405506833516e-06, "epoch": 0.3228874527496647, "percentage": 32.29, "elapsed_time": "4:14:18", "remaining_time": "8:53:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 332, "total_steps": 1025, "loss": 0.1471, "learning_rate": 4.046070325281333e-06, "epoch": 0.3238629435434703, "percentage": 32.39, "elapsed_time": "4:15:03", "remaining_time": "8:52:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 333, "total_steps": 1025, "loss": 0.1403, "learning_rate": 4.039719026034191e-06, "epoch": 0.32483843433727594, "percentage": 32.49, "elapsed_time": "4:15:49", "remaining_time": "8:51:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 334, "total_steps": 1025, "loss": 0.1365, "learning_rate": 4.0333516753040225e-06, "epoch": 0.3258139251310816, "percentage": 32.59, "elapsed_time": "4:16:34", "remaining_time": "8:50:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 335, "total_steps": 1025, "loss": 0.1446, "learning_rate": 4.026968339470097e-06, "epoch": 0.3267894159248872, "percentage": 32.68, "elapsed_time": "4:17:17", "remaining_time": "8:49:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 336, "total_steps": 1025, "loss": 0.1553, "learning_rate": 4.020569085078324e-06, "epoch": 0.32776490671869285, "percentage": 32.78, "elapsed_time": "4:18:03", "remaining_time": "8:49:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 337, "total_steps": 1025, "loss": 0.1457, "learning_rate": 4.014153978840568e-06, "epoch": 0.32874039751249845, "percentage": 32.88, "elapsed_time": "4:18:48", "remaining_time": "8:48:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 338, "total_steps": 1025, "loss": 0.1567, "learning_rate": 4.007723087633943e-06, "epoch": 0.3297158883063041, "percentage": 32.98, "elapsed_time": "4:19:36", "remaining_time": "8:47:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 339, "total_steps": 1025, "loss": 0.1564, "learning_rate": 4.001276478500127e-06, "epoch": 0.33069137910010976, "percentage": 33.07, "elapsed_time": "4:20:20", "remaining_time": "8:46:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 340, "total_steps": 1025, "loss": 0.1409, "learning_rate": 3.994814218644649e-06, "epoch": 0.33166686989391536, "percentage": 33.17, "elapsed_time": "4:21:05", "remaining_time": "8:46:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 341, "total_steps": 1025, "loss": 0.1472, "learning_rate": 3.988336375436201e-06, "epoch": 0.332642360687721, "percentage": 33.27, "elapsed_time": "4:21:50", "remaining_time": "8:45:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 342, "total_steps": 1025, "loss": 0.1518, "learning_rate": 3.981843016405928e-06, "epoch": 0.3336178514815266, "percentage": 33.37, "elapsed_time": "4:22:34", "remaining_time": "8:44:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 343, "total_steps": 1025, "loss": 0.1448, "learning_rate": 3.975334209246727e-06, "epoch": 0.3345933422753323, "percentage": 33.46, "elapsed_time": "4:23:24", "remaining_time": "8:43:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 344, "total_steps": 1025, "loss": 0.1555, "learning_rate": 3.968810021812544e-06, "epoch": 0.33556883306913793, "percentage": 33.56, "elapsed_time": "4:24:13", "remaining_time": "8:43:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 345, "total_steps": 1025, "loss": 0.1457, "learning_rate": 3.962270522117659e-06, "epoch": 0.33654432386294353, "percentage": 33.66, "elapsed_time": "4:25:02", "remaining_time": "8:42:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 346, "total_steps": 1025, "loss": 0.1538, "learning_rate": 3.955715778335984e-06, "epoch": 0.3375198146567492, "percentage": 33.76, "elapsed_time": "4:25:48", "remaining_time": "8:41:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 347, "total_steps": 1025, "loss": 0.1481, "learning_rate": 3.949145858800348e-06, "epoch": 0.3384953054505548, "percentage": 33.85, "elapsed_time": "4:26:38", "remaining_time": "8:40:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 348, "total_steps": 1025, "loss": 0.1503, "learning_rate": 3.942560832001789e-06, "epoch": 0.33947079624436044, "percentage": 33.95, "elapsed_time": "4:27:24", "remaining_time": "8:40:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 349, "total_steps": 1025, "loss": 0.1528, "learning_rate": 3.935960766588835e-06, "epoch": 0.3404462870381661, "percentage": 34.05, "elapsed_time": "4:28:05", "remaining_time": "8:39:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 350, "total_steps": 1025, "loss": 0.1436, "learning_rate": 3.9293457313667905e-06, "epoch": 0.3414217778319717, "percentage": 34.15, "elapsed_time": "4:28:52", "remaining_time": "8:38:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 351, "total_steps": 1025, "loss": 0.1482, "learning_rate": 3.922715795297022e-06, "epoch": 0.34239726862577735, "percentage": 34.24, "elapsed_time": "4:29:41", "remaining_time": "8:37:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 352, "total_steps": 1025, "loss": 0.1445, "learning_rate": 3.916071027496234e-06, "epoch": 0.34337275941958295, "percentage": 34.34, "elapsed_time": "4:30:26", "remaining_time": "8:37:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 353, "total_steps": 1025, "loss": 0.1473, "learning_rate": 3.909411497235752e-06, "epoch": 0.3443482502133886, "percentage": 34.44, "elapsed_time": "4:31:13", "remaining_time": "8:36:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 354, "total_steps": 1025, "loss": 0.1471, "learning_rate": 3.902737273940799e-06, "epoch": 0.34532374100719426, "percentage": 34.54, "elapsed_time": "4:31:56", "remaining_time": "8:35:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 355, "total_steps": 1025, "loss": 0.1527, "learning_rate": 3.8960484271897736e-06, "epoch": 0.34629923180099986, "percentage": 34.63, "elapsed_time": "4:32:44", "remaining_time": "8:34:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 356, "total_steps": 1025, "loss": 0.1534, "learning_rate": 3.889345026713519e-06, "epoch": 0.3472747225948055, "percentage": 34.73, "elapsed_time": "4:33:30", "remaining_time": "8:33:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 357, "total_steps": 1025, "loss": 0.1486, "learning_rate": 3.882627142394605e-06, "epoch": 0.3482502133886111, "percentage": 34.83, "elapsed_time": "4:34:12", "remaining_time": "8:33:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 358, "total_steps": 1025, "loss": 0.1531, "learning_rate": 3.875894844266592e-06, "epoch": 0.3492257041824168, "percentage": 34.93, "elapsed_time": "4:34:54", "remaining_time": "8:32:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 359, "total_steps": 1025, "loss": 0.1606, "learning_rate": 3.869148202513303e-06, "epoch": 0.35020119497622243, "percentage": 35.02, "elapsed_time": "4:35:40", "remaining_time": "8:31:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 360, "total_steps": 1025, "loss": 0.137, "learning_rate": 3.862387287468095e-06, "epoch": 0.35117668577002803, "percentage": 35.12, "elapsed_time": "4:36:28", "remaining_time": "8:30:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 361, "total_steps": 1025, "loss": 0.1408, "learning_rate": 3.85561216961312e-06, "epoch": 0.3521521765638337, "percentage": 35.22, "elapsed_time": "4:37:16", "remaining_time": "8:29:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 362, "total_steps": 1025, "loss": 0.147, "learning_rate": 3.8488229195785965e-06, "epoch": 0.3531276673576393, "percentage": 35.32, "elapsed_time": "4:37:59", "remaining_time": "8:29:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 363, "total_steps": 1025, "loss": 0.1446, "learning_rate": 3.842019608142068e-06, "epoch": 0.35410315815144494, "percentage": 35.41, "elapsed_time": "4:38:48", "remaining_time": "8:28:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 364, "total_steps": 1025, "loss": 0.1484, "learning_rate": 3.83520230622767e-06, "epoch": 0.3550786489452506, "percentage": 35.51, "elapsed_time": "4:39:38", "remaining_time": "8:27:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 365, "total_steps": 1025, "loss": 0.1415, "learning_rate": 3.8283710849053835e-06, "epoch": 0.3560541397390562, "percentage": 35.61, "elapsed_time": "4:40:25", "remaining_time": "8:27:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 366, "total_steps": 1025, "loss": 0.1386, "learning_rate": 3.821526015390302e-06, "epoch": 0.35702963053286185, "percentage": 35.71, "elapsed_time": "4:41:11", "remaining_time": "8:26:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 367, "total_steps": 1025, "loss": 0.156, "learning_rate": 3.814667169041887e-06, "epoch": 0.35800512132666745, "percentage": 35.8, "elapsed_time": "4:41:59", "remaining_time": "8:25:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 368, "total_steps": 1025, "loss": 0.1351, "learning_rate": 3.8077946173632175e-06, "epoch": 0.3589806121204731, "percentage": 35.9, "elapsed_time": "4:42:45", "remaining_time": "8:24:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 369, "total_steps": 1025, "loss": 0.1427, "learning_rate": 3.800908432000254e-06, "epoch": 0.35995610291427876, "percentage": 36.0, "elapsed_time": "4:43:32", "remaining_time": "8:24:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 370, "total_steps": 1025, "loss": 0.1516, "learning_rate": 3.7940086847410875e-06, "epoch": 0.36093159370808436, "percentage": 36.1, "elapsed_time": "4:44:18", "remaining_time": "8:23:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 371, "total_steps": 1025, "loss": 0.1453, "learning_rate": 3.7870954475151873e-06, "epoch": 0.36190708450189, "percentage": 36.2, "elapsed_time": "4:45:06", "remaining_time": "8:22:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 372, "total_steps": 1025, "loss": 0.1403, "learning_rate": 3.780168792392658e-06, "epoch": 0.3628825752956956, "percentage": 36.29, "elapsed_time": "4:45:52", "remaining_time": "8:21:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 373, "total_steps": 1025, "loss": 0.1344, "learning_rate": 3.7732287915834842e-06, "epoch": 0.3638580660895013, "percentage": 36.39, "elapsed_time": "4:46:35", "remaining_time": "8:20:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 374, "total_steps": 1025, "loss": 0.1473, "learning_rate": 3.766275517436779e-06, "epoch": 0.36483355688330693, "percentage": 36.49, "elapsed_time": "4:47:22", "remaining_time": "8:20:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 375, "total_steps": 1025, "loss": 0.1626, "learning_rate": 3.759309042440028e-06, "epoch": 0.36580904767711253, "percentage": 36.59, "elapsed_time": "4:48:11", "remaining_time": "8:19:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 376, "total_steps": 1025, "loss": 0.1437, "learning_rate": 3.752329439218337e-06, "epoch": 0.3667845384709182, "percentage": 36.68, "elapsed_time": "4:48:56", "remaining_time": "8:18:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 377, "total_steps": 1025, "loss": 0.1411, "learning_rate": 3.7453367805336697e-06, "epoch": 0.3677600292647238, "percentage": 36.78, "elapsed_time": "4:49:41", "remaining_time": "8:17:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 378, "total_steps": 1025, "loss": 0.1462, "learning_rate": 3.738331139284096e-06, "epoch": 0.36873552005852944, "percentage": 36.88, "elapsed_time": "4:50:28", "remaining_time": "8:17:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 379, "total_steps": 1025, "loss": 0.1525, "learning_rate": 3.731312588503024e-06, "epoch": 0.3697110108523351, "percentage": 36.98, "elapsed_time": "4:51:16", "remaining_time": "8:16:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 380, "total_steps": 1025, "loss": 0.1509, "learning_rate": 3.7242812013584474e-06, "epoch": 0.3706865016461407, "percentage": 37.07, "elapsed_time": "4:52:03", "remaining_time": "8:15:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 381, "total_steps": 1025, "loss": 0.1433, "learning_rate": 3.717237051152175e-06, "epoch": 0.37166199243994635, "percentage": 37.17, "elapsed_time": "4:52:49", "remaining_time": "8:14:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 382, "total_steps": 1025, "loss": 0.1486, "learning_rate": 3.710180211319071e-06, "epoch": 0.37263748323375195, "percentage": 37.27, "elapsed_time": "4:53:36", "remaining_time": "8:14:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 383, "total_steps": 1025, "loss": 0.139, "learning_rate": 3.703110755426289e-06, "epoch": 0.3736129740275576, "percentage": 37.37, "elapsed_time": "4:54:25", "remaining_time": "8:13:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 384, "total_steps": 1025, "loss": 0.1521, "learning_rate": 3.696028757172503e-06, "epoch": 0.37458846482136327, "percentage": 37.46, "elapsed_time": "4:55:12", "remaining_time": "8:12:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 385, "total_steps": 1025, "loss": 0.146, "learning_rate": 3.68893429038714e-06, "epoch": 0.37556395561516887, "percentage": 37.56, "elapsed_time": "4:55:57", "remaining_time": "8:11:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 386, "total_steps": 1025, "loss": 0.1431, "learning_rate": 3.681827429029613e-06, "epoch": 0.3765394464089745, "percentage": 37.66, "elapsed_time": "4:56:44", "remaining_time": "8:11:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 387, "total_steps": 1025, "loss": 0.1484, "learning_rate": 3.6747082471885454e-06, "epoch": 0.3775149372027802, "percentage": 37.76, "elapsed_time": "4:57:31", "remaining_time": "8:10:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 388, "total_steps": 1025, "loss": 0.1405, "learning_rate": 3.6675768190810023e-06, "epoch": 0.3784904279965858, "percentage": 37.85, "elapsed_time": "4:58:17", "remaining_time": "8:09:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 389, "total_steps": 1025, "loss": 0.1461, "learning_rate": 3.6604332190517144e-06, "epoch": 0.37946591879039143, "percentage": 37.95, "elapsed_time": "4:59:03", "remaining_time": "8:08:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 390, "total_steps": 1025, "loss": 0.15, "learning_rate": 3.653277521572305e-06, "epoch": 0.38044140958419703, "percentage": 38.05, "elapsed_time": "4:59:49", "remaining_time": "8:08:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 391, "total_steps": 1025, "loss": 0.1446, "learning_rate": 3.6461098012405116e-06, "epoch": 0.3814169003780027, "percentage": 38.15, "elapsed_time": "5:00:37", "remaining_time": "8:07:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 392, "total_steps": 1025, "loss": 0.1671, "learning_rate": 3.6389301327794114e-06, "epoch": 0.38239239117180834, "percentage": 38.24, "elapsed_time": "5:01:25", "remaining_time": "8:06:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 393, "total_steps": 1025, "loss": 0.1476, "learning_rate": 3.6317385910366365e-06, "epoch": 0.38336788196561394, "percentage": 38.34, "elapsed_time": "5:02:14", "remaining_time": "8:06:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 394, "total_steps": 1025, "loss": 0.153, "learning_rate": 3.624535250983601e-06, "epoch": 0.3843433727594196, "percentage": 38.44, "elapsed_time": "5:03:02", "remaining_time": "8:05:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 395, "total_steps": 1025, "loss": 0.1456, "learning_rate": 3.6173201877147134e-06, "epoch": 0.3853188635532252, "percentage": 38.54, "elapsed_time": "5:03:47", "remaining_time": "8:04:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 396, "total_steps": 1025, "loss": 0.1413, "learning_rate": 3.6100934764465973e-06, "epoch": 0.38629435434703085, "percentage": 38.63, "elapsed_time": "5:04:34", "remaining_time": "8:03:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 397, "total_steps": 1025, "loss": 0.1512, "learning_rate": 3.6028551925173046e-06, "epoch": 0.3872698451408365, "percentage": 38.73, "elapsed_time": "5:05:20", "remaining_time": "8:03:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 398, "total_steps": 1025, "loss": 0.1428, "learning_rate": 3.595605411385533e-06, "epoch": 0.3882453359346421, "percentage": 38.83, "elapsed_time": "5:06:08", "remaining_time": "8:02:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 399, "total_steps": 1025, "loss": 0.1481, "learning_rate": 3.5883442086298375e-06, "epoch": 0.38922082672844777, "percentage": 38.93, "elapsed_time": "5:06:57", "remaining_time": "8:01:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 400, "total_steps": 1025, "loss": 0.1394, "learning_rate": 3.581071659947842e-06, "epoch": 0.39019631752225337, "percentage": 39.02, "elapsed_time": "5:07:42", "remaining_time": "8:00:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 401, "total_steps": 1025, "loss": 0.1396, "learning_rate": 3.5737878411554515e-06, "epoch": 0.391171808316059, "percentage": 39.12, "elapsed_time": "5:08:30", "remaining_time": "8:00:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 402, "total_steps": 1025, "loss": 0.1457, "learning_rate": 3.566492828186063e-06, "epoch": 0.3921472991098647, "percentage": 39.22, "elapsed_time": "5:09:16", "remaining_time": "7:59:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 403, "total_steps": 1025, "loss": 0.1428, "learning_rate": 3.5591866970897695e-06, "epoch": 0.3931227899036703, "percentage": 39.32, "elapsed_time": "5:10:02", "remaining_time": "7:58:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 404, "total_steps": 1025, "loss": 0.1459, "learning_rate": 3.55186952403257e-06, "epoch": 0.39409828069747593, "percentage": 39.41, "elapsed_time": "5:10:49", "remaining_time": "7:57:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 405, "total_steps": 1025, "loss": 0.1405, "learning_rate": 3.5445413852955783e-06, "epoch": 0.39507377149128153, "percentage": 39.51, "elapsed_time": "5:11:35", "remaining_time": "7:57:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 406, "total_steps": 1025, "loss": 0.144, "learning_rate": 3.5372023572742224e-06, "epoch": 0.3960492622850872, "percentage": 39.61, "elapsed_time": "5:12:23", "remaining_time": "7:56:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 407, "total_steps": 1025, "loss": 0.152, "learning_rate": 3.52985251647745e-06, "epoch": 0.39702475307889284, "percentage": 39.71, "elapsed_time": "5:13:07", "remaining_time": "7:55:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 408, "total_steps": 1025, "loss": 0.1527, "learning_rate": 3.522491939526932e-06, "epoch": 0.39800024387269844, "percentage": 39.8, "elapsed_time": "5:13:54", "remaining_time": "7:54:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 409, "total_steps": 1025, "loss": 0.1546, "learning_rate": 3.515120703156264e-06, "epoch": 0.3989757346665041, "percentage": 39.9, "elapsed_time": "5:14:40", "remaining_time": "7:53:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 410, "total_steps": 1025, "loss": 0.1397, "learning_rate": 3.507738884210164e-06, "epoch": 0.3999512254603097, "percentage": 40.0, "elapsed_time": "5:15:26", "remaining_time": "7:53:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 411, "total_steps": 1025, "loss": 0.1435, "learning_rate": 3.500346559643675e-06, "epoch": 0.40092671625411536, "percentage": 40.1, "elapsed_time": "5:16:13", "remaining_time": "7:52:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 412, "total_steps": 1025, "loss": 0.147, "learning_rate": 3.4929438065213568e-06, "epoch": 0.401902207047921, "percentage": 40.2, "elapsed_time": "5:17:01", "remaining_time": "7:51:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 413, "total_steps": 1025, "loss": 0.1558, "learning_rate": 3.48553070201649e-06, "epoch": 0.4028776978417266, "percentage": 40.29, "elapsed_time": "5:17:49", "remaining_time": "7:50:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 414, "total_steps": 1025, "loss": 0.1449, "learning_rate": 3.4781073234102665e-06, "epoch": 0.40385318863553227, "percentage": 40.39, "elapsed_time": "5:18:37", "remaining_time": "7:50:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 415, "total_steps": 1025, "loss": 0.1396, "learning_rate": 3.470673748090984e-06, "epoch": 0.40482867942933787, "percentage": 40.49, "elapsed_time": "5:19:25", "remaining_time": "7:49:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 416, "total_steps": 1025, "loss": 0.1427, "learning_rate": 3.4632300535532415e-06, "epoch": 0.4058041702231435, "percentage": 40.59, "elapsed_time": "5:20:10", "remaining_time": "7:48:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 417, "total_steps": 1025, "loss": 0.1449, "learning_rate": 3.4557763173971293e-06, "epoch": 0.4067796610169492, "percentage": 40.68, "elapsed_time": "5:20:55", "remaining_time": "7:47:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 418, "total_steps": 1025, "loss": 0.1473, "learning_rate": 3.4483126173274227e-06, "epoch": 0.4077551518107548, "percentage": 40.78, "elapsed_time": "5:21:38", "remaining_time": "7:47:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 419, "total_steps": 1025, "loss": 0.1432, "learning_rate": 3.440839031152769e-06, "epoch": 0.40873064260456043, "percentage": 40.88, "elapsed_time": "5:22:26", "remaining_time": "7:46:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 420, "total_steps": 1025, "loss": 0.1356, "learning_rate": 3.4333556367848773e-06, "epoch": 0.40970613339836603, "percentage": 40.98, "elapsed_time": "5:23:13", "remaining_time": "7:45:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 421, "total_steps": 1025, "loss": 0.1414, "learning_rate": 3.425862512237708e-06, "epoch": 0.4106816241921717, "percentage": 41.07, "elapsed_time": "5:23:54", "remaining_time": "7:44:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 422, "total_steps": 1025, "loss": 0.144, "learning_rate": 3.418359735626656e-06, "epoch": 0.41165711498597735, "percentage": 41.17, "elapsed_time": "5:24:40", "remaining_time": "7:43:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 423, "total_steps": 1025, "loss": 0.1413, "learning_rate": 3.4108473851677408e-06, "epoch": 0.41263260577978295, "percentage": 41.27, "elapsed_time": "5:25:23", "remaining_time": "7:43:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 424, "total_steps": 1025, "loss": 0.1492, "learning_rate": 3.4033255391767865e-06, "epoch": 0.4136080965735886, "percentage": 41.37, "elapsed_time": "5:26:13", "remaining_time": "7:42:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 425, "total_steps": 1025, "loss": 0.1452, "learning_rate": 3.395794276068609e-06, "epoch": 0.4145835873673942, "percentage": 41.46, "elapsed_time": "5:26:59", "remaining_time": "7:41:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 426, "total_steps": 1025, "loss": 0.1415, "learning_rate": 3.388253674356196e-06, "epoch": 0.41555907816119986, "percentage": 41.56, "elapsed_time": "5:27:46", "remaining_time": "7:40:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 427, "total_steps": 1025, "loss": 0.1403, "learning_rate": 3.380703812649891e-06, "epoch": 0.4165345689550055, "percentage": 41.66, "elapsed_time": "5:28:30", "remaining_time": "7:40:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 428, "total_steps": 1025, "loss": 0.1455, "learning_rate": 3.3731447696565713e-06, "epoch": 0.4175100597488111, "percentage": 41.76, "elapsed_time": "5:29:19", "remaining_time": "7:39:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 429, "total_steps": 1025, "loss": 0.1368, "learning_rate": 3.3655766241788285e-06, "epoch": 0.41848555054261677, "percentage": 41.85, "elapsed_time": "5:30:04", "remaining_time": "7:38:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 430, "total_steps": 1025, "loss": 0.1446, "learning_rate": 3.357999455114148e-06, "epoch": 0.41946104133642237, "percentage": 41.95, "elapsed_time": "5:30:53", "remaining_time": "7:37:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 431, "total_steps": 1025, "loss": 0.1506, "learning_rate": 3.350413341454086e-06, "epoch": 0.420436532130228, "percentage": 42.05, "elapsed_time": "5:31:37", "remaining_time": "7:37:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 432, "total_steps": 1025, "loss": 0.1513, "learning_rate": 3.3428183622834442e-06, "epoch": 0.4214120229240337, "percentage": 42.15, "elapsed_time": "5:32:26", "remaining_time": "7:36:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 433, "total_steps": 1025, "loss": 0.1403, "learning_rate": 3.3352145967794463e-06, "epoch": 0.4223875137178393, "percentage": 42.24, "elapsed_time": "5:33:13", "remaining_time": "7:35:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 434, "total_steps": 1025, "loss": 0.1411, "learning_rate": 3.3276021242109152e-06, "epoch": 0.42336300451164494, "percentage": 42.34, "elapsed_time": "5:34:01", "remaining_time": "7:34:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 435, "total_steps": 1025, "loss": 0.1508, "learning_rate": 3.319981023937442e-06, "epoch": 0.42433849530545054, "percentage": 42.44, "elapsed_time": "5:34:52", "remaining_time": "7:34:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 436, "total_steps": 1025, "loss": 0.1412, "learning_rate": 3.3123513754085635e-06, "epoch": 0.4253139860992562, "percentage": 42.54, "elapsed_time": "5:35:41", "remaining_time": "7:33:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 437, "total_steps": 1025, "loss": 0.1356, "learning_rate": 3.3047132581629297e-06, "epoch": 0.42628947689306185, "percentage": 42.63, "elapsed_time": "5:36:26", "remaining_time": "7:32:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 438, "total_steps": 1025, "loss": 0.1364, "learning_rate": 3.297066751827478e-06, "epoch": 0.42726496768686745, "percentage": 42.73, "elapsed_time": "5:37:14", "remaining_time": "7:31:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 439, "total_steps": 1025, "loss": 0.1384, "learning_rate": 3.2894119361166e-06, "epoch": 0.4282404584806731, "percentage": 42.83, "elapsed_time": "5:38:03", "remaining_time": "7:31:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 440, "total_steps": 1025, "loss": 0.1407, "learning_rate": 3.2817488908313132e-06, "epoch": 0.4292159492744787, "percentage": 42.93, "elapsed_time": "5:38:46", "remaining_time": "7:30:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 441, "total_steps": 1025, "loss": 0.1511, "learning_rate": 3.274077695858428e-06, "epoch": 0.43019144006828436, "percentage": 43.02, "elapsed_time": "5:39:33", "remaining_time": "7:29:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 442, "total_steps": 1025, "loss": 0.1443, "learning_rate": 3.2663984311697137e-06, "epoch": 0.43116693086209, "percentage": 43.12, "elapsed_time": "5:40:20", "remaining_time": "7:28:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 443, "total_steps": 1025, "loss": 0.1522, "learning_rate": 3.2587111768210677e-06, "epoch": 0.4321424216558956, "percentage": 43.22, "elapsed_time": "5:41:07", "remaining_time": "7:28:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 444, "total_steps": 1025, "loss": 0.1376, "learning_rate": 3.251016012951678e-06, "epoch": 0.43311791244970127, "percentage": 43.32, "elapsed_time": "5:41:55", "remaining_time": "7:27:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 445, "total_steps": 1025, "loss": 0.141, "learning_rate": 3.2433130197831877e-06, "epoch": 0.43409340324350687, "percentage": 43.41, "elapsed_time": "5:42:38", "remaining_time": "7:26:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 446, "total_steps": 1025, "loss": 0.1394, "learning_rate": 3.2356022776188623e-06, "epoch": 0.4350688940373125, "percentage": 43.51, "elapsed_time": "5:43:28", "remaining_time": "7:25:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 447, "total_steps": 1025, "loss": 0.1384, "learning_rate": 3.227883866842749e-06, "epoch": 0.4360443848311182, "percentage": 43.61, "elapsed_time": "5:44:13", "remaining_time": "7:25:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 448, "total_steps": 1025, "loss": 0.1383, "learning_rate": 3.2201578679188396e-06, "epoch": 0.4370198756249238, "percentage": 43.71, "elapsed_time": "5:44:58", "remaining_time": "7:24:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 449, "total_steps": 1025, "loss": 0.1404, "learning_rate": 3.2124243613902316e-06, "epoch": 0.43799536641872944, "percentage": 43.8, "elapsed_time": "5:45:43", "remaining_time": "7:23:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 450, "total_steps": 1025, "loss": 0.1467, "learning_rate": 3.204683427878291e-06, "epoch": 0.43897085721253504, "percentage": 43.9, "elapsed_time": "5:46:30", "remaining_time": "7:22:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 451, "total_steps": 1025, "loss": 0.1446, "learning_rate": 3.196935148081808e-06, "epoch": 0.4399463480063407, "percentage": 44.0, "elapsed_time": "5:47:19", "remaining_time": "7:22:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 452, "total_steps": 1025, "loss": 0.1362, "learning_rate": 3.189179602776157e-06, "epoch": 0.44092183880014635, "percentage": 44.1, "elapsed_time": "5:48:04", "remaining_time": "7:21:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 453, "total_steps": 1025, "loss": 0.1381, "learning_rate": 3.181416872812455e-06, "epoch": 0.44189732959395195, "percentage": 44.2, "elapsed_time": "5:48:48", "remaining_time": "7:20:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 454, "total_steps": 1025, "loss": 0.1439, "learning_rate": 3.1736470391167195e-06, "epoch": 0.4428728203877576, "percentage": 44.29, "elapsed_time": "5:49:33", "remaining_time": "7:19:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 455, "total_steps": 1025, "loss": 0.1472, "learning_rate": 3.1658701826890237e-06, "epoch": 0.4438483111815632, "percentage": 44.39, "elapsed_time": "5:50:21", "remaining_time": "7:18:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 456, "total_steps": 1025, "loss": 0.1401, "learning_rate": 3.158086384602652e-06, "epoch": 0.44482380197536886, "percentage": 44.49, "elapsed_time": "5:51:06", "remaining_time": "7:18:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 457, "total_steps": 1025, "loss": 0.1527, "learning_rate": 3.150295726003256e-06, "epoch": 0.4457992927691745, "percentage": 44.59, "elapsed_time": "5:51:55", "remaining_time": "7:17:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 458, "total_steps": 1025, "loss": 0.1365, "learning_rate": 3.142498288108007e-06, "epoch": 0.4467747835629801, "percentage": 44.68, "elapsed_time": "5:52:40", "remaining_time": "7:16:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 459, "total_steps": 1025, "loss": 0.1405, "learning_rate": 3.13469415220475e-06, "epoch": 0.44775027435678577, "percentage": 44.78, "elapsed_time": "5:53:28", "remaining_time": "7:15:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 460, "total_steps": 1025, "loss": 0.1479, "learning_rate": 3.1268833996511584e-06, "epoch": 0.44872576515059137, "percentage": 44.88, "elapsed_time": "5:54:19", "remaining_time": "7:15:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 461, "total_steps": 1025, "loss": 0.1312, "learning_rate": 3.119066111873879e-06, "epoch": 0.449701255944397, "percentage": 44.98, "elapsed_time": "5:55:04", "remaining_time": "7:14:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 462, "total_steps": 1025, "loss": 0.1344, "learning_rate": 3.1112423703676937e-06, "epoch": 0.4506767467382027, "percentage": 45.07, "elapsed_time": "5:55:51", "remaining_time": "7:13:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 463, "total_steps": 1025, "loss": 0.1329, "learning_rate": 3.1034122566946596e-06, "epoch": 0.4516522375320083, "percentage": 45.17, "elapsed_time": "5:56:39", "remaining_time": "7:12:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 464, "total_steps": 1025, "loss": 0.1454, "learning_rate": 3.0955758524832663e-06, "epoch": 0.45262772832581394, "percentage": 45.27, "elapsed_time": "5:57:25", "remaining_time": "7:12:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 465, "total_steps": 1025, "loss": 0.1393, "learning_rate": 3.0877332394275806e-06, "epoch": 0.45360321911961954, "percentage": 45.37, "elapsed_time": "5:58:13", "remaining_time": "7:11:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 466, "total_steps": 1025, "loss": 0.1303, "learning_rate": 3.079884499286396e-06, "epoch": 0.4545787099134252, "percentage": 45.46, "elapsed_time": "5:58:58", "remaining_time": "7:10:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 467, "total_steps": 1025, "loss": 0.1369, "learning_rate": 3.0720297138823814e-06, "epoch": 0.45555420070723085, "percentage": 45.56, "elapsed_time": "5:59:46", "remaining_time": "7:09:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 468, "total_steps": 1025, "loss": 0.1418, "learning_rate": 3.0641689651012253e-06, "epoch": 0.45652969150103645, "percentage": 45.66, "elapsed_time": "6:00:32", "remaining_time": "7:09:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 469, "total_steps": 1025, "loss": 0.1377, "learning_rate": 3.056302334890786e-06, "epoch": 0.4575051822948421, "percentage": 45.76, "elapsed_time": "6:01:20", "remaining_time": "7:08:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 470, "total_steps": 1025, "loss": 0.1399, "learning_rate": 3.0484299052602355e-06, "epoch": 0.4584806730886477, "percentage": 45.85, "elapsed_time": "6:02:07", "remaining_time": "7:07:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 471, "total_steps": 1025, "loss": 0.1369, "learning_rate": 3.040551758279204e-06, "epoch": 0.45945616388245336, "percentage": 45.95, "elapsed_time": "6:02:54", "remaining_time": "7:06:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 472, "total_steps": 1025, "loss": 0.1473, "learning_rate": 3.032667976076923e-06, "epoch": 0.460431654676259, "percentage": 46.05, "elapsed_time": "6:03:43", "remaining_time": "7:06:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 473, "total_steps": 1025, "loss": 0.1492, "learning_rate": 3.0247786408413725e-06, "epoch": 0.4614071454700646, "percentage": 46.15, "elapsed_time": "6:04:28", "remaining_time": "7:05:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 474, "total_steps": 1025, "loss": 0.1429, "learning_rate": 3.0168838348184226e-06, "epoch": 0.4623826362638703, "percentage": 46.24, "elapsed_time": "6:05:15", "remaining_time": "7:04:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 475, "total_steps": 1025, "loss": 0.1239, "learning_rate": 3.008983640310976e-06, "epoch": 0.4633581270576759, "percentage": 46.34, "elapsed_time": "6:06:05", "remaining_time": "7:03:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 476, "total_steps": 1025, "loss": 0.1416, "learning_rate": 3.0010781396781104e-06, "epoch": 0.46433361785148153, "percentage": 46.44, "elapsed_time": "6:06:52", "remaining_time": "7:03:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 477, "total_steps": 1025, "loss": 0.147, "learning_rate": 2.993167415334218e-06, "epoch": 0.4653091086452872, "percentage": 46.54, "elapsed_time": "6:07:38", "remaining_time": "7:02:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 478, "total_steps": 1025, "loss": 0.149, "learning_rate": 2.9852515497481494e-06, "epoch": 0.4662845994390928, "percentage": 46.63, "elapsed_time": "6:08:24", "remaining_time": "7:01:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 479, "total_steps": 1025, "loss": 0.1331, "learning_rate": 2.977330625442352e-06, "epoch": 0.46726009023289844, "percentage": 46.73, "elapsed_time": "6:09:06", "remaining_time": "7:00:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 480, "total_steps": 1025, "loss": 0.1508, "learning_rate": 2.9694047249920095e-06, "epoch": 0.46823558102670404, "percentage": 46.83, "elapsed_time": "6:09:50", "remaining_time": "6:59:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 481, "total_steps": 1025, "loss": 0.1347, "learning_rate": 2.961473931024182e-06, "epoch": 0.4692110718205097, "percentage": 46.93, "elapsed_time": "6:10:32", "remaining_time": "6:59:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 482, "total_steps": 1025, "loss": 0.1386, "learning_rate": 2.953538326216944e-06, "epoch": 0.47018656261431535, "percentage": 47.02, "elapsed_time": "6:11:22", "remaining_time": "6:58:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 483, "total_steps": 1025, "loss": 0.1378, "learning_rate": 2.9455979932985237e-06, "epoch": 0.47116205340812095, "percentage": 47.12, "elapsed_time": "6:12:12", "remaining_time": "6:57:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 484, "total_steps": 1025, "loss": 0.1366, "learning_rate": 2.9376530150464388e-06, "epoch": 0.4721375442019266, "percentage": 47.22, "elapsed_time": "6:12:56", "remaining_time": "6:56:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 485, "total_steps": 1025, "loss": 0.1436, "learning_rate": 2.9297034742866336e-06, "epoch": 0.4731130349957322, "percentage": 47.32, "elapsed_time": "6:13:38", "remaining_time": "6:56:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 486, "total_steps": 1025, "loss": 0.1335, "learning_rate": 2.921749453892618e-06, "epoch": 0.47408852578953786, "percentage": 47.41, "elapsed_time": "6:14:22", "remaining_time": "6:55:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 487, "total_steps": 1025, "loss": 0.1311, "learning_rate": 2.913791036784601e-06, "epoch": 0.4750640165833435, "percentage": 47.51, "elapsed_time": "6:15:07", "remaining_time": "6:54:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 488, "total_steps": 1025, "loss": 0.1384, "learning_rate": 2.9058283059286275e-06, "epoch": 0.4760395073771491, "percentage": 47.61, "elapsed_time": "6:15:52", "remaining_time": "6:53:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 489, "total_steps": 1025, "loss": 0.1532, "learning_rate": 2.8978613443357107e-06, "epoch": 0.4770149981709548, "percentage": 47.71, "elapsed_time": "6:16:38", "remaining_time": "6:52:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 490, "total_steps": 1025, "loss": 0.1451, "learning_rate": 2.889890235060972e-06, "epoch": 0.4779904889647604, "percentage": 47.8, "elapsed_time": "6:17:21", "remaining_time": "6:52:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 491, "total_steps": 1025, "loss": 0.1478, "learning_rate": 2.88191506120277e-06, "epoch": 0.47896597975856603, "percentage": 47.9, "elapsed_time": "6:18:08", "remaining_time": "6:51:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 492, "total_steps": 1025, "loss": 0.1383, "learning_rate": 2.873935905901839e-06, "epoch": 0.4799414705523717, "percentage": 48.0, "elapsed_time": "6:18:57", "remaining_time": "6:50:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 493, "total_steps": 1025, "loss": 0.1414, "learning_rate": 2.865952852340417e-06, "epoch": 0.4809169613461773, "percentage": 48.1, "elapsed_time": "6:19:40", "remaining_time": "6:49:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 494, "total_steps": 1025, "loss": 0.1381, "learning_rate": 2.8579659837413816e-06, "epoch": 0.48189245213998294, "percentage": 48.2, "elapsed_time": "6:20:28", "remaining_time": "6:48:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 495, "total_steps": 1025, "loss": 0.1356, "learning_rate": 2.8499753833673827e-06, "epoch": 0.48286794293378854, "percentage": 48.29, "elapsed_time": "6:21:17", "remaining_time": "6:48:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 496, "total_steps": 1025, "loss": 0.1288, "learning_rate": 2.8419811345199736e-06, "epoch": 0.4838434337275942, "percentage": 48.39, "elapsed_time": "6:22:01", "remaining_time": "6:47:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 497, "total_steps": 1025, "loss": 0.1272, "learning_rate": 2.8339833205387434e-06, "epoch": 0.48481892452139985, "percentage": 48.49, "elapsed_time": "6:22:47", "remaining_time": "6:46:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 498, "total_steps": 1025, "loss": 0.136, "learning_rate": 2.825982024800445e-06, "epoch": 0.48579441531520545, "percentage": 48.59, "elapsed_time": "6:23:33", "remaining_time": "6:45:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 499, "total_steps": 1025, "loss": 0.1401, "learning_rate": 2.8179773307181307e-06, "epoch": 0.4867699061090111, "percentage": 48.68, "elapsed_time": "6:24:19", "remaining_time": "6:45:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 500, "total_steps": 1025, "loss": 0.1455, "learning_rate": 2.8099693217402807e-06, "epoch": 0.4877453969028167, "percentage": 48.78, "elapsed_time": "6:25:06", "remaining_time": "6:44:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 500, "total_steps": 1025, "eval_loss": 0.13670527935028076, "epoch": 0.4877453969028167, "percentage": 48.78, "elapsed_time": "6:27:07", "remaining_time": "6:46:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 501, "total_steps": 1025, "loss": 0.1443, "learning_rate": 2.8019580813499304e-06, "epoch": 0.48872088769662236, "percentage": 48.88, "elapsed_time": "6:27:52", "remaining_time": "6:45:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 502, "total_steps": 1025, "loss": 0.1382, "learning_rate": 2.793943693063805e-06, "epoch": 0.489696378490428, "percentage": 48.98, "elapsed_time": "6:28:36", "remaining_time": "6:44:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 503, "total_steps": 1025, "loss": 0.1226, "learning_rate": 2.7859262404314453e-06, "epoch": 0.4906718692842336, "percentage": 49.07, "elapsed_time": "6:29:23", "remaining_time": "6:44:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 504, "total_steps": 1025, "loss": 0.147, "learning_rate": 2.7779058070343367e-06, "epoch": 0.4916473600780393, "percentage": 49.17, "elapsed_time": "6:30:11", "remaining_time": "6:43:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 505, "total_steps": 1025, "loss": 0.1328, "learning_rate": 2.7698824764850406e-06, "epoch": 0.4926228508718449, "percentage": 49.27, "elapsed_time": "6:30:59", "remaining_time": "6:42:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 506, "total_steps": 1025, "loss": 0.1357, "learning_rate": 2.7618563324263208e-06, "epoch": 0.49359834166565053, "percentage": 49.37, "elapsed_time": "6:31:43", "remaining_time": "6:41:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 507, "total_steps": 1025, "loss": 0.1328, "learning_rate": 2.7538274585302707e-06, "epoch": 0.4945738324594562, "percentage": 49.46, "elapsed_time": "6:32:24", "remaining_time": "6:40:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 508, "total_steps": 1025, "loss": 0.1334, "learning_rate": 2.745795938497443e-06, "epoch": 0.4955493232532618, "percentage": 49.56, "elapsed_time": "6:33:10", "remaining_time": "6:40:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 509, "total_steps": 1025, "loss": 0.1355, "learning_rate": 2.737761856055975e-06, "epoch": 0.49652481404706744, "percentage": 49.66, "elapsed_time": "6:34:00", "remaining_time": "6:39:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 510, "total_steps": 1025, "loss": 0.1338, "learning_rate": 2.7297252949607195e-06, "epoch": 0.49750030484087304, "percentage": 49.76, "elapsed_time": "6:34:51", "remaining_time": "6:38:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 511, "total_steps": 1025, "loss": 0.1371, "learning_rate": 2.721686338992366e-06, "epoch": 0.4984757956346787, "percentage": 49.85, "elapsed_time": "6:35:34", "remaining_time": "6:37:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 512, "total_steps": 1025, "loss": 0.1246, "learning_rate": 2.7136450719565732e-06, "epoch": 0.49945128642848435, "percentage": 49.95, "elapsed_time": "6:36:19", "remaining_time": "6:37:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 513, "total_steps": 1025, "loss": 0.1227, "learning_rate": 2.7056015776830907e-06, "epoch": 0.50042677722229, "percentage": 50.05, "elapsed_time": "6:37:08", "remaining_time": "6:36:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 514, "total_steps": 1025, "loss": 0.1376, "learning_rate": 2.6975559400248876e-06, "epoch": 0.5014022680160956, "percentage": 50.15, "elapsed_time": "6:37:52", "remaining_time": "6:35:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 515, "total_steps": 1025, "loss": 0.1417, "learning_rate": 2.6895082428572777e-06, "epoch": 0.5023777588099012, "percentage": 50.24, "elapsed_time": "6:38:39", "remaining_time": "6:34:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 516, "total_steps": 1025, "loss": 0.1346, "learning_rate": 2.681458570077045e-06, "epoch": 0.5033532496037069, "percentage": 50.34, "elapsed_time": "6:39:26", "remaining_time": "6:34:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 517, "total_steps": 1025, "loss": 0.1457, "learning_rate": 2.673407005601569e-06, "epoch": 0.5043287403975125, "percentage": 50.44, "elapsed_time": "6:40:12", "remaining_time": "6:33:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 518, "total_steps": 1025, "loss": 0.1331, "learning_rate": 2.6653536333679504e-06, "epoch": 0.5053042311913182, "percentage": 50.54, "elapsed_time": "6:41:00", "remaining_time": "6:32:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 519, "total_steps": 1025, "loss": 0.1434, "learning_rate": 2.6572985373321344e-06, "epoch": 0.5062797219851237, "percentage": 50.63, "elapsed_time": "6:41:45", "remaining_time": "6:31:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 520, "total_steps": 1025, "loss": 0.1403, "learning_rate": 2.649241801468039e-06, "epoch": 0.5072552127789294, "percentage": 50.73, "elapsed_time": "6:42:32", "remaining_time": "6:30:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 521, "total_steps": 1025, "loss": 0.1309, "learning_rate": 2.641183509766675e-06, "epoch": 0.508230703572735, "percentage": 50.83, "elapsed_time": "6:43:15", "remaining_time": "6:30:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 522, "total_steps": 1025, "loss": 0.1434, "learning_rate": 2.633123746235274e-06, "epoch": 0.5092061943665407, "percentage": 50.93, "elapsed_time": "6:44:05", "remaining_time": "6:29:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 523, "total_steps": 1025, "loss": 0.1362, "learning_rate": 2.6250625948964125e-06, "epoch": 0.5101816851603463, "percentage": 51.02, "elapsed_time": "6:44:54", "remaining_time": "6:28:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 524, "total_steps": 1025, "loss": 0.1412, "learning_rate": 2.617000139787132e-06, "epoch": 0.5111571759541519, "percentage": 51.12, "elapsed_time": "6:45:39", "remaining_time": "6:27:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 525, "total_steps": 1025, "loss": 0.1471, "learning_rate": 2.608936464958068e-06, "epoch": 0.5121326667479575, "percentage": 51.22, "elapsed_time": "6:46:24", "remaining_time": "6:27:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 526, "total_steps": 1025, "loss": 0.1419, "learning_rate": 2.6008716544725692e-06, "epoch": 0.5131081575417632, "percentage": 51.32, "elapsed_time": "6:47:11", "remaining_time": "6:26:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 527, "total_steps": 1025, "loss": 0.1289, "learning_rate": 2.5928057924058264e-06, "epoch": 0.5140836483355689, "percentage": 51.41, "elapsed_time": "6:47:57", "remaining_time": "6:25:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 528, "total_steps": 1025, "loss": 0.1295, "learning_rate": 2.5847389628439905e-06, "epoch": 0.5150591391293745, "percentage": 51.51, "elapsed_time": "6:48:40", "remaining_time": "6:24:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 529, "total_steps": 1025, "loss": 0.1341, "learning_rate": 2.576671249883301e-06, "epoch": 0.51603462992318, "percentage": 51.61, "elapsed_time": "6:49:26", "remaining_time": "6:23:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 530, "total_steps": 1025, "loss": 0.1383, "learning_rate": 2.568602737629204e-06, "epoch": 0.5170101207169857, "percentage": 51.71, "elapsed_time": "6:50:11", "remaining_time": "6:23:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 531, "total_steps": 1025, "loss": 0.1395, "learning_rate": 2.5605335101954796e-06, "epoch": 0.5179856115107914, "percentage": 51.8, "elapsed_time": "6:51:00", "remaining_time": "6:22:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 532, "total_steps": 1025, "loss": 0.1391, "learning_rate": 2.552463651703365e-06, "epoch": 0.518961102304597, "percentage": 51.9, "elapsed_time": "6:51:46", "remaining_time": "6:21:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 533, "total_steps": 1025, "loss": 0.1345, "learning_rate": 2.5443932462806733e-06, "epoch": 0.5199365930984027, "percentage": 52.0, "elapsed_time": "6:52:31", "remaining_time": "6:20:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 534, "total_steps": 1025, "loss": 0.1303, "learning_rate": 2.5363223780609214e-06, "epoch": 0.5209120838922082, "percentage": 52.1, "elapsed_time": "6:53:16", "remaining_time": "6:19:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 535, "total_steps": 1025, "loss": 0.138, "learning_rate": 2.52825113118245e-06, "epoch": 0.5218875746860139, "percentage": 52.2, "elapsed_time": "6:54:04", "remaining_time": "6:19:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 536, "total_steps": 1025, "loss": 0.1419, "learning_rate": 2.520179589787547e-06, "epoch": 0.5228630654798195, "percentage": 52.29, "elapsed_time": "6:54:54", "remaining_time": "6:18:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 537, "total_steps": 1025, "loss": 0.1378, "learning_rate": 2.5121078380215713e-06, "epoch": 0.5238385562736252, "percentage": 52.39, "elapsed_time": "6:55:42", "remaining_time": "6:17:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 538, "total_steps": 1025, "loss": 0.1331, "learning_rate": 2.5040359600320747e-06, "epoch": 0.5248140470674308, "percentage": 52.49, "elapsed_time": "6:56:25", "remaining_time": "6:16:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 539, "total_steps": 1025, "loss": 0.143, "learning_rate": 2.4959640399679253e-06, "epoch": 0.5257895378612364, "percentage": 52.59, "elapsed_time": "6:57:11", "remaining_time": "6:16:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 540, "total_steps": 1025, "loss": 0.1337, "learning_rate": 2.4878921619784295e-06, "epoch": 0.526765028655042, "percentage": 52.68, "elapsed_time": "6:58:00", "remaining_time": "6:15:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 541, "total_steps": 1025, "loss": 0.1344, "learning_rate": 2.4798204102124533e-06, "epoch": 0.5277405194488477, "percentage": 52.78, "elapsed_time": "6:58:45", "remaining_time": "6:14:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 542, "total_steps": 1025, "loss": 0.1315, "learning_rate": 2.4717488688175513e-06, "epoch": 0.5287160102426534, "percentage": 52.88, "elapsed_time": "6:59:34", "remaining_time": "6:13:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 543, "total_steps": 1025, "loss": 0.1329, "learning_rate": 2.4636776219390794e-06, "epoch": 0.529691501036459, "percentage": 52.98, "elapsed_time": "7:00:15", "remaining_time": "6:13:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 544, "total_steps": 1025, "loss": 0.1338, "learning_rate": 2.4556067537193276e-06, "epoch": 0.5306669918302646, "percentage": 53.07, "elapsed_time": "7:01:01", "remaining_time": "6:12:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 545, "total_steps": 1025, "loss": 0.1362, "learning_rate": 2.4475363482966356e-06, "epoch": 0.5316424826240702, "percentage": 53.17, "elapsed_time": "7:01:46", "remaining_time": "6:11:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 546, "total_steps": 1025, "loss": 0.133, "learning_rate": 2.4394664898045208e-06, "epoch": 0.5326179734178759, "percentage": 53.27, "elapsed_time": "7:02:32", "remaining_time": "6:10:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 547, "total_steps": 1025, "loss": 0.1343, "learning_rate": 2.4313972623707964e-06, "epoch": 0.5335934642116815, "percentage": 53.37, "elapsed_time": "7:03:18", "remaining_time": "6:09:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 548, "total_steps": 1025, "loss": 0.1318, "learning_rate": 2.4233287501167e-06, "epoch": 0.5345689550054872, "percentage": 53.46, "elapsed_time": "7:04:07", "remaining_time": "6:09:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 549, "total_steps": 1025, "loss": 0.141, "learning_rate": 2.4152610371560095e-06, "epoch": 0.5355444457992927, "percentage": 53.56, "elapsed_time": "7:04:55", "remaining_time": "6:08:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 550, "total_steps": 1025, "loss": 0.1329, "learning_rate": 2.4071942075941744e-06, "epoch": 0.5365199365930984, "percentage": 53.66, "elapsed_time": "7:05:44", "remaining_time": "6:07:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 551, "total_steps": 1025, "loss": 0.1288, "learning_rate": 2.3991283455274316e-06, "epoch": 0.537495427386904, "percentage": 53.76, "elapsed_time": "7:06:30", "remaining_time": "6:06:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 552, "total_steps": 1025, "loss": 0.1322, "learning_rate": 2.391063535041933e-06, "epoch": 0.5384709181807097, "percentage": 53.85, "elapsed_time": "7:07:14", "remaining_time": "6:06:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 553, "total_steps": 1025, "loss": 0.1239, "learning_rate": 2.3829998602128685e-06, "epoch": 0.5394464089745153, "percentage": 53.95, "elapsed_time": "7:08:02", "remaining_time": "6:05:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 554, "total_steps": 1025, "loss": 0.1308, "learning_rate": 2.3749374051035883e-06, "epoch": 0.5404218997683209, "percentage": 54.05, "elapsed_time": "7:08:50", "remaining_time": "6:04:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 555, "total_steps": 1025, "loss": 0.1377, "learning_rate": 2.3668762537647254e-06, "epoch": 0.5413973905621265, "percentage": 54.15, "elapsed_time": "7:09:37", "remaining_time": "6:03:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 556, "total_steps": 1025, "loss": 0.127, "learning_rate": 2.358816490233326e-06, "epoch": 0.5423728813559322, "percentage": 54.24, "elapsed_time": "7:10:24", "remaining_time": "6:03:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 557, "total_steps": 1025, "loss": 0.1212, "learning_rate": 2.3507581985319623e-06, "epoch": 0.5433483721497379, "percentage": 54.34, "elapsed_time": "7:11:09", "remaining_time": "6:02:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 558, "total_steps": 1025, "loss": 0.1401, "learning_rate": 2.342701462667866e-06, "epoch": 0.5443238629435435, "percentage": 54.44, "elapsed_time": "7:11:56", "remaining_time": "6:01:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 559, "total_steps": 1025, "loss": 0.1323, "learning_rate": 2.3346463666320512e-06, "epoch": 0.5452993537373491, "percentage": 54.54, "elapsed_time": "7:12:41", "remaining_time": "6:00:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 560, "total_steps": 1025, "loss": 0.1361, "learning_rate": 2.3265929943984317e-06, "epoch": 0.5462748445311547, "percentage": 54.63, "elapsed_time": "7:13:27", "remaining_time": "5:59:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 561, "total_steps": 1025, "loss": 0.1363, "learning_rate": 2.318541429922956e-06, "epoch": 0.5472503353249604, "percentage": 54.73, "elapsed_time": "7:14:12", "remaining_time": "5:59:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 562, "total_steps": 1025, "loss": 0.1414, "learning_rate": 2.310491757142723e-06, "epoch": 0.548225826118766, "percentage": 54.83, "elapsed_time": "7:14:57", "remaining_time": "5:58:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 563, "total_steps": 1025, "loss": 0.1338, "learning_rate": 2.3024440599751132e-06, "epoch": 0.5492013169125717, "percentage": 54.93, "elapsed_time": "7:15:46", "remaining_time": "5:57:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 564, "total_steps": 1025, "loss": 0.128, "learning_rate": 2.29439842231691e-06, "epoch": 0.5501768077063772, "percentage": 55.02, "elapsed_time": "7:16:30", "remaining_time": "5:56:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 565, "total_steps": 1025, "loss": 0.1378, "learning_rate": 2.2863549280434285e-06, "epoch": 0.5511522985001829, "percentage": 55.12, "elapsed_time": "7:17:14", "remaining_time": "5:55:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 566, "total_steps": 1025, "loss": 0.1302, "learning_rate": 2.2783136610076345e-06, "epoch": 0.5521277892939885, "percentage": 55.22, "elapsed_time": "7:18:02", "remaining_time": "5:55:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 567, "total_steps": 1025, "loss": 0.1371, "learning_rate": 2.270274705039282e-06, "epoch": 0.5531032800877942, "percentage": 55.32, "elapsed_time": "7:18:46", "remaining_time": "5:54:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 568, "total_steps": 1025, "loss": 0.1435, "learning_rate": 2.2622381439440255e-06, "epoch": 0.5540787708815998, "percentage": 55.41, "elapsed_time": "7:19:34", "remaining_time": "5:53:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 569, "total_steps": 1025, "loss": 0.1219, "learning_rate": 2.2542040615025584e-06, "epoch": 0.5550542616754054, "percentage": 55.51, "elapsed_time": "7:20:20", "remaining_time": "5:52:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 570, "total_steps": 1025, "loss": 0.1292, "learning_rate": 2.24617254146973e-06, "epoch": 0.556029752469211, "percentage": 55.61, "elapsed_time": "7:21:03", "remaining_time": "5:52:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 571, "total_steps": 1025, "loss": 0.1393, "learning_rate": 2.23814366757368e-06, "epoch": 0.5570052432630167, "percentage": 55.71, "elapsed_time": "7:21:53", "remaining_time": "5:51:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 572, "total_steps": 1025, "loss": 0.1235, "learning_rate": 2.23011752351496e-06, "epoch": 0.5579807340568224, "percentage": 55.8, "elapsed_time": "7:22:38", "remaining_time": "5:50:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 573, "total_steps": 1025, "loss": 0.1275, "learning_rate": 2.222094192965664e-06, "epoch": 0.558956224850628, "percentage": 55.9, "elapsed_time": "7:23:23", "remaining_time": "5:49:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 574, "total_steps": 1025, "loss": 0.1383, "learning_rate": 2.214073759568555e-06, "epoch": 0.5599317156444336, "percentage": 56.0, "elapsed_time": "7:24:07", "remaining_time": "5:48:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 575, "total_steps": 1025, "loss": 0.1221, "learning_rate": 2.2060563069361955e-06, "epoch": 0.5609072064382392, "percentage": 56.1, "elapsed_time": "7:24:52", "remaining_time": "5:48:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 576, "total_steps": 1025, "loss": 0.1203, "learning_rate": 2.19804191865007e-06, "epoch": 0.5618826972320449, "percentage": 56.2, "elapsed_time": "7:25:40", "remaining_time": "5:47:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 577, "total_steps": 1025, "loss": 0.127, "learning_rate": 2.19003067825972e-06, "epoch": 0.5628581880258505, "percentage": 56.29, "elapsed_time": "7:26:27", "remaining_time": "5:46:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 578, "total_steps": 1025, "loss": 0.1294, "learning_rate": 2.1820226692818693e-06, "epoch": 0.5638336788196562, "percentage": 56.39, "elapsed_time": "7:27:16", "remaining_time": "5:45:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 579, "total_steps": 1025, "loss": 0.1418, "learning_rate": 2.174017975199556e-06, "epoch": 0.5648091696134617, "percentage": 56.49, "elapsed_time": "7:28:02", "remaining_time": "5:45:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 580, "total_steps": 1025, "loss": 0.1549, "learning_rate": 2.1660166794612574e-06, "epoch": 0.5657846604072674, "percentage": 56.59, "elapsed_time": "7:28:44", "remaining_time": "5:44:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 581, "total_steps": 1025, "loss": 0.1339, "learning_rate": 2.158018865480027e-06, "epoch": 0.566760151201073, "percentage": 56.68, "elapsed_time": "7:29:34", "remaining_time": "5:43:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 582, "total_steps": 1025, "loss": 0.138, "learning_rate": 2.1500246166326177e-06, "epoch": 0.5677356419948787, "percentage": 56.78, "elapsed_time": "7:30:19", "remaining_time": "5:42:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 583, "total_steps": 1025, "loss": 0.1273, "learning_rate": 2.1420340162586196e-06, "epoch": 0.5687111327886843, "percentage": 56.88, "elapsed_time": "7:31:03", "remaining_time": "5:41:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 584, "total_steps": 1025, "loss": 0.1325, "learning_rate": 2.1340471476595836e-06, "epoch": 0.5696866235824899, "percentage": 56.98, "elapsed_time": "7:31:49", "remaining_time": "5:41:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 585, "total_steps": 1025, "loss": 0.1373, "learning_rate": 2.1260640940981616e-06, "epoch": 0.5706621143762955, "percentage": 57.07, "elapsed_time": "7:32:35", "remaining_time": "5:40:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 586, "total_steps": 1025, "loss": 0.1314, "learning_rate": 2.11808493879723e-06, "epoch": 0.5716376051701012, "percentage": 57.17, "elapsed_time": "7:33:25", "remaining_time": "5:39:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 587, "total_steps": 1025, "loss": 0.1273, "learning_rate": 2.110109764939029e-06, "epoch": 0.5726130959639069, "percentage": 57.27, "elapsed_time": "7:34:11", "remaining_time": "5:38:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 588, "total_steps": 1025, "loss": 0.1292, "learning_rate": 2.10213865566429e-06, "epoch": 0.5735885867577125, "percentage": 57.37, "elapsed_time": "7:34:56", "remaining_time": "5:38:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 589, "total_steps": 1025, "loss": 0.136, "learning_rate": 2.0941716940713733e-06, "epoch": 0.5745640775515181, "percentage": 57.46, "elapsed_time": "7:35:45", "remaining_time": "5:37:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 590, "total_steps": 1025, "loss": 0.1219, "learning_rate": 2.086208963215399e-06, "epoch": 0.5755395683453237, "percentage": 57.56, "elapsed_time": "7:36:31", "remaining_time": "5:36:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 591, "total_steps": 1025, "loss": 0.1272, "learning_rate": 2.0782505461073822e-06, "epoch": 0.5765150591391294, "percentage": 57.66, "elapsed_time": "7:37:12", "remaining_time": "5:35:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 592, "total_steps": 1025, "loss": 0.1211, "learning_rate": 2.0702965257133664e-06, "epoch": 0.577490549932935, "percentage": 57.76, "elapsed_time": "7:37:57", "remaining_time": "5:34:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 593, "total_steps": 1025, "loss": 0.1229, "learning_rate": 2.062346984953562e-06, "epoch": 0.5784660407267407, "percentage": 57.85, "elapsed_time": "7:38:39", "remaining_time": "5:34:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 594, "total_steps": 1025, "loss": 0.1383, "learning_rate": 2.0544020067014776e-06, "epoch": 0.5794415315205462, "percentage": 57.95, "elapsed_time": "7:39:26", "remaining_time": "5:33:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 595, "total_steps": 1025, "loss": 0.1337, "learning_rate": 2.0464616737830566e-06, "epoch": 0.5804170223143519, "percentage": 58.05, "elapsed_time": "7:40:12", "remaining_time": "5:32:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 596, "total_steps": 1025, "loss": 0.1244, "learning_rate": 2.03852606897582e-06, "epoch": 0.5813925131081575, "percentage": 58.15, "elapsed_time": "7:41:00", "remaining_time": "5:31:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 597, "total_steps": 1025, "loss": 0.1324, "learning_rate": 2.0305952750079918e-06, "epoch": 0.5823680039019632, "percentage": 58.24, "elapsed_time": "7:41:47", "remaining_time": "5:31:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 598, "total_steps": 1025, "loss": 0.136, "learning_rate": 2.0226693745576494e-06, "epoch": 0.5833434946957688, "percentage": 58.34, "elapsed_time": "7:42:31", "remaining_time": "5:30:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 599, "total_steps": 1025, "loss": 0.1286, "learning_rate": 2.0147484502518514e-06, "epoch": 0.5843189854895744, "percentage": 58.44, "elapsed_time": "7:43:17", "remaining_time": "5:29:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 600, "total_steps": 1025, "loss": 0.132, "learning_rate": 2.006832584665783e-06, "epoch": 0.58529447628338, "percentage": 58.54, "elapsed_time": "7:44:05", "remaining_time": "5:28:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 601, "total_steps": 1025, "loss": 0.1151, "learning_rate": 1.99892186032189e-06, "epoch": 0.5862699670771857, "percentage": 58.63, "elapsed_time": "7:44:47", "remaining_time": "5:27:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 602, "total_steps": 1025, "loss": 0.1288, "learning_rate": 1.9910163596890247e-06, "epoch": 0.5872454578709914, "percentage": 58.73, "elapsed_time": "7:45:31", "remaining_time": "5:27:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 603, "total_steps": 1025, "loss": 0.1239, "learning_rate": 1.983116165181578e-06, "epoch": 0.588220948664797, "percentage": 58.83, "elapsed_time": "7:46:20", "remaining_time": "5:26:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 604, "total_steps": 1025, "loss": 0.1276, "learning_rate": 1.9752213591586288e-06, "epoch": 0.5891964394586026, "percentage": 58.93, "elapsed_time": "7:47:03", "remaining_time": "5:25:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 605, "total_steps": 1025, "loss": 0.1305, "learning_rate": 1.9673320239230783e-06, "epoch": 0.5901719302524082, "percentage": 59.02, "elapsed_time": "7:47:49", "remaining_time": "5:24:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 606, "total_steps": 1025, "loss": 0.1261, "learning_rate": 1.9594482417207973e-06, "epoch": 0.5911474210462139, "percentage": 59.12, "elapsed_time": "7:48:39", "remaining_time": "5:24:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 607, "total_steps": 1025, "loss": 0.1211, "learning_rate": 1.951570094739765e-06, "epoch": 0.5921229118400195, "percentage": 59.22, "elapsed_time": "7:49:26", "remaining_time": "5:23:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 608, "total_steps": 1025, "loss": 0.1382, "learning_rate": 1.9436976651092143e-06, "epoch": 0.5930984026338252, "percentage": 59.32, "elapsed_time": "7:50:14", "remaining_time": "5:22:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 609, "total_steps": 1025, "loss": 0.1273, "learning_rate": 1.9358310348987755e-06, "epoch": 0.5940738934276307, "percentage": 59.41, "elapsed_time": "7:50:59", "remaining_time": "5:21:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 610, "total_steps": 1025, "loss": 0.1342, "learning_rate": 1.9279702861176203e-06, "epoch": 0.5950493842214364, "percentage": 59.51, "elapsed_time": "7:51:46", "remaining_time": "5:20:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 611, "total_steps": 1025, "loss": 0.1365, "learning_rate": 1.9201155007136045e-06, "epoch": 0.596024875015242, "percentage": 59.61, "elapsed_time": "7:52:27", "remaining_time": "5:20:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 612, "total_steps": 1025, "loss": 0.1348, "learning_rate": 1.9122667605724202e-06, "epoch": 0.5970003658090477, "percentage": 59.71, "elapsed_time": "7:53:12", "remaining_time": "5:19:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 613, "total_steps": 1025, "loss": 0.1348, "learning_rate": 1.9044241475167339e-06, "epoch": 0.5979758566028534, "percentage": 59.8, "elapsed_time": "7:53:57", "remaining_time": "5:18:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 614, "total_steps": 1025, "loss": 0.1287, "learning_rate": 1.8965877433053409e-06, "epoch": 0.5989513473966589, "percentage": 59.9, "elapsed_time": "7:54:44", "remaining_time": "5:17:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 615, "total_steps": 1025, "loss": 0.1234, "learning_rate": 1.8887576296323069e-06, "epoch": 0.5999268381904646, "percentage": 60.0, "elapsed_time": "7:55:33", "remaining_time": "5:17:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 616, "total_steps": 1025, "loss": 0.1312, "learning_rate": 1.8809338881261213e-06, "epoch": 0.6009023289842702, "percentage": 60.1, "elapsed_time": "7:56:20", "remaining_time": "5:16:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 617, "total_steps": 1025, "loss": 0.1256, "learning_rate": 1.8731166003488427e-06, "epoch": 0.6018778197780759, "percentage": 60.2, "elapsed_time": "7:57:10", "remaining_time": "5:15:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 618, "total_steps": 1025, "loss": 0.1269, "learning_rate": 1.86530584779525e-06, "epoch": 0.6028533105718815, "percentage": 60.29, "elapsed_time": "7:57:56", "remaining_time": "5:14:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 619, "total_steps": 1025, "loss": 0.1277, "learning_rate": 1.857501711891993e-06, "epoch": 0.6038288013656871, "percentage": 60.39, "elapsed_time": "7:58:39", "remaining_time": "5:13:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 620, "total_steps": 1025, "loss": 0.1321, "learning_rate": 1.8497042739967447e-06, "epoch": 0.6048042921594927, "percentage": 60.49, "elapsed_time": "7:59:23", "remaining_time": "5:13:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 621, "total_steps": 1025, "loss": 0.1273, "learning_rate": 1.841913615397348e-06, "epoch": 0.6057797829532984, "percentage": 60.59, "elapsed_time": "8:00:11", "remaining_time": "5:12:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 622, "total_steps": 1025, "loss": 0.1293, "learning_rate": 1.834129817310977e-06, "epoch": 0.606755273747104, "percentage": 60.68, "elapsed_time": "8:00:58", "remaining_time": "5:11:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 623, "total_steps": 1025, "loss": 0.1276, "learning_rate": 1.826352960883281e-06, "epoch": 0.6077307645409097, "percentage": 60.78, "elapsed_time": "8:01:48", "remaining_time": "5:10:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 624, "total_steps": 1025, "loss": 0.1204, "learning_rate": 1.8185831271875457e-06, "epoch": 0.6087062553347152, "percentage": 60.88, "elapsed_time": "8:02:34", "remaining_time": "5:10:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 625, "total_steps": 1025, "loss": 0.124, "learning_rate": 1.8108203972238436e-06, "epoch": 0.6096817461285209, "percentage": 60.98, "elapsed_time": "8:03:20", "remaining_time": "5:09:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 626, "total_steps": 1025, "loss": 0.1327, "learning_rate": 1.8030648519181926e-06, "epoch": 0.6106572369223265, "percentage": 61.07, "elapsed_time": "8:04:08", "remaining_time": "5:08:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 627, "total_steps": 1025, "loss": 0.1206, "learning_rate": 1.7953165721217086e-06, "epoch": 0.6116327277161322, "percentage": 61.17, "elapsed_time": "8:04:51", "remaining_time": "5:07:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 628, "total_steps": 1025, "loss": 0.1376, "learning_rate": 1.7875756386097686e-06, "epoch": 0.6126082185099379, "percentage": 61.27, "elapsed_time": "8:05:36", "remaining_time": "5:06:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 629, "total_steps": 1025, "loss": 0.1243, "learning_rate": 1.779842132081162e-06, "epoch": 0.6135837093037434, "percentage": 61.37, "elapsed_time": "8:06:22", "remaining_time": "5:06:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 630, "total_steps": 1025, "loss": 0.132, "learning_rate": 1.7721161331572522e-06, "epoch": 0.614559200097549, "percentage": 61.46, "elapsed_time": "8:07:09", "remaining_time": "5:05:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 631, "total_steps": 1025, "loss": 0.1364, "learning_rate": 1.7643977223811392e-06, "epoch": 0.6155346908913547, "percentage": 61.56, "elapsed_time": "8:07:54", "remaining_time": "5:04:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 632, "total_steps": 1025, "loss": 0.1189, "learning_rate": 1.7566869802168132e-06, "epoch": 0.6165101816851604, "percentage": 61.66, "elapsed_time": "8:08:39", "remaining_time": "5:03:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 633, "total_steps": 1025, "loss": 0.1277, "learning_rate": 1.7489839870483236e-06, "epoch": 0.617485672478966, "percentage": 61.76, "elapsed_time": "8:09:24", "remaining_time": "5:03:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 634, "total_steps": 1025, "loss": 0.1358, "learning_rate": 1.7412888231789327e-06, "epoch": 0.6184611632727716, "percentage": 61.85, "elapsed_time": "8:10:10", "remaining_time": "5:02:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 635, "total_steps": 1025, "loss": 0.1268, "learning_rate": 1.7336015688302869e-06, "epoch": 0.6194366540665772, "percentage": 61.95, "elapsed_time": "8:10:55", "remaining_time": "5:01:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 636, "total_steps": 1025, "loss": 0.1295, "learning_rate": 1.725922304141573e-06, "epoch": 0.6204121448603829, "percentage": 62.05, "elapsed_time": "8:11:43", "remaining_time": "5:00:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 637, "total_steps": 1025, "loss": 0.1318, "learning_rate": 1.718251109168688e-06, "epoch": 0.6213876356541885, "percentage": 62.15, "elapsed_time": "8:12:29", "remaining_time": "4:59:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 638, "total_steps": 1025, "loss": 0.1212, "learning_rate": 1.7105880638834007e-06, "epoch": 0.6223631264479942, "percentage": 62.24, "elapsed_time": "8:13:13", "remaining_time": "4:59:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 639, "total_steps": 1025, "loss": 0.1364, "learning_rate": 1.7029332481725234e-06, "epoch": 0.6233386172417997, "percentage": 62.34, "elapsed_time": "8:14:00", "remaining_time": "4:58:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 640, "total_steps": 1025, "loss": 0.127, "learning_rate": 1.6952867418370707e-06, "epoch": 0.6243141080356054, "percentage": 62.44, "elapsed_time": "8:14:48", "remaining_time": "4:57:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 641, "total_steps": 1025, "loss": 0.1249, "learning_rate": 1.6876486245914375e-06, "epoch": 0.625289598829411, "percentage": 62.54, "elapsed_time": "8:15:35", "remaining_time": "4:56:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 642, "total_steps": 1025, "loss": 0.1329, "learning_rate": 1.6800189760625585e-06, "epoch": 0.6262650896232167, "percentage": 62.63, "elapsed_time": "8:16:19", "remaining_time": "4:56:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 643, "total_steps": 1025, "loss": 0.125, "learning_rate": 1.672397875789086e-06, "epoch": 0.6272405804170224, "percentage": 62.73, "elapsed_time": "8:17:03", "remaining_time": "4:55:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 644, "total_steps": 1025, "loss": 0.1304, "learning_rate": 1.6647854032205547e-06, "epoch": 0.6282160712108279, "percentage": 62.83, "elapsed_time": "8:17:50", "remaining_time": "4:54:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 645, "total_steps": 1025, "loss": 0.1249, "learning_rate": 1.6571816377165568e-06, "epoch": 0.6291915620046336, "percentage": 62.93, "elapsed_time": "8:18:38", "remaining_time": "4:53:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 646, "total_steps": 1025, "loss": 0.131, "learning_rate": 1.6495866585459142e-06, "epoch": 0.6301670527984392, "percentage": 63.02, "elapsed_time": "8:19:25", "remaining_time": "4:53:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 647, "total_steps": 1025, "loss": 0.1329, "learning_rate": 1.6420005448858522e-06, "epoch": 0.6311425435922449, "percentage": 63.12, "elapsed_time": "8:20:12", "remaining_time": "4:52:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 648, "total_steps": 1025, "loss": 0.1217, "learning_rate": 1.6344233758211717e-06, "epoch": 0.6321180343860505, "percentage": 63.22, "elapsed_time": "8:20:55", "remaining_time": "4:51:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 649, "total_steps": 1025, "loss": 0.1211, "learning_rate": 1.6268552303434298e-06, "epoch": 0.6330935251798561, "percentage": 63.32, "elapsed_time": "8:21:41", "remaining_time": "4:50:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 650, "total_steps": 1025, "loss": 0.1297, "learning_rate": 1.6192961873501096e-06, "epoch": 0.6340690159736617, "percentage": 63.41, "elapsed_time": "8:22:24", "remaining_time": "4:49:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 651, "total_steps": 1025, "loss": 0.1295, "learning_rate": 1.611746325643805e-06, "epoch": 0.6350445067674674, "percentage": 63.51, "elapsed_time": "8:23:08", "remaining_time": "4:49:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 652, "total_steps": 1025, "loss": 0.1246, "learning_rate": 1.6042057239313919e-06, "epoch": 0.636019997561273, "percentage": 63.61, "elapsed_time": "8:23:52", "remaining_time": "4:48:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 653, "total_steps": 1025, "loss": 0.12, "learning_rate": 1.5966744608232137e-06, "epoch": 0.6369954883550787, "percentage": 63.71, "elapsed_time": "8:24:36", "remaining_time": "4:47:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 654, "total_steps": 1025, "loss": 0.1187, "learning_rate": 1.5891526148322594e-06, "epoch": 0.6379709791488842, "percentage": 63.8, "elapsed_time": "8:25:21", "remaining_time": "4:46:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 655, "total_steps": 1025, "loss": 0.1276, "learning_rate": 1.5816402643733441e-06, "epoch": 0.6389464699426899, "percentage": 63.9, "elapsed_time": "8:26:06", "remaining_time": "4:45:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 656, "total_steps": 1025, "loss": 0.1267, "learning_rate": 1.5741374877622922e-06, "epoch": 0.6399219607364955, "percentage": 64.0, "elapsed_time": "8:26:51", "remaining_time": "4:45:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 657, "total_steps": 1025, "loss": 0.1344, "learning_rate": 1.566644363215123e-06, "epoch": 0.6408974515303012, "percentage": 64.1, "elapsed_time": "8:27:35", "remaining_time": "4:44:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 658, "total_steps": 1025, "loss": 0.1363, "learning_rate": 1.5591609688472313e-06, "epoch": 0.6418729423241069, "percentage": 64.2, "elapsed_time": "8:28:22", "remaining_time": "4:43:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 659, "total_steps": 1025, "loss": 0.1354, "learning_rate": 1.551687382672578e-06, "epoch": 0.6428484331179124, "percentage": 64.29, "elapsed_time": "8:29:06", "remaining_time": "4:42:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 660, "total_steps": 1025, "loss": 0.1281, "learning_rate": 1.5442236826028705e-06, "epoch": 0.643823923911718, "percentage": 64.39, "elapsed_time": "8:29:52", "remaining_time": "4:41:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 661, "total_steps": 1025, "loss": 0.1316, "learning_rate": 1.5367699464467596e-06, "epoch": 0.6447994147055237, "percentage": 64.49, "elapsed_time": "8:30:38", "remaining_time": "4:41:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 662, "total_steps": 1025, "loss": 0.1289, "learning_rate": 1.5293262519090169e-06, "epoch": 0.6457749054993294, "percentage": 64.59, "elapsed_time": "8:31:25", "remaining_time": "4:40:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 663, "total_steps": 1025, "loss": 0.1238, "learning_rate": 1.5218926765897345e-06, "epoch": 0.646750396293135, "percentage": 64.68, "elapsed_time": "8:32:16", "remaining_time": "4:39:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 664, "total_steps": 1025, "loss": 0.1279, "learning_rate": 1.5144692979835103e-06, "epoch": 0.6477258870869406, "percentage": 64.78, "elapsed_time": "8:33:01", "remaining_time": "4:38:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 665, "total_steps": 1025, "loss": 0.131, "learning_rate": 1.5070561934786437e-06, "epoch": 0.6487013778807462, "percentage": 64.88, "elapsed_time": "8:33:48", "remaining_time": "4:38:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 666, "total_steps": 1025, "loss": 0.1334, "learning_rate": 1.4996534403563267e-06, "epoch": 0.6496768686745519, "percentage": 64.98, "elapsed_time": "8:34:35", "remaining_time": "4:37:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 667, "total_steps": 1025, "loss": 0.1168, "learning_rate": 1.4922611157898364e-06, "epoch": 0.6506523594683575, "percentage": 65.07, "elapsed_time": "8:35:23", "remaining_time": "4:36:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 668, "total_steps": 1025, "loss": 0.1248, "learning_rate": 1.4848792968437376e-06, "epoch": 0.6516278502621632, "percentage": 65.17, "elapsed_time": "8:36:09", "remaining_time": "4:35:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 669, "total_steps": 1025, "loss": 0.1321, "learning_rate": 1.477508060473069e-06, "epoch": 0.6526033410559687, "percentage": 65.27, "elapsed_time": "8:36:53", "remaining_time": "4:35:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 670, "total_steps": 1025, "loss": 0.1312, "learning_rate": 1.4701474835225515e-06, "epoch": 0.6535788318497744, "percentage": 65.37, "elapsed_time": "8:37:40", "remaining_time": "4:34:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 671, "total_steps": 1025, "loss": 0.1201, "learning_rate": 1.4627976427257784e-06, "epoch": 0.65455432264358, "percentage": 65.46, "elapsed_time": "8:38:26", "remaining_time": "4:33:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 672, "total_steps": 1025, "loss": 0.1365, "learning_rate": 1.4554586147044225e-06, "epoch": 0.6555298134373857, "percentage": 65.56, "elapsed_time": "8:39:11", "remaining_time": "4:32:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 673, "total_steps": 1025, "loss": 0.1249, "learning_rate": 1.4481304759674303e-06, "epoch": 0.6565053042311914, "percentage": 65.66, "elapsed_time": "8:39:59", "remaining_time": "4:31:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 674, "total_steps": 1025, "loss": 0.1195, "learning_rate": 1.4408133029102322e-06, "epoch": 0.6574807950249969, "percentage": 65.76, "elapsed_time": "8:40:46", "remaining_time": "4:31:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 675, "total_steps": 1025, "loss": 0.1183, "learning_rate": 1.4335071718139379e-06, "epoch": 0.6584562858188026, "percentage": 65.85, "elapsed_time": "8:41:35", "remaining_time": "4:30:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 676, "total_steps": 1025, "loss": 0.1245, "learning_rate": 1.4262121588445493e-06, "epoch": 0.6594317766126082, "percentage": 65.95, "elapsed_time": "8:42:17", "remaining_time": "4:29:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 677, "total_steps": 1025, "loss": 0.1286, "learning_rate": 1.418928340052159e-06, "epoch": 0.6604072674064139, "percentage": 66.05, "elapsed_time": "8:43:04", "remaining_time": "4:28:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 678, "total_steps": 1025, "loss": 0.1252, "learning_rate": 1.411655791370164e-06, "epoch": 0.6613827582002195, "percentage": 66.15, "elapsed_time": "8:43:44", "remaining_time": "4:28:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 679, "total_steps": 1025, "loss": 0.1179, "learning_rate": 1.4043945886144673e-06, "epoch": 0.6623582489940251, "percentage": 66.24, "elapsed_time": "8:44:30", "remaining_time": "4:27:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 680, "total_steps": 1025, "loss": 0.1252, "learning_rate": 1.397144807482696e-06, "epoch": 0.6633337397878307, "percentage": 66.34, "elapsed_time": "8:45:14", "remaining_time": "4:26:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 681, "total_steps": 1025, "loss": 0.1216, "learning_rate": 1.3899065235534031e-06, "epoch": 0.6643092305816364, "percentage": 66.44, "elapsed_time": "8:46:00", "remaining_time": "4:25:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 682, "total_steps": 1025, "loss": 0.1283, "learning_rate": 1.382679812285287e-06, "epoch": 0.665284721375442, "percentage": 66.54, "elapsed_time": "8:46:49", "remaining_time": "4:24:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 683, "total_steps": 1025, "loss": 0.1188, "learning_rate": 1.375464749016399e-06, "epoch": 0.6662602121692477, "percentage": 66.63, "elapsed_time": "8:47:32", "remaining_time": "4:24:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 684, "total_steps": 1025, "loss": 0.129, "learning_rate": 1.3682614089633637e-06, "epoch": 0.6672357029630532, "percentage": 66.73, "elapsed_time": "8:48:16", "remaining_time": "4:23:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 685, "total_steps": 1025, "loss": 0.1281, "learning_rate": 1.3610698672205897e-06, "epoch": 0.6682111937568589, "percentage": 66.83, "elapsed_time": "8:49:03", "remaining_time": "4:22:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 686, "total_steps": 1025, "loss": 0.1292, "learning_rate": 1.3538901987594882e-06, "epoch": 0.6691866845506645, "percentage": 66.93, "elapsed_time": "8:49:53", "remaining_time": "4:21:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 687, "total_steps": 1025, "loss": 0.1309, "learning_rate": 1.3467224784276961e-06, "epoch": 0.6701621753444702, "percentage": 67.02, "elapsed_time": "8:50:41", "remaining_time": "4:21:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 688, "total_steps": 1025, "loss": 0.1139, "learning_rate": 1.339566780948287e-06, "epoch": 0.6711376661382759, "percentage": 67.12, "elapsed_time": "8:51:26", "remaining_time": "4:20:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 689, "total_steps": 1025, "loss": 0.1309, "learning_rate": 1.3324231809189985e-06, "epoch": 0.6721131569320814, "percentage": 67.22, "elapsed_time": "8:52:08", "remaining_time": "4:19:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 690, "total_steps": 1025, "loss": 0.1267, "learning_rate": 1.3252917528114556e-06, "epoch": 0.6730886477258871, "percentage": 67.32, "elapsed_time": "8:52:55", "remaining_time": "4:18:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 691, "total_steps": 1025, "loss": 0.1213, "learning_rate": 1.3181725709703874e-06, "epoch": 0.6740641385196927, "percentage": 67.41, "elapsed_time": "8:53:43", "remaining_time": "4:17:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 692, "total_steps": 1025, "loss": 0.12, "learning_rate": 1.3110657096128606e-06, "epoch": 0.6750396293134984, "percentage": 67.51, "elapsed_time": "8:54:29", "remaining_time": "4:17:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 693, "total_steps": 1025, "loss": 0.1231, "learning_rate": 1.3039712428274976e-06, "epoch": 0.676015120107304, "percentage": 67.61, "elapsed_time": "8:55:14", "remaining_time": "4:16:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 694, "total_steps": 1025, "loss": 0.1294, "learning_rate": 1.2968892445737117e-06, "epoch": 0.6769906109011096, "percentage": 67.71, "elapsed_time": "8:55:58", "remaining_time": "4:15:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 695, "total_steps": 1025, "loss": 0.1256, "learning_rate": 1.2898197886809289e-06, "epoch": 0.6779661016949152, "percentage": 67.8, "elapsed_time": "8:56:45", "remaining_time": "4:14:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 696, "total_steps": 1025, "loss": 0.13, "learning_rate": 1.2827629488478254e-06, "epoch": 0.6789415924887209, "percentage": 67.9, "elapsed_time": "8:57:28", "remaining_time": "4:14:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 697, "total_steps": 1025, "loss": 0.1306, "learning_rate": 1.2757187986415528e-06, "epoch": 0.6799170832825265, "percentage": 68.0, "elapsed_time": "8:58:15", "remaining_time": "4:13:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 698, "total_steps": 1025, "loss": 0.1323, "learning_rate": 1.2686874114969767e-06, "epoch": 0.6808925740763322, "percentage": 68.1, "elapsed_time": "8:59:03", "remaining_time": "4:12:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 699, "total_steps": 1025, "loss": 0.1396, "learning_rate": 1.2616688607159045e-06, "epoch": 0.6818680648701377, "percentage": 68.2, "elapsed_time": "8:59:54", "remaining_time": "4:11:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 700, "total_steps": 1025, "loss": 0.1254, "learning_rate": 1.2546632194663305e-06, "epoch": 0.6828435556639434, "percentage": 68.29, "elapsed_time": "9:00:41", "remaining_time": "4:11:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 701, "total_steps": 1025, "loss": 0.1234, "learning_rate": 1.2476705607816639e-06, "epoch": 0.683819046457749, "percentage": 68.39, "elapsed_time": "9:01:31", "remaining_time": "4:10:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 702, "total_steps": 1025, "loss": 0.125, "learning_rate": 1.2406909575599717e-06, "epoch": 0.6847945372515547, "percentage": 68.49, "elapsed_time": "9:02:19", "remaining_time": "4:09:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 703, "total_steps": 1025, "loss": 0.135, "learning_rate": 1.2337244825632217e-06, "epoch": 0.6857700280453604, "percentage": 68.59, "elapsed_time": "9:03:06", "remaining_time": "4:08:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 704, "total_steps": 1025, "loss": 0.1158, "learning_rate": 1.2267712084165168e-06, "epoch": 0.6867455188391659, "percentage": 68.68, "elapsed_time": "9:03:51", "remaining_time": "4:07:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 705, "total_steps": 1025, "loss": 0.128, "learning_rate": 1.2198312076073427e-06, "epoch": 0.6877210096329716, "percentage": 68.78, "elapsed_time": "9:04:33", "remaining_time": "4:07:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 706, "total_steps": 1025, "loss": 0.128, "learning_rate": 1.2129045524848138e-06, "epoch": 0.6886965004267772, "percentage": 68.88, "elapsed_time": "9:05:16", "remaining_time": "4:06:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 707, "total_steps": 1025, "loss": 0.1185, "learning_rate": 1.205991315258914e-06, "epoch": 0.6896719912205829, "percentage": 68.98, "elapsed_time": "9:06:03", "remaining_time": "4:05:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 708, "total_steps": 1025, "loss": 0.1264, "learning_rate": 1.199091567999746e-06, "epoch": 0.6906474820143885, "percentage": 69.07, "elapsed_time": "9:06:49", "remaining_time": "4:04:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 709, "total_steps": 1025, "loss": 0.1152, "learning_rate": 1.1922053826367833e-06, "epoch": 0.6916229728081941, "percentage": 69.17, "elapsed_time": "9:07:33", "remaining_time": "4:04:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 710, "total_steps": 1025, "loss": 0.1283, "learning_rate": 1.1853328309581139e-06, "epoch": 0.6925984636019997, "percentage": 69.27, "elapsed_time": "9:08:20", "remaining_time": "4:03:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 711, "total_steps": 1025, "loss": 0.1238, "learning_rate": 1.1784739846096982e-06, "epoch": 0.6935739543958054, "percentage": 69.37, "elapsed_time": "9:09:09", "remaining_time": "4:02:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 712, "total_steps": 1025, "loss": 0.1234, "learning_rate": 1.1716289150946173e-06, "epoch": 0.694549445189611, "percentage": 69.46, "elapsed_time": "9:09:54", "remaining_time": "4:01:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 713, "total_steps": 1025, "loss": 0.1306, "learning_rate": 1.1647976937723315e-06, "epoch": 0.6955249359834167, "percentage": 69.56, "elapsed_time": "9:10:39", "remaining_time": "4:00:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 714, "total_steps": 1025, "loss": 0.125, "learning_rate": 1.1579803918579322e-06, "epoch": 0.6965004267772222, "percentage": 69.66, "elapsed_time": "9:11:27", "remaining_time": "4:00:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 715, "total_steps": 1025, "loss": 0.1248, "learning_rate": 1.1511770804214046e-06, "epoch": 0.6974759175710279, "percentage": 69.76, "elapsed_time": "9:12:11", "remaining_time": "3:59:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 716, "total_steps": 1025, "loss": 0.1338, "learning_rate": 1.1443878303868805e-06, "epoch": 0.6984514083648335, "percentage": 69.85, "elapsed_time": "9:13:00", "remaining_time": "3:58:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 717, "total_steps": 1025, "loss": 0.1148, "learning_rate": 1.1376127125319065e-06, "epoch": 0.6994268991586392, "percentage": 69.95, "elapsed_time": "9:13:43", "remaining_time": "3:57:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 718, "total_steps": 1025, "loss": 0.1274, "learning_rate": 1.1308517974866973e-06, "epoch": 0.7004023899524449, "percentage": 70.05, "elapsed_time": "9:14:31", "remaining_time": "3:57:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 719, "total_steps": 1025, "loss": 0.124, "learning_rate": 1.1241051557334087e-06, "epoch": 0.7013778807462504, "percentage": 70.15, "elapsed_time": "9:15:19", "remaining_time": "3:56:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 720, "total_steps": 1025, "loss": 0.1354, "learning_rate": 1.117372857605395e-06, "epoch": 0.7023533715400561, "percentage": 70.24, "elapsed_time": "9:16:05", "remaining_time": "3:55:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 721, "total_steps": 1025, "loss": 0.1164, "learning_rate": 1.110654973286481e-06, "epoch": 0.7033288623338617, "percentage": 70.34, "elapsed_time": "9:16:51", "remaining_time": "3:54:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 722, "total_steps": 1025, "loss": 0.1275, "learning_rate": 1.1039515728102273e-06, "epoch": 0.7043043531276674, "percentage": 70.44, "elapsed_time": "9:17:35", "remaining_time": "3:54:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 723, "total_steps": 1025, "loss": 0.1231, "learning_rate": 1.0972627260592014e-06, "epoch": 0.705279843921473, "percentage": 70.54, "elapsed_time": "9:18:24", "remaining_time": "3:53:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 724, "total_steps": 1025, "loss": 0.1177, "learning_rate": 1.0905885027642484e-06, "epoch": 0.7062553347152786, "percentage": 70.63, "elapsed_time": "9:19:12", "remaining_time": "3:52:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 725, "total_steps": 1025, "loss": 0.1334, "learning_rate": 1.0839289725037669e-06, "epoch": 0.7072308255090842, "percentage": 70.73, "elapsed_time": "9:19:57", "remaining_time": "3:51:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 726, "total_steps": 1025, "loss": 0.1218, "learning_rate": 1.0772842047029786e-06, "epoch": 0.7082063163028899, "percentage": 70.83, "elapsed_time": "9:20:46", "remaining_time": "3:50:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 727, "total_steps": 1025, "loss": 0.1143, "learning_rate": 1.0706542686332102e-06, "epoch": 0.7091818070966955, "percentage": 70.93, "elapsed_time": "9:21:30", "remaining_time": "3:50:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 728, "total_steps": 1025, "loss": 0.1264, "learning_rate": 1.064039233411166e-06, "epoch": 0.7101572978905012, "percentage": 71.02, "elapsed_time": "9:22:18", "remaining_time": "3:49:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 729, "total_steps": 1025, "loss": 0.1278, "learning_rate": 1.057439167998212e-06, "epoch": 0.7111327886843067, "percentage": 71.12, "elapsed_time": "9:23:04", "remaining_time": "3:48:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 730, "total_steps": 1025, "loss": 0.1235, "learning_rate": 1.050854141199652e-06, "epoch": 0.7121082794781124, "percentage": 71.22, "elapsed_time": "9:23:52", "remaining_time": "3:47:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 731, "total_steps": 1025, "loss": 0.1208, "learning_rate": 1.0442842216640168e-06, "epoch": 0.713083770271918, "percentage": 71.32, "elapsed_time": "9:24:34", "remaining_time": "3:47:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 732, "total_steps": 1025, "loss": 0.117, "learning_rate": 1.037729477882341e-06, "epoch": 0.7140592610657237, "percentage": 71.41, "elapsed_time": "9:25:21", "remaining_time": "3:46:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 733, "total_steps": 1025, "loss": 0.1293, "learning_rate": 1.0311899781874563e-06, "epoch": 0.7150347518595294, "percentage": 71.51, "elapsed_time": "9:26:07", "remaining_time": "3:45:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 734, "total_steps": 1025, "loss": 0.1216, "learning_rate": 1.0246657907532727e-06, "epoch": 0.7160102426533349, "percentage": 71.61, "elapsed_time": "9:26:53", "remaining_time": "3:44:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 735, "total_steps": 1025, "loss": 0.1149, "learning_rate": 1.018156983594073e-06, "epoch": 0.7169857334471406, "percentage": 71.71, "elapsed_time": "9:27:39", "remaining_time": "3:43:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 736, "total_steps": 1025, "loss": 0.115, "learning_rate": 1.0116636245637997e-06, "epoch": 0.7179612242409462, "percentage": 71.8, "elapsed_time": "9:28:25", "remaining_time": "3:43:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 737, "total_steps": 1025, "loss": 0.123, "learning_rate": 1.0051857813553516e-06, "epoch": 0.7189367150347519, "percentage": 71.9, "elapsed_time": "9:29:13", "remaining_time": "3:42:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 738, "total_steps": 1025, "loss": 0.1277, "learning_rate": 9.987235214998741e-07, "epoch": 0.7199122058285575, "percentage": 72.0, "elapsed_time": "9:29:59", "remaining_time": "3:41:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 739, "total_steps": 1025, "loss": 0.1197, "learning_rate": 9.922769123660564e-07, "epoch": 0.7208876966223631, "percentage": 72.1, "elapsed_time": "9:30:45", "remaining_time": "3:40:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 740, "total_steps": 1025, "loss": 0.124, "learning_rate": 9.858460211594331e-07, "epoch": 0.7218631874161687, "percentage": 72.2, "elapsed_time": "9:31:33", "remaining_time": "3:40:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 741, "total_steps": 1025, "loss": 0.1207, "learning_rate": 9.79430914921677e-07, "epoch": 0.7228386782099744, "percentage": 72.29, "elapsed_time": "9:32:19", "remaining_time": "3:39:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 742, "total_steps": 1025, "loss": 0.1226, "learning_rate": 9.730316605299041e-07, "epoch": 0.72381416900378, "percentage": 72.39, "elapsed_time": "9:33:09", "remaining_time": "3:38:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 743, "total_steps": 1025, "loss": 0.119, "learning_rate": 9.666483246959785e-07, "epoch": 0.7247896597975857, "percentage": 72.49, "elapsed_time": "9:33:50", "remaining_time": "3:37:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 744, "total_steps": 1025, "loss": 0.1245, "learning_rate": 9.602809739658105e-07, "epoch": 0.7257651505913912, "percentage": 72.59, "elapsed_time": "9:34:33", "remaining_time": "3:37:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 745, "total_steps": 1025, "loss": 0.1216, "learning_rate": 9.53929674718668e-07, "epoch": 0.7267406413851969, "percentage": 72.68, "elapsed_time": "9:35:16", "remaining_time": "3:36:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 746, "total_steps": 1025, "loss": 0.125, "learning_rate": 9.475944931664851e-07, "epoch": 0.7277161321790026, "percentage": 72.78, "elapsed_time": "9:36:06", "remaining_time": "3:35:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 747, "total_steps": 1025, "loss": 0.1223, "learning_rate": 9.412754953531664e-07, "epoch": 0.7286916229728082, "percentage": 72.88, "elapsed_time": "9:36:53", "remaining_time": "3:34:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 748, "total_steps": 1025, "loss": 0.1215, "learning_rate": 9.349727471539052e-07, "epoch": 0.7296671137666139, "percentage": 72.98, "elapsed_time": "9:37:42", "remaining_time": "3:33:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 749, "total_steps": 1025, "loss": 0.1237, "learning_rate": 9.286863142744907e-07, "epoch": 0.7306426045604194, "percentage": 73.07, "elapsed_time": "9:38:28", "remaining_time": "3:33:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 750, "total_steps": 1025, "loss": 0.118, "learning_rate": 9.224162622506283e-07, "epoch": 0.7316180953542251, "percentage": 73.17, "elapsed_time": "9:39:15", "remaining_time": "3:32:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 751, "total_steps": 1025, "loss": 0.1271, "learning_rate": 9.161626564472511e-07, "epoch": 0.7325935861480307, "percentage": 73.27, "elapsed_time": "9:40:00", "remaining_time": "3:31:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 752, "total_steps": 1025, "loss": 0.1212, "learning_rate": 9.099255620578451e-07, "epoch": 0.7335690769418364, "percentage": 73.37, "elapsed_time": "9:40:47", "remaining_time": "3:30:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 753, "total_steps": 1025, "loss": 0.1209, "learning_rate": 9.037050441037614e-07, "epoch": 0.734544567735642, "percentage": 73.46, "elapsed_time": "9:41:31", "remaining_time": "3:30:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 754, "total_steps": 1025, "loss": 0.1271, "learning_rate": 8.975011674335468e-07, "epoch": 0.7355200585294476, "percentage": 73.56, "elapsed_time": "9:42:18", "remaining_time": "3:29:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 755, "total_steps": 1025, "loss": 0.1174, "learning_rate": 8.9131399672226e-07, "epoch": 0.7364955493232532, "percentage": 73.66, "elapsed_time": "9:43:06", "remaining_time": "3:28:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 756, "total_steps": 1025, "loss": 0.1138, "learning_rate": 8.851435964708044e-07, "epoch": 0.7374710401170589, "percentage": 73.76, "elapsed_time": "9:43:50", "remaining_time": "3:27:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 757, "total_steps": 1025, "loss": 0.1215, "learning_rate": 8.789900310052491e-07, "epoch": 0.7384465309108645, "percentage": 73.85, "elapsed_time": "9:44:38", "remaining_time": "3:26:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 758, "total_steps": 1025, "loss": 0.1235, "learning_rate": 8.728533644761647e-07, "epoch": 0.7394220217046702, "percentage": 73.95, "elapsed_time": "9:45:24", "remaining_time": "3:26:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 759, "total_steps": 1025, "loss": 0.1226, "learning_rate": 8.667336608579488e-07, "epoch": 0.7403975124984757, "percentage": 74.05, "elapsed_time": "9:46:10", "remaining_time": "3:25:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 760, "total_steps": 1025, "loss": 0.123, "learning_rate": 8.606309839481628e-07, "epoch": 0.7413730032922814, "percentage": 74.15, "elapsed_time": "9:46:58", "remaining_time": "3:24:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 761, "total_steps": 1025, "loss": 0.1182, "learning_rate": 8.545453973668643e-07, "epoch": 0.742348494086087, "percentage": 74.24, "elapsed_time": "9:47:45", "remaining_time": "3:23:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 762, "total_steps": 1025, "loss": 0.1195, "learning_rate": 8.484769645559482e-07, "epoch": 0.7433239848798927, "percentage": 74.34, "elapsed_time": "9:48:31", "remaining_time": "3:23:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 763, "total_steps": 1025, "loss": 0.1221, "learning_rate": 8.424257487784787e-07, "epoch": 0.7442994756736984, "percentage": 74.44, "elapsed_time": "9:49:17", "remaining_time": "3:22:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 764, "total_steps": 1025, "loss": 0.1256, "learning_rate": 8.363918131180371e-07, "epoch": 0.7452749664675039, "percentage": 74.54, "elapsed_time": "9:50:05", "remaining_time": "3:21:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 765, "total_steps": 1025, "loss": 0.1248, "learning_rate": 8.303752204780563e-07, "epoch": 0.7462504572613096, "percentage": 74.63, "elapsed_time": "9:50:52", "remaining_time": "3:20:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 766, "total_steps": 1025, "loss": 0.1246, "learning_rate": 8.243760335811734e-07, "epoch": 0.7472259480551152, "percentage": 74.73, "elapsed_time": "9:51:38", "remaining_time": "3:20:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 767, "total_steps": 1025, "loss": 0.1173, "learning_rate": 8.183943149685678e-07, "epoch": 0.7482014388489209, "percentage": 74.83, "elapsed_time": "9:52:20", "remaining_time": "3:19:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 768, "total_steps": 1025, "loss": 0.1151, "learning_rate": 8.124301269993168e-07, "epoch": 0.7491769296427265, "percentage": 74.93, "elapsed_time": "9:53:02", "remaining_time": "3:18:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 769, "total_steps": 1025, "loss": 0.1235, "learning_rate": 8.06483531849738e-07, "epoch": 0.7501524204365322, "percentage": 75.02, "elapsed_time": "9:53:48", "remaining_time": "3:17:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 770, "total_steps": 1025, "loss": 0.1262, "learning_rate": 8.00554591512748e-07, "epoch": 0.7511279112303377, "percentage": 75.12, "elapsed_time": "9:54:37", "remaining_time": "3:16:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 771, "total_steps": 1025, "loss": 0.1243, "learning_rate": 7.946433677972104e-07, "epoch": 0.7521034020241434, "percentage": 75.22, "elapsed_time": "9:55:22", "remaining_time": "3:16:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 772, "total_steps": 1025, "loss": 0.1298, "learning_rate": 7.887499223272968e-07, "epoch": 0.753078892817949, "percentage": 75.32, "elapsed_time": "9:56:09", "remaining_time": "3:15:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 773, "total_steps": 1025, "loss": 0.111, "learning_rate": 7.828743165418393e-07, "epoch": 0.7540543836117547, "percentage": 75.41, "elapsed_time": "9:56:53", "remaining_time": "3:14:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 774, "total_steps": 1025, "loss": 0.1139, "learning_rate": 7.770166116936923e-07, "epoch": 0.7550298744055604, "percentage": 75.51, "elapsed_time": "9:57:38", "remaining_time": "3:13:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 775, "total_steps": 1025, "loss": 0.1219, "learning_rate": 7.711768688490962e-07, "epoch": 0.7560053651993659, "percentage": 75.61, "elapsed_time": "9:58:23", "remaining_time": "3:13:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 776, "total_steps": 1025, "loss": 0.1283, "learning_rate": 7.653551488870356e-07, "epoch": 0.7569808559931716, "percentage": 75.71, "elapsed_time": "9:59:10", "remaining_time": "3:12:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 777, "total_steps": 1025, "loss": 0.1237, "learning_rate": 7.595515124986106e-07, "epoch": 0.7579563467869772, "percentage": 75.8, "elapsed_time": "9:59:54", "remaining_time": "3:11:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 778, "total_steps": 1025, "loss": 0.1236, "learning_rate": 7.537660201863989e-07, "epoch": 0.7589318375807829, "percentage": 75.9, "elapsed_time": "10:00:41", "remaining_time": "3:10:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 779, "total_steps": 1025, "loss": 0.126, "learning_rate": 7.479987322638274e-07, "epoch": 0.7599073283745885, "percentage": 76.0, "elapsed_time": "10:01:27", "remaining_time": "3:09:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 780, "total_steps": 1025, "loss": 0.1225, "learning_rate": 7.422497088545436e-07, "epoch": 0.7608828191683941, "percentage": 76.1, "elapsed_time": "10:02:10", "remaining_time": "3:09:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 781, "total_steps": 1025, "loss": 0.1172, "learning_rate": 7.365190098917896e-07, "epoch": 0.7618583099621997, "percentage": 76.2, "elapsed_time": "10:02:55", "remaining_time": "3:08:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 782, "total_steps": 1025, "loss": 0.1194, "learning_rate": 7.308066951177742e-07, "epoch": 0.7628338007560054, "percentage": 76.29, "elapsed_time": "10:03:43", "remaining_time": "3:07:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 783, "total_steps": 1025, "loss": 0.1122, "learning_rate": 7.251128240830543e-07, "epoch": 0.763809291549811, "percentage": 76.39, "elapsed_time": "10:04:29", "remaining_time": "3:06:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 784, "total_steps": 1025, "loss": 0.1275, "learning_rate": 7.194374561459094e-07, "epoch": 0.7647847823436167, "percentage": 76.49, "elapsed_time": "10:05:16", "remaining_time": "3:06:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 785, "total_steps": 1025, "loss": 0.136, "learning_rate": 7.137806504717276e-07, "epoch": 0.7657602731374222, "percentage": 76.59, "elapsed_time": "10:06:05", "remaining_time": "3:05:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 786, "total_steps": 1025, "loss": 0.1213, "learning_rate": 7.081424660323846e-07, "epoch": 0.7667357639312279, "percentage": 76.68, "elapsed_time": "10:06:53", "remaining_time": "3:04:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 787, "total_steps": 1025, "loss": 0.1223, "learning_rate": 7.025229616056326e-07, "epoch": 0.7677112547250335, "percentage": 76.78, "elapsed_time": "10:07:37", "remaining_time": "3:03:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 788, "total_steps": 1025, "loss": 0.1325, "learning_rate": 6.969221957744832e-07, "epoch": 0.7686867455188392, "percentage": 76.88, "elapsed_time": "10:08:24", "remaining_time": "3:02:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 789, "total_steps": 1025, "loss": 0.1193, "learning_rate": 6.913402269266026e-07, "epoch": 0.7696622363126449, "percentage": 76.98, "elapsed_time": "10:09:11", "remaining_time": "3:02:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 790, "total_steps": 1025, "loss": 0.1177, "learning_rate": 6.857771132536958e-07, "epoch": 0.7706377271064504, "percentage": 77.07, "elapsed_time": "10:09:55", "remaining_time": "3:01:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 791, "total_steps": 1025, "loss": 0.1236, "learning_rate": 6.802329127509072e-07, "epoch": 0.771613217900256, "percentage": 77.17, "elapsed_time": "10:10:39", "remaining_time": "3:00:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 792, "total_steps": 1025, "loss": 0.1331, "learning_rate": 6.747076832162094e-07, "epoch": 0.7725887086940617, "percentage": 77.27, "elapsed_time": "10:11:27", "remaining_time": "2:59:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 793, "total_steps": 1025, "loss": 0.1179, "learning_rate": 6.692014822498066e-07, "epoch": 0.7735641994878674, "percentage": 77.37, "elapsed_time": "10:12:13", "remaining_time": "2:59:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 794, "total_steps": 1025, "loss": 0.1123, "learning_rate": 6.637143672535282e-07, "epoch": 0.774539690281673, "percentage": 77.46, "elapsed_time": "10:13:03", "remaining_time": "2:58:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 795, "total_steps": 1025, "loss": 0.1189, "learning_rate": 6.582463954302368e-07, "epoch": 0.7755151810754786, "percentage": 77.56, "elapsed_time": "10:13:50", "remaining_time": "2:57:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 796, "total_steps": 1025, "loss": 0.1145, "learning_rate": 6.527976237832256e-07, "epoch": 0.7764906718692842, "percentage": 77.66, "elapsed_time": "10:14:39", "remaining_time": "2:56:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 797, "total_steps": 1025, "loss": 0.1235, "learning_rate": 6.473681091156289e-07, "epoch": 0.7774661626630899, "percentage": 77.76, "elapsed_time": "10:15:26", "remaining_time": "2:56:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 798, "total_steps": 1025, "loss": 0.1218, "learning_rate": 6.419579080298263e-07, "epoch": 0.7784416534568955, "percentage": 77.85, "elapsed_time": "10:16:11", "remaining_time": "2:55:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 799, "total_steps": 1025, "loss": 0.1227, "learning_rate": 6.36567076926857e-07, "epoch": 0.7794171442507012, "percentage": 77.95, "elapsed_time": "10:16:54", "remaining_time": "2:54:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 800, "total_steps": 1025, "loss": 0.1278, "learning_rate": 6.311956720058263e-07, "epoch": 0.7803926350445067, "percentage": 78.05, "elapsed_time": "10:17:40", "remaining_time": "2:53:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 801, "total_steps": 1025, "loss": 0.1251, "learning_rate": 6.258437492633254e-07, "epoch": 0.7813681258383124, "percentage": 78.15, "elapsed_time": "10:18:28", "remaining_time": "2:52:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 802, "total_steps": 1025, "loss": 0.1139, "learning_rate": 6.205113644928429e-07, "epoch": 0.782343616632118, "percentage": 78.24, "elapsed_time": "10:19:15", "remaining_time": "2:52:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 803, "total_steps": 1025, "loss": 0.1117, "learning_rate": 6.151985732841867e-07, "epoch": 0.7833191074259237, "percentage": 78.34, "elapsed_time": "10:20:02", "remaining_time": "2:51:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 804, "total_steps": 1025, "loss": 0.1308, "learning_rate": 6.099054310229008e-07, "epoch": 0.7842945982197294, "percentage": 78.44, "elapsed_time": "10:20:48", "remaining_time": "2:50:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 805, "total_steps": 1025, "loss": 0.1157, "learning_rate": 6.046319928896926e-07, "epoch": 0.7852700890135349, "percentage": 78.54, "elapsed_time": "10:21:35", "remaining_time": "2:49:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 806, "total_steps": 1025, "loss": 0.1254, "learning_rate": 5.993783138598532e-07, "epoch": 0.7862455798073406, "percentage": 78.63, "elapsed_time": "10:22:24", "remaining_time": "2:49:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 807, "total_steps": 1025, "loss": 0.1193, "learning_rate": 5.941444487026877e-07, "epoch": 0.7872210706011462, "percentage": 78.73, "elapsed_time": "10:23:09", "remaining_time": "2:48:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 808, "total_steps": 1025, "loss": 0.1225, "learning_rate": 5.889304519809402e-07, "epoch": 0.7881965613949519, "percentage": 78.83, "elapsed_time": "10:23:57", "remaining_time": "2:47:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 809, "total_steps": 1025, "loss": 0.1301, "learning_rate": 5.837363780502309e-07, "epoch": 0.7891720521887575, "percentage": 78.93, "elapsed_time": "10:24:42", "remaining_time": "2:46:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 810, "total_steps": 1025, "loss": 0.1173, "learning_rate": 5.785622810584834e-07, "epoch": 0.7901475429825631, "percentage": 79.02, "elapsed_time": "10:25:30", "remaining_time": "2:46:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 811, "total_steps": 1025, "loss": 0.1134, "learning_rate": 5.734082149453634e-07, "epoch": 0.7911230337763687, "percentage": 79.12, "elapsed_time": "10:26:17", "remaining_time": "2:45:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 812, "total_steps": 1025, "loss": 0.125, "learning_rate": 5.682742334417171e-07, "epoch": 0.7920985245701744, "percentage": 79.22, "elapsed_time": "10:27:05", "remaining_time": "2:44:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 813, "total_steps": 1025, "loss": 0.1214, "learning_rate": 5.631603900690077e-07, "epoch": 0.79307401536398, "percentage": 79.32, "elapsed_time": "10:27:52", "remaining_time": "2:43:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 814, "total_steps": 1025, "loss": 0.1244, "learning_rate": 5.580667381387623e-07, "epoch": 0.7940495061577857, "percentage": 79.41, "elapsed_time": "10:28:37", "remaining_time": "2:42:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 815, "total_steps": 1025, "loss": 0.1087, "learning_rate": 5.529933307520102e-07, "epoch": 0.7950249969515912, "percentage": 79.51, "elapsed_time": "10:29:20", "remaining_time": "2:42:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 816, "total_steps": 1025, "loss": 0.1171, "learning_rate": 5.47940220798735e-07, "epoch": 0.7960004877453969, "percentage": 79.61, "elapsed_time": "10:30:07", "remaining_time": "2:41:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 817, "total_steps": 1025, "loss": 0.1226, "learning_rate": 5.429074609573184e-07, "epoch": 0.7969759785392025, "percentage": 79.71, "elapsed_time": "10:30:53", "remaining_time": "2:40:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 818, "total_steps": 1025, "loss": 0.1238, "learning_rate": 5.378951036939966e-07, "epoch": 0.7979514693330082, "percentage": 79.8, "elapsed_time": "10:31:39", "remaining_time": "2:39:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 819, "total_steps": 1025, "loss": 0.1244, "learning_rate": 5.329032012623064e-07, "epoch": 0.7989269601268139, "percentage": 79.9, "elapsed_time": "10:32:30", "remaining_time": "2:39:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 820, "total_steps": 1025, "loss": 0.1131, "learning_rate": 5.279318057025476e-07, "epoch": 0.7999024509206194, "percentage": 80.0, "elapsed_time": "10:33:19", "remaining_time": "2:38:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 821, "total_steps": 1025, "loss": 0.125, "learning_rate": 5.229809688412337e-07, "epoch": 0.8008779417144251, "percentage": 80.1, "elapsed_time": "10:34:06", "remaining_time": "2:37:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 822, "total_steps": 1025, "loss": 0.1182, "learning_rate": 5.180507422905585e-07, "epoch": 0.8018534325082307, "percentage": 80.2, "elapsed_time": "10:34:49", "remaining_time": "2:36:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 823, "total_steps": 1025, "loss": 0.1308, "learning_rate": 5.131411774478503e-07, "epoch": 0.8028289233020364, "percentage": 80.29, "elapsed_time": "10:35:36", "remaining_time": "2:36:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 824, "total_steps": 1025, "loss": 0.1194, "learning_rate": 5.082523254950447e-07, "epoch": 0.803804414095842, "percentage": 80.39, "elapsed_time": "10:36:24", "remaining_time": "2:35:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 825, "total_steps": 1025, "loss": 0.1157, "learning_rate": 5.033842373981429e-07, "epoch": 0.8047799048896476, "percentage": 80.49, "elapsed_time": "10:37:09", "remaining_time": "2:34:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 826, "total_steps": 1025, "loss": 0.1231, "learning_rate": 4.985369639066867e-07, "epoch": 0.8057553956834532, "percentage": 80.59, "elapsed_time": "10:37:56", "remaining_time": "2:33:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 827, "total_steps": 1025, "loss": 0.1205, "learning_rate": 4.937105555532252e-07, "epoch": 0.8067308864772589, "percentage": 80.68, "elapsed_time": "10:38:43", "remaining_time": "2:32:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 828, "total_steps": 1025, "loss": 0.1222, "learning_rate": 4.889050626527905e-07, "epoch": 0.8077063772710645, "percentage": 80.78, "elapsed_time": "10:39:31", "remaining_time": "2:32:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 829, "total_steps": 1025, "loss": 0.1176, "learning_rate": 4.841205353023715e-07, "epoch": 0.8086818680648702, "percentage": 80.88, "elapsed_time": "10:40:18", "remaining_time": "2:31:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 830, "total_steps": 1025, "loss": 0.1168, "learning_rate": 4.79357023380394e-07, "epoch": 0.8096573588586757, "percentage": 80.98, "elapsed_time": "10:41:03", "remaining_time": "2:30:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 831, "total_steps": 1025, "loss": 0.1246, "learning_rate": 4.746145765461965e-07, "epoch": 0.8106328496524814, "percentage": 81.07, "elapsed_time": "10:41:43", "remaining_time": "2:29:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 832, "total_steps": 1025, "loss": 0.1207, "learning_rate": 4.6989324423951847e-07, "epoch": 0.811608340446287, "percentage": 81.17, "elapsed_time": "10:42:28", "remaining_time": "2:29:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 833, "total_steps": 1025, "loss": 0.1214, "learning_rate": 4.651930756799794e-07, "epoch": 0.8125838312400927, "percentage": 81.27, "elapsed_time": "10:43:15", "remaining_time": "2:28:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 834, "total_steps": 1025, "loss": 0.1222, "learning_rate": 4.6051411986656775e-07, "epoch": 0.8135593220338984, "percentage": 81.37, "elapsed_time": "10:43:57", "remaining_time": "2:27:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 835, "total_steps": 1025, "loss": 0.1108, "learning_rate": 4.5585642557713083e-07, "epoch": 0.8145348128277039, "percentage": 81.46, "elapsed_time": "10:44:44", "remaining_time": "2:26:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 836, "total_steps": 1025, "loss": 0.1149, "learning_rate": 4.512200413678672e-07, "epoch": 0.8155103036215096, "percentage": 81.56, "elapsed_time": "10:45:28", "remaining_time": "2:25:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 837, "total_steps": 1025, "loss": 0.1246, "learning_rate": 4.466050155728166e-07, "epoch": 0.8164857944153152, "percentage": 81.66, "elapsed_time": "10:46:14", "remaining_time": "2:25:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 838, "total_steps": 1025, "loss": 0.1139, "learning_rate": 4.420113963033607e-07, "epoch": 0.8174612852091209, "percentage": 81.76, "elapsed_time": "10:47:03", "remaining_time": "2:24:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 839, "total_steps": 1025, "loss": 0.1442, "learning_rate": 4.374392314477174e-07, "epoch": 0.8184367760029265, "percentage": 81.85, "elapsed_time": "10:47:49", "remaining_time": "2:23:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 840, "total_steps": 1025, "loss": 0.117, "learning_rate": 4.3288856867044564e-07, "epoch": 0.8194122667967321, "percentage": 81.95, "elapsed_time": "10:48:38", "remaining_time": "2:22:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 841, "total_steps": 1025, "loss": 0.1106, "learning_rate": 4.2835945541194414e-07, "epoch": 0.8203877575905377, "percentage": 82.05, "elapsed_time": "10:49:27", "remaining_time": "2:22:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 842, "total_steps": 1025, "loss": 0.118, "learning_rate": 4.238519388879614e-07, "epoch": 0.8213632483843434, "percentage": 82.15, "elapsed_time": "10:50:17", "remaining_time": "2:21:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 843, "total_steps": 1025, "loss": 0.1155, "learning_rate": 4.1936606608909887e-07, "epoch": 0.822338739178149, "percentage": 82.24, "elapsed_time": "10:51:02", "remaining_time": "2:20:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 844, "total_steps": 1025, "loss": 0.124, "learning_rate": 4.149018837803262e-07, "epoch": 0.8233142299719547, "percentage": 82.34, "elapsed_time": "10:51:47", "remaining_time": "2:19:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 845, "total_steps": 1025, "loss": 0.1229, "learning_rate": 4.1045943850048843e-07, "epoch": 0.8242897207657602, "percentage": 82.44, "elapsed_time": "10:52:33", "remaining_time": "2:19:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 846, "total_steps": 1025, "loss": 0.1201, "learning_rate": 4.0603877656182373e-07, "epoch": 0.8252652115595659, "percentage": 82.54, "elapsed_time": "10:53:20", "remaining_time": "2:18:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 847, "total_steps": 1025, "loss": 0.1147, "learning_rate": 4.0163994404948144e-07, "epoch": 0.8262407023533715, "percentage": 82.63, "elapsed_time": "10:54:04", "remaining_time": "2:17:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 848, "total_steps": 1025, "loss": 0.1136, "learning_rate": 3.9726298682103923e-07, "epoch": 0.8272161931471772, "percentage": 82.73, "elapsed_time": "10:54:50", "remaining_time": "2:16:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 849, "total_steps": 1025, "loss": 0.1104, "learning_rate": 3.929079505060271e-07, "epoch": 0.8281916839409829, "percentage": 82.83, "elapsed_time": "10:55:36", "remaining_time": "2:15:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 850, "total_steps": 1025, "loss": 0.1196, "learning_rate": 3.8857488050544903e-07, "epoch": 0.8291671747347884, "percentage": 82.93, "elapsed_time": "10:56:25", "remaining_time": "2:15:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 851, "total_steps": 1025, "loss": 0.1187, "learning_rate": 3.842638219913142e-07, "epoch": 0.8301426655285941, "percentage": 83.02, "elapsed_time": "10:57:14", "remaining_time": "2:14:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 852, "total_steps": 1025, "loss": 0.1238, "learning_rate": 3.799748199061612e-07, "epoch": 0.8311181563223997, "percentage": 83.12, "elapsed_time": "10:57:58", "remaining_time": "2:13:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 853, "total_steps": 1025, "loss": 0.1195, "learning_rate": 3.7570791896259147e-07, "epoch": 0.8320936471162054, "percentage": 83.22, "elapsed_time": "10:58:44", "remaining_time": "2:12:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 854, "total_steps": 1025, "loss": 0.1202, "learning_rate": 3.7146316364280426e-07, "epoch": 0.833069137910011, "percentage": 83.32, "elapsed_time": "10:59:31", "remaining_time": "2:12:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 855, "total_steps": 1025, "loss": 0.1244, "learning_rate": 3.6724059819813223e-07, "epoch": 0.8340446287038166, "percentage": 83.41, "elapsed_time": "11:00:15", "remaining_time": "2:11:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 856, "total_steps": 1025, "loss": 0.1257, "learning_rate": 3.630402666485783e-07, "epoch": 0.8350201194976222, "percentage": 83.51, "elapsed_time": "11:01:03", "remaining_time": "2:10:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 857, "total_steps": 1025, "loss": 0.117, "learning_rate": 3.5886221278236045e-07, "epoch": 0.8359956102914279, "percentage": 83.61, "elapsed_time": "11:01:48", "remaining_time": "2:09:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 858, "total_steps": 1025, "loss": 0.1223, "learning_rate": 3.547064801554509e-07, "epoch": 0.8369711010852335, "percentage": 83.71, "elapsed_time": "11:02:35", "remaining_time": "2:08:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 859, "total_steps": 1025, "loss": 0.1273, "learning_rate": 3.5057311209112625e-07, "epoch": 0.8379465918790392, "percentage": 83.8, "elapsed_time": "11:03:23", "remaining_time": "2:08:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 860, "total_steps": 1025, "loss": 0.1237, "learning_rate": 3.4646215167951166e-07, "epoch": 0.8389220826728447, "percentage": 83.9, "elapsed_time": "11:04:08", "remaining_time": "2:07:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 861, "total_steps": 1025, "loss": 0.1194, "learning_rate": 3.4237364177713615e-07, "epoch": 0.8398975734666504, "percentage": 84.0, "elapsed_time": "11:04:49", "remaining_time": "2:06:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 862, "total_steps": 1025, "loss": 0.111, "learning_rate": 3.383076250064815e-07, "epoch": 0.840873064260456, "percentage": 84.1, "elapsed_time": "11:05:33", "remaining_time": "2:05:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 863, "total_steps": 1025, "loss": 0.1227, "learning_rate": 3.342641437555411e-07, "epoch": 0.8418485550542617, "percentage": 84.2, "elapsed_time": "11:06:20", "remaining_time": "2:05:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 864, "total_steps": 1025, "loss": 0.1219, "learning_rate": 3.3024324017737555e-07, "epoch": 0.8428240458480674, "percentage": 84.29, "elapsed_time": "11:07:08", "remaining_time": "2:04:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 865, "total_steps": 1025, "loss": 0.1208, "learning_rate": 3.262449561896766e-07, "epoch": 0.8437995366418729, "percentage": 84.39, "elapsed_time": "11:07:56", "remaining_time": "2:03:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 866, "total_steps": 1025, "loss": 0.1115, "learning_rate": 3.2226933347432516e-07, "epoch": 0.8447750274356786, "percentage": 84.49, "elapsed_time": "11:08:43", "remaining_time": "2:02:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 867, "total_steps": 1025, "loss": 0.1192, "learning_rate": 3.183164134769631e-07, "epoch": 0.8457505182294842, "percentage": 84.59, "elapsed_time": "11:09:33", "remaining_time": "2:02:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 868, "total_steps": 1025, "loss": 0.1271, "learning_rate": 3.143862374065548e-07, "epoch": 0.8467260090232899, "percentage": 84.68, "elapsed_time": "11:10:23", "remaining_time": "2:01:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 869, "total_steps": 1025, "loss": 0.1164, "learning_rate": 3.104788462349612e-07, "epoch": 0.8477014998170955, "percentage": 84.78, "elapsed_time": "11:11:10", "remaining_time": "2:00:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 870, "total_steps": 1025, "loss": 0.1166, "learning_rate": 3.065942806965139e-07, "epoch": 0.8486769906109011, "percentage": 84.88, "elapsed_time": "11:11:59", "remaining_time": "1:59:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 871, "total_steps": 1025, "loss": 0.1231, "learning_rate": 3.0273258128758585e-07, "epoch": 0.8496524814047067, "percentage": 84.98, "elapsed_time": "11:12:45", "remaining_time": "1:58:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 872, "total_steps": 1025, "loss": 0.1269, "learning_rate": 2.98893788266173e-07, "epoch": 0.8506279721985124, "percentage": 85.07, "elapsed_time": "11:13:35", "remaining_time": "1:58:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 873, "total_steps": 1025, "loss": 0.1185, "learning_rate": 2.9507794165147487e-07, "epoch": 0.851603462992318, "percentage": 85.17, "elapsed_time": "11:14:21", "remaining_time": "1:57:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 874, "total_steps": 1025, "loss": 0.1209, "learning_rate": 2.9128508122347324e-07, "epoch": 0.8525789537861237, "percentage": 85.27, "elapsed_time": "11:15:06", "remaining_time": "1:56:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 875, "total_steps": 1025, "loss": 0.1107, "learning_rate": 2.875152465225234e-07, "epoch": 0.8535544445799292, "percentage": 85.37, "elapsed_time": "11:15:56", "remaining_time": "1:55:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 876, "total_steps": 1025, "loss": 0.1159, "learning_rate": 2.837684768489354e-07, "epoch": 0.8545299353737349, "percentage": 85.46, "elapsed_time": "11:16:44", "remaining_time": "1:55:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 877, "total_steps": 1025, "loss": 0.1278, "learning_rate": 2.800448112625709e-07, "epoch": 0.8555054261675406, "percentage": 85.56, "elapsed_time": "11:17:31", "remaining_time": "1:54:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 878, "total_steps": 1025, "loss": 0.1244, "learning_rate": 2.7634428858242995e-07, "epoch": 0.8564809169613462, "percentage": 85.66, "elapsed_time": "11:18:19", "remaining_time": "1:53:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 879, "total_steps": 1025, "loss": 0.1134, "learning_rate": 2.7266694738625143e-07, "epoch": 0.8574564077551519, "percentage": 85.76, "elapsed_time": "11:19:01", "remaining_time": "1:52:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 880, "total_steps": 1025, "loss": 0.1216, "learning_rate": 2.690128260101069e-07, "epoch": 0.8584318985489574, "percentage": 85.85, "elapsed_time": "11:19:47", "remaining_time": "1:52:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 881, "total_steps": 1025, "loss": 0.1282, "learning_rate": 2.6538196254800393e-07, "epoch": 0.8594073893427631, "percentage": 85.95, "elapsed_time": "11:20:34", "remaining_time": "1:51:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 882, "total_steps": 1025, "loss": 0.1279, "learning_rate": 2.617743948514867e-07, "epoch": 0.8603828801365687, "percentage": 86.05, "elapsed_time": "11:21:19", "remaining_time": "1:50:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 883, "total_steps": 1025, "loss": 0.1186, "learning_rate": 2.5819016052924224e-07, "epoch": 0.8613583709303744, "percentage": 86.15, "elapsed_time": "11:22:06", "remaining_time": "1:49:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 884, "total_steps": 1025, "loss": 0.1162, "learning_rate": 2.5462929694670986e-07, "epoch": 0.86233386172418, "percentage": 86.24, "elapsed_time": "11:22:55", "remaining_time": "1:48:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 885, "total_steps": 1025, "loss": 0.1079, "learning_rate": 2.5109184122568797e-07, "epoch": 0.8633093525179856, "percentage": 86.34, "elapsed_time": "11:23:40", "remaining_time": "1:48:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 886, "total_steps": 1025, "loss": 0.1168, "learning_rate": 2.4757783024395244e-07, "epoch": 0.8642848433117912, "percentage": 86.44, "elapsed_time": "11:24:27", "remaining_time": "1:47:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 887, "total_steps": 1025, "loss": 0.1143, "learning_rate": 2.44087300634866e-07, "epoch": 0.8652603341055969, "percentage": 86.54, "elapsed_time": "11:25:11", "remaining_time": "1:46:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 888, "total_steps": 1025, "loss": 0.1242, "learning_rate": 2.4062028878700074e-07, "epoch": 0.8662358248994025, "percentage": 86.63, "elapsed_time": "11:25:58", "remaining_time": "1:45:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 889, "total_steps": 1025, "loss": 0.1179, "learning_rate": 2.3717683084375832e-07, "epoch": 0.8672113156932082, "percentage": 86.73, "elapsed_time": "11:26:45", "remaining_time": "1:45:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 890, "total_steps": 1025, "loss": 0.1193, "learning_rate": 2.3375696270299093e-07, "epoch": 0.8681868064870137, "percentage": 86.83, "elapsed_time": "11:27:29", "remaining_time": "1:44:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 891, "total_steps": 1025, "loss": 0.1112, "learning_rate": 2.3036072001662829e-07, "epoch": 0.8691622972808194, "percentage": 86.93, "elapsed_time": "11:28:15", "remaining_time": "1:43:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 892, "total_steps": 1025, "loss": 0.1128, "learning_rate": 2.2698813819030802e-07, "epoch": 0.870137788074625, "percentage": 87.02, "elapsed_time": "11:29:01", "remaining_time": "1:42:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 893, "total_steps": 1025, "loss": 0.1186, "learning_rate": 2.2363925238300167e-07, "epoch": 0.8711132788684307, "percentage": 87.12, "elapsed_time": "11:29:46", "remaining_time": "1:41:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 894, "total_steps": 1025, "loss": 0.1136, "learning_rate": 2.2031409750665422e-07, "epoch": 0.8720887696622364, "percentage": 87.22, "elapsed_time": "11:30:35", "remaining_time": "1:41:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 895, "total_steps": 1025, "loss": 0.1179, "learning_rate": 2.170127082258147e-07, "epoch": 0.8730642604560419, "percentage": 87.32, "elapsed_time": "11:31:22", "remaining_time": "1:40:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 896, "total_steps": 1025, "loss": 0.1093, "learning_rate": 2.1373511895727866e-07, "epoch": 0.8740397512498476, "percentage": 87.41, "elapsed_time": "11:32:08", "remaining_time": "1:39:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 897, "total_steps": 1025, "loss": 0.1201, "learning_rate": 2.1048136386972645e-07, "epoch": 0.8750152420436532, "percentage": 87.51, "elapsed_time": "11:32:54", "remaining_time": "1:38:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 898, "total_steps": 1025, "loss": 0.1209, "learning_rate": 2.0725147688337054e-07, "epoch": 0.8759907328374589, "percentage": 87.61, "elapsed_time": "11:33:40", "remaining_time": "1:38:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 899, "total_steps": 1025, "loss": 0.1104, "learning_rate": 2.040454916695972e-07, "epoch": 0.8769662236312645, "percentage": 87.71, "elapsed_time": "11:34:23", "remaining_time": "1:37:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 900, "total_steps": 1025, "loss": 0.1186, "learning_rate": 2.0086344165062054e-07, "epoch": 0.8779417144250701, "percentage": 87.8, "elapsed_time": "11:35:11", "remaining_time": "1:36:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 901, "total_steps": 1025, "loss": 0.1242, "learning_rate": 1.9770535999912967e-07, "epoch": 0.8789172052188757, "percentage": 87.9, "elapsed_time": "11:35:58", "remaining_time": "1:35:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 902, "total_steps": 1025, "loss": 0.1195, "learning_rate": 1.945712796379462e-07, "epoch": 0.8798926960126814, "percentage": 88.0, "elapsed_time": "11:36:46", "remaining_time": "1:35:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 903, "total_steps": 1025, "loss": 0.1191, "learning_rate": 1.914612332396787e-07, "epoch": 0.880868186806487, "percentage": 88.1, "elapsed_time": "11:37:33", "remaining_time": "1:34:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 904, "total_steps": 1025, "loss": 0.1212, "learning_rate": 1.883752532263844e-07, "epoch": 0.8818436776002927, "percentage": 88.2, "elapsed_time": "11:38:21", "remaining_time": "1:33:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 905, "total_steps": 1025, "loss": 0.109, "learning_rate": 1.8531337176922792e-07, "epoch": 0.8828191683940982, "percentage": 88.29, "elapsed_time": "11:39:06", "remaining_time": "1:32:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 906, "total_steps": 1025, "loss": 0.1185, "learning_rate": 1.8227562078814903e-07, "epoch": 0.8837946591879039, "percentage": 88.39, "elapsed_time": "11:39:51", "remaining_time": "1:31:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 907, "total_steps": 1025, "loss": 0.1236, "learning_rate": 1.7926203195152898e-07, "epoch": 0.8847701499817096, "percentage": 88.49, "elapsed_time": "11:40:40", "remaining_time": "1:31:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 908, "total_steps": 1025, "loss": 0.1118, "learning_rate": 1.7627263667585882e-07, "epoch": 0.8857456407755152, "percentage": 88.59, "elapsed_time": "11:41:28", "remaining_time": "1:30:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 909, "total_steps": 1025, "loss": 0.1153, "learning_rate": 1.7330746612541387e-07, "epoch": 0.8867211315693209, "percentage": 88.68, "elapsed_time": "11:42:11", "remaining_time": "1:29:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 910, "total_steps": 1025, "loss": 0.1262, "learning_rate": 1.7036655121192875e-07, "epoch": 0.8876966223631264, "percentage": 88.78, "elapsed_time": "11:42:57", "remaining_time": "1:28:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 911, "total_steps": 1025, "loss": 0.1241, "learning_rate": 1.6744992259427272e-07, "epoch": 0.8886721131569321, "percentage": 88.88, "elapsed_time": "11:43:46", "remaining_time": "1:28:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 912, "total_steps": 1025, "loss": 0.1137, "learning_rate": 1.6455761067813352e-07, "epoch": 0.8896476039507377, "percentage": 88.98, "elapsed_time": "11:44:34", "remaining_time": "1:27:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 913, "total_steps": 1025, "loss": 0.1177, "learning_rate": 1.6168964561569716e-07, "epoch": 0.8906230947445434, "percentage": 89.07, "elapsed_time": "11:45:21", "remaining_time": "1:26:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 914, "total_steps": 1025, "loss": 0.1173, "learning_rate": 1.5884605730533686e-07, "epoch": 0.891598585538349, "percentage": 89.17, "elapsed_time": "11:46:08", "remaining_time": "1:25:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 915, "total_steps": 1025, "loss": 0.1224, "learning_rate": 1.5602687539129745e-07, "epoch": 0.8925740763321546, "percentage": 89.27, "elapsed_time": "11:46:55", "remaining_time": "1:24:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 916, "total_steps": 1025, "loss": 0.119, "learning_rate": 1.5323212926339037e-07, "epoch": 0.8935495671259602, "percentage": 89.37, "elapsed_time": "11:47:40", "remaining_time": "1:24:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 917, "total_steps": 1025, "loss": 0.1137, "learning_rate": 1.504618480566844e-07, "epoch": 0.8945250579197659, "percentage": 89.46, "elapsed_time": "11:48:28", "remaining_time": "1:23:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 918, "total_steps": 1025, "loss": 0.1176, "learning_rate": 1.4771606065120293e-07, "epoch": 0.8955005487135715, "percentage": 89.56, "elapsed_time": "11:49:16", "remaining_time": "1:22:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 919, "total_steps": 1025, "loss": 0.1193, "learning_rate": 1.4499479567162328e-07, "epoch": 0.8964760395073772, "percentage": 89.66, "elapsed_time": "11:50:04", "remaining_time": "1:21:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 920, "total_steps": 1025, "loss": 0.1245, "learning_rate": 1.4229808148697732e-07, "epoch": 0.8974515303011827, "percentage": 89.76, "elapsed_time": "11:50:51", "remaining_time": "1:21:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 921, "total_steps": 1025, "loss": 0.1101, "learning_rate": 1.396259462103572e-07, "epoch": 0.8984270210949884, "percentage": 89.85, "elapsed_time": "11:51:37", "remaining_time": "1:20:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 922, "total_steps": 1025, "loss": 0.1198, "learning_rate": 1.3697841769861996e-07, "epoch": 0.899402511888794, "percentage": 89.95, "elapsed_time": "11:52:23", "remaining_time": "1:19:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 923, "total_steps": 1025, "loss": 0.1172, "learning_rate": 1.3435552355210018e-07, "epoch": 0.9003780026825997, "percentage": 90.05, "elapsed_time": "11:53:10", "remaining_time": "1:18:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 924, "total_steps": 1025, "loss": 0.1248, "learning_rate": 1.3175729111431946e-07, "epoch": 0.9013534934764054, "percentage": 90.15, "elapsed_time": "11:53:57", "remaining_time": "1:18:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 925, "total_steps": 1025, "loss": 0.1157, "learning_rate": 1.2918374747170225e-07, "epoch": 0.9023289842702109, "percentage": 90.24, "elapsed_time": "11:54:44", "remaining_time": "1:17:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 926, "total_steps": 1025, "loss": 0.1212, "learning_rate": 1.266349194532951e-07, "epoch": 0.9033044750640166, "percentage": 90.34, "elapsed_time": "11:55:32", "remaining_time": "1:16:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 927, "total_steps": 1025, "loss": 0.1168, "learning_rate": 1.2411083363048386e-07, "epoch": 0.9042799658578222, "percentage": 90.44, "elapsed_time": "11:56:21", "remaining_time": "1:15:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 928, "total_steps": 1025, "loss": 0.1193, "learning_rate": 1.2161151631671974e-07, "epoch": 0.9052554566516279, "percentage": 90.54, "elapsed_time": "11:57:08", "remaining_time": "1:14:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 929, "total_steps": 1025, "loss": 0.1139, "learning_rate": 1.1913699356724317e-07, "epoch": 0.9062309474454335, "percentage": 90.63, "elapsed_time": "11:57:52", "remaining_time": "1:14:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 930, "total_steps": 1025, "loss": 0.1193, "learning_rate": 1.166872911788125e-07, "epoch": 0.9072064382392391, "percentage": 90.73, "elapsed_time": "11:58:40", "remaining_time": "1:13:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 931, "total_steps": 1025, "loss": 0.1218, "learning_rate": 1.1426243468943582e-07, "epoch": 0.9081819290330447, "percentage": 90.83, "elapsed_time": "11:59:29", "remaining_time": "1:12:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 932, "total_steps": 1025, "loss": 0.1133, "learning_rate": 1.1186244937810315e-07, "epoch": 0.9091574198268504, "percentage": 90.93, "elapsed_time": "12:00:12", "remaining_time": "1:11:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 933, "total_steps": 1025, "loss": 0.1111, "learning_rate": 1.0948736026452495e-07, "epoch": 0.910132910620656, "percentage": 91.02, "elapsed_time": "12:01:00", "remaining_time": "1:11:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 934, "total_steps": 1025, "loss": 0.1219, "learning_rate": 1.071371921088693e-07, "epoch": 0.9111084014144617, "percentage": 91.12, "elapsed_time": "12:01:45", "remaining_time": "1:10:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 935, "total_steps": 1025, "loss": 0.1131, "learning_rate": 1.0481196941150574e-07, "epoch": 0.9120838922082672, "percentage": 91.22, "elapsed_time": "12:02:32", "remaining_time": "1:09:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 936, "total_steps": 1025, "loss": 0.1208, "learning_rate": 1.0251171641274788e-07, "epoch": 0.9130593830020729, "percentage": 91.32, "elapsed_time": "12:03:18", "remaining_time": "1:08:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 937, "total_steps": 1025, "loss": 0.111, "learning_rate": 1.0023645709260233e-07, "epoch": 0.9140348737958786, "percentage": 91.41, "elapsed_time": "12:04:06", "remaining_time": "1:08:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 938, "total_steps": 1025, "loss": 0.1134, "learning_rate": 9.798621517051716e-08, "epoch": 0.9150103645896842, "percentage": 91.51, "elapsed_time": "12:04:53", "remaining_time": "1:07:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 939, "total_steps": 1025, "loss": 0.1184, "learning_rate": 9.576101410513655e-08, "epoch": 0.9159858553834899, "percentage": 91.61, "elapsed_time": "12:05:38", "remaining_time": "1:06:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 940, "total_steps": 1025, "loss": 0.1141, "learning_rate": 9.356087709405465e-08, "epoch": 0.9169613461772954, "percentage": 91.71, "elapsed_time": "12:06:21", "remaining_time": "1:05:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 941, "total_steps": 1025, "loss": 0.1178, "learning_rate": 9.138582707357429e-08, "epoch": 0.9179368369711011, "percentage": 91.8, "elapsed_time": "12:07:07", "remaining_time": "1:04:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 942, "total_steps": 1025, "loss": 0.119, "learning_rate": 8.923588671846784e-08, "epoch": 0.9189123277649067, "percentage": 91.9, "elapsed_time": "12:07:53", "remaining_time": "1:04:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 943, "total_steps": 1025, "loss": 0.1224, "learning_rate": 8.711107844174089e-08, "epoch": 0.9198878185587124, "percentage": 92.0, "elapsed_time": "12:08:41", "remaining_time": "1:03:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 944, "total_steps": 1025, "loss": 0.1184, "learning_rate": 8.501142439439808e-08, "epoch": 0.920863309352518, "percentage": 92.1, "elapsed_time": "12:09:25", "remaining_time": "1:02:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 945, "total_steps": 1025, "loss": 0.0985, "learning_rate": 8.29369464652141e-08, "epoch": 0.9218388001463236, "percentage": 92.2, "elapsed_time": "12:10:12", "remaining_time": "1:01:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 946, "total_steps": 1025, "loss": 0.1102, "learning_rate": 8.088766628050193e-08, "epoch": 0.9228142909401292, "percentage": 92.29, "elapsed_time": "12:10:59", "remaining_time": "1:01:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 947, "total_steps": 1025, "loss": 0.1187, "learning_rate": 7.886360520389158e-08, "epoch": 0.9237897817339349, "percentage": 92.39, "elapsed_time": "12:11:49", "remaining_time": "1:00:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 948, "total_steps": 1025, "loss": 0.113, "learning_rate": 7.686478433610339e-08, "epoch": 0.9247652725277405, "percentage": 92.49, "elapsed_time": "12:12:38", "remaining_time": "0:59:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 949, "total_steps": 1025, "loss": 0.1183, "learning_rate": 7.48912245147318e-08, "epoch": 0.9257407633215462, "percentage": 92.59, "elapsed_time": "12:13:22", "remaining_time": "0:58:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 950, "total_steps": 1025, "loss": 0.1202, "learning_rate": 7.294294631402493e-08, "epoch": 0.9267162541153517, "percentage": 92.68, "elapsed_time": "12:14:13", "remaining_time": "0:57:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 951, "total_steps": 1025, "loss": 0.122, "learning_rate": 7.101997004467203e-08, "epoch": 0.9276917449091574, "percentage": 92.78, "elapsed_time": "12:15:03", "remaining_time": "0:57:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 952, "total_steps": 1025, "loss": 0.1104, "learning_rate": 6.912231575359057e-08, "epoch": 0.9286672357029631, "percentage": 92.88, "elapsed_time": "12:15:48", "remaining_time": "0:56:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 953, "total_steps": 1025, "loss": 0.1186, "learning_rate": 6.725000322371916e-08, "epoch": 0.9296427264967687, "percentage": 92.98, "elapsed_time": "12:16:36", "remaining_time": "0:55:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 954, "total_steps": 1025, "loss": 0.122, "learning_rate": 6.540305197380859e-08, "epoch": 0.9306182172905744, "percentage": 93.07, "elapsed_time": "12:17:23", "remaining_time": "0:54:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 955, "total_steps": 1025, "loss": 0.1136, "learning_rate": 6.358148125822e-08, "epoch": 0.9315937080843799, "percentage": 93.17, "elapsed_time": "12:18:12", "remaining_time": "0:54:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 956, "total_steps": 1025, "loss": 0.1276, "learning_rate": 6.178531006672484e-08, "epoch": 0.9325691988781856, "percentage": 93.27, "elapsed_time": "12:18:55", "remaining_time": "0:53:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 957, "total_steps": 1025, "loss": 0.126, "learning_rate": 6.001455712430492e-08, "epoch": 0.9335446896719912, "percentage": 93.37, "elapsed_time": "12:19:41", "remaining_time": "0:52:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 958, "total_steps": 1025, "loss": 0.1176, "learning_rate": 5.826924089095881e-08, "epoch": 0.9345201804657969, "percentage": 93.46, "elapsed_time": "12:20:25", "remaining_time": "0:51:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 959, "total_steps": 1025, "loss": 0.1208, "learning_rate": 5.654937956150852e-08, "epoch": 0.9354956712596025, "percentage": 93.56, "elapsed_time": "12:21:11", "remaining_time": "0:51:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 960, "total_steps": 1025, "loss": 0.1236, "learning_rate": 5.4854991065410866e-08, "epoch": 0.9364711620534081, "percentage": 93.66, "elapsed_time": "12:21:56", "remaining_time": "0:50:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 961, "total_steps": 1025, "loss": 0.1195, "learning_rate": 5.3186093066568965e-08, "epoch": 0.9374466528472137, "percentage": 93.76, "elapsed_time": "12:22:44", "remaining_time": "0:49:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 962, "total_steps": 1025, "loss": 0.1317, "learning_rate": 5.154270296314878e-08, "epoch": 0.9384221436410194, "percentage": 93.85, "elapsed_time": "12:23:32", "remaining_time": "0:48:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 963, "total_steps": 1025, "loss": 0.1208, "learning_rate": 4.992483788739927e-08, "epoch": 0.939397634434825, "percentage": 93.95, "elapsed_time": "12:24:16", "remaining_time": "0:47:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 964, "total_steps": 1025, "loss": 0.1293, "learning_rate": 4.833251470547084e-08, "epoch": 0.9403731252286307, "percentage": 94.05, "elapsed_time": "12:25:06", "remaining_time": "0:47:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 965, "total_steps": 1025, "loss": 0.1217, "learning_rate": 4.6765750017242206e-08, "epoch": 0.9413486160224362, "percentage": 94.15, "elapsed_time": "12:25:51", "remaining_time": "0:46:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 966, "total_steps": 1025, "loss": 0.118, "learning_rate": 4.5224560156145734e-08, "epoch": 0.9423241068162419, "percentage": 94.24, "elapsed_time": "12:26:34", "remaining_time": "0:45:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 967, "total_steps": 1025, "loss": 0.1145, "learning_rate": 4.370896118899792e-08, "epoch": 0.9432995976100476, "percentage": 94.34, "elapsed_time": "12:27:20", "remaining_time": "0:44:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 968, "total_steps": 1025, "loss": 0.1144, "learning_rate": 4.221896891583144e-08, "epoch": 0.9442750884038532, "percentage": 94.44, "elapsed_time": "12:28:08", "remaining_time": "0:44:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 969, "total_steps": 1025, "loss": 0.11, "learning_rate": 4.0754598869730824e-08, "epoch": 0.9452505791976589, "percentage": 94.54, "elapsed_time": "12:28:54", "remaining_time": "0:43:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 970, "total_steps": 1025, "loss": 0.1246, "learning_rate": 3.931586631667039e-08, "epoch": 0.9462260699914644, "percentage": 94.63, "elapsed_time": "12:29:43", "remaining_time": "0:42:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 971, "total_steps": 1025, "loss": 0.1244, "learning_rate": 3.7902786255354927e-08, "epoch": 0.9472015607852701, "percentage": 94.73, "elapsed_time": "12:30:30", "remaining_time": "0:41:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 972, "total_steps": 1025, "loss": 0.1167, "learning_rate": 3.65153734170634e-08, "epoch": 0.9481770515790757, "percentage": 94.83, "elapsed_time": "12:31:16", "remaining_time": "0:40:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 973, "total_steps": 1025, "loss": 0.1205, "learning_rate": 3.515364226549523e-08, "epoch": 0.9491525423728814, "percentage": 94.93, "elapsed_time": "12:32:01", "remaining_time": "0:40:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 974, "total_steps": 1025, "loss": 0.1223, "learning_rate": 3.381760699662062e-08, "epoch": 0.950128033166687, "percentage": 95.02, "elapsed_time": "12:32:50", "remaining_time": "0:39:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 975, "total_steps": 1025, "loss": 0.1161, "learning_rate": 3.25072815385305e-08, "epoch": 0.9511035239604926, "percentage": 95.12, "elapsed_time": "12:33:37", "remaining_time": "0:38:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 976, "total_steps": 1025, "loss": 0.1129, "learning_rate": 3.1222679551293486e-08, "epoch": 0.9520790147542982, "percentage": 95.22, "elapsed_time": "12:34:20", "remaining_time": "0:37:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 977, "total_steps": 1025, "loss": 0.1191, "learning_rate": 2.996381442681162e-08, "epoch": 0.9530545055481039, "percentage": 95.32, "elapsed_time": "12:35:03", "remaining_time": "0:37:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 978, "total_steps": 1025, "loss": 0.1262, "learning_rate": 2.8730699288682107e-08, "epoch": 0.9540299963419095, "percentage": 95.41, "elapsed_time": "12:35:46", "remaining_time": "0:36:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 979, "total_steps": 1025, "loss": 0.1159, "learning_rate": 2.7523346992060217e-08, "epoch": 0.9550054871357152, "percentage": 95.51, "elapsed_time": "12:36:32", "remaining_time": "0:35:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 980, "total_steps": 1025, "loss": 0.1181, "learning_rate": 2.634177012352468e-08, "epoch": 0.9559809779295207, "percentage": 95.61, "elapsed_time": "12:37:15", "remaining_time": "0:34:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 981, "total_steps": 1025, "loss": 0.1232, "learning_rate": 2.5185981000946657e-08, "epoch": 0.9569564687233264, "percentage": 95.71, "elapsed_time": "12:38:03", "remaining_time": "0:34:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 982, "total_steps": 1025, "loss": 0.1152, "learning_rate": 2.405599167336209e-08, "epoch": 0.9579319595171321, "percentage": 95.8, "elapsed_time": "12:38:50", "remaining_time": "0:33:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 983, "total_steps": 1025, "loss": 0.1192, "learning_rate": 2.295181392084511e-08, "epoch": 0.9589074503109377, "percentage": 95.9, "elapsed_time": "12:39:39", "remaining_time": "0:32:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 984, "total_steps": 1025, "loss": 0.1143, "learning_rate": 2.187345925438594e-08, "epoch": 0.9598829411047434, "percentage": 96.0, "elapsed_time": "12:40:25", "remaining_time": "0:31:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 985, "total_steps": 1025, "loss": 0.1105, "learning_rate": 2.0820938915770417e-08, "epoch": 0.9608584318985489, "percentage": 96.1, "elapsed_time": "12:41:13", "remaining_time": "0:30:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 986, "total_steps": 1025, "loss": 0.1061, "learning_rate": 1.9794263877463138e-08, "epoch": 0.9618339226923546, "percentage": 96.2, "elapsed_time": "12:42:01", "remaining_time": "0:30:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 987, "total_steps": 1025, "loss": 0.1229, "learning_rate": 1.879344484249257e-08, "epoch": 0.9628094134861602, "percentage": 96.29, "elapsed_time": "12:42:46", "remaining_time": "0:29:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 988, "total_steps": 1025, "loss": 0.1178, "learning_rate": 1.781849224434029e-08, "epoch": 0.9637849042799659, "percentage": 96.39, "elapsed_time": "12:43:32", "remaining_time": "0:28:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 989, "total_steps": 1025, "loss": 0.1268, "learning_rate": 1.686941624683164e-08, "epoch": 0.9647603950737715, "percentage": 96.49, "elapsed_time": "12:44:21", "remaining_time": "0:27:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 990, "total_steps": 1025, "loss": 0.1139, "learning_rate": 1.5946226744029402e-08, "epoch": 0.9657358858675771, "percentage": 96.59, "elapsed_time": "12:45:03", "remaining_time": "0:27:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 991, "total_steps": 1025, "loss": 0.117, "learning_rate": 1.504893336013169e-08, "epoch": 0.9667113766613827, "percentage": 96.68, "elapsed_time": "12:45:49", "remaining_time": "0:26:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 992, "total_steps": 1025, "loss": 0.1193, "learning_rate": 1.4177545449370889e-08, "epoch": 0.9676868674551884, "percentage": 96.78, "elapsed_time": "12:46:38", "remaining_time": "0:25:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 993, "total_steps": 1025, "loss": 0.1148, "learning_rate": 1.3332072095916527e-08, "epoch": 0.968662358248994, "percentage": 96.88, "elapsed_time": "12:47:22", "remaining_time": "0:24:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 994, "total_steps": 1025, "loss": 0.1212, "learning_rate": 1.2512522113779235e-08, "epoch": 0.9696378490427997, "percentage": 96.98, "elapsed_time": "12:48:06", "remaining_time": "0:23:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 995, "total_steps": 1025, "loss": 0.1169, "learning_rate": 1.1718904046721657e-08, "epoch": 0.9706133398366052, "percentage": 97.07, "elapsed_time": "12:48:56", "remaining_time": "0:23:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 996, "total_steps": 1025, "loss": 0.1158, "learning_rate": 1.0951226168166574e-08, "epoch": 0.9715888306304109, "percentage": 97.17, "elapsed_time": "12:49:46", "remaining_time": "0:22:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 997, "total_steps": 1025, "loss": 0.119, "learning_rate": 1.0209496481112247e-08, "epoch": 0.9725643214242166, "percentage": 97.27, "elapsed_time": "12:50:34", "remaining_time": "0:21:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 998, "total_steps": 1025, "loss": 0.108, "learning_rate": 9.493722718048326e-09, "epoch": 0.9735398122180222, "percentage": 97.37, "elapsed_time": "12:51:20", "remaining_time": "0:20:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 999, "total_steps": 1025, "loss": 0.1149, "learning_rate": 8.803912340875076e-09, "epoch": 0.9745153030118279, "percentage": 97.46, "elapsed_time": "12:52:05", "remaining_time": "0:20:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1000, "total_steps": 1025, "loss": 0.1229, "learning_rate": 8.140072540826772e-09, "epoch": 0.9754907938056334, "percentage": 97.56, "elapsed_time": "12:52:56", "remaining_time": "0:19:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1000, "total_steps": 1025, "eval_loss": 0.11711173504590988, "epoch": 0.9754907938056334, "percentage": 97.56, "elapsed_time": "12:55:03", "remaining_time": "0:19:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1001, "total_steps": 1025, "loss": 0.1202, "learning_rate": 7.502210238395091e-09, "epoch": 0.9764662845994391, "percentage": 97.66, "elapsed_time": "12:55:50", "remaining_time": "0:18:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1002, "total_steps": 1025, "loss": 0.1206, "learning_rate": 6.890332083258622e-09, "epoch": 0.9774417753932447, "percentage": 97.76, "elapsed_time": "12:56:34", "remaining_time": "0:17:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1003, "total_steps": 1025, "loss": 0.1253, "learning_rate": 6.304444454212077e-09, "epoch": 0.9784172661870504, "percentage": 97.85, "elapsed_time": "12:57:24", "remaining_time": "0:17:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1004, "total_steps": 1025, "loss": 0.115, "learning_rate": 5.7445534591002435e-09, "epoch": 0.979392756980856, "percentage": 97.95, "elapsed_time": "12:58:11", "remaining_time": "0:16:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1005, "total_steps": 1025, "loss": 0.1248, "learning_rate": 5.210664934754972e-09, "epoch": 0.9803682477746616, "percentage": 98.05, "elapsed_time": "12:58:58", "remaining_time": "0:15:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1006, "total_steps": 1025, "loss": 0.1185, "learning_rate": 4.702784446934116e-09, "epoch": 0.9813437385684672, "percentage": 98.15, "elapsed_time": "12:59:45", "remaining_time": "0:14:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1007, "total_steps": 1025, "loss": 0.1221, "learning_rate": 4.220917290262139e-09, "epoch": 0.9823192293622729, "percentage": 98.24, "elapsed_time": "13:00:35", "remaining_time": "0:13:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1008, "total_steps": 1025, "loss": 0.1243, "learning_rate": 3.765068488177093e-09, "epoch": 0.9832947201560785, "percentage": 98.34, "elapsed_time": "13:01:23", "remaining_time": "0:13:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1009, "total_steps": 1025, "loss": 0.1121, "learning_rate": 3.335242792876503e-09, "epoch": 0.9842702109498842, "percentage": 98.44, "elapsed_time": "13:02:09", "remaining_time": "0:12:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1010, "total_steps": 1025, "loss": 0.1296, "learning_rate": 2.931444685269069e-09, "epoch": 0.9852457017436898, "percentage": 98.54, "elapsed_time": "13:02:53", "remaining_time": "0:11:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1011, "total_steps": 1025, "loss": 0.1197, "learning_rate": 2.553678374926649e-09, "epoch": 0.9862211925374954, "percentage": 98.63, "elapsed_time": "13:03:40", "remaining_time": "0:10:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1012, "total_steps": 1025, "loss": 0.1233, "learning_rate": 2.201947800041515e-09, "epoch": 0.9871966833313011, "percentage": 98.73, "elapsed_time": "13:04:25", "remaining_time": "0:10:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1013, "total_steps": 1025, "loss": 0.1102, "learning_rate": 1.8762566273852754e-09, "epoch": 0.9881721741251067, "percentage": 98.83, "elapsed_time": "13:05:11", "remaining_time": "0:09:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1014, "total_steps": 1025, "loss": 0.1282, "learning_rate": 1.576608252269185e-09, "epoch": 0.9891476649189124, "percentage": 98.93, "elapsed_time": "13:05:59", "remaining_time": "0:08:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1015, "total_steps": 1025, "loss": 0.1184, "learning_rate": 1.3030057985108368e-09, "epoch": 0.9901231557127179, "percentage": 99.02, "elapsed_time": "13:06:45", "remaining_time": "0:07:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1016, "total_steps": 1025, "loss": 0.111, "learning_rate": 1.055452118400302e-09, "epoch": 0.9910986465065236, "percentage": 99.12, "elapsed_time": "13:07:33", "remaining_time": "0:06:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1017, "total_steps": 1025, "loss": 0.114, "learning_rate": 8.339497926704299e-10, "epoch": 0.9920741373003292, "percentage": 99.22, "elapsed_time": "13:08:19", "remaining_time": "0:06:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1018, "total_steps": 1025, "loss": 0.1257, "learning_rate": 6.385011304704814e-10, "epoch": 0.9930496280941349, "percentage": 99.32, "elapsed_time": "13:09:05", "remaining_time": "0:05:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1019, "total_steps": 1025, "loss": 0.1147, "learning_rate": 4.691081693411481e-10, "epoch": 0.9940251188879405, "percentage": 99.41, "elapsed_time": "13:09:51", "remaining_time": "0:04:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1020, "total_steps": 1025, "loss": 0.1257, "learning_rate": 3.2577267519484645e-10, "epoch": 0.9950006096817461, "percentage": 99.51, "elapsed_time": "13:10:38", "remaining_time": "0:03:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1021, "total_steps": 1025, "loss": 0.1145, "learning_rate": 2.0849614229601078e-10, "epoch": 0.9959761004755517, "percentage": 99.61, "elapsed_time": "13:11:22", "remaining_time": "0:03:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1022, "total_steps": 1025, "loss": 0.1185, "learning_rate": 1.1727979324527294e-10, "epoch": 0.9969515912693574, "percentage": 99.71, "elapsed_time": "13:12:10", "remaining_time": "0:02:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1023, "total_steps": 1025, "loss": 0.118, "learning_rate": 5.212457896835998e-11, "epoch": 0.997927082063163, "percentage": 99.8, "elapsed_time": "13:12:58", "remaining_time": "0:01:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1024, "total_steps": 1025, "loss": 0.118, "learning_rate": 1.303117870443682e-11, "epoch": 0.9989025728569687, "percentage": 99.9, "elapsed_time": "13:13:41", "remaining_time": "0:00:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1025, "total_steps": 1025, "loss": 0.1208, "learning_rate": 0.0, "epoch": 0.9998780636507743, "percentage": 100.0, "elapsed_time": "13:14:32", "remaining_time": "0:00:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1025, "total_steps": 1025, "epoch": 0.9998780636507743, "percentage": 100.0, "elapsed_time": "13:14:32", "remaining_time": "0:00:00", "throughput": "0.00", "total_tokens": 0}