Goavanto / trainer_log.jsonl
sizhkhy's picture
Upload folder using huggingface_hub
cdbb266 verified
{"current_steps": 1, "total_steps": 2525, "loss": 0.1412, "lr": 3.952569169960474e-07, "epoch": 0.009900990099009901, "percentage": 0.04, "elapsed_time": "0:01:12", "remaining_time": "2 days, 2:33:38"}
{"current_steps": 2, "total_steps": 2525, "loss": 0.1399, "lr": 7.905138339920948e-07, "epoch": 0.019801980198019802, "percentage": 0.08, "elapsed_time": "0:01:42", "remaining_time": "1 day, 11:50:43"}
{"current_steps": 3, "total_steps": 2525, "loss": 0.14, "lr": 1.1857707509881422e-06, "epoch": 0.0297029702970297, "percentage": 0.12, "elapsed_time": "0:02:09", "remaining_time": "1 day, 6:17:23"}
{"current_steps": 4, "total_steps": 2525, "loss": 0.1333, "lr": 1.5810276679841897e-06, "epoch": 0.039603960396039604, "percentage": 0.16, "elapsed_time": "0:02:36", "remaining_time": "1 day, 3:23:34"}
{"current_steps": 5, "total_steps": 2525, "loss": 0.1377, "lr": 1.9762845849802374e-06, "epoch": 0.04950495049504951, "percentage": 0.2, "elapsed_time": "0:03:03", "remaining_time": "1 day, 1:40:23"}
{"current_steps": 6, "total_steps": 2525, "loss": 0.1872, "lr": 2.3715415019762844e-06, "epoch": 0.0594059405940594, "percentage": 0.24, "elapsed_time": "0:03:30", "remaining_time": "1 day, 0:31:19"}
{"current_steps": 7, "total_steps": 2525, "loss": 0.1336, "lr": 2.7667984189723323e-06, "epoch": 0.06930693069306931, "percentage": 0.28, "elapsed_time": "0:03:59", "remaining_time": "23:54:35"}
{"current_steps": 8, "total_steps": 2525, "loss": 0.156, "lr": 3.1620553359683794e-06, "epoch": 0.07920792079207921, "percentage": 0.32, "elapsed_time": "0:04:26", "remaining_time": "23:15:33"}
{"current_steps": 9, "total_steps": 2525, "loss": 0.1615, "lr": 3.5573122529644273e-06, "epoch": 0.0891089108910891, "percentage": 0.36, "elapsed_time": "0:04:53", "remaining_time": "22:45:11"}
{"current_steps": 10, "total_steps": 2525, "loss": 0.1277, "lr": 3.952569169960475e-06, "epoch": 0.09900990099009901, "percentage": 0.4, "elapsed_time": "0:05:19", "remaining_time": "22:20:49"}
{"current_steps": 11, "total_steps": 2525, "loss": 0.156, "lr": 4.347826086956522e-06, "epoch": 0.10891089108910891, "percentage": 0.44, "elapsed_time": "0:05:46", "remaining_time": "22:00:22"}
{"current_steps": 12, "total_steps": 2525, "loss": 0.1454, "lr": 4.743083003952569e-06, "epoch": 0.1188118811881188, "percentage": 0.48, "elapsed_time": "0:06:13", "remaining_time": "21:43:00"}
{"current_steps": 13, "total_steps": 2525, "loss": 0.1014, "lr": 5.138339920948617e-06, "epoch": 0.12871287128712872, "percentage": 0.51, "elapsed_time": "0:06:40", "remaining_time": "21:28:29"}
{"current_steps": 14, "total_steps": 2525, "loss": 0.1573, "lr": 5.533596837944665e-06, "epoch": 0.13861386138613863, "percentage": 0.55, "elapsed_time": "0:07:06", "remaining_time": "21:16:01"}
{"current_steps": 15, "total_steps": 2525, "loss": 0.1043, "lr": 5.928853754940711e-06, "epoch": 0.1485148514851485, "percentage": 0.59, "elapsed_time": "0:07:33", "remaining_time": "21:05:33"}
{"current_steps": 16, "total_steps": 2525, "loss": 0.1517, "lr": 6.324110671936759e-06, "epoch": 0.15841584158415842, "percentage": 0.63, "elapsed_time": "0:08:00", "remaining_time": "20:56:27"}
{"current_steps": 17, "total_steps": 2525, "loss": 0.1285, "lr": 6.719367588932807e-06, "epoch": 0.16831683168316833, "percentage": 0.67, "elapsed_time": "0:08:27", "remaining_time": "20:48:12"}
{"current_steps": 18, "total_steps": 2525, "loss": 0.1036, "lr": 7.1146245059288545e-06, "epoch": 0.1782178217821782, "percentage": 0.71, "elapsed_time": "0:08:54", "remaining_time": "20:40:36"}
{"current_steps": 19, "total_steps": 2525, "loss": 0.1052, "lr": 7.509881422924901e-06, "epoch": 0.18811881188118812, "percentage": 0.75, "elapsed_time": "0:09:28", "remaining_time": "20:50:00"}
{"current_steps": 20, "total_steps": 2525, "loss": 0.0883, "lr": 7.90513833992095e-06, "epoch": 0.19801980198019803, "percentage": 0.79, "elapsed_time": "0:09:55", "remaining_time": "20:42:54"}
{"current_steps": 21, "total_steps": 2525, "loss": 0.1041, "lr": 8.300395256916998e-06, "epoch": 0.2079207920792079, "percentage": 0.83, "elapsed_time": "0:10:22", "remaining_time": "20:36:24"}
{"current_steps": 22, "total_steps": 2525, "loss": 0.0877, "lr": 8.695652173913044e-06, "epoch": 0.21782178217821782, "percentage": 0.87, "elapsed_time": "0:10:48", "remaining_time": "20:30:28"}
{"current_steps": 23, "total_steps": 2525, "loss": 0.1186, "lr": 9.090909090909091e-06, "epoch": 0.22772277227722773, "percentage": 0.91, "elapsed_time": "0:11:15", "remaining_time": "20:24:14"}
{"current_steps": 24, "total_steps": 2525, "loss": 0.1149, "lr": 9.486166007905138e-06, "epoch": 0.2376237623762376, "percentage": 0.95, "elapsed_time": "0:11:41", "remaining_time": "20:18:30"}
{"current_steps": 25, "total_steps": 2525, "loss": 0.1227, "lr": 9.881422924901186e-06, "epoch": 0.24752475247524752, "percentage": 0.99, "elapsed_time": "0:12:08", "remaining_time": "20:13:20"}
{"current_steps": 25, "total_steps": 2525, "eval_loss": 0.10737022757530212, "epoch": 0.24752475247524752, "percentage": 0.99, "elapsed_time": "0:12:30", "remaining_time": "20:50:02"}
{"current_steps": 26, "total_steps": 2525, "loss": 0.0986, "lr": 1.0276679841897234e-05, "epoch": 0.25742574257425743, "percentage": 1.03, "elapsed_time": "0:12:56", "remaining_time": "20:43:38"}
{"current_steps": 27, "total_steps": 2525, "loss": 0.0932, "lr": 1.0671936758893281e-05, "epoch": 0.26732673267326734, "percentage": 1.07, "elapsed_time": "0:13:22", "remaining_time": "20:37:41"}
{"current_steps": 28, "total_steps": 2525, "loss": 0.091, "lr": 1.106719367588933e-05, "epoch": 0.27722772277227725, "percentage": 1.11, "elapsed_time": "0:13:49", "remaining_time": "20:32:10"}
{"current_steps": 29, "total_steps": 2525, "loss": 0.095, "lr": 1.1462450592885376e-05, "epoch": 0.2871287128712871, "percentage": 1.15, "elapsed_time": "0:14:15", "remaining_time": "20:26:56"}
{"current_steps": 30, "total_steps": 2525, "loss": 0.0587, "lr": 1.1857707509881423e-05, "epoch": 0.297029702970297, "percentage": 1.19, "elapsed_time": "0:14:41", "remaining_time": "20:22:05"}
{"current_steps": 31, "total_steps": 2525, "loss": 0.0788, "lr": 1.225296442687747e-05, "epoch": 0.3069306930693069, "percentage": 1.23, "elapsed_time": "0:15:08", "remaining_time": "20:17:35"}
{"current_steps": 32, "total_steps": 2525, "loss": 0.0967, "lr": 1.2648221343873517e-05, "epoch": 0.31683168316831684, "percentage": 1.27, "elapsed_time": "0:15:34", "remaining_time": "20:13:15"}
{"current_steps": 33, "total_steps": 2525, "loss": 0.0857, "lr": 1.3043478260869566e-05, "epoch": 0.32673267326732675, "percentage": 1.31, "elapsed_time": "0:16:00", "remaining_time": "20:09:06"}
{"current_steps": 34, "total_steps": 2525, "loss": 0.1421, "lr": 1.3438735177865614e-05, "epoch": 0.33663366336633666, "percentage": 1.35, "elapsed_time": "0:16:26", "remaining_time": "20:05:07"}
{"current_steps": 35, "total_steps": 2525, "loss": 0.0773, "lr": 1.383399209486166e-05, "epoch": 0.3465346534653465, "percentage": 1.39, "elapsed_time": "0:16:53", "remaining_time": "20:01:24"}
{"current_steps": 36, "total_steps": 2525, "loss": 0.0613, "lr": 1.4229249011857709e-05, "epoch": 0.3564356435643564, "percentage": 1.43, "elapsed_time": "0:17:19", "remaining_time": "19:57:52"}
{"current_steps": 37, "total_steps": 2525, "loss": 0.0902, "lr": 1.4624505928853754e-05, "epoch": 0.36633663366336633, "percentage": 1.47, "elapsed_time": "0:17:46", "remaining_time": "19:54:41"}
{"current_steps": 38, "total_steps": 2525, "loss": 0.0907, "lr": 1.5019762845849802e-05, "epoch": 0.37623762376237624, "percentage": 1.5, "elapsed_time": "0:18:12", "remaining_time": "19:51:24"}
{"current_steps": 39, "total_steps": 2525, "loss": 0.0667, "lr": 1.541501976284585e-05, "epoch": 0.38613861386138615, "percentage": 1.54, "elapsed_time": "0:18:38", "remaining_time": "19:48:20"}
{"current_steps": 40, "total_steps": 2525, "loss": 0.0501, "lr": 1.58102766798419e-05, "epoch": 0.39603960396039606, "percentage": 1.58, "elapsed_time": "0:19:04", "remaining_time": "19:45:25"}
{"current_steps": 41, "total_steps": 2525, "loss": 0.074, "lr": 1.6205533596837947e-05, "epoch": 0.40594059405940597, "percentage": 1.62, "elapsed_time": "0:19:33", "remaining_time": "19:44:51"}
{"current_steps": 42, "total_steps": 2525, "loss": 0.0791, "lr": 1.6600790513833996e-05, "epoch": 0.4158415841584158, "percentage": 1.66, "elapsed_time": "0:19:59", "remaining_time": "19:42:09"}
{"current_steps": 43, "total_steps": 2525, "loss": 0.075, "lr": 1.699604743083004e-05, "epoch": 0.42574257425742573, "percentage": 1.7, "elapsed_time": "0:20:26", "remaining_time": "19:39:32"}
{"current_steps": 44, "total_steps": 2525, "loss": 0.0611, "lr": 1.739130434782609e-05, "epoch": 0.43564356435643564, "percentage": 1.74, "elapsed_time": "0:20:52", "remaining_time": "19:37:00"}
{"current_steps": 45, "total_steps": 2525, "loss": 0.0449, "lr": 1.7786561264822134e-05, "epoch": 0.44554455445544555, "percentage": 1.78, "elapsed_time": "0:21:18", "remaining_time": "19:34:29"}
{"current_steps": 46, "total_steps": 2525, "loss": 0.038, "lr": 1.8181818181818182e-05, "epoch": 0.45544554455445546, "percentage": 1.82, "elapsed_time": "0:21:44", "remaining_time": "19:32:03"}
{"current_steps": 47, "total_steps": 2525, "loss": 0.1017, "lr": 1.857707509881423e-05, "epoch": 0.46534653465346537, "percentage": 1.86, "elapsed_time": "0:22:11", "remaining_time": "19:29:46"}
{"current_steps": 48, "total_steps": 2525, "loss": 0.0709, "lr": 1.8972332015810275e-05, "epoch": 0.4752475247524752, "percentage": 1.9, "elapsed_time": "0:22:37", "remaining_time": "19:27:32"}
{"current_steps": 49, "total_steps": 2525, "loss": 0.0581, "lr": 1.9367588932806324e-05, "epoch": 0.48514851485148514, "percentage": 1.94, "elapsed_time": "0:23:03", "remaining_time": "19:25:33"}
{"current_steps": 50, "total_steps": 2525, "loss": 0.0553, "lr": 1.9762845849802372e-05, "epoch": 0.49504950495049505, "percentage": 1.98, "elapsed_time": "0:23:30", "remaining_time": "19:23:31"}
{"current_steps": 50, "total_steps": 2525, "eval_loss": 0.055061474442481995, "epoch": 0.49504950495049505, "percentage": 1.98, "elapsed_time": "0:23:51", "remaining_time": "19:40:47"}
{"current_steps": 51, "total_steps": 2525, "loss": 0.085, "lr": 2.015810276679842e-05, "epoch": 0.504950495049505, "percentage": 2.02, "elapsed_time": "0:24:17", "remaining_time": "19:38:25"}
{"current_steps": 52, "total_steps": 2525, "loss": 0.0466, "lr": 2.055335968379447e-05, "epoch": 0.5148514851485149, "percentage": 2.06, "elapsed_time": "0:24:43", "remaining_time": "19:36:03"}
{"current_steps": 53, "total_steps": 2525, "loss": 0.037, "lr": 2.0948616600790517e-05, "epoch": 0.5247524752475248, "percentage": 2.1, "elapsed_time": "0:25:10", "remaining_time": "19:33:50"}
{"current_steps": 54, "total_steps": 2525, "loss": 0.0542, "lr": 2.1343873517786562e-05, "epoch": 0.5346534653465347, "percentage": 2.14, "elapsed_time": "0:25:36", "remaining_time": "19:31:42"}
{"current_steps": 55, "total_steps": 2525, "loss": 0.0335, "lr": 2.173913043478261e-05, "epoch": 0.5445544554455446, "percentage": 2.18, "elapsed_time": "0:26:02", "remaining_time": "19:29:29"}
{"current_steps": 56, "total_steps": 2525, "loss": 0.0348, "lr": 2.213438735177866e-05, "epoch": 0.5544554455445545, "percentage": 2.22, "elapsed_time": "0:26:28", "remaining_time": "19:27:27"}
{"current_steps": 57, "total_steps": 2525, "loss": 0.0568, "lr": 2.2529644268774703e-05, "epoch": 0.5643564356435643, "percentage": 2.26, "elapsed_time": "0:26:54", "remaining_time": "19:25:25"}
{"current_steps": 58, "total_steps": 2525, "loss": 0.0365, "lr": 2.2924901185770752e-05, "epoch": 0.5742574257425742, "percentage": 2.3, "elapsed_time": "0:27:21", "remaining_time": "19:23:26"}
{"current_steps": 59, "total_steps": 2525, "loss": 0.0464, "lr": 2.33201581027668e-05, "epoch": 0.5841584158415841, "percentage": 2.34, "elapsed_time": "0:27:47", "remaining_time": "19:21:34"}
{"current_steps": 60, "total_steps": 2525, "loss": 0.0548, "lr": 2.3715415019762845e-05, "epoch": 0.594059405940594, "percentage": 2.38, "elapsed_time": "0:28:13", "remaining_time": "19:19:50"}
{"current_steps": 61, "total_steps": 2525, "loss": 0.0431, "lr": 2.4110671936758893e-05, "epoch": 0.6039603960396039, "percentage": 2.42, "elapsed_time": "0:28:40", "remaining_time": "19:18:06"}
{"current_steps": 62, "total_steps": 2525, "loss": 0.0459, "lr": 2.450592885375494e-05, "epoch": 0.6138613861386139, "percentage": 2.46, "elapsed_time": "0:29:06", "remaining_time": "19:16:25"}
{"current_steps": 63, "total_steps": 2525, "loss": 0.0364, "lr": 2.490118577075099e-05, "epoch": 0.6237623762376238, "percentage": 2.5, "elapsed_time": "0:29:32", "remaining_time": "19:14:46"}
{"current_steps": 64, "total_steps": 2525, "loss": 0.0618, "lr": 2.5296442687747035e-05, "epoch": 0.6336633663366337, "percentage": 2.53, "elapsed_time": "0:29:59", "remaining_time": "19:13:07"}
{"current_steps": 65, "total_steps": 2525, "loss": 0.0401, "lr": 2.5691699604743087e-05, "epoch": 0.6435643564356436, "percentage": 2.57, "elapsed_time": "0:30:25", "remaining_time": "19:11:32"}
{"current_steps": 66, "total_steps": 2525, "loss": 0.0238, "lr": 2.608695652173913e-05, "epoch": 0.6534653465346535, "percentage": 2.61, "elapsed_time": "0:30:51", "remaining_time": "19:10:00"}
{"current_steps": 67, "total_steps": 2525, "loss": 0.0494, "lr": 2.6482213438735183e-05, "epoch": 0.6633663366336634, "percentage": 2.65, "elapsed_time": "0:31:18", "remaining_time": "19:08:23"}
{"current_steps": 68, "total_steps": 2525, "loss": 0.0373, "lr": 2.6877470355731228e-05, "epoch": 0.6732673267326733, "percentage": 2.69, "elapsed_time": "0:31:44", "remaining_time": "19:06:51"}
{"current_steps": 69, "total_steps": 2525, "loss": 0.0346, "lr": 2.7272727272727273e-05, "epoch": 0.6831683168316832, "percentage": 2.73, "elapsed_time": "0:32:10", "remaining_time": "19:05:20"}
{"current_steps": 70, "total_steps": 2525, "loss": 0.0278, "lr": 2.766798418972332e-05, "epoch": 0.693069306930693, "percentage": 2.77, "elapsed_time": "0:32:36", "remaining_time": "19:03:46"}
{"current_steps": 71, "total_steps": 2525, "loss": 0.0383, "lr": 2.8063241106719366e-05, "epoch": 0.7029702970297029, "percentage": 2.81, "elapsed_time": "0:33:03", "remaining_time": "19:02:20"}
{"current_steps": 72, "total_steps": 2525, "loss": 0.0565, "lr": 2.8458498023715418e-05, "epoch": 0.7128712871287128, "percentage": 2.85, "elapsed_time": "0:33:29", "remaining_time": "19:00:55"}
{"current_steps": 73, "total_steps": 2525, "loss": 0.0449, "lr": 2.8853754940711463e-05, "epoch": 0.7227722772277227, "percentage": 2.89, "elapsed_time": "0:33:55", "remaining_time": "18:59:37"}
{"current_steps": 74, "total_steps": 2525, "loss": 0.0378, "lr": 2.9249011857707508e-05, "epoch": 0.7326732673267327, "percentage": 2.93, "elapsed_time": "0:34:22", "remaining_time": "18:58:17"}
{"current_steps": 75, "total_steps": 2525, "loss": 0.0338, "lr": 2.964426877470356e-05, "epoch": 0.7425742574257426, "percentage": 2.97, "elapsed_time": "0:34:48", "remaining_time": "18:57:00"}
{"current_steps": 75, "total_steps": 2525, "eval_loss": 0.03502385690808296, "epoch": 0.7425742574257426, "percentage": 2.97, "elapsed_time": "0:35:09", "remaining_time": "19:08:23"}
{"current_steps": 76, "total_steps": 2525, "loss": 0.0317, "lr": 3.0039525691699605e-05, "epoch": 0.7524752475247525, "percentage": 3.01, "elapsed_time": "0:35:35", "remaining_time": "19:06:56"}
{"current_steps": 77, "total_steps": 2525, "loss": 0.0396, "lr": 3.0434782608695656e-05, "epoch": 0.7623762376237624, "percentage": 3.05, "elapsed_time": "0:36:01", "remaining_time": "19:05:27"}
{"current_steps": 78, "total_steps": 2525, "loss": 0.0297, "lr": 3.08300395256917e-05, "epoch": 0.7722772277227723, "percentage": 3.09, "elapsed_time": "0:36:27", "remaining_time": "19:04:00"}
{"current_steps": 79, "total_steps": 2525, "loss": 0.0414, "lr": 3.1225296442687746e-05, "epoch": 0.7821782178217822, "percentage": 3.13, "elapsed_time": "0:36:54", "remaining_time": "19:02:35"}
{"current_steps": 80, "total_steps": 2525, "loss": 0.0453, "lr": 3.16205533596838e-05, "epoch": 0.7920792079207921, "percentage": 3.17, "elapsed_time": "0:37:20", "remaining_time": "19:01:12"}
{"current_steps": 81, "total_steps": 2525, "loss": 0.0269, "lr": 3.201581027667984e-05, "epoch": 0.801980198019802, "percentage": 3.21, "elapsed_time": "0:37:46", "remaining_time": "18:59:54"}
{"current_steps": 82, "total_steps": 2525, "loss": 0.0364, "lr": 3.2411067193675894e-05, "epoch": 0.8118811881188119, "percentage": 3.25, "elapsed_time": "0:38:12", "remaining_time": "18:58:34"}
{"current_steps": 83, "total_steps": 2525, "loss": 0.0285, "lr": 3.280632411067194e-05, "epoch": 0.8217821782178217, "percentage": 3.29, "elapsed_time": "0:38:39", "remaining_time": "18:57:19"}
{"current_steps": 84, "total_steps": 2525, "loss": 0.0244, "lr": 3.320158102766799e-05, "epoch": 0.8316831683168316, "percentage": 3.33, "elapsed_time": "0:39:05", "remaining_time": "18:56:01"}
{"current_steps": 85, "total_steps": 2525, "loss": 0.0293, "lr": 3.3596837944664036e-05, "epoch": 0.8415841584158416, "percentage": 3.37, "elapsed_time": "0:39:31", "remaining_time": "18:54:45"}
{"current_steps": 86, "total_steps": 2525, "loss": 0.0378, "lr": 3.399209486166008e-05, "epoch": 0.8514851485148515, "percentage": 3.41, "elapsed_time": "0:39:58", "remaining_time": "18:53:33"}
{"current_steps": 87, "total_steps": 2525, "loss": 0.0265, "lr": 3.438735177865613e-05, "epoch": 0.8613861386138614, "percentage": 3.45, "elapsed_time": "0:40:24", "remaining_time": "18:52:26"}
{"current_steps": 88, "total_steps": 2525, "loss": 0.0363, "lr": 3.478260869565218e-05, "epoch": 0.8712871287128713, "percentage": 3.49, "elapsed_time": "0:40:51", "remaining_time": "18:51:16"}
{"current_steps": 89, "total_steps": 2525, "loss": 0.0351, "lr": 3.517786561264822e-05, "epoch": 0.8811881188118812, "percentage": 3.52, "elapsed_time": "0:41:17", "remaining_time": "18:50:06"}
{"current_steps": 90, "total_steps": 2525, "loss": 0.0314, "lr": 3.557312252964427e-05, "epoch": 0.8910891089108911, "percentage": 3.56, "elapsed_time": "0:41:43", "remaining_time": "18:48:57"}
{"current_steps": 91, "total_steps": 2525, "loss": 0.0277, "lr": 3.596837944664031e-05, "epoch": 0.900990099009901, "percentage": 3.6, "elapsed_time": "0:42:10", "remaining_time": "18:47:50"}
{"current_steps": 92, "total_steps": 2525, "loss": 0.025, "lr": 3.6363636363636364e-05, "epoch": 0.9108910891089109, "percentage": 3.64, "elapsed_time": "0:42:36", "remaining_time": "18:46:42"}
{"current_steps": 93, "total_steps": 2525, "loss": 0.0406, "lr": 3.675889328063241e-05, "epoch": 0.9207920792079208, "percentage": 3.68, "elapsed_time": "0:43:02", "remaining_time": "18:45:37"}
{"current_steps": 94, "total_steps": 2525, "loss": 0.0317, "lr": 3.715415019762846e-05, "epoch": 0.9306930693069307, "percentage": 3.72, "elapsed_time": "0:43:28", "remaining_time": "18:44:30"}
{"current_steps": 95, "total_steps": 2525, "loss": 0.0363, "lr": 3.7549407114624506e-05, "epoch": 0.9405940594059405, "percentage": 3.76, "elapsed_time": "0:43:55", "remaining_time": "18:43:27"}
{"current_steps": 96, "total_steps": 2525, "loss": 0.0181, "lr": 3.794466403162055e-05, "epoch": 0.9504950495049505, "percentage": 3.8, "elapsed_time": "0:44:21", "remaining_time": "18:42:23"}
{"current_steps": 97, "total_steps": 2525, "loss": 0.0296, "lr": 3.83399209486166e-05, "epoch": 0.9603960396039604, "percentage": 3.84, "elapsed_time": "0:44:48", "remaining_time": "18:41:23"}
{"current_steps": 98, "total_steps": 2525, "loss": 0.0213, "lr": 3.873517786561265e-05, "epoch": 0.9702970297029703, "percentage": 3.88, "elapsed_time": "0:45:14", "remaining_time": "18:40:22"}
{"current_steps": 99, "total_steps": 2525, "loss": 0.0294, "lr": 3.91304347826087e-05, "epoch": 0.9801980198019802, "percentage": 3.92, "elapsed_time": "0:45:40", "remaining_time": "18:39:21"}
{"current_steps": 100, "total_steps": 2525, "loss": 0.0302, "lr": 3.9525691699604744e-05, "epoch": 0.9900990099009901, "percentage": 3.96, "elapsed_time": "0:46:06", "remaining_time": "18:38:15"}
{"current_steps": 100, "total_steps": 2525, "eval_loss": 0.027701813727617264, "epoch": 0.9900990099009901, "percentage": 3.96, "elapsed_time": "0:46:27", "remaining_time": "18:46:44"}
{"current_steps": 101, "total_steps": 2525, "loss": 0.0226, "lr": 3.9920948616600796e-05, "epoch": 1.0, "percentage": 4.0, "elapsed_time": "0:46:44", "remaining_time": "18:41:53"}
{"current_steps": 102, "total_steps": 2525, "loss": 0.023, "lr": 4.031620553359684e-05, "epoch": 1.00990099009901, "percentage": 4.04, "elapsed_time": "0:47:11", "remaining_time": "18:40:56"}
{"current_steps": 103, "total_steps": 2525, "loss": 0.0296, "lr": 4.0711462450592886e-05, "epoch": 1.0198019801980198, "percentage": 4.08, "elapsed_time": "0:47:37", "remaining_time": "18:39:52"}
{"current_steps": 104, "total_steps": 2525, "loss": 0.0203, "lr": 4.110671936758894e-05, "epoch": 1.0297029702970297, "percentage": 4.12, "elapsed_time": "0:48:03", "remaining_time": "18:38:51"}
{"current_steps": 105, "total_steps": 2525, "loss": 0.0235, "lr": 4.150197628458498e-05, "epoch": 1.0396039603960396, "percentage": 4.16, "elapsed_time": "0:48:29", "remaining_time": "18:37:47"}
{"current_steps": 106, "total_steps": 2525, "loss": 0.0296, "lr": 4.1897233201581034e-05, "epoch": 1.0495049504950495, "percentage": 4.2, "elapsed_time": "0:48:56", "remaining_time": "18:36:45"}
{"current_steps": 107, "total_steps": 2525, "loss": 0.0272, "lr": 4.229249011857708e-05, "epoch": 1.0594059405940595, "percentage": 4.24, "elapsed_time": "0:49:22", "remaining_time": "18:35:43"}
{"current_steps": 108, "total_steps": 2525, "loss": 0.0341, "lr": 4.2687747035573124e-05, "epoch": 1.0693069306930694, "percentage": 4.28, "elapsed_time": "0:49:48", "remaining_time": "18:34:43"}
{"current_steps": 109, "total_steps": 2525, "loss": 0.0355, "lr": 4.3083003952569175e-05, "epoch": 1.0792079207920793, "percentage": 4.32, "elapsed_time": "0:50:14", "remaining_time": "18:33:44"}
{"current_steps": 110, "total_steps": 2525, "loss": 0.03, "lr": 4.347826086956522e-05, "epoch": 1.0891089108910892, "percentage": 4.36, "elapsed_time": "0:50:41", "remaining_time": "18:32:46"}
{"current_steps": 111, "total_steps": 2525, "loss": 0.0196, "lr": 4.387351778656127e-05, "epoch": 1.099009900990099, "percentage": 4.4, "elapsed_time": "0:51:07", "remaining_time": "18:31:51"}
{"current_steps": 112, "total_steps": 2525, "loss": 0.0168, "lr": 4.426877470355732e-05, "epoch": 1.108910891089109, "percentage": 4.44, "elapsed_time": "0:51:33", "remaining_time": "18:30:53"}
{"current_steps": 113, "total_steps": 2525, "loss": 0.0251, "lr": 4.466403162055336e-05, "epoch": 1.118811881188119, "percentage": 4.48, "elapsed_time": "0:52:00", "remaining_time": "18:29:59"}
{"current_steps": 114, "total_steps": 2525, "loss": 0.0244, "lr": 4.505928853754941e-05, "epoch": 1.1287128712871288, "percentage": 4.51, "elapsed_time": "0:52:26", "remaining_time": "18:29:03"}
{"current_steps": 115, "total_steps": 2525, "loss": 0.0213, "lr": 4.545454545454546e-05, "epoch": 1.1386138613861387, "percentage": 4.55, "elapsed_time": "0:52:52", "remaining_time": "18:28:08"}
{"current_steps": 116, "total_steps": 2525, "loss": 0.0206, "lr": 4.5849802371541504e-05, "epoch": 1.1485148514851484, "percentage": 4.59, "elapsed_time": "0:53:19", "remaining_time": "18:27:15"}
{"current_steps": 117, "total_steps": 2525, "loss": 0.0346, "lr": 4.624505928853755e-05, "epoch": 1.1584158415841583, "percentage": 4.63, "elapsed_time": "0:53:45", "remaining_time": "18:26:23"}
{"current_steps": 118, "total_steps": 2525, "loss": 0.0259, "lr": 4.66403162055336e-05, "epoch": 1.1683168316831682, "percentage": 4.67, "elapsed_time": "0:54:11", "remaining_time": "18:25:28"}
{"current_steps": 119, "total_steps": 2525, "loss": 0.0248, "lr": 4.7035573122529645e-05, "epoch": 1.1782178217821782, "percentage": 4.71, "elapsed_time": "0:54:37", "remaining_time": "18:24:35"}
{"current_steps": 120, "total_steps": 2525, "loss": 0.0243, "lr": 4.743083003952569e-05, "epoch": 1.188118811881188, "percentage": 4.75, "elapsed_time": "0:55:04", "remaining_time": "18:23:43"}
{"current_steps": 121, "total_steps": 2525, "loss": 0.0211, "lr": 4.782608695652174e-05, "epoch": 1.198019801980198, "percentage": 4.79, "elapsed_time": "0:55:30", "remaining_time": "18:22:53"}
{"current_steps": 122, "total_steps": 2525, "loss": 0.0395, "lr": 4.822134387351779e-05, "epoch": 1.2079207920792079, "percentage": 4.83, "elapsed_time": "0:55:56", "remaining_time": "18:22:00"}
{"current_steps": 123, "total_steps": 2525, "loss": 0.0343, "lr": 4.861660079051384e-05, "epoch": 1.2178217821782178, "percentage": 4.87, "elapsed_time": "0:56:23", "remaining_time": "18:21:07"}
{"current_steps": 124, "total_steps": 2525, "loss": 0.0269, "lr": 4.901185770750988e-05, "epoch": 1.2277227722772277, "percentage": 4.91, "elapsed_time": "0:56:49", "remaining_time": "18:20:17"}
{"current_steps": 125, "total_steps": 2525, "loss": 0.0373, "lr": 4.940711462450593e-05, "epoch": 1.2376237623762376, "percentage": 4.95, "elapsed_time": "0:57:15", "remaining_time": "18:19:27"}
{"current_steps": 125, "total_steps": 2525, "eval_loss": 0.025583934038877487, "epoch": 1.2376237623762376, "percentage": 4.95, "elapsed_time": "0:57:36", "remaining_time": "18:26:09"}
{"current_steps": 126, "total_steps": 2525, "loss": 0.0305, "lr": 4.980237154150198e-05, "epoch": 1.2475247524752475, "percentage": 4.99, "elapsed_time": "0:58:03", "remaining_time": "18:25:16"}
{"current_steps": 127, "total_steps": 2525, "loss": 0.0171, "lr": 5.0197628458498025e-05, "epoch": 1.2574257425742574, "percentage": 5.03, "elapsed_time": "0:58:29", "remaining_time": "18:24:23"}
{"current_steps": 128, "total_steps": 2525, "loss": 0.0238, "lr": 5.059288537549407e-05, "epoch": 1.2673267326732673, "percentage": 5.07, "elapsed_time": "0:58:55", "remaining_time": "18:23:28"}
{"current_steps": 129, "total_steps": 2525, "loss": 0.0296, "lr": 5.098814229249013e-05, "epoch": 1.2772277227722773, "percentage": 5.11, "elapsed_time": "0:59:21", "remaining_time": "18:22:37"}
{"current_steps": 130, "total_steps": 2525, "loss": 0.0246, "lr": 5.138339920948617e-05, "epoch": 1.2871287128712872, "percentage": 5.15, "elapsed_time": "0:59:48", "remaining_time": "18:21:44"}
{"current_steps": 131, "total_steps": 2525, "loss": 0.0339, "lr": 5.177865612648222e-05, "epoch": 1.297029702970297, "percentage": 5.19, "elapsed_time": "1:00:14", "remaining_time": "18:20:53"}
{"current_steps": 132, "total_steps": 2525, "loss": 0.0181, "lr": 5.217391304347826e-05, "epoch": 1.306930693069307, "percentage": 5.23, "elapsed_time": "1:00:40", "remaining_time": "18:20:01"}
{"current_steps": 133, "total_steps": 2525, "loss": 0.0307, "lr": 5.256916996047431e-05, "epoch": 1.316831683168317, "percentage": 5.27, "elapsed_time": "1:01:07", "remaining_time": "18:19:28"}
{"current_steps": 134, "total_steps": 2525, "loss": 0.0215, "lr": 5.2964426877470366e-05, "epoch": 1.3267326732673268, "percentage": 5.31, "elapsed_time": "1:01:34", "remaining_time": "18:18:37"}
{"current_steps": 135, "total_steps": 2525, "loss": 0.0252, "lr": 5.335968379446641e-05, "epoch": 1.3366336633663367, "percentage": 5.35, "elapsed_time": "1:02:00", "remaining_time": "18:17:46"}
{"current_steps": 136, "total_steps": 2525, "loss": 0.0284, "lr": 5.3754940711462456e-05, "epoch": 1.3465346534653464, "percentage": 5.39, "elapsed_time": "1:02:26", "remaining_time": "18:16:58"}
{"current_steps": 137, "total_steps": 2525, "loss": 0.0336, "lr": 5.41501976284585e-05, "epoch": 1.3564356435643563, "percentage": 5.43, "elapsed_time": "1:02:53", "remaining_time": "18:16:09"}
{"current_steps": 138, "total_steps": 2525, "loss": 0.0241, "lr": 5.4545454545454546e-05, "epoch": 1.3663366336633662, "percentage": 5.47, "elapsed_time": "1:03:19", "remaining_time": "18:15:20"}
{"current_steps": 139, "total_steps": 2525, "loss": 0.0239, "lr": 5.49407114624506e-05, "epoch": 1.3762376237623761, "percentage": 5.5, "elapsed_time": "1:03:45", "remaining_time": "18:14:31"}
{"current_steps": 140, "total_steps": 2525, "loss": 0.0342, "lr": 5.533596837944664e-05, "epoch": 1.386138613861386, "percentage": 5.54, "elapsed_time": "1:04:12", "remaining_time": "18:13:43"}
{"current_steps": 141, "total_steps": 2525, "loss": 0.0186, "lr": 5.573122529644269e-05, "epoch": 1.396039603960396, "percentage": 5.58, "elapsed_time": "1:04:38", "remaining_time": "18:12:56"}
{"current_steps": 142, "total_steps": 2525, "loss": 0.0244, "lr": 5.612648221343873e-05, "epoch": 1.4059405940594059, "percentage": 5.62, "elapsed_time": "1:05:04", "remaining_time": "18:12:09"}
{"current_steps": 143, "total_steps": 2525, "loss": 0.0179, "lr": 5.652173913043478e-05, "epoch": 1.4158415841584158, "percentage": 5.66, "elapsed_time": "1:05:31", "remaining_time": "18:11:22"}
{"current_steps": 144, "total_steps": 2525, "loss": 0.0216, "lr": 5.6916996047430836e-05, "epoch": 1.4257425742574257, "percentage": 5.7, "elapsed_time": "1:05:57", "remaining_time": "18:10:36"}
{"current_steps": 145, "total_steps": 2525, "loss": 0.0171, "lr": 5.731225296442688e-05, "epoch": 1.4356435643564356, "percentage": 5.74, "elapsed_time": "1:06:23", "remaining_time": "18:09:48"}
{"current_steps": 146, "total_steps": 2525, "loss": 0.0231, "lr": 5.7707509881422926e-05, "epoch": 1.4455445544554455, "percentage": 5.78, "elapsed_time": "1:06:50", "remaining_time": "18:09:02"}
{"current_steps": 147, "total_steps": 2525, "loss": 0.0147, "lr": 5.810276679841897e-05, "epoch": 1.4554455445544554, "percentage": 5.82, "elapsed_time": "1:07:16", "remaining_time": "18:08:15"}
{"current_steps": 148, "total_steps": 2525, "loss": 0.0273, "lr": 5.8498023715415016e-05, "epoch": 1.4653465346534653, "percentage": 5.86, "elapsed_time": "1:07:42", "remaining_time": "18:07:29"}
{"current_steps": 149, "total_steps": 2525, "loss": 0.0185, "lr": 5.8893280632411074e-05, "epoch": 1.4752475247524752, "percentage": 5.9, "elapsed_time": "1:08:08", "remaining_time": "18:06:43"}
{"current_steps": 150, "total_steps": 2525, "loss": 0.0321, "lr": 5.928853754940712e-05, "epoch": 1.4851485148514851, "percentage": 5.94, "elapsed_time": "1:08:35", "remaining_time": "18:05:57"}
{"current_steps": 150, "total_steps": 2525, "eval_loss": 0.025141000747680664, "epoch": 1.4851485148514851, "percentage": 5.94, "elapsed_time": "1:08:56", "remaining_time": "18:11:29"}
{"current_steps": 151, "total_steps": 2525, "loss": 0.0227, "lr": 5.9683794466403164e-05, "epoch": 1.495049504950495, "percentage": 5.98, "elapsed_time": "1:09:22", "remaining_time": "18:10:41"}
{"current_steps": 152, "total_steps": 2525, "loss": 0.0175, "lr": 6.007905138339921e-05, "epoch": 1.504950495049505, "percentage": 6.02, "elapsed_time": "1:09:48", "remaining_time": "18:09:54"}
{"current_steps": 153, "total_steps": 2525, "loss": 0.0227, "lr": 6.0474308300395254e-05, "epoch": 1.5148514851485149, "percentage": 6.06, "elapsed_time": "1:10:14", "remaining_time": "18:09:06"}
{"current_steps": 154, "total_steps": 2525, "loss": 0.0183, "lr": 6.086956521739131e-05, "epoch": 1.5247524752475248, "percentage": 6.1, "elapsed_time": "1:10:41", "remaining_time": "18:08:18"}
{"current_steps": 155, "total_steps": 2525, "loss": 0.02, "lr": 6.126482213438736e-05, "epoch": 1.5346534653465347, "percentage": 6.14, "elapsed_time": "1:11:07", "remaining_time": "18:07:30"}
{"current_steps": 156, "total_steps": 2525, "loss": 0.0157, "lr": 6.16600790513834e-05, "epoch": 1.5445544554455446, "percentage": 6.18, "elapsed_time": "1:11:33", "remaining_time": "18:06:42"}
{"current_steps": 157, "total_steps": 2525, "loss": 0.0265, "lr": 6.205533596837945e-05, "epoch": 1.5544554455445545, "percentage": 6.22, "elapsed_time": "1:11:59", "remaining_time": "18:05:56"}
{"current_steps": 158, "total_steps": 2525, "loss": 0.014, "lr": 6.245059288537549e-05, "epoch": 1.5643564356435644, "percentage": 6.26, "elapsed_time": "1:12:26", "remaining_time": "18:05:11"}
{"current_steps": 159, "total_steps": 2525, "loss": 0.0264, "lr": 6.284584980237155e-05, "epoch": 1.5742574257425743, "percentage": 6.3, "elapsed_time": "1:12:52", "remaining_time": "18:04:25"}
{"current_steps": 160, "total_steps": 2525, "loss": 0.0153, "lr": 6.32411067193676e-05, "epoch": 1.5841584158415842, "percentage": 6.34, "elapsed_time": "1:13:18", "remaining_time": "18:03:38"}
{"current_steps": 161, "total_steps": 2525, "loss": 0.0172, "lr": 6.363636363636364e-05, "epoch": 1.5940594059405941, "percentage": 6.38, "elapsed_time": "1:13:44", "remaining_time": "18:02:51"}
{"current_steps": 162, "total_steps": 2525, "loss": 0.023, "lr": 6.403162055335969e-05, "epoch": 1.603960396039604, "percentage": 6.42, "elapsed_time": "1:14:11", "remaining_time": "18:02:05"}
{"current_steps": 163, "total_steps": 2525, "loss": 0.0388, "lr": 6.442687747035574e-05, "epoch": 1.613861386138614, "percentage": 6.46, "elapsed_time": "1:14:37", "remaining_time": "18:01:20"}
{"current_steps": 164, "total_steps": 2525, "loss": 0.0198, "lr": 6.482213438735179e-05, "epoch": 1.6237623762376239, "percentage": 6.5, "elapsed_time": "1:15:03", "remaining_time": "18:00:36"}
{"current_steps": 165, "total_steps": 2525, "loss": 0.0303, "lr": 6.521739130434783e-05, "epoch": 1.6336633663366338, "percentage": 6.53, "elapsed_time": "1:15:30", "remaining_time": "17:59:53"}
{"current_steps": 166, "total_steps": 2525, "loss": 0.0157, "lr": 6.561264822134388e-05, "epoch": 1.6435643564356437, "percentage": 6.57, "elapsed_time": "1:15:56", "remaining_time": "17:59:09"}
{"current_steps": 167, "total_steps": 2525, "loss": 0.0157, "lr": 6.600790513833992e-05, "epoch": 1.6534653465346536, "percentage": 6.61, "elapsed_time": "1:16:22", "remaining_time": "17:58:25"}
{"current_steps": 168, "total_steps": 2525, "loss": 0.0288, "lr": 6.640316205533598e-05, "epoch": 1.6633663366336635, "percentage": 6.65, "elapsed_time": "1:16:49", "remaining_time": "17:57:43"}
{"current_steps": 169, "total_steps": 2525, "loss": 0.0344, "lr": 6.679841897233203e-05, "epoch": 1.6732673267326734, "percentage": 6.69, "elapsed_time": "1:17:15", "remaining_time": "17:57:00"}
{"current_steps": 170, "total_steps": 2525, "loss": 0.0315, "lr": 6.719367588932807e-05, "epoch": 1.6831683168316833, "percentage": 6.73, "elapsed_time": "1:17:41", "remaining_time": "17:56:15"}
{"current_steps": 171, "total_steps": 2525, "loss": 0.0219, "lr": 6.758893280632412e-05, "epoch": 1.693069306930693, "percentage": 6.77, "elapsed_time": "1:18:07", "remaining_time": "17:55:32"}
{"current_steps": 172, "total_steps": 2525, "loss": 0.0309, "lr": 6.798418972332016e-05, "epoch": 1.702970297029703, "percentage": 6.81, "elapsed_time": "1:18:33", "remaining_time": "17:54:47"}
{"current_steps": 173, "total_steps": 2525, "loss": 0.0303, "lr": 6.837944664031622e-05, "epoch": 1.7128712871287128, "percentage": 6.85, "elapsed_time": "1:19:00", "remaining_time": "17:54:05"}
{"current_steps": 174, "total_steps": 2525, "loss": 0.0289, "lr": 6.877470355731227e-05, "epoch": 1.7227722772277227, "percentage": 6.89, "elapsed_time": "1:19:26", "remaining_time": "17:53:23"}
{"current_steps": 175, "total_steps": 2525, "loss": 0.026, "lr": 6.916996047430831e-05, "epoch": 1.7326732673267327, "percentage": 6.93, "elapsed_time": "1:19:52", "remaining_time": "17:52:40"}
{"current_steps": 175, "total_steps": 2525, "eval_loss": 0.022802595049142838, "epoch": 1.7326732673267327, "percentage": 6.93, "elapsed_time": "1:20:13", "remaining_time": "17:57:22"}
{"current_steps": 176, "total_steps": 2525, "loss": 0.0296, "lr": 6.956521739130436e-05, "epoch": 1.7425742574257426, "percentage": 6.97, "elapsed_time": "1:20:40", "remaining_time": "17:56:37"}
{"current_steps": 177, "total_steps": 2525, "loss": 0.0203, "lr": 6.99604743083004e-05, "epoch": 1.7524752475247525, "percentage": 7.01, "elapsed_time": "1:21:06", "remaining_time": "17:55:53"}
{"current_steps": 178, "total_steps": 2525, "loss": 0.016, "lr": 7.035573122529645e-05, "epoch": 1.7623762376237624, "percentage": 7.05, "elapsed_time": "1:21:32", "remaining_time": "17:55:09"}
{"current_steps": 179, "total_steps": 2525, "loss": 0.0161, "lr": 7.075098814229249e-05, "epoch": 1.7722772277227723, "percentage": 7.09, "elapsed_time": "1:21:58", "remaining_time": "17:54:25"}
{"current_steps": 180, "total_steps": 2525, "loss": 0.0351, "lr": 7.114624505928854e-05, "epoch": 1.7821782178217822, "percentage": 7.13, "elapsed_time": "1:22:25", "remaining_time": "17:53:42"}
{"current_steps": 181, "total_steps": 2525, "loss": 0.0198, "lr": 7.154150197628458e-05, "epoch": 1.7920792079207921, "percentage": 7.17, "elapsed_time": "1:22:51", "remaining_time": "17:53:00"}
{"current_steps": 182, "total_steps": 2525, "loss": 0.0214, "lr": 7.193675889328062e-05, "epoch": 1.801980198019802, "percentage": 7.21, "elapsed_time": "1:23:17", "remaining_time": "17:52:17"}
{"current_steps": 183, "total_steps": 2525, "loss": 0.0211, "lr": 7.233201581027668e-05, "epoch": 1.811881188118812, "percentage": 7.25, "elapsed_time": "1:23:44", "remaining_time": "17:51:37"}
{"current_steps": 184, "total_steps": 2525, "loss": 0.0291, "lr": 7.272727272727273e-05, "epoch": 1.8217821782178216, "percentage": 7.29, "elapsed_time": "1:24:10", "remaining_time": "17:50:54"}
{"current_steps": 185, "total_steps": 2525, "loss": 0.0151, "lr": 7.312252964426877e-05, "epoch": 1.8316831683168315, "percentage": 7.33, "elapsed_time": "1:24:36", "remaining_time": "17:50:10"}
{"current_steps": 186, "total_steps": 2525, "loss": 0.0227, "lr": 7.351778656126482e-05, "epoch": 1.8415841584158414, "percentage": 7.37, "elapsed_time": "1:25:02", "remaining_time": "17:49:28"}
{"current_steps": 187, "total_steps": 2525, "loss": 0.0335, "lr": 7.391304347826086e-05, "epoch": 1.8514851485148514, "percentage": 7.41, "elapsed_time": "1:25:29", "remaining_time": "17:48:47"}
{"current_steps": 188, "total_steps": 2525, "loss": 0.0272, "lr": 7.430830039525692e-05, "epoch": 1.8613861386138613, "percentage": 7.45, "elapsed_time": "1:25:55", "remaining_time": "17:48:06"}
{"current_steps": 189, "total_steps": 2525, "loss": 0.0244, "lr": 7.470355731225297e-05, "epoch": 1.8712871287128712, "percentage": 7.49, "elapsed_time": "1:26:21", "remaining_time": "17:47:24"}
{"current_steps": 190, "total_steps": 2525, "loss": 0.0139, "lr": 7.509881422924901e-05, "epoch": 1.881188118811881, "percentage": 7.52, "elapsed_time": "1:26:47", "remaining_time": "17:46:43"}
{"current_steps": 191, "total_steps": 2525, "loss": 0.0161, "lr": 7.549407114624506e-05, "epoch": 1.891089108910891, "percentage": 7.56, "elapsed_time": "1:27:14", "remaining_time": "17:46:01"}
{"current_steps": 192, "total_steps": 2525, "loss": 0.0246, "lr": 7.58893280632411e-05, "epoch": 1.900990099009901, "percentage": 7.6, "elapsed_time": "1:27:40", "remaining_time": "17:45:22"}
{"current_steps": 193, "total_steps": 2525, "loss": 0.0207, "lr": 7.628458498023716e-05, "epoch": 1.9108910891089108, "percentage": 7.64, "elapsed_time": "1:28:07", "remaining_time": "17:44:42"}
{"current_steps": 194, "total_steps": 2525, "loss": 0.0219, "lr": 7.66798418972332e-05, "epoch": 1.9207920792079207, "percentage": 7.68, "elapsed_time": "1:28:33", "remaining_time": "17:44:01"}
{"current_steps": 195, "total_steps": 2525, "loss": 0.0279, "lr": 7.707509881422925e-05, "epoch": 1.9306930693069306, "percentage": 7.72, "elapsed_time": "1:28:59", "remaining_time": "17:43:20"}
{"current_steps": 196, "total_steps": 2525, "loss": 0.0284, "lr": 7.74703557312253e-05, "epoch": 1.9405940594059405, "percentage": 7.76, "elapsed_time": "1:29:25", "remaining_time": "17:42:39"}
{"current_steps": 197, "total_steps": 2525, "loss": 0.022, "lr": 7.786561264822134e-05, "epoch": 1.9504950495049505, "percentage": 7.8, "elapsed_time": "1:29:52", "remaining_time": "17:41:59"}
{"current_steps": 198, "total_steps": 2525, "loss": 0.0189, "lr": 7.82608695652174e-05, "epoch": 1.9603960396039604, "percentage": 7.84, "elapsed_time": "1:30:18", "remaining_time": "17:41:19"}
{"current_steps": 199, "total_steps": 2525, "loss": 0.0279, "lr": 7.865612648221344e-05, "epoch": 1.9702970297029703, "percentage": 7.88, "elapsed_time": "1:30:44", "remaining_time": "17:40:38"}
{"current_steps": 200, "total_steps": 2525, "loss": 0.029, "lr": 7.905138339920949e-05, "epoch": 1.9801980198019802, "percentage": 7.92, "elapsed_time": "1:31:10", "remaining_time": "17:39:57"}
{"current_steps": 200, "total_steps": 2525, "eval_loss": 0.021168576553463936, "epoch": 1.9801980198019802, "percentage": 7.92, "elapsed_time": "1:31:31", "remaining_time": "17:44:01"}
{"current_steps": 201, "total_steps": 2525, "loss": 0.0174, "lr": 7.944664031620553e-05, "epoch": 1.99009900990099, "percentage": 7.96, "elapsed_time": "1:32:06", "remaining_time": "17:45:03"}
{"current_steps": 202, "total_steps": 2525, "loss": 0.0162, "lr": 7.984189723320159e-05, "epoch": 2.0, "percentage": 8.0, "elapsed_time": "1:32:15", "remaining_time": "17:41:00"}
{"current_steps": 203, "total_steps": 2525, "loss": 0.017, "lr": 8.023715415019764e-05, "epoch": 2.00990099009901, "percentage": 8.04, "elapsed_time": "1:32:43", "remaining_time": "17:40:34"}
{"current_steps": 204, "total_steps": 2525, "loss": 0.0108, "lr": 8.063241106719368e-05, "epoch": 2.01980198019802, "percentage": 8.08, "elapsed_time": "1:33:09", "remaining_time": "17:39:58"}
{"current_steps": 205, "total_steps": 2525, "loss": 0.0129, "lr": 8.102766798418973e-05, "epoch": 2.0297029702970297, "percentage": 8.12, "elapsed_time": "1:33:36", "remaining_time": "17:39:23"}
{"current_steps": 206, "total_steps": 2525, "loss": 0.0497, "lr": 8.142292490118577e-05, "epoch": 2.0396039603960396, "percentage": 8.16, "elapsed_time": "1:34:03", "remaining_time": "17:38:48"}
{"current_steps": 207, "total_steps": 2525, "loss": 0.0132, "lr": 8.181818181818183e-05, "epoch": 2.0495049504950495, "percentage": 8.2, "elapsed_time": "1:34:30", "remaining_time": "17:38:13"}
{"current_steps": 208, "total_steps": 2525, "loss": 0.0139, "lr": 8.221343873517787e-05, "epoch": 2.0594059405940595, "percentage": 8.24, "elapsed_time": "1:34:56", "remaining_time": "17:37:39"}
{"current_steps": 209, "total_steps": 2525, "loss": 0.0186, "lr": 8.260869565217392e-05, "epoch": 2.0693069306930694, "percentage": 8.28, "elapsed_time": "1:35:23", "remaining_time": "17:37:06"}
{"current_steps": 210, "total_steps": 2525, "loss": 0.0146, "lr": 8.300395256916996e-05, "epoch": 2.0792079207920793, "percentage": 8.32, "elapsed_time": "1:35:50", "remaining_time": "17:36:31"}
{"current_steps": 211, "total_steps": 2525, "loss": 0.0234, "lr": 8.339920948616601e-05, "epoch": 2.089108910891089, "percentage": 8.36, "elapsed_time": "1:36:17", "remaining_time": "17:35:56"}
{"current_steps": 212, "total_steps": 2525, "loss": 0.0266, "lr": 8.379446640316207e-05, "epoch": 2.099009900990099, "percentage": 8.4, "elapsed_time": "1:36:43", "remaining_time": "17:35:22"}
{"current_steps": 213, "total_steps": 2525, "loss": 0.0201, "lr": 8.418972332015811e-05, "epoch": 2.108910891089109, "percentage": 8.44, "elapsed_time": "1:37:10", "remaining_time": "17:34:47"}
{"current_steps": 214, "total_steps": 2525, "loss": 0.0464, "lr": 8.458498023715416e-05, "epoch": 2.118811881188119, "percentage": 8.48, "elapsed_time": "1:37:37", "remaining_time": "17:34:11"}
{"current_steps": 215, "total_steps": 2525, "loss": 0.0117, "lr": 8.49802371541502e-05, "epoch": 2.128712871287129, "percentage": 8.51, "elapsed_time": "1:38:04", "remaining_time": "17:33:39"}
{"current_steps": 216, "total_steps": 2525, "loss": 0.0311, "lr": 8.537549407114625e-05, "epoch": 2.1386138613861387, "percentage": 8.55, "elapsed_time": "1:38:30", "remaining_time": "17:33:05"}
{"current_steps": 217, "total_steps": 2525, "loss": 0.01, "lr": 8.57707509881423e-05, "epoch": 2.1485148514851486, "percentage": 8.59, "elapsed_time": "1:38:57", "remaining_time": "17:32:31"}
{"current_steps": 218, "total_steps": 2525, "loss": 0.0141, "lr": 8.616600790513835e-05, "epoch": 2.1584158415841586, "percentage": 8.63, "elapsed_time": "1:39:24", "remaining_time": "17:31:58"}
{"current_steps": 219, "total_steps": 2525, "loss": 0.0175, "lr": 8.65612648221344e-05, "epoch": 2.1683168316831685, "percentage": 8.67, "elapsed_time": "1:39:51", "remaining_time": "17:31:25"}
{"current_steps": 220, "total_steps": 2525, "loss": 0.0201, "lr": 8.695652173913044e-05, "epoch": 2.1782178217821784, "percentage": 8.71, "elapsed_time": "1:40:17", "remaining_time": "17:30:51"}
{"current_steps": 221, "total_steps": 2525, "loss": 0.0317, "lr": 8.735177865612649e-05, "epoch": 2.1881188118811883, "percentage": 8.75, "elapsed_time": "1:40:44", "remaining_time": "17:30:17"}
{"current_steps": 222, "total_steps": 2525, "loss": 0.02, "lr": 8.774703557312254e-05, "epoch": 2.198019801980198, "percentage": 8.79, "elapsed_time": "1:41:11", "remaining_time": "17:29:42"}
{"current_steps": 223, "total_steps": 2525, "loss": 0.0142, "lr": 8.814229249011859e-05, "epoch": 2.207920792079208, "percentage": 8.83, "elapsed_time": "1:41:38", "remaining_time": "17:29:09"}
{"current_steps": 224, "total_steps": 2525, "loss": 0.0398, "lr": 8.853754940711463e-05, "epoch": 2.217821782178218, "percentage": 8.87, "elapsed_time": "1:42:04", "remaining_time": "17:28:35"}
{"current_steps": 225, "total_steps": 2525, "loss": 0.0152, "lr": 8.893280632411068e-05, "epoch": 2.227722772277228, "percentage": 8.91, "elapsed_time": "1:42:31", "remaining_time": "17:28:01"}
{"current_steps": 225, "total_steps": 2525, "eval_loss": 0.021625498309731483, "epoch": 2.227722772277228, "percentage": 8.91, "elapsed_time": "1:42:53", "remaining_time": "17:31:43"}
{"current_steps": 226, "total_steps": 2525, "loss": 0.0153, "lr": 8.932806324110672e-05, "epoch": 2.237623762376238, "percentage": 8.95, "elapsed_time": "1:43:19", "remaining_time": "17:31:04"}
{"current_steps": 227, "total_steps": 2525, "loss": 0.0143, "lr": 8.972332015810277e-05, "epoch": 2.2475247524752477, "percentage": 8.99, "elapsed_time": "1:43:45", "remaining_time": "17:30:25"}
{"current_steps": 228, "total_steps": 2525, "loss": 0.0144, "lr": 9.011857707509881e-05, "epoch": 2.2574257425742577, "percentage": 9.03, "elapsed_time": "1:44:12", "remaining_time": "17:29:46"}
{"current_steps": 229, "total_steps": 2525, "loss": 0.0204, "lr": 9.051383399209486e-05, "epoch": 2.2673267326732676, "percentage": 9.07, "elapsed_time": "1:44:38", "remaining_time": "17:29:07"}
{"current_steps": 230, "total_steps": 2525, "loss": 0.0241, "lr": 9.090909090909092e-05, "epoch": 2.2772277227722775, "percentage": 9.11, "elapsed_time": "1:45:04", "remaining_time": "17:28:29"}
{"current_steps": 231, "total_steps": 2525, "loss": 0.0189, "lr": 9.130434782608696e-05, "epoch": 2.287128712871287, "percentage": 9.15, "elapsed_time": "1:45:30", "remaining_time": "17:27:49"}
{"current_steps": 232, "total_steps": 2525, "loss": 0.0168, "lr": 9.169960474308301e-05, "epoch": 2.297029702970297, "percentage": 9.19, "elapsed_time": "1:45:57", "remaining_time": "17:27:11"}
{"current_steps": 233, "total_steps": 2525, "loss": 0.0173, "lr": 9.209486166007905e-05, "epoch": 2.3069306930693068, "percentage": 9.23, "elapsed_time": "1:46:23", "remaining_time": "17:26:33"}
{"current_steps": 234, "total_steps": 2525, "loss": 0.0186, "lr": 9.24901185770751e-05, "epoch": 2.3168316831683167, "percentage": 9.27, "elapsed_time": "1:46:49", "remaining_time": "17:25:55"}
{"current_steps": 235, "total_steps": 2525, "loss": 0.0166, "lr": 9.288537549407114e-05, "epoch": 2.3267326732673266, "percentage": 9.31, "elapsed_time": "1:47:16", "remaining_time": "17:25:16"}
{"current_steps": 236, "total_steps": 2525, "loss": 0.0258, "lr": 9.32806324110672e-05, "epoch": 2.3366336633663365, "percentage": 9.35, "elapsed_time": "1:47:42", "remaining_time": "17:24:39"}
{"current_steps": 237, "total_steps": 2525, "loss": 0.0165, "lr": 9.367588932806325e-05, "epoch": 2.3465346534653464, "percentage": 9.39, "elapsed_time": "1:48:08", "remaining_time": "17:24:00"}
{"current_steps": 238, "total_steps": 2525, "loss": 0.0288, "lr": 9.407114624505929e-05, "epoch": 2.3564356435643563, "percentage": 9.43, "elapsed_time": "1:48:34", "remaining_time": "17:23:21"}
{"current_steps": 239, "total_steps": 2525, "loss": 0.0216, "lr": 9.446640316205534e-05, "epoch": 2.366336633663366, "percentage": 9.47, "elapsed_time": "1:49:01", "remaining_time": "17:22:45"}
{"current_steps": 240, "total_steps": 2525, "loss": 0.0133, "lr": 9.486166007905138e-05, "epoch": 2.376237623762376, "percentage": 9.5, "elapsed_time": "1:49:27", "remaining_time": "17:22:08"}
{"current_steps": 241, "total_steps": 2525, "loss": 0.026, "lr": 9.525691699604744e-05, "epoch": 2.386138613861386, "percentage": 9.54, "elapsed_time": "1:49:53", "remaining_time": "17:21:31"}
{"current_steps": 242, "total_steps": 2525, "loss": 0.0218, "lr": 9.565217391304348e-05, "epoch": 2.396039603960396, "percentage": 9.58, "elapsed_time": "1:50:20", "remaining_time": "17:20:55"}
{"current_steps": 243, "total_steps": 2525, "loss": 0.0099, "lr": 9.604743083003953e-05, "epoch": 2.405940594059406, "percentage": 9.62, "elapsed_time": "1:50:46", "remaining_time": "17:20:18"}
{"current_steps": 244, "total_steps": 2525, "loss": 0.0202, "lr": 9.644268774703557e-05, "epoch": 2.4158415841584158, "percentage": 9.66, "elapsed_time": "1:51:12", "remaining_time": "17:19:41"}
{"current_steps": 245, "total_steps": 2525, "loss": 0.0203, "lr": 9.683794466403162e-05, "epoch": 2.4257425742574257, "percentage": 9.7, "elapsed_time": "1:51:39", "remaining_time": "17:19:04"}
{"current_steps": 246, "total_steps": 2525, "loss": 0.0299, "lr": 9.723320158102768e-05, "epoch": 2.4356435643564356, "percentage": 9.74, "elapsed_time": "1:52:05", "remaining_time": "17:18:28"}
{"current_steps": 247, "total_steps": 2525, "loss": 0.0209, "lr": 9.762845849802372e-05, "epoch": 2.4455445544554455, "percentage": 9.78, "elapsed_time": "1:52:31", "remaining_time": "17:17:50"}
{"current_steps": 248, "total_steps": 2525, "loss": 0.0264, "lr": 9.802371541501977e-05, "epoch": 2.4554455445544554, "percentage": 9.82, "elapsed_time": "1:52:58", "remaining_time": "17:17:12"}
{"current_steps": 249, "total_steps": 2525, "loss": 0.0132, "lr": 9.841897233201581e-05, "epoch": 2.4653465346534653, "percentage": 9.86, "elapsed_time": "1:53:24", "remaining_time": "17:16:35"}
{"current_steps": 250, "total_steps": 2525, "loss": 0.011, "lr": 9.881422924901186e-05, "epoch": 2.4752475247524752, "percentage": 9.9, "elapsed_time": "1:53:50", "remaining_time": "17:15:58"}
{"current_steps": 250, "total_steps": 2525, "eval_loss": 0.02048182487487793, "epoch": 2.4752475247524752, "percentage": 9.9, "elapsed_time": "1:54:11", "remaining_time": "17:19:09"}
{"current_steps": 251, "total_steps": 2525, "loss": 0.0112, "lr": 9.920948616600791e-05, "epoch": 2.485148514851485, "percentage": 9.94, "elapsed_time": "1:54:37", "remaining_time": "17:18:31"}
{"current_steps": 252, "total_steps": 2525, "loss": 0.0172, "lr": 9.960474308300396e-05, "epoch": 2.495049504950495, "percentage": 9.98, "elapsed_time": "1:55:04", "remaining_time": "17:17:53"}
{"current_steps": 253, "total_steps": 2525, "loss": 0.0135, "lr": 0.0001, "epoch": 2.504950495049505, "percentage": 10.02, "elapsed_time": "1:55:30", "remaining_time": "17:17:15"}
{"current_steps": 254, "total_steps": 2525, "loss": 0.0175, "lr": 9.999995220053555e-05, "epoch": 2.514851485148515, "percentage": 10.06, "elapsed_time": "1:55:56", "remaining_time": "17:16:38"}
{"current_steps": 255, "total_steps": 2525, "loss": 0.0305, "lr": 9.999980880223359e-05, "epoch": 2.5247524752475248, "percentage": 10.1, "elapsed_time": "1:56:22", "remaining_time": "17:16:02"}
{"current_steps": 256, "total_steps": 2525, "loss": 0.0246, "lr": 9.999956980536828e-05, "epoch": 2.5346534653465347, "percentage": 10.14, "elapsed_time": "1:56:51", "remaining_time": "17:15:45"}
{"current_steps": 257, "total_steps": 2525, "loss": 0.0109, "lr": 9.999923521039659e-05, "epoch": 2.5445544554455446, "percentage": 10.18, "elapsed_time": "1:57:17", "remaining_time": "17:15:06"}
{"current_steps": 258, "total_steps": 2525, "loss": 0.0138, "lr": 9.999880501795826e-05, "epoch": 2.5544554455445545, "percentage": 10.22, "elapsed_time": "1:57:43", "remaining_time": "17:14:29"}
{"current_steps": 259, "total_steps": 2525, "loss": 0.0099, "lr": 9.99982792288758e-05, "epoch": 2.5643564356435644, "percentage": 10.26, "elapsed_time": "1:58:10", "remaining_time": "17:13:52"}
{"current_steps": 260, "total_steps": 2525, "loss": 0.0192, "lr": 9.999765784415451e-05, "epoch": 2.5742574257425743, "percentage": 10.3, "elapsed_time": "1:58:36", "remaining_time": "17:13:16"}
{"current_steps": 261, "total_steps": 2525, "loss": 0.0211, "lr": 9.999694086498248e-05, "epoch": 2.5841584158415842, "percentage": 10.34, "elapsed_time": "1:59:02", "remaining_time": "17:12:39"}
{"current_steps": 262, "total_steps": 2525, "loss": 0.0125, "lr": 9.999612829273053e-05, "epoch": 2.594059405940594, "percentage": 10.38, "elapsed_time": "1:59:29", "remaining_time": "17:12:02"}
{"current_steps": 263, "total_steps": 2525, "loss": 0.0237, "lr": 9.99952201289523e-05, "epoch": 2.603960396039604, "percentage": 10.42, "elapsed_time": "1:59:55", "remaining_time": "17:11:26"}
{"current_steps": 264, "total_steps": 2525, "loss": 0.0156, "lr": 9.999421637538418e-05, "epoch": 2.613861386138614, "percentage": 10.46, "elapsed_time": "2:00:21", "remaining_time": "17:10:50"}
{"current_steps": 265, "total_steps": 2525, "loss": 0.0175, "lr": 9.999311703394532e-05, "epoch": 2.623762376237624, "percentage": 10.5, "elapsed_time": "2:00:48", "remaining_time": "17:10:13"}
{"current_steps": 266, "total_steps": 2525, "loss": 0.0301, "lr": 9.999192210673762e-05, "epoch": 2.633663366336634, "percentage": 10.53, "elapsed_time": "2:01:14", "remaining_time": "17:09:36"}
{"current_steps": 267, "total_steps": 2525, "loss": 0.0178, "lr": 9.999063159604579e-05, "epoch": 2.6435643564356437, "percentage": 10.57, "elapsed_time": "2:01:40", "remaining_time": "17:08:59"}
{"current_steps": 268, "total_steps": 2525, "loss": 0.0161, "lr": 9.998924550433723e-05, "epoch": 2.6534653465346536, "percentage": 10.61, "elapsed_time": "2:02:06", "remaining_time": "17:08:23"}
{"current_steps": 269, "total_steps": 2525, "loss": 0.024, "lr": 9.998776383426216e-05, "epoch": 2.6633663366336635, "percentage": 10.65, "elapsed_time": "2:02:33", "remaining_time": "17:07:47"}
{"current_steps": 270, "total_steps": 2525, "loss": 0.0125, "lr": 9.998618658865344e-05, "epoch": 2.6732673267326734, "percentage": 10.69, "elapsed_time": "2:02:59", "remaining_time": "17:07:12"}
{"current_steps": 271, "total_steps": 2525, "loss": 0.0214, "lr": 9.998451377052678e-05, "epoch": 2.6831683168316833, "percentage": 10.73, "elapsed_time": "2:03:25", "remaining_time": "17:06:35"}
{"current_steps": 272, "total_steps": 2525, "loss": 0.0182, "lr": 9.998274538308054e-05, "epoch": 2.693069306930693, "percentage": 10.77, "elapsed_time": "2:03:52", "remaining_time": "17:06:00"}
{"current_steps": 273, "total_steps": 2525, "loss": 0.0268, "lr": 9.998088142969586e-05, "epoch": 2.7029702970297027, "percentage": 10.81, "elapsed_time": "2:04:18", "remaining_time": "17:05:24"}
{"current_steps": 274, "total_steps": 2525, "loss": 0.0088, "lr": 9.997892191393657e-05, "epoch": 2.7128712871287126, "percentage": 10.85, "elapsed_time": "2:04:44", "remaining_time": "17:04:49"}
{"current_steps": 275, "total_steps": 2525, "loss": 0.0154, "lr": 9.997686683954923e-05, "epoch": 2.7227722772277225, "percentage": 10.89, "elapsed_time": "2:05:10", "remaining_time": "17:04:13"}
{"current_steps": 275, "total_steps": 2525, "eval_loss": 0.019408825784921646, "epoch": 2.7227722772277225, "percentage": 10.89, "elapsed_time": "2:05:31", "remaining_time": "17:07:04"}
{"current_steps": 276, "total_steps": 2525, "loss": 0.0172, "lr": 9.997471621046308e-05, "epoch": 2.7326732673267324, "percentage": 10.93, "elapsed_time": "2:05:58", "remaining_time": "17:06:29"}
{"current_steps": 277, "total_steps": 2525, "loss": 0.0317, "lr": 9.997247003079008e-05, "epoch": 2.7425742574257423, "percentage": 10.97, "elapsed_time": "2:06:24", "remaining_time": "17:05:52"}
{"current_steps": 278, "total_steps": 2525, "loss": 0.0246, "lr": 9.997012830482491e-05, "epoch": 2.7524752475247523, "percentage": 11.01, "elapsed_time": "2:06:50", "remaining_time": "17:05:15"}
{"current_steps": 279, "total_steps": 2525, "loss": 0.0183, "lr": 9.996769103704486e-05, "epoch": 2.762376237623762, "percentage": 11.05, "elapsed_time": "2:07:16", "remaining_time": "17:04:38"}
{"current_steps": 280, "total_steps": 2525, "loss": 0.0219, "lr": 9.996515823210997e-05, "epoch": 2.772277227722772, "percentage": 11.09, "elapsed_time": "2:07:43", "remaining_time": "17:04:01"}
{"current_steps": 281, "total_steps": 2525, "loss": 0.0143, "lr": 9.996252989486287e-05, "epoch": 2.782178217821782, "percentage": 11.13, "elapsed_time": "2:08:09", "remaining_time": "17:03:25"}
{"current_steps": 282, "total_steps": 2525, "loss": 0.0178, "lr": 9.99598060303289e-05, "epoch": 2.792079207920792, "percentage": 11.17, "elapsed_time": "2:08:35", "remaining_time": "17:02:49"}
{"current_steps": 283, "total_steps": 2525, "loss": 0.0114, "lr": 9.995698664371604e-05, "epoch": 2.801980198019802, "percentage": 11.21, "elapsed_time": "2:09:01", "remaining_time": "17:02:13"}
{"current_steps": 284, "total_steps": 2525, "loss": 0.019, "lr": 9.995407174041489e-05, "epoch": 2.8118811881188117, "percentage": 11.25, "elapsed_time": "2:09:28", "remaining_time": "17:01:38"}
{"current_steps": 285, "total_steps": 2525, "loss": 0.0114, "lr": 9.995106132599869e-05, "epoch": 2.8217821782178216, "percentage": 11.29, "elapsed_time": "2:09:54", "remaining_time": "17:01:02"}
{"current_steps": 286, "total_steps": 2525, "loss": 0.0121, "lr": 9.994795540622328e-05, "epoch": 2.8316831683168315, "percentage": 11.33, "elapsed_time": "2:10:20", "remaining_time": "17:00:26"}
{"current_steps": 287, "total_steps": 2525, "loss": 0.0133, "lr": 9.99447539870271e-05, "epoch": 2.8415841584158414, "percentage": 11.37, "elapsed_time": "2:10:47", "remaining_time": "16:59:51"}
{"current_steps": 288, "total_steps": 2525, "loss": 0.0198, "lr": 9.99414570745312e-05, "epoch": 2.8514851485148514, "percentage": 11.41, "elapsed_time": "2:11:13", "remaining_time": "16:59:14"}
{"current_steps": 289, "total_steps": 2525, "loss": 0.0169, "lr": 9.993806467503923e-05, "epoch": 2.8613861386138613, "percentage": 11.45, "elapsed_time": "2:11:39", "remaining_time": "16:58:38"}
{"current_steps": 290, "total_steps": 2525, "loss": 0.0214, "lr": 9.993457679503737e-05, "epoch": 2.871287128712871, "percentage": 11.49, "elapsed_time": "2:12:05", "remaining_time": "16:58:03"}
{"current_steps": 291, "total_steps": 2525, "loss": 0.0104, "lr": 9.993099344119437e-05, "epoch": 2.881188118811881, "percentage": 11.52, "elapsed_time": "2:12:32", "remaining_time": "16:57:28"}
{"current_steps": 292, "total_steps": 2525, "loss": 0.0183, "lr": 9.992731462036152e-05, "epoch": 2.891089108910891, "percentage": 11.56, "elapsed_time": "2:12:58", "remaining_time": "16:56:53"}
{"current_steps": 293, "total_steps": 2525, "loss": 0.0095, "lr": 9.992354033957266e-05, "epoch": 2.900990099009901, "percentage": 11.6, "elapsed_time": "2:13:24", "remaining_time": "16:56:18"}
{"current_steps": 294, "total_steps": 2525, "loss": 0.0197, "lr": 9.991967060604413e-05, "epoch": 2.910891089108911, "percentage": 11.64, "elapsed_time": "2:13:51", "remaining_time": "16:55:43"}
{"current_steps": 295, "total_steps": 2525, "loss": 0.0219, "lr": 9.991570542717477e-05, "epoch": 2.9207920792079207, "percentage": 11.68, "elapsed_time": "2:14:17", "remaining_time": "16:55:08"}
{"current_steps": 296, "total_steps": 2525, "loss": 0.0127, "lr": 9.991164481054591e-05, "epoch": 2.9306930693069306, "percentage": 11.72, "elapsed_time": "2:14:43", "remaining_time": "16:54:33"}
{"current_steps": 297, "total_steps": 2525, "loss": 0.0161, "lr": 9.99074887639214e-05, "epoch": 2.9405940594059405, "percentage": 11.76, "elapsed_time": "2:15:10", "remaining_time": "16:53:58"}
{"current_steps": 298, "total_steps": 2525, "loss": 0.019, "lr": 9.990323729524747e-05, "epoch": 2.9504950495049505, "percentage": 11.8, "elapsed_time": "2:15:36", "remaining_time": "16:53:22"}
{"current_steps": 299, "total_steps": 2525, "loss": 0.0149, "lr": 9.989889041265286e-05, "epoch": 2.9603960396039604, "percentage": 11.84, "elapsed_time": "2:16:02", "remaining_time": "16:52:47"}
{"current_steps": 300, "total_steps": 2525, "loss": 0.021, "lr": 9.98944481244487e-05, "epoch": 2.9702970297029703, "percentage": 11.88, "elapsed_time": "2:16:28", "remaining_time": "16:52:12"}
{"current_steps": 300, "total_steps": 2525, "eval_loss": 0.019180113449692726, "epoch": 2.9702970297029703, "percentage": 11.88, "elapsed_time": "2:16:49", "remaining_time": "16:54:47"}
{"current_steps": 301, "total_steps": 2525, "loss": 0.01, "lr": 9.988991043912857e-05, "epoch": 2.98019801980198, "percentage": 11.92, "elapsed_time": "2:17:23", "remaining_time": "16:55:10"}
{"current_steps": 302, "total_steps": 2525, "loss": 0.0326, "lr": 9.988527736536841e-05, "epoch": 2.99009900990099, "percentage": 11.96, "elapsed_time": "2:17:49", "remaining_time": "16:54:32"}
{"current_steps": 303, "total_steps": 2525, "loss": 0.0052, "lr": 9.988054891202656e-05, "epoch": 3.0, "percentage": 12.0, "elapsed_time": "2:17:58", "remaining_time": "16:51:48"}
{"current_steps": 304, "total_steps": 2525, "loss": 0.0093, "lr": 9.987572508814372e-05, "epoch": 3.00990099009901, "percentage": 12.04, "elapsed_time": "2:18:24", "remaining_time": "16:51:15"}
{"current_steps": 305, "total_steps": 2525, "loss": 0.0293, "lr": 9.987080590294295e-05, "epoch": 3.01980198019802, "percentage": 12.08, "elapsed_time": "2:18:51", "remaining_time": "16:50:40"}
{"current_steps": 306, "total_steps": 2525, "loss": 0.0273, "lr": 9.986579136582963e-05, "epoch": 3.0297029702970297, "percentage": 12.12, "elapsed_time": "2:19:17", "remaining_time": "16:50:04"}
{"current_steps": 307, "total_steps": 2525, "loss": 0.0079, "lr": 9.986068148639143e-05, "epoch": 3.0396039603960396, "percentage": 12.16, "elapsed_time": "2:19:43", "remaining_time": "16:49:30"}
{"current_steps": 308, "total_steps": 2525, "loss": 0.0139, "lr": 9.985547627439835e-05, "epoch": 3.0495049504950495, "percentage": 12.2, "elapsed_time": "2:20:10", "remaining_time": "16:48:56"}
{"current_steps": 309, "total_steps": 2525, "loss": 0.0094, "lr": 9.985017573980262e-05, "epoch": 3.0594059405940595, "percentage": 12.24, "elapsed_time": "2:20:36", "remaining_time": "16:48:20"}
{"current_steps": 310, "total_steps": 2525, "loss": 0.0156, "lr": 9.984477989273876e-05, "epoch": 3.0693069306930694, "percentage": 12.28, "elapsed_time": "2:21:02", "remaining_time": "16:47:47"}
{"current_steps": 311, "total_steps": 2525, "loss": 0.0069, "lr": 9.983928874352352e-05, "epoch": 3.0792079207920793, "percentage": 12.32, "elapsed_time": "2:21:28", "remaining_time": "16:47:12"}
{"current_steps": 312, "total_steps": 2525, "loss": 0.0234, "lr": 9.983370230265585e-05, "epoch": 3.089108910891089, "percentage": 12.36, "elapsed_time": "2:21:55", "remaining_time": "16:46:38"}
{"current_steps": 313, "total_steps": 2525, "loss": 0.0133, "lr": 9.982802058081691e-05, "epoch": 3.099009900990099, "percentage": 12.4, "elapsed_time": "2:22:21", "remaining_time": "16:46:04"}
{"current_steps": 314, "total_steps": 2525, "loss": 0.0225, "lr": 9.982224358887003e-05, "epoch": 3.108910891089109, "percentage": 12.44, "elapsed_time": "2:22:47", "remaining_time": "16:45:29"}
{"current_steps": 315, "total_steps": 2525, "loss": 0.01, "lr": 9.981637133786071e-05, "epoch": 3.118811881188119, "percentage": 12.48, "elapsed_time": "2:23:14", "remaining_time": "16:44:56"}
{"current_steps": 316, "total_steps": 2525, "loss": 0.0071, "lr": 9.981040383901652e-05, "epoch": 3.128712871287129, "percentage": 12.51, "elapsed_time": "2:23:40", "remaining_time": "16:44:21"}
{"current_steps": 317, "total_steps": 2525, "loss": 0.023, "lr": 9.980434110374724e-05, "epoch": 3.1386138613861387, "percentage": 12.55, "elapsed_time": "2:24:06", "remaining_time": "16:43:47"}
{"current_steps": 318, "total_steps": 2525, "loss": 0.0118, "lr": 9.979818314364468e-05, "epoch": 3.1485148514851486, "percentage": 12.59, "elapsed_time": "2:24:33", "remaining_time": "16:43:12"}
{"current_steps": 319, "total_steps": 2525, "loss": 0.0089, "lr": 9.979192997048271e-05, "epoch": 3.1584158415841586, "percentage": 12.63, "elapsed_time": "2:24:59", "remaining_time": "16:42:39"}
{"current_steps": 320, "total_steps": 2525, "loss": 0.0135, "lr": 9.978558159621728e-05, "epoch": 3.1683168316831685, "percentage": 12.67, "elapsed_time": "2:25:25", "remaining_time": "16:42:04"}
{"current_steps": 321, "total_steps": 2525, "loss": 0.012, "lr": 9.977913803298633e-05, "epoch": 3.1782178217821784, "percentage": 12.71, "elapsed_time": "2:25:51", "remaining_time": "16:41:30"}
{"current_steps": 322, "total_steps": 2525, "loss": 0.0089, "lr": 9.977259929310985e-05, "epoch": 3.1881188118811883, "percentage": 12.75, "elapsed_time": "2:26:18", "remaining_time": "16:40:56"}
{"current_steps": 323, "total_steps": 2525, "loss": 0.0088, "lr": 9.97659653890897e-05, "epoch": 3.198019801980198, "percentage": 12.79, "elapsed_time": "2:26:44", "remaining_time": "16:40:22"}
{"current_steps": 324, "total_steps": 2525, "loss": 0.022, "lr": 9.975923633360985e-05, "epoch": 3.207920792079208, "percentage": 12.83, "elapsed_time": "2:27:10", "remaining_time": "16:39:48"}
{"current_steps": 325, "total_steps": 2525, "loss": 0.0282, "lr": 9.975241213953606e-05, "epoch": 3.217821782178218, "percentage": 12.87, "elapsed_time": "2:27:36", "remaining_time": "16:39:15"}
{"current_steps": 325, "total_steps": 2525, "eval_loss": 0.018639273941516876, "epoch": 3.217821782178218, "percentage": 12.87, "elapsed_time": "2:27:57", "remaining_time": "16:41:37"}
{"current_steps": 326, "total_steps": 2525, "loss": 0.0072, "lr": 9.974549281991603e-05, "epoch": 3.227722772277228, "percentage": 12.91, "elapsed_time": "2:28:24", "remaining_time": "16:41:02"}
{"current_steps": 327, "total_steps": 2525, "loss": 0.0199, "lr": 9.973847838797939e-05, "epoch": 3.237623762376238, "percentage": 12.95, "elapsed_time": "2:28:50", "remaining_time": "16:40:28"}
{"current_steps": 328, "total_steps": 2525, "loss": 0.0132, "lr": 9.973136885713754e-05, "epoch": 3.2475247524752477, "percentage": 12.99, "elapsed_time": "2:29:16", "remaining_time": "16:39:54"}
{"current_steps": 329, "total_steps": 2525, "loss": 0.0157, "lr": 9.972416424098379e-05, "epoch": 3.2574257425742577, "percentage": 13.03, "elapsed_time": "2:29:43", "remaining_time": "16:39:20"}
{"current_steps": 330, "total_steps": 2525, "loss": 0.0165, "lr": 9.971686455329319e-05, "epoch": 3.2673267326732676, "percentage": 13.07, "elapsed_time": "2:30:09", "remaining_time": "16:38:46"}
{"current_steps": 331, "total_steps": 2525, "loss": 0.0147, "lr": 9.970946980802261e-05, "epoch": 3.2772277227722775, "percentage": 13.11, "elapsed_time": "2:30:35", "remaining_time": "16:38:11"}
{"current_steps": 332, "total_steps": 2525, "loss": 0.0088, "lr": 9.970198001931062e-05, "epoch": 3.287128712871287, "percentage": 13.15, "elapsed_time": "2:31:01", "remaining_time": "16:37:37"}
{"current_steps": 333, "total_steps": 2525, "loss": 0.0169, "lr": 9.969439520147754e-05, "epoch": 3.297029702970297, "percentage": 13.19, "elapsed_time": "2:31:28", "remaining_time": "16:37:03"}
{"current_steps": 334, "total_steps": 2525, "loss": 0.0176, "lr": 9.968671536902539e-05, "epoch": 3.3069306930693068, "percentage": 13.23, "elapsed_time": "2:31:54", "remaining_time": "16:36:29"}
{"current_steps": 335, "total_steps": 2525, "loss": 0.0128, "lr": 9.967894053663782e-05, "epoch": 3.3168316831683167, "percentage": 13.27, "elapsed_time": "2:32:20", "remaining_time": "16:35:55"}
{"current_steps": 336, "total_steps": 2525, "loss": 0.0124, "lr": 9.967107071918019e-05, "epoch": 3.3267326732673266, "percentage": 13.31, "elapsed_time": "2:32:46", "remaining_time": "16:35:21"}
{"current_steps": 337, "total_steps": 2525, "loss": 0.0266, "lr": 9.966310593169936e-05, "epoch": 3.3366336633663365, "percentage": 13.35, "elapsed_time": "2:33:13", "remaining_time": "16:34:48"}
{"current_steps": 338, "total_steps": 2525, "loss": 0.0078, "lr": 9.965504618942389e-05, "epoch": 3.3465346534653464, "percentage": 13.39, "elapsed_time": "2:33:39", "remaining_time": "16:34:14"}
{"current_steps": 339, "total_steps": 2525, "loss": 0.0163, "lr": 9.96468915077638e-05, "epoch": 3.3564356435643563, "percentage": 13.43, "elapsed_time": "2:34:05", "remaining_time": "16:33:40"}
{"current_steps": 340, "total_steps": 2525, "loss": 0.0212, "lr": 9.963864190231067e-05, "epoch": 3.366336633663366, "percentage": 13.47, "elapsed_time": "2:34:32", "remaining_time": "16:33:06"}
{"current_steps": 341, "total_steps": 2525, "loss": 0.0315, "lr": 9.96302973888376e-05, "epoch": 3.376237623762376, "percentage": 13.5, "elapsed_time": "2:34:58", "remaining_time": "16:32:33"}
{"current_steps": 342, "total_steps": 2525, "loss": 0.0111, "lr": 9.962185798329909e-05, "epoch": 3.386138613861386, "percentage": 13.54, "elapsed_time": "2:35:24", "remaining_time": "16:31:59"}
{"current_steps": 343, "total_steps": 2525, "loss": 0.0107, "lr": 9.96133237018311e-05, "epoch": 3.396039603960396, "percentage": 13.58, "elapsed_time": "2:35:50", "remaining_time": "16:31:26"}
{"current_steps": 344, "total_steps": 2525, "loss": 0.0166, "lr": 9.960469456075099e-05, "epoch": 3.405940594059406, "percentage": 13.62, "elapsed_time": "2:36:17", "remaining_time": "16:30:53"}
{"current_steps": 345, "total_steps": 2525, "loss": 0.0215, "lr": 9.959597057655753e-05, "epoch": 3.4158415841584158, "percentage": 13.66, "elapsed_time": "2:36:43", "remaining_time": "16:30:19"}
{"current_steps": 346, "total_steps": 2525, "loss": 0.0139, "lr": 9.958715176593076e-05, "epoch": 3.4257425742574257, "percentage": 13.7, "elapsed_time": "2:37:09", "remaining_time": "16:29:46"}
{"current_steps": 347, "total_steps": 2525, "loss": 0.0096, "lr": 9.957823814573206e-05, "epoch": 3.4356435643564356, "percentage": 13.74, "elapsed_time": "2:37:36", "remaining_time": "16:29:13"}
{"current_steps": 348, "total_steps": 2525, "loss": 0.0129, "lr": 9.956922973300409e-05, "epoch": 3.4455445544554455, "percentage": 13.78, "elapsed_time": "2:38:02", "remaining_time": "16:28:39"}
{"current_steps": 349, "total_steps": 2525, "loss": 0.016, "lr": 9.956012654497074e-05, "epoch": 3.4554455445544554, "percentage": 13.82, "elapsed_time": "2:38:28", "remaining_time": "16:28:06"}
{"current_steps": 350, "total_steps": 2525, "loss": 0.007, "lr": 9.95509285990371e-05, "epoch": 3.4653465346534653, "percentage": 13.86, "elapsed_time": "2:38:54", "remaining_time": "16:27:32"}
{"current_steps": 350, "total_steps": 2525, "eval_loss": 0.018103841692209244, "epoch": 3.4653465346534653, "percentage": 13.86, "elapsed_time": "2:39:15", "remaining_time": "16:29:42"}
{"current_steps": 351, "total_steps": 2525, "loss": 0.0322, "lr": 9.954163591278945e-05, "epoch": 3.4752475247524752, "percentage": 13.9, "elapsed_time": "2:39:42", "remaining_time": "16:29:08"}
{"current_steps": 352, "total_steps": 2525, "loss": 0.0091, "lr": 9.953224850399524e-05, "epoch": 3.485148514851485, "percentage": 13.94, "elapsed_time": "2:40:08", "remaining_time": "16:28:34"}
{"current_steps": 353, "total_steps": 2525, "loss": 0.0298, "lr": 9.952276639060292e-05, "epoch": 3.495049504950495, "percentage": 13.98, "elapsed_time": "2:40:34", "remaining_time": "16:28:00"}
{"current_steps": 354, "total_steps": 2525, "loss": 0.009, "lr": 9.951318959074216e-05, "epoch": 3.504950495049505, "percentage": 14.02, "elapsed_time": "2:41:00", "remaining_time": "16:27:27"}
{"current_steps": 355, "total_steps": 2525, "loss": 0.0081, "lr": 9.950351812272356e-05, "epoch": 3.514851485148515, "percentage": 14.06, "elapsed_time": "2:41:27", "remaining_time": "16:26:54"}
{"current_steps": 356, "total_steps": 2525, "loss": 0.0086, "lr": 9.949375200503877e-05, "epoch": 3.5247524752475248, "percentage": 14.1, "elapsed_time": "2:41:53", "remaining_time": "16:26:20"}
{"current_steps": 357, "total_steps": 2525, "loss": 0.0201, "lr": 9.948389125636039e-05, "epoch": 3.5346534653465347, "percentage": 14.14, "elapsed_time": "2:42:19", "remaining_time": "16:25:47"}
{"current_steps": 358, "total_steps": 2525, "loss": 0.015, "lr": 9.947393589554197e-05, "epoch": 3.5445544554455446, "percentage": 14.18, "elapsed_time": "2:42:46", "remaining_time": "16:25:14"}
{"current_steps": 359, "total_steps": 2525, "loss": 0.0081, "lr": 9.946388594161795e-05, "epoch": 3.5544554455445545, "percentage": 14.22, "elapsed_time": "2:43:12", "remaining_time": "16:24:40"}
{"current_steps": 360, "total_steps": 2525, "loss": 0.0153, "lr": 9.945374141380361e-05, "epoch": 3.5643564356435644, "percentage": 14.26, "elapsed_time": "2:43:38", "remaining_time": "16:24:08"}
{"current_steps": 361, "total_steps": 2525, "loss": 0.0128, "lr": 9.944350233149509e-05, "epoch": 3.5742574257425743, "percentage": 14.3, "elapsed_time": "2:44:04", "remaining_time": "16:23:34"}
{"current_steps": 362, "total_steps": 2525, "loss": 0.0368, "lr": 9.943316871426929e-05, "epoch": 3.5841584158415842, "percentage": 14.34, "elapsed_time": "2:44:31", "remaining_time": "16:23:01"}
{"current_steps": 363, "total_steps": 2525, "loss": 0.0245, "lr": 9.942274058188383e-05, "epoch": 3.594059405940594, "percentage": 14.38, "elapsed_time": "2:44:57", "remaining_time": "16:22:29"}
{"current_steps": 364, "total_steps": 2525, "loss": 0.0119, "lr": 9.941221795427713e-05, "epoch": 3.603960396039604, "percentage": 14.42, "elapsed_time": "2:45:23", "remaining_time": "16:21:56"}
{"current_steps": 365, "total_steps": 2525, "loss": 0.007, "lr": 9.94016008515682e-05, "epoch": 3.613861386138614, "percentage": 14.46, "elapsed_time": "2:45:50", "remaining_time": "16:21:23"}
{"current_steps": 366, "total_steps": 2525, "loss": 0.0124, "lr": 9.939088929405674e-05, "epoch": 3.623762376237624, "percentage": 14.5, "elapsed_time": "2:46:16", "remaining_time": "16:20:51"}
{"current_steps": 367, "total_steps": 2525, "loss": 0.0089, "lr": 9.938008330222296e-05, "epoch": 3.633663366336634, "percentage": 14.53, "elapsed_time": "2:46:42", "remaining_time": "16:20:17"}
{"current_steps": 368, "total_steps": 2525, "loss": 0.0101, "lr": 9.936918289672774e-05, "epoch": 3.6435643564356437, "percentage": 14.57, "elapsed_time": "2:47:09", "remaining_time": "16:19:44"}
{"current_steps": 369, "total_steps": 2525, "loss": 0.0093, "lr": 9.93581880984124e-05, "epoch": 3.6534653465346536, "percentage": 14.61, "elapsed_time": "2:47:35", "remaining_time": "16:19:11"}
{"current_steps": 370, "total_steps": 2525, "loss": 0.0143, "lr": 9.934709892829875e-05, "epoch": 3.6633663366336635, "percentage": 14.65, "elapsed_time": "2:48:01", "remaining_time": "16:18:38"}
{"current_steps": 371, "total_steps": 2525, "loss": 0.0403, "lr": 9.933591540758907e-05, "epoch": 3.6732673267326734, "percentage": 14.69, "elapsed_time": "2:48:27", "remaining_time": "16:18:05"}
{"current_steps": 372, "total_steps": 2525, "loss": 0.0297, "lr": 9.932463755766599e-05, "epoch": 3.6831683168316833, "percentage": 14.73, "elapsed_time": "2:48:54", "remaining_time": "16:17:32"}
{"current_steps": 373, "total_steps": 2525, "loss": 0.0228, "lr": 9.931326540009253e-05, "epoch": 3.693069306930693, "percentage": 14.77, "elapsed_time": "2:49:20", "remaining_time": "16:16:59"}
{"current_steps": 374, "total_steps": 2525, "loss": 0.007, "lr": 9.930179895661201e-05, "epoch": 3.7029702970297027, "percentage": 14.81, "elapsed_time": "2:49:46", "remaining_time": "16:16:26"}
{"current_steps": 375, "total_steps": 2525, "loss": 0.017, "lr": 9.929023824914802e-05, "epoch": 3.7128712871287126, "percentage": 14.85, "elapsed_time": "2:50:12", "remaining_time": "16:15:54"}
{"current_steps": 375, "total_steps": 2525, "eval_loss": 0.018772218376398087, "epoch": 3.7128712871287126, "percentage": 14.85, "elapsed_time": "2:50:33", "remaining_time": "16:17:54"}
{"current_steps": 376, "total_steps": 2525, "loss": 0.0177, "lr": 9.927858329980439e-05, "epoch": 3.7227722772277225, "percentage": 14.89, "elapsed_time": "2:51:00", "remaining_time": "16:17:21"}
{"current_steps": 377, "total_steps": 2525, "loss": 0.0229, "lr": 9.926683413086514e-05, "epoch": 3.7326732673267324, "percentage": 14.93, "elapsed_time": "2:51:26", "remaining_time": "16:16:48"}
{"current_steps": 378, "total_steps": 2525, "loss": 0.0169, "lr": 9.925499076479441e-05, "epoch": 3.7425742574257423, "percentage": 14.97, "elapsed_time": "2:51:52", "remaining_time": "16:16:14"}
{"current_steps": 379, "total_steps": 2525, "loss": 0.034, "lr": 9.924305322423649e-05, "epoch": 3.7524752475247523, "percentage": 15.01, "elapsed_time": "2:52:19", "remaining_time": "16:15:42"}
{"current_steps": 380, "total_steps": 2525, "loss": 0.0098, "lr": 9.923102153201566e-05, "epoch": 3.762376237623762, "percentage": 15.05, "elapsed_time": "2:52:45", "remaining_time": "16:15:10"}
{"current_steps": 381, "total_steps": 2525, "loss": 0.0123, "lr": 9.921889571113628e-05, "epoch": 3.772277227722772, "percentage": 15.09, "elapsed_time": "2:53:11", "remaining_time": "16:14:37"}
{"current_steps": 382, "total_steps": 2525, "loss": 0.0202, "lr": 9.920667578478268e-05, "epoch": 3.782178217821782, "percentage": 15.13, "elapsed_time": "2:53:38", "remaining_time": "16:14:05"}
{"current_steps": 383, "total_steps": 2525, "loss": 0.0096, "lr": 9.919436177631907e-05, "epoch": 3.792079207920792, "percentage": 15.17, "elapsed_time": "2:54:04", "remaining_time": "16:13:32"}
{"current_steps": 384, "total_steps": 2525, "loss": 0.017, "lr": 9.918195370928957e-05, "epoch": 3.801980198019802, "percentage": 15.21, "elapsed_time": "2:54:30", "remaining_time": "16:12:59"}
{"current_steps": 385, "total_steps": 2525, "loss": 0.007, "lr": 9.916945160741817e-05, "epoch": 3.8118811881188117, "percentage": 15.25, "elapsed_time": "2:54:56", "remaining_time": "16:12:26"}
{"current_steps": 386, "total_steps": 2525, "loss": 0.0091, "lr": 9.915685549460861e-05, "epoch": 3.8217821782178216, "percentage": 15.29, "elapsed_time": "2:55:23", "remaining_time": "16:11:54"}
{"current_steps": 387, "total_steps": 2525, "loss": 0.009, "lr": 9.914416539494435e-05, "epoch": 3.8316831683168315, "percentage": 15.33, "elapsed_time": "2:55:49", "remaining_time": "16:11:21"}
{"current_steps": 388, "total_steps": 2525, "loss": 0.0082, "lr": 9.913138133268862e-05, "epoch": 3.8415841584158414, "percentage": 15.37, "elapsed_time": "2:56:15", "remaining_time": "16:10:49"}
{"current_steps": 389, "total_steps": 2525, "loss": 0.0159, "lr": 9.911850333228427e-05, "epoch": 3.8514851485148514, "percentage": 15.41, "elapsed_time": "2:56:42", "remaining_time": "16:10:16"}
{"current_steps": 390, "total_steps": 2525, "loss": 0.0179, "lr": 9.910553141835376e-05, "epoch": 3.8613861386138613, "percentage": 15.45, "elapsed_time": "2:57:08", "remaining_time": "16:09:44"}
{"current_steps": 391, "total_steps": 2525, "loss": 0.0192, "lr": 9.909246561569912e-05, "epoch": 3.871287128712871, "percentage": 15.49, "elapsed_time": "2:57:34", "remaining_time": "16:09:11"}
{"current_steps": 392, "total_steps": 2525, "loss": 0.0233, "lr": 9.907930594930185e-05, "epoch": 3.881188118811881, "percentage": 15.52, "elapsed_time": "2:58:01", "remaining_time": "16:08:39"}
{"current_steps": 393, "total_steps": 2525, "loss": 0.012, "lr": 9.9066052444323e-05, "epoch": 3.891089108910891, "percentage": 15.56, "elapsed_time": "2:58:27", "remaining_time": "16:08:06"}
{"current_steps": 394, "total_steps": 2525, "loss": 0.0279, "lr": 9.905270512610296e-05, "epoch": 3.900990099009901, "percentage": 15.6, "elapsed_time": "2:58:53", "remaining_time": "16:07:34"}
{"current_steps": 395, "total_steps": 2525, "loss": 0.0069, "lr": 9.903926402016153e-05, "epoch": 3.910891089108911, "percentage": 15.64, "elapsed_time": "2:59:19", "remaining_time": "16:07:01"}
{"current_steps": 396, "total_steps": 2525, "loss": 0.0073, "lr": 9.902572915219779e-05, "epoch": 3.9207920792079207, "percentage": 15.68, "elapsed_time": "2:59:46", "remaining_time": "16:06:29"}
{"current_steps": 397, "total_steps": 2525, "loss": 0.0181, "lr": 9.901210054809015e-05, "epoch": 3.9306930693069306, "percentage": 15.72, "elapsed_time": "3:00:12", "remaining_time": "16:05:56"}
{"current_steps": 398, "total_steps": 2525, "loss": 0.0078, "lr": 9.899837823389618e-05, "epoch": 3.9405940594059405, "percentage": 15.76, "elapsed_time": "3:00:38", "remaining_time": "16:05:24"}
{"current_steps": 399, "total_steps": 2525, "loss": 0.0132, "lr": 9.898456223585267e-05, "epoch": 3.9504950495049505, "percentage": 15.8, "elapsed_time": "3:01:05", "remaining_time": "16:04:52"}
{"current_steps": 400, "total_steps": 2525, "loss": 0.0315, "lr": 9.897065258037552e-05, "epoch": 3.9603960396039604, "percentage": 15.84, "elapsed_time": "3:01:31", "remaining_time": "16:04:20"}
{"current_steps": 400, "total_steps": 2525, "eval_loss": 0.018521126359701157, "epoch": 3.9603960396039604, "percentage": 15.84, "elapsed_time": "3:01:52", "remaining_time": "16:06:11"}
{"current_steps": 401, "total_steps": 2525, "loss": 0.0164, "lr": 9.895664929405966e-05, "epoch": 3.9702970297029703, "percentage": 15.88, "elapsed_time": "3:02:26", "remaining_time": "16:06:21"}
{"current_steps": 402, "total_steps": 2525, "loss": 0.015, "lr": 9.89425524036791e-05, "epoch": 3.98019801980198, "percentage": 15.92, "elapsed_time": "3:02:52", "remaining_time": "16:05:48"}
{"current_steps": 403, "total_steps": 2525, "loss": 0.012, "lr": 9.892836193618679e-05, "epoch": 3.99009900990099, "percentage": 15.96, "elapsed_time": "3:03:19", "remaining_time": "16:05:15"}
{"current_steps": 404, "total_steps": 2525, "loss": 0.009, "lr": 9.89140779187146e-05, "epoch": 4.0, "percentage": 16.0, "elapsed_time": "3:03:27", "remaining_time": "16:03:10"}
{"current_steps": 405, "total_steps": 2525, "loss": 0.0169, "lr": 9.889970037857324e-05, "epoch": 4.00990099009901, "percentage": 16.04, "elapsed_time": "3:03:54", "remaining_time": "16:02:40"}
{"current_steps": 406, "total_steps": 2525, "loss": 0.0201, "lr": 9.88852293432523e-05, "epoch": 4.01980198019802, "percentage": 16.08, "elapsed_time": "3:04:20", "remaining_time": "16:02:07"}
{"current_steps": 407, "total_steps": 2525, "loss": 0.0134, "lr": 9.887066484042007e-05, "epoch": 4.02970297029703, "percentage": 16.12, "elapsed_time": "3:04:46", "remaining_time": "16:01:35"}
{"current_steps": 408, "total_steps": 2525, "loss": 0.0063, "lr": 9.885600689792356e-05, "epoch": 4.03960396039604, "percentage": 16.16, "elapsed_time": "3:05:13", "remaining_time": "16:01:03"}
{"current_steps": 409, "total_steps": 2525, "loss": 0.0112, "lr": 9.884125554378845e-05, "epoch": 4.0495049504950495, "percentage": 16.2, "elapsed_time": "3:05:39", "remaining_time": "16:00:30"}
{"current_steps": 410, "total_steps": 2525, "loss": 0.0265, "lr": 9.882641080621902e-05, "epoch": 4.0594059405940595, "percentage": 16.24, "elapsed_time": "3:06:05", "remaining_time": "15:59:58"}
{"current_steps": 411, "total_steps": 2525, "loss": 0.0141, "lr": 9.881147271359807e-05, "epoch": 4.069306930693069, "percentage": 16.28, "elapsed_time": "3:06:31", "remaining_time": "15:59:26"}
{"current_steps": 412, "total_steps": 2525, "loss": 0.0072, "lr": 9.879644129448694e-05, "epoch": 4.079207920792079, "percentage": 16.32, "elapsed_time": "3:06:58", "remaining_time": "15:58:54"}
{"current_steps": 413, "total_steps": 2525, "loss": 0.0112, "lr": 9.878131657762535e-05, "epoch": 4.089108910891089, "percentage": 16.36, "elapsed_time": "3:07:24", "remaining_time": "15:58:22"}
{"current_steps": 414, "total_steps": 2525, "loss": 0.0057, "lr": 9.876609859193145e-05, "epoch": 4.099009900990099, "percentage": 16.4, "elapsed_time": "3:07:50", "remaining_time": "15:57:50"}
{"current_steps": 415, "total_steps": 2525, "loss": 0.0183, "lr": 9.875078736650172e-05, "epoch": 4.108910891089109, "percentage": 16.44, "elapsed_time": "3:08:17", "remaining_time": "15:57:18"}
{"current_steps": 416, "total_steps": 2525, "loss": 0.0148, "lr": 9.873538293061087e-05, "epoch": 4.118811881188119, "percentage": 16.48, "elapsed_time": "3:08:43", "remaining_time": "15:56:46"}
{"current_steps": 417, "total_steps": 2525, "loss": 0.006, "lr": 9.871988531371185e-05, "epoch": 4.128712871287129, "percentage": 16.51, "elapsed_time": "3:09:09", "remaining_time": "15:56:15"}
{"current_steps": 418, "total_steps": 2525, "loss": 0.0083, "lr": 9.870429454543582e-05, "epoch": 4.138613861386139, "percentage": 16.55, "elapsed_time": "3:09:36", "remaining_time": "15:55:42"}
{"current_steps": 419, "total_steps": 2525, "loss": 0.0157, "lr": 9.868861065559192e-05, "epoch": 4.148514851485149, "percentage": 16.59, "elapsed_time": "3:10:02", "remaining_time": "15:55:10"}
{"current_steps": 420, "total_steps": 2525, "loss": 0.0066, "lr": 9.867283367416747e-05, "epoch": 4.158415841584159, "percentage": 16.63, "elapsed_time": "3:10:28", "remaining_time": "15:54:38"}
{"current_steps": 421, "total_steps": 2525, "loss": 0.0144, "lr": 9.865696363132769e-05, "epoch": 4.1683168316831685, "percentage": 16.67, "elapsed_time": "3:10:54", "remaining_time": "15:54:06"}
{"current_steps": 422, "total_steps": 2525, "loss": 0.005, "lr": 9.864100055741576e-05, "epoch": 4.178217821782178, "percentage": 16.71, "elapsed_time": "3:11:21", "remaining_time": "15:53:34"}
{"current_steps": 423, "total_steps": 2525, "loss": 0.0066, "lr": 9.862494448295277e-05, "epoch": 4.188118811881188, "percentage": 16.75, "elapsed_time": "3:11:47", "remaining_time": "15:53:02"}
{"current_steps": 424, "total_steps": 2525, "loss": 0.0182, "lr": 9.860879543863755e-05, "epoch": 4.198019801980198, "percentage": 16.79, "elapsed_time": "3:12:13", "remaining_time": "15:52:31"}
{"current_steps": 425, "total_steps": 2525, "loss": 0.0156, "lr": 9.859255345534675e-05, "epoch": 4.207920792079208, "percentage": 16.83, "elapsed_time": "3:12:40", "remaining_time": "15:52:00"}
{"current_steps": 425, "total_steps": 2525, "eval_loss": 0.019263744354248047, "epoch": 4.207920792079208, "percentage": 16.83, "elapsed_time": "3:13:01", "remaining_time": "15:53:43"}
{"current_steps": 426, "total_steps": 2525, "loss": 0.0052, "lr": 9.857621856413469e-05, "epoch": 4.217821782178218, "percentage": 16.87, "elapsed_time": "3:13:27", "remaining_time": "15:53:11"}
{"current_steps": 427, "total_steps": 2525, "loss": 0.0118, "lr": 9.855979079623332e-05, "epoch": 4.227722772277228, "percentage": 16.91, "elapsed_time": "3:13:53", "remaining_time": "15:52:39"}
{"current_steps": 428, "total_steps": 2525, "loss": 0.0093, "lr": 9.85432701830522e-05, "epoch": 4.237623762376238, "percentage": 16.95, "elapsed_time": "3:14:19", "remaining_time": "15:52:08"}
{"current_steps": 429, "total_steps": 2525, "loss": 0.0174, "lr": 9.852665675617837e-05, "epoch": 4.247524752475248, "percentage": 16.99, "elapsed_time": "3:14:46", "remaining_time": "15:51:37"}
{"current_steps": 430, "total_steps": 2525, "loss": 0.0062, "lr": 9.850995054737637e-05, "epoch": 4.257425742574258, "percentage": 17.03, "elapsed_time": "3:15:12", "remaining_time": "15:51:04"}
{"current_steps": 431, "total_steps": 2525, "loss": 0.0067, "lr": 9.849315158858807e-05, "epoch": 4.267326732673268, "percentage": 17.07, "elapsed_time": "3:15:38", "remaining_time": "15:50:32"}
{"current_steps": 432, "total_steps": 2525, "loss": 0.019, "lr": 9.847625991193277e-05, "epoch": 4.2772277227722775, "percentage": 17.11, "elapsed_time": "3:16:05", "remaining_time": "15:50:00"}
{"current_steps": 433, "total_steps": 2525, "loss": 0.0275, "lr": 9.845927554970698e-05, "epoch": 4.287128712871287, "percentage": 17.15, "elapsed_time": "3:16:31", "remaining_time": "15:49:28"}
{"current_steps": 434, "total_steps": 2525, "loss": 0.0263, "lr": 9.84421985343844e-05, "epoch": 4.297029702970297, "percentage": 17.19, "elapsed_time": "3:16:57", "remaining_time": "15:48:56"}
{"current_steps": 435, "total_steps": 2525, "loss": 0.0063, "lr": 9.842502889861596e-05, "epoch": 4.306930693069307, "percentage": 17.23, "elapsed_time": "3:17:23", "remaining_time": "15:48:25"}
{"current_steps": 436, "total_steps": 2525, "loss": 0.0104, "lr": 9.840776667522962e-05, "epoch": 4.316831683168317, "percentage": 17.27, "elapsed_time": "3:17:50", "remaining_time": "15:47:53"}
{"current_steps": 437, "total_steps": 2525, "loss": 0.0113, "lr": 9.839041189723039e-05, "epoch": 4.326732673267327, "percentage": 17.31, "elapsed_time": "3:18:16", "remaining_time": "15:47:21"}
{"current_steps": 438, "total_steps": 2525, "loss": 0.0277, "lr": 9.837296459780022e-05, "epoch": 4.336633663366337, "percentage": 17.35, "elapsed_time": "3:18:42", "remaining_time": "15:46:49"}
{"current_steps": 439, "total_steps": 2525, "loss": 0.014, "lr": 9.835542481029798e-05, "epoch": 4.346534653465347, "percentage": 17.39, "elapsed_time": "3:19:09", "remaining_time": "15:46:18"}
{"current_steps": 440, "total_steps": 2525, "loss": 0.014, "lr": 9.833779256825937e-05, "epoch": 4.356435643564357, "percentage": 17.43, "elapsed_time": "3:19:35", "remaining_time": "15:45:47"}
{"current_steps": 441, "total_steps": 2525, "loss": 0.0075, "lr": 9.832006790539685e-05, "epoch": 4.366336633663367, "percentage": 17.47, "elapsed_time": "3:20:01", "remaining_time": "15:45:15"}
{"current_steps": 442, "total_steps": 2525, "loss": 0.0106, "lr": 9.830225085559961e-05, "epoch": 4.376237623762377, "percentage": 17.5, "elapsed_time": "3:20:27", "remaining_time": "15:44:43"}
{"current_steps": 443, "total_steps": 2525, "loss": 0.02, "lr": 9.828434145293346e-05, "epoch": 4.3861386138613865, "percentage": 17.54, "elapsed_time": "3:20:54", "remaining_time": "15:44:12"}
{"current_steps": 444, "total_steps": 2525, "loss": 0.0122, "lr": 9.826633973164079e-05, "epoch": 4.396039603960396, "percentage": 17.58, "elapsed_time": "3:21:20", "remaining_time": "15:43:41"}
{"current_steps": 445, "total_steps": 2525, "loss": 0.0134, "lr": 9.824824572614051e-05, "epoch": 4.405940594059406, "percentage": 17.62, "elapsed_time": "3:21:47", "remaining_time": "15:43:10"}
{"current_steps": 446, "total_steps": 2525, "loss": 0.0056, "lr": 9.823005947102797e-05, "epoch": 4.415841584158416, "percentage": 17.66, "elapsed_time": "3:22:13", "remaining_time": "15:42:39"}
{"current_steps": 447, "total_steps": 2525, "loss": 0.0211, "lr": 9.821178100107489e-05, "epoch": 4.425742574257426, "percentage": 17.7, "elapsed_time": "3:22:39", "remaining_time": "15:42:07"}
{"current_steps": 448, "total_steps": 2525, "loss": 0.0065, "lr": 9.819341035122933e-05, "epoch": 4.435643564356436, "percentage": 17.74, "elapsed_time": "3:23:05", "remaining_time": "15:41:35"}
{"current_steps": 449, "total_steps": 2525, "loss": 0.0164, "lr": 9.817494755661558e-05, "epoch": 4.445544554455446, "percentage": 17.78, "elapsed_time": "3:23:32", "remaining_time": "15:41:04"}
{"current_steps": 450, "total_steps": 2525, "loss": 0.0059, "lr": 9.815639265253409e-05, "epoch": 4.455445544554456, "percentage": 17.82, "elapsed_time": "3:23:58", "remaining_time": "15:40:33"}
{"current_steps": 450, "total_steps": 2525, "eval_loss": 0.01967804692685604, "epoch": 4.455445544554456, "percentage": 17.82, "elapsed_time": "3:24:19", "remaining_time": "15:42:09"}
{"current_steps": 451, "total_steps": 2525, "loss": 0.0064, "lr": 9.813774567446145e-05, "epoch": 4.465346534653466, "percentage": 17.86, "elapsed_time": "3:24:45", "remaining_time": "15:41:37"}
{"current_steps": 452, "total_steps": 2525, "loss": 0.0167, "lr": 9.811900665805029e-05, "epoch": 4.475247524752476, "percentage": 17.9, "elapsed_time": "3:25:11", "remaining_time": "15:41:06"}
{"current_steps": 453, "total_steps": 2525, "loss": 0.0062, "lr": 9.81001756391292e-05, "epoch": 4.485148514851485, "percentage": 17.94, "elapsed_time": "3:25:38", "remaining_time": "15:40:34"}
{"current_steps": 454, "total_steps": 2525, "loss": 0.0082, "lr": 9.808125265370269e-05, "epoch": 4.4950495049504955, "percentage": 17.98, "elapsed_time": "3:26:04", "remaining_time": "15:40:02"}
{"current_steps": 455, "total_steps": 2525, "loss": 0.0083, "lr": 9.806223773795108e-05, "epoch": 4.5049504950495045, "percentage": 18.02, "elapsed_time": "3:26:30", "remaining_time": "15:39:30"}
{"current_steps": 456, "total_steps": 2525, "loss": 0.0131, "lr": 9.804313092823049e-05, "epoch": 4.514851485148515, "percentage": 18.06, "elapsed_time": "3:26:57", "remaining_time": "15:38:59"}
{"current_steps": 457, "total_steps": 2525, "loss": 0.0086, "lr": 9.802393226107278e-05, "epoch": 4.524752475247524, "percentage": 18.1, "elapsed_time": "3:27:23", "remaining_time": "15:38:28"}
{"current_steps": 458, "total_steps": 2525, "loss": 0.0131, "lr": 9.800464177318531e-05, "epoch": 4.534653465346535, "percentage": 18.14, "elapsed_time": "3:27:49", "remaining_time": "15:37:56"}
{"current_steps": 459, "total_steps": 2525, "loss": 0.0056, "lr": 9.798525950145115e-05, "epoch": 4.544554455445544, "percentage": 18.18, "elapsed_time": "3:28:15", "remaining_time": "15:37:25"}
{"current_steps": 460, "total_steps": 2525, "loss": 0.0113, "lr": 9.796578548292874e-05, "epoch": 4.554455445544555, "percentage": 18.22, "elapsed_time": "3:28:42", "remaining_time": "15:36:53"}
{"current_steps": 461, "total_steps": 2525, "loss": 0.0081, "lr": 9.794621975485201e-05, "epoch": 4.564356435643564, "percentage": 18.26, "elapsed_time": "3:29:08", "remaining_time": "15:36:22"}
{"current_steps": 462, "total_steps": 2525, "loss": 0.0091, "lr": 9.79265623546302e-05, "epoch": 4.574257425742574, "percentage": 18.3, "elapsed_time": "3:29:34", "remaining_time": "15:35:50"}
{"current_steps": 463, "total_steps": 2525, "loss": 0.0217, "lr": 9.790681331984785e-05, "epoch": 4.584158415841584, "percentage": 18.34, "elapsed_time": "3:30:01", "remaining_time": "15:35:19"}
{"current_steps": 464, "total_steps": 2525, "loss": 0.0067, "lr": 9.78869726882647e-05, "epoch": 4.594059405940594, "percentage": 18.38, "elapsed_time": "3:30:27", "remaining_time": "15:34:48"}
{"current_steps": 465, "total_steps": 2525, "loss": 0.017, "lr": 9.786704049781558e-05, "epoch": 4.603960396039604, "percentage": 18.42, "elapsed_time": "3:30:53", "remaining_time": "15:34:17"}
{"current_steps": 466, "total_steps": 2525, "loss": 0.006, "lr": 9.784701678661045e-05, "epoch": 4.6138613861386135, "percentage": 18.46, "elapsed_time": "3:31:20", "remaining_time": "15:33:46"}
{"current_steps": 467, "total_steps": 2525, "loss": 0.0214, "lr": 9.782690159293419e-05, "epoch": 4.623762376237623, "percentage": 18.5, "elapsed_time": "3:31:46", "remaining_time": "15:33:15"}
{"current_steps": 468, "total_steps": 2525, "loss": 0.0068, "lr": 9.780669495524661e-05, "epoch": 4.633663366336633, "percentage": 18.53, "elapsed_time": "3:32:12", "remaining_time": "15:32:44"}
{"current_steps": 469, "total_steps": 2525, "loss": 0.0132, "lr": 9.77863969121824e-05, "epoch": 4.643564356435643, "percentage": 18.57, "elapsed_time": "3:32:39", "remaining_time": "15:32:13"}
{"current_steps": 470, "total_steps": 2525, "loss": 0.0104, "lr": 9.776600750255099e-05, "epoch": 4.653465346534653, "percentage": 18.61, "elapsed_time": "3:33:05", "remaining_time": "15:31:42"}
{"current_steps": 471, "total_steps": 2525, "loss": 0.019, "lr": 9.774552676533644e-05, "epoch": 4.663366336633663, "percentage": 18.65, "elapsed_time": "3:33:31", "remaining_time": "15:31:11"}
{"current_steps": 472, "total_steps": 2525, "loss": 0.0185, "lr": 9.772495473969751e-05, "epoch": 4.673267326732673, "percentage": 18.69, "elapsed_time": "3:33:58", "remaining_time": "15:30:39"}
{"current_steps": 473, "total_steps": 2525, "loss": 0.013, "lr": 9.77042914649675e-05, "epoch": 4.683168316831683, "percentage": 18.73, "elapsed_time": "3:34:24", "remaining_time": "15:30:08"}
{"current_steps": 474, "total_steps": 2525, "loss": 0.0111, "lr": 9.768353698065412e-05, "epoch": 4.693069306930693, "percentage": 18.77, "elapsed_time": "3:34:50", "remaining_time": "15:29:37"}
{"current_steps": 475, "total_steps": 2525, "loss": 0.0136, "lr": 9.766269132643951e-05, "epoch": 4.702970297029703, "percentage": 18.81, "elapsed_time": "3:35:16", "remaining_time": "15:29:06"}
{"current_steps": 475, "total_steps": 2525, "eval_loss": 0.019799688830971718, "epoch": 4.702970297029703, "percentage": 18.81, "elapsed_time": "3:35:37", "remaining_time": "15:30:36"}
{"current_steps": 476, "total_steps": 2525, "loss": 0.0163, "lr": 9.76417545421801e-05, "epoch": 4.712871287128713, "percentage": 18.85, "elapsed_time": "3:36:04", "remaining_time": "15:30:05"}
{"current_steps": 477, "total_steps": 2525, "loss": 0.0245, "lr": 9.762072666790658e-05, "epoch": 4.7227722772277225, "percentage": 18.89, "elapsed_time": "3:36:30", "remaining_time": "15:29:34"}
{"current_steps": 478, "total_steps": 2525, "loss": 0.0142, "lr": 9.75996077438238e-05, "epoch": 4.732673267326732, "percentage": 18.93, "elapsed_time": "3:36:56", "remaining_time": "15:29:03"}
{"current_steps": 479, "total_steps": 2525, "loss": 0.0114, "lr": 9.757839781031069e-05, "epoch": 4.742574257425742, "percentage": 18.97, "elapsed_time": "3:37:23", "remaining_time": "15:28:31"}
{"current_steps": 480, "total_steps": 2525, "loss": 0.0095, "lr": 9.755709690792017e-05, "epoch": 4.752475247524752, "percentage": 19.01, "elapsed_time": "3:37:49", "remaining_time": "15:28:00"}
{"current_steps": 481, "total_steps": 2525, "loss": 0.0223, "lr": 9.753570507737914e-05, "epoch": 4.762376237623762, "percentage": 19.05, "elapsed_time": "3:38:15", "remaining_time": "15:27:29"}
{"current_steps": 482, "total_steps": 2525, "loss": 0.0196, "lr": 9.751422235958829e-05, "epoch": 4.772277227722772, "percentage": 19.09, "elapsed_time": "3:38:42", "remaining_time": "15:26:58"}
{"current_steps": 483, "total_steps": 2525, "loss": 0.0275, "lr": 9.749264879562216e-05, "epoch": 4.782178217821782, "percentage": 19.13, "elapsed_time": "3:39:08", "remaining_time": "15:26:27"}
{"current_steps": 484, "total_steps": 2525, "loss": 0.0197, "lr": 9.74709844267289e-05, "epoch": 4.792079207920792, "percentage": 19.17, "elapsed_time": "3:39:34", "remaining_time": "15:25:56"}
{"current_steps": 485, "total_steps": 2525, "loss": 0.018, "lr": 9.744922929433033e-05, "epoch": 4.801980198019802, "percentage": 19.21, "elapsed_time": "3:40:00", "remaining_time": "15:25:25"}
{"current_steps": 486, "total_steps": 2525, "loss": 0.0185, "lr": 9.74273834400218e-05, "epoch": 4.811881188118812, "percentage": 19.25, "elapsed_time": "3:40:27", "remaining_time": "15:24:54"}
{"current_steps": 487, "total_steps": 2525, "loss": 0.0284, "lr": 9.740544690557213e-05, "epoch": 4.821782178217822, "percentage": 19.29, "elapsed_time": "3:40:53", "remaining_time": "15:24:22"}
{"current_steps": 488, "total_steps": 2525, "loss": 0.0319, "lr": 9.738341973292349e-05, "epoch": 4.8316831683168315, "percentage": 19.33, "elapsed_time": "3:41:19", "remaining_time": "15:23:51"}
{"current_steps": 489, "total_steps": 2525, "loss": 0.0139, "lr": 9.736130196419135e-05, "epoch": 4.841584158415841, "percentage": 19.37, "elapsed_time": "3:41:45", "remaining_time": "15:23:20"}
{"current_steps": 490, "total_steps": 2525, "loss": 0.0078, "lr": 9.733909364166442e-05, "epoch": 4.851485148514851, "percentage": 19.41, "elapsed_time": "3:42:12", "remaining_time": "15:22:49"}
{"current_steps": 491, "total_steps": 2525, "loss": 0.0175, "lr": 9.731679480780456e-05, "epoch": 4.861386138613861, "percentage": 19.45, "elapsed_time": "3:42:38", "remaining_time": "15:22:18"}
{"current_steps": 492, "total_steps": 2525, "loss": 0.0065, "lr": 9.729440550524664e-05, "epoch": 4.871287128712871, "percentage": 19.49, "elapsed_time": "3:43:04", "remaining_time": "15:21:47"}
{"current_steps": 493, "total_steps": 2525, "loss": 0.0126, "lr": 9.727192577679851e-05, "epoch": 4.881188118811881, "percentage": 19.52, "elapsed_time": "3:43:30", "remaining_time": "15:21:16"}
{"current_steps": 494, "total_steps": 2525, "loss": 0.0365, "lr": 9.724935566544098e-05, "epoch": 4.891089108910891, "percentage": 19.56, "elapsed_time": "3:43:57", "remaining_time": "15:20:45"}
{"current_steps": 495, "total_steps": 2525, "loss": 0.0219, "lr": 9.722669521432757e-05, "epoch": 4.900990099009901, "percentage": 19.6, "elapsed_time": "3:44:23", "remaining_time": "15:20:13"}
{"current_steps": 496, "total_steps": 2525, "loss": 0.0147, "lr": 9.720394446678458e-05, "epoch": 4.910891089108911, "percentage": 19.64, "elapsed_time": "3:44:49", "remaining_time": "15:19:42"}
{"current_steps": 497, "total_steps": 2525, "loss": 0.0152, "lr": 9.718110346631099e-05, "epoch": 4.920792079207921, "percentage": 19.68, "elapsed_time": "3:45:16", "remaining_time": "15:19:11"}
{"current_steps": 498, "total_steps": 2525, "loss": 0.0117, "lr": 9.715817225657827e-05, "epoch": 4.930693069306931, "percentage": 19.72, "elapsed_time": "3:45:42", "remaining_time": "15:18:41"}
{"current_steps": 499, "total_steps": 2525, "loss": 0.0099, "lr": 9.713515088143042e-05, "epoch": 4.9405940594059405, "percentage": 19.76, "elapsed_time": "3:46:08", "remaining_time": "15:18:10"}
{"current_steps": 500, "total_steps": 2525, "loss": 0.0092, "lr": 9.71120393848838e-05, "epoch": 4.9504950495049505, "percentage": 19.8, "elapsed_time": "3:46:35", "remaining_time": "15:17:39"}
{"current_steps": 500, "total_steps": 2525, "eval_loss": 0.021699432283639908, "epoch": 4.9504950495049505, "percentage": 19.8, "elapsed_time": "3:46:56", "remaining_time": "15:19:05"}
{"current_steps": 501, "total_steps": 2525, "loss": 0.0138, "lr": 9.70888378111271e-05, "epoch": 4.96039603960396, "percentage": 19.84, "elapsed_time": "3:47:30", "remaining_time": "15:19:06"}
{"current_steps": 502, "total_steps": 2525, "loss": 0.0065, "lr": 9.706554620452125e-05, "epoch": 4.97029702970297, "percentage": 19.88, "elapsed_time": "3:47:56", "remaining_time": "15:18:35"}
{"current_steps": 503, "total_steps": 2525, "loss": 0.013, "lr": 9.704216460959929e-05, "epoch": 4.98019801980198, "percentage": 19.92, "elapsed_time": "3:48:23", "remaining_time": "15:18:04"}
{"current_steps": 504, "total_steps": 2525, "loss": 0.0208, "lr": 9.701869307106633e-05, "epoch": 4.99009900990099, "percentage": 19.96, "elapsed_time": "3:48:49", "remaining_time": "15:17:32"}
{"current_steps": 505, "total_steps": 2525, "loss": 0.0146, "lr": 9.699513163379943e-05, "epoch": 5.0, "percentage": 20.0, "elapsed_time": "3:48:57", "remaining_time": "15:15:51"}
{"current_steps": 506, "total_steps": 2525, "loss": 0.0117, "lr": 9.697148034284759e-05, "epoch": 5.00990099009901, "percentage": 20.04, "elapsed_time": "3:49:24", "remaining_time": "15:15:21"}
{"current_steps": 507, "total_steps": 2525, "loss": 0.0052, "lr": 9.694773924343154e-05, "epoch": 5.01980198019802, "percentage": 20.08, "elapsed_time": "3:49:50", "remaining_time": "15:14:50"}
{"current_steps": 508, "total_steps": 2525, "loss": 0.0121, "lr": 9.692390838094377e-05, "epoch": 5.02970297029703, "percentage": 20.12, "elapsed_time": "3:50:16", "remaining_time": "15:14:19"}
{"current_steps": 509, "total_steps": 2525, "loss": 0.0261, "lr": 9.689998780094837e-05, "epoch": 5.03960396039604, "percentage": 20.16, "elapsed_time": "3:50:43", "remaining_time": "15:13:50"}
{"current_steps": 510, "total_steps": 2525, "loss": 0.006, "lr": 9.687597754918099e-05, "epoch": 5.0495049504950495, "percentage": 20.2, "elapsed_time": "3:51:09", "remaining_time": "15:13:19"}
{"current_steps": 511, "total_steps": 2525, "loss": 0.0067, "lr": 9.68518776715487e-05, "epoch": 5.0594059405940595, "percentage": 20.24, "elapsed_time": "3:51:36", "remaining_time": "15:12:48"}
{"current_steps": 512, "total_steps": 2525, "loss": 0.0067, "lr": 9.682768821412997e-05, "epoch": 5.069306930693069, "percentage": 20.28, "elapsed_time": "3:52:02", "remaining_time": "15:12:17"}
{"current_steps": 513, "total_steps": 2525, "loss": 0.0079, "lr": 9.68034092231745e-05, "epoch": 5.079207920792079, "percentage": 20.32, "elapsed_time": "3:52:28", "remaining_time": "15:11:46"}
{"current_steps": 514, "total_steps": 2525, "loss": 0.0199, "lr": 9.677904074510322e-05, "epoch": 5.089108910891089, "percentage": 20.36, "elapsed_time": "3:52:54", "remaining_time": "15:11:15"}
{"current_steps": 515, "total_steps": 2525, "loss": 0.0121, "lr": 9.675458282650813e-05, "epoch": 5.099009900990099, "percentage": 20.4, "elapsed_time": "3:53:21", "remaining_time": "15:10:45"}
{"current_steps": 516, "total_steps": 2525, "loss": 0.0063, "lr": 9.673003551415224e-05, "epoch": 5.108910891089109, "percentage": 20.44, "elapsed_time": "3:53:47", "remaining_time": "15:10:14"}
{"current_steps": 517, "total_steps": 2525, "loss": 0.0207, "lr": 9.67053988549695e-05, "epoch": 5.118811881188119, "percentage": 20.48, "elapsed_time": "3:54:13", "remaining_time": "15:09:43"}
{"current_steps": 518, "total_steps": 2525, "loss": 0.012, "lr": 9.668067289606466e-05, "epoch": 5.128712871287129, "percentage": 20.51, "elapsed_time": "3:54:40", "remaining_time": "15:09:13"}
{"current_steps": 519, "total_steps": 2525, "loss": 0.0052, "lr": 9.665585768471324e-05, "epoch": 5.138613861386139, "percentage": 20.55, "elapsed_time": "3:55:06", "remaining_time": "15:08:43"}
{"current_steps": 520, "total_steps": 2525, "loss": 0.0226, "lr": 9.663095326836138e-05, "epoch": 5.148514851485149, "percentage": 20.59, "elapsed_time": "3:55:32", "remaining_time": "15:08:13"}
{"current_steps": 521, "total_steps": 2525, "loss": 0.0157, "lr": 9.660595969462578e-05, "epoch": 5.158415841584159, "percentage": 20.63, "elapsed_time": "3:55:59", "remaining_time": "15:07:42"}
{"current_steps": 522, "total_steps": 2525, "loss": 0.0052, "lr": 9.658087701129365e-05, "epoch": 5.1683168316831685, "percentage": 20.67, "elapsed_time": "3:56:25", "remaining_time": "15:07:11"}
{"current_steps": 523, "total_steps": 2525, "loss": 0.0129, "lr": 9.655570526632252e-05, "epoch": 5.178217821782178, "percentage": 20.71, "elapsed_time": "3:56:51", "remaining_time": "15:06:41"}
{"current_steps": 524, "total_steps": 2525, "loss": 0.0177, "lr": 9.653044450784023e-05, "epoch": 5.188118811881188, "percentage": 20.75, "elapsed_time": "3:57:18", "remaining_time": "15:06:11"}
{"current_steps": 525, "total_steps": 2525, "loss": 0.008, "lr": 9.650509478414482e-05, "epoch": 5.198019801980198, "percentage": 20.79, "elapsed_time": "3:57:44", "remaining_time": "15:05:41"}
{"current_steps": 525, "total_steps": 2525, "eval_loss": 0.01887640729546547, "epoch": 5.198019801980198, "percentage": 20.79, "elapsed_time": "3:58:05", "remaining_time": "15:07:00"}
{"current_steps": 525, "total_steps": 2525, "epoch": 5.198019801980198, "percentage": 20.79, "elapsed_time": "3:58:05", "remaining_time": "15:07:02"}