File size: 11,458 Bytes
dfdcb70 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 |
{"current_steps": 10, "total_steps": 450, "loss": 0.3017, "lr": 9.987820251299122e-05, "epoch": 0.022222222222222223, "percentage": 2.22, "elapsed_time": "0:01:08", "remaining_time": "0:50:10"}
{"current_steps": 20, "total_steps": 450, "loss": 0.0063, "lr": 9.951340343707852e-05, "epoch": 0.044444444444444446, "percentage": 4.44, "elapsed_time": "0:02:16", "remaining_time": "0:48:45"}
{"current_steps": 30, "total_steps": 450, "loss": 0.0041, "lr": 9.890738003669029e-05, "epoch": 0.06666666666666667, "percentage": 6.67, "elapsed_time": "0:03:24", "remaining_time": "0:47:36"}
{"current_steps": 30, "total_steps": 450, "eval_loss": 0.004034009762108326, "epoch": 0.06666666666666667, "percentage": 6.67, "elapsed_time": "0:05:08", "remaining_time": "1:11:53"}
{"current_steps": 40, "total_steps": 450, "loss": 0.004, "lr": 9.806308479691595e-05, "epoch": 0.08888888888888889, "percentage": 8.89, "elapsed_time": "0:06:16", "remaining_time": "1:04:15"}
{"current_steps": 50, "total_steps": 450, "loss": 0.004, "lr": 9.698463103929542e-05, "epoch": 0.1111111111111111, "percentage": 11.11, "elapsed_time": "0:07:24", "remaining_time": "0:59:14"}
{"current_steps": 60, "total_steps": 450, "loss": 0.0039, "lr": 9.567727288213005e-05, "epoch": 0.13333333333333333, "percentage": 13.33, "elapsed_time": "0:08:32", "remaining_time": "0:55:30"}
{"current_steps": 60, "total_steps": 450, "eval_loss": 0.0039054970256984234, "epoch": 0.13333333333333333, "percentage": 13.33, "elapsed_time": "0:10:16", "remaining_time": "1:06:46"}
{"current_steps": 70, "total_steps": 450, "loss": 0.0039, "lr": 9.414737964294636e-05, "epoch": 0.15555555555555556, "percentage": 15.56, "elapsed_time": "0:11:24", "remaining_time": "1:01:55"}
{"current_steps": 80, "total_steps": 450, "loss": 0.0039, "lr": 9.24024048078213e-05, "epoch": 0.17777777777777778, "percentage": 17.78, "elapsed_time": "0:12:32", "remaining_time": "0:58:00"}
{"current_steps": 90, "total_steps": 450, "loss": 0.0039, "lr": 9.045084971874738e-05, "epoch": 0.2, "percentage": 20.0, "elapsed_time": "0:13:40", "remaining_time": "0:54:42"}
{"current_steps": 90, "total_steps": 450, "eval_loss": 0.0038894277531653643, "epoch": 0.2, "percentage": 20.0, "elapsed_time": "0:16:30", "remaining_time": "1:06:01"}
{"current_steps": 100, "total_steps": 450, "loss": 0.0039, "lr": 8.83022221559489e-05, "epoch": 0.2222222222222222, "percentage": 22.22, "elapsed_time": "0:18:36", "remaining_time": "1:05:08"}
{"current_steps": 110, "total_steps": 450, "loss": 0.0039, "lr": 8.596699001693255e-05, "epoch": 0.24444444444444444, "percentage": 24.44, "elapsed_time": "0:19:44", "remaining_time": "1:01:01"}
{"current_steps": 120, "total_steps": 450, "loss": 0.0039, "lr": 8.345653031794292e-05, "epoch": 0.26666666666666666, "percentage": 26.67, "elapsed_time": "0:20:52", "remaining_time": "0:57:25"}
{"current_steps": 120, "total_steps": 450, "eval_loss": 0.00390805397182703, "epoch": 0.26666666666666666, "percentage": 26.67, "elapsed_time": "0:22:37", "remaining_time": "1:02:11"}
{"current_steps": 130, "total_steps": 450, "loss": 0.0039, "lr": 8.07830737662829e-05, "epoch": 0.28888888888888886, "percentage": 28.89, "elapsed_time": "0:23:45", "remaining_time": "0:58:27"}
{"current_steps": 140, "total_steps": 450, "loss": 0.0039, "lr": 7.795964517353735e-05, "epoch": 0.3111111111111111, "percentage": 31.11, "elapsed_time": "0:24:53", "remaining_time": "0:55:06"}
{"current_steps": 150, "total_steps": 450, "loss": 0.0038, "lr": 7.500000000000001e-05, "epoch": 0.3333333333333333, "percentage": 33.33, "elapsed_time": "0:26:01", "remaining_time": "0:52:02"}
{"current_steps": 150, "total_steps": 450, "eval_loss": 0.00407786201685667, "epoch": 0.3333333333333333, "percentage": 33.33, "elapsed_time": "0:27:45", "remaining_time": "0:55:30"}
{"current_steps": 160, "total_steps": 450, "loss": 0.0039, "lr": 7.191855733945387e-05, "epoch": 0.35555555555555557, "percentage": 35.56, "elapsed_time": "0:28:53", "remaining_time": "0:52:21"}
{"current_steps": 170, "total_steps": 450, "loss": 0.0039, "lr": 6.873032967079561e-05, "epoch": 0.37777777777777777, "percentage": 37.78, "elapsed_time": "0:30:01", "remaining_time": "0:49:27"}
{"current_steps": 180, "total_steps": 450, "loss": 0.0038, "lr": 6.545084971874738e-05, "epoch": 0.4, "percentage": 40.0, "elapsed_time": "0:31:09", "remaining_time": "0:46:44"}
{"current_steps": 180, "total_steps": 450, "eval_loss": 0.0037861280143260956, "epoch": 0.4, "percentage": 40.0, "elapsed_time": "0:32:53", "remaining_time": "0:49:20"}
{"current_steps": 190, "total_steps": 450, "loss": 0.0037, "lr": 6.209609477998338e-05, "epoch": 0.4222222222222222, "percentage": 42.22, "elapsed_time": "0:34:01", "remaining_time": "0:46:34"}
{"current_steps": 200, "total_steps": 450, "loss": 0.0034, "lr": 5.868240888334653e-05, "epoch": 0.4444444444444444, "percentage": 44.44, "elapsed_time": "0:35:09", "remaining_time": "0:43:57"}
{"current_steps": 210, "total_steps": 450, "loss": 0.003, "lr": 5.522642316338268e-05, "epoch": 0.4666666666666667, "percentage": 46.67, "elapsed_time": "0:36:18", "remaining_time": "0:41:29"}
{"current_steps": 210, "total_steps": 450, "eval_loss": 0.002776140347123146, "epoch": 0.4666666666666667, "percentage": 46.67, "elapsed_time": "0:38:02", "remaining_time": "0:43:28"}
{"current_steps": 220, "total_steps": 450, "loss": 0.0031, "lr": 5.174497483512506e-05, "epoch": 0.4888888888888889, "percentage": 48.89, "elapsed_time": "0:39:10", "remaining_time": "0:40:56"}
{"current_steps": 230, "total_steps": 450, "loss": 0.0028, "lr": 4.825502516487497e-05, "epoch": 0.5111111111111111, "percentage": 51.11, "elapsed_time": "0:40:18", "remaining_time": "0:38:33"}
{"current_steps": 240, "total_steps": 450, "loss": 0.0029, "lr": 4.477357683661734e-05, "epoch": 0.5333333333333333, "percentage": 53.33, "elapsed_time": "0:41:26", "remaining_time": "0:36:15"}
{"current_steps": 240, "total_steps": 450, "eval_loss": 0.0026384310331195593, "epoch": 0.5333333333333333, "percentage": 53.33, "elapsed_time": "0:43:10", "remaining_time": "0:37:46"}
{"current_steps": 250, "total_steps": 450, "loss": 0.0028, "lr": 4.131759111665349e-05, "epoch": 0.5555555555555556, "percentage": 55.56, "elapsed_time": "0:44:18", "remaining_time": "0:35:26"}
{"current_steps": 260, "total_steps": 450, "loss": 0.0027, "lr": 3.790390522001662e-05, "epoch": 0.5777777777777777, "percentage": 57.78, "elapsed_time": "0:45:26", "remaining_time": "0:33:12"}
{"current_steps": 270, "total_steps": 450, "loss": 0.0027, "lr": 3.4549150281252636e-05, "epoch": 0.6, "percentage": 60.0, "elapsed_time": "0:46:34", "remaining_time": "0:31:02"}
{"current_steps": 270, "total_steps": 450, "eval_loss": 0.0025762419681996107, "epoch": 0.6, "percentage": 60.0, "elapsed_time": "0:48:18", "remaining_time": "0:32:12"}
{"current_steps": 280, "total_steps": 450, "loss": 0.0027, "lr": 3.12696703292044e-05, "epoch": 0.6222222222222222, "percentage": 62.22, "elapsed_time": "0:49:26", "remaining_time": "0:30:01"}
{"current_steps": 290, "total_steps": 450, "loss": 0.0024, "lr": 2.8081442660546125e-05, "epoch": 0.6444444444444445, "percentage": 64.44, "elapsed_time": "0:50:34", "remaining_time": "0:27:54"}
{"current_steps": 300, "total_steps": 450, "loss": 0.0027, "lr": 2.500000000000001e-05, "epoch": 0.6666666666666666, "percentage": 66.67, "elapsed_time": "0:51:42", "remaining_time": "0:25:51"}
{"current_steps": 300, "total_steps": 450, "eval_loss": 0.002488846192136407, "epoch": 0.6666666666666666, "percentage": 66.67, "elapsed_time": "0:53:26", "remaining_time": "0:26:43"}
{"current_steps": 310, "total_steps": 450, "loss": 0.0024, "lr": 2.2040354826462668e-05, "epoch": 0.6888888888888889, "percentage": 68.89, "elapsed_time": "0:54:34", "remaining_time": "0:24:38"}
{"current_steps": 320, "total_steps": 450, "loss": 0.0029, "lr": 1.9216926233717085e-05, "epoch": 0.7111111111111111, "percentage": 71.11, "elapsed_time": "0:55:42", "remaining_time": "0:22:37"}
{"current_steps": 330, "total_steps": 450, "loss": 0.0027, "lr": 1.6543469682057106e-05, "epoch": 0.7333333333333333, "percentage": 73.33, "elapsed_time": "0:56:50", "remaining_time": "0:20:40"}
{"current_steps": 330, "total_steps": 450, "eval_loss": 0.002476006979122758, "epoch": 0.7333333333333333, "percentage": 73.33, "elapsed_time": "0:58:34", "remaining_time": "0:21:18"}
{"current_steps": 340, "total_steps": 450, "loss": 0.0025, "lr": 1.4033009983067452e-05, "epoch": 0.7555555555555555, "percentage": 75.56, "elapsed_time": "0:59:42", "remaining_time": "0:19:19"}
{"current_steps": 350, "total_steps": 450, "loss": 0.0028, "lr": 1.1697777844051105e-05, "epoch": 0.7777777777777778, "percentage": 77.78, "elapsed_time": "1:00:50", "remaining_time": "0:17:23"}
{"current_steps": 360, "total_steps": 450, "loss": 0.0026, "lr": 9.549150281252633e-06, "epoch": 0.8, "percentage": 80.0, "elapsed_time": "1:01:58", "remaining_time": "0:15:29"}
{"current_steps": 360, "total_steps": 450, "eval_loss": 0.0024831434711813927, "epoch": 0.8, "percentage": 80.0, "elapsed_time": "1:03:42", "remaining_time": "0:15:55"}
{"current_steps": 370, "total_steps": 450, "loss": 0.0028, "lr": 7.597595192178702e-06, "epoch": 0.8222222222222222, "percentage": 82.22, "elapsed_time": "1:04:50", "remaining_time": "0:14:01"}
{"current_steps": 380, "total_steps": 450, "loss": 0.0023, "lr": 5.852620357053651e-06, "epoch": 0.8444444444444444, "percentage": 84.44, "elapsed_time": "1:05:58", "remaining_time": "0:12:09"}
{"current_steps": 390, "total_steps": 450, "loss": 0.0026, "lr": 4.322727117869951e-06, "epoch": 0.8666666666666667, "percentage": 86.67, "elapsed_time": "1:07:07", "remaining_time": "0:10:19"}
{"current_steps": 390, "total_steps": 450, "eval_loss": 0.0023999777622520924, "epoch": 0.8666666666666667, "percentage": 86.67, "elapsed_time": "1:08:51", "remaining_time": "0:10:35"}
{"current_steps": 400, "total_steps": 450, "loss": 0.0025, "lr": 3.0153689607045845e-06, "epoch": 0.8888888888888888, "percentage": 88.89, "elapsed_time": "1:09:59", "remaining_time": "0:08:44"}
{"current_steps": 410, "total_steps": 450, "loss": 0.0028, "lr": 1.9369152030840556e-06, "epoch": 0.9111111111111111, "percentage": 91.11, "elapsed_time": "1:11:07", "remaining_time": "0:06:56"}
{"current_steps": 420, "total_steps": 450, "loss": 0.0024, "lr": 1.0926199633097157e-06, "epoch": 0.9333333333333333, "percentage": 93.33, "elapsed_time": "1:12:15", "remaining_time": "0:05:09"}
{"current_steps": 420, "total_steps": 450, "eval_loss": 0.002397245028987527, "epoch": 0.9333333333333333, "percentage": 93.33, "elapsed_time": "1:13:59", "remaining_time": "0:05:17"}
{"current_steps": 430, "total_steps": 450, "loss": 0.0024, "lr": 4.865965629214819e-07, "epoch": 0.9555555555555556, "percentage": 95.56, "elapsed_time": "1:15:07", "remaining_time": "0:03:29"}
{"current_steps": 440, "total_steps": 450, "loss": 0.0023, "lr": 1.2179748700879012e-07, "epoch": 0.9777777777777777, "percentage": 97.78, "elapsed_time": "1:16:15", "remaining_time": "0:01:43"}
{"current_steps": 450, "total_steps": 450, "loss": 0.0025, "lr": 0.0, "epoch": 1.0, "percentage": 100.0, "elapsed_time": "1:17:23", "remaining_time": "0:00:00"}
{"current_steps": 450, "total_steps": 450, "eval_loss": 0.0023939567618072033, "epoch": 1.0, "percentage": 100.0, "elapsed_time": "1:19:07", "remaining_time": "0:00:00"}
{"current_steps": 450, "total_steps": 450, "epoch": 1.0, "percentage": 100.0, "elapsed_time": "1:19:09", "remaining_time": "0:00:00"}
|