Training in progress, epoch 3
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4877660776
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2a1a657e58d0376878b368730aaf4d17b43c84d20486f60a84c29a7c45cad5c0
|
3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4932751008
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:84e9c0314f8dac47c4983a232e0f97fbb9c9dbe3e65707e436724ffc5d0e4802
|
3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4330865200
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8398ac509ddf86ddc30bb5a64f8b7d5635ed9654dd4e9b150fdac5cb2ce53821
|
3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1089994880
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0ea3a55d7741ae8fff53a95ae5250da1dfafbef02749a456c108b4eac279f0ce
|
3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
@@ -269,3 +269,136 @@
|
|
269 |
{"current_steps": 2680, "total_steps": 4023, "loss": 0.4804, "lr": 5e-06, "epoch": 1.9985085756897838, "percentage": 66.62, "elapsed_time": "9:58:18", "remaining_time": "4:59:49"}
|
270 |
{"current_steps": 2682, "total_steps": 4023, "eval_loss": 0.5512435436248779, "epoch": 2.0, "percentage": 66.67, "elapsed_time": "10:04:26", "remaining_time": "5:02:13"}
|
271 |
{"current_steps": 2690, "total_steps": 4023, "loss": 0.4215, "lr": 5e-06, "epoch": 2.005965697240865, "percentage": 66.87, "elapsed_time": "10:07:20", "remaining_time": "5:00:57"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
269 |
{"current_steps": 2680, "total_steps": 4023, "loss": 0.4804, "lr": 5e-06, "epoch": 1.9985085756897838, "percentage": 66.62, "elapsed_time": "9:58:18", "remaining_time": "4:59:49"}
|
270 |
{"current_steps": 2682, "total_steps": 4023, "eval_loss": 0.5512435436248779, "epoch": 2.0, "percentage": 66.67, "elapsed_time": "10:04:26", "remaining_time": "5:02:13"}
|
271 |
{"current_steps": 2690, "total_steps": 4023, "loss": 0.4215, "lr": 5e-06, "epoch": 2.005965697240865, "percentage": 66.87, "elapsed_time": "10:07:20", "remaining_time": "5:00:57"}
|
272 |
+
{"current_steps": 2700, "total_steps": 4023, "loss": 0.4033, "lr": 5e-06, "epoch": 2.0134228187919465, "percentage": 67.11, "elapsed_time": "10:09:32", "remaining_time": "4:58:40"}
|
273 |
+
{"current_steps": 2710, "total_steps": 4023, "loss": 0.3907, "lr": 5e-06, "epoch": 2.0208799403430278, "percentage": 67.36, "elapsed_time": "10:11:45", "remaining_time": "4:56:23"}
|
274 |
+
{"current_steps": 2720, "total_steps": 4023, "loss": 0.3977, "lr": 5e-06, "epoch": 2.028337061894109, "percentage": 67.61, "elapsed_time": "10:13:58", "remaining_time": "4:54:07"}
|
275 |
+
{"current_steps": 2730, "total_steps": 4023, "loss": 0.4112, "lr": 5e-06, "epoch": 2.0357941834451903, "percentage": 67.86, "elapsed_time": "10:16:10", "remaining_time": "4:51:50"}
|
276 |
+
{"current_steps": 2740, "total_steps": 4023, "loss": 0.4176, "lr": 5e-06, "epoch": 2.0432513049962715, "percentage": 68.11, "elapsed_time": "10:18:23", "remaining_time": "4:49:33"}
|
277 |
+
{"current_steps": 2750, "total_steps": 4023, "loss": 0.4026, "lr": 5e-06, "epoch": 2.0507084265473527, "percentage": 68.36, "elapsed_time": "10:20:35", "remaining_time": "4:47:16"}
|
278 |
+
{"current_steps": 2760, "total_steps": 4023, "loss": 0.409, "lr": 5e-06, "epoch": 2.058165548098434, "percentage": 68.61, "elapsed_time": "10:22:48", "remaining_time": "4:45:00"}
|
279 |
+
{"current_steps": 2770, "total_steps": 4023, "loss": 0.4024, "lr": 5e-06, "epoch": 2.0656226696495152, "percentage": 68.85, "elapsed_time": "10:25:01", "remaining_time": "4:42:43"}
|
280 |
+
{"current_steps": 2780, "total_steps": 4023, "loss": 0.4175, "lr": 5e-06, "epoch": 2.0730797912005965, "percentage": 69.1, "elapsed_time": "10:27:13", "remaining_time": "4:40:26"}
|
281 |
+
{"current_steps": 2790, "total_steps": 4023, "loss": 0.403, "lr": 5e-06, "epoch": 2.0805369127516777, "percentage": 69.35, "elapsed_time": "10:29:26", "remaining_time": "4:38:10"}
|
282 |
+
{"current_steps": 2800, "total_steps": 4023, "loss": 0.413, "lr": 5e-06, "epoch": 2.087994034302759, "percentage": 69.6, "elapsed_time": "10:31:39", "remaining_time": "4:35:53"}
|
283 |
+
{"current_steps": 2810, "total_steps": 4023, "loss": 0.4159, "lr": 5e-06, "epoch": 2.0954511558538402, "percentage": 69.85, "elapsed_time": "10:33:52", "remaining_time": "4:33:37"}
|
284 |
+
{"current_steps": 2820, "total_steps": 4023, "loss": 0.4107, "lr": 5e-06, "epoch": 2.1029082774049215, "percentage": 70.1, "elapsed_time": "10:36:04", "remaining_time": "4:31:21"}
|
285 |
+
{"current_steps": 2830, "total_steps": 4023, "loss": 0.415, "lr": 5e-06, "epoch": 2.110365398956003, "percentage": 70.35, "elapsed_time": "10:38:17", "remaining_time": "4:29:04"}
|
286 |
+
{"current_steps": 2840, "total_steps": 4023, "loss": 0.415, "lr": 5e-06, "epoch": 2.1178225205070844, "percentage": 70.59, "elapsed_time": "10:40:30", "remaining_time": "4:26:48"}
|
287 |
+
{"current_steps": 2850, "total_steps": 4023, "loss": 0.4096, "lr": 5e-06, "epoch": 2.1252796420581657, "percentage": 70.84, "elapsed_time": "10:42:43", "remaining_time": "4:24:31"}
|
288 |
+
{"current_steps": 2860, "total_steps": 4023, "loss": 0.4015, "lr": 5e-06, "epoch": 2.132736763609247, "percentage": 71.09, "elapsed_time": "10:44:55", "remaining_time": "4:22:15"}
|
289 |
+
{"current_steps": 2870, "total_steps": 4023, "loss": 0.4068, "lr": 5e-06, "epoch": 2.140193885160328, "percentage": 71.34, "elapsed_time": "10:47:08", "remaining_time": "4:19:58"}
|
290 |
+
{"current_steps": 2880, "total_steps": 4023, "loss": 0.4215, "lr": 5e-06, "epoch": 2.1476510067114094, "percentage": 71.59, "elapsed_time": "10:49:20", "remaining_time": "4:17:42"}
|
291 |
+
{"current_steps": 2890, "total_steps": 4023, "loss": 0.4141, "lr": 5e-06, "epoch": 2.1551081282624907, "percentage": 71.84, "elapsed_time": "10:51:33", "remaining_time": "4:15:26"}
|
292 |
+
{"current_steps": 2900, "total_steps": 4023, "loss": 0.407, "lr": 5e-06, "epoch": 2.162565249813572, "percentage": 72.09, "elapsed_time": "10:53:45", "remaining_time": "4:13:09"}
|
293 |
+
{"current_steps": 2910, "total_steps": 4023, "loss": 0.417, "lr": 5e-06, "epoch": 2.170022371364653, "percentage": 72.33, "elapsed_time": "10:55:58", "remaining_time": "4:10:53"}
|
294 |
+
{"current_steps": 2920, "total_steps": 4023, "loss": 0.4225, "lr": 5e-06, "epoch": 2.1774794929157344, "percentage": 72.58, "elapsed_time": "10:58:11", "remaining_time": "4:08:37"}
|
295 |
+
{"current_steps": 2930, "total_steps": 4023, "loss": 0.4138, "lr": 5e-06, "epoch": 2.1849366144668156, "percentage": 72.83, "elapsed_time": "11:00:23", "remaining_time": "4:06:21"}
|
296 |
+
{"current_steps": 2940, "total_steps": 4023, "loss": 0.4112, "lr": 5e-06, "epoch": 2.192393736017897, "percentage": 73.08, "elapsed_time": "11:02:36", "remaining_time": "4:04:04"}
|
297 |
+
{"current_steps": 2950, "total_steps": 4023, "loss": 0.4208, "lr": 5e-06, "epoch": 2.1998508575689786, "percentage": 73.33, "elapsed_time": "11:04:48", "remaining_time": "4:01:48"}
|
298 |
+
{"current_steps": 2960, "total_steps": 4023, "loss": 0.4167, "lr": 5e-06, "epoch": 2.20730797912006, "percentage": 73.58, "elapsed_time": "11:07:01", "remaining_time": "3:59:32"}
|
299 |
+
{"current_steps": 2970, "total_steps": 4023, "loss": 0.413, "lr": 5e-06, "epoch": 2.214765100671141, "percentage": 73.83, "elapsed_time": "11:09:13", "remaining_time": "3:57:16"}
|
300 |
+
{"current_steps": 2980, "total_steps": 4023, "loss": 0.4126, "lr": 5e-06, "epoch": 2.2222222222222223, "percentage": 74.07, "elapsed_time": "11:11:26", "remaining_time": "3:55:00"}
|
301 |
+
{"current_steps": 2990, "total_steps": 4023, "loss": 0.4189, "lr": 5e-06, "epoch": 2.2296793437733036, "percentage": 74.32, "elapsed_time": "11:13:38", "remaining_time": "3:52:44"}
|
302 |
+
{"current_steps": 3000, "total_steps": 4023, "loss": 0.416, "lr": 5e-06, "epoch": 2.237136465324385, "percentage": 74.57, "elapsed_time": "11:15:51", "remaining_time": "3:50:27"}
|
303 |
+
{"current_steps": 3010, "total_steps": 4023, "loss": 0.4182, "lr": 5e-06, "epoch": 2.244593586875466, "percentage": 74.82, "elapsed_time": "11:18:03", "remaining_time": "3:48:11"}
|
304 |
+
{"current_steps": 3020, "total_steps": 4023, "loss": 0.4401, "lr": 5e-06, "epoch": 2.2520507084265473, "percentage": 75.07, "elapsed_time": "11:20:16", "remaining_time": "3:45:55"}
|
305 |
+
{"current_steps": 3030, "total_steps": 4023, "loss": 0.4093, "lr": 5e-06, "epoch": 2.2595078299776286, "percentage": 75.32, "elapsed_time": "11:22:28", "remaining_time": "3:43:39"}
|
306 |
+
{"current_steps": 3040, "total_steps": 4023, "loss": 0.4201, "lr": 5e-06, "epoch": 2.26696495152871, "percentage": 75.57, "elapsed_time": "11:24:41", "remaining_time": "3:41:23"}
|
307 |
+
{"current_steps": 3050, "total_steps": 4023, "loss": 0.4216, "lr": 5e-06, "epoch": 2.274422073079791, "percentage": 75.81, "elapsed_time": "11:26:54", "remaining_time": "3:39:08"}
|
308 |
+
{"current_steps": 3060, "total_steps": 4023, "loss": 0.4225, "lr": 5e-06, "epoch": 2.2818791946308723, "percentage": 76.06, "elapsed_time": "11:29:06", "remaining_time": "3:36:52"}
|
309 |
+
{"current_steps": 3070, "total_steps": 4023, "loss": 0.4187, "lr": 5e-06, "epoch": 2.289336316181954, "percentage": 76.31, "elapsed_time": "11:31:19", "remaining_time": "3:34:36"}
|
310 |
+
{"current_steps": 3080, "total_steps": 4023, "loss": 0.4238, "lr": 5e-06, "epoch": 2.2967934377330352, "percentage": 76.56, "elapsed_time": "11:33:32", "remaining_time": "3:32:20"}
|
311 |
+
{"current_steps": 3090, "total_steps": 4023, "loss": 0.4219, "lr": 5e-06, "epoch": 2.3042505592841165, "percentage": 76.81, "elapsed_time": "11:35:44", "remaining_time": "3:30:04"}
|
312 |
+
{"current_steps": 3100, "total_steps": 4023, "loss": 0.4246, "lr": 5e-06, "epoch": 2.3117076808351977, "percentage": 77.06, "elapsed_time": "11:37:57", "remaining_time": "3:27:48"}
|
313 |
+
{"current_steps": 3110, "total_steps": 4023, "loss": 0.4071, "lr": 5e-06, "epoch": 2.319164802386279, "percentage": 77.31, "elapsed_time": "11:40:09", "remaining_time": "3:25:32"}
|
314 |
+
{"current_steps": 3120, "total_steps": 4023, "loss": 0.4114, "lr": 5e-06, "epoch": 2.3266219239373602, "percentage": 77.55, "elapsed_time": "11:42:22", "remaining_time": "3:23:16"}
|
315 |
+
{"current_steps": 3130, "total_steps": 4023, "loss": 0.4154, "lr": 5e-06, "epoch": 2.3340790454884415, "percentage": 77.8, "elapsed_time": "11:44:34", "remaining_time": "3:21:01"}
|
316 |
+
{"current_steps": 3140, "total_steps": 4023, "loss": 0.4342, "lr": 5e-06, "epoch": 2.3415361670395227, "percentage": 78.05, "elapsed_time": "11:46:47", "remaining_time": "3:18:45"}
|
317 |
+
{"current_steps": 3150, "total_steps": 4023, "loss": 0.4115, "lr": 5e-06, "epoch": 2.348993288590604, "percentage": 78.3, "elapsed_time": "11:48:59", "remaining_time": "3:16:29"}
|
318 |
+
{"current_steps": 3160, "total_steps": 4023, "loss": 0.4129, "lr": 5e-06, "epoch": 2.356450410141685, "percentage": 78.55, "elapsed_time": "11:51:11", "remaining_time": "3:14:13"}
|
319 |
+
{"current_steps": 3170, "total_steps": 4023, "loss": 0.4116, "lr": 5e-06, "epoch": 2.3639075316927665, "percentage": 78.8, "elapsed_time": "11:53:24", "remaining_time": "3:11:58"}
|
320 |
+
{"current_steps": 3180, "total_steps": 4023, "loss": 0.4257, "lr": 5e-06, "epoch": 2.3713646532438477, "percentage": 79.05, "elapsed_time": "11:55:36", "remaining_time": "3:09:42"}
|
321 |
+
{"current_steps": 3190, "total_steps": 4023, "loss": 0.4332, "lr": 5e-06, "epoch": 2.378821774794929, "percentage": 79.29, "elapsed_time": "11:57:49", "remaining_time": "3:07:26"}
|
322 |
+
{"current_steps": 3200, "total_steps": 4023, "loss": 0.4166, "lr": 5e-06, "epoch": 2.3862788963460106, "percentage": 79.54, "elapsed_time": "12:00:01", "remaining_time": "3:05:10"}
|
323 |
+
{"current_steps": 3210, "total_steps": 4023, "loss": 0.4214, "lr": 5e-06, "epoch": 2.393736017897092, "percentage": 79.79, "elapsed_time": "12:02:13", "remaining_time": "3:02:55"}
|
324 |
+
{"current_steps": 3220, "total_steps": 4023, "loss": 0.4175, "lr": 5e-06, "epoch": 2.401193139448173, "percentage": 80.04, "elapsed_time": "12:04:26", "remaining_time": "3:00:39"}
|
325 |
+
{"current_steps": 3230, "total_steps": 4023, "loss": 0.4205, "lr": 5e-06, "epoch": 2.4086502609992544, "percentage": 80.29, "elapsed_time": "12:06:38", "remaining_time": "2:58:23"}
|
326 |
+
{"current_steps": 3240, "total_steps": 4023, "loss": 0.4106, "lr": 5e-06, "epoch": 2.4161073825503356, "percentage": 80.54, "elapsed_time": "12:08:51", "remaining_time": "2:56:08"}
|
327 |
+
{"current_steps": 3250, "total_steps": 4023, "loss": 0.435, "lr": 5e-06, "epoch": 2.423564504101417, "percentage": 80.79, "elapsed_time": "12:11:03", "remaining_time": "2:53:52"}
|
328 |
+
{"current_steps": 3260, "total_steps": 4023, "loss": 0.4148, "lr": 5e-06, "epoch": 2.431021625652498, "percentage": 81.03, "elapsed_time": "12:13:15", "remaining_time": "2:51:37"}
|
329 |
+
{"current_steps": 3270, "total_steps": 4023, "loss": 0.4071, "lr": 5e-06, "epoch": 2.4384787472035794, "percentage": 81.28, "elapsed_time": "12:15:28", "remaining_time": "2:49:21"}
|
330 |
+
{"current_steps": 3280, "total_steps": 4023, "loss": 0.4222, "lr": 5e-06, "epoch": 2.4459358687546606, "percentage": 81.53, "elapsed_time": "12:17:40", "remaining_time": "2:47:06"}
|
331 |
+
{"current_steps": 3290, "total_steps": 4023, "loss": 0.4152, "lr": 5e-06, "epoch": 2.453392990305742, "percentage": 81.78, "elapsed_time": "12:19:52", "remaining_time": "2:44:50"}
|
332 |
+
{"current_steps": 3300, "total_steps": 4023, "loss": 0.4051, "lr": 5e-06, "epoch": 2.460850111856823, "percentage": 82.03, "elapsed_time": "12:22:05", "remaining_time": "2:42:35"}
|
333 |
+
{"current_steps": 3310, "total_steps": 4023, "loss": 0.4221, "lr": 5e-06, "epoch": 2.4683072334079044, "percentage": 82.28, "elapsed_time": "12:24:17", "remaining_time": "2:40:19"}
|
334 |
+
{"current_steps": 3320, "total_steps": 4023, "loss": 0.4116, "lr": 5e-06, "epoch": 2.4757643549589856, "percentage": 82.53, "elapsed_time": "12:26:29", "remaining_time": "2:38:04"}
|
335 |
+
{"current_steps": 3330, "total_steps": 4023, "loss": 0.4211, "lr": 5e-06, "epoch": 2.4832214765100673, "percentage": 82.77, "elapsed_time": "12:28:42", "remaining_time": "2:35:48"}
|
336 |
+
{"current_steps": 3340, "total_steps": 4023, "loss": 0.4176, "lr": 5e-06, "epoch": 2.4906785980611486, "percentage": 83.02, "elapsed_time": "12:30:54", "remaining_time": "2:33:33"}
|
337 |
+
{"current_steps": 3350, "total_steps": 4023, "loss": 0.4283, "lr": 5e-06, "epoch": 2.49813571961223, "percentage": 83.27, "elapsed_time": "12:33:06", "remaining_time": "2:31:17"}
|
338 |
+
{"current_steps": 3360, "total_steps": 4023, "loss": 0.4207, "lr": 5e-06, "epoch": 2.505592841163311, "percentage": 83.52, "elapsed_time": "12:35:19", "remaining_time": "2:29:02"}
|
339 |
+
{"current_steps": 3370, "total_steps": 4023, "loss": 0.4239, "lr": 5e-06, "epoch": 2.5130499627143923, "percentage": 83.77, "elapsed_time": "12:37:31", "remaining_time": "2:26:47"}
|
340 |
+
{"current_steps": 3380, "total_steps": 4023, "loss": 0.4266, "lr": 5e-06, "epoch": 2.5205070842654735, "percentage": 84.02, "elapsed_time": "12:39:43", "remaining_time": "2:24:31"}
|
341 |
+
{"current_steps": 3390, "total_steps": 4023, "loss": 0.4262, "lr": 5e-06, "epoch": 2.527964205816555, "percentage": 84.27, "elapsed_time": "12:41:56", "remaining_time": "2:22:16"}
|
342 |
+
{"current_steps": 3400, "total_steps": 4023, "loss": 0.4082, "lr": 5e-06, "epoch": 2.535421327367636, "percentage": 84.51, "elapsed_time": "12:44:08", "remaining_time": "2:20:01"}
|
343 |
+
{"current_steps": 3410, "total_steps": 4023, "loss": 0.4123, "lr": 5e-06, "epoch": 2.5428784489187173, "percentage": 84.76, "elapsed_time": "12:46:20", "remaining_time": "2:17:45"}
|
344 |
+
{"current_steps": 3420, "total_steps": 4023, "loss": 0.4177, "lr": 5e-06, "epoch": 2.5503355704697985, "percentage": 85.01, "elapsed_time": "12:48:33", "remaining_time": "2:15:30"}
|
345 |
+
{"current_steps": 3430, "total_steps": 4023, "loss": 0.4238, "lr": 5e-06, "epoch": 2.5577926920208798, "percentage": 85.26, "elapsed_time": "12:50:45", "remaining_time": "2:13:15"}
|
346 |
+
{"current_steps": 3440, "total_steps": 4023, "loss": 0.4333, "lr": 5e-06, "epoch": 2.5652498135719615, "percentage": 85.51, "elapsed_time": "12:52:58", "remaining_time": "2:11:00"}
|
347 |
+
{"current_steps": 3450, "total_steps": 4023, "loss": 0.4253, "lr": 5e-06, "epoch": 2.5727069351230423, "percentage": 85.76, "elapsed_time": "12:55:10", "remaining_time": "2:08:44"}
|
348 |
+
{"current_steps": 3460, "total_steps": 4023, "loss": 0.4249, "lr": 5e-06, "epoch": 2.580164056674124, "percentage": 86.01, "elapsed_time": "12:57:23", "remaining_time": "2:06:29"}
|
349 |
+
{"current_steps": 3470, "total_steps": 4023, "loss": 0.4177, "lr": 5e-06, "epoch": 2.587621178225205, "percentage": 86.25, "elapsed_time": "12:59:35", "remaining_time": "2:04:14"}
|
350 |
+
{"current_steps": 3480, "total_steps": 4023, "loss": 0.4161, "lr": 5e-06, "epoch": 2.5950782997762865, "percentage": 86.5, "elapsed_time": "13:01:48", "remaining_time": "2:01:59"}
|
351 |
+
{"current_steps": 3490, "total_steps": 4023, "loss": 0.4163, "lr": 5e-06, "epoch": 2.6025354213273677, "percentage": 86.75, "elapsed_time": "13:04:00", "remaining_time": "1:59:44"}
|
352 |
+
{"current_steps": 3500, "total_steps": 4023, "loss": 0.4186, "lr": 5e-06, "epoch": 2.609992542878449, "percentage": 87.0, "elapsed_time": "13:06:13", "remaining_time": "1:57:29"}
|
353 |
+
{"current_steps": 3510, "total_steps": 4023, "loss": 0.428, "lr": 5e-06, "epoch": 2.61744966442953, "percentage": 87.25, "elapsed_time": "13:08:25", "remaining_time": "1:55:13"}
|
354 |
+
{"current_steps": 3520, "total_steps": 4023, "loss": 0.4171, "lr": 5e-06, "epoch": 2.6249067859806114, "percentage": 87.5, "elapsed_time": "13:10:37", "remaining_time": "1:52:58"}
|
355 |
+
{"current_steps": 3530, "total_steps": 4023, "loss": 0.4208, "lr": 5e-06, "epoch": 2.6323639075316927, "percentage": 87.75, "elapsed_time": "13:12:50", "remaining_time": "1:50:43"}
|
356 |
+
{"current_steps": 3540, "total_steps": 4023, "loss": 0.4232, "lr": 5e-06, "epoch": 2.639821029082774, "percentage": 87.99, "elapsed_time": "13:15:02", "remaining_time": "1:48:28"}
|
357 |
+
{"current_steps": 3550, "total_steps": 4023, "loss": 0.4145, "lr": 5e-06, "epoch": 2.647278150633855, "percentage": 88.24, "elapsed_time": "13:17:14", "remaining_time": "1:46:13"}
|
358 |
+
{"current_steps": 3560, "total_steps": 4023, "loss": 0.428, "lr": 5e-06, "epoch": 2.6547352721849364, "percentage": 88.49, "elapsed_time": "13:19:27", "remaining_time": "1:43:58"}
|
359 |
+
{"current_steps": 3570, "total_steps": 4023, "loss": 0.4271, "lr": 5e-06, "epoch": 2.662192393736018, "percentage": 88.74, "elapsed_time": "13:21:39", "remaining_time": "1:41:43"}
|
360 |
+
{"current_steps": 3580, "total_steps": 4023, "loss": 0.4153, "lr": 5e-06, "epoch": 2.669649515287099, "percentage": 88.99, "elapsed_time": "13:23:52", "remaining_time": "1:39:28"}
|
361 |
+
{"current_steps": 3590, "total_steps": 4023, "loss": 0.4157, "lr": 5e-06, "epoch": 2.6771066368381806, "percentage": 89.24, "elapsed_time": "13:26:04", "remaining_time": "1:37:13"}
|
362 |
+
{"current_steps": 3600, "total_steps": 4023, "loss": 0.427, "lr": 5e-06, "epoch": 2.684563758389262, "percentage": 89.49, "elapsed_time": "13:28:16", "remaining_time": "1:34:58"}
|
363 |
+
{"current_steps": 3610, "total_steps": 4023, "loss": 0.4141, "lr": 5e-06, "epoch": 2.692020879940343, "percentage": 89.73, "elapsed_time": "13:30:29", "remaining_time": "1:32:43"}
|
364 |
+
{"current_steps": 3620, "total_steps": 4023, "loss": 0.4169, "lr": 5e-06, "epoch": 2.6994780014914244, "percentage": 89.98, "elapsed_time": "13:32:41", "remaining_time": "1:30:28"}
|
365 |
+
{"current_steps": 3630, "total_steps": 4023, "loss": 0.4363, "lr": 5e-06, "epoch": 2.7069351230425056, "percentage": 90.23, "elapsed_time": "13:34:54", "remaining_time": "1:28:13"}
|
366 |
+
{"current_steps": 3640, "total_steps": 4023, "loss": 0.4247, "lr": 5e-06, "epoch": 2.714392244593587, "percentage": 90.48, "elapsed_time": "13:37:06", "remaining_time": "1:25:58"}
|
367 |
+
{"current_steps": 3650, "total_steps": 4023, "loss": 0.4275, "lr": 5e-06, "epoch": 2.721849366144668, "percentage": 90.73, "elapsed_time": "13:39:18", "remaining_time": "1:23:43"}
|
368 |
+
{"current_steps": 3660, "total_steps": 4023, "loss": 0.4294, "lr": 5e-06, "epoch": 2.7293064876957494, "percentage": 90.98, "elapsed_time": "13:41:31", "remaining_time": "1:21:28"}
|
369 |
+
{"current_steps": 3670, "total_steps": 4023, "loss": 0.4274, "lr": 5e-06, "epoch": 2.7367636092468306, "percentage": 91.23, "elapsed_time": "13:43:43", "remaining_time": "1:19:13"}
|
370 |
+
{"current_steps": 3680, "total_steps": 4023, "loss": 0.4184, "lr": 5e-06, "epoch": 2.744220730797912, "percentage": 91.47, "elapsed_time": "13:45:56", "remaining_time": "1:16:58"}
|
371 |
+
{"current_steps": 3690, "total_steps": 4023, "loss": 0.4172, "lr": 5e-06, "epoch": 2.751677852348993, "percentage": 91.72, "elapsed_time": "13:48:08", "remaining_time": "1:14:44"}
|
372 |
+
{"current_steps": 3700, "total_steps": 4023, "loss": 0.4189, "lr": 5e-06, "epoch": 2.759134973900075, "percentage": 91.97, "elapsed_time": "13:50:21", "remaining_time": "1:12:29"}
|
373 |
+
{"current_steps": 3710, "total_steps": 4023, "loss": 0.4219, "lr": 5e-06, "epoch": 2.7665920954511556, "percentage": 92.22, "elapsed_time": "13:52:33", "remaining_time": "1:10:14"}
|
374 |
+
{"current_steps": 3720, "total_steps": 4023, "loss": 0.4199, "lr": 5e-06, "epoch": 2.7740492170022373, "percentage": 92.47, "elapsed_time": "13:54:46", "remaining_time": "1:07:59"}
|
375 |
+
{"current_steps": 3730, "total_steps": 4023, "loss": 0.417, "lr": 5e-06, "epoch": 2.7815063385533185, "percentage": 92.72, "elapsed_time": "13:56:58", "remaining_time": "1:05:44"}
|
376 |
+
{"current_steps": 3740, "total_steps": 4023, "loss": 0.4247, "lr": 5e-06, "epoch": 2.7889634601043998, "percentage": 92.97, "elapsed_time": "13:59:11", "remaining_time": "1:03:30"}
|
377 |
+
{"current_steps": 3750, "total_steps": 4023, "loss": 0.4185, "lr": 5e-06, "epoch": 2.796420581655481, "percentage": 93.21, "elapsed_time": "14:01:23", "remaining_time": "1:01:15"}
|
378 |
+
{"current_steps": 3760, "total_steps": 4023, "loss": 0.4289, "lr": 5e-06, "epoch": 2.8038777032065623, "percentage": 93.46, "elapsed_time": "14:03:36", "remaining_time": "0:59:00"}
|
379 |
+
{"current_steps": 3770, "total_steps": 4023, "loss": 0.4295, "lr": 5e-06, "epoch": 2.8113348247576435, "percentage": 93.71, "elapsed_time": "14:05:48", "remaining_time": "0:56:45"}
|
380 |
+
{"current_steps": 3780, "total_steps": 4023, "loss": 0.4278, "lr": 5e-06, "epoch": 2.8187919463087248, "percentage": 93.96, "elapsed_time": "14:08:01", "remaining_time": "0:54:30"}
|
381 |
+
{"current_steps": 3790, "total_steps": 4023, "loss": 0.4194, "lr": 5e-06, "epoch": 2.826249067859806, "percentage": 94.21, "elapsed_time": "14:10:13", "remaining_time": "0:52:16"}
|
382 |
+
{"current_steps": 3800, "total_steps": 4023, "loss": 0.4191, "lr": 5e-06, "epoch": 2.8337061894108873, "percentage": 94.46, "elapsed_time": "14:12:26", "remaining_time": "0:50:01"}
|
383 |
+
{"current_steps": 3810, "total_steps": 4023, "loss": 0.4249, "lr": 5e-06, "epoch": 2.841163310961969, "percentage": 94.71, "elapsed_time": "14:14:39", "remaining_time": "0:47:46"}
|
384 |
+
{"current_steps": 3820, "total_steps": 4023, "loss": 0.4141, "lr": 5e-06, "epoch": 2.8486204325130497, "percentage": 94.95, "elapsed_time": "14:16:51", "remaining_time": "0:45:32"}
|
385 |
+
{"current_steps": 3830, "total_steps": 4023, "loss": 0.4226, "lr": 5e-06, "epoch": 2.8560775540641314, "percentage": 95.2, "elapsed_time": "14:19:04", "remaining_time": "0:43:17"}
|
386 |
+
{"current_steps": 3840, "total_steps": 4023, "loss": 0.4237, "lr": 5e-06, "epoch": 2.8635346756152127, "percentage": 95.45, "elapsed_time": "14:21:16", "remaining_time": "0:41:02"}
|
387 |
+
{"current_steps": 3850, "total_steps": 4023, "loss": 0.4247, "lr": 5e-06, "epoch": 2.870991797166294, "percentage": 95.7, "elapsed_time": "14:23:28", "remaining_time": "0:38:48"}
|
388 |
+
{"current_steps": 3860, "total_steps": 4023, "loss": 0.4259, "lr": 5e-06, "epoch": 2.878448918717375, "percentage": 95.95, "elapsed_time": "14:25:41", "remaining_time": "0:36:33"}
|
389 |
+
{"current_steps": 3870, "total_steps": 4023, "loss": 0.4307, "lr": 5e-06, "epoch": 2.8859060402684564, "percentage": 96.2, "elapsed_time": "14:27:53", "remaining_time": "0:34:18"}
|
390 |
+
{"current_steps": 3880, "total_steps": 4023, "loss": 0.4302, "lr": 5e-06, "epoch": 2.8933631618195377, "percentage": 96.45, "elapsed_time": "14:30:06", "remaining_time": "0:32:04"}
|
391 |
+
{"current_steps": 3890, "total_steps": 4023, "loss": 0.4197, "lr": 5e-06, "epoch": 2.900820283370619, "percentage": 96.69, "elapsed_time": "14:32:18", "remaining_time": "0:29:49"}
|
392 |
+
{"current_steps": 3900, "total_steps": 4023, "loss": 0.4196, "lr": 5e-06, "epoch": 2.9082774049217, "percentage": 96.94, "elapsed_time": "14:34:31", "remaining_time": "0:27:34"}
|
393 |
+
{"current_steps": 3910, "total_steps": 4023, "loss": 0.4234, "lr": 5e-06, "epoch": 2.9157345264727814, "percentage": 97.19, "elapsed_time": "14:36:43", "remaining_time": "0:25:20"}
|
394 |
+
{"current_steps": 3920, "total_steps": 4023, "loss": 0.4155, "lr": 5e-06, "epoch": 2.9231916480238627, "percentage": 97.44, "elapsed_time": "14:38:56", "remaining_time": "0:23:05"}
|
395 |
+
{"current_steps": 3930, "total_steps": 4023, "loss": 0.4245, "lr": 5e-06, "epoch": 2.930648769574944, "percentage": 97.69, "elapsed_time": "14:41:08", "remaining_time": "0:20:51"}
|
396 |
+
{"current_steps": 3940, "total_steps": 4023, "loss": 0.4141, "lr": 5e-06, "epoch": 2.9381058911260256, "percentage": 97.94, "elapsed_time": "14:43:20", "remaining_time": "0:18:36"}
|
397 |
+
{"current_steps": 3950, "total_steps": 4023, "loss": 0.4111, "lr": 5e-06, "epoch": 2.9455630126771064, "percentage": 98.19, "elapsed_time": "14:45:33", "remaining_time": "0:16:21"}
|
398 |
+
{"current_steps": 3960, "total_steps": 4023, "loss": 0.413, "lr": 5e-06, "epoch": 2.953020134228188, "percentage": 98.43, "elapsed_time": "14:47:45", "remaining_time": "0:14:07"}
|
399 |
+
{"current_steps": 3970, "total_steps": 4023, "loss": 0.4254, "lr": 5e-06, "epoch": 2.9604772557792693, "percentage": 98.68, "elapsed_time": "14:49:57", "remaining_time": "0:11:52"}
|
400 |
+
{"current_steps": 3980, "total_steps": 4023, "loss": 0.4116, "lr": 5e-06, "epoch": 2.9679343773303506, "percentage": 98.93, "elapsed_time": "14:52:10", "remaining_time": "0:09:38"}
|
401 |
+
{"current_steps": 3990, "total_steps": 4023, "loss": 0.4188, "lr": 5e-06, "epoch": 2.975391498881432, "percentage": 99.18, "elapsed_time": "14:54:22", "remaining_time": "0:07:23"}
|
402 |
+
{"current_steps": 4000, "total_steps": 4023, "loss": 0.4393, "lr": 5e-06, "epoch": 2.982848620432513, "percentage": 99.43, "elapsed_time": "14:56:35", "remaining_time": "0:05:09"}
|
403 |
+
{"current_steps": 4010, "total_steps": 4023, "loss": 0.4298, "lr": 5e-06, "epoch": 2.9903057419835943, "percentage": 99.68, "elapsed_time": "14:58:47", "remaining_time": "0:02:54"}
|
404 |
+
{"current_steps": 4020, "total_steps": 4023, "loss": 0.4292, "lr": 5e-06, "epoch": 2.9977628635346756, "percentage": 99.93, "elapsed_time": "15:01:00", "remaining_time": "0:00:40"}
|