Jeckmu's picture
Upload folder using huggingface_hub
424baac verified
{"current_steps": 5, "total_steps": 105, "loss": 0.5319, "lr": 4.972077065562821e-05, "epoch": 0.1413427561837456, "percentage": 4.76, "elapsed_time": "0:02:28", "remaining_time": "0:49:26", "throughput": 602.45, "total_tokens": 89360}
{"current_steps": 10, "total_steps": 105, "loss": 0.346, "lr": 4.888932014465352e-05, "epoch": 0.2826855123674912, "percentage": 9.52, "elapsed_time": "0:04:43", "remaining_time": "0:44:52", "throughput": 612.79, "total_tokens": 173680}
{"current_steps": 15, "total_steps": 105, "loss": 0.3586, "lr": 4.752422169756048e-05, "epoch": 0.42402826855123676, "percentage": 14.29, "elapsed_time": "0:06:54", "remaining_time": "0:41:27", "throughput": 618.32, "total_tokens": 256320}
{"current_steps": 20, "total_steps": 105, "loss": 0.3476, "lr": 4.5655969357899874e-05, "epoch": 0.5653710247349824, "percentage": 19.05, "elapsed_time": "0:09:32", "remaining_time": "0:40:34", "throughput": 618.07, "total_tokens": 354080}
{"current_steps": 25, "total_steps": 105, "loss": 0.2828, "lr": 4.332629679574566e-05, "epoch": 0.7067137809187279, "percentage": 23.81, "elapsed_time": "0:11:58", "remaining_time": "0:38:20", "throughput": 619.26, "total_tokens": 445120}
{"current_steps": 30, "total_steps": 105, "loss": 0.3261, "lr": 4.058724504646834e-05, "epoch": 0.8480565371024735, "percentage": 28.57, "elapsed_time": "0:14:24", "remaining_time": "0:36:02", "throughput": 619.9, "total_tokens": 536160}
{"current_steps": 35, "total_steps": 105, "loss": 0.1752, "lr": 3.7500000000000003e-05, "epoch": 0.9893992932862191, "percentage": 33.33, "elapsed_time": "0:16:45", "remaining_time": "0:33:31", "throughput": 618.49, "total_tokens": 622160}
{"current_steps": 40, "total_steps": 105, "loss": 0.1521, "lr": 3.413352560915988e-05, "epoch": 1.1130742049469964, "percentage": 38.1, "elapsed_time": "0:18:55", "remaining_time": "0:30:45", "throughput": 618.88, "total_tokens": 702992}
{"current_steps": 45, "total_steps": 105, "loss": 0.1056, "lr": 3.056302334890786e-05, "epoch": 1.254416961130742, "percentage": 42.86, "elapsed_time": "0:21:25", "remaining_time": "0:28:33", "throughput": 619.19, "total_tokens": 795712}
{"current_steps": 50, "total_steps": 105, "loss": 0.2243, "lr": 2.686825233966061e-05, "epoch": 1.3957597173144876, "percentage": 47.62, "elapsed_time": "0:23:46", "remaining_time": "0:26:09", "throughput": 616.89, "total_tokens": 880032}
{"current_steps": 55, "total_steps": 105, "loss": 0.1218, "lr": 2.3131747660339394e-05, "epoch": 1.5371024734982333, "percentage": 52.38, "elapsed_time": "0:26:10", "remaining_time": "0:23:47", "throughput": 617.2, "total_tokens": 969392}
{"current_steps": 60, "total_steps": 105, "loss": 0.1474, "lr": 1.9436976651092144e-05, "epoch": 1.6784452296819787, "percentage": 57.14, "elapsed_time": "0:28:41", "remaining_time": "0:21:30", "throughput": 615.14, "total_tokens": 1058752}
{"current_steps": 65, "total_steps": 105, "loss": 0.0559, "lr": 1.5866474390840125e-05, "epoch": 1.8197879858657244, "percentage": 61.9, "elapsed_time": "0:30:54", "remaining_time": "0:19:01", "throughput": 616.26, "total_tokens": 1143072}
{"current_steps": 70, "total_steps": 105, "loss": 0.0936, "lr": 1.2500000000000006e-05, "epoch": 1.96113074204947, "percentage": 66.67, "elapsed_time": "0:33:20", "remaining_time": "0:16:40", "throughput": 616.77, "total_tokens": 1234112}
{"current_steps": 75, "total_steps": 105, "loss": 0.0648, "lr": 9.412754953531663e-06, "epoch": 2.0848056537102475, "percentage": 71.43, "elapsed_time": "0:35:09", "remaining_time": "0:14:03", "throughput": 617.75, "total_tokens": 1303184}
{"current_steps": 80, "total_steps": 105, "loss": 0.0676, "lr": 6.673703204254347e-06, "epoch": 2.2261484098939928, "percentage": 76.19, "elapsed_time": "0:37:20", "remaining_time": "0:11:40", "throughput": 618.56, "total_tokens": 1385824}
{"current_steps": 85, "total_steps": 105, "loss": 0.0947, "lr": 4.344030642100133e-06, "epoch": 2.3674911660777385, "percentage": 80.95, "elapsed_time": "0:39:46", "remaining_time": "0:09:21", "throughput": 618.87, "total_tokens": 1476864}
{"current_steps": 90, "total_steps": 105, "loss": 0.0447, "lr": 2.475778302439524e-06, "epoch": 2.508833922261484, "percentage": 85.71, "elapsed_time": "0:42:23", "remaining_time": "0:07:03", "throughput": 617.15, "total_tokens": 1569584}
{"current_steps": 95, "total_steps": 105, "loss": 0.0535, "lr": 1.1106798553464804e-06, "epoch": 2.65017667844523, "percentage": 90.48, "elapsed_time": "0:44:43", "remaining_time": "0:04:42", "throughput": 617.57, "total_tokens": 1657264}
{"current_steps": 100, "total_steps": 105, "loss": 0.1107, "lr": 2.7922934437178695e-07, "epoch": 2.791519434628975, "percentage": 95.24, "elapsed_time": "0:47:10", "remaining_time": "0:02:21", "throughput": 617.02, "total_tokens": 1746624}
{"current_steps": 105, "total_steps": 105, "loss": 0.0806, "lr": 0.0, "epoch": 2.932862190812721, "percentage": 100.0, "elapsed_time": "0:49:48", "remaining_time": "0:00:00", "throughput": 616.09, "total_tokens": 1841024}
{"current_steps": 105, "total_steps": 105, "epoch": 2.932862190812721, "percentage": 100.0, "elapsed_time": "0:49:49", "remaining_time": "0:00:00", "throughput": 615.8, "total_tokens": 1841024}