STAIR-Llama-3.1-8B-SFT / trainer_log.jsonl
skyai798's picture
Upload folder using huggingface_hub
1a46ef7 verified
{"current_steps": 30, "total_steps": 468, "loss": 1.2723, "learning_rate": 4.94947663010567e-06, "epoch": 0.192, "percentage": 6.41, "elapsed_time": "0:02:11", "remaining_time": "0:32:01"}
{"current_steps": 60, "total_steps": 468, "loss": 1.1224, "learning_rate": 4.799948609147061e-06, "epoch": 0.384, "percentage": 12.82, "elapsed_time": "0:04:20", "remaining_time": "0:29:34"}
{"current_steps": 90, "total_steps": 468, "loss": 1.0991, "learning_rate": 4.5574596647341414e-06, "epoch": 0.576, "percentage": 19.23, "elapsed_time": "0:06:31", "remaining_time": "0:27:24"}
{"current_steps": 120, "total_steps": 468, "loss": 1.1043, "learning_rate": 4.231810883773999e-06, "epoch": 0.768, "percentage": 25.64, "elapsed_time": "0:09:34", "remaining_time": "0:27:44"}
{"current_steps": 150, "total_steps": 468, "loss": 1.0811, "learning_rate": 3.836164565319503e-06, "epoch": 0.96, "percentage": 32.05, "elapsed_time": "0:11:50", "remaining_time": "0:25:05"}
{"current_steps": 180, "total_steps": 468, "loss": 0.979, "learning_rate": 3.386512217606339e-06, "epoch": 1.152, "percentage": 38.46, "elapsed_time": "0:13:52", "remaining_time": "0:22:12"}
{"current_steps": 210, "total_steps": 468, "loss": 0.9475, "learning_rate": 2.9010282021444008e-06, "epoch": 1.3439999999999999, "percentage": 44.87, "elapsed_time": "0:16:56", "remaining_time": "0:20:48"}
{"current_steps": 240, "total_steps": 468, "loss": 0.9448, "learning_rate": 2.399335149726463e-06, "epoch": 1.536, "percentage": 51.28, "elapsed_time": "0:19:11", "remaining_time": "0:18:14"}
{"current_steps": 270, "total_steps": 468, "loss": 0.948, "learning_rate": 1.9017108392811065e-06, "epoch": 1.728, "percentage": 57.69, "elapsed_time": "0:21:19", "remaining_time": "0:15:38"}
{"current_steps": 300, "total_steps": 468, "loss": 0.9441, "learning_rate": 1.4282685964923643e-06, "epoch": 1.92, "percentage": 64.1, "elapsed_time": "0:23:26", "remaining_time": "0:13:07"}
{"current_steps": 330, "total_steps": 468, "loss": 0.8881, "learning_rate": 9.981443394050525e-07, "epoch": 2.112, "percentage": 70.51, "elapsed_time": "0:26:28", "remaining_time": "0:11:04"}
{"current_steps": 360, "total_steps": 468, "loss": 0.8517, "learning_rate": 6.28723129572247e-07, "epoch": 2.304, "percentage": 76.92, "elapsed_time": "0:28:37", "remaining_time": "0:08:35"}
{"current_steps": 390, "total_steps": 468, "loss": 0.8528, "learning_rate": 3.3493649053890325e-07, "epoch": 2.496, "percentage": 83.33, "elapsed_time": "0:30:47", "remaining_time": "0:06:09"}
{"current_steps": 420, "total_steps": 468, "loss": 0.85, "learning_rate": 1.286588951321363e-07, "epoch": 2.6879999999999997, "percentage": 89.74, "elapsed_time": "0:39:24", "remaining_time": "0:04:30"}
{"current_steps": 450, "total_steps": 468, "loss": 0.8456, "learning_rate": 1.822781475486507e-08, "epoch": 2.88, "percentage": 96.15, "elapsed_time": "0:41:34", "remaining_time": "0:01:39"}
{"current_steps": 468, "total_steps": 468, "epoch": 2.9952, "percentage": 100.0, "elapsed_time": "0:43:35", "remaining_time": "0:00:00"}