{ "loss": 2.0942, "learning_rate": 5.150214592274677e-07, "epoch": 2.0, "train_runtime": 13910.5631, "train_samples_per_second": 5.396, "train_steps_per_second": 0.084, "total_flos": 3.844740927455232e+17, "train_loss": 2.2632525492039965 }