{ "epoch": 0.9999493031929397, "eval_loss": 1.1684964895248413, "eval_runtime": 428.841, "eval_samples": 14447, "eval_samples_per_second": 33.688, "eval_steps_per_second": 8.423, "perplexity": 3.2171519787488077, "total_flos": 5.643098158163558e+18, "train_loss": 1.2418534558435956, "train_runtime": 283616.7229, "train_samples": 2919315, "train_samples_per_second": 10.293, "train_steps_per_second": 0.04 }