{ "epoch": 1.0, "eval_loss": 2.0893874168395996, "eval_runtime": 32.9539, "eval_samples_per_second": 13.716, "eval_steps_per_second": 1.73, "perplexity": 8.079963998077499, "total_flos": 5.34201935659008e+16, "train_loss": 2.1967257285604673, "train_runtime": 922.9625, "train_samples_per_second": 6.37, "train_steps_per_second": 3.185 }