{ "epoch": 1.0, "eval_loss": 1.9035444259643555, "eval_runtime": 31.4258, "eval_samples_per_second": 13.778, "eval_steps_per_second": 1.75, "perplexity": 6.709634147095092, "total_flos": 3.0394718060544e+16, "train_loss": 2.029054084226035, "train_runtime": 519.4686, "train_samples_per_second": 6.439, "train_steps_per_second": 3.221 }