{ "epoch": 1.0, "eval_loss": 1.922713041305542, "eval_runtime": 63.7378, "eval_samples_per_second": 15.579, "eval_steps_per_second": 1.961, "perplexity": 6.839489137228699, "total_flos": 1.0003539689472e+17, "train_loss": 2.061430201075499, "train_runtime": 1617.6118, "train_samples_per_second": 6.79, "train_steps_per_second": 3.395 }