{ "epoch": 1.0, "eval_loss": 2.4264748096466064, "eval_runtime": 126.3712, "eval_samples_per_second": 145.183, "eval_steps_per_second": 9.076, "perplexity": 11.318910353833383, "total_flos": 1.59124040841796e+18, "train_loss": 2.4629864172184424, "train_runtime": 3399.9284, "train_samples_per_second": 51.387, "train_steps_per_second": 3.212 }