{ "epoch": 1.0, "eval_loss": 1.9291760921478271, "eval_runtime": 73.4757, "eval_samples_per_second": 14.059, "eval_steps_per_second": 1.769, "perplexity": 6.88383625773652, "total_flos": 1.0006271901696e+17, "train_loss": 2.0624009956218217, "train_runtime": 1767.6809, "train_samples_per_second": 6.215, "train_steps_per_second": 3.108 }