{ "epoch": 1.0, "eval_loss": 2.183828830718994, "eval_runtime": 59.4359, "eval_samples_per_second": 13.746, "eval_steps_per_second": 1.733, "perplexity": 8.880242193891197, "total_flos": 8.2279274151936e+16, "train_loss": 2.2892676124303164, "train_runtime": 1413.0668, "train_samples_per_second": 6.408, "train_steps_per_second": 3.204 }