{ "epoch": 0.9999588580080144, "eval_loss": 0.10019518435001373, "eval_runtime": 106.3168, "eval_samples": 14749, "eval_samples_per_second": 138.727, "eval_steps_per_second": 17.344, "perplexity": 1.105386651196126, "total_flos": 5.63814937437143e+18, "train_loss": 3.3859311055856667, "train_runtime": 70616.0694, "train_samples": 2916727, "train_samples_per_second": 41.304, "train_steps_per_second": 0.161 }