{ "epoch": 2.987551867219917, "total_flos": 2.252458950505005e+18, "train_loss": 1.4155288457870483, "train_runtime": 9888.3803, "train_samples_per_second": 0.584, "train_steps_per_second": 0.009 }