epoch = 5.0 train_loss = 2.1648097335031746 train_runtime = 1785.4315 train_samples = 42367 train_samples_per_second = 118.646 train_steps_per_second = 0.927