epoch = 8.0 train_loss = 0.7255945914830917 train_runtime = 8445.2384 train_samples_per_second = 1.473 train_steps_per_second = 0.185