epoch = 5.0 train_loss = 2.1076272324853074 train_runtime = 3749.7881 train_samples = 42367 train_samples_per_second = 56.493 train_steps_per_second = 0.883