epoch = 3.0 train_runtime = 334.4894 train_samples_per_second = 0.511 train_runtime = 344.0338144302368