epoch = 3.0 train_runtime = 211.7345 train_samples_per_second = 0.808 train_runtime = 218.340802192688