epoch = 3.0 train_runtime = 445.7457 train_samples_per_second = 1.117 train_runtime = 450.5952482223511