{ "mean_reward": -114.75, "std_reward": 11.423112535557024, "datetime": "2025-07-28T16:14:07.952898+00:00", "train_duration_min": "1.65" }