{"mean_reward": 9.5, "std_reward": 0.6708203932499369, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2024-06-13T06:07:55.086747"}