{"mean_reward": 636.0, "std_reward": 214.32218737218972, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2024-09-21T08:44:19.019432"}