{"mean_reward": 1050.0, "std_reward": 350.1642471755219, "is_deterministic": false, "n_eval_episodes": 10}