{"mean_reward": 8230.0, "std_reward": 1263.368513142543, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2024-05-12T23:22:06.120652"} |
{"mean_reward": 8230.0, "std_reward": 1263.368513142543, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2024-05-12T23:22:06.120652"} |