{"mean_reward": 577.0, "std_reward": 219.2966028008642, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2023-12-12T05:46:45.969133"}