{"mean_reward": 851.0, "std_reward": 443.5076098557949, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2023-11-16T08:57:20.609524"}