{"mean_reward": 541.5, "std_reward": 211.991155475883, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2023-12-27T00:51:10.831941"}