{"mean_reward": -5.08055796, "std_reward": 2.14066629037605, "is_deterministic": true, "n_eval_episodes": 50, "eval_datetime": "2024-11-20T16:37:50.142591"}