{"mean_reward": 879.0, "std_reward": 327.25983560467665, "is_deterministic": false, "n_eval_episodes": 10}