{"env_id": "PandaReach-v3", "max_steps": 50000, "n_training_episodes": 9624, "n_eval_episodes": 3000, "learning_rate": 0.001}