{"policy": "MlpPolicy", "env": "CartPole-v1", "gamma": 0.0037857070275125987, "max_grad_norm": 1.068991897259356, "exponent_n_steps": 9, "learning_rate": 0.0061663610638304405, "net_arch": "small", "activation_fn": "tanh", "n_training_timesteps": 20000, "n_eval_episodes": 10}