---
# Run configuration with two top-level sections:
#   general_cfg - run-level settings (algorithm/environment names, device,
#                 episode counts, checkpoint and plotting switches)
#   algo_cfg    - hyperparameters for the algorithm named in
#                 general_cfg.algo_name
# NOTE(review): the block structure was reconstructed from a single-line
# dump; algo_cfg is assumed to be a sibling of general_cfg - confirm against
# the loader that consumes this file.

general_cfg:
  algo_name: A2C
  device: cpu
  env_name: CartPole-v1
  eval_eps: 10
  eval_per_episode: 5
  load_checkpoint: false
  # NOTE(review): this path names a DQN run while algo_name is A2C. It has no
  # effect while load_checkpoint is false; point it at a matching run before
  # enabling checkpoint loading.
  load_path: Train_CartPole-v1_DQN_20221026-054757
  max_steps: 200
  mode: train
  new_step_api: true
  render: false
  save_fig: true
  seed: 1
  show_fig: false
  test_eps: 10
  train_eps: 1000
  wrapper: null

algo_cfg:
  actor_hidden_dim: 256
  actor_lr: 0.0003
  continuous: false
  critic_hidden_dim: 256
  critic_lr: 0.001
  entropy_coef: 0.001
  gamma: 0.99
  update_freq: 20