---
# Run configuration, split into two top-level sections:
#   general_cfg - environment, run mode, episode counts and output options
#   algo_cfg    - hyperparameters for the algorithm named in algo_name

general_cfg:
  algo_name: SAC
  continuous: true
  device: cuda
  env_name: LunarLanderContinuous-v2
  eval_eps: 10
  eval_per_episode: 5
  load_checkpoint: false
  # NOTE(review): this path names a PPO run while algo_name is SAC.
  # Presumably it is only read when load_checkpoint is true - confirm
  # before enabling checkpoint loading.
  load_path: Train_LunarLanderContinuous-v2_PPO_20230401-102521
  max_steps: 500
  mode: train
  new_step_api: true
  render: false
  save_fig: true
  seed: 666
  show_fig: false
  test_eps: 20
  train_eps: 2000
  wrapper: null

algo_cfg:
  alpha: 0.1
  automatic_entropy_tuning: false
  batch_size: 64
  buffer_size: 1000000
  gamma: 0.99
  hidden_dim: 256
  lr: 0.001
  n_epochs: 1
  policy_type: Gaussian
  start_steps: 10000
  target_update_fre: 1
  tau: 0.005