johnjim0816
add all benchmarks
62e03a2
|
general_cfg: |
|
algo_name: DDPG_HER |
|
device: cpu |
|
env_name: Pendulum-v1 |
|
eval_eps: 10 |
|
eval_per_episode: 5 |
|
her_sample_num: 4 |
|
load_checkpoint: false |
|
load_path: tasks |
|
max_steps: 200 |
|
mode: train |
|
mp_backend: mp |
|
new_step_api: true |
|
render: false |
|
render_mode: human |
|
save_fig: true |
|
seed: 0 |
|
show_fig: false |
|
test_eps: 20 |
|
train_eps: 150 |
|
update_every: 100 |
|
wrapper: null |
|
algo_cfg: |
|
actor_hidden_dim: 256 |
|
actor_lr: 0.0001 |
|
batch_size: 128 |
|
buffer_size: 8000 |
|
critic_hidden_dim: 256 |
|
critic_lr: 0.001 |
|
gamma: 0.99 |
|
tau: 0.001 |
|
|