# dqn-Acrobot-v1 / config.yml
# araffin's picture
# Initial commit
# 9b232ec
# Hyperparameter set serialized as a Python OrderedDict.
#
# The tag below instructs a PyYAML loader to call collections.OrderedDict with
# the single argument that follows: one list of [key, value] pairs. The nesting
# (and therefore the indentation) is significant: each "- - key" line opens a
# pair and the more-indented "- value" line closes it.
#
# NOTE: python/object/apply tags are rejected by yaml.safe_load; a loader that
# permits Python object construction is required, so only load this file from a
# trusted source.
!!python/object/apply:collections.OrderedDict
- - - batch_size
    - 128
  - - buffer_size
    - 50000
  - - exploration_final_eps
    - 0.1
  - - exploration_fraction
    - 0.12
  - - gamma
    - 0.99
  # NOTE(review): -1 is presumably a sentinel interpreted by the consumer - confirm.
  - - gradient_steps
    - -1
  - - learning_rate
    - 0.00063
  - - learning_starts
    - 0
  # Stored as a float (100000.0); presumably cast to int by the consumer - confirm.
  - - n_timesteps
    - 100000.0
  - - policy
    - MlpPolicy
  # The value is a plain string holding a Python expression, not a YAML mapping;
  # presumably evaluated by the consumer - verify before changing its format.
  - - policy_kwargs
    - dict(net_arch=[256, 256])
  - - target_update_interval
    - 250
  - - train_freq
    - 4