tqc-PandaReach-v1 / config.yml
araffin's picture
Initial commit
b07589a
raw
history blame contribute delete
616 Bytes
# Hyperparameter set serialized as a Python OrderedDict. The tag below is
# applied to a single argument: a list of [key, value] pairs, so the entry
# order written here is the order seen after loading.
# NOTE(review): the python/object/apply tag is only honoured by YAML loaders
# that are allowed to construct arbitrary Python objects (it is rejected by
# safe loaders) -- load this file only from a trusted source.
!!python/object/apply:collections.OrderedDict
- - - batch_size
    - 256
  - - buffer_size
    - 1000000
  - - ent_coef
    - auto
  # Dotted path to a wrapper class, stored as a plain string.
  - - env_wrapper
    - sb3_contrib.common.wrappers.TimeFeatureWrapper
  - - gamma
    - 0.95
  - - learning_rate
    - 0.001
  - - learning_starts
    - 1000
  # Written as a float (20000.0), not an integer.
  - - n_timesteps
    - 20000.0
  - - normalize
    - true
  - - policy
    - MultiInputPolicy
  # The two dict(...) values below are plain YAML strings, not mappings;
  # presumably the consumer evaluates them as Python expressions -- TODO confirm.
  - - policy_kwargs
    - dict(net_arch=[64, 64], n_critics=1)
  - - replay_buffer_class
    - HerReplayBuffer
  # NOTE(review): `online_sampling` appears to have been deprecated/removed in
  # later Stable-Baselines3 releases -- confirm against the pinned version.
  # The value is a multi-line plain scalar; the indented ")" line is folded
  # into the same string with a single space.
  - - replay_buffer_kwargs
    - dict( online_sampling=True, goal_selection_strategy='future', n_sampled_goal=4
      )