# Quentin Gallouédec
# Initial commit
# 5222784
# raw
# history blame
# 490 Bytes
# Ordered table of settings, serialized as a Python collections.OrderedDict.
#
# Layout: the python/object/apply tag makes PyYAML call
# collections.OrderedDict(*args), where args is the top-level sequence below.
# That sequence must therefore contain exactly ONE item: a list of
# [key, value] pairs. The nesting is expressed only through indentation
# (each pair at 2 spaces, each value at 4 spaces), so the indentation must be
# kept intact; flattening it to column 0 turns every line into a separate
# positional argument and loading fails.
#
# NOTE(review): python/object/apply is a Python-specific tag. yaml.safe_load
# rejects it; loading needs an unsafe PyYAML loader (e.g. yaml.unsafe_load),
# which can construct arbitrary Python objects. Only load this file from a
# trusted source.
# NOTE(review): the key names look like training settings for an RL agent
# (n_quantiles hints at a quantile-regression variant) - confirm against the
# code that consumes this file.
!!python/object/apply:collections.OrderedDict
- - - batch_size
    - 128
  - - buffer_size
    - 50000
  - - exploration_final_eps
    - 0.1
  - - exploration_fraction
    - 0.12
  - - gamma
    - 0.99
  - - gradient_steps
    # Negative integer; presumably a sentinel interpreted by the consumer - confirm.
    - -1
  - - learning_rate
    - 0.00063
  - - learning_starts
    - 0
  - - n_timesteps
    # Stored as a float (100000.0), not an integer.
    - 100000.0
  - - policy
    - MlpPolicy
  - - policy_kwargs
    # Plain string scalar, not a YAML mapping; presumably evaluated as a
    # Python expression by the consumer - confirm.
    - dict(net_arch=[256, 256], n_quantiles=25)
  - - target_update_interval
    - 250
  - - train_freq
    - 4