# Hyperparameter set serialized as a Python OrderedDict.
#
# Layout: the tag below is applied to a one-element argument list whose single
# element is a list of [key, value] pairs, so key order is preserved on load.
# The nesting is expressed purely through block-sequence indentation; each
# entry must stay on its own line for the document to parse as intended.
#
# NOTE(security): `!!python/object/apply` makes the loader call a Python
# callable while parsing. `yaml.safe_load` rejects this tag; the file has to be
# read with PyYAML's unsafe loader, so only load it from a trusted source.
#
# NOTE(review): the keys look like off-policy (DQN-style) training settings for
# an Atari environment -- confirm against the script that consumes this file.
!!python/object/apply:collections.OrderedDict
- - - batch_size
    - 64
  - - buffer_size
    - 700000
  # The value is a one-element list holding a dotted Python path.
  - - env_wrapper
    - - stable_baselines3.common.atari_wrappers.AtariWrapper
  - - exploration_final_eps
    - 0.01
  - - exploration_fraction
    - 0.025
  - - frame_stack
    - 2
  - - gamma
    - 0.99
  - - gradient_steps
    - 1
  - - learning_rate
    - 5.0e-05
  - - learning_starts
    - 50000
  # Stored as a float; presumably cast to int by the consumer -- verify.
  - - n_timesteps
    - 1000000.0
  - - normalize
    - false
  - - policy
    - CnnPolicy
  - - target_update_interval
    - 10000
  - - train_freq
    - 4