# Training hyperparameters stored as an ordered list of [key, value] pairs.
#
# The document tag below asks the YAML loader to call collections.OrderedDict
# with one argument: the list of pairs that follows. Because it is a
# Python-object tag, yaml.safe_load() will refuse it; it needs a PyYAML loader
# that can construct Python objects, so only load this file from a trusted
# source.
!!python/object/apply:collections.OrderedDict
- - - batch_size
    - 128
  - - ent_coef
    - 0.01
  - - gae_lambda
    - 0.98
  - - gamma
    - 0.999
  - - n_envs
    - 8
  - - n_epochs
    - 4
  - - n_steps
    - 512
  # Stored as a float (5e6), exactly as written in the original file.
  - - n_timesteps
    - 5000000.0
  - - normalize
    - true
  - - policy
    - MlpLstmPolicy
  # policy_kwargs is a string holding a Python expression, not a YAML mapping;
  # presumably the consuming training script evaluates it with `nn` in scope
  # -- TODO confirm against the loader.
  # NOTE(review): recent Stable-Baselines3 releases appear to deprecate the
  # list-wrapped form net_arch=[dict(pi=..., vf=...)] in favour of a bare
  # dict(pi=..., vf=...). The value is left untouched here because the change
  # depends on the installed library version -- confirm before editing.
  - - policy_kwargs
    - "dict( ortho_init=False, activation_fn=nn.ReLU, lstm_hidden_size=64, enable_critic_lstm=True, net_arch=[dict(pi=[64], vf=[64])] )"