DanGalt commited on
Commit
a7a1822
1 Parent(s): e9cff6e

Upload 2nd model with longer training.

Browse files
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: LunarLander-v2
17
  metrics:
18
  - type: mean_reward
19
- value: -530.25 +/- 79.21
20
  name: mean_reward
21
  verified: false
22
  ---
 
16
  type: LunarLander-v2
17
  metrics:
18
  - type: mean_reward
19
+ value: 181.85 +/- 36.62
20
  name: mean_reward
21
  verified: false
22
  ---
config.json CHANGED
@@ -1 +1 @@
1
- {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param sde_net_arch: Network architecture for extracting features\n when using gSDE. If None, the latent features from the policy will be used.\n Pass an empty list to use the states as features.\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7f14f73a74c0>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f14f73a7550>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f14f73a75e0>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f14f73a7670>", "_build": "<function ActorCriticPolicy._build at 0x7f14f73a7700>", "forward": "<function ActorCriticPolicy.forward at 0x7f14f73a7790>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f14f73a7820>", "_predict": "<function ActorCriticPolicy._predict at 0x7f14f73a78b0>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f14f73a7940>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f14f73a79d0>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f14f73a7a60>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc_data object at 0x7f14f7416de0>"}, "verbose": 1, "policy_kwargs": {}, "observation_space": {":type:": "<class 'gym.spaces.box.Box'>", ":serialized:": "gAWVnwEAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLCIWUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWIAAAAAAAAAAAAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/5RoCksIhZSMAUOUdJRSlIwEaGlnaJRoEiiWIAAAAAAAAAAAAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAf5RoCksIhZRoFXSUUpSMDWJvdW5kZWRfYmVsb3eUaBIolggAAAAAAAAAAAAAAAAAAACUaAeMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLCIWUaBV0lFKUjA1ib3VuZGVkX2Fib3ZllGgSKJYIAAAAAAAAAAAAAAAAAAAAlGghSwiFlGgVdJRSlIwKX25wX3JhbmRvbZROdWIu", "dtype": "float32", "_shape": [8], "low": "[-inf -inf -inf -inf -inf -inf -inf -inf]", "high": "[inf inf inf inf inf inf inf inf]", "bounded_below": "[False False False False False False False False]", "bounded_above": "[False False False False False False False False]", "_np_random": null}, "action_space": {":type:": "<class 'gym.spaces.discrete.Discrete'>", ":serialized:": "gAWVggAAAAAAAACME2d5bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpRLBIwGX3NoYXBllCmMBWR0eXBllIwFbnVtcHmUaAeTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYowKX25wX3JhbmRvbZROdWIu", "n": 4, "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 16, "num_timesteps": 2048, "_total_timesteps": 2000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1670605634789431138, "learning_rate": 0.0003, "tensorboard_log": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVwwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOC9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS4BDAgABlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOC9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoFmgNjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoF4wHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/M6kqMFUyYYWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="}, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAIZmOL6LAWA/Ipz7viG6Zr9QTu0+MxiJPgAAAAAAAAAAWlKQPeo2qT/RjQo/732+vq2ljr36J5W9AAAAAAAAAACa1xo8HpzUPzQiLz1zIf29NVu0PS5mhrwAAAAAAAAAANrYtL4yTiQ/0hpTv1KJbb+iJWY+NuN4PQAAAAAAAAAAZoanPBWeUj9k6i895ct9v0qPz7y6yw69AAAAAAAAAACGJEC+cQArP54ZE7/htoy/0+yWPmvK9z0AAAAAAAAAALNQ2D3WbaI/YHUhP8DM/74Lu/u9s5b0vQAAAAAAAAAAmt2xu4kfqj+Gfg29zH3tvoFAnLyS9LG9AAAAAAAAAAAzznc9I7imP1XabD6yTN6+kDrrvFL2Dr0AAAAAAAAAAABdv7zUJ7A/lsAZv4PA2b7b49g882gvPgAAAAAAAAAAoN4+vu0Mjj/5R7S+Z5Mvv4SKWD7ycSS7AAAAAAAAAAAaGIO9vrlrP2XtpL36yk+/p0bWvU623r0AAAAAAAAAALptHj+jHRs//PGXPyBIk7/41l2/ByLLvgAAAAAAAAAAPlPyvl+PxTxyRKG/PQSIvqRpFkBkTgpAAAAAAAAAAAAaSHA/9LvavVhtij+vw5u/ettKviiRcb8AAAAAAACAP7OUgj7b0fA9fYZbP5divr+FRHm/s47zvgAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.02400000000000002, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWV1QIAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMI2bERiNc7WMCUhpRSlIwBbJRLO4wBdJRHQCMH+Idlum91fZQoaAZoCWgPQwj/lZUmpZhawJSGlFKUaBVLPGgWR0AjCj1wo9cKdX2UKGgGaAloD0MI/iyWIvkHUMCUhpRSlGgVS0VoFkdAIxn9WIXTE3V9lChoBmgJaA9DCJEsYAK39FjAlIaUUpRoFUtKaBZHQCMishgVoHt1fZQoaAZoCWgPQwiXxcTm45FRwJSGlFKUaBVLS2gWR0AjJTXrdFfBdX2UKGgGaAloD0MIf/eOGhPEWcCUhpRSlGgVS1FoFkdAIzELhJiAlXV9lChoBmgJaA9DCB9Hc2TlVVzAlIaUUpRoFUtTaBZHQCM3EKmbb111fZQoaAZoCWgPQwh+bmjKzjJnwJSGlFKUaBVLVGgWR0AjPmzSkTHsdX2UKGgGaAloD0MId50N+WevZcCUhpRSlGgVS1loFkdAI0h7E5yU93V9lChoBmgJaA9DCLqe6LrwxF/AlIaUUpRoFUtbaBZHQCNMRWcSXdF1fZQoaAZoCWgPQwjylNV0PatewJSGlFKUaBVLZ2gWR0AjX4O+ZgG9dX2UKGgGaAloD0MI/YaJBqlidsCUhpRSlGgVS3BoFkdAI3aE8JUo8nV9lChoBmgJaA9DCJm36jpUrFzAlIaUUpRoFUt0aBZHQCN/Ho5ggHN1fZQoaAZoCWgPQwgRV87eGZprwJSGlFKUaBVLdmgWR0AjgaiKziS8dX2UKGgGaAloD0MIsi/ZePAce8CUhpRSlGgVS31oFkdAI42Gyon8bnVlLg=="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 10, "n_steps": 128, "gamma": 0.99, "gae_lambda": 0.95, "ent_coef": 0.0, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 512, "n_epochs": 10, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWVwwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOC9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS4BDAgABlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOC9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoFmgNjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoF4wHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/yZmZmZmZmoWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "system_info": {"OS": "Linux-5.10.133+-x86_64-with-glibc2.27 #1 SMP Fri Aug 26 08:44:51 UTC 2022", "Python": "3.8.16", "Stable-Baselines3": "1.6.2", "PyTorch": "1.13.0+cu116", "GPU Enabled": "True", "Numpy": "1.21.6", "Gym": "0.21.0"}}
 
1
+ {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param sde_net_arch: Network architecture for extracting features\n when using gSDE. If None, the latent features from the policy will be used.\n Pass an empty list to use the states as features.\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7f99012d3550>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f99012d35e0>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f99012d3670>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f99012d3700>", "_build": "<function ActorCriticPolicy._build at 0x7f99012d3790>", "forward": "<function ActorCriticPolicy.forward at 0x7f99012d3820>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f99012d38b0>", "_predict": "<function ActorCriticPolicy._predict at 0x7f99012d3940>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f99012d39d0>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f99012d3a60>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f99012d3af0>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc_data object at 0x7f99012d0690>"}, "verbose": 1, "policy_kwargs": {}, "observation_space": {":type:": "<class 'gym.spaces.box.Box'>", ":serialized:": "gAWVnwEAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLCIWUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWIAAAAAAAAAAAAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/5RoCksIhZSMAUOUdJRSlIwEaGlnaJRoEiiWIAAAAAAAAAAAAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAf5RoCksIhZRoFXSUUpSMDWJvdW5kZWRfYmVsb3eUaBIolggAAAAAAAAAAAAAAAAAAACUaAeMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLCIWUaBV0lFKUjA1ib3VuZGVkX2Fib3ZllGgSKJYIAAAAAAAAAAAAAAAAAAAAlGghSwiFlGgVdJRSlIwKX25wX3JhbmRvbZROdWIu", "dtype": "float32", "_shape": [8], "low": "[-inf -inf -inf -inf -inf -inf -inf -inf]", "high": "[inf inf inf inf inf inf inf inf]", "bounded_below": "[False False False False False False False False]", "bounded_above": "[False False False False False False False False]", "_np_random": null}, "action_space": {":type:": "<class 'gym.spaces.discrete.Discrete'>", ":serialized:": "gAWVggAAAAAAAACME2d5bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpRLBIwGX3NoYXBllCmMBWR0eXBllIwFbnVtcHmUaAeTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYowKX25wX3JhbmRvbZROdWIu", "n": 4, "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 64, "num_timesteps": 1048576, "_total_timesteps": 1048576, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1670610620641692433, "learning_rate": {":type:": "<class 'function'>", ":serialized:": "gAWVAQMAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLA0tDQwp0AGQBfACDAlMAlE5HP2iTdLxqfvqGlIwJb25lX2N5Y2xllIWUjAVhbHBoYZSFlIwePGlweXRob24taW5wdXQtMy1mYWM5MjUxYTkyYWI+lIwIPGxhbWJkYT6USwdDAJQpKXSUUpR9lCiMC19fcGFja2FnZV9flE6MCF9fbmFtZV9flIwIX19tYWluX1+UdU5OTnSUUpSMHGNsb3VkcGlja2xlLmNsb3VkcGlja2xlX2Zhc3SUjBJfZnVuY3Rpb25fc2V0c3RhdGWUk5RoGH2UfZQoaBVoD4wMX19xdWFsbmFtZV9flGgPjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgWjAdfX2RvY19flE6MC19fY2xvc3VyZV9flE6MF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lGgKaAIoaAcoSwNLAEsASwNLBEtDQ0B8AWQBawByIHwAZAJkAXwBGABkARsAGAAUAHwCFwBTAHQAfAFkARgAZAMbAHQBFABkBBsAgwF8ABQAfAIXAFMAlChORz/JmZmZmZmaSwFHP+mZmZmZmZpLAnSUjANjb3OUjAJwaZSGlIwDbHIwlGgMjANlcHOUh5SMHjxpcHl0aG9uLWlucHV0LTEtMjU2YjU1NzE1MzY4PpRoCksfQwYAAQgBGAGUKSl0lFKUaBNOTk50lFKUaBtoN32UfZQoaBVoCmgeaApoH32UaCFOaCJHPnrX8pq8r0iFlGgjaBZoJE5oJU5oJl2UaCh9lChoLIwEbWF0aJSMA2Nvc5STlGgtR0AJIftURC0YdXWGlIZSMHN1hpSGUjAu"}, "tensorboard_log": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVAQMAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLA0tDQwp0AGQBfACDAlMAlE5HP2iTdLxqfvqGlIwJb25lX2N5Y2xllIWUjAVhbHBoYZSFlIwePGlweXRob24taW5wdXQtMy1mYWM5MjUxYTkyYWI+lIwIPGxhbWJkYT6USwdDAJQpKXSUUpR9lCiMC19fcGFja2FnZV9flE6MCF9fbmFtZV9flIwIX19tYWluX1+UdU5OTnSUUpSMHGNsb3VkcGlja2xlLmNsb3VkcGlja2xlX2Zhc3SUjBJfZnVuY3Rpb25fc2V0c3RhdGWUk5RoGH2UfZQoaBVoD4wMX19xdWFsbmFtZV9flGgPjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgWjAdfX2RvY19flE6MC19fY2xvc3VyZV9flE6MF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lGgKaAIoaAcoSwNLAEsASwNLBEtDQ0B8AWQBawByIHwAZAJkAXwBGABkARsAGAAUAHwCFwBTAHQAfAFkARgAZAMbAHQBFABkBBsAgwF8ABQAfAIXAFMAlChORz/JmZmZmZmaSwFHP+mZmZmZmZpLAnSUjANjb3OUjAJwaZSGlIwDbHIwlGgMjANlcHOUh5SMHjxpcHl0aG9uLWlucHV0LTEtMjU2YjU1NzE1MzY4PpRoCksfQwYAAQgBGAGUKSl0lFKUaBNOTk50lFKUaBtoN32UfZQoaBVoCmgeaApoH32UaCFOaCJHPnrX8pq8r0iFlGgjaBZoJE5oJU5oJl2UaCh9lChoLIwEbWF0aJSMA2Nvc5STlGgtR0AJIftURC0YdXWGlIZSMHN1hpSGUjAu"}, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQgAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYACAAAAAAAABpcmL3Inqg/VDKsvVx9Ar7biiK9Y+otvAAAAAAAAAAAALY8vPZQc7pyGpa7fy1MOEHtB7sKcec4AACAPwAAgD8Av5W9GWRRPuylOLzvMce9XtPku9bR3zwAAAAAAAAAAJqeVL3D+QK6S3mvOKtHo7WnIEK5lDbLtwAAgD8AAIA/LSmKPq/Iaj8C3Gq9bksPvsYNoDzGhE09AAAAAAAAAAAzg4S8rcFsP+heTj5drMi9i8zdPFbtJD0AAAAAAAAAABBiMD+o0II/47uqPnGqG74nmiU+O7OYOgAAAAAAAAAAYLuMvtnGNT+T6Io+5Of/vbB0kTy6ZIe7AAAAAAAAAABNGjI+nN93Pg1heb1XBQe+VhuGu9KpqDwAAAAAAAAAAHpWub5VFZ8/YbuuPcuVnL14YHi9678hPQAAAAAAAAAAzWvMPSMOJz2UcDW+Lyfjvbik47ymKZu9AAAAAAAAAAANuIE9XGsEujIlWDqQHtg1i4mbOrZSfbkAAIA/AACAP4aOCj4hRoQ/vhL6vDKb8b02Q2K75e1ZvQAAAAAAAAAAjXGyveFQjroCDRe5a8npNdZekjr0UbM3AACAPwAAgD+FKLq+6BWCP0TOgL0N83K9TmmKvXLME7sAAAAAAAAAAABA5jpXG7I//8GhO0LJzr3Zcly8GVUevQAAAAAAAAAAIDUkPhxASLz+EjY80e2duth3rL19X4G7AACAPwAAgD/60Uw+OGCou90OgTpL17W3TbUSvbZAmrkAAIA/AACAP5rHWTxzeIo/7pg/Pcu8Ab5t7a675VrMvAAAAAAAAAAAbcd+vhg0Kj+hr6s+YD6dvWpEXT1yowa9AAAAAAAAAABmHh28C/axPa8vib3br7S9+pmGu6Bvdz0AAAAAAAAAAAPU6z7uhEk/Yms8vv1pLL5ftSG7xQjevAAAAAAAAAAAzbpfPXt6pLoiVmK4GrVPszIjszpO+IE3AACAPwAAgD/T3DQ+m0z1PaPmNr6/JNW9Tmq6vCHVhL0AAAAAAAAAAFrq6j3hdGk+U1pWPaKOBL7o2fM8mcgBvAAAAAAAAAAArXImPulnQ7y/eis77zw4uemftb0AFFy6AACAPwAAgD8A/GK8KUxeutCgj7k8Xc2z9wN0u1J5pzgAAIA/AACAP9M+Yj4oYZo+Coatve/X5b3BwI079tsvvQAAAAAAAAAAxhcuPhksbD8CEXu8pai0veyfjzxL8dQ8AAAAAAAAAABAUN+9zvGLP1N9/Dwt/p69GwqJvJ3q7DwAAAAAAAAAAC0NEb5s1Jc/ToLmvqLfkr5SBO09AL7YvQAAAAAAAAAAY6KZPjl1Jz8OhOS939XsvWdZp7nmAi87AAAAAAAAAACKHe2+pYGFP2D4Vz1M0Za9zRdsvY5fzbwAAAAAAAAAAL3Nxj5XKno/z+DGO88JAr73EGg913uBuwAAAAAAAAAAmqwhvcMBarqnlR62PPsUseyCi7n4EkQ1AACAPwAAgD/aIhe+H+1OP1mQKz7uEoS9cNYOPJqcWbwAAAAAAAAAAIAidz17qrC6AtXUOsDHhTVPhy26OpjyuQAAgD8AAIA/yL/cvmuEPj/C84A+MakAvhT2RzwSULI9AAAAAAAAAAAAnJ29Evb0PhvqtT0ww+O9KPKROwTDIr0AAAAAAAAAAICZcz17hJe6HUzpOuKNRzVRavq6/sIFugAAgD8AAAAA4/rPPqJqsD+Htg0/11PrvStMLD5lhX68AAAAAAAAAABmzt+97FHsufRCQ7uv9o01RU4MOyCDYjoAAIA/AAAAAIAyaL0vG0Q/TlcpPlugmr0UhaY8WMCCPAAAAAAAAAAAWkSaPYWz7rl3g0K8Ng1MNZGqlzsLvby0AACAPwAAgD/Gki8+p7hEP92cWb0EKgy+EoJePI6GPj0AAAAAAAAAADPvvDuP2Dw/O1W0vMGw6b3LK2e8xrDHvAAAAAAAAAAAevyIPuT8T72lABI950K7u+3dt74fnoW8AACAPwAAgD/NhKS+F7AqPyB8gz79eMC9XpqWPP7PajwAAAAAAAAAAEDRUT7Xg167YIA7ubcZDTawxbS8ZttbOAAAgD8AAIA/M4rlPhifMT/uCDa9jPkGvgA0VT0Dwtu8AAAAAAAAAADaXAG+4i+3P98yib5wGLu9M6KuvYsQET0AAAAAAAAAAGLgC78GR4M/JOgmvvT2qL17tw++04pbPQAAAAAAAAAArSAZPq7/krrqmIW5JpMwNfmq1rsejJ84AACAPwAAgD9m2JK8euppPr1kzbwvuMS9Y3rputkOMTwAAAAAAAAAAJqJ5rpkZTE/AsGPuzK3or0CTOG6cJ5euwAAAAAAAAAA830GP4t0lz+YgpI+X2Quviwa9D2Oa1u9AAAAAAAAAADN73+9CeWOPrKsKj1l4sa9A/kTPPYlZDwAAAAAAAAAADMv77x03pE/bm21PIeJrb2bRpS80/ANOwAAAAAAAAAAmvG6u3jXmT8TKVk99Z1yvVJ1z7tDu0k8AAAAAAAAAADtb/Q+/O93P8L2IT3LewO+afIpPYFjCLwAAAAAAAAAAPjR7L5YepY/yGpOvu9/pb1w3ga+oq/TtwAAAAAAAAAATUKBPfa4SrqYZHg8/ASGPN8MeTvVH2o9AACAPwAAgD8wg5U+SbDdPrhxV76yRBK+c8ncvIKdVL0AAAAAAAAAAKbImr094WU8oJNRvmIekL18gCa9loOIPAAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYktASwiGlIwBQ5R0lFKULg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVswAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJZAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiS0CFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": 0.0, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVgBAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIrRVtjnPdQkCUhpRSlIwBbJRN6AOMAXSUR0CQ+AfHPu5SdX2UKGgGaAloD0MIPpRoyWN/ZUCUhpRSlGgVTQkDaBZHQJEH4MDwH7h1fZQoaAZoCWgPQwiAu+zXnWpKQJSGlFKUaBVN6ANoFkdAkQz/bCaZyHV9lChoBmgJaA9DCAVvSKMC7WhAlIaUUpRoFU1eA2gWR0CREH6d1+y7dX2UKGgGaAloD0MIHCRE+QLOa0CUhpRSlGgVTfoCaBZHQJEZyvQnhKl1fZQoaAZoCWgPQwg/kSdJ1w5cQJSGlFKUaBVN6ANoFkdAkR5bQokRjHV9lChoBmgJaA9DCONTAIxnfWdAlIaUUpRoFU3wAmgWR0CRIybpu/DcdX2UKGgGaAloD0MI/OB86lhJW0CUhpRSlGgVTegDaBZHQJEmdK28Zk11fZQoaAZoCWgPQwg1C7Q7pD5FQJSGlFKUaBVN6ANoFkdAkSqT3IuGsXV9lChoBmgJaA9DCAhyUMLMbmhAlIaUUpRoFU3oAmgWR0CRM/depn6EdX2UKGgGaAloD0MIij20jxUJYECUhpRSlGgVTegDaBZHQJE0U4lyBCl1fZQoaAZoCWgPQwhRacTMvrVoQJSGlFKUaBVNUANoFkdAkTTGLLpzLnV9lChoBmgJaA9DCOSHSiNmV1NAlIaUUpRoFU3oA2gWR0CRNe6CDmKZdX2UKGgGaAloD0MIpFUt6SjFYkCUhpRSlGgVTdYCaBZHQJE68R28qWl1fZQoaAZoCWgPQwia0vpbgtxnQJSGlFKUaBVNmwNoFkdAkUBJu/Dcd3V9lChoBmgJaA9DCHSbcK/M1GJAlIaUUpRoFU0EA2gWR0CRQf5OrQw9dX2UKGgGaAloD0MI963WictMZkCUhpRSlGgVTQADaBZHQJFKUu14Pf91fZQoaAZoCWgPQwi7RPXWwGZDQJSGlFKUaBVN6ANoFkdAkUqUdzXBg3V9lChoBmgJaA9DCFVrYRZalmlAlIaUUpRoFU3hAmgWR0CRTQpblijMdX2UKGgGaAloD0MIu+8YHvs8XUCUhpRSlGgVTegDaBZHQJFO9ZowmE51fZQoaAZoCWgPQwhp/MIrSWdVQJSGlFKUaBVN6ANoFkdAkVDeD3/PxHV9lChoBmgJaA9DCC7HKxC9hGNAlIaUUpRoFU3fA2gWR0CRUfmw7kn1dX2UKGgGaAloD0MINNsV+mBXaECUhpRSlGgVTYwDaBZHQJFU4j/uLJl1fZQoaAZoCWgPQwgJGcizyxVjQJSGlFKUaBVNywNoFkdAkVyn+AEt/XV9lChoBmgJaA9DCITVWMLaamVAlIaUUpRoFU0XA2gWR0CRYYd1MdtEdX2UKGgGaAloD0MIUfhsHRxebECUhpRSlGgVTX0DaBZHQJFjv2Jzkp91fZQoaAZoCWgPQwhGtB1Td8dmQJSGlFKUaBVNGQNoFkdAkWsL1ZkkKXV9lChoBmgJaA9DCPPlBdhHzVRAlIaUUpRoFU3oA2gWR0CRbjXWvr4WdX2UKGgGaAloD0MI3enOE0/UZkCUhpRSlGgVTVgDaBZHQJFxAXwb2lF1fZQoaAZoCWgPQwgXg4dp3xVsQJSGlFKUaBVNFgNoFkdAkXTb8BMi8nV9lChoBmgJaA9DCCtLdJZZ3VNAlIaUUpRoFU3oA2gWR0CRdRpcX3xndX2UKGgGaAloD0MI7MGk+Pi8TUCUhpRSlGgVTegDaBZHQJGSvCWNWEN1fZQoaAZoCWgPQwjvHqD7cstiQJSGlFKUaBVN0gNoFkdAkZYVSS/0unV9lChoBmgJaA9DCCE6BI4E+GdAlIaUUpRoFU15A2gWR0CRlss1sLv1dX2UKGgGaAloD0MIaoe/JuuDakCUhpRSlGgVTfsCaBZHQJGYYT9KmKt1fZQoaAZoCWgPQwjG/Uemw/ZhQJSGlFKUaBVNRANoFkdAkZqXmA9V3nV9lChoBmgJaA9DCI54spuZ3GhAlIaUUpRoFU0YA2gWR0CRnYHqNZNgdX2UKGgGaAloD0MIAJATJowKPECUhpRSlGgVTegDaBZHQJGhfmSyMUB1fZQoaAZoCWgPQwiJJlDEoiRmQJSGlFKUaBVNAANoFkdAkaH3Z5AyEnV9lChoBmgJaA9DCNtv7URJjVRAlIaUUpRoFU3oA2gWR0CRpS/kNnXedX2UKGgGaAloD0MI0QX1LXNTYUCUhpRSlGgVTVMDaBZHQJGnLrOZ9eB1fZQoaAZoCWgPQwhE393KEpJZQJSGlFKUaBVN6ANoFkdAka1gh4dIXnV9lChoBmgJaA9DCNBCAkaXrVlAlIaUUpRoFU3oA2gWR0CRu9kNFz+4dX2UKGgGaAloD0MIGJXUCWjESUCUhpRSlGgVTegDaBZHQJHCRJ4B3id1fZQoaAZoCWgPQwgN+tLbHyJkQJSGlFKUaBVNBgNoFkdAkdBoOUdJa3V9lChoBmgJaA9DCAOUhhqFYVFAlIaUUpRoFU3oA2gWR0CR2iTd+G47dX2UKGgGaAloD0MIZOWXwRgnUECUhpRSlGgVTegDaBZHQJHhjj94u9R1fZQoaAZoCWgPQwhZEwt8RcteQJSGlFKUaBVN6ANoFkdAkfiWGh24eHV9lChoBmgJaA9DCFVOe0rOm0lAlIaUUpRoFU3oA2gWR0CSA1NjbzshdX2UKGgGaAloD0MIv7oqUIs2V0CUhpRSlGgVTegDaBZHQJIE0V9F4LV1fZQoaAZoCWgPQwjFknL3OYRGQJSGlFKUaBVN6ANoFkdAkgbDFZPl+3V9lChoBmgJaA9DCLZpbK8FOTVAlIaUUpRoFU3oA2gWR0CSFVlAu7HydX2UKGgGaAloD0MIrDdqhel6VUCUhpRSlGgVTegDaBZHQJIWusKb8WN1fZQoaAZoCWgPQwhprP2d7QpSQJSGlFKUaBVN6ANoFkdAkhdiOearm3V9lChoBmgJaA9DCCdKQiJtI1lAlIaUUpRoFU3oA2gWR0CSGXhZQpF1dX2UKGgGaAloD0MI9x+ZDp3+CECUhpRSlGgVTfsBaBZHQJIbnxwyZa51fZQoaAZoCWgPQwgJqHAEqd9ZQJSGlFKUaBVN6ANoFkdAkhylT3qRl3V9lChoBmgJaA9DCFcG1QYnPlxAlIaUUpRoFU3oA2gWR0CSIu7ROUMYdX2UKGgGaAloD0MIJzCd1m0IRUCUhpRSlGgVTegDaBZHQJIqhxlxwQ11fZQoaAZoCWgPQwiGqwMg7rlSQJSGlFKUaBVN6ANoFkdAkjVcj7hvSHV9lChoBmgJaA9DCHlZEwt831NAlIaUUpRoFU3oA2gWR0CSR29itq59dX2UKGgGaAloD0MIXaj8a3lRSUCUhpRSlGgVTegDaBZHQJJQOYv38Gd1fZQoaAZoCWgPQwhVUbzK2uNdQJSGlFKUaBVN9wJoFkdAklmo6XBxgnV9lChoBmgJaA9DCMDMd/CTqGFAlIaUUpRoFU0rA2gWR0CSYATHKfWddX2UKGgGaAloD0MIW+1hL5RLaUCUhpRSlGgVTbkDaBZHQJJ4Wn1nM+x1fZQoaAZoCWgPQwj0FaQZC/lnQJSGlFKUaBVNswJoFkdAknrx6nivPnV9lChoBmgJaA9DCAaf5uRFeGhAlIaUUpRoFU1WA2gWR0CSgGt5D7ZWdX2UKGgGaAloD0MI1NUdi239UECUhpRSlGgVTegDaBZHQJKB/KNhmXh1fZQoaAZoCWgPQwgsgCkDBw9rQJSGlFKUaBVNlANoFkdAkoKNWuHN5nV9lChoBmgJaA9DCF+0xwvpGl1AlIaUUpRoFU3oA2gWR0CSivF3pwCKdX2UKGgGaAloD0MIb9dLU4SpY0CUhpRSlGgVTYgDaBZHQJKN6l9Brvd1fZQoaAZoCWgPQwj5hsJn60dlQJSGlFKUaBVNuwNoFkdAko4uyE+PinV9lChoBmgJaA9DCCS5/Id09mpAlIaUUpRoFU27AmgWR0CSkSb7TDwZdX2UKGgGaAloD0MIOpShKibsZkCUhpRSlGgVTbsCaBZHQJKRczbeuV51fZQoaAZoCWgPQwiIvruVJVFUQJSGlFKUaBVN6ANoFkdAkpLmIGhVVHV9lChoBmgJaA9DCG9/LhqyVWpAlIaUUpRoFU1eA2gWR0CSnNXtBv74dX2UKGgGaAloD0MIkkCDTR1iaUCUhpRSlGgVTfUCaBZHQJKhNYhdMTN1fZQoaAZoCWgPQwiI9UatMI1qQJSGlFKUaBVNVgNoFkdAkqH9qgyuZHV9lChoBmgJaA9DCF0Y6UXtp1RAlIaUUpRoFU3oA2gWR0CSqL6oVEeAdX2UKGgGaAloD0MI2dDN/sCsYECUhpRSlGgVTVkCaBZHQJK066BiCrd1fZQoaAZoCWgPQwjdmJ6wxB5RQJSGlFKUaBVN6ANoFkdAkri6yjYZmHV9lChoBmgJaA9DCHqmlxhL72pAlIaUUpRoFU3GA2gWR0CSuzxFiKBNdX2UKGgGaAloD0MI00z3OqlyZECUhpRSlGgVTcsDaBZHQJK7uohpxm11fZQoaAZoCWgPQwgukQvO4GljQJSGlFKUaBVN4ANoFkdAksMukP+XJHV9lChoBmgJaA9DCOurqwK1Sl5AlIaUUpRoFU3oA2gWR0CSxU0PH1e0dX2UKGgGaAloD0MIR450BkbiUMCUhpRSlGgVS5VoFkdAksnqB/Zuh3V9lChoBmgJaA9DCL9hokEKplJAlIaUUpRoFU3oA2gWR0CSyjFY+0PZdX2UKGgGaAloD0MIWDm0yHYDWkCUhpRSlGgVTegDaBZHQJLOjpfQa751fZQoaAZoCWgPQwiP/wJBgOlYQJSGlFKUaBVN6ANoFkdAktiKDsdDIHV9lChoBmgJaA9DCGUBE7h1zmZAlIaUUpRoFU0VA2gWR0CS2O13+uNhdX2UKGgGaAloD0MIpyOAm8URR0CUhpRSlGgVTegDaBZHQJLaz7MxGlR1fZQoaAZoCWgPQwjChTyCG+BlQJSGlFKUaBVNmQNoFkdAktvEyckMTnV9lChoBmgJaA9DCAhZFkz8Y1ZAlIaUUpRoFU3oA2gWR0CS3GisGPgfdX2UKGgGaAloD0MIZhah2Ar6XUCUhpRSlGgVTegDaBZHQJLd//Q0GeN1fZQoaAZoCWgPQwjMC7CPTmddQJSGlFKUaBVN6ANoFkdAkt70xASnL3V9lChoBmgJaA9DCLd9j/rrwlNAlIaUUpRoFU3oA2gWR0CS6BJP69CedX2UKGgGaAloD0MIEHS0qiXpNECUhpRSlGgVTegDaBZHQJLsTr9l2/11fZQoaAZoCWgPQwh5eTpXlEpnQJSGlFKUaBVNaANoFkdAku/EBsANonV9lChoBmgJaA9DCNKqlnSUNmdAlIaUUpRoFU1hA2gWR0CS8tYzi0fHdX2UKGgGaAloD0MINE3YfjLPWkCUhpRSlGgVTegDaBZHQJL5B6X0Gu91ZS4="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 1280, "n_steps": 128, "gamma": 0.9999, "gae_lambda": 0.95, "ent_coef": 0.0001, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 2048, "n_epochs": 10, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWVwwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOC9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS4BDAgABlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOC9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoFmgNjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoF4wHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/yZmZmZmZmoWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "system_info": {"OS": "Linux-5.10.133+-x86_64-with-glibc2.27 #1 SMP Fri Aug 26 08:44:51 UTC 2022", "Python": "3.8.16", "Stable-Baselines3": "1.6.2", "PyTorch": "1.13.0+cu116", "GPU Enabled": "True", "Numpy": "1.21.6", "Gym": "0.21.0"}}
ppo-LunarLander-v2.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5b1e0e160c33299b4608f64ebc9225cc41d09fdbb9764a9f762fd1145d9e4508
3
- size 142545
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:713cbb464d8d4364f9119a3fe4af69e04879b8c3bd9480e8b3193820f29b0e13
3
+ size 150506
ppo-LunarLander-v2/data CHANGED
@@ -4,19 +4,19 @@
4
  ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
5
  "__module__": "stable_baselines3.common.policies",
6
  "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param sde_net_arch: Network architecture for extracting features\n when using gSDE. If None, the latent features from the policy will be used.\n Pass an empty list to use the states as features.\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
7
- "__init__": "<function ActorCriticPolicy.__init__ at 0x7f14f73a74c0>",
8
- "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f14f73a7550>",
9
- "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f14f73a75e0>",
10
- "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f14f73a7670>",
11
- "_build": "<function ActorCriticPolicy._build at 0x7f14f73a7700>",
12
- "forward": "<function ActorCriticPolicy.forward at 0x7f14f73a7790>",
13
- "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f14f73a7820>",
14
- "_predict": "<function ActorCriticPolicy._predict at 0x7f14f73a78b0>",
15
- "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f14f73a7940>",
16
- "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f14f73a79d0>",
17
- "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f14f73a7a60>",
18
  "__abstractmethods__": "frozenset()",
19
- "_abc_impl": "<_abc_data object at 0x7f14f7416de0>"
20
  },
21
  "verbose": 1,
22
  "policy_kwargs": {},
@@ -41,48 +41,51 @@
41
  "dtype": "int64",
42
  "_np_random": null
43
  },
44
- "n_envs": 16,
45
- "num_timesteps": 2048,
46
- "_total_timesteps": 2000,
47
  "_num_timesteps_at_start": 0,
48
  "seed": null,
49
  "action_noise": null,
50
- "start_time": 1670605634789431138,
51
- "learning_rate": 0.0003,
 
 
 
52
  "tensorboard_log": null,
53
  "lr_schedule": {
54
  ":type:": "<class 'function'>",
55
- ":serialized:": "gAWVwwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOC9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS4BDAgABlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOC9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoFmgNjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoF4wHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/M6kqMFUyYYWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="
56
  },
57
  "_last_obs": {
58
  ":type:": "<class 'numpy.ndarray'>",
59
- ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAIZmOL6LAWA/Ipz7viG6Zr9QTu0+MxiJPgAAAAAAAAAAWlKQPeo2qT/RjQo/732+vq2ljr36J5W9AAAAAAAAAACa1xo8HpzUPzQiLz1zIf29NVu0PS5mhrwAAAAAAAAAANrYtL4yTiQ/0hpTv1KJbb+iJWY+NuN4PQAAAAAAAAAAZoanPBWeUj9k6i895ct9v0qPz7y6yw69AAAAAAAAAACGJEC+cQArP54ZE7/htoy/0+yWPmvK9z0AAAAAAAAAALNQ2D3WbaI/YHUhP8DM/74Lu/u9s5b0vQAAAAAAAAAAmt2xu4kfqj+Gfg29zH3tvoFAnLyS9LG9AAAAAAAAAAAzznc9I7imP1XabD6yTN6+kDrrvFL2Dr0AAAAAAAAAAABdv7zUJ7A/lsAZv4PA2b7b49g882gvPgAAAAAAAAAAoN4+vu0Mjj/5R7S+Z5Mvv4SKWD7ycSS7AAAAAAAAAAAaGIO9vrlrP2XtpL36yk+/p0bWvU623r0AAAAAAAAAALptHj+jHRs//PGXPyBIk7/41l2/ByLLvgAAAAAAAAAAPlPyvl+PxTxyRKG/PQSIvqRpFkBkTgpAAAAAAAAAAAAaSHA/9LvavVhtij+vw5u/ettKviiRcb8AAAAAAACAP7OUgj7b0fA9fYZbP5divr+FRHm/s47zvgAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="
60
  },
61
  "_last_episode_starts": {
62
  ":type:": "<class 'numpy.ndarray'>",
63
- ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="
64
  },
65
  "_last_original_obs": null,
66
  "_episode_num": 0,
67
  "use_sde": false,
68
  "sde_sample_freq": -1,
69
- "_current_progress_remaining": -0.02400000000000002,
70
  "ep_info_buffer": {
71
  ":type:": "<class 'collections.deque'>",
72
- ":serialized:": "gAWV1QIAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMI2bERiNc7WMCUhpRSlIwBbJRLO4wBdJRHQCMH+Idlum91fZQoaAZoCWgPQwj/lZUmpZhawJSGlFKUaBVLPGgWR0AjCj1wo9cKdX2UKGgGaAloD0MI/iyWIvkHUMCUhpRSlGgVS0VoFkdAIxn9WIXTE3V9lChoBmgJaA9DCJEsYAK39FjAlIaUUpRoFUtKaBZHQCMishgVoHt1fZQoaAZoCWgPQwiXxcTm45FRwJSGlFKUaBVLS2gWR0AjJTXrdFfBdX2UKGgGaAloD0MIf/eOGhPEWcCUhpRSlGgVS1FoFkdAIzELhJiAlXV9lChoBmgJaA9DCB9Hc2TlVVzAlIaUUpRoFUtTaBZHQCM3EKmbb111fZQoaAZoCWgPQwh+bmjKzjJnwJSGlFKUaBVLVGgWR0AjPmzSkTHsdX2UKGgGaAloD0MId50N+WevZcCUhpRSlGgVS1loFkdAI0h7E5yU93V9lChoBmgJaA9DCLqe6LrwxF/AlIaUUpRoFUtbaBZHQCNMRWcSXdF1fZQoaAZoCWgPQwjylNV0PatewJSGlFKUaBVLZ2gWR0AjX4O+ZgG9dX2UKGgGaAloD0MI/YaJBqlidsCUhpRSlGgVS3BoFkdAI3aE8JUo8nV9lChoBmgJaA9DCJm36jpUrFzAlIaUUpRoFUt0aBZHQCN/Ho5ggHN1fZQoaAZoCWgPQwgRV87eGZprwJSGlFKUaBVLdmgWR0AjgaiKziS8dX2UKGgGaAloD0MIsi/ZePAce8CUhpRSlGgVS31oFkdAI42Gyon8bnVlLg=="
73
  },
74
  "ep_success_buffer": {
75
  ":type:": "<class 'collections.deque'>",
76
  ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
77
  },
78
- "_n_updates": 10,
79
  "n_steps": 128,
80
- "gamma": 0.99,
81
  "gae_lambda": 0.95,
82
- "ent_coef": 0.0,
83
  "vf_coef": 0.5,
84
  "max_grad_norm": 0.5,
85
- "batch_size": 512,
86
  "n_epochs": 10,
87
  "clip_range": {
88
  ":type:": "<class 'function'>",
 
4
  ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
5
  "__module__": "stable_baselines3.common.policies",
6
  "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param sde_net_arch: Network architecture for extracting features\n when using gSDE. If None, the latent features from the policy will be used.\n Pass an empty list to use the states as features.\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
7
+ "__init__": "<function ActorCriticPolicy.__init__ at 0x7f99012d3550>",
8
+ "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f99012d35e0>",
9
+ "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f99012d3670>",
10
+ "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f99012d3700>",
11
+ "_build": "<function ActorCriticPolicy._build at 0x7f99012d3790>",
12
+ "forward": "<function ActorCriticPolicy.forward at 0x7f99012d3820>",
13
+ "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f99012d38b0>",
14
+ "_predict": "<function ActorCriticPolicy._predict at 0x7f99012d3940>",
15
+ "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f99012d39d0>",
16
+ "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f99012d3a60>",
17
+ "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f99012d3af0>",
18
  "__abstractmethods__": "frozenset()",
19
+ "_abc_impl": "<_abc_data object at 0x7f99012d0690>"
20
  },
21
  "verbose": 1,
22
  "policy_kwargs": {},
 
41
  "dtype": "int64",
42
  "_np_random": null
43
  },
44
+ "n_envs": 64,
45
+ "num_timesteps": 1048576,
46
+ "_total_timesteps": 1048576,
47
  "_num_timesteps_at_start": 0,
48
  "seed": null,
49
  "action_noise": null,
50
+ "start_time": 1670610620641692433,
51
+ "learning_rate": {
52
+ ":type:": "<class 'function'>",
53
+ ":serialized:": "gAWVAQMAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLA0tDQwp0AGQBfACDAlMAlE5HP2iTdLxqfvqGlIwJb25lX2N5Y2xllIWUjAVhbHBoYZSFlIwePGlweXRob24taW5wdXQtMy1mYWM5MjUxYTkyYWI+lIwIPGxhbWJkYT6USwdDAJQpKXSUUpR9lCiMC19fcGFja2FnZV9flE6MCF9fbmFtZV9flIwIX19tYWluX1+UdU5OTnSUUpSMHGNsb3VkcGlja2xlLmNsb3VkcGlja2xlX2Zhc3SUjBJfZnVuY3Rpb25fc2V0c3RhdGWUk5RoGH2UfZQoaBVoD4wMX19xdWFsbmFtZV9flGgPjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgWjAdfX2RvY19flE6MC19fY2xvc3VyZV9flE6MF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lGgKaAIoaAcoSwNLAEsASwNLBEtDQ0B8AWQBawByIHwAZAJkAXwBGABkARsAGAAUAHwCFwBTAHQAfAFkARgAZAMbAHQBFABkBBsAgwF8ABQAfAIXAFMAlChORz/JmZmZmZmaSwFHP+mZmZmZmZpLAnSUjANjb3OUjAJwaZSGlIwDbHIwlGgMjANlcHOUh5SMHjxpcHl0aG9uLWlucHV0LTEtMjU2YjU1NzE1MzY4PpRoCksfQwYAAQgBGAGUKSl0lFKUaBNOTk50lFKUaBtoN32UfZQoaBVoCmgeaApoH32UaCFOaCJHPnrX8pq8r0iFlGgjaBZoJE5oJU5oJl2UaCh9lChoLIwEbWF0aJSMA2Nvc5STlGgtR0AJIftURC0YdXWGlIZSMHN1hpSGUjAu"
54
+ },
55
  "tensorboard_log": null,
56
  "lr_schedule": {
57
  ":type:": "<class 'function'>",
58
+ ":serialized:": "gAWVAQMAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLA0tDQwp0AGQBfACDAlMAlE5HP2iTdLxqfvqGlIwJb25lX2N5Y2xllIWUjAVhbHBoYZSFlIwePGlweXRob24taW5wdXQtMy1mYWM5MjUxYTkyYWI+lIwIPGxhbWJkYT6USwdDAJQpKXSUUpR9lCiMC19fcGFja2FnZV9flE6MCF9fbmFtZV9flIwIX19tYWluX1+UdU5OTnSUUpSMHGNsb3VkcGlja2xlLmNsb3VkcGlja2xlX2Zhc3SUjBJfZnVuY3Rpb25fc2V0c3RhdGWUk5RoGH2UfZQoaBVoD4wMX19xdWFsbmFtZV9flGgPjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgWjAdfX2RvY19flE6MC19fY2xvc3VyZV9flE6MF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lGgKaAIoaAcoSwNLAEsASwNLBEtDQ0B8AWQBawByIHwAZAJkAXwBGABkARsAGAAUAHwCFwBTAHQAfAFkARgAZAMbAHQBFABkBBsAgwF8ABQAfAIXAFMAlChORz/JmZmZmZmaSwFHP+mZmZmZmZpLAnSUjANjb3OUjAJwaZSGlIwDbHIwlGgMjANlcHOUh5SMHjxpcHl0aG9uLWlucHV0LTEtMjU2YjU1NzE1MzY4PpRoCksfQwYAAQgBGAGUKSl0lFKUaBNOTk50lFKUaBtoN32UfZQoaBVoCmgeaApoH32UaCFOaCJHPnrX8pq8r0iFlGgjaBZoJE5oJU5oJl2UaCh9lChoLIwEbWF0aJSMA2Nvc5STlGgtR0AJIftURC0YdXWGlIZSMHN1hpSGUjAu"
59
  },
60
  "_last_obs": {
61
  ":type:": "<class 'numpy.ndarray'>",
62
+ ":serialized:": "gAWVdQgAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYACAAAAAAAABpcmL3Inqg/VDKsvVx9Ar7biiK9Y+otvAAAAAAAAAAAALY8vPZQc7pyGpa7fy1MOEHtB7sKcec4AACAPwAAgD8Av5W9GWRRPuylOLzvMce9XtPku9bR3zwAAAAAAAAAAJqeVL3D+QK6S3mvOKtHo7WnIEK5lDbLtwAAgD8AAIA/LSmKPq/Iaj8C3Gq9bksPvsYNoDzGhE09AAAAAAAAAAAzg4S8rcFsP+heTj5drMi9i8zdPFbtJD0AAAAAAAAAABBiMD+o0II/47uqPnGqG74nmiU+O7OYOgAAAAAAAAAAYLuMvtnGNT+T6Io+5Of/vbB0kTy6ZIe7AAAAAAAAAABNGjI+nN93Pg1heb1XBQe+VhuGu9KpqDwAAAAAAAAAAHpWub5VFZ8/YbuuPcuVnL14YHi9678hPQAAAAAAAAAAzWvMPSMOJz2UcDW+Lyfjvbik47ymKZu9AAAAAAAAAAANuIE9XGsEujIlWDqQHtg1i4mbOrZSfbkAAIA/AACAP4aOCj4hRoQ/vhL6vDKb8b02Q2K75e1ZvQAAAAAAAAAAjXGyveFQjroCDRe5a8npNdZekjr0UbM3AACAPwAAgD+FKLq+6BWCP0TOgL0N83K9TmmKvXLME7sAAAAAAAAAAABA5jpXG7I//8GhO0LJzr3Zcly8GVUevQAAAAAAAAAAIDUkPhxASLz+EjY80e2duth3rL19X4G7AACAPwAAgD/60Uw+OGCou90OgTpL17W3TbUSvbZAmrkAAIA/AACAP5rHWTxzeIo/7pg/Pcu8Ab5t7a675VrMvAAAAAAAAAAAbcd+vhg0Kj+hr6s+YD6dvWpEXT1yowa9AAAAAAAAAABmHh28C/axPa8vib3br7S9+pmGu6Bvdz0AAAAAAAAAAAPU6z7uhEk/Yms8vv1pLL5ftSG7xQjevAAAAAAAAAAAzbpfPXt6pLoiVmK4GrVPszIjszpO+IE3AACAPwAAgD/T3DQ+m0z1PaPmNr6/JNW9Tmq6vCHVhL0AAAAAAAAAAFrq6j3hdGk+U1pWPaKOBL7o2fM8mcgBvAAAAAAAAAAArXImPulnQ7y/eis77zw4uemftb0AFFy6AACAPwAAgD8A/GK8KUxeutCgj7k8Xc2z9wN0u1J5pzgAAIA/AACAP9M+Yj4oYZo+Coatve/X5b3BwI079tsvvQAAAAAAAAAAxhcuPhksbD8CEXu8pai0veyfjzxL8dQ8AAAAAAAAAABAUN+9zvGLP1N9/Dwt/p69GwqJvJ3q7DwAAAAAAAAAAC0NEb5s1Jc/ToLmvqLfkr5SBO09AL7YvQAAAAAAAAAAY6KZPjl1Jz8OhOS939XsvWdZp7nmAi87AAAAAAAAAACKHe2+pYGFP2D4Vz1M0Za9zRdsvY5fzbwAAAAAAAAAAL3Nxj5XKno/z+DGO88JAr73EGg913uBuwAAAAAAAAAAmqwhvcMBarqnlR62PPsUseyCi7n4EkQ1AACAPwAAgD/aIhe+H+1OP1mQKz7uEoS9cNYOPJqcWbwAAAAAAAAAAIAidz17qrC6AtXUOsDHhTVPhy26OpjyuQAAgD8AAIA/yL/cvmuEPj/C84A+MakAvhT2RzwSULI9AAAAAAAAAAAAnJ29Evb0PhvqtT0ww+O9KPKROwTDIr0AAAAAAAAAAICZcz17hJe6HUzpOuKNRzVRavq6/sIFugAAgD8AAAAA4/rPPqJqsD+Htg0/11PrvStMLD5lhX68AAAAAAAAAABmzt+97FHsufRCQ7uv9o01RU4MOyCDYjoAAIA/AAAAAIAyaL0vG0Q/TlcpPlugmr0UhaY8WMCCPAAAAAAAAAAAWkSaPYWz7rl3g0K8Ng1MNZGqlzsLvby0AACAPwAAgD/Gki8+p7hEP92cWb0EKgy+EoJePI6GPj0AAAAAAAAAADPvvDuP2Dw/O1W0vMGw6b3LK2e8xrDHvAAAAAAAAAAAevyIPuT8T72lABI950K7u+3dt74fnoW8AACAPwAAgD/NhKS+F7AqPyB8gz79eMC9XpqWPP7PajwAAAAAAAAAAEDRUT7Xg167YIA7ubcZDTawxbS8ZttbOAAAgD8AAIA/M4rlPhifMT/uCDa9jPkGvgA0VT0Dwtu8AAAAAAAAAADaXAG+4i+3P98yib5wGLu9M6KuvYsQET0AAAAAAAAAAGLgC78GR4M/JOgmvvT2qL17tw++04pbPQAAAAAAAAAArSAZPq7/krrqmIW5JpMwNfmq1rsejJ84AACAPwAAgD9m2JK8euppPr1kzbwvuMS9Y3rputkOMTwAAAAAAAAAAJqJ5rpkZTE/AsGPuzK3or0CTOG6cJ5euwAAAAAAAAAA830GP4t0lz+YgpI+X2Quviwa9D2Oa1u9AAAAAAAAAADN73+9CeWOPrKsKj1l4sa9A/kTPPYlZDwAAAAAAAAAADMv77x03pE/bm21PIeJrb2bRpS80/ANOwAAAAAAAAAAmvG6u3jXmT8TKVk99Z1yvVJ1z7tDu0k8AAAAAAAAAADtb/Q+/O93P8L2IT3LewO+afIpPYFjCLwAAAAAAAAAAPjR7L5YepY/yGpOvu9/pb1w3ga+oq/TtwAAAAAAAAAATUKBPfa4SrqYZHg8/ASGPN8MeTvVH2o9AACAPwAAgD8wg5U+SbDdPrhxV76yRBK+c8ncvIKdVL0AAAAAAAAAAKbImr094WU8oJNRvmIekL18gCa9loOIPAAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYktASwiGlIwBQ5R0lFKULg=="
63
  },
64
  "_last_episode_starts": {
65
  ":type:": "<class 'numpy.ndarray'>",
66
+ ":serialized:": "gAWVswAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJZAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiS0CFlIwBQ5R0lFKULg=="
67
  },
68
  "_last_original_obs": null,
69
  "_episode_num": 0,
70
  "use_sde": false,
71
  "sde_sample_freq": -1,
72
+ "_current_progress_remaining": 0.0,
73
  "ep_info_buffer": {
74
  ":type:": "<class 'collections.deque'>",
75
+ ":serialized:": "gAWVgBAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIrRVtjnPdQkCUhpRSlIwBbJRN6AOMAXSUR0CQ+AfHPu5SdX2UKGgGaAloD0MIPpRoyWN/ZUCUhpRSlGgVTQkDaBZHQJEH4MDwH7h1fZQoaAZoCWgPQwiAu+zXnWpKQJSGlFKUaBVN6ANoFkdAkQz/bCaZyHV9lChoBmgJaA9DCAVvSKMC7WhAlIaUUpRoFU1eA2gWR0CREH6d1+y7dX2UKGgGaAloD0MIHCRE+QLOa0CUhpRSlGgVTfoCaBZHQJEZyvQnhKl1fZQoaAZoCWgPQwg/kSdJ1w5cQJSGlFKUaBVN6ANoFkdAkR5bQokRjHV9lChoBmgJaA9DCONTAIxnfWdAlIaUUpRoFU3wAmgWR0CRIybpu/DcdX2UKGgGaAloD0MI/OB86lhJW0CUhpRSlGgVTegDaBZHQJEmdK28Zk11fZQoaAZoCWgPQwg1C7Q7pD5FQJSGlFKUaBVN6ANoFkdAkSqT3IuGsXV9lChoBmgJaA9DCAhyUMLMbmhAlIaUUpRoFU3oAmgWR0CRM/depn6EdX2UKGgGaAloD0MIij20jxUJYECUhpRSlGgVTegDaBZHQJE0U4lyBCl1fZQoaAZoCWgPQwhRacTMvrVoQJSGlFKUaBVNUANoFkdAkTTGLLpzLnV9lChoBmgJaA9DCOSHSiNmV1NAlIaUUpRoFU3oA2gWR0CRNe6CDmKZdX2UKGgGaAloD0MIpFUt6SjFYkCUhpRSlGgVTdYCaBZHQJE68R28qWl1fZQoaAZoCWgPQwia0vpbgtxnQJSGlFKUaBVNmwNoFkdAkUBJu/Dcd3V9lChoBmgJaA9DCHSbcK/M1GJAlIaUUpRoFU0EA2gWR0CRQf5OrQw9dX2UKGgGaAloD0MI963WictMZkCUhpRSlGgVTQADaBZHQJFKUu14Pf91fZQoaAZoCWgPQwi7RPXWwGZDQJSGlFKUaBVN6ANoFkdAkUqUdzXBg3V9lChoBmgJaA9DCFVrYRZalmlAlIaUUpRoFU3hAmgWR0CRTQpblijMdX2UKGgGaAloD0MIu+8YHvs8XUCUhpRSlGgVTegDaBZHQJFO9ZowmE51fZQoaAZoCWgPQwhp/MIrSWdVQJSGlFKUaBVN6ANoFkdAkVDeD3/PxHV9lChoBmgJaA9DCC7HKxC9hGNAlIaUUpRoFU3fA2gWR0CRUfmw7kn1dX2UKGgGaAloD0MINNsV+mBXaECUhpRSlGgVTYwDaBZHQJFU4j/uLJl1fZQoaAZoCWgPQwgJGcizyxVjQJSGlFKUaBVNywNoFkdAkVyn+AEt/XV9lChoBmgJaA9DCITVWMLaamVAlIaUUpRoFU0XA2gWR0CRYYd1MdtEdX2UKGgGaAloD0MIUfhsHRxebECUhpRSlGgVTX0DaBZHQJFjv2Jzkp91fZQoaAZoCWgPQwhGtB1Td8dmQJSGlFKUaBVNGQNoFkdAkWsL1ZkkKXV9lChoBmgJaA9DCPPlBdhHzVRAlIaUUpRoFU3oA2gWR0CRbjXWvr4WdX2UKGgGaAloD0MI3enOE0/UZkCUhpRSlGgVTVgDaBZHQJFxAXwb2lF1fZQoaAZoCWgPQwgXg4dp3xVsQJSGlFKUaBVNFgNoFkdAkXTb8BMi8nV9lChoBmgJaA9DCCtLdJZZ3VNAlIaUUpRoFU3oA2gWR0CRdRpcX3xndX2UKGgGaAloD0MI7MGk+Pi8TUCUhpRSlGgVTegDaBZHQJGSvCWNWEN1fZQoaAZoCWgPQwjvHqD7cstiQJSGlFKUaBVN0gNoFkdAkZYVSS/0unV9lChoBmgJaA9DCCE6BI4E+GdAlIaUUpRoFU15A2gWR0CRlss1sLv1dX2UKGgGaAloD0MIaoe/JuuDakCUhpRSlGgVTfsCaBZHQJGYYT9KmKt1fZQoaAZoCWgPQwjG/Uemw/ZhQJSGlFKUaBVNRANoFkdAkZqXmA9V3nV9lChoBmgJaA9DCI54spuZ3GhAlIaUUpRoFU0YA2gWR0CRnYHqNZNgdX2UKGgGaAloD0MIAJATJowKPECUhpRSlGgVTegDaBZHQJGhfmSyMUB1fZQoaAZoCWgPQwiJJlDEoiRmQJSGlFKUaBVNAANoFkdAkaH3Z5AyEnV9lChoBmgJaA9DCNtv7URJjVRAlIaUUpRoFU3oA2gWR0CRpS/kNnXedX2UKGgGaAloD0MI0QX1LXNTYUCUhpRSlGgVTVMDaBZHQJGnLrOZ9eB1fZQoaAZoCWgPQwhE393KEpJZQJSGlFKUaBVN6ANoFkdAka1gh4dIXnV9lChoBmgJaA9DCNBCAkaXrVlAlIaUUpRoFU3oA2gWR0CRu9kNFz+4dX2UKGgGaAloD0MIGJXUCWjESUCUhpRSlGgVTegDaBZHQJHCRJ4B3id1fZQoaAZoCWgPQwgN+tLbHyJkQJSGlFKUaBVNBgNoFkdAkdBoOUdJa3V9lChoBmgJaA9DCAOUhhqFYVFAlIaUUpRoFU3oA2gWR0CR2iTd+G47dX2UKGgGaAloD0MIZOWXwRgnUECUhpRSlGgVTegDaBZHQJHhjj94u9R1fZQoaAZoCWgPQwhZEwt8RcteQJSGlFKUaBVN6ANoFkdAkfiWGh24eHV9lChoBmgJaA9DCFVOe0rOm0lAlIaUUpRoFU3oA2gWR0CSA1NjbzshdX2UKGgGaAloD0MIv7oqUIs2V0CUhpRSlGgVTegDaBZHQJIE0V9F4LV1fZQoaAZoCWgPQwjFknL3OYRGQJSGlFKUaBVN6ANoFkdAkgbDFZPl+3V9lChoBmgJaA9DCLZpbK8FOTVAlIaUUpRoFU3oA2gWR0CSFVlAu7HydX2UKGgGaAloD0MIrDdqhel6VUCUhpRSlGgVTegDaBZHQJIWusKb8WN1fZQoaAZoCWgPQwhprP2d7QpSQJSGlFKUaBVN6ANoFkdAkhdiOearm3V9lChoBmgJaA9DCCdKQiJtI1lAlIaUUpRoFU3oA2gWR0CSGXhZQpF1dX2UKGgGaAloD0MI9x+ZDp3+CECUhpRSlGgVTfsBaBZHQJIbnxwyZa51fZQoaAZoCWgPQwgJqHAEqd9ZQJSGlFKUaBVN6ANoFkdAkhylT3qRl3V9lChoBmgJaA9DCFcG1QYnPlxAlIaUUpRoFU3oA2gWR0CSIu7ROUMYdX2UKGgGaAloD0MIJzCd1m0IRUCUhpRSlGgVTegDaBZHQJIqhxlxwQ11fZQoaAZoCWgPQwiGqwMg7rlSQJSGlFKUaBVN6ANoFkdAkjVcj7hvSHV9lChoBmgJaA9DCHlZEwt831NAlIaUUpRoFU3oA2gWR0CSR29itq59dX2UKGgGaAloD0MIXaj8a3lRSUCUhpRSlGgVTegDaBZHQJJQOYv38Gd1fZQoaAZoCWgPQwhVUbzK2uNdQJSGlFKUaBVN9wJoFkdAklmo6XBxgnV9lChoBmgJaA9DCMDMd/CTqGFAlIaUUpRoFU0rA2gWR0CSYATHKfWddX2UKGgGaAloD0MIW+1hL5RLaUCUhpRSlGgVTbkDaBZHQJJ4Wn1nM+x1fZQoaAZoCWgPQwj0FaQZC/lnQJSGlFKUaBVNswJoFkdAknrx6nivPnV9lChoBmgJaA9DCAaf5uRFeGhAlIaUUpRoFU1WA2gWR0CSgGt5D7ZWdX2UKGgGaAloD0MI1NUdi239UECUhpRSlGgVTegDaBZHQJKB/KNhmXh1fZQoaAZoCWgPQwgsgCkDBw9rQJSGlFKUaBVNlANoFkdAkoKNWuHN5nV9lChoBmgJaA9DCF+0xwvpGl1AlIaUUpRoFU3oA2gWR0CSivF3pwCKdX2UKGgGaAloD0MIb9dLU4SpY0CUhpRSlGgVTYgDaBZHQJKN6l9Brvd1fZQoaAZoCWgPQwj5hsJn60dlQJSGlFKUaBVNuwNoFkdAko4uyE+PinV9lChoBmgJaA9DCCS5/Id09mpAlIaUUpRoFU27AmgWR0CSkSb7TDwZdX2UKGgGaAloD0MIOpShKibsZkCUhpRSlGgVTbsCaBZHQJKRczbeuV51fZQoaAZoCWgPQwiIvruVJVFUQJSGlFKUaBVN6ANoFkdAkpLmIGhVVHV9lChoBmgJaA9DCG9/LhqyVWpAlIaUUpRoFU1eA2gWR0CSnNXtBv74dX2UKGgGaAloD0MIkkCDTR1iaUCUhpRSlGgVTfUCaBZHQJKhNYhdMTN1fZQoaAZoCWgPQwiI9UatMI1qQJSGlFKUaBVNVgNoFkdAkqH9qgyuZHV9lChoBmgJaA9DCF0Y6UXtp1RAlIaUUpRoFU3oA2gWR0CSqL6oVEeAdX2UKGgGaAloD0MI2dDN/sCsYECUhpRSlGgVTVkCaBZHQJK066BiCrd1fZQoaAZoCWgPQwjdmJ6wxB5RQJSGlFKUaBVN6ANoFkdAkri6yjYZmHV9lChoBmgJaA9DCHqmlxhL72pAlIaUUpRoFU3GA2gWR0CSuzxFiKBNdX2UKGgGaAloD0MI00z3OqlyZECUhpRSlGgVTcsDaBZHQJK7uohpxm11fZQoaAZoCWgPQwgukQvO4GljQJSGlFKUaBVN4ANoFkdAksMukP+XJHV9lChoBmgJaA9DCOurqwK1Sl5AlIaUUpRoFU3oA2gWR0CSxU0PH1e0dX2UKGgGaAloD0MIR450BkbiUMCUhpRSlGgVS5VoFkdAksnqB/Zuh3V9lChoBmgJaA9DCL9hokEKplJAlIaUUpRoFU3oA2gWR0CSyjFY+0PZdX2UKGgGaAloD0MIWDm0yHYDWkCUhpRSlGgVTegDaBZHQJLOjpfQa751fZQoaAZoCWgPQwiP/wJBgOlYQJSGlFKUaBVN6ANoFkdAktiKDsdDIHV9lChoBmgJaA9DCGUBE7h1zmZAlIaUUpRoFU0VA2gWR0CS2O13+uNhdX2UKGgGaAloD0MIpyOAm8URR0CUhpRSlGgVTegDaBZHQJLaz7MxGlR1fZQoaAZoCWgPQwjChTyCG+BlQJSGlFKUaBVNmQNoFkdAktvEyckMTnV9lChoBmgJaA9DCAhZFkz8Y1ZAlIaUUpRoFU3oA2gWR0CS3GisGPgfdX2UKGgGaAloD0MIZhah2Ar6XUCUhpRSlGgVTegDaBZHQJLd//Q0GeN1fZQoaAZoCWgPQwjMC7CPTmddQJSGlFKUaBVN6ANoFkdAkt70xASnL3V9lChoBmgJaA9DCLd9j/rrwlNAlIaUUpRoFU3oA2gWR0CS6BJP69CedX2UKGgGaAloD0MIEHS0qiXpNECUhpRSlGgVTegDaBZHQJLsTr9l2/11fZQoaAZoCWgPQwh5eTpXlEpnQJSGlFKUaBVNaANoFkdAku/EBsANonV9lChoBmgJaA9DCNKqlnSUNmdAlIaUUpRoFU1hA2gWR0CS8tYzi0fHdX2UKGgGaAloD0MINE3YfjLPWkCUhpRSlGgVTegDaBZHQJL5B6X0Gu91ZS4="
76
  },
77
  "ep_success_buffer": {
78
  ":type:": "<class 'collections.deque'>",
79
  ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
80
  },
81
+ "_n_updates": 1280,
82
  "n_steps": 128,
83
+ "gamma": 0.9999,
84
  "gae_lambda": 0.95,
85
+ "ent_coef": 0.0001,
86
  "vf_coef": 0.5,
87
  "max_grad_norm": 0.5,
88
+ "batch_size": 2048,
89
  "n_epochs": 10,
90
  "clip_range": {
91
  ":type:": "<class 'function'>",
ppo-LunarLander-v2/policy.optimizer.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bfdf3e166069e2944a7e3570bede47da4f462aeb0de77f556b343f00c7c02652
3
  size 87929
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:22fa466626e2092189cbaa0260ab25e4cc7829c3ed6017d767c65bc716854e97
3
  size 87929
ppo-LunarLander-v2/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7e1041eb09b87cb1d8f5970007b29935f881e0235d2f6d2bbb9817b78ec73d77
3
  size 43201
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:97798434789f827e4a17d5635c00bb8ccffe13a502b1d48a5ec451339f34f640
3
  size 43201
replay.mp4 CHANGED
Binary files a/replay.mp4 and b/replay.mp4 differ
 
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": -530.2456635535752, "std_reward": 79.20735986802777, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2022-12-09T17:08:21.989143"}
 
1
+ {"mean_reward": 181.85235156533537, "std_reward": 36.62072669298787, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2022-12-09T18:51:00.039599"}