Abid commited on
Commit
59ff150
1 Parent(s): 9abd06b

best performing model with Hyperparmeter optimization

Browse files
Moonman-Lunar-Lander-v2.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:91f8cd7de742a30fd5468402ac98cc2e8f6eeb17bf1a987c8b410a90460dc489
3
- size 144028
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:304a3397d029255d10867095ad80c1c7579ce0b3b686aebe363931b8a33afe4e
3
+ size 144099
Moonman-Lunar-Lander-v2/data CHANGED
@@ -4,19 +4,19 @@
4
  ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
5
  "__module__": "stable_baselines3.common.policies",
6
  "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param sde_net_arch: Network architecture for extracting features\n when using gSDE. If None, the latent features from the policy will be used.\n Pass an empty list to use the states as features.\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
7
- "__init__": "<function ActorCriticPolicy.__init__ at 0x7f80342229e0>",
8
- "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f8034222a70>",
9
- "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f8034222b00>",
10
- "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f8034222b90>",
11
- "_build": "<function ActorCriticPolicy._build at 0x7f8034222c20>",
12
- "forward": "<function ActorCriticPolicy.forward at 0x7f8034222cb0>",
13
- "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f8034222d40>",
14
- "_predict": "<function ActorCriticPolicy._predict at 0x7f8034222dd0>",
15
- "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f8034222e60>",
16
- "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f8034222ef0>",
17
- "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f8034222f80>",
18
  "__abstractmethods__": "frozenset()",
19
- "_abc_impl": "<_abc_data object at 0x7f80341f92d0>"
20
  },
21
  "verbose": 1,
22
  "policy_kwargs": {},
@@ -42,12 +42,12 @@
42
  "_np_random": null
43
  },
44
  "n_envs": 16,
45
- "num_timesteps": 505680,
46
  "_total_timesteps": 500000,
47
  "_num_timesteps_at_start": 0,
48
  "seed": null,
49
  "action_noise": null,
50
- "start_time": 1652269635.8794794,
51
  "learning_rate": 0.0003,
52
  "tensorboard_log": null,
53
  "lr_schedule": {
@@ -56,7 +56,7 @@
56
  },
57
  "_last_obs": {
58
  ":type:": "<class 'numpy.ndarray'>",
59
- ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAFMoD76AOJ0/41elvkQEH7+XJ8u972uwvQAAAAAAAAAAmny3vQvI7z7CegS+C6qdvjhRor3euB28AAAAAAAAAADAKjK+2Fh1P2MgQb567Bu/0mt8vouIjr0AAAAAAAAAAIAEaz34wJ4/BzqVPmUBCb+H6LY9fow0PgAAAAAAAAAAM2x6Pqd4Cb0Hdjs8mTOxuppCb75O44O7AACAPwAAgD/Ntio8l1x/P/R8gjxHnRa/B8XlvFL2ubsAAAAAAAAAAEATJb6yauM+UjDTPRTFm74Y0Lq9S3WoOwAAAAAAAAAA7dMmPvurIz/naAM+6z3kvuFeCj5tRFO9AAAAAAAAAAAAV429LrX3PSrwrbxhcp++fEclvWKg7L0AAAAAAAAAAOaIOz1Ksgs+3Y7xvQFpQb4mEZm8G6O2uwAAAAAAAAAAmoztvYrcajxSm/w9OXMfvk96BrxQktc7AAAAAAAAAAAa6qE9mKOLPWJsm77cqiy+jQzrvds4Ur0AAAAAAAAAAC2zPL6+Rmk/DSbCvgmWIb9ENGS+fjX0vQAAAAAAAAAAmjbvPZw8fz/+9iA+nd/5vqPHHj7WVoq9AAAAAAAAAADNnFI74ZCTuh8qKbjgIzmzjAG5Os7sQzcAAIA/AACAP4CKob0UfYs92lpBPpPSlL62fik9dg07PAAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="
60
  },
61
  "_last_episode_starts": {
62
  ":type:": "<class 'numpy.ndarray'>",
@@ -66,23 +66,23 @@
66
  "_episode_num": 0,
67
  "use_sde": false,
68
  "sde_sample_freq": -1,
69
- "_current_progress_remaining": -0.011360000000000037,
70
  "ep_info_buffer": {
71
  ":type:": "<class 'collections.deque'>",
72
- ":serialized:": "gAWVQRAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIPX5v099pcECUhpRSlIwBbJRL9YwBdJRHQJX/7hLoOhF1fZQoaAZoCWgPQwghPUUOEcNHQJSGlFKUaBVLzWgWR0CV//S+QEIPdX2UKGgGaAloD0MIm/7sR4qAckCUhpRSlGgVTQ8BaBZHQJYA+RGMGX51fZQoaAZoCWgPQwhiZwqdFxpzQJSGlFKUaBVNGgFoFkdAlgGU5+6RQ3V9lChoBmgJaA9DCP9dnzlrhHFAlIaUUpRoFUviaBZHQJYBoghbGFV1fZQoaAZoCWgPQwjFWKZfIn9tQJSGlFKUaBVL52gWR0CWAw9ETg2qdX2UKGgGaAloD0MIcVga+NHYckCUhpRSlGgVS/9oFkdAlgWBf0Eov3V9lChoBmgJaA9DCDG0OjlDrWJAlIaUUpRoFU3oA2gWR0CWBkZqVQhwdX2UKGgGaAloD0MII/WeymmOYkCUhpRSlGgVTegDaBZHQJYIsetCAtp1fZQoaAZoCWgPQwjmXIqryutwQJSGlFKUaBVNCgFoFkdAlgkfV7Qb/HV9lChoBmgJaA9DCMLc7uX+wHJAlIaUUpRoFU0UAWgWR0CWCjOwxFiKdX2UKGgGaAloD0MI1lWBWszecECUhpRSlGgVS+xoFkdAlgqCjHn2ZnV9lChoBmgJaA9DCMxiYvPx5XBAlIaUUpRoFUvpaBZHQJYLWtaIN3J1fZQoaAZoCWgPQwjY1eQpa2JxQJSGlFKUaBVL4mgWR0CWC688cMmXdX2UKGgGaAloD0MIYvay7TRDaMCUhpRSlGgVTQoCaBZHQJYMNk1/DtR1fZQoaAZoCWgPQwhIiV3bG0JwQJSGlFKUaBVNKAFoFkdAlg0TOkcjq3V9lChoBmgJaA9DCJqzPuUY1W9AlIaUUpRoFUv5aBZHQJYOE5EMLF51fZQoaAZoCWgPQwhe9utON5BwQJSGlFKUaBVNJAFoFkdAlg5ob0e2eHV9lChoBmgJaA9DCPMAFvl1HmVAlIaUUpRoFU3oA2gWR0CWDs7KaG5+dX2UKGgGaAloD0MInGotzEKqY0CUhpRSlGgVTegDaBZHQJYRAHfMwDh1fZQoaAZoCWgPQwh/NJwyN9BTQJSGlFKUaBVL1mgWR0CWEZVZcLSedX2UKGgGaAloD0MI5Nh6hrByckCUhpRSlGgVTUABaBZHQJZm9zCDVYp1fZQoaAZoCWgPQwhOJ9nqcidxQJSGlFKUaBVL7mgWR0CWaGWSlnAZdX2UKGgGaAloD0MIaeBHNawxcUCUhpRSlGgVS+loFkdAlmh4WcjJMnV9lChoBmgJaA9DCMST3cxohm9AlIaUUpRoFUvmaBZHQJZo4O9WZJF1fZQoaAZoCWgPQwjaPA6DuaFxQJSGlFKUaBVNHgFoFkdAlmmwpON5t3V9lChoBmgJaA9DCJFGBU42i3FAlIaUUpRoFU0mAWgWR0CWabm+CbtrdX2UKGgGaAloD0MIeAyP/Sz4b0CUhpRSlGgVS/JoFkdAlmpkpAlfJHV9lChoBmgJaA9DCJ0std7vfXFAlIaUUpRoFU2FAWgWR0CWbOpxWDHwdX2UKGgGaAloD0MILhoyHiVDcECUhpRSlGgVTQsBaBZHQJZtDHNorWl1fZQoaAZoCWgPQwiw/s9hPsByQJSGlFKUaBVNDgFoFkdAlm2mjKxLTXV9lChoBmgJaA9DCEEN38I63WVAlIaUUpRoFU3oA2gWR0CWbdWu5jH5dX2UKGgGaAloD0MI88zLYffscECUhpRSlGgVS/9oFkdAlm9dvjwQUnV9lChoBmgJaA9DCIS3ByEgwXJAlIaUUpRoFU0PAWgWR0CWcLKs+3YudX2UKGgGaAloD0MIO3DOiBLycUCUhpRSlGgVS9BoFkdAlnG4GhVU/HV9lChoBmgJaA9DCIBEEygijHFAlIaUUpRoFUvQaBZHQJZxyRDCxeN1fZQoaAZoCWgPQwju68A5I3xiQJSGlFKUaBVN6ANoFkdAlnHi6DoQnXV9lChoBmgJaA9DCA0a+ic4jnFAlIaUUpRoFUvfaBZHQJZytmdy1eB1fZQoaAZoCWgPQwjpuBrZldduQJSGlFKUaBVL3mgWR0CWc1rzoUzsdX2UKGgGaAloD0MIWvYksLlrckCUhpRSlGgVS+JoFkdAlnOHpbD/EXV9lChoBmgJaA9DCEljtI4qn3FAlIaUUpRoFU0HAWgWR0CWdZpNKyv+dX2UKGgGaAloD0MIOZ1kq8tuUUCUhpRSlGgVS8hoFkdAlnX3mFJxvXV9lChoBmgJaA9DCOasTzmmV3BAlIaUUpRoFUvzaBZHQJZ3QQlKK511fZQoaAZoCWgPQwih8xq7RIdOQJSGlFKUaBVL5WgWR0CWd2ldTo+wdX2UKGgGaAloD0MID7kZbsCecUCUhpRSlGgVTQwBaBZHQJZ4ORHPNV11fZQoaAZoCWgPQwiwdD48Sx5EQJSGlFKUaBVLp2gWR0CWeZZ9/jKgdX2UKGgGaAloD0MIUtZvJqYzUECUhpRSlGgVS7loFkdAlntFrl/6PHV9lChoBmgJaA9DCGMl5llJfXFAlIaUUpRoFUvzaBZHQJZ72ZtvXK91fZQoaAZoCWgPQwhYPPVIwzFwQJSGlFKUaBVL+GgWR0CWfAC0WuYAdX2UKGgGaAloD0MIETl9PR+qc0CUhpRSlGgVTRMBaBZHQJZ8O8QI2O11fZQoaAZoCWgPQwj2KFyPgvNwQJSGlFKUaBVL/mgWR0CWfGbBXS0CdX2UKGgGaAloD0MIEJTb9r3mcUCUhpRSlGgVS+VoFkdAlnzluivgWXV9lChoBmgJaA9DCBEbLJykh2VAlIaUUpRoFU0KAmgWR0CWfWSpR4yHdX2UKGgGaAloD0MINNdppKXVcUCUhpRSlGgVTVEBaBZHQJZ9dahYeT51fZQoaAZoCWgPQwhy4UBIFgZGQJSGlFKUaBVLvWgWR0CWfYUVBUrDdX2UKGgGaAloD0MIl6lJ8IYgcUCUhpRSlGgVTQABaBZHQJaAM1XNke91fZQoaAZoCWgPQwi4WicuR5FtQJSGlFKUaBVL5GgWR0CWgEkSmIj4dX2UKGgGaAloD0MIMSWS6OVDckCUhpRSlGgVS/ZoFkdAltQ/VNHpbHV9lChoBmgJaA9DCPc96q9X4EtAlIaUUpRoFUuxaBZHQJbVFUaQ3gl1fZQoaAZoCWgPQwiVfOwuEMZwQJSGlFKUaBVNBgFoFkdAltWdp7CzknV9lChoBmgJaA9DCGyTisZaEmdAlIaUUpRoFU3oA2gWR0CW1bwZwXImdX2UKGgGaAloD0MI2XiwxW79b0CUhpRSlGgVS+toFkdAltXZGFzuGHV9lChoBmgJaA9DCKa6gJfZ+HBAlIaUUpRoFUvdaBZHQJbXRAxBVuJ1fZQoaAZoCWgPQwga3qzBu41wQJSGlFKUaBVL7mgWR0CW2FUg0TDgdX2UKGgGaAloD0MImNwosla6bkCUhpRSlGgVS+RoFkdAltib/S6UaHV9lChoBmgJaA9DCMWsF0O5aHFAlIaUUpRoFUvXaBZHQJbYnFhoduJ1fZQoaAZoCWgPQwgQW3o0lVVyQJSGlFKUaBVL9WgWR0CW2LxtYSxrdX2UKGgGaAloD0MImzkktZD4cUCUhpRSlGgVS/5oFkdAltiz0QK8c3V9lChoBmgJaA9DCEtywK7mq3BAlIaUUpRoFUvqaBZHQJbZSt4iX6Z1fZQoaAZoCWgPQwhcBTHQtZluQJSGlFKUaBVNBAFoFkdAltpBAv+OwXV9lChoBmgJaA9DCJOKxtrftHFAlIaUUpRoFU3EA2gWR0CW23N5+pfhdX2UKGgGaAloD0MIEHf1KjJocUCUhpRSlGgVS/FoFkdAltxIRdyDI3V9lChoBmgJaA9DCHOh8q9lrXBAlIaUUpRoFUvRaBZHQJbcpQVKwpx1fZQoaAZoCWgPQwgBGTp2EF5wQJSGlFKUaBVL+GgWR0CW3TIiTt9hdX2UKGgGaAloD0MI/oFy2773TkCUhpRSlGgVS61oFkdAlt1TfJmuknV9lChoBmgJaA9DCMqLTMCvWHJAlIaUUpRoFU0bAWgWR0CW3Zhpxm03dX2UKGgGaAloD0MIflUuVP6Jb0CUhpRSlGgVS/doFkdAlt5S2H+IdnV9lChoBmgJaA9DCG/whcmUx3FAlIaUUpRoFUvxaBZHQJbeTsrupjt1fZQoaAZoCWgPQwjxSScSzNZyQJSGlFKUaBVNIgFoFkdAlt+0cjqv/3V9lChoBmgJaA9DCCCWzRzSg3BAlIaUUpRoFUvyaBZHQJbgWGDcuap1fZQoaAZoCWgPQwiaz7nbNdlxQJSGlFKUaBVL8mgWR0CW4JV6NVBEdX2UKGgGaAloD0MIO/w1WSNXbUCUhpRSlGgVS/RoFkdAluC1cdHUdHV9lChoBmgJaA9DCA7Xag/7P3FAlIaUUpRoFU0EAWgWR0CW4R71ZkkKdX2UKGgGaAloD0MIZVBtcGJ4cUCUhpRSlGgVS/NoFkdAluE6fzz3AXV9lChoBmgJaA9DCHmVtU2xPHJAlIaUUpRoFU0EAWgWR0CW4TocaOxTdX2UKGgGaAloD0MIFVYqqKjbckCUhpRSlGgVS/loFkdAluIsmShaknV9lChoBmgJaA9DCIf7yK1J4z5AlIaUUpRoFUvJaBZHQJbjfcVQAMl1fZQoaAZoCWgPQwhIwr6dxNVwQJSGlFKUaBVL6mgWR0CW496j3225dX2UKGgGaAloD0MIuVD513KSckCUhpRSlGgVS99oFkdAluQW/8EV33V9lChoBmgJaA9DCKGhf4ILFnFAlIaUUpRoFU0OAWgWR0CW5K5UcXFcdX2UKGgGaAloD0MIQ+OJIA7vckCUhpRSlGgVS+toFkdAluTWucMEzXV9lChoBmgJaA9DCCgK9In8BHBAlIaUUpRoFUvraBZHQJbljY4ACGN1fZQoaAZoCWgPQwgBUTBjCh5wQJSGlFKUaBVNBgFoFkdAluZ0qx1PnHV9lChoBmgJaA9DCKosCrsomlJAlIaUUpRoFUvYaBZHQJbnGPq9oOB1fZQoaAZoCWgPQwheK6G7JOdvQJSGlFKUaBVL9GgWR0CW52mEXcgydX2UKGgGaAloD0MIHaopybpPbkCUhpRSlGgVS+NoFkdAlue5aJQ+EHV9lChoBmgJaA9DCEdX6e56v3FAlIaUUpRoFUvgaBZHQJboORFI/aB1fZQoaAZoCWgPQwgoRpbMMeRsQJSGlFKUaBVL7GgWR0CW6CwYLsrvdX2UKGgGaAloD0MI6dfWT3/ZcECUhpRSlGgVS+BoFkdAluhTdtVJc3V9lChoBmgJaA9DCCWTUzsDXXJAlIaUUpRoFUvxaBZHQJboy6kIomZ1ZS4="
73
  },
74
  "ep_success_buffer": {
75
  ":type:": "<class 'collections.deque'>",
76
  ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
77
  },
78
- "_n_updates": 490,
79
- "n_steps": 645,
80
  "gamma": 0.997,
81
- "gae_lambda": 0.97,
82
  "ent_coef": 0.01,
83
  "vf_coef": 0.5,
84
  "max_grad_norm": 0.5,
85
- "batch_size": 32,
86
  "n_epochs": 10,
87
  "clip_range": {
88
  ":type:": "<class 'function'>",
 
4
  ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
5
  "__module__": "stable_baselines3.common.policies",
6
  "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param sde_net_arch: Network architecture for extracting features\n when using gSDE. If None, the latent features from the policy will be used.\n Pass an empty list to use the states as features.\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
7
+ "__init__": "<function ActorCriticPolicy.__init__ at 0x7f06d9ef5170>",
8
+ "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f06d9ef5200>",
9
+ "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f06d9ef5290>",
10
+ "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f06d9ef5320>",
11
+ "_build": "<function ActorCriticPolicy._build at 0x7f06d9ef53b0>",
12
+ "forward": "<function ActorCriticPolicy.forward at 0x7f06d9ef5440>",
13
+ "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f06d9ef54d0>",
14
+ "_predict": "<function ActorCriticPolicy._predict at 0x7f06d9ef5560>",
15
+ "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f06d9ef55f0>",
16
+ "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f06d9ef5680>",
17
+ "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f06d9ef5710>",
18
  "__abstractmethods__": "frozenset()",
19
+ "_abc_impl": "<_abc_data object at 0x7f06d9f37ab0>"
20
  },
21
  "verbose": 1,
22
  "policy_kwargs": {},
 
42
  "_np_random": null
43
  },
44
  "n_envs": 16,
45
+ "num_timesteps": 512000,
46
  "_total_timesteps": 500000,
47
  "_num_timesteps_at_start": 0,
48
  "seed": null,
49
  "action_noise": null,
50
+ "start_time": 1652273847.1759872,
51
  "learning_rate": 0.0003,
52
  "tensorboard_log": null,
53
  "lr_schedule": {
 
56
  },
57
  "_last_obs": {
58
  ":type:": "<class 'numpy.ndarray'>",
59
+ ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAADOEQb2B2OU96WMQPrUcjL55wNw8tizxvAAAAAAAAAAAZjY8O+X9VT59cOU74iheviu2iTw2Wgq8AAAAAAAAAAAzom49KVAPulpRkDqtHZo1uiNBOiRDpLkAAIA/AACAP81oKrykk2084ckLPisiNr44D8k9zbwzvQAAAAAAAAAA8/v2PXu2v7rucdI5pES/tiaNNbzza/24AACAPwAAgD+mZ6E9KZh1ujBUhzWHiaYwGftbO06OubQAAIA/AACAP2YWETt7soq6ohmnuxEIQDUE5Ya4nkLAOgAAgD8AAIA/M2eyPOz0pT5vvBa9QpukvptpzTsTY1k8AAAAAAAAAAAz1hQ9e26zul7FCTqEZ4a1pan8uVwxHbkAAIA/AACAPzO4uDxceyG6ZklHuxwvD7bgcQw6ncBoOgAAgD8AAIA/M+eyPVxbULqLope7auX2OYqJvjpOsIy6AACAPwAAgD+aFlY9XOtxuqcBtTpeRi02lB9DOl3nz7kAAIA/AACAPxPMXr7E57g+t8A/PiSKlb5ibQ6+lt1KPQAAAAAAAAAATVmKPVIQqbm4InK5kTvRtPJrYzvulpA4AACAPwAAgD/awdU95JJlP2hQDTzDzfC+1FgzPh5ZCLsAAAAAAAAAAAClJT1sKve7D1gEPI1vKzyJhF29DL4UPQAAgD8AAIA/lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="
60
  },
61
  "_last_episode_starts": {
62
  ":type:": "<class 'numpy.ndarray'>",
 
66
  "_episode_num": 0,
67
  "use_sde": false,
68
  "sde_sample_freq": -1,
69
+ "_current_progress_remaining": -0.02400000000000002,
70
  "ep_info_buffer": {
71
  ":type:": "<class 'collections.deque'>",
72
+ ":serialized:": "gAWVeBAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMI4pANpIvAZUCUhpRSlIwBbJRN6AOMAXSUR0Cj8UsMZxaQdX2UKGgGaAloD0MI0qsBSsMlZ0CUhpRSlGgVTegDaBZHQKPymowVTJh1fZQoaAZoCWgPQwgZj1IJzzxvQJSGlFKUaBVNzQJoFkdAo/Raf4AS4HV9lChoBmgJaA9DCDgvTnw11WhAlIaUUpRoFU3oA2gWR0Cj9cxcmjTKdX2UKGgGaAloD0MIaB8r+G3oZECUhpRSlGgVTegDaBZHQKP2XvOQhfV1fZQoaAZoCWgPQwhnSBXFK/JyQJSGlFKUaBVNIwFoFkdAo/bpKraM73V9lChoBmgJaA9DCM+8HHbfFWVAlIaUUpRoFU3oA2gWR0Cj+BgVXV9XdX2UKGgGaAloD0MIHeVgNgFrZkCUhpRSlGgVTegDaBZHQKP4gPlMh5h1fZQoaAZoCWgPQwhOfSB558VVQJSGlFKUaBVLm2gWR0Cj+cI5ggHNdX2UKGgGaAloD0MIlE4kmOrsY0CUhpRSlGgVTegDaBZHQKP6g+otL+R1fZQoaAZoCWgPQwhK7xtfe3xvQJSGlFKUaBVNgwFoFkdAo/uE4tHx0HV9lChoBmgJaA9DCD4JbM5BwHBAlIaUUpRoFU2PA2gWR0Cj/LPHtF8YdX2UKGgGaAloD0MIA0AVNy5DcUCUhpRSlGgVTWkCaBZHQKP87nBciW51fZQoaAZoCWgPQwi3Yn/ZPQdkQJSGlFKUaBVN6ANoFkdApAETWAf+0nV9lChoBmgJaA9DCK358ZcWIW1AlIaUUpRoFU31AWgWR0CkAbE/8l5XdX2UKGgGaAloD0MIhSaJJWVZcECUhpRSlGgVTZUBaBZHQKQDbS0jTrp1fZQoaAZoCWgPQwgCg6RPK7NsQJSGlFKUaBVNVwNoFkdApATbb+Lm63V9lChoBmgJaA9DCJp8s80N/GNAlIaUUpRoFU3oA2gWR0CkBVykCV8kdX2UKGgGaAloD0MIOPdXj3uhZ0CUhpRSlGgVTegDaBZHQKQFjyeZof11fZQoaAZoCWgPQwhaSSu+oQtkQJSGlFKUaBVN6ANoFkdApIP5zJZGKHV9lChoBmgJaA9DCOvkDMWdHXBAlIaUUpRoFU2XA2gWR0CkiKtz8xbjdX2UKGgGaAloD0MIDrxa7ozAcECUhpRSlGgVTQYDaBZHQKSJCjCYTkB1fZQoaAZoCWgPQwjQmbSpunZyQJSGlFKUaBVN4gFoFkdApI7I6IWP93V9lChoBmgJaA9DCPtz0ZDxMWFAlIaUUpRoFU3oA2gWR0Ckj772L5ymdX2UKGgGaAloD0MITMecZ2yEaECUhpRSlGgVTegDaBZHQKSR+XHim2t1fZQoaAZoCWgPQwie0VYlEVtiQJSGlFKUaBVN6ANoFkdApJQPy08eS3V9lChoBmgJaA9DCI22KoksdnJAlIaUUpRoFU1oAmgWR0CklLkFnqVydX2UKGgGaAloD0MIhjlBmxw6RECUhpRSlGgVS59oFkdApJTYNkOI7HV9lChoBmgJaA9DCNXrFoGxAmlAlIaUUpRoFU3oA2gWR0CklPawdKdydX2UKGgGaAloD0MIvhb03hjDcECUhpRSlGgVTaIBaBZHQKSWA2jO9nN1fZQoaAZoCWgPQwiNCTGX1DhjQJSGlFKUaBVN6ANoFkdApJYK55JK8XV9lChoBmgJaA9DCFluaTWk12NAlIaUUpRoFU3oA2gWR0CklygB91EFdX2UKGgGaAloD0MIpOTVOQaOZUCUhpRSlGgVTegDaBZHQKSXYfSx7iR1fZQoaAZoCWgPQwiUFi6rsElDQJSGlFKUaBVLimgWR0CkmEnYg7o0dX2UKGgGaAloD0MIO6kvS7tCZECUhpRSlGgVTegDaBZHQKUZLfWtlqd1fZQoaAZoCWgPQwgw16IFaPpnQJSGlFKUaBVN6ANoFkdApRnBfdAPd3V9lChoBmgJaA9DCJI+raJ/NnNAlIaUUpRoFU0kAWgWR0ClG52IoE0SdX2UKGgGaAloD0MIUoAomLH5Y0CUhpRSlGgVTegDaBZHQKUdbltj0+V1fZQoaAZoCWgPQwhXem02Vg1gQJSGlFKUaBVN6ANoFkdApR2fiT+vQnV9lChoBmgJaA9DCOdQhqqYpWRAlIaUUpRoFU3oA2gWR0ClH4A/s3Q2dX2UKGgGaAloD0MISQ7Y1WRSZkCUhpRSlGgVTegDaBZHQKUkMeZG8VZ1fZQoaAZoCWgPQwg9SE+RA4RxQJSGlFKUaBVNgQJoFkdApSidZDArQXV9lChoBmgJaA9DCEkrvqFwUGVAlIaUUpRoFU3oA2gWR0ClKadZA6dUdX2UKGgGaAloD0MI/G1PkFiYYkCUhpRSlGgVTegDaBZHQKUsii8nNPh1fZQoaAZoCWgPQwibN04KcyBhQJSGlFKUaBVN6ANoFkdApS5/UnXumnV9lChoBmgJaA9DCGvXhLRGqWVAlIaUUpRoFU3oA2gWR0ClLySAxzq9dX2UKGgGaAloD0MIkElGzkKDZUCUhpRSlGgVTegDaBZHQKUvXtw71Zl1fZQoaAZoCWgPQwhi9rLtNONkQJSGlFKUaBVN6ANoFkdApTBr28IzFnV9lChoBmgJaA9DCEEN38K6ZXFAlIaUUpRoFU2lAmgWR0ClrXa6z3RHdX2UKGgGaAloD0MIcOtunupJZkCUhpRSlGgVTegDaBZHQKWt3dZ7ojh1fZQoaAZoCWgPQwg3+pgPCIhlQJSGlFKUaBVN6ANoFkdApa4fSpiqhnV9lChoBmgJaA9DCMfXnlnSl3FAlIaUUpRoFU0PA2gWR0ClrpoB7u2JdX2UKGgGaAloD0MICMkCJvDpaECUhpRSlGgVTegDaBZHQKWyLOqNp/R1fZQoaAZoCWgPQwjdtYR8UMppQJSGlFKUaBVN6ANoFkdApbLPJ7sv7HV9lChoBmgJaA9DCEt1AS/z8nBAlIaUUpRoFU1ZAWgWR0CltVI7/4qPdX2UKGgGaAloD0MIkGYsmo6acUCUhpRSlGgVTTQBaBZHQKW2bHww0wd1fZQoaAZoCWgPQwiXdJSDWT5jQJSGlFKUaBVN6ANoFkdApbchwhnrZHV9lChoBmgJaA9DCC4dc54xD2VAlIaUUpRoFU3oA2gWR0CluTzYVZcLdX2UKGgGaAloD0MI11HVBFHiZUCUhpRSlGgVTegDaBZHQKW+YBpYcNp1fZQoaAZoCWgPQwgdAdwsnpRyQJSGlFKUaBVNXgFoFkdApcJi8an753V9lChoBmgJaA9DCHjuPVzyL2ZAlIaUUpRoFU3oA2gWR0ClwzcAzYVZdX2UKGgGaAloD0MIixagbTW8Z0CUhpRSlGgVTegDaBZHQKXEQ1eBxxV1fZQoaAZoCWgPQwiKA+j3/W1NQJSGlFKUaBVLsmgWR0ClxFOkUKzBdX2UKGgGaAloD0MILVvri4RrZECUhpRSlGgVTegDaBZHQKZFE+2VmjF1fZQoaAZoCWgPQwjdRZiiXDxiQJSGlFKUaBVN6ANoFkdApkcdPYWcjXV9lChoBmgJaA9DCHxgx3+Bs2VAlIaUUpRoFU3oA2gWR0CmR8XcYZVGdX2UKGgGaAloD0MIf4eiQB+vY0CUhpRSlGgVTegDaBZHQKZJLA6+36R1fZQoaAZoCWgPQwhGzy10pRZhQJSGlFKUaBVN6ANoFkdApkqsIiTt9nV9lChoBmgJaA9DCINStHKvRWlAlIaUUpRoFU3oA2gWR0CmSvUaqCHzdX2UKGgGaAloD0MINIEiFjHOZECUhpRSlGgVTegDaBZHQKZLir1/UfB1fZQoaAZoCWgPQwiYUSy3tMhKQJSGlFKUaBVLtWgWR0CmTVWNm16WdX2UKGgGaAloD0MI9x4uOe7CZUCUhpRSlGgVTegDaBZHQKZPjvKlpGp1fZQoaAZoCWgPQwgogGJkSR5hQJSGlFKUaBVN6ANoFkdAplA6OzY29HV9lChoBmgJaA9DCPKaV3VWwGNAlIaUUpRoFU3oA2gWR0CmUp5u63AmdX2UKGgGaAloD0MIgT/8/PeGTECUhpRSlGgVS7FoFkdAplLF6LOzIHV9lChoBmgJaA9DCPPK9baZKGNAlIaUUpRoFU3oA2gWR0CmU6I6r/83dX2UKGgGaAloD0MIzSIUW0H7YECUhpRSlGgVTegDaBZHQKZWSs90Rvp1fZQoaAZoCWgPQwhTzaylgOhMQJSGlFKUaBVLyGgWR0CmWNAvtdAxdX2UKGgGaAloD0MImNwoslY+YUCUhpRSlGgVTegDaBZHQKbbU7J4jbB1fZQoaAZoCWgPQwirIAa6dglmQJSGlFKUaBVN6ANoFkdAptwjv9cbBHV9lChoBmgJaA9DCHiZYaPs5XBAlIaUUpRoFU0+A2gWR0Cm3P0AtFrmdX2UKGgGaAloD0MIlgfpKbKxcECUhpRSlGgVTVABaBZHQKbdILBsQ/Z1fZQoaAZoCWgPQwgN3lflwoViQJSGlFKUaBVN6ANoFkdApt07VrhzeXV9lChoBmgJaA9DCAPpYtPKoGBAlIaUUpRoFU3oA2gWR0Cm3Uov8IiUdX2UKGgGaAloD0MIisqGNZU0bUCUhpRSlGgVTSYBaBZHQKbeIhje9Bd1fZQoaAZoCWgPQwgbutkfKPtuQJSGlFKUaBVNeQJoFkdApt9+KXOW0XV9lChoBmgJaA9DCLKbGf1oz2RAlIaUUpRoFU3oA2gWR0Cm36itA9mpdX2UKGgGaAloD0MI6E8b1WltaECUhpRSlGgVTegDaBZHQKbi4IO6NER1fZQoaAZoCWgPQwiZnxuaMnNjQJSGlFKUaBVN6ANoFkdApuQwbEP1+XV9lChoBmgJaA9DCP9YiA6BM19AlIaUUpRoFU3oA2gWR0Cm5HBMSK3vdX2UKGgGaAloD0MI8ppXdVaFZkCUhpRSlGgVTegDaBZHQKbk8JRfnfV1fZQoaAZoCWgPQwiM17yqsxdSQJSGlFKUaBVL22gWR0Cm5TOpbUw0dX2UKGgGaAloD0MIX7Uy4dfWcUCUhpRSlGgVTa4BaBZHQKbmrtUn5SF1fZQoaAZoCWgPQwj5oGezqjZwQJSGlFKUaBVNTgFoFkdApugOxdIGyHV9lChoBmgJaA9DCMoxWdz/425AlIaUUpRoFU2EAWgWR0Cm6A2uPmxMdX2UKGgGaAloD0MIujDSi9p0Y0CUhpRSlGgVTegDaBZHQKboWEIw/Ph1fZQoaAZoCWgPQwjuJvim6eJvQJSGlFKUaBVN3AFoFkdApulPDR+jM3V9lChoBmgJaA9DCCGunL0z+k1AlIaUUpRoFUvIaBZHQKbqKcy31Bd1fZQoaAZoCWgPQwhszOuIQ0hjQJSGlFKUaBVN6ANoFkdApuqis8xKx3V9lChoBmgJaA9DCH3mrE+5q2JAlIaUUpRoFU3oA2gWR0Cm62j9GZuydWUu"
73
  },
74
  "ep_success_buffer": {
75
  ":type:": "<class 'collections.deque'>",
76
  ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
77
  },
78
+ "_n_updates": 400,
79
+ "n_steps": 800,
80
  "gamma": 0.997,
81
+ "gae_lambda": 0.98,
82
  "ent_coef": 0.01,
83
  "vf_coef": 0.5,
84
  "max_grad_norm": 0.5,
85
+ "batch_size": 16,
86
  "n_epochs": 10,
87
  "clip_range": {
88
  ":type:": "<class 'function'>",
Moonman-Lunar-Lander-v2/policy.optimizer.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3bfa4cea32ae6d6f84329e119143bb66011583e3b68d61721a3831311a5e1c32
3
  size 84893
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c4b6cd295c0d69834c9b6d58e44388d4dfb86f34f09e88b4122a4dfad4c2eee5
3
  size 84893
Moonman-Lunar-Lander-v2/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b2ca2f9e2f00c6bf6d8a31b38237fb40f3cdd5e7dc02951034ec7c7fb7c6e2ca
3
  size 43201
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9c2880468f5ccbff2fda44ee711941801a6dcd2d82c15eb5da8fd62bc56519c7
3
  size 43201
README.md CHANGED
@@ -10,7 +10,7 @@ model-index:
10
  results:
11
  - metrics:
12
  - type: mean_reward
13
- value: 287.76 +/- 13.72
14
  name: mean_reward
15
  task:
16
  type: reinforcement-learning
 
10
  results:
11
  - metrics:
12
  - type: mean_reward
13
+ value: 244.28 +/- 67.94
14
  name: mean_reward
15
  task:
16
  type: reinforcement-learning
config.json CHANGED
@@ -1 +1 @@
1
- {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param sde_net_arch: Network architecture for extracting features\n when using gSDE. If None, the latent features from the policy will be used.\n Pass an empty list to use the states as features.\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7f80342229e0>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f8034222a70>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f8034222b00>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f8034222b90>", "_build": "<function ActorCriticPolicy._build at 0x7f8034222c20>", "forward": "<function ActorCriticPolicy.forward at 0x7f8034222cb0>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f8034222d40>", "_predict": "<function ActorCriticPolicy._predict at 0x7f8034222dd0>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f8034222e60>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f8034222ef0>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f8034222f80>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc_data object at 0x7f80341f92d0>"}, "verbose": 1, "policy_kwargs": {}, "observation_space": {":type:": "<class 'gym.spaces.box.Box'>", ":serialized:": "gAWVnwEAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLCIWUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWIAAAAAAAAAAAAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/5RoCksIhZSMAUOUdJRSlIwEaGlnaJRoEiiWIAAAAAAAAAAAAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAf5RoCksIhZRoFXSUUpSMDWJvdW5kZWRfYmVsb3eUaBIolggAAAAAAAAAAAAAAAAAAACUaAeMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLCIWUaBV0lFKUjA1ib3VuZGVkX2Fib3ZllGgSKJYIAAAAAAAAAAAAAAAAAAAAlGghSwiFlGgVdJRSlIwKX25wX3JhbmRvbZROdWIu", "dtype": "float32", "_shape": [8], "low": "[-inf -inf -inf -inf -inf -inf -inf -inf]", "high": "[inf inf inf inf inf inf inf inf]", "bounded_below": "[False False False False False False False False]", "bounded_above": "[False False False False False False False False]", "_np_random": null}, "action_space": {":type:": "<class 'gym.spaces.discrete.Discrete'>", ":serialized:": "gAWVggAAAAAAAACME2d5bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpRLBIwGX3NoYXBllCmMBWR0eXBllIwFbnVtcHmUaAeTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYowKX25wX3JhbmRvbZROdWIu", "n": 4, "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 16, "num_timesteps": 505680, "_total_timesteps": 500000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1652269635.8794794, "learning_rate": 0.0003, "tensorboard_log": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVvwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwNX2J1aWx0aW5fdHlwZZSTlIwKTGFtYmRhVHlwZZSFlFKUKGgCjAhDb2RlVHlwZZSFlFKUKEsBSwBLAUsBSxNDBIgAUwCUToWUKYwBX5SFlIxIL3Vzci9sb2NhbC9saWIvcHl0aG9uMy43L2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5RLgEMCAAGUjAN2YWyUhZQpdJRSlH2UKIwLX19wYWNrYWdlX1+UjBhzdGFibGVfYmFzZWxpbmVzMy5jb21tb26UjAhfX25hbWVfX5SMHnN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi51dGlsc5SMCF9fZmlsZV9flIxIL3Vzci9sb2NhbC9saWIvcHl0aG9uMy43L2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaCB9lH2UKGgXaA6MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgYjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz8zqSowVTJhhZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAFMoD76AOJ0/41elvkQEH7+XJ8u972uwvQAAAAAAAAAAmny3vQvI7z7CegS+C6qdvjhRor3euB28AAAAAAAAAADAKjK+2Fh1P2MgQb567Bu/0mt8vouIjr0AAAAAAAAAAIAEaz34wJ4/BzqVPmUBCb+H6LY9fow0PgAAAAAAAAAAM2x6Pqd4Cb0Hdjs8mTOxuppCb75O44O7AACAPwAAgD/Ntio8l1x/P/R8gjxHnRa/B8XlvFL2ubsAAAAAAAAAAEATJb6yauM+UjDTPRTFm74Y0Lq9S3WoOwAAAAAAAAAA7dMmPvurIz/naAM+6z3kvuFeCj5tRFO9AAAAAAAAAAAAV429LrX3PSrwrbxhcp++fEclvWKg7L0AAAAAAAAAAOaIOz1Ksgs+3Y7xvQFpQb4mEZm8G6O2uwAAAAAAAAAAmoztvYrcajxSm/w9OXMfvk96BrxQktc7AAAAAAAAAAAa6qE9mKOLPWJsm77cqiy+jQzrvds4Ur0AAAAAAAAAAC2zPL6+Rmk/DSbCvgmWIb9ENGS+fjX0vQAAAAAAAAAAmjbvPZw8fz/+9iA+nd/5vqPHHj7WVoq9AAAAAAAAAADNnFI74ZCTuh8qKbjgIzmzjAG5Os7sQzcAAIA/AACAP4CKob0UfYs92lpBPpPSlL62fik9dg07PAAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.011360000000000037, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVQRAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIPX5v099pcECUhpRSlIwBbJRL9YwBdJRHQJX/7hLoOhF1fZQoaAZoCWgPQwghPUUOEcNHQJSGlFKUaBVLzWgWR0CV//S+QEIPdX2UKGgGaAloD0MIm/7sR4qAckCUhpRSlGgVTQ8BaBZHQJYA+RGMGX51fZQoaAZoCWgPQwhiZwqdFxpzQJSGlFKUaBVNGgFoFkdAlgGU5+6RQ3V9lChoBmgJaA9DCP9dnzlrhHFAlIaUUpRoFUviaBZHQJYBoghbGFV1fZQoaAZoCWgPQwjFWKZfIn9tQJSGlFKUaBVL52gWR0CWAw9ETg2qdX2UKGgGaAloD0MIcVga+NHYckCUhpRSlGgVS/9oFkdAlgWBf0Eov3V9lChoBmgJaA9DCDG0OjlDrWJAlIaUUpRoFU3oA2gWR0CWBkZqVQhwdX2UKGgGaAloD0MII/WeymmOYkCUhpRSlGgVTegDaBZHQJYIsetCAtp1fZQoaAZoCWgPQwjmXIqryutwQJSGlFKUaBVNCgFoFkdAlgkfV7Qb/HV9lChoBmgJaA9DCMLc7uX+wHJAlIaUUpRoFU0UAWgWR0CWCjOwxFiKdX2UKGgGaAloD0MI1lWBWszecECUhpRSlGgVS+xoFkdAlgqCjHn2ZnV9lChoBmgJaA9DCMxiYvPx5XBAlIaUUpRoFUvpaBZHQJYLWtaIN3J1fZQoaAZoCWgPQwjY1eQpa2JxQJSGlFKUaBVL4mgWR0CWC688cMmXdX2UKGgGaAloD0MIYvay7TRDaMCUhpRSlGgVTQoCaBZHQJYMNk1/DtR1fZQoaAZoCWgPQwhIiV3bG0JwQJSGlFKUaBVNKAFoFkdAlg0TOkcjq3V9lChoBmgJaA9DCJqzPuUY1W9AlIaUUpRoFUv5aBZHQJYOE5EMLF51fZQoaAZoCWgPQwhe9utON5BwQJSGlFKUaBVNJAFoFkdAlg5ob0e2eHV9lChoBmgJaA9DCPMAFvl1HmVAlIaUUpRoFU3oA2gWR0CWDs7KaG5+dX2UKGgGaAloD0MInGotzEKqY0CUhpRSlGgVTegDaBZHQJYRAHfMwDh1fZQoaAZoCWgPQwh/NJwyN9BTQJSGlFKUaBVL1mgWR0CWEZVZcLSedX2UKGgGaAloD0MI5Nh6hrByckCUhpRSlGgVTUABaBZHQJZm9zCDVYp1fZQoaAZoCWgPQwhOJ9nqcidxQJSGlFKUaBVL7mgWR0CWaGWSlnAZdX2UKGgGaAloD0MIaeBHNawxcUCUhpRSlGgVS+loFkdAlmh4WcjJMnV9lChoBmgJaA9DCMST3cxohm9AlIaUUpRoFUvmaBZHQJZo4O9WZJF1fZQoaAZoCWgPQwjaPA6DuaFxQJSGlFKUaBVNHgFoFkdAlmmwpON5t3V9lChoBmgJaA9DCJFGBU42i3FAlIaUUpRoFU0mAWgWR0CWabm+CbtrdX2UKGgGaAloD0MIeAyP/Sz4b0CUhpRSlGgVS/JoFkdAlmpkpAlfJHV9lChoBmgJaA9DCJ0std7vfXFAlIaUUpRoFU2FAWgWR0CWbOpxWDHwdX2UKGgGaAloD0MILhoyHiVDcECUhpRSlGgVTQsBaBZHQJZtDHNorWl1fZQoaAZoCWgPQwiw/s9hPsByQJSGlFKUaBVNDgFoFkdAlm2mjKxLTXV9lChoBmgJaA9DCEEN38I63WVAlIaUUpRoFU3oA2gWR0CWbdWu5jH5dX2UKGgGaAloD0MI88zLYffscECUhpRSlGgVS/9oFkdAlm9dvjwQUnV9lChoBmgJaA9DCIS3ByEgwXJAlIaUUpRoFU0PAWgWR0CWcLKs+3YudX2UKGgGaAloD0MIO3DOiBLycUCUhpRSlGgVS9BoFkdAlnG4GhVU/HV9lChoBmgJaA9DCIBEEygijHFAlIaUUpRoFUvQaBZHQJZxyRDCxeN1fZQoaAZoCWgPQwju68A5I3xiQJSGlFKUaBVN6ANoFkdAlnHi6DoQnXV9lChoBmgJaA9DCA0a+ic4jnFAlIaUUpRoFUvfaBZHQJZytmdy1eB1fZQoaAZoCWgPQwjpuBrZldduQJSGlFKUaBVL3mgWR0CWc1rzoUzsdX2UKGgGaAloD0MIWvYksLlrckCUhpRSlGgVS+JoFkdAlnOHpbD/EXV9lChoBmgJaA9DCEljtI4qn3FAlIaUUpRoFU0HAWgWR0CWdZpNKyv+dX2UKGgGaAloD0MIOZ1kq8tuUUCUhpRSlGgVS8hoFkdAlnX3mFJxvXV9lChoBmgJaA9DCOasTzmmV3BAlIaUUpRoFUvzaBZHQJZ3QQlKK511fZQoaAZoCWgPQwih8xq7RIdOQJSGlFKUaBVL5WgWR0CWd2ldTo+wdX2UKGgGaAloD0MID7kZbsCecUCUhpRSlGgVTQwBaBZHQJZ4ORHPNV11fZQoaAZoCWgPQwiwdD48Sx5EQJSGlFKUaBVLp2gWR0CWeZZ9/jKgdX2UKGgGaAloD0MIUtZvJqYzUECUhpRSlGgVS7loFkdAlntFrl/6PHV9lChoBmgJaA9DCGMl5llJfXFAlIaUUpRoFUvzaBZHQJZ72ZtvXK91fZQoaAZoCWgPQwhYPPVIwzFwQJSGlFKUaBVL+GgWR0CWfAC0WuYAdX2UKGgGaAloD0MIETl9PR+qc0CUhpRSlGgVTRMBaBZHQJZ8O8QI2O11fZQoaAZoCWgPQwj2KFyPgvNwQJSGlFKUaBVL/mgWR0CWfGbBXS0CdX2UKGgGaAloD0MIEJTb9r3mcUCUhpRSlGgVS+VoFkdAlnzluivgWXV9lChoBmgJaA9DCBEbLJykh2VAlIaUUpRoFU0KAmgWR0CWfWSpR4yHdX2UKGgGaAloD0MINNdppKXVcUCUhpRSlGgVTVEBaBZHQJZ9dahYeT51fZQoaAZoCWgPQwhy4UBIFgZGQJSGlFKUaBVLvWgWR0CWfYUVBUrDdX2UKGgGaAloD0MIl6lJ8IYgcUCUhpRSlGgVTQABaBZHQJaAM1XNke91fZQoaAZoCWgPQwi4WicuR5FtQJSGlFKUaBVL5GgWR0CWgEkSmIj4dX2UKGgGaAloD0MIMSWS6OVDckCUhpRSlGgVS/ZoFkdAltQ/VNHpbHV9lChoBmgJaA9DCPc96q9X4EtAlIaUUpRoFUuxaBZHQJbVFUaQ3gl1fZQoaAZoCWgPQwiVfOwuEMZwQJSGlFKUaBVNBgFoFkdAltWdp7CzknV9lChoBmgJaA9DCGyTisZaEmdAlIaUUpRoFU3oA2gWR0CW1bwZwXImdX2UKGgGaAloD0MI2XiwxW79b0CUhpRSlGgVS+toFkdAltXZGFzuGHV9lChoBmgJaA9DCKa6gJfZ+HBAlIaUUpRoFUvdaBZHQJbXRAxBVuJ1fZQoaAZoCWgPQwga3qzBu41wQJSGlFKUaBVL7mgWR0CW2FUg0TDgdX2UKGgGaAloD0MImNwosla6bkCUhpRSlGgVS+RoFkdAltib/S6UaHV9lChoBmgJaA9DCMWsF0O5aHFAlIaUUpRoFUvXaBZHQJbYnFhoduJ1fZQoaAZoCWgPQwgQW3o0lVVyQJSGlFKUaBVL9WgWR0CW2LxtYSxrdX2UKGgGaAloD0MImzkktZD4cUCUhpRSlGgVS/5oFkdAltiz0QK8c3V9lChoBmgJaA9DCEtywK7mq3BAlIaUUpRoFUvqaBZHQJbZSt4iX6Z1fZQoaAZoCWgPQwhcBTHQtZluQJSGlFKUaBVNBAFoFkdAltpBAv+OwXV9lChoBmgJaA9DCJOKxtrftHFAlIaUUpRoFU3EA2gWR0CW23N5+pfhdX2UKGgGaAloD0MIEHf1KjJocUCUhpRSlGgVS/FoFkdAltxIRdyDI3V9lChoBmgJaA9DCHOh8q9lrXBAlIaUUpRoFUvRaBZHQJbcpQVKwpx1fZQoaAZoCWgPQwgBGTp2EF5wQJSGlFKUaBVL+GgWR0CW3TIiTt9hdX2UKGgGaAloD0MI/oFy2773TkCUhpRSlGgVS61oFkdAlt1TfJmuknV9lChoBmgJaA9DCMqLTMCvWHJAlIaUUpRoFU0bAWgWR0CW3Zhpxm03dX2UKGgGaAloD0MIflUuVP6Jb0CUhpRSlGgVS/doFkdAlt5S2H+IdnV9lChoBmgJaA9DCG/whcmUx3FAlIaUUpRoFUvxaBZHQJbeTsrupjt1fZQoaAZoCWgPQwjxSScSzNZyQJSGlFKUaBVNIgFoFkdAlt+0cjqv/3V9lChoBmgJaA9DCCCWzRzSg3BAlIaUUpRoFUvyaBZHQJbgWGDcuap1fZQoaAZoCWgPQwiaz7nbNdlxQJSGlFKUaBVL8mgWR0CW4JV6NVBEdX2UKGgGaAloD0MIO/w1WSNXbUCUhpRSlGgVS/RoFkdAluC1cdHUdHV9lChoBmgJaA9DCA7Xag/7P3FAlIaUUpRoFU0EAWgWR0CW4R71ZkkKdX2UKGgGaAloD0MIZVBtcGJ4cUCUhpRSlGgVS/NoFkdAluE6fzz3AXV9lChoBmgJaA9DCHmVtU2xPHJAlIaUUpRoFU0EAWgWR0CW4TocaOxTdX2UKGgGaAloD0MIFVYqqKjbckCUhpRSlGgVS/loFkdAluIsmShaknV9lChoBmgJaA9DCIf7yK1J4z5AlIaUUpRoFUvJaBZHQJbjfcVQAMl1fZQoaAZoCWgPQwhIwr6dxNVwQJSGlFKUaBVL6mgWR0CW496j3225dX2UKGgGaAloD0MIuVD513KSckCUhpRSlGgVS99oFkdAluQW/8EV33V9lChoBmgJaA9DCKGhf4ILFnFAlIaUUpRoFU0OAWgWR0CW5K5UcXFcdX2UKGgGaAloD0MIQ+OJIA7vckCUhpRSlGgVS+toFkdAluTWucMEzXV9lChoBmgJaA9DCCgK9In8BHBAlIaUUpRoFUvraBZHQJbljY4ACGN1fZQoaAZoCWgPQwgBUTBjCh5wQJSGlFKUaBVNBgFoFkdAluZ0qx1PnHV9lChoBmgJaA9DCKosCrsomlJAlIaUUpRoFUvYaBZHQJbnGPq9oOB1fZQoaAZoCWgPQwheK6G7JOdvQJSGlFKUaBVL9GgWR0CW52mEXcgydX2UKGgGaAloD0MIHaopybpPbkCUhpRSlGgVS+NoFkdAlue5aJQ+EHV9lChoBmgJaA9DCEdX6e56v3FAlIaUUpRoFUvgaBZHQJboORFI/aB1fZQoaAZoCWgPQwgoRpbMMeRsQJSGlFKUaBVL7GgWR0CW6CwYLsrvdX2UKGgGaAloD0MI6dfWT3/ZcECUhpRSlGgVS+BoFkdAluhTdtVJc3V9lChoBmgJaA9DCCWTUzsDXXJAlIaUUpRoFUvxaBZHQJboy6kIomZ1ZS4="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 490, "n_steps": 645, "gamma": 0.997, "gae_lambda": 0.97, "ent_coef": 0.01, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 32, "n_epochs": 10, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWVvwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwNX2J1aWx0aW5fdHlwZZSTlIwKTGFtYmRhVHlwZZSFlFKUKGgCjAhDb2RlVHlwZZSFlFKUKEsBSwBLAUsBSxNDBIgAUwCUToWUKYwBX5SFlIxIL3Vzci9sb2NhbC9saWIvcHl0aG9uMy43L2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5RLgEMCAAGUjAN2YWyUhZQpdJRSlH2UKIwLX19wYWNrYWdlX1+UjBhzdGFibGVfYmFzZWxpbmVzMy5jb21tb26UjAhfX25hbWVfX5SMHnN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi51dGlsc5SMCF9fZmlsZV9flIxIL3Vzci9sb2NhbC9saWIvcHl0aG9uMy43L2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaCB9lH2UKGgXaA6MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgYjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz/JmZmZmZmahZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "system_info": {"OS": "Linux-5.4.188+-x86_64-with-Ubuntu-18.04-bionic #1 SMP Sun Apr 24 10:03:06 PDT 2022", "Python": "3.7.13", "Stable-Baselines3": "1.5.0", "PyTorch": "1.11.0+cu113", "GPU Enabled": "True", "Numpy": "1.21.6", "Gym": "0.21.0"}}
 
1
+ {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param sde_net_arch: Network architecture for extracting features\n when using gSDE. If None, the latent features from the policy will be used.\n Pass an empty list to use the states as features.\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7f06d9ef5170>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f06d9ef5200>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f06d9ef5290>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f06d9ef5320>", "_build": "<function ActorCriticPolicy._build at 0x7f06d9ef53b0>", "forward": "<function ActorCriticPolicy.forward at 0x7f06d9ef5440>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f06d9ef54d0>", "_predict": "<function ActorCriticPolicy._predict at 0x7f06d9ef5560>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f06d9ef55f0>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f06d9ef5680>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f06d9ef5710>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc_data object at 0x7f06d9f37ab0>"}, "verbose": 1, "policy_kwargs": {}, "observation_space": {":type:": "<class 'gym.spaces.box.Box'>", ":serialized:": "gAWVnwEAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLCIWUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWIAAAAAAAAAAAAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/5RoCksIhZSMAUOUdJRSlIwEaGlnaJRoEiiWIAAAAAAAAAAAAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAf5RoCksIhZRoFXSUUpSMDWJvdW5kZWRfYmVsb3eUaBIolggAAAAAAAAAAAAAAAAAAACUaAeMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLCIWUaBV0lFKUjA1ib3VuZGVkX2Fib3ZllGgSKJYIAAAAAAAAAAAAAAAAAAAAlGghSwiFlGgVdJRSlIwKX25wX3JhbmRvbZROdWIu", "dtype": "float32", "_shape": [8], "low": "[-inf -inf -inf -inf -inf -inf -inf -inf]", "high": "[inf inf inf inf inf inf inf inf]", "bounded_below": "[False False False False False False False False]", "bounded_above": "[False False False False False False False False]", "_np_random": null}, "action_space": {":type:": "<class 'gym.spaces.discrete.Discrete'>", ":serialized:": "gAWVggAAAAAAAACME2d5bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpRLBIwGX3NoYXBllCmMBWR0eXBllIwFbnVtcHmUaAeTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYowKX25wX3JhbmRvbZROdWIu", "n": 4, "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 16, "num_timesteps": 512000, "_total_timesteps": 500000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1652273847.1759872, "learning_rate": 0.0003, "tensorboard_log": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVvwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwNX2J1aWx0aW5fdHlwZZSTlIwKTGFtYmRhVHlwZZSFlFKUKGgCjAhDb2RlVHlwZZSFlFKUKEsBSwBLAUsBSxNDBIgAUwCUToWUKYwBX5SFlIxIL3Vzci9sb2NhbC9saWIvcHl0aG9uMy43L2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5RLgEMCAAGUjAN2YWyUhZQpdJRSlH2UKIwLX19wYWNrYWdlX1+UjBhzdGFibGVfYmFzZWxpbmVzMy5jb21tb26UjAhfX25hbWVfX5SMHnN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi51dGlsc5SMCF9fZmlsZV9flIxIL3Vzci9sb2NhbC9saWIvcHl0aG9uMy43L2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaCB9lH2UKGgXaA6MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgYjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz8zqSowVTJhhZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAADOEQb2B2OU96WMQPrUcjL55wNw8tizxvAAAAAAAAAAAZjY8O+X9VT59cOU74iheviu2iTw2Wgq8AAAAAAAAAAAzom49KVAPulpRkDqtHZo1uiNBOiRDpLkAAIA/AACAP81oKrykk2084ckLPisiNr44D8k9zbwzvQAAAAAAAAAA8/v2PXu2v7rucdI5pES/tiaNNbzza/24AACAPwAAgD+mZ6E9KZh1ujBUhzWHiaYwGftbO06OubQAAIA/AACAP2YWETt7soq6ohmnuxEIQDUE5Ya4nkLAOgAAgD8AAIA/M2eyPOz0pT5vvBa9QpukvptpzTsTY1k8AAAAAAAAAAAz1hQ9e26zul7FCTqEZ4a1pan8uVwxHbkAAIA/AACAPzO4uDxceyG6ZklHuxwvD7bgcQw6ncBoOgAAgD8AAIA/M+eyPVxbULqLope7auX2OYqJvjpOsIy6AACAPwAAgD+aFlY9XOtxuqcBtTpeRi02lB9DOl3nz7kAAIA/AACAPxPMXr7E57g+t8A/PiSKlb5ibQ6+lt1KPQAAAAAAAAAATVmKPVIQqbm4InK5kTvRtPJrYzvulpA4AACAPwAAgD/awdU95JJlP2hQDTzDzfC+1FgzPh5ZCLsAAAAAAAAAAAClJT1sKve7D1gEPI1vKzyJhF29DL4UPQAAgD8AAIA/lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.02400000000000002, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVeBAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMI4pANpIvAZUCUhpRSlIwBbJRN6AOMAXSUR0Cj8UsMZxaQdX2UKGgGaAloD0MI0qsBSsMlZ0CUhpRSlGgVTegDaBZHQKPymowVTJh1fZQoaAZoCWgPQwgZj1IJzzxvQJSGlFKUaBVNzQJoFkdAo/Raf4AS4HV9lChoBmgJaA9DCDgvTnw11WhAlIaUUpRoFU3oA2gWR0Cj9cxcmjTKdX2UKGgGaAloD0MIaB8r+G3oZECUhpRSlGgVTegDaBZHQKP2XvOQhfV1fZQoaAZoCWgPQwhnSBXFK/JyQJSGlFKUaBVNIwFoFkdAo/bpKraM73V9lChoBmgJaA9DCM+8HHbfFWVAlIaUUpRoFU3oA2gWR0Cj+BgVXV9XdX2UKGgGaAloD0MIHeVgNgFrZkCUhpRSlGgVTegDaBZHQKP4gPlMh5h1fZQoaAZoCWgPQwhOfSB558VVQJSGlFKUaBVLm2gWR0Cj+cI5ggHNdX2UKGgGaAloD0MIlE4kmOrsY0CUhpRSlGgVTegDaBZHQKP6g+otL+R1fZQoaAZoCWgPQwhK7xtfe3xvQJSGlFKUaBVNgwFoFkdAo/uE4tHx0HV9lChoBmgJaA9DCD4JbM5BwHBAlIaUUpRoFU2PA2gWR0Cj/LPHtF8YdX2UKGgGaAloD0MIA0AVNy5DcUCUhpRSlGgVTWkCaBZHQKP87nBciW51fZQoaAZoCWgPQwi3Yn/ZPQdkQJSGlFKUaBVN6ANoFkdApAETWAf+0nV9lChoBmgJaA9DCK358ZcWIW1AlIaUUpRoFU31AWgWR0CkAbE/8l5XdX2UKGgGaAloD0MIhSaJJWVZcECUhpRSlGgVTZUBaBZHQKQDbS0jTrp1fZQoaAZoCWgPQwgCg6RPK7NsQJSGlFKUaBVNVwNoFkdApATbb+Lm63V9lChoBmgJaA9DCJp8s80N/GNAlIaUUpRoFU3oA2gWR0CkBVykCV8kdX2UKGgGaAloD0MIOPdXj3uhZ0CUhpRSlGgVTegDaBZHQKQFjyeZof11fZQoaAZoCWgPQwhaSSu+oQtkQJSGlFKUaBVN6ANoFkdApIP5zJZGKHV9lChoBmgJaA9DCOvkDMWdHXBAlIaUUpRoFU2XA2gWR0CkiKtz8xbjdX2UKGgGaAloD0MIDrxa7ozAcECUhpRSlGgVTQYDaBZHQKSJCjCYTkB1fZQoaAZoCWgPQwjQmbSpunZyQJSGlFKUaBVN4gFoFkdApI7I6IWP93V9lChoBmgJaA9DCPtz0ZDxMWFAlIaUUpRoFU3oA2gWR0Ckj772L5ymdX2UKGgGaAloD0MITMecZ2yEaECUhpRSlGgVTegDaBZHQKSR+XHim2t1fZQoaAZoCWgPQwie0VYlEVtiQJSGlFKUaBVN6ANoFkdApJQPy08eS3V9lChoBmgJaA9DCI22KoksdnJAlIaUUpRoFU1oAmgWR0CklLkFnqVydX2UKGgGaAloD0MIhjlBmxw6RECUhpRSlGgVS59oFkdApJTYNkOI7HV9lChoBmgJaA9DCNXrFoGxAmlAlIaUUpRoFU3oA2gWR0CklPawdKdydX2UKGgGaAloD0MIvhb03hjDcECUhpRSlGgVTaIBaBZHQKSWA2jO9nN1fZQoaAZoCWgPQwiNCTGX1DhjQJSGlFKUaBVN6ANoFkdApJYK55JK8XV9lChoBmgJaA9DCFluaTWk12NAlIaUUpRoFU3oA2gWR0CklygB91EFdX2UKGgGaAloD0MIpOTVOQaOZUCUhpRSlGgVTegDaBZHQKSXYfSx7iR1fZQoaAZoCWgPQwiUFi6rsElDQJSGlFKUaBVLimgWR0CkmEnYg7o0dX2UKGgGaAloD0MIO6kvS7tCZECUhpRSlGgVTegDaBZHQKUZLfWtlqd1fZQoaAZoCWgPQwgw16IFaPpnQJSGlFKUaBVN6ANoFkdApRnBfdAPd3V9lChoBmgJaA9DCJI+raJ/NnNAlIaUUpRoFU0kAWgWR0ClG52IoE0SdX2UKGgGaAloD0MIUoAomLH5Y0CUhpRSlGgVTegDaBZHQKUdbltj0+V1fZQoaAZoCWgPQwhXem02Vg1gQJSGlFKUaBVN6ANoFkdApR2fiT+vQnV9lChoBmgJaA9DCOdQhqqYpWRAlIaUUpRoFU3oA2gWR0ClH4A/s3Q2dX2UKGgGaAloD0MISQ7Y1WRSZkCUhpRSlGgVTegDaBZHQKUkMeZG8VZ1fZQoaAZoCWgPQwg9SE+RA4RxQJSGlFKUaBVNgQJoFkdApSidZDArQXV9lChoBmgJaA9DCEkrvqFwUGVAlIaUUpRoFU3oA2gWR0ClKadZA6dUdX2UKGgGaAloD0MI/G1PkFiYYkCUhpRSlGgVTegDaBZHQKUsii8nNPh1fZQoaAZoCWgPQwibN04KcyBhQJSGlFKUaBVN6ANoFkdApS5/UnXumnV9lChoBmgJaA9DCGvXhLRGqWVAlIaUUpRoFU3oA2gWR0ClLySAxzq9dX2UKGgGaAloD0MIkElGzkKDZUCUhpRSlGgVTegDaBZHQKUvXtw71Zl1fZQoaAZoCWgPQwhi9rLtNONkQJSGlFKUaBVN6ANoFkdApTBr28IzFnV9lChoBmgJaA9DCEEN38K6ZXFAlIaUUpRoFU2lAmgWR0ClrXa6z3RHdX2UKGgGaAloD0MIcOtunupJZkCUhpRSlGgVTegDaBZHQKWt3dZ7ojh1fZQoaAZoCWgPQwg3+pgPCIhlQJSGlFKUaBVN6ANoFkdApa4fSpiqhnV9lChoBmgJaA9DCMfXnlnSl3FAlIaUUpRoFU0PA2gWR0ClrpoB7u2JdX2UKGgGaAloD0MICMkCJvDpaECUhpRSlGgVTegDaBZHQKWyLOqNp/R1fZQoaAZoCWgPQwjdtYR8UMppQJSGlFKUaBVN6ANoFkdApbLPJ7sv7HV9lChoBmgJaA9DCEt1AS/z8nBAlIaUUpRoFU1ZAWgWR0CltVI7/4qPdX2UKGgGaAloD0MIkGYsmo6acUCUhpRSlGgVTTQBaBZHQKW2bHww0wd1fZQoaAZoCWgPQwiXdJSDWT5jQJSGlFKUaBVN6ANoFkdApbchwhnrZHV9lChoBmgJaA9DCC4dc54xD2VAlIaUUpRoFU3oA2gWR0CluTzYVZcLdX2UKGgGaAloD0MI11HVBFHiZUCUhpRSlGgVTegDaBZHQKW+YBpYcNp1fZQoaAZoCWgPQwgdAdwsnpRyQJSGlFKUaBVNXgFoFkdApcJi8an753V9lChoBmgJaA9DCHjuPVzyL2ZAlIaUUpRoFU3oA2gWR0ClwzcAzYVZdX2UKGgGaAloD0MIixagbTW8Z0CUhpRSlGgVTegDaBZHQKXEQ1eBxxV1fZQoaAZoCWgPQwiKA+j3/W1NQJSGlFKUaBVLsmgWR0ClxFOkUKzBdX2UKGgGaAloD0MILVvri4RrZECUhpRSlGgVTegDaBZHQKZFE+2VmjF1fZQoaAZoCWgPQwjdRZiiXDxiQJSGlFKUaBVN6ANoFkdApkcdPYWcjXV9lChoBmgJaA9DCHxgx3+Bs2VAlIaUUpRoFU3oA2gWR0CmR8XcYZVGdX2UKGgGaAloD0MIf4eiQB+vY0CUhpRSlGgVTegDaBZHQKZJLA6+36R1fZQoaAZoCWgPQwhGzy10pRZhQJSGlFKUaBVN6ANoFkdApkqsIiTt9nV9lChoBmgJaA9DCINStHKvRWlAlIaUUpRoFU3oA2gWR0CmSvUaqCHzdX2UKGgGaAloD0MINIEiFjHOZECUhpRSlGgVTegDaBZHQKZLir1/UfB1fZQoaAZoCWgPQwiYUSy3tMhKQJSGlFKUaBVLtWgWR0CmTVWNm16WdX2UKGgGaAloD0MI9x4uOe7CZUCUhpRSlGgVTegDaBZHQKZPjvKlpGp1fZQoaAZoCWgPQwgogGJkSR5hQJSGlFKUaBVN6ANoFkdAplA6OzY29HV9lChoBmgJaA9DCPKaV3VWwGNAlIaUUpRoFU3oA2gWR0CmUp5u63AmdX2UKGgGaAloD0MIgT/8/PeGTECUhpRSlGgVS7FoFkdAplLF6LOzIHV9lChoBmgJaA9DCPPK9baZKGNAlIaUUpRoFU3oA2gWR0CmU6I6r/83dX2UKGgGaAloD0MIzSIUW0H7YECUhpRSlGgVTegDaBZHQKZWSs90Rvp1fZQoaAZoCWgPQwhTzaylgOhMQJSGlFKUaBVLyGgWR0CmWNAvtdAxdX2UKGgGaAloD0MImNwoslY+YUCUhpRSlGgVTegDaBZHQKbbU7J4jbB1fZQoaAZoCWgPQwirIAa6dglmQJSGlFKUaBVN6ANoFkdAptwjv9cbBHV9lChoBmgJaA9DCHiZYaPs5XBAlIaUUpRoFU0+A2gWR0Cm3P0AtFrmdX2UKGgGaAloD0MIlgfpKbKxcECUhpRSlGgVTVABaBZHQKbdILBsQ/Z1fZQoaAZoCWgPQwgN3lflwoViQJSGlFKUaBVN6ANoFkdApt07VrhzeXV9lChoBmgJaA9DCAPpYtPKoGBAlIaUUpRoFU3oA2gWR0Cm3Uov8IiUdX2UKGgGaAloD0MIisqGNZU0bUCUhpRSlGgVTSYBaBZHQKbeIhje9Bd1fZQoaAZoCWgPQwgbutkfKPtuQJSGlFKUaBVNeQJoFkdApt9+KXOW0XV9lChoBmgJaA9DCLKbGf1oz2RAlIaUUpRoFU3oA2gWR0Cm36itA9mpdX2UKGgGaAloD0MI6E8b1WltaECUhpRSlGgVTegDaBZHQKbi4IO6NER1fZQoaAZoCWgPQwiZnxuaMnNjQJSGlFKUaBVN6ANoFkdApuQwbEP1+XV9lChoBmgJaA9DCP9YiA6BM19AlIaUUpRoFU3oA2gWR0Cm5HBMSK3vdX2UKGgGaAloD0MI8ppXdVaFZkCUhpRSlGgVTegDaBZHQKbk8JRfnfV1fZQoaAZoCWgPQwiM17yqsxdSQJSGlFKUaBVL22gWR0Cm5TOpbUw0dX2UKGgGaAloD0MIX7Uy4dfWcUCUhpRSlGgVTa4BaBZHQKbmrtUn5SF1fZQoaAZoCWgPQwj5oGezqjZwQJSGlFKUaBVNTgFoFkdApugOxdIGyHV9lChoBmgJaA9DCMoxWdz/425AlIaUUpRoFU2EAWgWR0Cm6A2uPmxMdX2UKGgGaAloD0MIujDSi9p0Y0CUhpRSlGgVTegDaBZHQKboWEIw/Ph1fZQoaAZoCWgPQwjuJvim6eJvQJSGlFKUaBVN3AFoFkdApulPDR+jM3V9lChoBmgJaA9DCCGunL0z+k1AlIaUUpRoFUvIaBZHQKbqKcy31Bd1fZQoaAZoCWgPQwhszOuIQ0hjQJSGlFKUaBVN6ANoFkdApuqis8xKx3V9lChoBmgJaA9DCH3mrE+5q2JAlIaUUpRoFU3oA2gWR0Cm62j9GZuydWUu"}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 400, "n_steps": 800, "gamma": 0.997, "gae_lambda": 0.98, "ent_coef": 0.01, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 16, "n_epochs": 10, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWVvwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwNX2J1aWx0aW5fdHlwZZSTlIwKTGFtYmRhVHlwZZSFlFKUKGgCjAhDb2RlVHlwZZSFlFKUKEsBSwBLAUsBSxNDBIgAUwCUToWUKYwBX5SFlIxIL3Vzci9sb2NhbC9saWIvcHl0aG9uMy43L2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5RLgEMCAAGUjAN2YWyUhZQpdJRSlH2UKIwLX19wYWNrYWdlX1+UjBhzdGFibGVfYmFzZWxpbmVzMy5jb21tb26UjAhfX25hbWVfX5SMHnN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi51dGlsc5SMCF9fZmlsZV9flIxIL3Vzci9sb2NhbC9saWIvcHl0aG9uMy43L2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaCB9lH2UKGgXaA6MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgYjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz/JmZmZmZmahZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "system_info": {"OS": "Linux-5.4.188+-x86_64-with-Ubuntu-18.04-bionic #1 SMP Sun Apr 24 10:03:06 PDT 2022", "Python": "3.7.13", "Stable-Baselines3": "1.5.0", "PyTorch": "1.11.0+cu113", "GPU Enabled": "True", "Numpy": "1.21.6", "Gym": "0.21.0"}}
replay.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:279268ed4d1a2570fe3db82ea025bba5b81c8146fffae3921e0603b907334ece
3
- size 222742
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a3a9d04968ca0f2ec48e3d6de65acc180de2f446b339e9581e797402ff179c65
3
+ size 190772
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 287.76183821119196, "std_reward": 13.715414452661392, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2022-05-11T12:17:15.566817"}
 
1
+ {"mean_reward": 244.28345422378342, "std_reward": 67.94121959847473, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2022-05-11T13:47:41.841509"}