misza222 commited on
Commit
9b3360f
1 Parent(s): b966f95

Second RL model

Browse files
LunarLander_v2-PPO.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9eae3a4fffbf92d4a9064d3ebeb7b0a3458decc27343c4fce82fb8c05251bd47
3
- size 147280
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b0bbb05cea8d9754bf030c0037a19eab4e97f2e6bc099315e042b7547c1d672c
3
+ size 146699
LunarLander_v2-PPO/data CHANGED
@@ -4,19 +4,19 @@
4
  ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
5
  "__module__": "stable_baselines3.common.policies",
6
  "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param sde_net_arch: Network architecture for extracting features\n when using gSDE. If None, the latent features from the policy will be used.\n Pass an empty list to use the states as features.\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
7
- "__init__": "<function ActorCriticPolicy.__init__ at 0x7f564bfdb310>",
8
- "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f564bfdb3a0>",
9
- "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f564bfdb430>",
10
- "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f564bfdb4c0>",
11
- "_build": "<function ActorCriticPolicy._build at 0x7f564bfdb550>",
12
- "forward": "<function ActorCriticPolicy.forward at 0x7f564bfdb5e0>",
13
- "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f564bfdb670>",
14
- "_predict": "<function ActorCriticPolicy._predict at 0x7f564bfdb700>",
15
- "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f564bfdb790>",
16
- "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f564bfdb820>",
17
- "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f564bfdb8b0>",
18
  "__abstractmethods__": "frozenset()",
19
- "_abc_impl": "<_abc_data object at 0x7f564bfd3ae0>"
20
  },
21
  "verbose": 1,
22
  "policy_kwargs": {},
@@ -47,7 +47,7 @@
47
  "_num_timesteps_at_start": 0,
48
  "seed": null,
49
  "action_noise": null,
50
- "start_time": 1670353699724315896,
51
  "learning_rate": 0.0003,
52
  "tensorboard_log": null,
53
  "lr_schedule": {
@@ -56,7 +56,7 @@
56
  },
57
  "_last_obs": {
58
  ":type:": "<class 'numpy.ndarray'>",
59
- ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAIBx0L1cjxy69eJcu1S8lTgPi2i7deXtOQAAgD8AAIA/AJGVvUzZ7j5H2ri9vPRJvllHzL3Vxtg7AAAAAAAAAADNFye9nSZOPx6Gkj3OJom++IQBPJ30xDwAAAAAAAAAAM0euzxXAX8/k3zvPXYAi743HCW6K5VPvQAAAAAAAAAAGoQVPWRqRj4SpvI9LbQHvvvUJz29Wvy8AAAAAAAAAADArBy+pHx+PHzaQTtL+cC5q3kKvqM+8jkAAIA/AACAP5phBzyvSWM9NjSGvXRcU77UKNq8C7ZvvQAAAAAAAAAAgGlVPewBl7mj64S7fHU4N2znDLsbkHY6AACAPwAAgD+alTg9UkDNuT5bibtvIgs1yVFiulENnjoAAIA/AACAP2ayojv+1dk9yEzfPbfEO766bmY9tgUTvgAAAAAAAAAAAGq9vY+uZLq+vFI7nXIENtebxLi9OPE0AACAPwAAgD8N3oc9exyQutboFTzf6Y82EKsOu2RThjUAAIA/AACAP1PEI77PSAy8K07huwYECLpm6mA9QtTeOgAAgD8AAIA/U6wpvpR3i7xW4jK8Jra7ukbj8D0uvJ47AACAPwAAgD+m98+9KbgHumaa/DiaCXGxTvBDOvprE7gAAIA/AACAP+bLv732NCO6IO4gupwIjbVt02w5GMk9OQAAgD8AAIA/lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="
60
  },
61
  "_last_episode_starts": {
62
  ":type:": "<class 'numpy.ndarray'>",
@@ -69,21 +69,21 @@
69
  "_current_progress_remaining": -0.015808000000000044,
70
  "ep_info_buffer": {
71
  ":type:": "<class 'collections.deque'>",
72
- ":serialized:": "gAWVfRAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIkiOdgRFAYECUhpRSlIwBbJRN6AOMAXSUR0ChdhbF85S4dX2UKGgGaAloD0MIVb/S+fCnY0CUhpRSlGgVTegDaBZHQKF2jp7kXDZ1fZQoaAZoCWgPQwi3f2WlSYxdQJSGlFKUaBVN6ANoFkdAoXjWEGqxT3V9lChoBmgJaA9DCHNIaqHk8WVAlIaUUpRoFU3oA2gWR0ChfajxkNF0dX2UKGgGaAloD0MIJvvnacB4X0CUhpRSlGgVTegDaBZHQKF+WOMERrd1fZQoaAZoCWgPQwhXPzbJj4RiQJSGlFKUaBVN6ANoFkdAoX8ALb5/LHV9lChoBmgJaA9DCLtgcM0dT2RAlIaUUpRoFU3oA2gWR0ChgoiqhlDndX2UKGgGaAloD0MImPijqDOoWUCUhpRSlGgVTegDaBZHQKGCyAq/dqN1fZQoaAZoCWgPQwgb17/rs0ViQJSGlFKUaBVN6ANoFkdAoYWaFZgXuXV9lChoBmgJaA9DCAcLJ2n+ClxAlIaUUpRoFU3oA2gWR0ChieGZE2HddX2UKGgGaAloD0MIyTmxh/aCWECUhpRSlGgVTegDaBZHQKGJ6C2c8T11fZQoaAZoCWgPQwjXMEPjCSJjQJSGlFKUaBVN6ANoFkdAoY9csrd30XV9lChoBmgJaA9DCAYTfxR1OFxAlIaUUpRoFU3oA2gWR0ChkCujIq9XdX2UKGgGaAloD0MIvAfovhyeYECUhpRSlGgVTegDaBZHQKGWo6dUbUB1fZQoaAZoCWgPQwhQ4QhSKSJiQJSGlFKUaBVN6ANoFkdAoZgLdtVJc3V9lChoBmgJaA9DCOV620yFjlhAlIaUUpRoFU3oA2gWR0ChmblSsKb8dX2UKGgGaAloD0MI1eqrq4I4YUCUhpRSlGgVTegDaBZHQKGZvKbrkbR1fZQoaAZoCWgPQwiL/zuiQjhcQJSGlFKUaBVN6ANoFkdAoZo8X7+DOHV9lChoBmgJaA9DCDkroib6uEFAlIaUUpRoFU1YAWgWR0ChnCOm78NydX2UKGgGaAloD0MIoiWPp+XlYECUhpRSlGgVTegDaBZHQKGciAFPi1l1fZQoaAZoCWgPQwjnN0w0SI5gQJSGlFKUaBVN6ANoFkdAoaFCP0Zm7XV9lChoBmgJaA9DCBe86CtIQFpAlIaUUpRoFU3oA2gWR0ChofIMjNY9dX2UKGgGaAloD0MIsacd/pqyYUCUhpRSlGgVTegDaBZHQKGinJhfBvd1fZQoaAZoCWgPQwi+afrsgIJWQJSGlFKUaBVN6ANoFkdAoaYjzXjEN3V9lChoBmgJaA9DCMCUgQNa5llAlIaUUpRoFU3oA2gWR0ChpmKSxJNCdX2UKGgGaAloD0MI0GT/PA0cYECUhpRSlGgVTegDaBZHQKGoThybQTp1fZQoaAZoCWgPQwh+NnLdlG4/QJSGlFKUaBVNGgFoFkdAoat+gL7XQXV9lChoBmgJaA9DCDSitDd4RGBAlIaUUpRoFU3oA2gWR0ChrY/47A+IdX2UKGgGaAloD0MIayxhbQywYkCUhpRSlGgVTegDaBZHQKGtltaY/ml1fZQoaAZoCWgPQwjz6EZYVJtfQJSGlFKUaBVN6ANoFkdAobOOnGbTdHV9lChoBmgJaA9DCNe+gF64LFpAlIaUUpRoFU3oA2gWR0ChueNx+8XfdX2UKGgGaAloD0MIdJXurrMeYkCUhpRSlGgVTegDaBZHQKG7Q0HhS+B1fZQoaAZoCWgPQwggmQ6dnm8vQJSGlFKUaBVL32gWR0Chu/fQKKHgdX2UKGgGaAloD0MIieyDLAscXUCUhpRSlGgVTegDaBZHQKG85ukUKzB1fZQoaAZoCWgPQwgKhnMNM4pdQJSGlFKUaBVN6ANoFkdAobzpY1YQrnV9lChoBmgJaA9DCBO1NLdC+l5AlIaUUpRoFU3oA2gWR0ChvVxzijtYdX2UKGgGaAloD0MIKT+p9unLXUCUhpRSlGgVTegDaBZHQKG/LXsgMc91fZQoaAZoCWgPQwgV/3dEhbRgQJSGlFKUaBVN6ANoFkdAob+MwSJ0n3V9lChoBmgJaA9DCBr4UQ37dFlAlIaUUpRoFU3oA2gWR0ChxM1UMoc8dX2UKGgGaAloD0MIVWr2QCuIWECUhpRSlGgVTegDaBZHQKHFcIJJGvx1fZQoaAZoCWgPQwiMuWsJ+QFZQJSGlFKUaBVN6ANoFkdAockY2ycCo3V9lChoBmgJaA9DCE9bI4Jx7FZAlIaUUpRoFU3oA2gWR0ChyVWTPjXGdX2UKGgGaAloD0MIQ61p3vG2YUCUhpRSlGgVTegDaBZHQKHLVnnuAqd1fZQoaAZoCWgPQwiQ14NJcZRiQJSGlFKUaBVN6ANoFkdAoc6afOD8L3V9lChoBmgJaA9DCNXnaiv2G2FAlIaUUpRoFU3oA2gWR0Ch0I6uOjqOdX2UKGgGaAloD0MIiPVGrTCAYECUhpRSlGgVTegDaBZHQKHQlU83dbh1fZQoaAZoCWgPQwhATpgwmi09QJSGlFKUaBVNPgFoFkdAod4M9yLhrHV9lChoBmgJaA9DCAq/1M+ba2BAlIaUUpRoFU3oA2gWR0Ch34OdXko4dX2UKGgGaAloD0MI+Z0mM94UYkCUhpRSlGgVTegDaBZHQKHg+0tRNyp1fZQoaAZoCWgPQwhgOq3boP5hQJSGlFKUaBVN6ANoFkdAoeG6mbb1y3V9lChoBmgJaA9DCILK+PcZBF5AlIaUUpRoFU3oA2gWR0Ch4qta6jFidX2UKGgGaAloD0MIyM7b2Oy1ZECUhpRSlGgVTegDaBZHQKHirTaTOgR1fZQoaAZoCWgPQwg4nzpWqe1iQJSGlFKUaBVN6ANoFkdAoeMkAR02cnV9lChoBmgJaA9DCKZG6GfqN2BAlIaUUpRoFU3oA2gWR0Ch5RxRdhRZdX2UKGgGaAloD0MIPIcyVMUDXkCUhpRSlGgVTegDaBZHQKHlemUGFBZ1fZQoaAZoCWgPQwj7k/jcCZFcQJSGlFKUaBVN6ANoFkdAoepdsrNGE3V9lChoBmgJaA9DCMCWV663iWJAlIaUUpRoFU3oA2gWR0Ch6wdcbBGhdX2UKGgGaAloD0MIYFs//Wd1XkCUhpRSlGgVTegDaBZHQKHusbdadMF1fZQoaAZoCWgPQwjgaMcNvxsXQJSGlFKUaBVNNwFoFkdAoe7nuTibUnV9lChoBmgJaA9DCHOfHAWIrF1AlIaUUpRoFU3oA2gWR0Ch7vNNrTH9dX2UKGgGaAloD0MIKbLWUGqRWkCUhpRSlGgVTegDaBZHQKHw2FbmlqJ1fZQoaAZoCWgPQwjWG7XC9GteQJSGlFKUaBVN6ANoFkdAofQOJN0vG3V9lChoBmgJaA9DCKg5eZEJkmFAlIaUUpRoFU3oA2gWR0Ch9iShakhzdX2UKGgGaAloD0MIxciSOZYbOECUhpRSlGgVS/FoFkdAoffgG6f8M3V9lChoBmgJaA9DCHdpw2FpYGJAlIaUUpRoFU3oA2gWR0CiAiSk9ECvdX2UKGgGaAloD0MImWGjrN9tW0CUhpRSlGgVTegDaBZHQKIDNUqhDgJ1fZQoaAZoCWgPQwixMEROXxBYQJSGlFKUaBVN6ANoFkdAogSW/zreInV9lChoBmgJaA9DCHZu2ozTWlxAlIaUUpRoFU3oA2gWR0CiBUw7DEWJdX2UKGgGaAloD0MIC19f61K2X0CUhpRSlGgVTegDaBZHQKIGKJvYODt1fZQoaAZoCWgPQwjghhiveZtgQJSGlFKUaBVN6ANoFkdAogYqURnOB3V9lChoBmgJaA9DCFtAaD18CGFAlIaUUpRoFU3oA2gWR0CiBpTuF6AwdX2UKGgGaAloD0MIxhft8UKNX0CUhpRSlGgVTegDaBZHQKIItnFo+Oh1fZQoaAZoCWgPQwhXQQx07T1eQJSGlFKUaBVN6ANoFkdAog23d69kBnV9lChoBmgJaA9DCDV8C+vG6VpAlIaUUpRoFU3oA2gWR0CiDl6lDWsjdX2UKGgGaAloD0MINzXQfE40YECUhpRSlGgVTegDaBZHQKISMDK5kLB1fZQoaAZoCWgPQwi+UMB2MMhiQJSGlFKUaBVN6ANoFkdAohJnsw+MZXV9lChoBmgJaA9DCFga+FGNyGFAlIaUUpRoFU3oA2gWR0CiFHxmseXBdX2UKGgGaAloD0MIUMjO21iBY0CUhpRSlGgVTegDaBZHQKIW4uLaVUx1fZQoaAZoCWgPQwiwxW6f1fthQJSGlFKUaBVN6ANoFkdAohoHxe9i+nV9lChoBmgJaA9DCLtFYKxvulxAlIaUUpRoFU3oA2gWR0CiG/RCY1HfdX2UKGgGaAloD0MI/kgRGVZxLECUhpRSlGgVTVoBaBZHQKIfdVmSQo11fZQoaAZoCWgPQwiwIM1YNNk1QJSGlFKUaBVL4WgWR0CiH/LncL0BdX2UKGgGaAloD0MIMxmO5zPiYUCUhpRSlGgVTegDaBZHQKImAOJcgQp1fZQoaAZoCWgPQwhCYOXQIhdbQJSGlFKUaBVN6ANoFkdAoicMWZZ0S3V9lChoBmgJaA9DCBSUopX7RW9AlIaUUpRoFU1ZAWgWR0CiJxXY+Sr6dX2UKGgGaAloD0MInWUWodhKHUCUhpRSlGgVTSYBaBZHQKInGo5PuXx1fZQoaAZoCWgPQwiHNZVFYZpgQJSGlFKUaBVN6ANoFkdAoihfsRg7YHV9lChoBmgJaA9DCI/7VuvEaF5AlIaUUpRoFU3oA2gWR0CiKQetSydGdX2UKGgGaAloD0MIr+sX7AbHYECUhpRSlGgVTegDaBZHQKIp3y5I6Kd1fZQoaAZoCWgPQwh7vfvjvelWQJSGlFKUaBVN6ANoFkdAoinh+SbH63V9lChoBmgJaA9DCJI81/fhQALAlIaUUpRoFU0HAWgWR0CiKen9ehPCdX2UKGgGaAloD0MIbarukc1cYUCUhpRSlGgVTegDaBZHQKIqQW8h9st1fZQoaAZoCWgPQwhQjgJEwYRfQJSGlFKUaBVN6ANoFkdAoiwH9m6GxnV9lChoBmgJaA9DCKJjB5W4viXAlIaUUpRoFUvPaBZHQKItFZpSJj51fZQoaAZoCWgPQwgpd5/jozUwQJSGlFKUaBVNHAFoFkdAojBiuB+WnnV9lChoBmgJaA9DCA/QfTkz9WFAlIaUUpRoFU3oA2gWR0CiMMBCtzS1dX2UKGgGaAloD0MIPx2PGai/YkCUhpRSlGgVTegDaBZHQKIxWxREWqN1fZQoaAZoCWgPQwh2+kFdJAtiQJSGlFKUaBVN6ANoFkdAojUd3GGVRnV9lChoBmgJaA9DCPKWqx+bsV9AlIaUUpRoFU3oA2gWR0CiN0Tj/+85dX2UKGgGaAloD0MIFLGIYQetbECUhpRSlGgVTZIBaBZHQKI44JfpljF1ZS4="
73
  },
74
  "ep_success_buffer": {
75
  ":type:": "<class 'collections.deque'>",
76
  ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
77
  },
78
- "_n_updates": 414,
79
  "n_steps": 1024,
80
  "gamma": 0.999,
81
  "gae_lambda": 0.98,
82
  "ent_coef": 0.01,
83
  "vf_coef": 0.5,
84
  "max_grad_norm": 0.5,
85
- "batch_size": 1024,
86
- "n_epochs": 6,
87
  "clip_range": {
88
  ":type:": "<class 'function'>",
89
  ":serialized:": "gAWVwwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOC9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS4BDAgABlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOC9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoFmgNjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoF4wHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/yZmZmZmZmoWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="
 
4
  ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
5
  "__module__": "stable_baselines3.common.policies",
6
  "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param sde_net_arch: Network architecture for extracting features\n when using gSDE. If None, the latent features from the policy will be used.\n Pass an empty list to use the states as features.\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
7
+ "__init__": "<function ActorCriticPolicy.__init__ at 0x7f84226278b0>",
8
+ "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f8422627940>",
9
+ "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f84226279d0>",
10
+ "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f8422627a60>",
11
+ "_build": "<function ActorCriticPolicy._build at 0x7f8422627af0>",
12
+ "forward": "<function ActorCriticPolicy.forward at 0x7f8422627b80>",
13
+ "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f8422627c10>",
14
+ "_predict": "<function ActorCriticPolicy._predict at 0x7f8422627ca0>",
15
+ "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f8422627d30>",
16
+ "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f8422627dc0>",
17
+ "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f8422627e50>",
18
  "__abstractmethods__": "frozenset()",
19
+ "_abc_impl": "<_abc_data object at 0x7f84225a90c0>"
20
  },
21
  "verbose": 1,
22
  "policy_kwargs": {},
 
47
  "_num_timesteps_at_start": 0,
48
  "seed": null,
49
  "action_noise": null,
50
+ "start_time": 1670410119328534839,
51
  "learning_rate": 0.0003,
52
  "tensorboard_log": null,
53
  "lr_schedule": {
 
56
  },
57
  "_last_obs": {
58
  ":type:": "<class 'numpy.ndarray'>",
59
+ ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAIAnG76Bnw4/JuDQPg7dhr4qrRE+svo4PQAAAAAAAAAAM3mbvOyJ+bmaLwI0w4suL9FkQ7p6h5+zAACAPwAAgD+aOki9BfSLu1hNrDvmrSM9lqJEu8hDc7wAAIA/AACAP81DKz1InZi6G+jBu1XrCjifNvE6euQutwAAgD8AAIA/OnUmPqwmKj45ERK+5sZTvu1cB72qbZ87AAAAAAAAAAAz3d89ZJ+CP8a/4T27m5i+EOnOPai5iL0AAAAAAAAAAC2blT4PGeA+tbU5vgCXjr5tyvw8Y3h0vQAAAAAAAAAAjfOMvQ+ETD8jZOG8s/KFvv9WZr0Ipas9AAAAAAAAAADNvBi7rjeRus21OLWjnD2w2IgEu+YiTjQAAIA/AACAP6DVNj7k7So+3nH/vbMglb6rOJi87uCPuwAAAAAAAAAAZkOxPMzVPz5OGmS917KDvpI1PLvaTYO9AAAAAAAAAADt9H0+8Yw2P0oKIL0u3a++Jsi1PXi29TsAAAAAAAAAALPxCT18O+o+wOSyu9tthr6DdjM9gp+WuwAAAAAAAAAAzdbTvTyMOD9FOuQ99kanvoa0Jb1Cll69AAAAAAAAAACaZw29Hx2qudus0jqeJz82HdFaOpuw+rkAAIA/AACAP/qLDr5/6pQ/XrHBvi0gpr5tvSy+hgzkvQAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="
60
  },
61
  "_last_episode_starts": {
62
  ":type:": "<class 'numpy.ndarray'>",
 
69
  "_current_progress_remaining": -0.015808000000000044,
70
  "ep_info_buffer": {
71
  ":type:": "<class 'collections.deque'>",
72
+ ":serialized:": "gAWVehAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIPEuQEVCwUkCUhpRSlIwBbJRNHgGMAXSUR0CUNUtMPBi1dX2UKGgGaAloD0MIlugsswjyZECUhpRSlGgVTegDaBZHQJRDcWLxZuB1fZQoaAZoCWgPQwj4+lqXmr5vQJSGlFKUaBVN4AFoFkdAlEbUjcEeQ3V9lChoBmgJaA9DCKJFtvM903BAlIaUUpRoFU3gAmgWR0CUR+Nd7fHhdX2UKGgGaAloD0MIrOEi9zQXcUCUhpRSlGgVTToCaBZHQJRK7DNyHVR1fZQoaAZoCWgPQwhMp3UbFCFwQJSGlFKUaBVNygJoFkdAlEtDw+dK/XV9lChoBmgJaA9DCEKvP4lPqHBAlIaUUpRoFU2fAmgWR0CUS1OdoWYXdX2UKGgGaAloD0MIcLGiBtOOckCUhpRSlGgVTVYBaBZHQJRQz+fh/Al1fZQoaAZoCWgPQwh/F7Zmq6FtQJSGlFKUaBVNIQNoFkdAlFMEgGKQ73V9lChoBmgJaA9DCNy7Bn3pbWNAlIaUUpRoFU3oA2gWR0CUU1MvRJEqdX2UKGgGaAloD0MIg94bQwADbkCUhpRSlGgVTSsBaBZHQJRU2q94/u91fZQoaAZoCWgPQwjNHmgFhj5xQJSGlFKUaBVNDwJoFkdAlFVdQsPJ73V9lChoBmgJaA9DCGU5CaXvPnFAlIaUUpRoFU1yAWgWR0CUV1Bu4wyqdX2UKGgGaAloD0MIW80643sXaUCUhpRSlGgVTegDaBZHQJRaezlcQiB1fZQoaAZoCWgPQwh/Z3v0BpNwQJSGlFKUaBVNIwJoFkdAlFss9Oh0yXV9lChoBmgJaA9DCJKvBFLiwGxAlIaUUpRoFU3zAWgWR0CUXLzmfXf7dX2UKGgGaAloD0MI73Tniecmb0CUhpRSlGgVTRMCaBZHQJRc2BRQ7911fZQoaAZoCWgPQwhYqaCiaslxQJSGlFKUaBVNmAFoFkdAlGKg8wHqvHV9lChoBmgJaA9DCOY7+IkD+kVAlIaUUpRoFUv0aBZHQJRi2Z5Rjz91fZQoaAZoCWgPQwiJCtXNBWJwQJSGlFKUaBVN0AFoFkdAlGYMpsoDxXV9lChoBmgJaA9DCAN7TKQ0Km5AlIaUUpRoFU0qAmgWR0CUZ99kjHGTdX2UKGgGaAloD0MIutkfKPddcUCUhpRSlGgVTfwBaBZHQJRumLm6oVF1fZQoaAZoCWgPQwhe2nBY2nlxQJSGlFKUaBVN9gFoFkdAlHLvFzdUKnV9lChoBmgJaA9DCMB4Bg39s29AlIaUUpRoFU0cAWgWR0CUc9cE/0NCdX2UKGgGaAloD0MIEf+wpcfobkCUhpRSlGgVTSoCaBZHQJR0LGxUvPF1fZQoaAZoCWgPQwhEM0+u6VhxQJSGlFKUaBVNQANoFkdAlHSv557gKnV9lChoBmgJaA9DCPGg2XWviXBAlIaUUpRoFU1bAmgWR0CUdpZ9uxbCdX2UKGgGaAloD0MIpmPOM/YhcECUhpRSlGgVTTkCaBZHQJR4vMyJsO51fZQoaAZoCWgPQwhCrz+Jj5lwQJSGlFKUaBVNUgNoFkdAlHjM10knkXV9lChoBmgJaA9DCHUAxF29DVBAlIaUUpRoFUvmaBZHQJR8GfTTfBN1fZQoaAZoCWgPQwhbeF4q9udxQJSGlFKUaBVNkwFoFkdAlH3Q40dilXV9lChoBmgJaA9DCNF3t7LEfnFAlIaUUpRoFU1gAmgWR0CUjjX668QJdX2UKGgGaAloD0MI4GjHDT8MbkCUhpRSlGgVTaoBaBZHQJSO4jzI3it1fZQoaAZoCWgPQwhKfO4Ee/RxQJSGlFKUaBVNkQJoFkdAlI8rPppvgnV9lChoBmgJaA9DCAoxl1Tt/29AlIaUUpRoFU2+AmgWR0CUkM7ngYP5dX2UKGgGaAloD0MIVG8NbJXlb0CUhpRSlGgVTTQCaBZHQJSRPBInSfF1fZQoaAZoCWgPQwjXT/9Zc8pjQJSGlFKUaBVN6ANoFkdAlJKUhRqGlHV9lChoBmgJaA9DCCwN/KhGd3FAlIaUUpRoFU39AmgWR0CUlcfQa72+dX2UKGgGaAloD0MIT1lN15MGckCUhpRSlGgVTZoBaBZHQJSYcoG6f8N1fZQoaAZoCWgPQwgWpu81BLxwQJSGlFKUaBVNOAFoFkdAlJzQSWZ7X3V9lChoBmgJaA9DCE5DVOFPt2pAlIaUUpRoFU3qAWgWR0CUorTFERapdX2UKGgGaAloD0MIi98UVqqGb0CUhpRSlGgVTVUCaBZHQJSjGIhyKel1fZQoaAZoCWgPQwjwiuB/K0UyQJSGlFKUaBVL/2gWR0CUpq47zTWodX2UKGgGaAloD0MInE1HADe6bECUhpRSlGgVTfEBaBZHQJSnpj/dZaF1fZQoaAZoCWgPQwi+o8aEmNxuQJSGlFKUaBVNewFoFkdAlKi2mHgxanV9lChoBmgJaA9DCMWp1sKsJW5AlIaUUpRoFU27AWgWR0CUqgmZmZmadX2UKGgGaAloD0MIARWOIBVjb0CUhpRSlGgVTS4BaBZHQJSsdL5AQg91fZQoaAZoCWgPQwitS43QD6ZxQJSGlFKUaBVNvQJoFkdAlK3byhBZ6nV9lChoBmgJaA9DCJ5A2ClW1T5AlIaUUpRoFUvXaBZHQJS3MHu7YkF1fZQoaAZoCWgPQwgT8db5t8puQJSGlFKUaBVNIQFoFkdAlLsEWykbgnV9lChoBmgJaA9DCG2sxDyr7WxAlIaUUpRoFU2CAWgWR0CUvEKl54W2dX2UKGgGaAloD0MIj8ahfhekZECUhpRSlGgVTegDaBZHQJS+cv9LpRp1fZQoaAZoCWgPQwjCL/XzpsBlQJSGlFKUaBVN6ANoFkdAlL7Mdkrf+HV9lChoBmgJaA9DCNGt1/Qg6G9AlIaUUpRoFU3mA2gWR0CUxG1NQCSzdX2UKGgGaAloD0MI/ACkNnEabkCUhpRSlGgVTXQBaBZHQJTFSqm0mdB1fZQoaAZoCWgPQwi28pL/yQNvQJSGlFKUaBVN1QFoFkdAlMZyJGe+VXV9lChoBmgJaA9DCPqcu12v+GxAlIaUUpRoFU15AWgWR0CUxxlV94NadX2UKGgGaAloD0MI/yWpTDG3ZUCUhpRSlGgVTegDaBZHQJTM/xvvSc91fZQoaAZoCWgPQwhmZ9E7FahuQJSGlFKUaBVNRAFoFkdAlM0Rj4Hoo3V9lChoBmgJaA9DCDdUjPM3ylVAlIaUUpRoFU3oA2gWR0CU3CMW43FUdX2UKGgGaAloD0MItMu3PqzFbUCUhpRSlGgVTR4BaBZHQJTdSJBPbfx1fZQoaAZoCWgPQwhDqiheZTJyQJSGlFKUaBVNMgFoFkdAlN10T6BRRHV9lChoBmgJaA9DCC/ej9uv02xAlIaUUpRoFU3fA2gWR0CU3d3rD63zdX2UKGgGaAloD0MItHIvMCsNcECUhpRSlGgVTdsDaBZHQJTfv83uNPx1fZQoaAZoCWgPQwhDVOHP8LpuQJSGlFKUaBVNKAFoFkdAlN+/HHWBjHV9lChoBmgJaA9DCEnajT5mG3BAlIaUUpRoFU1GAWgWR0CU4O2dNFjNdX2UKGgGaAloD0MIccgG0sWsQkCUhpRSlGgVTQEBaBZHQJTj34pMHr11fZQoaAZoCWgPQwhrgqj7QB5xQJSGlFKUaBVNJgNoFkdAlOPg5eZ5RnV9lChoBmgJaA9DCBgLQ+T0amxAlIaUUpRoFU2eA2gWR0CU5aDDTBqLdX2UKGgGaAloD0MIar+1E6XebkCUhpRSlGgVTWIBaBZHQJTmg1+AmRh1fZQoaAZoCWgPQwiwq8lTljFwQJSGlFKUaBVNZgFoFkdAlOdbdi2Dx3V9lChoBmgJaA9DCC5yT1d3qFFAlIaUUpRoFUvbaBZHQJToubiIcip1fZQoaAZoCWgPQwi5jQbwFlpAQJSGlFKUaBVL4mgWR0CU8BmnO0LMdX2UKGgGaAloD0MIL2tiga9vbkCUhpRSlGgVTXABaBZHQJTw+dGy5Zt1fZQoaAZoCWgPQwhTPZl/dAFjQJSGlFKUaBVN6ANoFkdAlPGemm+Cb3V9lChoBmgJaA9DCLJiuDoA9WpAlIaUUpRoFU1+AWgWR0CU8hJAt4A0dX2UKGgGaAloD0MI14UfnE+zRECUhpRSlGgVTQ4BaBZHQJT2ic5Ke051fZQoaAZoCWgPQwhlNzP60XFsQJSGlFKUaBVNSQFoFkdAlPbPs/pt8HV9lChoBmgJaA9DCOhKBKp/im1AlIaUUpRoFU32AWgWR0CU96HbypaSdX2UKGgGaAloD0MIP1jGhu4VckCUhpRSlGgVTcYBaBZHQJT5cejmCAd1fZQoaAZoCWgPQwiJtI0/UTxuQJSGlFKUaBVNHwJoFkdAlPonggow23V9lChoBmgJaA9DCE95dCOs83BAlIaUUpRoFU3TAWgWR0CU+jaA4GUwdX2UKGgGaAloD0MIsVHWbyZxcECUhpRSlGgVTX0BaBZHQJT73dbgTAZ1fZQoaAZoCWgPQwi/f/PiRFJuQJSGlFKUaBVNQgJoFkdAlPx+s1baAXV9lChoBmgJaA9DCMed0sG6NnNAlIaUUpRoFU2EAWgWR0CU/c7kXDWLdX2UKGgGaAloD0MItU/HY0YPcUCUhpRSlGgVTWwBaBZHQJT+Cqfe1rt1fZQoaAZoCWgPQwgZkpOJ2xdvQJSGlFKUaBVNHgFoFkdAlQC8BIWgvnV9lChoBmgJaA9DCLfsEP+wpfa/lIaUUpRoFUuqaBZHQJUCNo7FKkF1fZQoaAZoCWgPQwinBwWlaBJsQJSGlFKUaBVNYAFoFkdAlQTFKK5083V9lChoBmgJaA9DCJCEfTuJvGxAlIaUUpRoFU29AWgWR0CVCO/UvwmWdX2UKGgGaAloD0MISddMvtkIbECUhpRSlGgVTWoBaBZHQJUJ7NOdoWZ1fZQoaAZoCWgPQwg+JefEnvBtQJSGlFKUaBVNwgFoFkdAlQsXoxHoYHV9lChoBmgJaA9DCJDZWfTOo29AlIaUUpRoFU1WAWgWR0CVC3qc3EQ5dX2UKGgGaAloD0MI3+LhPQf8ZkCUhpRSlGgVTegDaBZHQJUMk01qFh51fZQoaAZoCWgPQwh+c3/1eJpwQJSGlFKUaBVNGgFoFkdAlQ0myxA0K3V9lChoBmgJaA9DCOC593BJmHFAlIaUUpRoFU0kAWgWR0CVDgE384xUdX2UKGgGaAloD0MI6Zyf4ji/bkCUhpRSlGgVTa0BaBZHQJUOD1Gsmv51fZQoaAZoCWgPQwjPLt/6cPBwQJSGlFKUaBVNqAFoFkdAlQ5ztgKF7HV9lChoBmgJaA9DCHh6pSzD9HFAlIaUUpRoFU2RAWgWR0CVEOVxS5y3dX2UKGgGaAloD0MIS+ZY3lU8cECUhpRSlGgVTTgBaBZHQJURy8OCoTB1ZS4="
73
  },
74
  "ep_success_buffer": {
75
  ":type:": "<class 'collections.deque'>",
76
  ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
77
  },
78
+ "_n_updates": 248,
79
  "n_steps": 1024,
80
  "gamma": 0.999,
81
  "gae_lambda": 0.98,
82
  "ent_coef": 0.01,
83
  "vf_coef": 0.5,
84
  "max_grad_norm": 0.5,
85
+ "batch_size": 64,
86
+ "n_epochs": 4,
87
  "clip_range": {
88
  ":type:": "<class 'function'>",
89
  ":serialized:": "gAWVwwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOC9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS4BDAgABlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOC9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoFmgNjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoF4wHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/yZmZmZmZmoWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="
LunarLander_v2-PPO/policy.optimizer.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:04e28354659f7b412533f9a8b551c6db97e6fb71c9541cf92fdc7a1387b9a596
3
- size 87993
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dd0d2089f4432af2d60cba0d267be5cf4d27bdb24538656eb0545c349904bc48
3
+ size 87545
LunarLander_v2-PPO/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:46abeb5aaccf1eae2f5616ec25d6360ac7a4519421c400cf1293793fdc41b9e2
3
- size 43201
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fd1dcf24fc5871ad2802867ccfd55675370a9d3c60e628f0430ab5e28b3965fa
3
+ size 43073
LunarLander_v2-PPO/system_info.txt CHANGED
@@ -2,6 +2,6 @@ OS: Linux-5.10.133+-x86_64-with-glibc2.27 #1 SMP Fri Aug 26 08:44:51 UTC 2022
2
  Python: 3.8.15
3
  Stable-Baselines3: 1.6.2
4
  PyTorch: 1.12.1+cu113
5
- GPU Enabled: True
6
  Numpy: 1.21.6
7
  Gym: 0.21.0
 
2
  Python: 3.8.15
3
  Stable-Baselines3: 1.6.2
4
  PyTorch: 1.12.1+cu113
5
+ GPU Enabled: False
6
  Numpy: 1.21.6
7
  Gym: 0.21.0
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: LunarLander-v2
17
  metrics:
18
  - type: mean_reward
19
- value: 105.35 +/- 66.06
20
  name: mean_reward
21
  verified: false
22
  ---
 
16
  type: LunarLander-v2
17
  metrics:
18
  - type: mean_reward
19
+ value: 254.92 +/- 20.95
20
  name: mean_reward
21
  verified: false
22
  ---
config.json CHANGED
@@ -1 +1 @@
1
- {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param sde_net_arch: Network architecture for extracting features\n when using gSDE. If None, the latent features from the policy will be used.\n Pass an empty list to use the states as features.\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7f564bfdb310>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f564bfdb3a0>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f564bfdb430>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f564bfdb4c0>", "_build": "<function ActorCriticPolicy._build at 0x7f564bfdb550>", "forward": "<function ActorCriticPolicy.forward at 0x7f564bfdb5e0>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f564bfdb670>", "_predict": "<function ActorCriticPolicy._predict at 0x7f564bfdb700>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f564bfdb790>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f564bfdb820>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f564bfdb8b0>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc_data object at 0x7f564bfd3ae0>"}, "verbose": 1, "policy_kwargs": {}, "observation_space": {":type:": "<class 'gym.spaces.box.Box'>", ":serialized:": "gAWVnwEAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLCIWUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWIAAAAAAAAAAAAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/5RoCksIhZSMAUOUdJRSlIwEaGlnaJRoEiiWIAAAAAAAAAAAAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAf5RoCksIhZRoFXSUUpSMDWJvdW5kZWRfYmVsb3eUaBIolggAAAAAAAAAAAAAAAAAAACUaAeMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLCIWUaBV0lFKUjA1ib3VuZGVkX2Fib3ZllGgSKJYIAAAAAAAAAAAAAAAAAAAAlGghSwiFlGgVdJRSlIwKX25wX3JhbmRvbZROdWIu", "dtype": "float32", "_shape": [8], "low": "[-inf -inf -inf -inf -inf -inf -inf -inf]", "high": "[inf inf inf inf inf inf inf inf]", "bounded_below": "[False False False False False False False False]", "bounded_above": "[False False False False False False False False]", "_np_random": null}, "action_space": {":type:": "<class 'gym.spaces.discrete.Discrete'>", ":serialized:": "gAWVggAAAAAAAACME2d5bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpRLBIwGX3NoYXBllCmMBWR0eXBllIwFbnVtcHmUaAeTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYowKX25wX3JhbmRvbZROdWIu", "n": 4, "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 16, "num_timesteps": 1015808, "_total_timesteps": 1000000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1670353699724315896, "learning_rate": 0.0003, "tensorboard_log": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVwwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOC9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS4BDAgABlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOC9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoFmgNjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoF4wHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/M6kqMFUyYYWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="}, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAIBx0L1cjxy69eJcu1S8lTgPi2i7deXtOQAAgD8AAIA/AJGVvUzZ7j5H2ri9vPRJvllHzL3Vxtg7AAAAAAAAAADNFye9nSZOPx6Gkj3OJom++IQBPJ30xDwAAAAAAAAAAM0euzxXAX8/k3zvPXYAi743HCW6K5VPvQAAAAAAAAAAGoQVPWRqRj4SpvI9LbQHvvvUJz29Wvy8AAAAAAAAAADArBy+pHx+PHzaQTtL+cC5q3kKvqM+8jkAAIA/AACAP5phBzyvSWM9NjSGvXRcU77UKNq8C7ZvvQAAAAAAAAAAgGlVPewBl7mj64S7fHU4N2znDLsbkHY6AACAPwAAgD+alTg9UkDNuT5bibtvIgs1yVFiulENnjoAAIA/AACAP2ayojv+1dk9yEzfPbfEO766bmY9tgUTvgAAAAAAAAAAAGq9vY+uZLq+vFI7nXIENtebxLi9OPE0AACAPwAAgD8N3oc9exyQutboFTzf6Y82EKsOu2RThjUAAIA/AACAP1PEI77PSAy8K07huwYECLpm6mA9QtTeOgAAgD8AAIA/U6wpvpR3i7xW4jK8Jra7ukbj8D0uvJ47AACAPwAAgD+m98+9KbgHumaa/DiaCXGxTvBDOvprE7gAAIA/AACAP+bLv732NCO6IO4gupwIjbVt02w5GMk9OQAAgD8AAIA/lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.015808000000000044, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVfRAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIkiOdgRFAYECUhpRSlIwBbJRN6AOMAXSUR0ChdhbF85S4dX2UKGgGaAloD0MIVb/S+fCnY0CUhpRSlGgVTegDaBZHQKF2jp7kXDZ1fZQoaAZoCWgPQwi3f2WlSYxdQJSGlFKUaBVN6ANoFkdAoXjWEGqxT3V9lChoBmgJaA9DCHNIaqHk8WVAlIaUUpRoFU3oA2gWR0ChfajxkNF0dX2UKGgGaAloD0MIJvvnacB4X0CUhpRSlGgVTegDaBZHQKF+WOMERrd1fZQoaAZoCWgPQwhXPzbJj4RiQJSGlFKUaBVN6ANoFkdAoX8ALb5/LHV9lChoBmgJaA9DCLtgcM0dT2RAlIaUUpRoFU3oA2gWR0ChgoiqhlDndX2UKGgGaAloD0MImPijqDOoWUCUhpRSlGgVTegDaBZHQKGCyAq/dqN1fZQoaAZoCWgPQwgb17/rs0ViQJSGlFKUaBVN6ANoFkdAoYWaFZgXuXV9lChoBmgJaA9DCAcLJ2n+ClxAlIaUUpRoFU3oA2gWR0ChieGZE2HddX2UKGgGaAloD0MIyTmxh/aCWECUhpRSlGgVTegDaBZHQKGJ6C2c8T11fZQoaAZoCWgPQwjXMEPjCSJjQJSGlFKUaBVN6ANoFkdAoY9csrd30XV9lChoBmgJaA9DCAYTfxR1OFxAlIaUUpRoFU3oA2gWR0ChkCujIq9XdX2UKGgGaAloD0MIvAfovhyeYECUhpRSlGgVTegDaBZHQKGWo6dUbUB1fZQoaAZoCWgPQwhQ4QhSKSJiQJSGlFKUaBVN6ANoFkdAoZgLdtVJc3V9lChoBmgJaA9DCOV620yFjlhAlIaUUpRoFU3oA2gWR0ChmblSsKb8dX2UKGgGaAloD0MI1eqrq4I4YUCUhpRSlGgVTegDaBZHQKGZvKbrkbR1fZQoaAZoCWgPQwiL/zuiQjhcQJSGlFKUaBVN6ANoFkdAoZo8X7+DOHV9lChoBmgJaA9DCDkroib6uEFAlIaUUpRoFU1YAWgWR0ChnCOm78NydX2UKGgGaAloD0MIoiWPp+XlYECUhpRSlGgVTegDaBZHQKGciAFPi1l1fZQoaAZoCWgPQwjnN0w0SI5gQJSGlFKUaBVN6ANoFkdAoaFCP0Zm7XV9lChoBmgJaA9DCBe86CtIQFpAlIaUUpRoFU3oA2gWR0ChofIMjNY9dX2UKGgGaAloD0MIsacd/pqyYUCUhpRSlGgVTegDaBZHQKGinJhfBvd1fZQoaAZoCWgPQwi+afrsgIJWQJSGlFKUaBVN6ANoFkdAoaYjzXjEN3V9lChoBmgJaA9DCMCUgQNa5llAlIaUUpRoFU3oA2gWR0ChpmKSxJNCdX2UKGgGaAloD0MI0GT/PA0cYECUhpRSlGgVTegDaBZHQKGoThybQTp1fZQoaAZoCWgPQwh+NnLdlG4/QJSGlFKUaBVNGgFoFkdAoat+gL7XQXV9lChoBmgJaA9DCDSitDd4RGBAlIaUUpRoFU3oA2gWR0ChrY/47A+IdX2UKGgGaAloD0MIayxhbQywYkCUhpRSlGgVTegDaBZHQKGtltaY/ml1fZQoaAZoCWgPQwjz6EZYVJtfQJSGlFKUaBVN6ANoFkdAobOOnGbTdHV9lChoBmgJaA9DCNe+gF64LFpAlIaUUpRoFU3oA2gWR0ChueNx+8XfdX2UKGgGaAloD0MIdJXurrMeYkCUhpRSlGgVTegDaBZHQKG7Q0HhS+B1fZQoaAZoCWgPQwggmQ6dnm8vQJSGlFKUaBVL32gWR0Chu/fQKKHgdX2UKGgGaAloD0MIieyDLAscXUCUhpRSlGgVTegDaBZHQKG85ukUKzB1fZQoaAZoCWgPQwgKhnMNM4pdQJSGlFKUaBVN6ANoFkdAobzpY1YQrnV9lChoBmgJaA9DCBO1NLdC+l5AlIaUUpRoFU3oA2gWR0ChvVxzijtYdX2UKGgGaAloD0MIKT+p9unLXUCUhpRSlGgVTegDaBZHQKG/LXsgMc91fZQoaAZoCWgPQwgV/3dEhbRgQJSGlFKUaBVN6ANoFkdAob+MwSJ0n3V9lChoBmgJaA9DCBr4UQ37dFlAlIaUUpRoFU3oA2gWR0ChxM1UMoc8dX2UKGgGaAloD0MIVWr2QCuIWECUhpRSlGgVTegDaBZHQKHFcIJJGvx1fZQoaAZoCWgPQwiMuWsJ+QFZQJSGlFKUaBVN6ANoFkdAockY2ycCo3V9lChoBmgJaA9DCE9bI4Jx7FZAlIaUUpRoFU3oA2gWR0ChyVWTPjXGdX2UKGgGaAloD0MIQ61p3vG2YUCUhpRSlGgVTegDaBZHQKHLVnnuAqd1fZQoaAZoCWgPQwiQ14NJcZRiQJSGlFKUaBVN6ANoFkdAoc6afOD8L3V9lChoBmgJaA9DCNXnaiv2G2FAlIaUUpRoFU3oA2gWR0Ch0I6uOjqOdX2UKGgGaAloD0MIiPVGrTCAYECUhpRSlGgVTegDaBZHQKHQlU83dbh1fZQoaAZoCWgPQwhATpgwmi09QJSGlFKUaBVNPgFoFkdAod4M9yLhrHV9lChoBmgJaA9DCAq/1M+ba2BAlIaUUpRoFU3oA2gWR0Ch34OdXko4dX2UKGgGaAloD0MI+Z0mM94UYkCUhpRSlGgVTegDaBZHQKHg+0tRNyp1fZQoaAZoCWgPQwhgOq3boP5hQJSGlFKUaBVN6ANoFkdAoeG6mbb1y3V9lChoBmgJaA9DCILK+PcZBF5AlIaUUpRoFU3oA2gWR0Ch4qta6jFidX2UKGgGaAloD0MIyM7b2Oy1ZECUhpRSlGgVTegDaBZHQKHirTaTOgR1fZQoaAZoCWgPQwg4nzpWqe1iQJSGlFKUaBVN6ANoFkdAoeMkAR02cnV9lChoBmgJaA9DCKZG6GfqN2BAlIaUUpRoFU3oA2gWR0Ch5RxRdhRZdX2UKGgGaAloD0MIPIcyVMUDXkCUhpRSlGgVTegDaBZHQKHlemUGFBZ1fZQoaAZoCWgPQwj7k/jcCZFcQJSGlFKUaBVN6ANoFkdAoepdsrNGE3V9lChoBmgJaA9DCMCWV663iWJAlIaUUpRoFU3oA2gWR0Ch6wdcbBGhdX2UKGgGaAloD0MIYFs//Wd1XkCUhpRSlGgVTegDaBZHQKHusbdadMF1fZQoaAZoCWgPQwjgaMcNvxsXQJSGlFKUaBVNNwFoFkdAoe7nuTibUnV9lChoBmgJaA9DCHOfHAWIrF1AlIaUUpRoFU3oA2gWR0Ch7vNNrTH9dX2UKGgGaAloD0MIKbLWUGqRWkCUhpRSlGgVTegDaBZHQKHw2FbmlqJ1fZQoaAZoCWgPQwjWG7XC9GteQJSGlFKUaBVN6ANoFkdAofQOJN0vG3V9lChoBmgJaA9DCKg5eZEJkmFAlIaUUpRoFU3oA2gWR0Ch9iShakhzdX2UKGgGaAloD0MIxciSOZYbOECUhpRSlGgVS/FoFkdAoffgG6f8M3V9lChoBmgJaA9DCHdpw2FpYGJAlIaUUpRoFU3oA2gWR0CiAiSk9ECvdX2UKGgGaAloD0MImWGjrN9tW0CUhpRSlGgVTegDaBZHQKIDNUqhDgJ1fZQoaAZoCWgPQwixMEROXxBYQJSGlFKUaBVN6ANoFkdAogSW/zreInV9lChoBmgJaA9DCHZu2ozTWlxAlIaUUpRoFU3oA2gWR0CiBUw7DEWJdX2UKGgGaAloD0MIC19f61K2X0CUhpRSlGgVTegDaBZHQKIGKJvYODt1fZQoaAZoCWgPQwjghhiveZtgQJSGlFKUaBVN6ANoFkdAogYqURnOB3V9lChoBmgJaA9DCFtAaD18CGFAlIaUUpRoFU3oA2gWR0CiBpTuF6AwdX2UKGgGaAloD0MIxhft8UKNX0CUhpRSlGgVTegDaBZHQKIItnFo+Oh1fZQoaAZoCWgPQwhXQQx07T1eQJSGlFKUaBVN6ANoFkdAog23d69kBnV9lChoBmgJaA9DCDV8C+vG6VpAlIaUUpRoFU3oA2gWR0CiDl6lDWsjdX2UKGgGaAloD0MINzXQfE40YECUhpRSlGgVTegDaBZHQKISMDK5kLB1fZQoaAZoCWgPQwi+UMB2MMhiQJSGlFKUaBVN6ANoFkdAohJnsw+MZXV9lChoBmgJaA9DCFga+FGNyGFAlIaUUpRoFU3oA2gWR0CiFHxmseXBdX2UKGgGaAloD0MIUMjO21iBY0CUhpRSlGgVTegDaBZHQKIW4uLaVUx1fZQoaAZoCWgPQwiwxW6f1fthQJSGlFKUaBVN6ANoFkdAohoHxe9i+nV9lChoBmgJaA9DCLtFYKxvulxAlIaUUpRoFU3oA2gWR0CiG/RCY1HfdX2UKGgGaAloD0MI/kgRGVZxLECUhpRSlGgVTVoBaBZHQKIfdVmSQo11fZQoaAZoCWgPQwiwIM1YNNk1QJSGlFKUaBVL4WgWR0CiH/LncL0BdX2UKGgGaAloD0MIMxmO5zPiYUCUhpRSlGgVTegDaBZHQKImAOJcgQp1fZQoaAZoCWgPQwhCYOXQIhdbQJSGlFKUaBVN6ANoFkdAoicMWZZ0S3V9lChoBmgJaA9DCBSUopX7RW9AlIaUUpRoFU1ZAWgWR0CiJxXY+Sr6dX2UKGgGaAloD0MInWUWodhKHUCUhpRSlGgVTSYBaBZHQKInGo5PuXx1fZQoaAZoCWgPQwiHNZVFYZpgQJSGlFKUaBVN6ANoFkdAoihfsRg7YHV9lChoBmgJaA9DCI/7VuvEaF5AlIaUUpRoFU3oA2gWR0CiKQetSydGdX2UKGgGaAloD0MIr+sX7AbHYECUhpRSlGgVTegDaBZHQKIp3y5I6Kd1fZQoaAZoCWgPQwh7vfvjvelWQJSGlFKUaBVN6ANoFkdAoinh+SbH63V9lChoBmgJaA9DCJI81/fhQALAlIaUUpRoFU0HAWgWR0CiKen9ehPCdX2UKGgGaAloD0MIbarukc1cYUCUhpRSlGgVTegDaBZHQKIqQW8h9st1fZQoaAZoCWgPQwhQjgJEwYRfQJSGlFKUaBVN6ANoFkdAoiwH9m6GxnV9lChoBmgJaA9DCKJjB5W4viXAlIaUUpRoFUvPaBZHQKItFZpSJj51fZQoaAZoCWgPQwgpd5/jozUwQJSGlFKUaBVNHAFoFkdAojBiuB+WnnV9lChoBmgJaA9DCA/QfTkz9WFAlIaUUpRoFU3oA2gWR0CiMMBCtzS1dX2UKGgGaAloD0MIPx2PGai/YkCUhpRSlGgVTegDaBZHQKIxWxREWqN1fZQoaAZoCWgPQwh2+kFdJAtiQJSGlFKUaBVN6ANoFkdAojUd3GGVRnV9lChoBmgJaA9DCPKWqx+bsV9AlIaUUpRoFU3oA2gWR0CiN0Tj/+85dX2UKGgGaAloD0MIFLGIYQetbECUhpRSlGgVTZIBaBZHQKI44JfpljF1ZS4="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 414, "n_steps": 1024, "gamma": 0.999, "gae_lambda": 0.98, "ent_coef": 0.01, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 1024, "n_epochs": 6, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWVwwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOC9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS4BDAgABlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOC9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoFmgNjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoF4wHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/yZmZmZmZmoWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "system_info": {"OS": "Linux-5.10.133+-x86_64-with-glibc2.27 #1 SMP Fri Aug 26 08:44:51 UTC 2022", "Python": "3.8.15", "Stable-Baselines3": "1.6.2", "PyTorch": "1.12.1+cu113", "GPU Enabled": "True", "Numpy": "1.21.6", "Gym": "0.21.0"}}
 
1
+ {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param sde_net_arch: Network architecture for extracting features\n when using gSDE. If None, the latent features from the policy will be used.\n Pass an empty list to use the states as features.\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7f84226278b0>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f8422627940>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f84226279d0>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f8422627a60>", "_build": "<function ActorCriticPolicy._build at 0x7f8422627af0>", "forward": "<function ActorCriticPolicy.forward at 0x7f8422627b80>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f8422627c10>", "_predict": "<function ActorCriticPolicy._predict at 0x7f8422627ca0>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f8422627d30>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f8422627dc0>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f8422627e50>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc_data object at 0x7f84225a90c0>"}, "verbose": 1, "policy_kwargs": {}, "observation_space": {":type:": "<class 'gym.spaces.box.Box'>", ":serialized:": "gAWVnwEAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLCIWUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWIAAAAAAAAAAAAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/5RoCksIhZSMAUOUdJRSlIwEaGlnaJRoEiiWIAAAAAAAAAAAAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAf5RoCksIhZRoFXSUUpSMDWJvdW5kZWRfYmVsb3eUaBIolggAAAAAAAAAAAAAAAAAAACUaAeMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLCIWUaBV0lFKUjA1ib3VuZGVkX2Fib3ZllGgSKJYIAAAAAAAAAAAAAAAAAAAAlGghSwiFlGgVdJRSlIwKX25wX3JhbmRvbZROdWIu", "dtype": "float32", "_shape": [8], "low": "[-inf -inf -inf -inf -inf -inf -inf -inf]", "high": "[inf inf inf inf inf inf inf inf]", "bounded_below": "[False False False False False False False False]", "bounded_above": "[False False False False False False False False]", "_np_random": null}, "action_space": {":type:": "<class 'gym.spaces.discrete.Discrete'>", ":serialized:": "gAWVggAAAAAAAACME2d5bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpRLBIwGX3NoYXBllCmMBWR0eXBllIwFbnVtcHmUaAeTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYowKX25wX3JhbmRvbZROdWIu", "n": 4, "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 16, "num_timesteps": 1015808, "_total_timesteps": 1000000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1670410119328534839, "learning_rate": 0.0003, "tensorboard_log": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVwwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOC9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS4BDAgABlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOC9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoFmgNjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoF4wHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/M6kqMFUyYYWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="}, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAIAnG76Bnw4/JuDQPg7dhr4qrRE+svo4PQAAAAAAAAAAM3mbvOyJ+bmaLwI0w4suL9FkQ7p6h5+zAACAPwAAgD+aOki9BfSLu1hNrDvmrSM9lqJEu8hDc7wAAIA/AACAP81DKz1InZi6G+jBu1XrCjifNvE6euQutwAAgD8AAIA/OnUmPqwmKj45ERK+5sZTvu1cB72qbZ87AAAAAAAAAAAz3d89ZJ+CP8a/4T27m5i+EOnOPai5iL0AAAAAAAAAAC2blT4PGeA+tbU5vgCXjr5tyvw8Y3h0vQAAAAAAAAAAjfOMvQ+ETD8jZOG8s/KFvv9WZr0Ipas9AAAAAAAAAADNvBi7rjeRus21OLWjnD2w2IgEu+YiTjQAAIA/AACAP6DVNj7k7So+3nH/vbMglb6rOJi87uCPuwAAAAAAAAAAZkOxPMzVPz5OGmS917KDvpI1PLvaTYO9AAAAAAAAAADt9H0+8Yw2P0oKIL0u3a++Jsi1PXi29TsAAAAAAAAAALPxCT18O+o+wOSyu9tthr6DdjM9gp+WuwAAAAAAAAAAzdbTvTyMOD9FOuQ99kanvoa0Jb1Cll69AAAAAAAAAACaZw29Hx2qudus0jqeJz82HdFaOpuw+rkAAIA/AACAP/qLDr5/6pQ/XrHBvi0gpr5tvSy+hgzkvQAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.015808000000000044, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVehAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIPEuQEVCwUkCUhpRSlIwBbJRNHgGMAXSUR0CUNUtMPBi1dX2UKGgGaAloD0MIlugsswjyZECUhpRSlGgVTegDaBZHQJRDcWLxZuB1fZQoaAZoCWgPQwj4+lqXmr5vQJSGlFKUaBVN4AFoFkdAlEbUjcEeQ3V9lChoBmgJaA9DCKJFtvM903BAlIaUUpRoFU3gAmgWR0CUR+Nd7fHhdX2UKGgGaAloD0MIrOEi9zQXcUCUhpRSlGgVTToCaBZHQJRK7DNyHVR1fZQoaAZoCWgPQwhMp3UbFCFwQJSGlFKUaBVNygJoFkdAlEtDw+dK/XV9lChoBmgJaA9DCEKvP4lPqHBAlIaUUpRoFU2fAmgWR0CUS1OdoWYXdX2UKGgGaAloD0MIcLGiBtOOckCUhpRSlGgVTVYBaBZHQJRQz+fh/Al1fZQoaAZoCWgPQwh/F7Zmq6FtQJSGlFKUaBVNIQNoFkdAlFMEgGKQ73V9lChoBmgJaA9DCNy7Bn3pbWNAlIaUUpRoFU3oA2gWR0CUU1MvRJEqdX2UKGgGaAloD0MIg94bQwADbkCUhpRSlGgVTSsBaBZHQJRU2q94/u91fZQoaAZoCWgPQwjNHmgFhj5xQJSGlFKUaBVNDwJoFkdAlFVdQsPJ73V9lChoBmgJaA9DCGU5CaXvPnFAlIaUUpRoFU1yAWgWR0CUV1Bu4wyqdX2UKGgGaAloD0MIW80643sXaUCUhpRSlGgVTegDaBZHQJRaezlcQiB1fZQoaAZoCWgPQwh/Z3v0BpNwQJSGlFKUaBVNIwJoFkdAlFss9Oh0yXV9lChoBmgJaA9DCJKvBFLiwGxAlIaUUpRoFU3zAWgWR0CUXLzmfXf7dX2UKGgGaAloD0MI73Tniecmb0CUhpRSlGgVTRMCaBZHQJRc2BRQ7911fZQoaAZoCWgPQwhYqaCiaslxQJSGlFKUaBVNmAFoFkdAlGKg8wHqvHV9lChoBmgJaA9DCOY7+IkD+kVAlIaUUpRoFUv0aBZHQJRi2Z5Rjz91fZQoaAZoCWgPQwiJCtXNBWJwQJSGlFKUaBVN0AFoFkdAlGYMpsoDxXV9lChoBmgJaA9DCAN7TKQ0Km5AlIaUUpRoFU0qAmgWR0CUZ99kjHGTdX2UKGgGaAloD0MIutkfKPddcUCUhpRSlGgVTfwBaBZHQJRumLm6oVF1fZQoaAZoCWgPQwhe2nBY2nlxQJSGlFKUaBVN9gFoFkdAlHLvFzdUKnV9lChoBmgJaA9DCMB4Bg39s29AlIaUUpRoFU0cAWgWR0CUc9cE/0NCdX2UKGgGaAloD0MIEf+wpcfobkCUhpRSlGgVTSoCaBZHQJR0LGxUvPF1fZQoaAZoCWgPQwhEM0+u6VhxQJSGlFKUaBVNQANoFkdAlHSv557gKnV9lChoBmgJaA9DCPGg2XWviXBAlIaUUpRoFU1bAmgWR0CUdpZ9uxbCdX2UKGgGaAloD0MIpmPOM/YhcECUhpRSlGgVTTkCaBZHQJR4vMyJsO51fZQoaAZoCWgPQwhCrz+Jj5lwQJSGlFKUaBVNUgNoFkdAlHjM10knkXV9lChoBmgJaA9DCHUAxF29DVBAlIaUUpRoFUvmaBZHQJR8GfTTfBN1fZQoaAZoCWgPQwhbeF4q9udxQJSGlFKUaBVNkwFoFkdAlH3Q40dilXV9lChoBmgJaA9DCNF3t7LEfnFAlIaUUpRoFU1gAmgWR0CUjjX668QJdX2UKGgGaAloD0MI4GjHDT8MbkCUhpRSlGgVTaoBaBZHQJSO4jzI3it1fZQoaAZoCWgPQwhKfO4Ee/RxQJSGlFKUaBVNkQJoFkdAlI8rPppvgnV9lChoBmgJaA9DCAoxl1Tt/29AlIaUUpRoFU2+AmgWR0CUkM7ngYP5dX2UKGgGaAloD0MIVG8NbJXlb0CUhpRSlGgVTTQCaBZHQJSRPBInSfF1fZQoaAZoCWgPQwjXT/9Zc8pjQJSGlFKUaBVN6ANoFkdAlJKUhRqGlHV9lChoBmgJaA9DCCwN/KhGd3FAlIaUUpRoFU39AmgWR0CUlcfQa72+dX2UKGgGaAloD0MIT1lN15MGckCUhpRSlGgVTZoBaBZHQJSYcoG6f8N1fZQoaAZoCWgPQwgWpu81BLxwQJSGlFKUaBVNOAFoFkdAlJzQSWZ7X3V9lChoBmgJaA9DCE5DVOFPt2pAlIaUUpRoFU3qAWgWR0CUorTFERapdX2UKGgGaAloD0MIi98UVqqGb0CUhpRSlGgVTVUCaBZHQJSjGIhyKel1fZQoaAZoCWgPQwjwiuB/K0UyQJSGlFKUaBVL/2gWR0CUpq47zTWodX2UKGgGaAloD0MInE1HADe6bECUhpRSlGgVTfEBaBZHQJSnpj/dZaF1fZQoaAZoCWgPQwi+o8aEmNxuQJSGlFKUaBVNewFoFkdAlKi2mHgxanV9lChoBmgJaA9DCMWp1sKsJW5AlIaUUpRoFU27AWgWR0CUqgmZmZmadX2UKGgGaAloD0MIARWOIBVjb0CUhpRSlGgVTS4BaBZHQJSsdL5AQg91fZQoaAZoCWgPQwitS43QD6ZxQJSGlFKUaBVNvQJoFkdAlK3byhBZ6nV9lChoBmgJaA9DCJ5A2ClW1T5AlIaUUpRoFUvXaBZHQJS3MHu7YkF1fZQoaAZoCWgPQwgT8db5t8puQJSGlFKUaBVNIQFoFkdAlLsEWykbgnV9lChoBmgJaA9DCG2sxDyr7WxAlIaUUpRoFU2CAWgWR0CUvEKl54W2dX2UKGgGaAloD0MIj8ahfhekZECUhpRSlGgVTegDaBZHQJS+cv9LpRp1fZQoaAZoCWgPQwjCL/XzpsBlQJSGlFKUaBVN6ANoFkdAlL7Mdkrf+HV9lChoBmgJaA9DCNGt1/Qg6G9AlIaUUpRoFU3mA2gWR0CUxG1NQCSzdX2UKGgGaAloD0MI/ACkNnEabkCUhpRSlGgVTXQBaBZHQJTFSqm0mdB1fZQoaAZoCWgPQwi28pL/yQNvQJSGlFKUaBVN1QFoFkdAlMZyJGe+VXV9lChoBmgJaA9DCPqcu12v+GxAlIaUUpRoFU15AWgWR0CUxxlV94NadX2UKGgGaAloD0MI/yWpTDG3ZUCUhpRSlGgVTegDaBZHQJTM/xvvSc91fZQoaAZoCWgPQwhmZ9E7FahuQJSGlFKUaBVNRAFoFkdAlM0Rj4Hoo3V9lChoBmgJaA9DCDdUjPM3ylVAlIaUUpRoFU3oA2gWR0CU3CMW43FUdX2UKGgGaAloD0MItMu3PqzFbUCUhpRSlGgVTR4BaBZHQJTdSJBPbfx1fZQoaAZoCWgPQwhDqiheZTJyQJSGlFKUaBVNMgFoFkdAlN10T6BRRHV9lChoBmgJaA9DCC/ej9uv02xAlIaUUpRoFU3fA2gWR0CU3d3rD63zdX2UKGgGaAloD0MItHIvMCsNcECUhpRSlGgVTdsDaBZHQJTfv83uNPx1fZQoaAZoCWgPQwhDVOHP8LpuQJSGlFKUaBVNKAFoFkdAlN+/HHWBjHV9lChoBmgJaA9DCEnajT5mG3BAlIaUUpRoFU1GAWgWR0CU4O2dNFjNdX2UKGgGaAloD0MIccgG0sWsQkCUhpRSlGgVTQEBaBZHQJTj34pMHr11fZQoaAZoCWgPQwhrgqj7QB5xQJSGlFKUaBVNJgNoFkdAlOPg5eZ5RnV9lChoBmgJaA9DCBgLQ+T0amxAlIaUUpRoFU2eA2gWR0CU5aDDTBqLdX2UKGgGaAloD0MIar+1E6XebkCUhpRSlGgVTWIBaBZHQJTmg1+AmRh1fZQoaAZoCWgPQwiwq8lTljFwQJSGlFKUaBVNZgFoFkdAlOdbdi2Dx3V9lChoBmgJaA9DCC5yT1d3qFFAlIaUUpRoFUvbaBZHQJToubiIcip1fZQoaAZoCWgPQwi5jQbwFlpAQJSGlFKUaBVL4mgWR0CU8BmnO0LMdX2UKGgGaAloD0MIL2tiga9vbkCUhpRSlGgVTXABaBZHQJTw+dGy5Zt1fZQoaAZoCWgPQwhTPZl/dAFjQJSGlFKUaBVN6ANoFkdAlPGemm+Cb3V9lChoBmgJaA9DCLJiuDoA9WpAlIaUUpRoFU1+AWgWR0CU8hJAt4A0dX2UKGgGaAloD0MI14UfnE+zRECUhpRSlGgVTQ4BaBZHQJT2ic5Ke051fZQoaAZoCWgPQwhlNzP60XFsQJSGlFKUaBVNSQFoFkdAlPbPs/pt8HV9lChoBmgJaA9DCOhKBKp/im1AlIaUUpRoFU32AWgWR0CU96HbypaSdX2UKGgGaAloD0MIP1jGhu4VckCUhpRSlGgVTcYBaBZHQJT5cejmCAd1fZQoaAZoCWgPQwiJtI0/UTxuQJSGlFKUaBVNHwJoFkdAlPonggow23V9lChoBmgJaA9DCE95dCOs83BAlIaUUpRoFU3TAWgWR0CU+jaA4GUwdX2UKGgGaAloD0MIsVHWbyZxcECUhpRSlGgVTX0BaBZHQJT73dbgTAZ1fZQoaAZoCWgPQwi/f/PiRFJuQJSGlFKUaBVNQgJoFkdAlPx+s1baAXV9lChoBmgJaA9DCMed0sG6NnNAlIaUUpRoFU2EAWgWR0CU/c7kXDWLdX2UKGgGaAloD0MItU/HY0YPcUCUhpRSlGgVTWwBaBZHQJT+Cqfe1rt1fZQoaAZoCWgPQwgZkpOJ2xdvQJSGlFKUaBVNHgFoFkdAlQC8BIWgvnV9lChoBmgJaA9DCLfsEP+wpfa/lIaUUpRoFUuqaBZHQJUCNo7FKkF1fZQoaAZoCWgPQwinBwWlaBJsQJSGlFKUaBVNYAFoFkdAlQTFKK5083V9lChoBmgJaA9DCJCEfTuJvGxAlIaUUpRoFU29AWgWR0CVCO/UvwmWdX2UKGgGaAloD0MISddMvtkIbECUhpRSlGgVTWoBaBZHQJUJ7NOdoWZ1fZQoaAZoCWgPQwg+JefEnvBtQJSGlFKUaBVNwgFoFkdAlQsXoxHoYHV9lChoBmgJaA9DCJDZWfTOo29AlIaUUpRoFU1WAWgWR0CVC3qc3EQ5dX2UKGgGaAloD0MI3+LhPQf8ZkCUhpRSlGgVTegDaBZHQJUMk01qFh51fZQoaAZoCWgPQwh+c3/1eJpwQJSGlFKUaBVNGgFoFkdAlQ0myxA0K3V9lChoBmgJaA9DCOC593BJmHFAlIaUUpRoFU0kAWgWR0CVDgE384xUdX2UKGgGaAloD0MI6Zyf4ji/bkCUhpRSlGgVTa0BaBZHQJUOD1Gsmv51fZQoaAZoCWgPQwjPLt/6cPBwQJSGlFKUaBVNqAFoFkdAlQ5ztgKF7HV9lChoBmgJaA9DCHh6pSzD9HFAlIaUUpRoFU2RAWgWR0CVEOVxS5y3dX2UKGgGaAloD0MIS+ZY3lU8cECUhpRSlGgVTTgBaBZHQJURy8OCoTB1ZS4="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 248, "n_steps": 1024, "gamma": 0.999, "gae_lambda": 0.98, "ent_coef": 0.01, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 4, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWVwwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOC9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS4BDAgABlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOC9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoFmgNjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoF4wHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/yZmZmZmZmoWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "system_info": {"OS": "Linux-5.10.133+-x86_64-with-glibc2.27 #1 SMP Fri Aug 26 08:44:51 UTC 2022", "Python": "3.8.15", "Stable-Baselines3": "1.6.2", "PyTorch": "1.12.1+cu113", "GPU Enabled": "False", "Numpy": "1.21.6", "Gym": "0.21.0"}}
replay.mp4 CHANGED
Binary files a/replay.mp4 and b/replay.mp4 differ
 
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 105.35131052537062, "std_reward": 66.05886312286175, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2022-12-06T20:29:15.031054"}
 
1
+ {"mean_reward": 254.92429886034785, "std_reward": 20.945575573630375, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2022-12-07T11:21:20.862539"}