robert1003 commited on
Commit
271ebcd
1 Parent(s): 72e18be

Upload PPO LunarLander-v2 trained agent

Browse files
README.md CHANGED
@@ -10,7 +10,7 @@ model-index:
10
  results:
11
  - metrics:
12
  - type: mean_reward
13
- value: 268.88 +/- 16.34
14
  name: mean_reward
15
  task:
16
  type: reinforcement-learning
 
10
  results:
11
  - metrics:
12
  - type: mean_reward
13
+ value: 280.07 +/- 14.87
14
  name: mean_reward
15
  task:
16
  type: reinforcement-learning
config.json CHANGED
@@ -1 +1 @@
1
- {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param sde_net_arch: Network architecture for extracting features\n when using gSDE. If None, the latent features from the policy will be used.\n Pass an empty list to use the states as features.\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7fea4bce0310>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7fea4bce03a0>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7fea4bce0430>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7fea4bce04c0>", "_build": "<function ActorCriticPolicy._build at 0x7fea4bce0550>", "forward": "<function ActorCriticPolicy.forward at 0x7fea4bce05e0>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7fea4bce0670>", "_predict": "<function ActorCriticPolicy._predict at 0x7fea4bce0700>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7fea4bce0790>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7fea4bce0820>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7fea4bce08b0>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc_data object at 0x7fea4bcfa660>"}, "verbose": 1, "policy_kwargs": {}, "observation_space": {":type:": "<class 'gym.spaces.box.Box'>", ":serialized:": "gAWVpQEAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLCIWUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWIAAAAAAAAAAAAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/5RoC0sIhZSMAUOUdJRSlIwEaGlnaJRoEyiWIAAAAAAAAAAAAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAf5RoC0sIhZRoFnSUUpSMDWJvdW5kZWRfYmVsb3eUaBMolggAAAAAAAAAAAAAAAAAAACUaAiMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLCIWUaBZ0lFKUjA1ib3VuZGVkX2Fib3ZllGgTKJYIAAAAAAAAAAAAAAAAAAAAlGgiSwiFlGgWdJRSlIwKX25wX3JhbmRvbZROdWIu", "dtype": "float32", "_shape": [8], "low": "[-inf -inf -inf -inf -inf -inf -inf -inf]", "high": "[inf inf inf inf inf inf inf inf]", "bounded_below": "[False False False False False False False False]", "bounded_above": "[False False False False False False False False]", "_np_random": null}, "action_space": {":type:": "<class 'gym.spaces.discrete.Discrete'>", ":serialized:": "gAWViAAAAAAAAACME2d5bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpRLBIwGX3NoYXBllCmMBWR0eXBllIwFbnVtcHmUjAVkdHlwZZSTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYowKX25wX3JhbmRvbZROdWIu", "n": 4, "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 16, "num_timesteps": 2080000, "_total_timesteps": 5000000.0, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1652608229.6440349, "learning_rate": 0.0003, "tensorboard_log": "./logs", "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVlgIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwNX2J1aWx0aW5fdHlwZZSTlIwKTGFtYmRhVHlwZZSFlFKUKGgCjAhDb2RlVHlwZZSFlFKUKEsBSwBLAEsBSwFLE0MEiABTAJROhZQpjAFflIWUjGYvaG9tZS9yb2JlcnQxMDAzLy5weWVudi92ZXJzaW9ucy9kZWVwLXJsL2xpYi9weXRob24zLjgvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuAQwIAAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UaA11Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoF2gOjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoGIwHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/M6kqMFUyYYWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="}, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAALP7972BPn8/tGkKviawCb/+94a+qqhyPQAAAAAAAAAAzS8XveEQubrn0Qq2DRnFsIKXDLlgohk1AACAPwAAgD/m9Qy9L7QdPoL8Lz03tIq+U+UJPMpeCT4AAAAAAAAAAED4xj1q0/s+PXUmvsyZ174gVxC9Nt4IvgAAAAAAAAAAM8kAvnrPaT9SQaw9pc7nvspMsb2dFAA+AAAAAAAAAACaHo49E1iDP/rauD1+Ls++XKA3PpbORLsAAAAAAAAAAHPxzb3M+Jw+GhECP/uUN75wRHY+OP1mPgAAAAAAAAAAZro1vTanPbzqgI69VOREvBhWJj2IQm4+AACAPwAAgD+aW2w9n7fXuwiPxrx03P88AAw3Pfvc0r0AAIA/AACAP830J724cMa7b+KSPL8buzyoSK28sURIPAAAgD8AAIA/mksdvadTXT4Ki6O8I3h6vth1A777A3I9AAAAAAAAAACaj9e8VSEUPsgyt7tB0Ie+qPSsvAiP1zwAAAAAAAAAACD4RT4riXk/8vs/Ps6e374V7tg+Wb6ZvQAAAAAAAAAA4Ew2vkifdj/i5yQ9kSTnvkmcab6hXQ0+AAAAAAAAAACzYVW9vB6uPvJnLj4Jaoq+bg++PSiLhb0AAAAAAAAAALOjRT2/jU0+Sek+vgUCn74Wn/K9R4OsPAAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": 0.5871232, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVNxAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIkZkLXJ6FcECUhpRSlIwBbJRL3IwBdJRHQKIYWcd5prV1fZQoaAZoCWgPQwgKn62DQwRxQJSGlFKUaBVNDQFoFkdAohhxje9BbHV9lChoBmgJaA9DCPNUh9wM33JAlIaUUpRoFUvuaBZHQKIYdgKF7D51fZQoaAZoCWgPQwgRGOsbGLNvQJSGlFKUaBVL22gWR0CiGKbF0gbIdX2UKGgGaAloD0MIEcgljryIbkCUhpRSlGgVS+JoFkdAohltz+3pfXV9lChoBmgJaA9DCKVOQBNhcXFAlIaUUpRoFUvyaBZHQKIZkXVsk6d1fZQoaAZoCWgPQwhXe9gLxRBzQJSGlFKUaBVNAwFoFkdAohoIhje9BnV9lChoBmgJaA9DCPzkKEBUa3NAlIaUUpRoFUvvaBZHQKIa047Rv3t1fZQoaAZoCWgPQwhw6gPJO4ZyQJSGlFKUaBVL52gWR0CiGwNu+AVgdX2UKGgGaAloD0MIK6ORzys2cUCUhpRSlGgVS95oFkdAohsT6guh9XV9lChoBmgJaA9DCFfPSe+bN3FAlIaUUpRoFU1IAWgWR0CiGz+bmU4adX2UKGgGaAloD0MI8wLso5OwckCUhpRSlGgVS/ZoFkdAohuUQiA2AHV9lChoBmgJaA9DCEAwR4+fIXFAlIaUUpRoFUv/aBZHQKIbl/7SApd1fZQoaAZoCWgPQwhzY3rCEr9xQJSGlFKUaBVL6WgWR0CiG6o0hvBKdX2UKGgGaAloD0MIoUyjycUnckCUhpRSlGgVS9doFkdAohu+biIcinV9lChoBmgJaA9DCFde8j/5jnFAlIaUUpRoFUvfaBZHQKIbz6Skj5d1fZQoaAZoCWgPQwjQ1OsWQepwQJSGlFKUaBVL/mgWR0CiG8/jsD4hdX2UKGgGaAloD0MInwJgPIOBbkCUhpRSlGgVS/BoFkdAohvkDnvDxnV9lChoBmgJaA9DCFQ1QdT9u3BAlIaUUpRoFU0KAWgWR0CiHBX9aUzLdX2UKGgGaAloD0MIa7kzE8y/cECUhpRSlGgVS/VoFkdAohxAd2gWanV9lChoBmgJaA9DCHdpw2FpZm5AlIaUUpRoFUvsaBZHQKIcQ5avA451fZQoaAZoCWgPQwg6evzeJqBvQJSGlFKUaBVL9GgWR0CiHLla0QbudX2UKGgGaAloD0MIlrGhm72QcUCUhpRSlGgVS+BoFkdAoh2JDohY/3V9lChoBmgJaA9DCKG5TiOtb25AlIaUUpRoFU0CAWgWR0CiHdMtsenydX2UKGgGaAloD0MIX9ODglKTbkCUhpRSlGgVS/FoFkdAoh3aF/QSjHV9lChoBmgJaA9DCExxVdm3xXBAlIaUUpRoFUvraBZHQKId8OG0u151fZQoaAZoCWgPQwgmj6flB6JOQJSGlFKUaBVLmmgWR0CiHhL6UJOWdX2UKGgGaAloD0MI1Qj9TD1ccUCUhpRSlGgVS+toFkdAoh5KVD8cdnV9lChoBmgJaA9DCO9VKxP+pHBAlIaUUpRoFUvbaBZHQKIeb1MdtEZ1fZQoaAZoCWgPQwj1nPS+sZ1wQJSGlFKUaBVL7GgWR0CiHnlUQ04zdX2UKGgGaAloD0MIsACmDBx6ckCUhpRSlGgVS+1oFkdAoh6Pag261HV9lChoBmgJaA9DCCP1nsrp9nBAlIaUUpRoFU0BAWgWR0CiHo/LLZBcdX2UKGgGaAloD0MItD7lmOxJckCUhpRSlGgVTQEBaBZHQKIeovJRwZR1fZQoaAZoCWgPQwhfl+E/nSNzQJSGlFKUaBVL42gWR0CiHr4BmwqzdX2UKGgGaAloD0MID9b/OUxecUCUhpRSlGgVTSUBaBZHQKIfIIk7fYV1fZQoaAZoCWgPQwiqYir9BERyQJSGlFKUaBVL/mgWR0CiHzRBeHBUdX2UKGgGaAloD0MIs5quJ7ojckCUhpRSlGgVTRcBaBZHQKIqtSNwR5F1fZQoaAZoCWgPQwj9+bZgae1yQJSGlFKUaBVL7GgWR0CiKvyQgcLjdX2UKGgGaAloD0MIHM9nQL2bcECUhpRSlGgVS+ZoFkdAoiszRKHwgHV9lChoBmgJaA9DCA/Tvrm/s21AlIaUUpRoFUvsaBZHQKIrXqzqrzZ1fZQoaAZoCWgPQwg8o61KIk9uQJSGlFKUaBVL/mgWR0CiK309yLhrdX2UKGgGaAloD0MIshGI13VjcUCUhpRSlGgVS9JoFkdAoiuKSHM2WXV9lChoBmgJaA9DCKCH2jYMrnJAlIaUUpRoFUvRaBZHQKIrkHqu8sd1fZQoaAZoCWgPQwhffqfJDApzQJSGlFKUaBVL4mgWR0CiK5lEiMYNdX2UKGgGaAloD0MINe84RUfXbkCUhpRSlGgVTQgBaBZHQKIr07KaG6B1fZQoaAZoCWgPQwiLpUi+0iNxQJSGlFKUaBVNiwJoFkdAoivfUc4o7XV9lChoBmgJaA9DCBFSt7MvJXFAlIaUUpRoFUv6aBZHQKIsEEqUeMh1fZQoaAZoCWgPQwjfbd44qZ9wQJSGlFKUaBVNBwFoFkdAoiwx0Qsf73V9lChoBmgJaA9DCKvMlNZftXJAlIaUUpRoFU0VAWgWR0CiLGeOGTLXdX2UKGgGaAloD0MIVkW4yag/b0CUhpRSlGgVS+toFkdAoix5ul41P3V9lChoBmgJaA9DCGA6rdtgnnFAlIaUUpRoFU0VAWgWR0CiLING3F1kdX2UKGgGaAloD0MIA5ZcxWL/cECUhpRSlGgVTRABaBZHQKIs4f4h2W91fZQoaAZoCWgPQwi8ehUZXb5wQJSGlFKUaBVL+2gWR0CiLb6Xrt3OdX2UKGgGaAloD0MIzc03orvscUCUhpRSlGgVS99oFkdAoi3CdjG1hXV9lChoBmgJaA9DCACrI0f6XnJAlIaUUpRoFUvXaBZHQKIt2RgZ0jl1fZQoaAZoCWgPQwgTuHU3T+1wQJSGlFKUaBVNJAFoFkdAoi3+nyd4FHV9lChoBmgJaA9DCBsQIa6ckXNAlIaUUpRoFUvmaBZHQKIuAdnTRY11fZQoaAZoCWgPQwg74LpiRulyQJSGlFKUaBVLyWgWR0CiLgTnied1dX2UKGgGaAloD0MII0kQrkCFcUCUhpRSlGgVTQIBaBZHQKIuCBQvYe11fZQoaAZoCWgPQwh1r5P6MkRuQJSGlFKUaBVL8GgWR0CiLhFy7wrldX2UKGgGaAloD0MIRBg/jfu/ckCUhpRSlGgVS/9oFkdAoi5LTlT3qXV9lChoBmgJaA9DCKJinL8JC3FAlIaUUpRoFUvcaBZHQKIuZLFn7Hh1fZQoaAZoCWgPQwheE9IaA7huQJSGlFKUaBVNAwFoFkdAoi6KzkZJkHV9lChoBmgJaA9DCKLw2To4P3JAlIaUUpRoFUvkaBZHQKIumnb7CSB1fZQoaAZoCWgPQwh9rrZif45tQJSGlFKUaBVL4GgWR0CiLsdkz41xdX2UKGgGaAloD0MIcT0K16PlbUCUhpRSlGgVS+BoFkdAoi7huMuOCHV9lChoBmgJaA9DCDBkdaunHHBAlIaUUpRoFU0DAWgWR0CiLynmzSkTdX2UKGgGaAloD0MI98snK0ZackCUhpRSlGgVS9doFkdAoi8qEtdzGXV9lChoBmgJaA9DCN+pgHse+HBAlIaUUpRoFUvjaBZHQKIw8H446wN1fZQoaAZoCWgPQwhnuWx0TvFyQJSGlFKUaBVL4mgWR0CiMQaBZpztdX2UKGgGaAloD0MIjQqcbIMEbUCUhpRSlGgVS/ZoFkdAojEvJcPe6HV9lChoBmgJaA9DCHrhzoWRbXFAlIaUUpRoFUvmaBZHQKIxOIC2c8V1fZQoaAZoCWgPQwhslPWbSRpzQJSGlFKUaBVL5mgWR0CiMTufdyksdX2UKGgGaAloD0MItyVywVmockCUhpRSlGgVS+9oFkdAojFXlZHNHHV9lChoBmgJaA9DCMY1PpN9MW9AlIaUUpRoFUv6aBZHQKIxecinpB51fZQoaAZoCWgPQwjx8nSuaD9xQJSGlFKUaBVL32gWR0CiMZiQ1aW5dX2UKGgGaAloD0MI7UrLSL2ZcUCUhpRSlGgVTQMBaBZHQKIxnlS0jTt1fZQoaAZoCWgPQwi6ZvLNtvhuQJSGlFKUaBVL7GgWR0CiMaGViWmhdX2UKGgGaAloD0MIP1OvWwSicUCUhpRSlGgVS/loFkdAojJK11GLDXV9lChoBmgJaA9DCB1WuOUjn25AlIaUUpRoFUv1aBZHQKIyX73wkPd1fZQoaAZoCWgPQwgoucMmMrhuQJSGlFKUaBVNGgFoFkdAojJocDKYA3V9lChoBmgJaA9DCJZ5q67DH3BAlIaUUpRoFUvaaBZHQKIya5BkZrJ1fZQoaAZoCWgPQwiQuwhTlHNtQJSGlFKUaBVL5WgWR0CiMoamwaBJdX2UKGgGaAloD0MIzaylgLT7cECUhpRSlGgVTScBaBZHQKIylvbXYlJ1fZQoaAZoCWgPQwiZnxuacpBwQJSGlFKUaBVL5GgWR0CiM2UxM36zdX2UKGgGaAloD0MIX3tmSUBacECUhpRSlGgVS+hoFkdAojOGvGIbfnV9lChoBmgJaA9DCLka2ZWWeHFAlIaUUpRoFUvyaBZHQKIzzCzkZJl1fZQoaAZoCWgPQwgcCMkCJltxQJSGlFKUaBVL8GgWR0CiM8+RYA80dX2UKGgGaAloD0MIpd3oY36NcUCUhpRSlGgVS9hoFkdAojPyaPS2IHV9lChoBmgJaA9DCEp/L4UHWnNAlIaUUpRoFUvtaBZHQKI0CWRigCh1fZQoaAZoCWgPQwhVaYtrPClwQJSGlFKUaBVL4mgWR0CiNAmVRk3CdX2UKGgGaAloD0MIVDntKbkZckCUhpRSlGgVS/poFkdAojQMxCY1HnV9lChoBmgJaA9DCF1Q3zJnD3FAlIaUUpRoFU0rAWgWR0CiNHWWhRIjdX2UKGgGaAloD0MItr3dktyDcECUhpRSlGgVTQkBaBZHQKI0e37UG3Z1fZQoaAZoCWgPQwjh8IKIlEpyQJSGlFKUaBVL3GgWR0CiNKO+h4+sdX2UKGgGaAloD0MIj4mUZjN5cUCUhpRSlGgVS9RoFkdAojTbot+TeXV9lChoBmgJaA9DCL1tpkJ8G3BAlIaUUpRoFUv2aBZHQKI0+vt+kQB1fZQoaAZoCWgPQwjQtwVLde1vQJSGlFKUaBVL/GgWR0CiNRSl3yI6dX2UKGgGaAloD0MIqYdodIeMckCUhpRSlGgVTQIBaBZHQKI1IQlruYx1fZQoaAZoCWgPQwig3Lbv0dtyQJSGlFKUaBVNAgFoFkdAojU8ajvd/XVlLg=="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 504, "n_steps": 1024, "gamma": 0.999, "gae_lambda": 0.98, "ent_coef": 0.01, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 4, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWVlgIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwNX2J1aWx0aW5fdHlwZZSTlIwKTGFtYmRhVHlwZZSFlFKUKGgCjAhDb2RlVHlwZZSFlFKUKEsBSwBLAEsBSwFLE0MEiABTAJROhZQpjAFflIWUjGYvaG9tZS9yb2JlcnQxMDAzLy5weWVudi92ZXJzaW9ucy9kZWVwLXJsL2xpYi9weXRob24zLjgvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuAQwIAAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UaA11Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoF2gOjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoGIwHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/yZmZmZmZmoWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "system_info": {"OS": "Linux-5.4.0-109-generic-x86_64-with-glibc2.29 #123-Ubuntu SMP Fri Apr 8 09:10:54 UTC 2022", "Python": "3.8.11", "Stable-Baselines3": "1.5.0", "PyTorch": "1.11.0+cu102", "GPU Enabled": "True", "Numpy": "1.22.3", "Gym": "0.21.0"}}
 
1
+ {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param sde_net_arch: Network architecture for extracting features\n when using gSDE. If None, the latent features from the policy will be used.\n Pass an empty list to use the states as features.\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7feb678aa310>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7feb678aa3a0>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7feb678aa430>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7feb678aa4c0>", "_build": "<function ActorCriticPolicy._build at 0x7feb678aa550>", "forward": "<function ActorCriticPolicy.forward at 0x7feb678aa5e0>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7feb678aa670>", "_predict": "<function ActorCriticPolicy._predict at 0x7feb678aa700>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7feb678aa790>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7feb678aa820>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7feb678aa8b0>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc_data object at 0x7feb678b0660>"}, "verbose": 1, "policy_kwargs": {}, "observation_space": {":type:": "<class 'gym.spaces.box.Box'>", ":serialized:": "gAWVpQEAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLCIWUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWIAAAAAAAAAAAAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/5RoC0sIhZSMAUOUdJRSlIwEaGlnaJRoEyiWIAAAAAAAAAAAAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAf5RoC0sIhZRoFnSUUpSMDWJvdW5kZWRfYmVsb3eUaBMolggAAAAAAAAAAAAAAAAAAACUaAiMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLCIWUaBZ0lFKUjA1ib3VuZGVkX2Fib3ZllGgTKJYIAAAAAAAAAAAAAAAAAAAAlGgiSwiFlGgWdJRSlIwKX25wX3JhbmRvbZROdWIu", "dtype": "float32", "_shape": [8], "low": "[-inf -inf -inf -inf -inf -inf -inf -inf]", "high": "[inf inf inf inf inf inf inf inf]", "bounded_below": "[False False False False False False False False]", "bounded_above": "[False False False False False False False False]", "_np_random": null}, "action_space": {":type:": "<class 'gym.spaces.discrete.Discrete'>", ":serialized:": "gAWViAAAAAAAAACME2d5bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpRLBIwGX3NoYXBllCmMBWR0eXBllIwFbnVtcHmUjAVkdHlwZZSTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYowKX25wX3JhbmRvbZROdWIu", "n": 4, "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 16, "num_timesteps": 5013504, "_total_timesteps": 5000000.0, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1652608229.6440349, "learning_rate": 0.0003, "tensorboard_log": "./logs", "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVlgIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwNX2J1aWx0aW5fdHlwZZSTlIwKTGFtYmRhVHlwZZSFlFKUKGgCjAhDb2RlVHlwZZSFlFKUKEsBSwBLAEsBSwFLE0MEiABTAJROhZQpjAFflIWUjGYvaG9tZS9yb2JlcnQxMDAzLy5weWVudi92ZXJzaW9ucy9kZWVwLXJsL2xpYi9weXRob24zLjgvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuAQwIAAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UaA11Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoF2gOjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoGIwHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/M6kqMFUyYYWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="}, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAADMFF7x6+rY/yUGZvvlhfz57zZw7NTvhuwAAAAAAAAAAmj1tvaoGMz7e9ws+S4HGvqDKKL1A2Io9AAAAAAAAAAC6uQ4+NtiOP5gILT4G4iu/GPd3Pq3Eyz0AAAAAAAAAAEBMsD14a6c/dee+Pp2x+L7Uxeg9nsJvPgAAAAAAAAAAAFYwvEiqqT8ahIS9MornvhQ/nLwxIMS9AAAAAAAAAABmfgC8rn2HusLfyzOQSa4vR1Qtur5lw7MAAIA/AACAP/q5Wb60gUg+gh/8Pg9ll76Hu4+9AR+pPgAAAAAAAAAAzTnyPAgI5D2VkFG+9FvDvpEND74hDzG9AAAAAAAAAABmpru8LjvhPYK3sbyEA72+8yACvvMhfbwAAAAAAAAAAOYKsL16hJ0/8wK7vt4mJb9gXy6+kvBlvgAAAAAAAAAADe7+PSn8Ezs0GRQ7mTfTNunaxjz+uGC6AAAAAAAAAACA+1c99tB3upaahTuxh0E38zolO8WhMTYAAAAAAAAAAFrkuz0C5+8+pg3NvbyVAr8iXIs9fxLGvQAAAAAAAAAAZmaZOFzisT5ilK291/wGv+dij712Vbq9AAAAAAAAAABmxHI80i6YuygsWTt6+Yc8T1XePPBsaL0AAIA/AACAPzN0vryDJwg9LU7RPiG8Vr4vDjY+McEAPgAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.0027007999999999477, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVHRAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIz/dT4+WBckCUhpRSlIwBbJRLsIwBdJRHQLIeStknTiN1fZQoaAZoCWgPQwjTTs3lBnRwQJSGlFKUaBVLyWgWR0CyHmBigCfZdX2UKGgGaAloD0MIG/Sltz9RckCUhpRSlGgVS6toFkdAsh59edCmdnV9lChoBmgJaA9DCCyeeqRBpnBAlIaUUpRoFUvFaBZHQLIeinmJWNp1fZQoaAZoCWgPQwicGf1ouNRzQJSGlFKUaBVL3GgWR0CyHov16E8JdX2UKGgGaAloD0MIhQfNrvvDcUCUhpRSlGgVS7JoFkdAsh6QF1SwW3V9lChoBmgJaA9DCHHMsicB83FAlIaUUpRoFUvRaBZHQLIelf2K2rp1fZQoaAZoCWgPQwh8mShCKjNxQJSGlFKUaBVL1mgWR0CyHqwrYoRadX2UKGgGaAloD0MIlxsMdZj0cUCUhpRSlGgVS8toFkdAsh60/2TPjXV9lChoBmgJaA9DCMFUM2spxG9AlIaUUpRoFUu5aBZHQLIeuMsYl6Z1fZQoaAZoCWgPQwjLoNrgxHtwQJSGlFKUaBVLr2gWR0CyHuRx1gYxdX2UKGgGaAloD0MI/Bu0V98acECUhpRSlGgVS71oFkdAsh7m7btZ3nV9lChoBmgJaA9DCJCjObKylHBAlIaUUpRoFUvSaBZHQLIe7/n4fwJ1fZQoaAZoCWgPQwgcDHVY4QVzQJSGlFKUaBVLxGgWR0CyHwanrIHUdX2UKGgGaAloD0MIX9BCAkZncUCUhpRSlGgVS8NoFkdAsh8K5Fw1i3V9lChoBmgJaA9DCIC6gQIv+HJAlIaUUpRoFUvUaBZHQLIfIGMGX5Z1fZQoaAZoCWgPQwjxDYXPlrtzQJSGlFKUaBVL+WgWR0CyHyJokAxSdX2UKGgGaAloD0MI41KVtjjNcUCUhpRSlGgVS8xoFkdAsh8wvalDW3V9lChoBmgJaA9DCBe2ZivvcnBAlIaUUpRoFUvGaBZHQLIfSRTS9dx1fZQoaAZoCWgPQwhI+Um1j+FyQJSGlFKUaBVL02gWR0CyJ6TcqOLjdX2UKGgGaAloD0MIp1oLs5CscECUhpRSlGgVS6toFkdAsienVkMCtHV9lChoBmgJaA9DCDV6NUCprnFAlIaUUpRoFUvVaBZHQLInq/NZ/1B1fZQoaAZoCWgPQwjcKR2svy1yQJSGlFKUaBVL3mgWR0CyJ7y1JDmbdX2UKGgGaAloD0MI+RBUjd7wckCUhpRSlGgVS+xoFkdAsifAqXnhbXV9lChoBmgJaA9DCNtQMc4fwnJAlIaUUpRoFUvBaBZHQLInxMEzO5d1fZQoaAZoCWgPQwgBiSZQBB1wQJSGlFKUaBVL22gWR0CyJ9I9X9zfdX2UKGgGaAloD0MI6ndhazb2ckCUhpRSlGgVS7poFkdAsifsQxveg3V9lChoBmgJaA9DCILJjSLr53NAlIaUUpRoFUvBaBZHQLIoAd07r9l1fZQoaAZoCWgPQwg3OXzSSYNyQJSGlFKUaBVLsGgWR0CyKAm29crzdX2UKGgGaAloD0MIAmGnWLWRb0CUhpRSlGgVS7poFkdAsigZnOB193V9lChoBmgJaA9DCA1RhT8DzXNAlIaUUpRoFUviaBZHQLIoHcFQl8h1fZQoaAZoCWgPQwieKAmJtMlzQJSGlFKUaBVLxmgWR0CyKD4+0PYndX2UKGgGaAloD0MIY7ZkVYRTb0CUhpRSlGgVS7loFkdAsig/giu+y3V9lChoBmgJaA9DCF36l6Ty53JAlIaUUpRoFUvRaBZHQLIoR/QBxPx1fZQoaAZoCWgPQwgAVkeOdHNvQJSGlFKUaBVLt2gWR0CyKFYUnG83dX2UKGgGaAloD0MIEywOZ/6TcUCUhpRSlGgVS7NoFkdAsihyiEg4fnV9lChoBmgJaA9DCK7X9KBgtHBAlIaUUpRoFUu6aBZHQLIoc606YE51fZQoaAZoCWgPQwgrhUAuMXBxQJSGlFKUaBVLs2gWR0CyKIHDrJKbdX2UKGgGaAloD0MIH4Kq0atjc0CUhpRSlGgVS7VoFkdAsiiLy9VWCHV9lChoBmgJaA9DCJHUQsnk5HFAlIaUUpRoFUvYaBZHQLIolWAwwkB1fZQoaAZoCWgPQwihavRqAMRyQJSGlFKUaBVLx2gWR0CyKKzEaVD8dX2UKGgGaAloD0MItyqJ7EMJckCUhpRSlGgVS+toFkdAsijBrbg0j3V9lChoBmgJaA9DCF6ezhWl2nJAlIaUUpRoFUvBaBZHQLIo1287IT51fZQoaAZoCWgPQwjcKR2sP9lyQJSGlFKUaBVLz2gWR0CyKOG8ujASdX2UKGgGaAloD0MIYmpLHeQCckCUhpRSlGgVS+BoFkdAsijj0voNeHV9lChoBmgJaA9DCF4robskSXBAlIaUUpRoFUvFaBZHQLIo6wX668R1fZQoaAZoCWgPQwj9a3nl+jdwQJSGlFKUaBVLtWgWR0CyKP98eCCjdX2UKGgGaAloD0MIBoIAGTqdc0CUhpRSlGgVS+toFkdAsikY6BAfMnV9lChoBmgJaA9DCBXI7Cy6/3JAlIaUUpRoFUvNaBZHQLIpG0ygwoN1fZQoaAZoCWgPQwjzAYHO5JZzQJSGlFKUaBVLzGgWR0CyKSLXlKbsdX2UKGgGaAloD0MIfcucLoupcUCUhpRSlGgVS8FoFkdAsikksUZeiXV9lChoBmgJaA9DCKIo0CdylXFAlIaUUpRoFUvGaBZHQLIpSXLNfPZ1fZQoaAZoCWgPQwhXIeUnVQJxQJSGlFKUaBVLrWgWR0CyKVJf2K2sdX2UKGgGaAloD0MIWWyTikasc0CUhpRSlGgVS9ZoFkdAsilcKqn3tnV9lChoBmgJaA9DCLABEeIK3XBAlIaUUpRoFUvCaBZHQLIpX01IiC91fZQoaAZoCWgPQwgw9l580XpzQJSGlFKUaBVL02gWR0CyKWdsFdLQdX2UKGgGaAloD0MIxVimX+LacECUhpRSlGgVS7hoFkdAsilzp3X7L3V9lChoBmgJaA9DCMUB9Pt+DnRAlIaUUpRoFUvDaBZHQLIpkK0UoKF1fZQoaAZoCWgPQwg7U+i8RopyQJSGlFKUaBVLxGgWR0CyKbEZR8+idX2UKGgGaAloD0MI4LvNG6ebckCUhpRSlGgVS9FoFkdAsim2R/3Fk3V9lChoBmgJaA9DCMh4lEo4DnFAlIaUUpRoFUu3aBZHQLIpwnXumaZ1fZQoaAZoCWgPQwihavRqAKJxQJSGlFKUaBVL2mgWR0CyKcxrJr+HdX2UKGgGaAloD0MIUtUEUXcOcUCUhpRSlGgVS9ZoFkdAsinP0XgtOHV9lChoBmgJaA9DCNkkP+LXRnBAlIaUUpRoFUu4aBZHQLIp3cG1QZZ1fZQoaAZoCWgPQwg9X7NcNg1xQJSGlFKUaBVLy2gWR0CyKft4VymzdX2UKGgGaAloD0MI8Z9uoMDzb0CUhpRSlGgVS89oFkdAsin+B06o2nV9lChoBmgJaA9DCKfJjLeV/nBAlIaUUpRoFUvEaBZHQLIqFw/PgNx1fZQoaAZoCWgPQwhLWvENhXdxQJSGlFKUaBVLt2gWR0CyKhtUbT+edX2UKGgGaAloD0MIavmBqzz1cUCUhpRSlGgVS7FoFkdAsiog6Kcd53V9lChoBmgJaA9DCPGD86ljGXBAlIaUUpRoFUu6aBZHQLIqIdKNAC51fZQoaAZoCWgPQwgSTaCIRS1xQJSGlFKUaBVLzmgWR0CyKimdupCKdX2UKGgGaAloD0MIA+55/vR/cUCUhpRSlGgVS71oFkdAsio5deIEbHV9lChoBmgJaA9DCHeBkgJLenFAlIaUUpRoFUu4aBZHQLIqVA3kxRF1fZQoaAZoCWgPQwgtmPijaIhzQJSGlFKUaBVLz2gWR0CyKpnEyckMdX2UKGgGaAloD0MIzM8NTRkvcECUhpRSlGgVS75oFkdAsiqi4nWrfnV9lChoBmgJaA9DCJm8AWb+DHJAlIaUUpRoFUuvaBZHQLIqpW5H3Dh1fZQoaAZoCWgPQwgh6dMqOilzQJSGlFKUaBVL12gWR0CyKqj/+85CdX2UKGgGaAloD0MIuQA0ShdgcUCUhpRSlGgVS8loFkdAsiqyw7kn1HV9lChoBmgJaA9DCNQQVfjz43FAlIaUUpRoFUujaBZHQLIqtu/k/8l1fZQoaAZoCWgPQwgrobskjkhzQJSGlFKUaBVL4mgWR0CyKsDrRjSYdX2UKGgGaAloD0MI7Zv7q8eFcUCUhpRSlGgVS61oFkdAsitW8jAzpHV9lChoBmgJaA9DCELpCyFnv3FAlIaUUpRoFUvVaBZHQLIrapwCKaZ1fZQoaAZoCWgPQwjQm4pU2KJwQJSGlFKUaBVLtmgWR0CyK3edwvQGdX2UKGgGaAloD0MIo68gzdj9cECUhpRSlGgVS9RoFkdAsiuFsnAqNXV9lChoBmgJaA9DCKfK94zEc3BAlIaUUpRoFUvLaBZHQLIrha9K28Z1fZQoaAZoCWgPQwjMJVXbzUxyQJSGlFKUaBVL3GgWR0CyK5kliSaFdX2UKGgGaAloD0MImIdM+RBjc0CUhpRSlGgVS8toFkdAsiug5aNdaHV9lChoBmgJaA9DCF653jaTz3JAlIaUUpRoFUvOaBZHQLIrvxeLNwB1fZQoaAZoCWgPQwgs2EY82UBwQJSGlFKUaBVLwmgWR0CyK/o8yN4rdX2UKGgGaAloD0MIVACMZ5CwcUCUhpRSlGgVS8FoFkdAsiv/xSYPXnV9lChoBmgJaA9DCCFaK9pcrnBAlIaUUpRoFUvOaBZHQLIsAU7CBPN1fZQoaAZoCWgPQwgWURN9Pp1wQJSGlFKUaBVLtmgWR0CyLAJ3LV4HdX2UKGgGaAloD0MISx+6oD7EcUCUhpRSlGgVS9loFkdAsiwY3FUADXV9lChoBmgJaA9DCNuJkpBIB05AlIaUUpRoFUubaBZHQLIsIA3T/hl1fZQoaAZoCWgPQwiKWS+GsoZwQJSGlFKUaBVLxmgWR0CyLCAk1MufdX2UKGgGaAloD0MISgfr/xxBcUCUhpRSlGgVS9JoFkdAsixS+pOvdXV9lChoBmgJaA9DCD3TS4wlTXJAlIaUUpRoFUu6aBZHQLIseUiY9gZ1fZQoaAZoCWgPQwjvAbovJ+xzQJSGlFKUaBVL2WgWR0CyLHrksBhhdX2UKGgGaAloD0MIOC7jpoZWcECUhpRSlGgVS7xoFkdAsiyE+wC8vnV9lChoBmgJaA9DCEpFY+0vY3FAlIaUUpRoFUvfaBZHQLIskjhUBGR1ZS4="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 1224, "n_steps": 1024, "gamma": 0.999, "gae_lambda": 0.98, "ent_coef": 0.01, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 4, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWVlgIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwNX2J1aWx0aW5fdHlwZZSTlIwKTGFtYmRhVHlwZZSFlFKUKGgCjAhDb2RlVHlwZZSFlFKUKEsBSwBLAEsBSwFLE0MEiABTAJROhZQpjAFflIWUjGYvaG9tZS9yb2JlcnQxMDAzLy5weWVudi92ZXJzaW9ucy9kZWVwLXJsL2xpYi9weXRob24zLjgvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuAQwIAAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UaA11Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoF2gOjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoGIwHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/yZmZmZmZmoWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "system_info": {"OS": "Linux-5.4.0-109-generic-x86_64-with-glibc2.29 #123-Ubuntu SMP Fri Apr 8 09:10:54 UTC 2022", "Python": "3.8.11", "Stable-Baselines3": "1.5.0", "PyTorch": "1.11.0+cu102", "GPU Enabled": "True", "Numpy": "1.22.3", "Gym": "0.21.0"}}
ppo-LunarLander-v2.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:939d324d7a2b8f44f5a38af53011f5af7b91f0cf611a960f87ab1cb33055190e
3
- size 143931
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:07cef63b4af7a6729e19641af74150182518ccba3a36bccf163a33965a18b985
3
+ size 143909
ppo-LunarLander-v2/data CHANGED
@@ -4,19 +4,19 @@
4
  ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
5
  "__module__": "stable_baselines3.common.policies",
6
  "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param sde_net_arch: Network architecture for extracting features\n when using gSDE. If None, the latent features from the policy will be used.\n Pass an empty list to use the states as features.\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
7
- "__init__": "<function ActorCriticPolicy.__init__ at 0x7fea4bce0310>",
8
- "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7fea4bce03a0>",
9
- "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7fea4bce0430>",
10
- "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7fea4bce04c0>",
11
- "_build": "<function ActorCriticPolicy._build at 0x7fea4bce0550>",
12
- "forward": "<function ActorCriticPolicy.forward at 0x7fea4bce05e0>",
13
- "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7fea4bce0670>",
14
- "_predict": "<function ActorCriticPolicy._predict at 0x7fea4bce0700>",
15
- "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7fea4bce0790>",
16
- "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7fea4bce0820>",
17
- "predict_values": "<function ActorCriticPolicy.predict_values at 0x7fea4bce08b0>",
18
  "__abstractmethods__": "frozenset()",
19
- "_abc_impl": "<_abc_data object at 0x7fea4bcfa660>"
20
  },
21
  "verbose": 1,
22
  "policy_kwargs": {},
@@ -42,7 +42,7 @@
42
  "_np_random": null
43
  },
44
  "n_envs": 16,
45
- "num_timesteps": 2080000,
46
  "_total_timesteps": 5000000.0,
47
  "_num_timesteps_at_start": 0,
48
  "seed": null,
@@ -56,7 +56,7 @@
56
  },
57
  "_last_obs": {
58
  ":type:": "<class 'numpy.ndarray'>",
59
- ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAALP7972BPn8/tGkKviawCb/+94a+qqhyPQAAAAAAAAAAzS8XveEQubrn0Qq2DRnFsIKXDLlgohk1AACAPwAAgD/m9Qy9L7QdPoL8Lz03tIq+U+UJPMpeCT4AAAAAAAAAAED4xj1q0/s+PXUmvsyZ174gVxC9Nt4IvgAAAAAAAAAAM8kAvnrPaT9SQaw9pc7nvspMsb2dFAA+AAAAAAAAAACaHo49E1iDP/rauD1+Ls++XKA3PpbORLsAAAAAAAAAAHPxzb3M+Jw+GhECP/uUN75wRHY+OP1mPgAAAAAAAAAAZro1vTanPbzqgI69VOREvBhWJj2IQm4+AACAPwAAgD+aW2w9n7fXuwiPxrx03P88AAw3Pfvc0r0AAIA/AACAP830J724cMa7b+KSPL8buzyoSK28sURIPAAAgD8AAIA/mksdvadTXT4Ki6O8I3h6vth1A777A3I9AAAAAAAAAACaj9e8VSEUPsgyt7tB0Ie+qPSsvAiP1zwAAAAAAAAAACD4RT4riXk/8vs/Ps6e374V7tg+Wb6ZvQAAAAAAAAAA4Ew2vkifdj/i5yQ9kSTnvkmcab6hXQ0+AAAAAAAAAACzYVW9vB6uPvJnLj4Jaoq+bg++PSiLhb0AAAAAAAAAALOjRT2/jU0+Sek+vgUCn74Wn/K9R4OsPAAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="
60
  },
61
  "_last_episode_starts": {
62
  ":type:": "<class 'numpy.ndarray'>",
@@ -66,16 +66,16 @@
66
  "_episode_num": 0,
67
  "use_sde": false,
68
  "sde_sample_freq": -1,
69
- "_current_progress_remaining": 0.5871232,
70
  "ep_info_buffer": {
71
  ":type:": "<class 'collections.deque'>",
72
- ":serialized:": "gAWVNxAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIkZkLXJ6FcECUhpRSlIwBbJRL3IwBdJRHQKIYWcd5prV1fZQoaAZoCWgPQwgKn62DQwRxQJSGlFKUaBVNDQFoFkdAohhxje9BbHV9lChoBmgJaA9DCPNUh9wM33JAlIaUUpRoFUvuaBZHQKIYdgKF7D51fZQoaAZoCWgPQwgRGOsbGLNvQJSGlFKUaBVL22gWR0CiGKbF0gbIdX2UKGgGaAloD0MIEcgljryIbkCUhpRSlGgVS+JoFkdAohltz+3pfXV9lChoBmgJaA9DCKVOQBNhcXFAlIaUUpRoFUvyaBZHQKIZkXVsk6d1fZQoaAZoCWgPQwhXe9gLxRBzQJSGlFKUaBVNAwFoFkdAohoIhje9BnV9lChoBmgJaA9DCPzkKEBUa3NAlIaUUpRoFUvvaBZHQKIa047Rv3t1fZQoaAZoCWgPQwhw6gPJO4ZyQJSGlFKUaBVL52gWR0CiGwNu+AVgdX2UKGgGaAloD0MIK6ORzys2cUCUhpRSlGgVS95oFkdAohsT6guh9XV9lChoBmgJaA9DCFfPSe+bN3FAlIaUUpRoFU1IAWgWR0CiGz+bmU4adX2UKGgGaAloD0MI8wLso5OwckCUhpRSlGgVS/ZoFkdAohuUQiA2AHV9lChoBmgJaA9DCEAwR4+fIXFAlIaUUpRoFUv/aBZHQKIbl/7SApd1fZQoaAZoCWgPQwhzY3rCEr9xQJSGlFKUaBVL6WgWR0CiG6o0hvBKdX2UKGgGaAloD0MIoUyjycUnckCUhpRSlGgVS9doFkdAohu+biIcinV9lChoBmgJaA9DCFde8j/5jnFAlIaUUpRoFUvfaBZHQKIbz6Skj5d1fZQoaAZoCWgPQwjQ1OsWQepwQJSGlFKUaBVL/mgWR0CiG8/jsD4hdX2UKGgGaAloD0MInwJgPIOBbkCUhpRSlGgVS/BoFkdAohvkDnvDxnV9lChoBmgJaA9DCFQ1QdT9u3BAlIaUUpRoFU0KAWgWR0CiHBX9aUzLdX2UKGgGaAloD0MIa7kzE8y/cECUhpRSlGgVS/VoFkdAohxAd2gWanV9lChoBmgJaA9DCHdpw2FpZm5AlIaUUpRoFUvsaBZHQKIcQ5avA451fZQoaAZoCWgPQwg6evzeJqBvQJSGlFKUaBVL9GgWR0CiHLla0QbudX2UKGgGaAloD0MIlrGhm72QcUCUhpRSlGgVS+BoFkdAoh2JDohY/3V9lChoBmgJaA9DCKG5TiOtb25AlIaUUpRoFU0CAWgWR0CiHdMtsenydX2UKGgGaAloD0MIX9ODglKTbkCUhpRSlGgVS/FoFkdAoh3aF/QSjHV9lChoBmgJaA9DCExxVdm3xXBAlIaUUpRoFUvraBZHQKId8OG0u151fZQoaAZoCWgPQwgmj6flB6JOQJSGlFKUaBVLmmgWR0CiHhL6UJOWdX2UKGgGaAloD0MI1Qj9TD1ccUCUhpRSlGgVS+toFkdAoh5KVD8cdnV9lChoBmgJaA9DCO9VKxP+pHBAlIaUUpRoFUvbaBZHQKIeb1MdtEZ1fZQoaAZoCWgPQwj1nPS+sZ1wQJSGlFKUaBVL7GgWR0CiHnlUQ04zdX2UKGgGaAloD0MIsACmDBx6ckCUhpRSlGgVS+1oFkdAoh6Pag261HV9lChoBmgJaA9DCCP1nsrp9nBAlIaUUpRoFU0BAWgWR0CiHo/LLZBcdX2UKGgGaAloD0MItD7lmOxJckCUhpRSlGgVTQEBaBZHQKIeovJRwZR1fZQoaAZoCWgPQwhfl+E/nSNzQJSGlFKUaBVL42gWR0CiHr4BmwqzdX2UKGgGaAloD0MID9b/OUxecUCUhpRSlGgVTSUBaBZHQKIfIIk7fYV1fZQoaAZoCWgPQwiqYir9BERyQJSGlFKUaBVL/mgWR0CiHzRBeHBUdX2UKGgGaAloD0MIs5quJ7ojckCUhpRSlGgVTRcBaBZHQKIqtSNwR5F1fZQoaAZoCWgPQwj9+bZgae1yQJSGlFKUaBVL7GgWR0CiKvyQgcLjdX2UKGgGaAloD0MIHM9nQL2bcECUhpRSlGgVS+ZoFkdAoiszRKHwgHV9lChoBmgJaA9DCA/Tvrm/s21AlIaUUpRoFUvsaBZHQKIrXqzqrzZ1fZQoaAZoCWgPQwg8o61KIk9uQJSGlFKUaBVL/mgWR0CiK309yLhrdX2UKGgGaAloD0MIshGI13VjcUCUhpRSlGgVS9JoFkdAoiuKSHM2WXV9lChoBmgJaA9DCKCH2jYMrnJAlIaUUpRoFUvRaBZHQKIrkHqu8sd1fZQoaAZoCWgPQwhffqfJDApzQJSGlFKUaBVL4mgWR0CiK5lEiMYNdX2UKGgGaAloD0MINe84RUfXbkCUhpRSlGgVTQgBaBZHQKIr07KaG6B1fZQoaAZoCWgPQwiLpUi+0iNxQJSGlFKUaBVNiwJoFkdAoivfUc4o7XV9lChoBmgJaA9DCBFSt7MvJXFAlIaUUpRoFUv6aBZHQKIsEEqUeMh1fZQoaAZoCWgPQwjfbd44qZ9wQJSGlFKUaBVNBwFoFkdAoiwx0Qsf73V9lChoBmgJaA9DCKvMlNZftXJAlIaUUpRoFU0VAWgWR0CiLGeOGTLXdX2UKGgGaAloD0MIVkW4yag/b0CUhpRSlGgVS+toFkdAoix5ul41P3V9lChoBmgJaA9DCGA6rdtgnnFAlIaUUpRoFU0VAWgWR0CiLING3F1kdX2UKGgGaAloD0MIA5ZcxWL/cECUhpRSlGgVTRABaBZHQKIs4f4h2W91fZQoaAZoCWgPQwi8ehUZXb5wQJSGlFKUaBVL+2gWR0CiLb6Xrt3OdX2UKGgGaAloD0MIzc03orvscUCUhpRSlGgVS99oFkdAoi3CdjG1hXV9lChoBmgJaA9DCACrI0f6XnJAlIaUUpRoFUvXaBZHQKIt2RgZ0jl1fZQoaAZoCWgPQwgTuHU3T+1wQJSGlFKUaBVNJAFoFkdAoi3+nyd4FHV9lChoBmgJaA9DCBsQIa6ckXNAlIaUUpRoFUvmaBZHQKIuAdnTRY11fZQoaAZoCWgPQwg74LpiRulyQJSGlFKUaBVLyWgWR0CiLgTnied1dX2UKGgGaAloD0MII0kQrkCFcUCUhpRSlGgVTQIBaBZHQKIuCBQvYe11fZQoaAZoCWgPQwh1r5P6MkRuQJSGlFKUaBVL8GgWR0CiLhFy7wrldX2UKGgGaAloD0MIRBg/jfu/ckCUhpRSlGgVS/9oFkdAoi5LTlT3qXV9lChoBmgJaA9DCKJinL8JC3FAlIaUUpRoFUvcaBZHQKIuZLFn7Hh1fZQoaAZoCWgPQwheE9IaA7huQJSGlFKUaBVNAwFoFkdAoi6KzkZJkHV9lChoBmgJaA9DCKLw2To4P3JAlIaUUpRoFUvkaBZHQKIumnb7CSB1fZQoaAZoCWgPQwh9rrZif45tQJSGlFKUaBVL4GgWR0CiLsdkz41xdX2UKGgGaAloD0MIcT0K16PlbUCUhpRSlGgVS+BoFkdAoi7huMuOCHV9lChoBmgJaA9DCDBkdaunHHBAlIaUUpRoFU0DAWgWR0CiLynmzSkTdX2UKGgGaAloD0MI98snK0ZackCUhpRSlGgVS9doFkdAoi8qEtdzGXV9lChoBmgJaA9DCN+pgHse+HBAlIaUUpRoFUvjaBZHQKIw8H446wN1fZQoaAZoCWgPQwhnuWx0TvFyQJSGlFKUaBVL4mgWR0CiMQaBZpztdX2UKGgGaAloD0MIjQqcbIMEbUCUhpRSlGgVS/ZoFkdAojEvJcPe6HV9lChoBmgJaA9DCHrhzoWRbXFAlIaUUpRoFUvmaBZHQKIxOIC2c8V1fZQoaAZoCWgPQwhslPWbSRpzQJSGlFKUaBVL5mgWR0CiMTufdyksdX2UKGgGaAloD0MItyVywVmockCUhpRSlGgVS+9oFkdAojFXlZHNHHV9lChoBmgJaA9DCMY1PpN9MW9AlIaUUpRoFUv6aBZHQKIxecinpB51fZQoaAZoCWgPQwjx8nSuaD9xQJSGlFKUaBVL32gWR0CiMZiQ1aW5dX2UKGgGaAloD0MI7UrLSL2ZcUCUhpRSlGgVTQMBaBZHQKIxnlS0jTt1fZQoaAZoCWgPQwi6ZvLNtvhuQJSGlFKUaBVL7GgWR0CiMaGViWmhdX2UKGgGaAloD0MIP1OvWwSicUCUhpRSlGgVS/loFkdAojJK11GLDXV9lChoBmgJaA9DCB1WuOUjn25AlIaUUpRoFUv1aBZHQKIyX73wkPd1fZQoaAZoCWgPQwgoucMmMrhuQJSGlFKUaBVNGgFoFkdAojJocDKYA3V9lChoBmgJaA9DCJZ5q67DH3BAlIaUUpRoFUvaaBZHQKIya5BkZrJ1fZQoaAZoCWgPQwiQuwhTlHNtQJSGlFKUaBVL5WgWR0CiMoamwaBJdX2UKGgGaAloD0MIzaylgLT7cECUhpRSlGgVTScBaBZHQKIylvbXYlJ1fZQoaAZoCWgPQwiZnxuacpBwQJSGlFKUaBVL5GgWR0CiM2UxM36zdX2UKGgGaAloD0MIX3tmSUBacECUhpRSlGgVS+hoFkdAojOGvGIbfnV9lChoBmgJaA9DCLka2ZWWeHFAlIaUUpRoFUvyaBZHQKIzzCzkZJl1fZQoaAZoCWgPQwgcCMkCJltxQJSGlFKUaBVL8GgWR0CiM8+RYA80dX2UKGgGaAloD0MIpd3oY36NcUCUhpRSlGgVS9hoFkdAojPyaPS2IHV9lChoBmgJaA9DCEp/L4UHWnNAlIaUUpRoFUvtaBZHQKI0CWRigCh1fZQoaAZoCWgPQwhVaYtrPClwQJSGlFKUaBVL4mgWR0CiNAmVRk3CdX2UKGgGaAloD0MIVDntKbkZckCUhpRSlGgVS/poFkdAojQMxCY1HnV9lChoBmgJaA9DCF1Q3zJnD3FAlIaUUpRoFU0rAWgWR0CiNHWWhRIjdX2UKGgGaAloD0MItr3dktyDcECUhpRSlGgVTQkBaBZHQKI0e37UG3Z1fZQoaAZoCWgPQwjh8IKIlEpyQJSGlFKUaBVL3GgWR0CiNKO+h4+sdX2UKGgGaAloD0MIj4mUZjN5cUCUhpRSlGgVS9RoFkdAojTbot+TeXV9lChoBmgJaA9DCL1tpkJ8G3BAlIaUUpRoFUv2aBZHQKI0+vt+kQB1fZQoaAZoCWgPQwjQtwVLde1vQJSGlFKUaBVL/GgWR0CiNRSl3yI6dX2UKGgGaAloD0MIqYdodIeMckCUhpRSlGgVTQIBaBZHQKI1IQlruYx1fZQoaAZoCWgPQwig3Lbv0dtyQJSGlFKUaBVNAgFoFkdAojU8ajvd/XVlLg=="
73
  },
74
  "ep_success_buffer": {
75
  ":type:": "<class 'collections.deque'>",
76
  ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
77
  },
78
- "_n_updates": 504,
79
  "n_steps": 1024,
80
  "gamma": 0.999,
81
  "gae_lambda": 0.98,
 
4
  ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
5
  "__module__": "stable_baselines3.common.policies",
6
  "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param sde_net_arch: Network architecture for extracting features\n when using gSDE. If None, the latent features from the policy will be used.\n Pass an empty list to use the states as features.\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
7
+ "__init__": "<function ActorCriticPolicy.__init__ at 0x7feb678aa310>",
8
+ "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7feb678aa3a0>",
9
+ "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7feb678aa430>",
10
+ "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7feb678aa4c0>",
11
+ "_build": "<function ActorCriticPolicy._build at 0x7feb678aa550>",
12
+ "forward": "<function ActorCriticPolicy.forward at 0x7feb678aa5e0>",
13
+ "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7feb678aa670>",
14
+ "_predict": "<function ActorCriticPolicy._predict at 0x7feb678aa700>",
15
+ "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7feb678aa790>",
16
+ "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7feb678aa820>",
17
+ "predict_values": "<function ActorCriticPolicy.predict_values at 0x7feb678aa8b0>",
18
  "__abstractmethods__": "frozenset()",
19
+ "_abc_impl": "<_abc_data object at 0x7feb678b0660>"
20
  },
21
  "verbose": 1,
22
  "policy_kwargs": {},
 
42
  "_np_random": null
43
  },
44
  "n_envs": 16,
45
+ "num_timesteps": 5013504,
46
  "_total_timesteps": 5000000.0,
47
  "_num_timesteps_at_start": 0,
48
  "seed": null,
 
56
  },
57
  "_last_obs": {
58
  ":type:": "<class 'numpy.ndarray'>",
59
+ ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAADMFF7x6+rY/yUGZvvlhfz57zZw7NTvhuwAAAAAAAAAAmj1tvaoGMz7e9ws+S4HGvqDKKL1A2Io9AAAAAAAAAAC6uQ4+NtiOP5gILT4G4iu/GPd3Pq3Eyz0AAAAAAAAAAEBMsD14a6c/dee+Pp2x+L7Uxeg9nsJvPgAAAAAAAAAAAFYwvEiqqT8ahIS9MornvhQ/nLwxIMS9AAAAAAAAAABmfgC8rn2HusLfyzOQSa4vR1Qtur5lw7MAAIA/AACAP/q5Wb60gUg+gh/8Pg9ll76Hu4+9AR+pPgAAAAAAAAAAzTnyPAgI5D2VkFG+9FvDvpEND74hDzG9AAAAAAAAAABmpru8LjvhPYK3sbyEA72+8yACvvMhfbwAAAAAAAAAAOYKsL16hJ0/8wK7vt4mJb9gXy6+kvBlvgAAAAAAAAAADe7+PSn8Ezs0GRQ7mTfTNunaxjz+uGC6AAAAAAAAAACA+1c99tB3upaahTuxh0E38zolO8WhMTYAAAAAAAAAAFrkuz0C5+8+pg3NvbyVAr8iXIs9fxLGvQAAAAAAAAAAZmaZOFzisT5ilK291/wGv+dij712Vbq9AAAAAAAAAABmxHI80i6YuygsWTt6+Yc8T1XePPBsaL0AAIA/AACAPzN0vryDJwg9LU7RPiG8Vr4vDjY+McEAPgAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="
60
  },
61
  "_last_episode_starts": {
62
  ":type:": "<class 'numpy.ndarray'>",
 
66
  "_episode_num": 0,
67
  "use_sde": false,
68
  "sde_sample_freq": -1,
69
+ "_current_progress_remaining": -0.0027007999999999477,
70
  "ep_info_buffer": {
71
  ":type:": "<class 'collections.deque'>",
72
+ ":serialized:": "gAWVHRAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIz/dT4+WBckCUhpRSlIwBbJRLsIwBdJRHQLIeStknTiN1fZQoaAZoCWgPQwjTTs3lBnRwQJSGlFKUaBVLyWgWR0CyHmBigCfZdX2UKGgGaAloD0MIG/Sltz9RckCUhpRSlGgVS6toFkdAsh59edCmdnV9lChoBmgJaA9DCCyeeqRBpnBAlIaUUpRoFUvFaBZHQLIeinmJWNp1fZQoaAZoCWgPQwicGf1ouNRzQJSGlFKUaBVL3GgWR0CyHov16E8JdX2UKGgGaAloD0MIhQfNrvvDcUCUhpRSlGgVS7JoFkdAsh6QF1SwW3V9lChoBmgJaA9DCHHMsicB83FAlIaUUpRoFUvRaBZHQLIelf2K2rp1fZQoaAZoCWgPQwh8mShCKjNxQJSGlFKUaBVL1mgWR0CyHqwrYoRadX2UKGgGaAloD0MIlxsMdZj0cUCUhpRSlGgVS8toFkdAsh60/2TPjXV9lChoBmgJaA9DCMFUM2spxG9AlIaUUpRoFUu5aBZHQLIeuMsYl6Z1fZQoaAZoCWgPQwjLoNrgxHtwQJSGlFKUaBVLr2gWR0CyHuRx1gYxdX2UKGgGaAloD0MI/Bu0V98acECUhpRSlGgVS71oFkdAsh7m7btZ3nV9lChoBmgJaA9DCJCjObKylHBAlIaUUpRoFUvSaBZHQLIe7/n4fwJ1fZQoaAZoCWgPQwgcDHVY4QVzQJSGlFKUaBVLxGgWR0CyHwanrIHUdX2UKGgGaAloD0MIX9BCAkZncUCUhpRSlGgVS8NoFkdAsh8K5Fw1i3V9lChoBmgJaA9DCIC6gQIv+HJAlIaUUpRoFUvUaBZHQLIfIGMGX5Z1fZQoaAZoCWgPQwjxDYXPlrtzQJSGlFKUaBVL+WgWR0CyHyJokAxSdX2UKGgGaAloD0MI41KVtjjNcUCUhpRSlGgVS8xoFkdAsh8wvalDW3V9lChoBmgJaA9DCBe2ZivvcnBAlIaUUpRoFUvGaBZHQLIfSRTS9dx1fZQoaAZoCWgPQwhI+Um1j+FyQJSGlFKUaBVL02gWR0CyJ6TcqOLjdX2UKGgGaAloD0MIp1oLs5CscECUhpRSlGgVS6toFkdAsienVkMCtHV9lChoBmgJaA9DCDV6NUCprnFAlIaUUpRoFUvVaBZHQLInq/NZ/1B1fZQoaAZoCWgPQwjcKR2svy1yQJSGlFKUaBVL3mgWR0CyJ7y1JDmbdX2UKGgGaAloD0MI+RBUjd7wckCUhpRSlGgVS+xoFkdAsifAqXnhbXV9lChoBmgJaA9DCNtQMc4fwnJAlIaUUpRoFUvBaBZHQLInxMEzO5d1fZQoaAZoCWgPQwgBiSZQBB1wQJSGlFKUaBVL22gWR0CyJ9I9X9zfdX2UKGgGaAloD0MI6ndhazb2ckCUhpRSlGgVS7poFkdAsifsQxveg3V9lChoBmgJaA9DCILJjSLr53NAlIaUUpRoFUvBaBZHQLIoAd07r9l1fZQoaAZoCWgPQwg3OXzSSYNyQJSGlFKUaBVLsGgWR0CyKAm29crzdX2UKGgGaAloD0MIAmGnWLWRb0CUhpRSlGgVS7poFkdAsigZnOB193V9lChoBmgJaA9DCA1RhT8DzXNAlIaUUpRoFUviaBZHQLIoHcFQl8h1fZQoaAZoCWgPQwieKAmJtMlzQJSGlFKUaBVLxmgWR0CyKD4+0PYndX2UKGgGaAloD0MIY7ZkVYRTb0CUhpRSlGgVS7loFkdAsig/giu+y3V9lChoBmgJaA9DCF36l6Ty53JAlIaUUpRoFUvRaBZHQLIoR/QBxPx1fZQoaAZoCWgPQwgAVkeOdHNvQJSGlFKUaBVLt2gWR0CyKFYUnG83dX2UKGgGaAloD0MIEywOZ/6TcUCUhpRSlGgVS7NoFkdAsihyiEg4fnV9lChoBmgJaA9DCK7X9KBgtHBAlIaUUpRoFUu6aBZHQLIoc606YE51fZQoaAZoCWgPQwgrhUAuMXBxQJSGlFKUaBVLs2gWR0CyKIHDrJKbdX2UKGgGaAloD0MIH4Kq0atjc0CUhpRSlGgVS7VoFkdAsiiLy9VWCHV9lChoBmgJaA9DCJHUQsnk5HFAlIaUUpRoFUvYaBZHQLIolWAwwkB1fZQoaAZoCWgPQwihavRqAMRyQJSGlFKUaBVLx2gWR0CyKKzEaVD8dX2UKGgGaAloD0MItyqJ7EMJckCUhpRSlGgVS+toFkdAsijBrbg0j3V9lChoBmgJaA9DCF6ezhWl2nJAlIaUUpRoFUvBaBZHQLIo1287IT51fZQoaAZoCWgPQwjcKR2sP9lyQJSGlFKUaBVLz2gWR0CyKOG8ujASdX2UKGgGaAloD0MIYmpLHeQCckCUhpRSlGgVS+BoFkdAsijj0voNeHV9lChoBmgJaA9DCF4robskSXBAlIaUUpRoFUvFaBZHQLIo6wX668R1fZQoaAZoCWgPQwj9a3nl+jdwQJSGlFKUaBVLtWgWR0CyKP98eCCjdX2UKGgGaAloD0MIBoIAGTqdc0CUhpRSlGgVS+toFkdAsikY6BAfMnV9lChoBmgJaA9DCBXI7Cy6/3JAlIaUUpRoFUvNaBZHQLIpG0ygwoN1fZQoaAZoCWgPQwjzAYHO5JZzQJSGlFKUaBVLzGgWR0CyKSLXlKbsdX2UKGgGaAloD0MIfcucLoupcUCUhpRSlGgVS8FoFkdAsikksUZeiXV9lChoBmgJaA9DCKIo0CdylXFAlIaUUpRoFUvGaBZHQLIpSXLNfPZ1fZQoaAZoCWgPQwhXIeUnVQJxQJSGlFKUaBVLrWgWR0CyKVJf2K2sdX2UKGgGaAloD0MIWWyTikasc0CUhpRSlGgVS9ZoFkdAsilcKqn3tnV9lChoBmgJaA9DCLABEeIK3XBAlIaUUpRoFUvCaBZHQLIpX01IiC91fZQoaAZoCWgPQwgw9l580XpzQJSGlFKUaBVL02gWR0CyKWdsFdLQdX2UKGgGaAloD0MIxVimX+LacECUhpRSlGgVS7hoFkdAsilzp3X7L3V9lChoBmgJaA9DCMUB9Pt+DnRAlIaUUpRoFUvDaBZHQLIpkK0UoKF1fZQoaAZoCWgPQwg7U+i8RopyQJSGlFKUaBVLxGgWR0CyKbEZR8+idX2UKGgGaAloD0MI4LvNG6ebckCUhpRSlGgVS9FoFkdAsim2R/3Fk3V9lChoBmgJaA9DCMh4lEo4DnFAlIaUUpRoFUu3aBZHQLIpwnXumaZ1fZQoaAZoCWgPQwihavRqAKJxQJSGlFKUaBVL2mgWR0CyKcxrJr+HdX2UKGgGaAloD0MIUtUEUXcOcUCUhpRSlGgVS9ZoFkdAsinP0XgtOHV9lChoBmgJaA9DCNkkP+LXRnBAlIaUUpRoFUu4aBZHQLIp3cG1QZZ1fZQoaAZoCWgPQwg9X7NcNg1xQJSGlFKUaBVLy2gWR0CyKft4VymzdX2UKGgGaAloD0MI8Z9uoMDzb0CUhpRSlGgVS89oFkdAsin+B06o2nV9lChoBmgJaA9DCKfJjLeV/nBAlIaUUpRoFUvEaBZHQLIqFw/PgNx1fZQoaAZoCWgPQwhLWvENhXdxQJSGlFKUaBVLt2gWR0CyKhtUbT+edX2UKGgGaAloD0MIavmBqzz1cUCUhpRSlGgVS7FoFkdAsiog6Kcd53V9lChoBmgJaA9DCPGD86ljGXBAlIaUUpRoFUu6aBZHQLIqIdKNAC51fZQoaAZoCWgPQwgSTaCIRS1xQJSGlFKUaBVLzmgWR0CyKimdupCKdX2UKGgGaAloD0MIA+55/vR/cUCUhpRSlGgVS71oFkdAsio5deIEbHV9lChoBmgJaA9DCHeBkgJLenFAlIaUUpRoFUu4aBZHQLIqVA3kxRF1fZQoaAZoCWgPQwgtmPijaIhzQJSGlFKUaBVLz2gWR0CyKpnEyckMdX2UKGgGaAloD0MIzM8NTRkvcECUhpRSlGgVS75oFkdAsiqi4nWrfnV9lChoBmgJaA9DCJm8AWb+DHJAlIaUUpRoFUuvaBZHQLIqpW5H3Dh1fZQoaAZoCWgPQwgh6dMqOilzQJSGlFKUaBVL12gWR0CyKqj/+85CdX2UKGgGaAloD0MIuQA0ShdgcUCUhpRSlGgVS8loFkdAsiqyw7kn1HV9lChoBmgJaA9DCNQQVfjz43FAlIaUUpRoFUujaBZHQLIqtu/k/8l1fZQoaAZoCWgPQwgrobskjkhzQJSGlFKUaBVL4mgWR0CyKsDrRjSYdX2UKGgGaAloD0MI7Zv7q8eFcUCUhpRSlGgVS61oFkdAsitW8jAzpHV9lChoBmgJaA9DCELpCyFnv3FAlIaUUpRoFUvVaBZHQLIrapwCKaZ1fZQoaAZoCWgPQwjQm4pU2KJwQJSGlFKUaBVLtmgWR0CyK3edwvQGdX2UKGgGaAloD0MIo68gzdj9cECUhpRSlGgVS9RoFkdAsiuFsnAqNXV9lChoBmgJaA9DCKfK94zEc3BAlIaUUpRoFUvLaBZHQLIrha9K28Z1fZQoaAZoCWgPQwjMJVXbzUxyQJSGlFKUaBVL3GgWR0CyK5kliSaFdX2UKGgGaAloD0MImIdM+RBjc0CUhpRSlGgVS8toFkdAsiug5aNdaHV9lChoBmgJaA9DCF653jaTz3JAlIaUUpRoFUvOaBZHQLIrvxeLNwB1fZQoaAZoCWgPQwgs2EY82UBwQJSGlFKUaBVLwmgWR0CyK/o8yN4rdX2UKGgGaAloD0MIVACMZ5CwcUCUhpRSlGgVS8FoFkdAsiv/xSYPXnV9lChoBmgJaA9DCCFaK9pcrnBAlIaUUpRoFUvOaBZHQLIsAU7CBPN1fZQoaAZoCWgPQwgWURN9Pp1wQJSGlFKUaBVLtmgWR0CyLAJ3LV4HdX2UKGgGaAloD0MISx+6oD7EcUCUhpRSlGgVS9loFkdAsiwY3FUADXV9lChoBmgJaA9DCNuJkpBIB05AlIaUUpRoFUubaBZHQLIsIA3T/hl1fZQoaAZoCWgPQwiKWS+GsoZwQJSGlFKUaBVLxmgWR0CyLCAk1MufdX2UKGgGaAloD0MISgfr/xxBcUCUhpRSlGgVS9JoFkdAsixS+pOvdXV9lChoBmgJaA9DCD3TS4wlTXJAlIaUUpRoFUu6aBZHQLIseUiY9gZ1fZQoaAZoCWgPQwjvAbovJ+xzQJSGlFKUaBVL2WgWR0CyLHrksBhhdX2UKGgGaAloD0MIOC7jpoZWcECUhpRSlGgVS7xoFkdAsiyE+wC8vnV9lChoBmgJaA9DCEpFY+0vY3FAlIaUUpRoFUvfaBZHQLIskjhUBGR1ZS4="
73
  },
74
  "ep_success_buffer": {
75
  ":type:": "<class 'collections.deque'>",
76
  ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
77
  },
78
+ "_n_updates": 1224,
79
  "n_steps": 1024,
80
  "gamma": 0.999,
81
  "gae_lambda": 0.98,
ppo-LunarLander-v2/policy.optimizer.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5950de0cbf2d4eecc872b9c5ccce981a0b18440f1b12ee4ef3c6d55470dced3e
3
  size 84893
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:742b623d7a7441b3f7e06d8d35d74d3bff9f85f6540665d3c6bfc88d95a5515c
3
  size 84893
ppo-LunarLander-v2/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e1d4d83b2555bfbc9a59deee8fd0ce18a36afcfee1f70810b0e25726b0ce58be
3
  size 43201
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:544a206e8d5bc28275a7aefa49dc07cb176fb33b33cc6867ae46bd379a240523
3
  size 43201
replay.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4730a96c3a0bb94d4bea4ea8e673b8b4ae75e00fdf854a364e07a540e1eac324
3
- size 200661
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e6f25991b824c4ee70d60717fd0fa773bb0314016b9377d154e68d788d266b99
3
+ size 203960
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 268.87940216743846, "std_reward": 16.335514984213358, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2022-05-15T21:09:05.450622"}
 
1
+ {"mean_reward": 280.06620169324304, "std_reward": 14.867982529070549, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2022-05-15T21:15:33.948162"}