nadirbekovnadir commited on
Commit
cb26f54
1 Parent(s): 22df7e0

One more try!

Browse files
README.md CHANGED
@@ -10,7 +10,7 @@ model-index:
10
  results:
11
  - metrics:
12
  - type: mean_reward
13
- value: 276.26 +/- 18.75
14
  name: mean_reward
15
  task:
16
  type: reinforcement-learning
 
10
  results:
11
  - metrics:
12
  - type: mean_reward
13
+ value: 280.58 +/- 16.13
14
  name: mean_reward
15
  task:
16
  type: reinforcement-learning
config.json CHANGED
@@ -1 +1 @@
1
- {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param sde_net_arch: Network architecture for extracting features\n when using gSDE. If None, the latent features from the policy will be used.\n Pass an empty list to use the states as features.\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7f1926842f80>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f1926843010>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f19268430a0>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f1926843130>", "_build": "<function ActorCriticPolicy._build at 0x7f19268431c0>", "forward": "<function ActorCriticPolicy.forward at 0x7f1926843250>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f19268432e0>", "_predict": "<function ActorCriticPolicy._predict at 0x7f1926843370>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f1926843400>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f1926843490>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f1926843520>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7f1926845a80>"}, "verbose": 1, "policy_kwargs": {}, "observation_space": {":type:": "<class 'gym.spaces.box.Box'>", ":serialized:": "gAWVpQEAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLCIWUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWIAAAAAAAAAAAAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/5RoC0sIhZSMAUOUdJRSlIwEaGlnaJRoEyiWIAAAAAAAAAAAAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAf5RoC0sIhZRoFnSUUpSMDWJvdW5kZWRfYmVsb3eUaBMolggAAAAAAAAAAAAAAAAAAACUaAiMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLCIWUaBZ0lFKUjA1ib3VuZGVkX2Fib3ZllGgTKJYIAAAAAAAAAAAAAAAAAAAAlGgiSwiFlGgWdJRSlIwKX25wX3JhbmRvbZROdWIu", "dtype": "float32", "_shape": [8], "low": "[-inf -inf -inf -inf -inf -inf -inf -inf]", "high": "[inf inf inf inf inf inf inf inf]", "bounded_below": "[False False False False False False False False]", "bounded_above": "[False False False False False False False False]", "_np_random": null}, "action_space": {":type:": "<class 'gym.spaces.discrete.Discrete'>", ":serialized:": "gAWViAAAAAAAAACME2d5bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpRLBIwGX3NoYXBllCmMBWR0eXBllIwFbnVtcHmUjAVkdHlwZZSTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYowKX25wX3JhbmRvbZROdWIu", "n": 4, "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 16, "num_timesteps": 2015232, "_total_timesteps": 2000000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1652207206.5813828, "learning_rate": 0.0003, "tensorboard_log": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWV+QIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwNX2J1aWx0aW5fdHlwZZSTlIwKTGFtYmRhVHlwZZSFlFKUKGgCjAhDb2RlVHlwZZSFlFKUKEsBSwBLAEsBSwFLE0MEiABTAJROhZQpjAFflIWUjGQvaG9tZS9uYWRpcmJla292L2FuYWNvbmRhMy9lbnZzL2hmLXJsL2xpYi9weXRob24zLjEwL3NpdGUtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5RLgEMCAAGUjAN2YWyUhZQpdJRSlH2UKIwLX19wYWNrYWdlX1+UjBhzdGFibGVfYmFzZWxpbmVzMy5jb21tb26UjAhfX25hbWVfX5SMHnN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi51dGlsc5SMCF9fZmlsZV9flIxkL2hvbWUvbmFkaXJiZWtvdi9hbmFjb25kYTMvZW52cy9oZi1ybC9saWIvcHl0aG9uMy4xMC9zaXRlLXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGggfZR9lChoF2gOjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoGIwHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/M6kqMFUyYYWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="}, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAANooub3QPP4+YNblvSsz474OR8O9yaIfvQAAAAAAAAAAgE4dvVJMVD7pnCW+UKqrvgkPsL36HoY8AAAAAAAAAABmiCy8tjAQvDJcSD2McZ48Tk93PRlgg70AAIA/AACAP5r+nr0T74M/IGxSvgcvFr+I4Sy9wzMlvQAAAAAAAAAAGnIjvsOIEz/WKbW8xCnlvnZ46r1rSyw9AAAAAAAAAADNzDu7vRtaPFvNvT0DzlO+CP6BveeXLj0AAAAAAAAAAHPwj70qXp8/ZeRVvoJRJL9PKby9nMQqPAAAAAAAAAAA/VNaviULlT66/oc+VKRavg9ttLz9OdY8AAAAAAAAAADzAE4+w7+3P952HT8LPpe+7XywPkparD4AAAAAAAAAAJrNST0fxaS5Lh2FMcsa4ilnsbc7Y+7ysQAAgD8AAIA/jdfcPWsHbj84RJo9+qnavgOXkD4USb+9AAAAAAAAAABNq/a9jHHEPlX3/DxShqm+OouMvSYSrD0AAAAAAAAAAGa90LxCbLs/RWisvr17hD62gsq6MK3nvQAAAAAAAAAAZmw/veHEqrqlsbG2l4yusRNKPjr3lMw1AACAPwAAgD9aHng+/MySP/oUQT5B8tO+cCQIPxlZKj0AAAAAAAAAAI1eKL7fAIM+4IKtPtKMab4fOS09eqpTPQAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.007616000000000067, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVKxAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIYtwNovVtcECUhpRSlIwBbJRNAAGMAXSUR0C5PBCUHIIXdX2UKGgGaAloD0MIyXTo9LwYcUCUhpRSlGgVS89oFkdAuTwnJKaodnV9lChoBmgJaA9DCAAAAABABXJAlIaUUpRoFUv5aBZHQLk8Rz06HTJ1fZQoaAZoCWgPQwg4oRABBxByQJSGlFKUaBVLzmgWR0C5PHlkDp1SdX2UKGgGaAloD0MIjln2JDC9b0CUhpRSlGgVS/VoFkdAuTy0+PikwnV9lChoBmgJaA9DCEta8Q0FYG5AlIaUUpRoFUvPaBZHQLk8ub6xgRd1fZQoaAZoCWgPQwgNcEG27K1xQJSGlFKUaBVLy2gWR0C5PL8chkiEdX2UKGgGaAloD0MIQBU3bjFfU0CUhpRSlGgVS7BoFkdAuTzH4+KTCHV9lChoBmgJaA9DCAn/ImjMnHBAlIaUUpRoFUvTaBZHQLk8/UGmk311fZQoaAZoCWgPQwjbTlsjAqRzQJSGlFKUaBVL/WgWR0C5PRX6ZYxMdX2UKGgGaAloD0MIE7afjPHXSECUhpRSlGgVS59oFkdAuT0awTufEnV9lChoBmgJaA9DCNVbA1sl7nBAlIaUUpRoFUvDaBZHQLk9PaHbh3t1fZQoaAZoCWgPQwhYdVYL7P5wQJSGlFKUaBVL2WgWR0C5PU1HOKO1dX2UKGgGaAloD0MIDmsqi4JUcECUhpRSlGgVS+poFkdAuT1p3t8eCHV9lChoBmgJaA9DCBkAqrixBXBAlIaUUpRoFUveaBZHQLk9a9AHE/B1fZQoaAZoCWgPQwhmo3N+itZwQJSGlFKUaBVNAQFoFkdAuT2TgDRtxnV9lChoBmgJaA9DCBgFweNb5W9AlIaUUpRoFUvhaBZHQLk9y51eSjh1fZQoaAZoCWgPQwjIYMWpFohxQJSGlFKUaBVL/2gWR0C5PdqbWmP6dX2UKGgGaAloD0MIaD9SRIYHQ0CUhpRSlGgVS6doFkdAuT3ggZCOWHV9lChoBmgJaA9DCH9skh9xEnFAlIaUUpRoFUvdaBZHQLk9+BoVVPx1fZQoaAZoCWgPQwheMLjmTpRwQJSGlFKUaBVLxGgWR0C5Phlh5PdmdX2UKGgGaAloD0MIBKvq5fcHc0CUhpRSlGgVS9VoFkdAuT4kYTCcgHV9lChoBmgJaA9DCOVjd4GSvXFAlIaUUpRoFUu/aBZHQLk+ZEb5uZV1fZQoaAZoCWgPQwi+huC4jENxQJSGlFKUaBVL1mgWR0C5Pm9Eb5uZdX2UKGgGaAloD0MImUaTizEWckCUhpRSlGgVTQkBaBZHQLk+gJ66asp1fZQoaAZoCWgPQwgVHcnlv19wQJSGlFKUaBVL6WgWR0C5PqZR8+ibdX2UKGgGaAloD0MI39xfPW60cUCUhpRSlGgVS9RoFkdAuUu+JGe+VXV9lChoBmgJaA9DCOz5muWyh3BAlIaUUpRoFUvGaBZHQLlLwmuDBdl1fZQoaAZoCWgPQwguVWmLq1VyQJSGlFKUaBVLx2gWR0C5S8KLfk3kdX2UKGgGaAloD0MInx7bMmAmcUCUhpRSlGgVS8RoFkdAuUvcE7nxKHV9lChoBmgJaA9DCPGhREuelmxAlIaUUpRoFUvLaBZHQLlMHu1F6Rh1fZQoaAZoCWgPQwjmB67yBLVxQJSGlFKUaBVL0WgWR0C5TCMrEtNBdX2UKGgGaAloD0MILUFGQIXscUCUhpRSlGgVS+FoFkdAuUwu/nGKh3V9lChoBmgJaA9DCOOON/mtpXNAlIaUUpRoFUvGaBZHQLlMSFXJYDF1fZQoaAZoCWgPQwgfSUkPg0ZxQJSGlFKUaBVL1mgWR0C5TGcpsoDxdX2UKGgGaAloD0MIMQkX8ohWckCUhpRSlGgVS/BoFkdAuUxnWwu/UXV9lChoBmgJaA9DCHwPlxy323FAlIaUUpRoFU1pAWgWR0C5THyV0Lc9dX2UKGgGaAloD0MINfEO8CT9b0CUhpRSlGgVS+VoFkdAuUyv0OEuhHV9lChoBmgJaA9DCI9xxcVRmHBAlIaUUpRoFUvQaBZHQLlM3ttALRd1fZQoaAZoCWgPQwiBsilXeLxxQJSGlFKUaBVNCQFoFkdAuUzzNorWiHV9lChoBmgJaA9DCJSHhVqTcHJAlIaUUpRoFUvdaBZHQLlM96By0a91fZQoaAZoCWgPQwgHlbiO8UdyQJSGlFKUaBVL0mgWR0C5TQX4TK1YdX2UKGgGaAloD0MIOMDMd3BrcECUhpRSlGgVS/BoFkdAuU0TrHEMs3V9lChoBmgJaA9DCJoklpQ7uHJAlIaUUpRoFU0oAWgWR0C5TS+UD+zddX2UKGgGaAloD0MIshLzrGR5ckCUhpRSlGgVTRwBaBZHQLlNPVmBe5Z1fZQoaAZoCWgPQwgm/5O/O89yQJSGlFKUaBVL0GgWR0C5TUtxZMcqdX2UKGgGaAloD0MI8UdRZ+6Ec0CUhpRSlGgVS/RoFkdAuU2O6RQrMHV9lChoBmgJaA9DCMWRByKL3G1AlIaUUpRoFUvOaBZHQLlNkoq0+kh1fZQoaAZoCWgPQwi+FYkJ6npxQJSGlFKUaBVL6GgWR0C5TZmGVRk3dX2UKGgGaAloD0MI4bVLG04KcUCUhpRSlGgVTQYBaBZHQLlNoCZWq951fZQoaAZoCWgPQwhlxXB1gKFxQJSGlFKUaBVL4GgWR0C5TbDm4iHJdX2UKGgGaAloD0MIZ7Yr9MEwZ0CUhpRSlGgVTegDaBZHQLlNznUUfxN1fZQoaAZoCWgPQwjIBtLFJgJxQJSGlFKUaBVL2GgWR0C5Tfhp1zQvdX2UKGgGaAloD0MI18BWCRa0UUCUhpRSlGgVS6VoFkdAuU4MMPSUknV9lChoBmgJaA9DCH0Iqkbv3nNAlIaUUpRoFU0gAWgWR0C5Ti1VHWjHdX2UKGgGaAloD0MIgbIpVziocECUhpRSlGgVS9JoFkdAuU41EQXhwXV9lChoBmgJaA9DCNNqSNwjzHJAlIaUUpRoFUveaBZHQLlOQt/FzdV1fZQoaAZoCWgPQwhmTwKbs+pxQJSGlFKUaBVL1WgWR0C5TkkUO/cndX2UKGgGaAloD0MIELOXbaeqcECUhpRSlGgVS9ZoFkdAuU51DneSCHV9lChoBmgJaA9DCK7xmewfUnBAlIaUUpRoFUvNaBZHQLlOdp97Wup1fZQoaAZoCWgPQwjIs8u3/vpyQJSGlFKUaBVNIQFoFkdAuU6VTdcjaHV9lChoBmgJaA9DCDuOHyoNEHJAlIaUUpRoFUveaBZHQLlOoER8MNN1fZQoaAZoCWgPQwgMlBRYAFc3QJSGlFKUaBVLtmgWR0C5Trf863iJdX2UKGgGaAloD0MIUIwsmaMhc0CUhpRSlGgVS9NoFkdAuU7UfyPMjnV9lChoBmgJaA9DCAFuFi8WwW5AlIaUUpRoFUvTaBZHQLlO3efI0ZZ1fZQoaAZoCWgPQwgxJZLoJZ9yQJSGlFKUaBVLyGgWR0C5TuJKSPludX2UKGgGaAloD0MIJ79FJ8ssckCUhpRSlGgVS8loFkdAuU8BakhzNnV9lChoBmgJaA9DCHRiD+2jynBAlIaUUpRoFUv3aBZHQLlPEJx//ed1fZQoaAZoCWgPQwjHuU24F0VzQJSGlFKUaBVLz2gWR0C5TzFJDmbLdX2UKGgGaAloD0MI4Zumzw4WcUCUhpRSlGgVS8NoFkdAuU9qIbfgrHV9lChoBmgJaA9DCByZR/7g9G9AlIaUUpRoFUvWaBZHQLlPe1jy4F11fZQoaAZoCWgPQwialIJur0VvQJSGlFKUaBVL9mgWR0C5T4RDohZAdX2UKGgGaAloD0MIsDcxJKfNbkCUhpRSlGgVS9BoFkdAuU+4Bfa6BnV9lChoBmgJaA9DCDDxR1Fn3XJAlIaUUpRoFU0JAWgWR0C5T8ZKSPludX2UKGgGaAloD0MIggAZOjYnckCUhpRSlGgVS/loFkdAuU/J03fhuXV9lChoBmgJaA9DCNPddTYkjXNAlIaUUpRoFUvcaBZHQLlPy3Tuv2Z1fZQoaAZoCWgPQwhdv2A37GNvQJSGlFKUaBVL5GgWR0C5T/Rdt2s8dX2UKGgGaAloD0MI9zk+WpwucECUhpRSlGgVS81oFkdAuU/4G/vfCXV9lChoBmgJaA9DCCKNCpxshnFAlIaUUpRoFUu9aBZHQLlQCKxcE/11fZQoaAZoCWgPQwgWhV0U/cByQJSGlFKUaBVLxGgWR0C5UDJZbILgdX2UKGgGaAloD0MIOxvyz4wBcECUhpRSlGgVTQkBaBZHQLlQO4yXUpd1fZQoaAZoCWgPQwj5vyMq1GlvQJSGlFKUaBVLzGgWR0C5UFQvtdAxdX2UKGgGaAloD0MI2cwhqQVVc0CUhpRSlGgVS/toFkdAuVBtQuVX3nV9lChoBmgJaA9DCHwsfejCsnBAlIaUUpRoFUvGaBZHQLlQcVxjriV1fZQoaAZoCWgPQwhuvhHdM7FyQJSGlFKUaBVNEAFoFkdAuVCGPMjeK3V9lChoBmgJaA9DCMNmgAvylXNAlIaUUpRoFUvAaBZHQLlQoLKV6eJ1fZQoaAZoCWgPQwg0SSwp9/FxQJSGlFKUaBVLvmgWR0C5UK5PAO8TdX2UKGgGaAloD0MI3sfRHFmMckCUhpRSlGgVS81oFkdAuVDO/IsAenV9lChoBmgJaA9DCHo2qz7XMXNAlIaUUpRoFUu9aBZHQLlQ+5avA451fZQoaAZoCWgPQwhm9nmMcrdvQJSGlFKUaBVLy2gWR0C5UQ8brC3xdX2UKGgGaAloD0MIFoielIltc0CUhpRSlGgVS+FoFkdAuVEmUliSaHV9lChoBmgJaA9DCLggW5YvPHFAlIaUUpRoFUvBaBZHQLlRSBFd9lV1fZQoaAZoCWgPQwiEnWLV4IZzQJSGlFKUaBVL1GgWR0C5UVEr08NhdX2UKGgGaAloD0MInGuYoXGtcECUhpRSlGgVS/VoFkdAuVFX6LwWnHV9lChoBmgJaA9DCDi7tUwGZnBAlIaUUpRoFUvLaBZHQLlRjgGbCrN1fZQoaAZoCWgPQwi3fvrPWkpwQJSGlFKUaBVL+WgWR0C5UZLfDUExdX2UKGgGaAloD0MIb7plh/irbkCUhpRSlGgVS9hoFkdAuVGaqHXVb3V9lChoBmgJaA9DCI+Oq5Fd3m5AlIaUUpRoFUvIaBZHQLlRnYb83uN1fZQoaAZoCWgPQwghH/RsFt1xQJSGlFKUaBVLwmgWR0C5UawSeyzHdX2UKGgGaAloD0MI2QjE6/qgckCUhpRSlGgVS9ZoFkdAuVHPHvMKTnVlLg=="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 492, "n_steps": 1024, "gamma": 0.999, "gae_lambda": 0.995, "ent_coef": 0.005, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 32, "n_epochs": 4, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWV+QIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwNX2J1aWx0aW5fdHlwZZSTlIwKTGFtYmRhVHlwZZSFlFKUKGgCjAhDb2RlVHlwZZSFlFKUKEsBSwBLAEsBSwFLE0MEiABTAJROhZQpjAFflIWUjGQvaG9tZS9uYWRpcmJla292L2FuYWNvbmRhMy9lbnZzL2hmLXJsL2xpYi9weXRob24zLjEwL3NpdGUtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5RLgEMCAA2UjAN2YWyUhZQpdJRSlH2UKIwLX19wYWNrYWdlX1+UjBhzdGFibGVfYmFzZWxpbmVzMy5jb21tb26UjAhfX25hbWVfX5SMHnN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi51dGlsc5SMCF9fZmlsZV9flIxkL2hvbWUvbmFkaXJiZWtvdi9hbmFjb25kYTMvZW52cy9oZi1ybC9saWIvcHl0aG9uMy4xMC9zaXRlLXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGggfZR9lChoF2gOjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoGIwHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/yZmZmZmZmoWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "system_info": {"OS": "Linux-5.10.16.3-microsoft-standard-WSL2-x86_64-with-glibc2.31 #1 SMP Fri Apr 2 22:23:49 UTC 2021", "Python": "3.10.4", "Stable-Baselines3": "1.5.0", "PyTorch": "1.11.0", "GPU Enabled": "True", "Numpy": "1.21.5", "Gym": "0.21.0"}}
 
1
+ {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param sde_net_arch: Network architecture for extracting features\n when using gSDE. If None, the latent features from the policy will be used.\n Pass an empty list to use the states as features.\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7f07385125f0>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f0738512680>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f0738512710>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f07385127a0>", "_build": "<function ActorCriticPolicy._build at 0x7f0738512830>", "forward": "<function ActorCriticPolicy.forward at 0x7f07385128c0>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f0738512950>", "_predict": "<function ActorCriticPolicy._predict at 0x7f07385129e0>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f0738512a70>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f0738512b00>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f0738512b90>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7f07385157c0>"}, "verbose": 1, "policy_kwargs": {}, "observation_space": {":type:": "<class 'gym.spaces.box.Box'>", ":serialized:": "gAWVpQEAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLCIWUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWIAAAAAAAAAAAAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/5RoC0sIhZSMAUOUdJRSlIwEaGlnaJRoEyiWIAAAAAAAAAAAAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAf5RoC0sIhZRoFnSUUpSMDWJvdW5kZWRfYmVsb3eUaBMolggAAAAAAAAAAAAAAAAAAACUaAiMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLCIWUaBZ0lFKUjA1ib3VuZGVkX2Fib3ZllGgTKJYIAAAAAAAAAAAAAAAAAAAAlGgiSwiFlGgWdJRSlIwKX25wX3JhbmRvbZROdWIu", "dtype": "float32", "_shape": [8], "low": "[-inf -inf -inf -inf -inf -inf -inf -inf]", "high": "[inf inf inf inf inf inf inf inf]", "bounded_below": "[False False False False False False False False]", "bounded_above": "[False False False False False False False False]", "_np_random": null}, "action_space": {":type:": "<class 'gym.spaces.discrete.Discrete'>", ":serialized:": "gAWViAAAAAAAAACME2d5bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpRLBIwGX3NoYXBllCmMBWR0eXBllIwFbnVtcHmUjAVkdHlwZZSTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYowKX25wX3JhbmRvbZROdWIu", "n": 4, "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 64, "num_timesteps": 3014656, "_total_timesteps": 3000000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1652378866.9388123, "learning_rate": 0.0003, "tensorboard_log": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWV+QIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwNX2J1aWx0aW5fdHlwZZSTlIwKTGFtYmRhVHlwZZSFlFKUKGgCjAhDb2RlVHlwZZSFlFKUKEsBSwBLAEsBSwFLE0MEiABTAJROhZQpjAFflIWUjGQvaG9tZS9uYWRpcmJla292L2FuYWNvbmRhMy9lbnZzL2hmLXJsL2xpYi9weXRob24zLjEwL3NpdGUtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5RLgEMCAAGUjAN2YWyUhZQpdJRSlH2UKIwLX19wYWNrYWdlX1+UjBhzdGFibGVfYmFzZWxpbmVzMy5jb21tb26UjAhfX25hbWVfX5SMHnN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi51dGlsc5SMCF9fZmlsZV9flIxkL2hvbWUvbmFkaXJiZWtvdi9hbmFjb25kYTMvZW52cy9oZi1ybC9saWIvcHl0aG9uMy4xMC9zaXRlLXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGggfZR9lChoF2gOjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoGIwHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/M6kqMFUyYYWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="}, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQgAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYACAAAAAAAAOYgBj2PxlK6n4UbOVHWfba2qYI6VQkzuAAAgD8AAIA/msHEPJBWtD+2GRw+qsZFvsIJVD0+Oq89AAAAAAAAAABmWOg8gWnNPc68Tj3s2ZW+bTh7PeqrvDsAAAAAAAAAAC1jCr4X+Ws+RXOnPkFEmb50+wI8EGrzPQAAAAAAAAAAZmdJPc4vtT/y7yw/keFNvSIUkLyY/Is9AAAAAAAAAADNQhg9XNt4uuVjILZMeJGxY4bgOnvGQjUAAIA/AACAP81vRz6r8pM/AOQmPsLPFL9zLoE+r5yBPAAAAAAAAAAAswpEPY34ij6AZcy9oUOpvhVGJT091kM9AAAAAAAAAAAzAcw87a9BPvlcOr5h4sG++qVVvAOIwLwAAAAAAAAAAE0WK76FR6w/ZhAHv4PU577yxV6+Iul6vgAAAAAAAAAAJprKvTbjsz+CC8W+a3Chvj2oirxwZ/e9AAAAAAAAAACzqq69nwyXP0JTx77B3iK/Qk0FvqJpSL4AAAAAAAAAAK2lJL5PhhU/eg4ZPmrd6b553QS+BiT2PQAAAAAAAAAApmgHPs4G4z5tDO+9SWLZvlCcxj3/RwS+AAAAAAAAAABmPYw84GmYP2Uysj3wGyS/Y+IHPSmBn70AAAAAAAAAAGZS6rzhTJW6Gs2FOcZNATWMs8E6LVmYuAAAgD8AAIA/mpm8uQ+aBz2yoAI+ljObvl+w3jxLA4E9AAAAAAAAAABmQKu84QqTOUHnkLsRL4G5lCQUu1B+tToAAIA/AACAP82M0zkUsrW6/YJwvOcsgTwKkdM72rxgvQAAgD8AAIA/bekBvvP5Bj/921Q+h37Vvmpey724maE9AAAAAAAAAABmgEY9wwl6ukZENTgCixEzC6itumCFU7cAAIA/AACAP+bQKD4gS6E/ahCxPiJgGr8KHoM+++EjPQAAAAAAAAAA9viUPtYQHj8+58E8VmYSv23NGD9ypQO9AAAAAAAAAACaxMO8D2gNvEpQ0D1QIry674NlvRdBA7sAAIA/AACAP6trgr5/gUI//aW2vQKN+L6NsKu+om26PQAAAAAAAAAAZpZ7vHbtDrzaIjM8hZUoPTPhl7vQV066AACAPwAAgD/Ni2u+EDNRP94137w+ahO/ZQuWvuWu4TwAAAAAAAAAAM3aLz32oHS6lqwINcCIlTCreAe7YklqtAAAgD8AAIA/ZqpUPGhOrLxCW6Y78ttJPHi6GT73wiK9AACAPwAAgD9mBIW8+XqxPyrMCr+DNsa+OQJoPM/1nz0AAAAAAAAAADPgdT328EW67WbJPEfNu7yCuOi68kPFvAAAAAAAAAAAjROOPc5cgrz9MEy+N/R7PUKy5j2P0Lc6AAAAAAAAgD+a2u48kGSWP4cwgz3gRPK+pAOTPbikjj0AAAAAAAAAADqzLb6BHcI/yFcvv8Yrt71X7gS+olyZvgAAAAAAAAAAMzU+vZPFzT6dGB0+qXXsvleNoTwYhLg9AAAAAAAAAACaJTk9NcF7PkLBYL5GDNq+I6ojvcqXcL4AAAAAAAAAAK1kXr7G+Kc/npz7vofB+r7JJ5m+MgM2vgAAAAAAAAAAANwMPYjXt7wkq0U+AhNQPXUTBr64J4M8AACAPwAAgD8A13o+huFOP9Y+gj7VNAS/we/ePpZmGT4AAAAAAAAAADOMjj3hYI26VuF/OGZNfDNkHro64WKUtwAAgD8AAIA/M/WrPFRU7z2+DYq9p0SwvsbD+L3RRBG9AAAAAAAAAAAmzJu9r3YjPmKm+j7POaC+k5OIPqKbHj4AAAAAAAAAAOanS70Sja4/q6Ofvv3Wpr4VsC+92/T9vQAAAAAAAAAAzdIZvBfYsT/us2a+T6+OvmEbhDt5nbS8AAAAAAAAAADNHI67KXgIupuvTDNa6AGwh+/gOgZzzbMAAIA/AACAP7NrFb0XSDg+Lx3Gvhbzkb5RCbC+q9KIvQAAAAAAAAAAs0B9Po1nrz4Y6Lm+TnzXvknOVD4aYV++AAAAAAAAAAAA6CA8rY18PrqoxbzlqaO+NWkcPGAI3TwAAAAAAAAAADOjjLvsxuy7s8TMO/tggjzou0q9PTpcPQAAgD8AAIA/M2gyva45ibqCIjc3vIU3MtkdcrkuD1W2AACAPwAAgD+aWfE7KWAgum3Pzje3xzm2daNPOvvr67YAAIA/AACAP5rd6Dt8g1E+3OwJvaDiy763alS8LdLnOwAAAAAAAAAAADApPRSkkLq2MGu5VVVZtNEQMzoCaYg4AACAPwAAgD8AxdE8w7lyutZmjjj+Wha2EUZOO19AobcAAIA/AACAP5qqAL0eoYI9zXH6Pe/kcr4G/3Y9G0tkPQAAAAAAAAAAM88HPTaAoT8zEyo+vKUPv03CNj2lPpA9AAAAAAAAAACGkYA+f5cCP5vVar6R6P6+EfcuPrGiQ74AAAAAAAAAAENHf75YwrM+aGPKPus48L7WQ1W+3FyaPgAAAAAAAAAAs0MhPeFsrrrqYW63dXELsmcR1DhTrIg2AACAPwAAgD8a55O9qcx0PboEsz4WfYS+OScxPcP+Pz4AAAAAAAAAAAAT2b2Pfmq6vkvcuvNUY7VWe6a664P5OQAAgD8AAAAAZmqLPY8mR7rc1BQ+Tf/VNXtHRzo0/sc0AACAPwAAgD+zNig9ru+Eut8ApDZpmaox8hL+OmHYwrUAAIA/AACAP7OZDj38Qhs+FmQRvsskw75MHig704GovQAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYktASwiGlIwBQ5R0lFKULg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVswAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJZAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiS0CFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.004885333333333408, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVJhAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMI0NA/wQUKcECUhpRSlIwBbJRL3YwBdJRHQLfT/V8Ti851fZQoaAZoCWgPQwg+PEuQkc5zQJSGlFKUaBVLzGgWR0C31AEygwoLdX2UKGgGaAloD0MIbhYvFgbbcUCUhpRSlGgVS+doFkdAt9QwyKvV3HV9lChoBmgJaA9DCMKjjSNWdnJAlIaUUpRoFU1UAWgWR0C31DDj7yhBdX2UKGgGaAloD0MIEJaxoVs6cUCUhpRSlGgVS9FoFkdAt9Q0tbs4UHV9lChoBmgJaA9DCMXIkjkWvm9AlIaUUpRoFUvCaBZHQLfUTi5NGmV1fZQoaAZoCWgPQwiqu7ILhiZyQJSGlFKUaBVLxGgWR0C31E40qH45dX2UKGgGaAloD0MIvqPGhBgQckCUhpRSlGgVS9loFkdAt9Rug6EJ0HV9lChoBmgJaA9DCFKazeOwRHBAlIaUUpRoFUvbaBZHQLfUckxyn1p1fZQoaAZoCWgPQwhl+5C3nMJwQJSGlFKUaBVLymgWR0C31HJU1hsqdX2UKGgGaAloD0MIv7m/elw7ckCUhpRSlGgVS9poFkdAt9R5m6GxlnV9lChoBmgJaA9DCJGA0eWNTnJAlIaUUpRoFUvvaBZHQLfUi1RceKd1fZQoaAZoCWgPQwigppat9epwQJSGlFKUaBVL1GgWR0C31Itl2/zrdX2UKGgGaAloD0MI6Q/NPPmAcECUhpRSlGgVS9VoFkdAt9TEI4VARnV9lChoBmgJaA9DCEtXsI24dXNAlIaUUpRoFUvraBZHQLfUz03fhuR1fZQoaAZoCWgPQwjK+s3EtGNzQJSGlFKUaBVNBwFoFkdAt9TS/zreInV9lChoBmgJaA9DCCh9IeS8J3FAlIaUUpRoFUvSaBZHQLfU4WyTpxF1fZQoaAZoCWgPQwiWJM/1PQhwQJSGlFKUaBVLzWgWR0C31OxRAKOUdX2UKGgGaAloD0MIOZhNgCFMcUCUhpRSlGgVS9NoFkdAt9Tz9bX6InV9lChoBmgJaA9DCLlPjgJEV3JAlIaUUpRoFUuxaBZHQLfU/wAlv611fZQoaAZoCWgPQwijVpi+1yw7QJSGlFKUaBVLnmgWR0C31QpZbILgdX2UKGgGaAloD0MIP8bctUTQcECUhpRSlGgVS9JoFkdAt9UbOD8Lr3V9lChoBmgJaA9DCF8JpMQu1HBAlIaUUpRoFU0KAWgWR0C31Rt0vGp/dX2UKGgGaAloD0MIE/QXesQtcECUhpRSlGgVS8BoFkdAt9UuBVdX1nV9lChoBmgJaA9DCMdmR6rvlXBAlIaUUpRoFUvYaBZHQLfVQ9deIEd1fZQoaAZoCWgPQwhCPujZrJRwQJSGlFKUaBVL2WgWR0C31U845tFbdX2UKGgGaAloD0MI2+BE9OtTckCUhpRSlGgVS+xoFkdAt9Vd2t+1B3V9lChoBmgJaA9DCJ+QnbfxX3NAlIaUUpRoFUvdaBZHQLfVYbn5i3J1fZQoaAZoCWgPQwicU8kAUINvQJSGlFKUaBVL92gWR0C31WlG5MDfdX2UKGgGaAloD0MII8DpXbwzcUCUhpRSlGgVS9doFkdAt9VwSWZ7X3V9lChoBmgJaA9DCHtntFVJanJAlIaUUpRoFUvyaBZHQLfVd5q/M4d1fZQoaAZoCWgPQwhwd9ZuO15wQJSGlFKUaBVLzWgWR0C31Y26wt8NdX2UKGgGaAloD0MI5dTOMPVecUCUhpRSlGgVS/loFkdAt9WN98Z1m3V9lChoBmgJaA9DCJcA/FPqtnFAlIaUUpRoFUvGaBZHQLfVlRFZxJd1fZQoaAZoCWgPQwipF3yaE3NwQJSGlFKUaBVL+2gWR0C31a2mP5pKdX2UKGgGaAloD0MI2qoksg87ckCUhpRSlGgVS9toFkdAt9W4VwgkknV9lChoBmgJaA9DCJseFJQiH3FAlIaUUpRoFUu4aBZHQLfVylnAZbZ1fZQoaAZoCWgPQwghyEEJM7dLQJSGlFKUaBVLp2gWR0C31eqpDNQkdX2UKGgGaAloD0MITwKbc3Cdc0CUhpRSlGgVS9VoFkdAt9X3VhCtzXV9lChoBmgJaA9DCFXejnCaw3BAlIaUUpRoFUvmaBZHQLfV96Kcd5p1fZQoaAZoCWgPQwgIyJdQQdxwQJSGlFKUaBVL1WgWR0C31f+U+s5odX2UKGgGaAloD0MI22/tRMk8bkCUhpRSlGgVS9JoFkdAt9YHaQFLWnV9lChoBmgJaA9DCJ0PzxJkTHJAlIaUUpRoFUvZaBZHQLfWC1zhgmZ1fZQoaAZoCWgPQwgZyLPLN19xQJSGlFKUaBVL4GgWR0C31hLcXWOIdX2UKGgGaAloD0MIONvcmF5OckCUhpRSlGgVS/FoFkdAt9YS/M4cWHV9lChoBmgJaA9DCKlqgqi7V3BAlIaUUpRoFUvUaBZHQLfWGgGr0at1fZQoaAZoCWgPQwh41JgQ87FyQJSGlFKUaBVL62gWR0C31hoh6jWTdX2UKGgGaAloD0MIZw+0AkMsb0CUhpRSlGgVS+1oFkdAt9YkaLn9vXV9lChoBmgJaA9DCI4G8BZItnFAlIaUUpRoFUvJaBZHQLfWJGyX2M91fZQoaAZoCWgPQwhwXpz4qsxxQJSGlFKUaBVLyGgWR0C31ljhcZ+AdX2UKGgGaAloD0MI0VlmEQqzcECUhpRSlGgVS8hoFkdAt9Z3PzFuN3V9lChoBmgJaA9DCGu28pL/629AlIaUUpRoFUvSaBZHQLfWhQC0WuZ1fZQoaAZoCWgPQwiIS4475VxxQJSGlFKUaBVL1GgWR0C31oiudPLxdX2UKGgGaAloD0MIiEZ3EPubcUCUhpRSlGgVS+NoFkdAt9aWoHcDbXV9lChoBmgJaA9DCKBrX0DvTnNAlIaUUpRoFUv/aBZHQLfWpR4QjD91fZQoaAZoCWgPQwgI46dxb0BzQJSGlFKUaBVNDAFoFkdAt9alUtI07HV9lChoBmgJaA9DCBGQL6ECYnNAlIaUUpRoFUvSaBZHQLfWr9MsYl91fZQoaAZoCWgPQwiCrn0B/SFxQJSGlFKUaBVLsGgWR0C31sqCL/CJdX2UKGgGaAloD0MIMX4a96a1ckCUhpRSlGgVS+doFkdAt9bXnU2DQXV9lChoBmgJaA9DCMGPativW3FAlIaUUpRoFUvQaBZHQLfW281n/T91fZQoaAZoCWgPQwi3skRnWd9xQJSGlFKUaBVL5mgWR0C31v5vo/zKdX2UKGgGaAloD0MIvvkNE00vcUCUhpRSlGgVS8hoFkdAt9cGW7e2u3V9lChoBmgJaA9DCPs/h/nyKnJAlIaUUpRoFUvYaBZHQLfXCgOz6ad1fZQoaAZoCWgPQwgD7KNTV+FxQJSGlFKUaBVLvWgWR0C31xweRxLkdX2UKGgGaAloD0MILo81IwNtcUCUhpRSlGgVS+xoFkdAt9cjatcOb3V9lChoBmgJaA9DCNvdA3Tfn21AlIaUUpRoFUvXaBZHQLfXOCNCJGh1fZQoaAZoCWgPQwgt0sQ7QAxzQJSGlFKUaBVL0GgWR0C31zuIRAbAdX2UKGgGaAloD0MIBcWPMfckb0CUhpRSlGgVS81oFkdAt9dRrgwXZXV9lChoBmgJaA9DCGe4AZ8fiXFAlIaUUpRoFUvIaBZHQLfXXMb3oLZ1fZQoaAZoCWgPQwiEud3LfVRxQJSGlFKUaBVLzWgWR0C3125TyauwdX2UKGgGaAloD0MIbJbLRucVckCUhpRSlGgVS+hoFkdAt9d1hc7henV9lChoBmgJaA9DCHLBGfy9WnBAlIaUUpRoFUvYaBZHQLfXhA2hqTN1fZQoaAZoCWgPQwiazk4Ghz5wQJSGlFKUaBVNmQFoFkdAt9eHz4DcM3V9lChoBmgJaA9DCJ55Oey+eHJAlIaUUpRoFUv/aBZHQLfXmNsFdLR1fZQoaAZoCWgPQwhgBmNEYgdyQJSGlFKUaBVLvWgWR0C315wvL5h0dX2UKGgGaAloD0MIwCUA/1RdckCUhpRSlGgVS8xoFkdAt9eyGmDUVnV9lChoBmgJaA9DCAA5YcJoPHNAlIaUUpRoFUvFaBZHQLfXsit7rs11fZQoaAZoCWgPQwh+UYL+whZwQJSGlFKUaBVLyGgWR0C319fRu0kXdX2UKGgGaAloD0MILzVCP1MZb0CUhpRSlGgVS8toFkdAt9fX81n/UHV9lChoBmgJaA9DCHZSX5Z2BXFAlIaUUpRoFUvZaBZHQLfX29TP0I11fZQoaAZoCWgPQwi139qJkstVQJSGlFKUaBVN6ANoFkdAt9frWhAWznV9lChoBmgJaA9DCN481SF3jHNAlIaUUpRoFUvoaBZHQLfYBx20Re11fZQoaAZoCWgPQwgvwakP5DdyQJSGlFKUaBVLyWgWR0C32CrlvIfbdX2UKGgGaAloD0MICfmgZ3P7cUCUhpRSlGgVS+xoFkdAt9gyEqUeMnV9lChoBmgJaA9DCLd++s9aYXJAlIaUUpRoFUvPaBZHQLfYRKcNH6N1fZQoaAZoCWgPQwj7PEZ5pntwQJSGlFKUaBVL5GgWR0C32HYbn5i3dX2UKGgGaAloD0MIbTgsDXxEcUCUhpRSlGgVS/FoFkdAt9h97u2JBXV9lChoBmgJaA9DCJEm3gGeZnFAlIaUUpRoFUvWaBZHQLfYjYpDu0F1fZQoaAZoCWgPQwiUoL/QIxJyQJSGlFKUaBVL1GgWR0C32KhTsIE9dX2UKGgGaAloD0MIl65gG/Ebb0CUhpRSlGgVS99oFkdAt9iwSAYpD3V9lChoBmgJaA9DCH0/NV56mHNAlIaUUpRoFUvTaBZHQLfYw9OARTV1fZQoaAZoCWgPQwhHHLKBNBVxQJSGlFKUaBVL9mgWR0C32MfIGQjmdX2UKGgGaAloD0MIpBmLpjPQcECUhpRSlGgVS+toFkdAt9jH3XZoPHV9lChoBmgJaA9DCKio+pUORXFAlIaUUpRoFUvvaBZHQLfYz7dSEUV1fZQoaAZoCWgPQwjBqQ8kL49xQJSGlFKUaBVNCQFoFkdAt9jbBKtga3V9lChoBmgJaA9DCCDQmbTpKHFAlIaUUpRoFUvQaBZHQLfY5ld1Mdt1fZQoaAZoCWgPQwj5n/zde/lxQJSGlFKUaBVNBwFoFkdAt9jmGSIP9XV9lChoBmgJaA9DCNo7o61K/XFAlIaUUpRoFUvpaBZHQLfZArpJPIp1fZQoaAZoCWgPQwitad5xCrFoQJSGlFKUaBVNOwJoFkdAt9kOMZP2wnV9lChoBmgJaA9DCPQxHxDo6XJAlIaUUpRoFUvfaBZHQLfZEgZjx1B1ZS4="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 368, "n_steps": 1024, "gamma": 0.999, "gae_lambda": 0.995, "ent_coef": 0.005, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 32, "n_epochs": 8, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWV+wIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwNX2J1aWx0aW5fdHlwZZSTlIwKTGFtYmRhVHlwZZSFlFKUKGgCjAhDb2RlVHlwZZSFlFKUKEsBSwBLAEsBSwFLE0MEiABTAJROhZQpjAFflIWUjGQvaG9tZS9uYWRpcmJla292L2FuYWNvbmRhMy9lbnZzL2hmLXJsL2xpYi9weXRob24zLjEwL3NpdGUtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5RLgEMEAIAA35SMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjGQvaG9tZS9uYWRpcmJla292L2FuYWNvbmRhMy9lbnZzL2hmLXJsL2xpYi9weXRob24zLjEwL3NpdGUtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaCB9lH2UKGgXaA6MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgYjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz/JmZmZmZmahZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "system_info": {"OS": "Linux-5.10.16.3-microsoft-standard-WSL2-x86_64-with-glibc2.31 #1 SMP Fri Apr 2 22:23:49 UTC 2021", "Python": "3.10.4", "Stable-Baselines3": "1.5.0", "PyTorch": "1.11.0", "GPU Enabled": "True", "Numpy": "1.21.5", "Gym": "0.21.0"}}
ppo-LunarLander-v2.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:59c80de87083103c96119a1d216aabbb417f9dd26b65252183ee94cbcc2b9396
3
- size 144193
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ab1fce010a6e4fb7f4f6164d262b6bfb83815ec888ab742a97a99e005971cd62
3
+ size 146297
ppo-LunarLander-v2/data CHANGED
@@ -4,19 +4,19 @@
4
  ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
5
  "__module__": "stable_baselines3.common.policies",
6
  "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param sde_net_arch: Network architecture for extracting features\n when using gSDE. If None, the latent features from the policy will be used.\n Pass an empty list to use the states as features.\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
7
- "__init__": "<function ActorCriticPolicy.__init__ at 0x7f1926842f80>",
8
- "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f1926843010>",
9
- "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f19268430a0>",
10
- "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f1926843130>",
11
- "_build": "<function ActorCriticPolicy._build at 0x7f19268431c0>",
12
- "forward": "<function ActorCriticPolicy.forward at 0x7f1926843250>",
13
- "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f19268432e0>",
14
- "_predict": "<function ActorCriticPolicy._predict at 0x7f1926843370>",
15
- "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f1926843400>",
16
- "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f1926843490>",
17
- "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f1926843520>",
18
  "__abstractmethods__": "frozenset()",
19
- "_abc_impl": "<_abc._abc_data object at 0x7f1926845a80>"
20
  },
21
  "verbose": 1,
22
  "policy_kwargs": {},
@@ -41,13 +41,13 @@
41
  "dtype": "int64",
42
  "_np_random": null
43
  },
44
- "n_envs": 16,
45
- "num_timesteps": 2015232,
46
- "_total_timesteps": 2000000,
47
  "_num_timesteps_at_start": 0,
48
  "seed": null,
49
  "action_noise": null,
50
- "start_time": 1652207206.5813828,
51
  "learning_rate": 0.0003,
52
  "tensorboard_log": null,
53
  "lr_schedule": {
@@ -56,26 +56,26 @@
56
  },
57
  "_last_obs": {
58
  ":type:": "<class 'numpy.ndarray'>",
59
- ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAANooub3QPP4+YNblvSsz474OR8O9yaIfvQAAAAAAAAAAgE4dvVJMVD7pnCW+UKqrvgkPsL36HoY8AAAAAAAAAABmiCy8tjAQvDJcSD2McZ48Tk93PRlgg70AAIA/AACAP5r+nr0T74M/IGxSvgcvFr+I4Sy9wzMlvQAAAAAAAAAAGnIjvsOIEz/WKbW8xCnlvnZ46r1rSyw9AAAAAAAAAADNzDu7vRtaPFvNvT0DzlO+CP6BveeXLj0AAAAAAAAAAHPwj70qXp8/ZeRVvoJRJL9PKby9nMQqPAAAAAAAAAAA/VNaviULlT66/oc+VKRavg9ttLz9OdY8AAAAAAAAAADzAE4+w7+3P952HT8LPpe+7XywPkparD4AAAAAAAAAAJrNST0fxaS5Lh2FMcsa4ilnsbc7Y+7ysQAAgD8AAIA/jdfcPWsHbj84RJo9+qnavgOXkD4USb+9AAAAAAAAAABNq/a9jHHEPlX3/DxShqm+OouMvSYSrD0AAAAAAAAAAGa90LxCbLs/RWisvr17hD62gsq6MK3nvQAAAAAAAAAAZmw/veHEqrqlsbG2l4yusRNKPjr3lMw1AACAPwAAgD9aHng+/MySP/oUQT5B8tO+cCQIPxlZKj0AAAAAAAAAAI1eKL7fAIM+4IKtPtKMab4fOS09eqpTPQAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="
60
  },
61
  "_last_episode_starts": {
62
  ":type:": "<class 'numpy.ndarray'>",
63
- ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="
64
  },
65
  "_last_original_obs": null,
66
  "_episode_num": 0,
67
  "use_sde": false,
68
  "sde_sample_freq": -1,
69
- "_current_progress_remaining": -0.007616000000000067,
70
  "ep_info_buffer": {
71
  ":type:": "<class 'collections.deque'>",
72
- ":serialized:": "gAWVKxAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIYtwNovVtcECUhpRSlIwBbJRNAAGMAXSUR0C5PBCUHIIXdX2UKGgGaAloD0MIyXTo9LwYcUCUhpRSlGgVS89oFkdAuTwnJKaodnV9lChoBmgJaA9DCAAAAABABXJAlIaUUpRoFUv5aBZHQLk8Rz06HTJ1fZQoaAZoCWgPQwg4oRABBxByQJSGlFKUaBVLzmgWR0C5PHlkDp1SdX2UKGgGaAloD0MIjln2JDC9b0CUhpRSlGgVS/VoFkdAuTy0+PikwnV9lChoBmgJaA9DCEta8Q0FYG5AlIaUUpRoFUvPaBZHQLk8ub6xgRd1fZQoaAZoCWgPQwgNcEG27K1xQJSGlFKUaBVLy2gWR0C5PL8chkiEdX2UKGgGaAloD0MIQBU3bjFfU0CUhpRSlGgVS7BoFkdAuTzH4+KTCHV9lChoBmgJaA9DCAn/ImjMnHBAlIaUUpRoFUvTaBZHQLk8/UGmk311fZQoaAZoCWgPQwjbTlsjAqRzQJSGlFKUaBVL/WgWR0C5PRX6ZYxMdX2UKGgGaAloD0MIE7afjPHXSECUhpRSlGgVS59oFkdAuT0awTufEnV9lChoBmgJaA9DCNVbA1sl7nBAlIaUUpRoFUvDaBZHQLk9PaHbh3t1fZQoaAZoCWgPQwhYdVYL7P5wQJSGlFKUaBVL2WgWR0C5PU1HOKO1dX2UKGgGaAloD0MIDmsqi4JUcECUhpRSlGgVS+poFkdAuT1p3t8eCHV9lChoBmgJaA9DCBkAqrixBXBAlIaUUpRoFUveaBZHQLk9a9AHE/B1fZQoaAZoCWgPQwhmo3N+itZwQJSGlFKUaBVNAQFoFkdAuT2TgDRtxnV9lChoBmgJaA9DCBgFweNb5W9AlIaUUpRoFUvhaBZHQLk9y51eSjh1fZQoaAZoCWgPQwjIYMWpFohxQJSGlFKUaBVL/2gWR0C5PdqbWmP6dX2UKGgGaAloD0MIaD9SRIYHQ0CUhpRSlGgVS6doFkdAuT3ggZCOWHV9lChoBmgJaA9DCH9skh9xEnFAlIaUUpRoFUvdaBZHQLk9+BoVVPx1fZQoaAZoCWgPQwheMLjmTpRwQJSGlFKUaBVLxGgWR0C5Phlh5PdmdX2UKGgGaAloD0MIBKvq5fcHc0CUhpRSlGgVS9VoFkdAuT4kYTCcgHV9lChoBmgJaA9DCOVjd4GSvXFAlIaUUpRoFUu/aBZHQLk+ZEb5uZV1fZQoaAZoCWgPQwi+huC4jENxQJSGlFKUaBVL1mgWR0C5Pm9Eb5uZdX2UKGgGaAloD0MImUaTizEWckCUhpRSlGgVTQkBaBZHQLk+gJ66asp1fZQoaAZoCWgPQwgVHcnlv19wQJSGlFKUaBVL6WgWR0C5PqZR8+ibdX2UKGgGaAloD0MI39xfPW60cUCUhpRSlGgVS9RoFkdAuUu+JGe+VXV9lChoBmgJaA9DCOz5muWyh3BAlIaUUpRoFUvGaBZHQLlLwmuDBdl1fZQoaAZoCWgPQwguVWmLq1VyQJSGlFKUaBVLx2gWR0C5S8KLfk3kdX2UKGgGaAloD0MInx7bMmAmcUCUhpRSlGgVS8RoFkdAuUvcE7nxKHV9lChoBmgJaA9DCPGhREuelmxAlIaUUpRoFUvLaBZHQLlMHu1F6Rh1fZQoaAZoCWgPQwjmB67yBLVxQJSGlFKUaBVL0WgWR0C5TCMrEtNBdX2UKGgGaAloD0MILUFGQIXscUCUhpRSlGgVS+FoFkdAuUwu/nGKh3V9lChoBmgJaA9DCOOON/mtpXNAlIaUUpRoFUvGaBZHQLlMSFXJYDF1fZQoaAZoCWgPQwgfSUkPg0ZxQJSGlFKUaBVL1mgWR0C5TGcpsoDxdX2UKGgGaAloD0MIMQkX8ohWckCUhpRSlGgVS/BoFkdAuUxnWwu/UXV9lChoBmgJaA9DCHwPlxy323FAlIaUUpRoFU1pAWgWR0C5THyV0Lc9dX2UKGgGaAloD0MINfEO8CT9b0CUhpRSlGgVS+VoFkdAuUyv0OEuhHV9lChoBmgJaA9DCI9xxcVRmHBAlIaUUpRoFUvQaBZHQLlM3ttALRd1fZQoaAZoCWgPQwiBsilXeLxxQJSGlFKUaBVNCQFoFkdAuUzzNorWiHV9lChoBmgJaA9DCJSHhVqTcHJAlIaUUpRoFUvdaBZHQLlM96By0a91fZQoaAZoCWgPQwgHlbiO8UdyQJSGlFKUaBVL0mgWR0C5TQX4TK1YdX2UKGgGaAloD0MIOMDMd3BrcECUhpRSlGgVS/BoFkdAuU0TrHEMs3V9lChoBmgJaA9DCJoklpQ7uHJAlIaUUpRoFU0oAWgWR0C5TS+UD+zddX2UKGgGaAloD0MIshLzrGR5ckCUhpRSlGgVTRwBaBZHQLlNPVmBe5Z1fZQoaAZoCWgPQwgm/5O/O89yQJSGlFKUaBVL0GgWR0C5TUtxZMcqdX2UKGgGaAloD0MI8UdRZ+6Ec0CUhpRSlGgVS/RoFkdAuU2O6RQrMHV9lChoBmgJaA9DCMWRByKL3G1AlIaUUpRoFUvOaBZHQLlNkoq0+kh1fZQoaAZoCWgPQwi+FYkJ6npxQJSGlFKUaBVL6GgWR0C5TZmGVRk3dX2UKGgGaAloD0MI4bVLG04KcUCUhpRSlGgVTQYBaBZHQLlNoCZWq951fZQoaAZoCWgPQwhlxXB1gKFxQJSGlFKUaBVL4GgWR0C5TbDm4iHJdX2UKGgGaAloD0MIZ7Yr9MEwZ0CUhpRSlGgVTegDaBZHQLlNznUUfxN1fZQoaAZoCWgPQwjIBtLFJgJxQJSGlFKUaBVL2GgWR0C5Tfhp1zQvdX2UKGgGaAloD0MI18BWCRa0UUCUhpRSlGgVS6VoFkdAuU4MMPSUknV9lChoBmgJaA9DCH0Iqkbv3nNAlIaUUpRoFU0gAWgWR0C5Ti1VHWjHdX2UKGgGaAloD0MIgbIpVziocECUhpRSlGgVS9JoFkdAuU41EQXhwXV9lChoBmgJaA9DCNNqSNwjzHJAlIaUUpRoFUveaBZHQLlOQt/FzdV1fZQoaAZoCWgPQwhmTwKbs+pxQJSGlFKUaBVL1WgWR0C5TkkUO/cndX2UKGgGaAloD0MIELOXbaeqcECUhpRSlGgVS9ZoFkdAuU51DneSCHV9lChoBmgJaA9DCK7xmewfUnBAlIaUUpRoFUvNaBZHQLlOdp97Wup1fZQoaAZoCWgPQwjIs8u3/vpyQJSGlFKUaBVNIQFoFkdAuU6VTdcjaHV9lChoBmgJaA9DCDuOHyoNEHJAlIaUUpRoFUveaBZHQLlOoER8MNN1fZQoaAZoCWgPQwgMlBRYAFc3QJSGlFKUaBVLtmgWR0C5Trf863iJdX2UKGgGaAloD0MIUIwsmaMhc0CUhpRSlGgVS9NoFkdAuU7UfyPMjnV9lChoBmgJaA9DCAFuFi8WwW5AlIaUUpRoFUvTaBZHQLlO3efI0ZZ1fZQoaAZoCWgPQwgxJZLoJZ9yQJSGlFKUaBVLyGgWR0C5TuJKSPludX2UKGgGaAloD0MIJ79FJ8ssckCUhpRSlGgVS8loFkdAuU8BakhzNnV9lChoBmgJaA9DCHRiD+2jynBAlIaUUpRoFUv3aBZHQLlPEJx//ed1fZQoaAZoCWgPQwjHuU24F0VzQJSGlFKUaBVLz2gWR0C5TzFJDmbLdX2UKGgGaAloD0MI4Zumzw4WcUCUhpRSlGgVS8NoFkdAuU9qIbfgrHV9lChoBmgJaA9DCByZR/7g9G9AlIaUUpRoFUvWaBZHQLlPe1jy4F11fZQoaAZoCWgPQwialIJur0VvQJSGlFKUaBVL9mgWR0C5T4RDohZAdX2UKGgGaAloD0MIsDcxJKfNbkCUhpRSlGgVS9BoFkdAuU+4Bfa6BnV9lChoBmgJaA9DCDDxR1Fn3XJAlIaUUpRoFU0JAWgWR0C5T8ZKSPludX2UKGgGaAloD0MIggAZOjYnckCUhpRSlGgVS/loFkdAuU/J03fhuXV9lChoBmgJaA9DCNPddTYkjXNAlIaUUpRoFUvcaBZHQLlPy3Tuv2Z1fZQoaAZoCWgPQwhdv2A37GNvQJSGlFKUaBVL5GgWR0C5T/Rdt2s8dX2UKGgGaAloD0MI9zk+WpwucECUhpRSlGgVS81oFkdAuU/4G/vfCXV9lChoBmgJaA9DCCKNCpxshnFAlIaUUpRoFUu9aBZHQLlQCKxcE/11fZQoaAZoCWgPQwgWhV0U/cByQJSGlFKUaBVLxGgWR0C5UDJZbILgdX2UKGgGaAloD0MIOxvyz4wBcECUhpRSlGgVTQkBaBZHQLlQO4yXUpd1fZQoaAZoCWgPQwj5vyMq1GlvQJSGlFKUaBVLzGgWR0C5UFQvtdAxdX2UKGgGaAloD0MI2cwhqQVVc0CUhpRSlGgVS/toFkdAuVBtQuVX3nV9lChoBmgJaA9DCHwsfejCsnBAlIaUUpRoFUvGaBZHQLlQcVxjriV1fZQoaAZoCWgPQwhuvhHdM7FyQJSGlFKUaBVNEAFoFkdAuVCGPMjeK3V9lChoBmgJaA9DCMNmgAvylXNAlIaUUpRoFUvAaBZHQLlQoLKV6eJ1fZQoaAZoCWgPQwg0SSwp9/FxQJSGlFKUaBVLvmgWR0C5UK5PAO8TdX2UKGgGaAloD0MI3sfRHFmMckCUhpRSlGgVS81oFkdAuVDO/IsAenV9lChoBmgJaA9DCHo2qz7XMXNAlIaUUpRoFUu9aBZHQLlQ+5avA451fZQoaAZoCWgPQwhm9nmMcrdvQJSGlFKUaBVLy2gWR0C5UQ8brC3xdX2UKGgGaAloD0MIFoielIltc0CUhpRSlGgVS+FoFkdAuVEmUliSaHV9lChoBmgJaA9DCLggW5YvPHFAlIaUUpRoFUvBaBZHQLlRSBFd9lV1fZQoaAZoCWgPQwiEnWLV4IZzQJSGlFKUaBVL1GgWR0C5UVEr08NhdX2UKGgGaAloD0MInGuYoXGtcECUhpRSlGgVS/VoFkdAuVFX6LwWnHV9lChoBmgJaA9DCDi7tUwGZnBAlIaUUpRoFUvLaBZHQLlRjgGbCrN1fZQoaAZoCWgPQwi3fvrPWkpwQJSGlFKUaBVL+WgWR0C5UZLfDUExdX2UKGgGaAloD0MIb7plh/irbkCUhpRSlGgVS9hoFkdAuVGaqHXVb3V9lChoBmgJaA9DCI+Oq5Fd3m5AlIaUUpRoFUvIaBZHQLlRnYb83uN1fZQoaAZoCWgPQwghH/RsFt1xQJSGlFKUaBVLwmgWR0C5UawSeyzHdX2UKGgGaAloD0MI2QjE6/qgckCUhpRSlGgVS9ZoFkdAuVHPHvMKTnVlLg=="
73
  },
74
  "ep_success_buffer": {
75
  ":type:": "<class 'collections.deque'>",
76
  ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
77
  },
78
- "_n_updates": 492,
79
  "n_steps": 1024,
80
  "gamma": 0.999,
81
  "gae_lambda": 0.995,
@@ -83,10 +83,10 @@
83
  "vf_coef": 0.5,
84
  "max_grad_norm": 0.5,
85
  "batch_size": 32,
86
- "n_epochs": 4,
87
  "clip_range": {
88
  ":type:": "<class 'function'>",
89
- ":serialized:": "gAWV+QIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwNX2J1aWx0aW5fdHlwZZSTlIwKTGFtYmRhVHlwZZSFlFKUKGgCjAhDb2RlVHlwZZSFlFKUKEsBSwBLAEsBSwFLE0MEiABTAJROhZQpjAFflIWUjGQvaG9tZS9uYWRpcmJla292L2FuYWNvbmRhMy9lbnZzL2hmLXJsL2xpYi9weXRob24zLjEwL3NpdGUtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5RLgEMCAA2UjAN2YWyUhZQpdJRSlH2UKIwLX19wYWNrYWdlX1+UjBhzdGFibGVfYmFzZWxpbmVzMy5jb21tb26UjAhfX25hbWVfX5SMHnN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi51dGlsc5SMCF9fZmlsZV9flIxkL2hvbWUvbmFkaXJiZWtvdi9hbmFjb25kYTMvZW52cy9oZi1ybC9saWIvcHl0aG9uMy4xMC9zaXRlLXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGggfZR9lChoF2gOjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoGIwHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/yZmZmZmZmoWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="
90
  },
91
  "clip_range_vf": null,
92
  "normalize_advantage": true,
 
4
  ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
5
  "__module__": "stable_baselines3.common.policies",
6
  "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param sde_net_arch: Network architecture for extracting features\n when using gSDE. If None, the latent features from the policy will be used.\n Pass an empty list to use the states as features.\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
7
+ "__init__": "<function ActorCriticPolicy.__init__ at 0x7f07385125f0>",
8
+ "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f0738512680>",
9
+ "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f0738512710>",
10
+ "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f07385127a0>",
11
+ "_build": "<function ActorCriticPolicy._build at 0x7f0738512830>",
12
+ "forward": "<function ActorCriticPolicy.forward at 0x7f07385128c0>",
13
+ "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f0738512950>",
14
+ "_predict": "<function ActorCriticPolicy._predict at 0x7f07385129e0>",
15
+ "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f0738512a70>",
16
+ "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f0738512b00>",
17
+ "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f0738512b90>",
18
  "__abstractmethods__": "frozenset()",
19
+ "_abc_impl": "<_abc._abc_data object at 0x7f07385157c0>"
20
  },
21
  "verbose": 1,
22
  "policy_kwargs": {},
 
41
  "dtype": "int64",
42
  "_np_random": null
43
  },
44
+ "n_envs": 64,
45
+ "num_timesteps": 3014656,
46
+ "_total_timesteps": 3000000,
47
  "_num_timesteps_at_start": 0,
48
  "seed": null,
49
  "action_noise": null,
50
+ "start_time": 1652378866.9388123,
51
  "learning_rate": 0.0003,
52
  "tensorboard_log": null,
53
  "lr_schedule": {
 
56
  },
57
  "_last_obs": {
58
  ":type:": "<class 'numpy.ndarray'>",
59
+ ":serialized:": "gAWVdQgAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYACAAAAAAAAOYgBj2PxlK6n4UbOVHWfba2qYI6VQkzuAAAgD8AAIA/msHEPJBWtD+2GRw+qsZFvsIJVD0+Oq89AAAAAAAAAABmWOg8gWnNPc68Tj3s2ZW+bTh7PeqrvDsAAAAAAAAAAC1jCr4X+Ws+RXOnPkFEmb50+wI8EGrzPQAAAAAAAAAAZmdJPc4vtT/y7yw/keFNvSIUkLyY/Is9AAAAAAAAAADNQhg9XNt4uuVjILZMeJGxY4bgOnvGQjUAAIA/AACAP81vRz6r8pM/AOQmPsLPFL9zLoE+r5yBPAAAAAAAAAAAswpEPY34ij6AZcy9oUOpvhVGJT091kM9AAAAAAAAAAAzAcw87a9BPvlcOr5h4sG++qVVvAOIwLwAAAAAAAAAAE0WK76FR6w/ZhAHv4PU577yxV6+Iul6vgAAAAAAAAAAJprKvTbjsz+CC8W+a3Chvj2oirxwZ/e9AAAAAAAAAACzqq69nwyXP0JTx77B3iK/Qk0FvqJpSL4AAAAAAAAAAK2lJL5PhhU/eg4ZPmrd6b553QS+BiT2PQAAAAAAAAAApmgHPs4G4z5tDO+9SWLZvlCcxj3/RwS+AAAAAAAAAABmPYw84GmYP2Uysj3wGyS/Y+IHPSmBn70AAAAAAAAAAGZS6rzhTJW6Gs2FOcZNATWMs8E6LVmYuAAAgD8AAIA/mpm8uQ+aBz2yoAI+ljObvl+w3jxLA4E9AAAAAAAAAABmQKu84QqTOUHnkLsRL4G5lCQUu1B+tToAAIA/AACAP82M0zkUsrW6/YJwvOcsgTwKkdM72rxgvQAAgD8AAIA/bekBvvP5Bj/921Q+h37Vvmpey724maE9AAAAAAAAAABmgEY9wwl6ukZENTgCixEzC6itumCFU7cAAIA/AACAP+bQKD4gS6E/ahCxPiJgGr8KHoM+++EjPQAAAAAAAAAA9viUPtYQHj8+58E8VmYSv23NGD9ypQO9AAAAAAAAAACaxMO8D2gNvEpQ0D1QIry674NlvRdBA7sAAIA/AACAP6trgr5/gUI//aW2vQKN+L6NsKu+om26PQAAAAAAAAAAZpZ7vHbtDrzaIjM8hZUoPTPhl7vQV066AACAPwAAgD/Ni2u+EDNRP94137w+ahO/ZQuWvuWu4TwAAAAAAAAAAM3aLz32oHS6lqwINcCIlTCreAe7YklqtAAAgD8AAIA/ZqpUPGhOrLxCW6Y78ttJPHi6GT73wiK9AACAPwAAgD9mBIW8+XqxPyrMCr+DNsa+OQJoPM/1nz0AAAAAAAAAADPgdT328EW67WbJPEfNu7yCuOi68kPFvAAAAAAAAAAAjROOPc5cgrz9MEy+N/R7PUKy5j2P0Lc6AAAAAAAAgD+a2u48kGSWP4cwgz3gRPK+pAOTPbikjj0AAAAAAAAAADqzLb6BHcI/yFcvv8Yrt71X7gS+olyZvgAAAAAAAAAAMzU+vZPFzT6dGB0+qXXsvleNoTwYhLg9AAAAAAAAAACaJTk9NcF7PkLBYL5GDNq+I6ojvcqXcL4AAAAAAAAAAK1kXr7G+Kc/npz7vofB+r7JJ5m+MgM2vgAAAAAAAAAAANwMPYjXt7wkq0U+AhNQPXUTBr64J4M8AACAPwAAgD8A13o+huFOP9Y+gj7VNAS/we/ePpZmGT4AAAAAAAAAADOMjj3hYI26VuF/OGZNfDNkHro64WKUtwAAgD8AAIA/M/WrPFRU7z2+DYq9p0SwvsbD+L3RRBG9AAAAAAAAAAAmzJu9r3YjPmKm+j7POaC+k5OIPqKbHj4AAAAAAAAAAOanS70Sja4/q6Ofvv3Wpr4VsC+92/T9vQAAAAAAAAAAzdIZvBfYsT/us2a+T6+OvmEbhDt5nbS8AAAAAAAAAADNHI67KXgIupuvTDNa6AGwh+/gOgZzzbMAAIA/AACAP7NrFb0XSDg+Lx3Gvhbzkb5RCbC+q9KIvQAAAAAAAAAAs0B9Po1nrz4Y6Lm+TnzXvknOVD4aYV++AAAAAAAAAAAA6CA8rY18PrqoxbzlqaO+NWkcPGAI3TwAAAAAAAAAADOjjLvsxuy7s8TMO/tggjzou0q9PTpcPQAAgD8AAIA/M2gyva45ibqCIjc3vIU3MtkdcrkuD1W2AACAPwAAgD+aWfE7KWAgum3Pzje3xzm2daNPOvvr67YAAIA/AACAP5rd6Dt8g1E+3OwJvaDiy763alS8LdLnOwAAAAAAAAAAADApPRSkkLq2MGu5VVVZtNEQMzoCaYg4AACAPwAAgD8AxdE8w7lyutZmjjj+Wha2EUZOO19AobcAAIA/AACAP5qqAL0eoYI9zXH6Pe/kcr4G/3Y9G0tkPQAAAAAAAAAAM88HPTaAoT8zEyo+vKUPv03CNj2lPpA9AAAAAAAAAACGkYA+f5cCP5vVar6R6P6+EfcuPrGiQ74AAAAAAAAAAENHf75YwrM+aGPKPus48L7WQ1W+3FyaPgAAAAAAAAAAs0MhPeFsrrrqYW63dXELsmcR1DhTrIg2AACAPwAAgD8a55O9qcx0PboEsz4WfYS+OScxPcP+Pz4AAAAAAAAAAAAT2b2Pfmq6vkvcuvNUY7VWe6a664P5OQAAgD8AAAAAZmqLPY8mR7rc1BQ+Tf/VNXtHRzo0/sc0AACAPwAAgD+zNig9ru+Eut8ApDZpmaox8hL+OmHYwrUAAIA/AACAP7OZDj38Qhs+FmQRvsskw75MHig704GovQAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYktASwiGlIwBQ5R0lFKULg=="
60
  },
61
  "_last_episode_starts": {
62
  ":type:": "<class 'numpy.ndarray'>",
63
+ ":serialized:": "gAWVswAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJZAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiS0CFlIwBQ5R0lFKULg=="
64
  },
65
  "_last_original_obs": null,
66
  "_episode_num": 0,
67
  "use_sde": false,
68
  "sde_sample_freq": -1,
69
+ "_current_progress_remaining": -0.004885333333333408,
70
  "ep_info_buffer": {
71
  ":type:": "<class 'collections.deque'>",
72
+ ":serialized:": "gAWVJhAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMI0NA/wQUKcECUhpRSlIwBbJRL3YwBdJRHQLfT/V8Ti851fZQoaAZoCWgPQwg+PEuQkc5zQJSGlFKUaBVLzGgWR0C31AEygwoLdX2UKGgGaAloD0MIbhYvFgbbcUCUhpRSlGgVS+doFkdAt9QwyKvV3HV9lChoBmgJaA9DCMKjjSNWdnJAlIaUUpRoFU1UAWgWR0C31DDj7yhBdX2UKGgGaAloD0MIEJaxoVs6cUCUhpRSlGgVS9FoFkdAt9Q0tbs4UHV9lChoBmgJaA9DCMXIkjkWvm9AlIaUUpRoFUvCaBZHQLfUTi5NGmV1fZQoaAZoCWgPQwiqu7ILhiZyQJSGlFKUaBVLxGgWR0C31E40qH45dX2UKGgGaAloD0MIvqPGhBgQckCUhpRSlGgVS9loFkdAt9Rug6EJ0HV9lChoBmgJaA9DCFKazeOwRHBAlIaUUpRoFUvbaBZHQLfUckxyn1p1fZQoaAZoCWgPQwhl+5C3nMJwQJSGlFKUaBVLymgWR0C31HJU1hsqdX2UKGgGaAloD0MIv7m/elw7ckCUhpRSlGgVS9poFkdAt9R5m6GxlnV9lChoBmgJaA9DCJGA0eWNTnJAlIaUUpRoFUvvaBZHQLfUi1RceKd1fZQoaAZoCWgPQwigppat9epwQJSGlFKUaBVL1GgWR0C31Itl2/zrdX2UKGgGaAloD0MI6Q/NPPmAcECUhpRSlGgVS9VoFkdAt9TEI4VARnV9lChoBmgJaA9DCEtXsI24dXNAlIaUUpRoFUvraBZHQLfUz03fhuR1fZQoaAZoCWgPQwjK+s3EtGNzQJSGlFKUaBVNBwFoFkdAt9TS/zreInV9lChoBmgJaA9DCCh9IeS8J3FAlIaUUpRoFUvSaBZHQLfU4WyTpxF1fZQoaAZoCWgPQwiWJM/1PQhwQJSGlFKUaBVLzWgWR0C31OxRAKOUdX2UKGgGaAloD0MIOZhNgCFMcUCUhpRSlGgVS9NoFkdAt9Tz9bX6InV9lChoBmgJaA9DCLlPjgJEV3JAlIaUUpRoFUuxaBZHQLfU/wAlv611fZQoaAZoCWgPQwijVpi+1yw7QJSGlFKUaBVLnmgWR0C31QpZbILgdX2UKGgGaAloD0MIP8bctUTQcECUhpRSlGgVS9JoFkdAt9UbOD8Lr3V9lChoBmgJaA9DCF8JpMQu1HBAlIaUUpRoFU0KAWgWR0C31Rt0vGp/dX2UKGgGaAloD0MIE/QXesQtcECUhpRSlGgVS8BoFkdAt9UuBVdX1nV9lChoBmgJaA9DCMdmR6rvlXBAlIaUUpRoFUvYaBZHQLfVQ9deIEd1fZQoaAZoCWgPQwhCPujZrJRwQJSGlFKUaBVL2WgWR0C31U845tFbdX2UKGgGaAloD0MI2+BE9OtTckCUhpRSlGgVS+xoFkdAt9Vd2t+1B3V9lChoBmgJaA9DCJ+QnbfxX3NAlIaUUpRoFUvdaBZHQLfVYbn5i3J1fZQoaAZoCWgPQwicU8kAUINvQJSGlFKUaBVL92gWR0C31WlG5MDfdX2UKGgGaAloD0MII8DpXbwzcUCUhpRSlGgVS9doFkdAt9VwSWZ7X3V9lChoBmgJaA9DCHtntFVJanJAlIaUUpRoFUvyaBZHQLfVd5q/M4d1fZQoaAZoCWgPQwhwd9ZuO15wQJSGlFKUaBVLzWgWR0C31Y26wt8NdX2UKGgGaAloD0MI5dTOMPVecUCUhpRSlGgVS/loFkdAt9WN98Z1m3V9lChoBmgJaA9DCJcA/FPqtnFAlIaUUpRoFUvGaBZHQLfVlRFZxJd1fZQoaAZoCWgPQwipF3yaE3NwQJSGlFKUaBVL+2gWR0C31a2mP5pKdX2UKGgGaAloD0MI2qoksg87ckCUhpRSlGgVS9toFkdAt9W4VwgkknV9lChoBmgJaA9DCJseFJQiH3FAlIaUUpRoFUu4aBZHQLfVylnAZbZ1fZQoaAZoCWgPQwghyEEJM7dLQJSGlFKUaBVLp2gWR0C31eqpDNQkdX2UKGgGaAloD0MITwKbc3Cdc0CUhpRSlGgVS9VoFkdAt9X3VhCtzXV9lChoBmgJaA9DCFXejnCaw3BAlIaUUpRoFUvmaBZHQLfV96Kcd5p1fZQoaAZoCWgPQwgIyJdQQdxwQJSGlFKUaBVL1WgWR0C31f+U+s5odX2UKGgGaAloD0MI22/tRMk8bkCUhpRSlGgVS9JoFkdAt9YHaQFLWnV9lChoBmgJaA9DCJ0PzxJkTHJAlIaUUpRoFUvZaBZHQLfWC1zhgmZ1fZQoaAZoCWgPQwgZyLPLN19xQJSGlFKUaBVL4GgWR0C31hLcXWOIdX2UKGgGaAloD0MIONvcmF5OckCUhpRSlGgVS/FoFkdAt9YS/M4cWHV9lChoBmgJaA9DCKlqgqi7V3BAlIaUUpRoFUvUaBZHQLfWGgGr0at1fZQoaAZoCWgPQwh41JgQ87FyQJSGlFKUaBVL62gWR0C31hoh6jWTdX2UKGgGaAloD0MIZw+0AkMsb0CUhpRSlGgVS+1oFkdAt9YkaLn9vXV9lChoBmgJaA9DCI4G8BZItnFAlIaUUpRoFUvJaBZHQLfWJGyX2M91fZQoaAZoCWgPQwhwXpz4qsxxQJSGlFKUaBVLyGgWR0C31ljhcZ+AdX2UKGgGaAloD0MI0VlmEQqzcECUhpRSlGgVS8hoFkdAt9Z3PzFuN3V9lChoBmgJaA9DCGu28pL/629AlIaUUpRoFUvSaBZHQLfWhQC0WuZ1fZQoaAZoCWgPQwiIS4475VxxQJSGlFKUaBVL1GgWR0C31oiudPLxdX2UKGgGaAloD0MIiEZ3EPubcUCUhpRSlGgVS+NoFkdAt9aWoHcDbXV9lChoBmgJaA9DCKBrX0DvTnNAlIaUUpRoFUv/aBZHQLfWpR4QjD91fZQoaAZoCWgPQwgI46dxb0BzQJSGlFKUaBVNDAFoFkdAt9alUtI07HV9lChoBmgJaA9DCBGQL6ECYnNAlIaUUpRoFUvSaBZHQLfWr9MsYl91fZQoaAZoCWgPQwiCrn0B/SFxQJSGlFKUaBVLsGgWR0C31sqCL/CJdX2UKGgGaAloD0MIMX4a96a1ckCUhpRSlGgVS+doFkdAt9bXnU2DQXV9lChoBmgJaA9DCMGPativW3FAlIaUUpRoFUvQaBZHQLfW281n/T91fZQoaAZoCWgPQwi3skRnWd9xQJSGlFKUaBVL5mgWR0C31v5vo/zKdX2UKGgGaAloD0MIvvkNE00vcUCUhpRSlGgVS8hoFkdAt9cGW7e2u3V9lChoBmgJaA9DCPs/h/nyKnJAlIaUUpRoFUvYaBZHQLfXCgOz6ad1fZQoaAZoCWgPQwgD7KNTV+FxQJSGlFKUaBVLvWgWR0C31xweRxLkdX2UKGgGaAloD0MILo81IwNtcUCUhpRSlGgVS+xoFkdAt9cjatcOb3V9lChoBmgJaA9DCNvdA3Tfn21AlIaUUpRoFUvXaBZHQLfXOCNCJGh1fZQoaAZoCWgPQwgt0sQ7QAxzQJSGlFKUaBVL0GgWR0C31zuIRAbAdX2UKGgGaAloD0MIBcWPMfckb0CUhpRSlGgVS81oFkdAt9dRrgwXZXV9lChoBmgJaA9DCGe4AZ8fiXFAlIaUUpRoFUvIaBZHQLfXXMb3oLZ1fZQoaAZoCWgPQwiEud3LfVRxQJSGlFKUaBVLzWgWR0C3125TyauwdX2UKGgGaAloD0MIbJbLRucVckCUhpRSlGgVS+hoFkdAt9d1hc7henV9lChoBmgJaA9DCHLBGfy9WnBAlIaUUpRoFUvYaBZHQLfXhA2hqTN1fZQoaAZoCWgPQwiazk4Ghz5wQJSGlFKUaBVNmQFoFkdAt9eHz4DcM3V9lChoBmgJaA9DCJ55Oey+eHJAlIaUUpRoFUv/aBZHQLfXmNsFdLR1fZQoaAZoCWgPQwhgBmNEYgdyQJSGlFKUaBVLvWgWR0C315wvL5h0dX2UKGgGaAloD0MIwCUA/1RdckCUhpRSlGgVS8xoFkdAt9eyGmDUVnV9lChoBmgJaA9DCAA5YcJoPHNAlIaUUpRoFUvFaBZHQLfXsit7rs11fZQoaAZoCWgPQwh+UYL+whZwQJSGlFKUaBVLyGgWR0C319fRu0kXdX2UKGgGaAloD0MILzVCP1MZb0CUhpRSlGgVS8toFkdAt9fX81n/UHV9lChoBmgJaA9DCHZSX5Z2BXFAlIaUUpRoFUvZaBZHQLfX29TP0I11fZQoaAZoCWgPQwi139qJkstVQJSGlFKUaBVN6ANoFkdAt9frWhAWznV9lChoBmgJaA9DCN481SF3jHNAlIaUUpRoFUvoaBZHQLfYBx20Re11fZQoaAZoCWgPQwgvwakP5DdyQJSGlFKUaBVLyWgWR0C32CrlvIfbdX2UKGgGaAloD0MICfmgZ3P7cUCUhpRSlGgVS+xoFkdAt9gyEqUeMnV9lChoBmgJaA9DCLd++s9aYXJAlIaUUpRoFUvPaBZHQLfYRKcNH6N1fZQoaAZoCWgPQwj7PEZ5pntwQJSGlFKUaBVL5GgWR0C32HYbn5i3dX2UKGgGaAloD0MIbTgsDXxEcUCUhpRSlGgVS/FoFkdAt9h97u2JBXV9lChoBmgJaA9DCJEm3gGeZnFAlIaUUpRoFUvWaBZHQLfYjYpDu0F1fZQoaAZoCWgPQwiUoL/QIxJyQJSGlFKUaBVL1GgWR0C32KhTsIE9dX2UKGgGaAloD0MIl65gG/Ebb0CUhpRSlGgVS99oFkdAt9iwSAYpD3V9lChoBmgJaA9DCH0/NV56mHNAlIaUUpRoFUvTaBZHQLfYw9OARTV1fZQoaAZoCWgPQwhHHLKBNBVxQJSGlFKUaBVL9mgWR0C32MfIGQjmdX2UKGgGaAloD0MIpBmLpjPQcECUhpRSlGgVS+toFkdAt9jH3XZoPHV9lChoBmgJaA9DCKio+pUORXFAlIaUUpRoFUvvaBZHQLfYz7dSEUV1fZQoaAZoCWgPQwjBqQ8kL49xQJSGlFKUaBVNCQFoFkdAt9jbBKtga3V9lChoBmgJaA9DCCDQmbTpKHFAlIaUUpRoFUvQaBZHQLfY5ld1Mdt1fZQoaAZoCWgPQwj5n/zde/lxQJSGlFKUaBVNBwFoFkdAt9jmGSIP9XV9lChoBmgJaA9DCNo7o61K/XFAlIaUUpRoFUvpaBZHQLfZArpJPIp1fZQoaAZoCWgPQwitad5xCrFoQJSGlFKUaBVNOwJoFkdAt9kOMZP2wnV9lChoBmgJaA9DCPQxHxDo6XJAlIaUUpRoFUvfaBZHQLfZEgZjx1B1ZS4="
73
  },
74
  "ep_success_buffer": {
75
  ":type:": "<class 'collections.deque'>",
76
  ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
77
  },
78
+ "_n_updates": 368,
79
  "n_steps": 1024,
80
  "gamma": 0.999,
81
  "gae_lambda": 0.995,
 
83
  "vf_coef": 0.5,
84
  "max_grad_norm": 0.5,
85
  "batch_size": 32,
86
+ "n_epochs": 8,
87
  "clip_range": {
88
  ":type:": "<class 'function'>",
89
+ ":serialized:": "gAWV+wIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwNX2J1aWx0aW5fdHlwZZSTlIwKTGFtYmRhVHlwZZSFlFKUKGgCjAhDb2RlVHlwZZSFlFKUKEsBSwBLAEsBSwFLE0MEiABTAJROhZQpjAFflIWUjGQvaG9tZS9uYWRpcmJla292L2FuYWNvbmRhMy9lbnZzL2hmLXJsL2xpYi9weXRob24zLjEwL3NpdGUtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5RLgEMEAIAA35SMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjGQvaG9tZS9uYWRpcmJla292L2FuYWNvbmRhMy9lbnZzL2hmLXJsL2xpYi9weXRob24zLjEwL3NpdGUtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaCB9lH2UKGgXaA6MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgYjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz/JmZmZmZmahZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"
90
  },
91
  "clip_range_vf": null,
92
  "normalize_advantage": true,
ppo-LunarLander-v2/policy.optimizer.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6b6485e9e668109c31c5e862861da25a42d98f52ec13a9b7e977a7bb84a3fb78
3
  size 84893
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6ef1c8ad112a50edf305b6edd592d1425c3696e1367b4a27b84f2d671c777d87
3
  size 84893
ppo-LunarLander-v2/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:adea2eb9ff81020c63448420fd3208337c44b83ff8f8f3005459a675dcd8f401
3
  size 43201
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e0aaeaf1cc6272fd56d2a4a4e2e0ba1b552046dd864c7b5c0b31a3841dafdfb7
3
  size 43201
replay.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ad9574a65ca52c4f404658f078a21358f229bb50eceda6d6ee5333a1750004a5
3
- size 187339
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:283f01d9712ed7b8fdd1b2213f5a373f503a2608c7f13dc8b32011514be46be9
3
+ size 187838
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 276.25667652452285, "std_reward": 18.754370054400933, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2022-05-11T00:00:02.351431"}
 
1
+ {"mean_reward": 280.5823631041261, "std_reward": 16.128313581977128, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2022-05-12T23:00:04.406103"}