dk-crazydiv commited on
Commit
499d7e7
1 Parent(s): 8f8c6a0

longtraining1

Browse files
README.md CHANGED
@@ -10,7 +10,7 @@ model-index:
10
  results:
11
  - metrics:
12
  - type: mean_reward
13
- value: 293.21 +/- 12.62
14
  name: mean_reward
15
  task:
16
  type: reinforcement-learning
 
10
  results:
11
  - metrics:
12
  - type: mean_reward
13
+ value: 282.02 +/- 22.46
14
  name: mean_reward
15
  task:
16
  type: reinforcement-learning
config.json CHANGED
@@ -1 +1 @@
1
- {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param sde_net_arch: Network architecture for extracting features\n when using gSDE. If None, the latent features from the policy will be used.\n Pass an empty list to use the states as features.\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7f6a47db93b0>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f6a47db9440>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f6a47db94d0>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f6a47db9560>", "_build": "<function ActorCriticPolicy._build at 0x7f6a47db95f0>", "forward": "<function ActorCriticPolicy.forward at 0x7f6a47db9680>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f6a47db9710>", "_predict": "<function ActorCriticPolicy._predict at 0x7f6a47db97a0>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f6a47db9830>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f6a47db98c0>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f6a47db9950>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc_data object at 0x7f6a47e0b480>"}, "verbose": 1, "policy_kwargs": {}, "observation_space": {":type:": "<class 'gym.spaces.box.Box'>", ":serialized:": "gAWVnwEAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLCIWUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWIAAAAAAAAAAAAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/5RoCksIhZSMAUOUdJRSlIwEaGlnaJRoEiiWIAAAAAAAAAAAAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAf5RoCksIhZRoFXSUUpSMDWJvdW5kZWRfYmVsb3eUaBIolggAAAAAAAAAAAAAAAAAAACUaAeMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLCIWUaBV0lFKUjA1ib3VuZGVkX2Fib3ZllGgSKJYIAAAAAAAAAAAAAAAAAAAAlGghSwiFlGgVdJRSlIwKX25wX3JhbmRvbZROdWIu", "dtype": "float32", "_shape": [8], "low": "[-inf -inf -inf -inf -inf -inf -inf -inf]", "high": "[inf inf inf inf inf inf inf inf]", "bounded_below": "[False False False False False False False False]", "bounded_above": "[False False False False False False False False]", "_np_random": null}, "action_space": {":type:": "<class 'gym.spaces.discrete.Discrete'>", ":serialized:": "gAWVggAAAAAAAACME2d5bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpRLBIwGX3NoYXBllCmMBWR0eXBllIwFbnVtcHmUaAeTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYowKX25wX3JhbmRvbZROdWIu", "n": 4, "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 16, "num_timesteps": 49152, "_total_timesteps": 40000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1651747358.8787131, "learning_rate": 0.0003, "tensorboard_log": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVvwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwNX2J1aWx0aW5fdHlwZZSTlIwKTGFtYmRhVHlwZZSFlFKUKGgCjAhDb2RlVHlwZZSFlFKUKEsBSwBLAUsBSxNDBIgAUwCUToWUKYwBX5SFlIxIL3Vzci9sb2NhbC9saWIvcHl0aG9uMy43L2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5RLgEMCAAGUjAN2YWyUhZQpdJRSlH2UKIwLX19wYWNrYWdlX1+UjBhzdGFibGVfYmFzZWxpbmVzMy5jb21tb26UjAhfX25hbWVfX5SMHnN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi51dGlsc5SMCF9fZmlsZV9flIxIL3Vzci9sb2NhbC9saWIvcHl0aG9uMy43L2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaCB9lH2UKGgXaA6MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgYjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz8zqSowVTJhhZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAFP7A74TbYM/tF6DvlNoIr9Fv4e+IekrvgAAAAAAAAAAsy4kvhCNjj6BtI0+EgTtvo6qe730VRI+AAAAAAAAAACAZxq+H3gDP25IjT7luu2++q2hvWJ56T0AAAAAAAAAAFPGqb65Xz4/tbssPswFBr81lsy+pq9PPgAAAAAAAAAAmnnvuky0tD/XhT2+7H0XPckxCzsUuCs9AAAAAAAAAAAA/G69KRM6vIaRXz0caXs89umbvdo4UD0AAIA/AACAPwCAeDyPqim6HHQcs13L8a7CYnG77tvBMwAAgD8AAIA/MzgDPoR6gj7uA+W+t0gHv0ZiYrwuTKW+AAAAAAAAAADAUYO9lwpyP/Ou8L1Jayu/SEGrvWBKlb0AAAAAAAAAADOTj72yn5w/AAqqvllgK7+twPW9pVYsvgAAAAAAAAAAM438vOHVnTt+zJc+v2eOviu1/D0rMBq/AAAAAAAAgD/NLV4+skSEPx2kID6/dRO/857bPjFnrTwAAAAAAAAAAKarAb62LwA/EFA+Ppzu6b4F/7S9E8/5PQAAAAAAAAAAzUxHORbqtD/8rp080yfhPfzvX7nH3o67AAAAAAAAAADNrQS+w9kKun5Avjvybx02wRXJuxVsvjgAAAAAAAAAAGYS67sk0Xw8Ypq/PP4r274SGs+7eR6bPAAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAABAAAAAAAAAAABAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.2287999999999999, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVHRAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIP1OvW4TtcECUhpRSlIwBbJRLxIwBdJRHQFqyiJfpljF1fZQoaAZoCWgPQwhPWU3X02dyQJSGlFKUaBVL5WgWR0BauHTI/7iydX2UKGgGaAloD0MIKqkT0IQDckCUhpRSlGgVS8BoFkdAWri4EwFkhHV9lChoBmgJaA9DCBegbTWrLHFAlIaUUpRoFUvaaBZHQFq5pTMqz7d1fZQoaAZoCWgPQwheRxyygZhyQJSGlFKUaBVLumgWR0BaveGXXyy2dX2UKGgGaAloD0MIK/uuCH6NcUCUhpRSlGgVS8xoFkdAWsa4Wk8A73V9lChoBmgJaA9DCB/Xhopx/HBAlIaUUpRoFUu9aBZHQFrKeumrKeV1fZQoaAZoCWgPQwgSSl8IueBxQJSGlFKUaBVLxGgWR0BayxyKekHldX2UKGgGaAloD0MIIT1FDtEJdECUhpRSlGgVS8JoFkdAWvI6xPfsNXV9lChoBmgJaA9DCHO4VntYrXBAlIaUUpRoFUu9aBZHQFr0ev6j3251fZQoaAZoCWgPQwj5SiAlNrRyQJSGlFKUaBVLz2gWR0BbANelbeMydX2UKGgGaAloD0MIoYMu4ZBicECUhpRSlGgVS8VoFkdAWwKfywwCbXV9lChoBmgJaA9DCCEdHsL44nJAlIaUUpRoFUu8aBZHQFsEV4X40uV1fZQoaAZoCWgPQwgKgse3t2pyQJSGlFKUaBVL7mgWR0BbB0nw5NoKdX2UKGgGaAloD0MIIPEr1jASdECUhpRSlGgVS9JoFkdAWw3Eehf0E3V9lChoBmgJaA9DCDVCP1PvmHNAlIaUUpRoFUvuaBZHQFsO9Ujs2Nx1fZQoaAZoCWgPQwilFd9QOAtyQJSGlFKUaBVL12gWR0BbECGvfTCtdX2UKGgGaAloD0MIEeSghJmBc0CUhpRSlGgVS7poFkdAWw/101ZTynV9lChoBmgJaA9DCEuxo3Gow3JAlIaUUpRoFUvOaBZHQFsSU9ZA6dV1fZQoaAZoCWgPQwgXnMHf73NyQJSGlFKUaBVL0GgWR0BbE3gtOEdvdX2UKGgGaAloD0MI0a5Cys/nckCUhpRSlGgVS+RoFkdAWxyRbKRuCXV9lChoBmgJaA9DCOxnsRTJ2HFAlIaUUpRoFUvKaBZHQF00mjj7yhB1fZQoaAZoCWgPQwgQlNv2vXNyQJSGlFKUaBVLwmgWR0BdNakAPuohdX2UKGgGaAloD0MIGw5LA380c0CUhpRSlGgVS89oFkdAXToQL/jsEHV9lChoBmgJaA9DCGVQbXDiVnNAlIaUUpRoFUvMaBZHQF1jDCxeLNx1fZQoaAZoCWgPQwinPLoRFoRxQJSGlFKUaBVLtmgWR0BdZVafSQYDdX2UKGgGaAloD0MIj1Tf+UV5TkCUhpRSlGgVS5toFkdAXWep84Pwu3V9lChoBmgJaA9DCGqiz0cZtXFAlIaUUpRoFUu2aBZHQF1pOe8PFvR1fZQoaAZoCWgPQwis5c5M8M1yQJSGlFKUaBVLv2gWR0BdbBDohY/3dX2UKGgGaAloD0MI28NeKGBDckCUhpRSlGgVS7doFkdAXW1Gqgh8pnV9lChoBmgJaA9DCILhXMPM7XFAlIaUUpRoFUvlaBZHQF1t2itaIN51fZQoaAZoCWgPQwgr+kMzj+pwQJSGlFKUaBVLxGgWR0BdeoBeXzDodX2UKGgGaAloD0MI7rCJzFyAckCUhpRSlGgVS8ZoFkdAXXsyuZCv5nV9lChoBmgJaA9DCI1HqYSnU3JAlIaUUpRoFUvFaBZHQF19QnhKlHl1fZQoaAZoCWgPQwhwzR39L8xxQJSGlFKUaBVL12gWR0BdgTTSb6P9dX2UKGgGaAloD0MIBWoxeBjicUCUhpRSlGgVS8BoFkdAXYaunuRcNnV9lChoBmgJaA9DCGVwlLx6GXJAlIaUUpRoFUvGaBZHQF2N7JGOMl11fZQoaAZoCWgPQwiSsG8n0ZhxQJSGlFKUaBVL0mgWR0BdkeAy2x6fdX2UKGgGaAloD0MIjKAxk2izc0CUhpRSlGgVS/VoFkdAXZRLdvbXYnV9lChoBmgJaA9DCEJ4tHFEBHNAlIaUUpRoFUvIaBZHQF2UBZIQOFx1fZQoaAZoCWgPQwg9t9CVCFFzQJSGlFKUaBVLyGgWR0Bdv/Cl7+kydX2UKGgGaAloD0MIu7ciMcFFckCUhpRSlGgVS8FoFkdAXcLgflp48nV9lChoBmgJaA9DCMWPMXctO3RAlIaUUpRoFUvRaBZHQF3C6P8yeqd1fZQoaAZoCWgPQwhtrS8SWgF0QJSGlFKUaBVLxGgWR0Bdw98Rcu8LdX2UKGgGaAloD0MIvf25aEgNcUCUhpRSlGgVS8doFkdAXcQ91U2kz3V9lChoBmgJaA9DCH+FzJXBQXJAlIaUUpRoFUvNaBZHQF3EpzcRDkV1fZQoaAZoCWgPQwgk7UYfMz5zQJSGlFKUaBVL52gWR0BdyjgqEvkBdX2UKGgGaAloD0MIceSByKKCc0CUhpRSlGgVS7poFkdAXc/2TPjXF3V9lChoBmgJaA9DCLx2acOhz3JAlIaUUpRoFUvEaBZHQF3SBRyfcvd1fZQoaAZoCWgPQwjjwRa7/Q10QJSGlFKUaBVLz2gWR0Bd1fms/6frdX2UKGgGaAloD0MIroBCPf3dcUCUhpRSlGgVS8FoFkdAXdX15B1LanV9lChoBmgJaA9DCKiMf59xG3BAlIaUUpRoFUvHaBZHQF3j/jsD4g11fZQoaAZoCWgPQwjQ8GYNHuVwQJSGlFKUaBVL0GgWR0Bd7ADeTFERdX2UKGgGaAloD0MIAyMva2Iwc0CUhpRSlGgVS+toFkdAXezWSU1Q7HV9lChoBmgJaA9DCA2K5gHsv3FAlIaUUpRoFUvZaBZHQF3yKR+z+m51fZQoaAZoCWgPQwihuyTOyltzQJSGlFKUaBVL7WgWR0Bd+hXGOuJUdX2UKGgGaAloD0MIVYSbjCozOUCUhpRSlGgVS41oFkdAXf9fTkQwsXV9lChoBmgJaA9DCJ87wf7rUnBAlIaUUpRoFUu9aBZHQF4VCbtqpLp1fZQoaAZoCWgPQwhruwm+aaBxQJSGlFKUaBVLz2gWR0BeHKcEvCdjdX2UKGgGaAloD0MIIk+Srtk5cECUhpRSlGgVS81oFkdAXhyuA7Ppp3V9lChoBmgJaA9DCBQEj28v3HBAlIaUUpRoFUvaaBZHQF4hq4pc5bR1fZQoaAZoCWgPQwhEMuTY+g5yQJSGlFKUaBVL4GgWR0BeIjUVi4KAdX2UKGgGaAloD0MI9kVCW46OcUCUhpRSlGgVS7hoFkdAXia4Cp3otHV9lChoBmgJaA9DCIZVvJE5t3BAlIaUUpRoFUvLaBZHQF4oogFHJ911fZQoaAZoCWgPQwitGK4OAE1zQJSGlFKUaBVL2mgWR0BeKSAtnPE9dX2UKGgGaAloD0MImBb1SW6ockCUhpRSlGgVS8xoFkdAXi8Svkili3V9lChoBmgJaA9DCPZBlgVTm3NAlIaUUpRoFUvfaBZHQF4y4TK1XvJ1fZQoaAZoCWgPQwjlZOJWQfJxQJSGlFKUaBVLu2gWR0BeNhKlHjIadX2UKGgGaAloD0MI1Em2utxicECUhpRSlGgVS7RoFkdAXkBvm5lOGnV9lChoBmgJaA9DCNlcNc8R2HBAlIaUUpRoFUvHaBZHQF5Csyi22G91fZQoaAZoCWgPQwgsZ++MdstwQJSGlFKUaBVLymgWR0BeRUpNKyv+dX2UKGgGaAloD0MIbTmX4upyc0CUhpRSlGgVS9NoFkdAXlbbblA/s3V9lChoBmgJaA9DCA5o6Qp2DHNAlIaUUpRoFUvmaBZHQF5kXhOxjax1fZQoaAZoCWgPQwgwKqkTUN5xQJSGlFKUaBVLtWgWR0BeaqzqrzXjdX2UKGgGaAloD0MIIHu9++OCckCUhpRSlGgVS8loFkdAXm1Htnf2snV9lChoBmgJaA9DCHIUIApm63JAlIaUUpRoFUuyaBZHQF5uvlEJBxB1fZQoaAZoCWgPQwgN/+kGCn9xQJSGlFKUaBVLymgWR0BedCUs4DLbdX2UKGgGaAloD0MISgosgKmEcUCUhpRSlGgVS8VoFkdAXn67SRbKR3V9lChoBmgJaA9DCM2RlV8GWHNAlIaUUpRoFUvaaBZHQF6BD/VAiV11fZQoaAZoCWgPQwjhYkUNZt9xQJSGlFKUaBVLv2gWR0Beh8ENe+mFdX2UKGgGaAloD0MIKQXdXpJIc0CUhpRSlGgVS8poFkdAXohd5Y5ksnV9lChoBmgJaA9DCJtUNNZ+nHFAlIaUUpRoFUvcaBZHQF6JenQ6ZIB1fZQoaAZoCWgPQwgqyM9G7tFxQJSGlFKUaBVL5GgWR0BeiwxrSE13dX2UKGgGaAloD0MIgsgiTfwLckCUhpRSlGgVS91oFkdAXpiB9Tgl4XV9lChoBmgJaA9DCPDbEOM16XJAlIaUUpRoFUu/aBZHQF6apzcRDkV1fZQoaAZoCWgPQwj5wI7/QgRzQJSGlFKUaBVLy2gWR0BeniHM2WIHdX2UKGgGaAloD0MIpTDvcWYbcUCUhpRSlGgVS95oFkdAXqRu63AmA3V9lChoBmgJaA9DCLRXHw+913BAlIaUUpRoFUvJaBZHQF6w0gr6LwZ1fZQoaAZoCWgPQwie0OtPogxzQJSGlFKUaBVLy2gWR0Bevw2dd3SsdX2UKGgGaAloD0MIc4V3uYgKc0CUhpRSlGgVS8toFkdAXsV9G7SRbXV9lChoBmgJaA9DCA+byMyFgnFAlIaUUpRoFUvHaBZHQF7H6FM7EHd1fZQoaAZoCWgPQwhLzLOS1hVwQJSGlFKUaBVLzmgWR0BeyZ4W1twadX2UKGgGaAloD0MI4C77deebckCUhpRSlGgVS7FoFkdAXs4uvllsg3V9lChoBmgJaA9DCI2XbhKDvm5AlIaUUpRoFUvTaBZHQF7Swob4rSV1fZQoaAZoCWgPQwhyi/m5oaRzQJSGlFKUaBVLwGgWR0Be3M495hScdX2UKGgGaAloD0MI8NqlDccYc0CUhpRSlGgVS8poFkdAXuJsdkrf+HV9lChoBmgJaA9DCGvxKQAGxnBAlIaUUpRoFUvRaBZHQF7mldTo+wF1fZQoaAZoCWgPQwgAOzdtRmZwQJSGlFKUaBVLvmgWR0Be7aya/h2odX2UKGgGaAloD0MI6J/gYoUUckCUhpRSlGgVS/BoFkdAXvbyNGViWnV9lChoBmgJaA9DCAjIl1BBcnNAlIaUUpRoFUvMaBZHQF72vxH5Jsh1ZS4="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 1284, "n_steps": 1024, "gamma": 0.999, "gae_lambda": 0.98, "ent_coef": 0.01, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 4, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWVvwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwNX2J1aWx0aW5fdHlwZZSTlIwKTGFtYmRhVHlwZZSFlFKUKGgCjAhDb2RlVHlwZZSFlFKUKEsBSwBLAUsBSxNDBIgAUwCUToWUKYwBX5SFlIxIL3Vzci9sb2NhbC9saWIvcHl0aG9uMy43L2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5RLgEMCAAGUjAN2YWyUhZQpdJRSlH2UKIwLX19wYWNrYWdlX1+UjBhzdGFibGVfYmFzZWxpbmVzMy5jb21tb26UjAhfX25hbWVfX5SMHnN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi51dGlsc5SMCF9fZmlsZV9flIxIL3Vzci9sb2NhbC9saWIvcHl0aG9uMy43L2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaCB9lH2UKGgXaA6MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgYjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz/JmZmZmZmahZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "system_info": {"OS": "Linux-5.4.188+-x86_64-with-Ubuntu-18.04-bionic #1 SMP Sun Apr 24 10:03:06 PDT 2022", "Python": "3.7.13", "Stable-Baselines3": "1.5.0", "PyTorch": "1.11.0+cu113", "GPU Enabled": "True", "Numpy": "1.21.6", "Gym": "0.21.0"}}
 
1
+ {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param sde_net_arch: Network architecture for extracting features\n when using gSDE. If None, the latent features from the policy will be used.\n Pass an empty list to use the states as features.\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7fce41ef1b00>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7fce41ef1b90>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7fce41ef1c20>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7fce41ef1cb0>", "_build": "<function ActorCriticPolicy._build at 0x7fce41ef1d40>", "forward": "<function ActorCriticPolicy.forward at 0x7fce41ef1dd0>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7fce41ef1e60>", "_predict": "<function ActorCriticPolicy._predict at 0x7fce41ef1ef0>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7fce41ef1f80>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7fce41ef7050>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7fce41ef70e0>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc_data object at 0x7fce41f463f0>"}, "verbose": 1, "policy_kwargs": {}, "observation_space": {":type:": "<class 'gym.spaces.box.Box'>", ":serialized:": "gAWVnwEAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLCIWUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWIAAAAAAAAAAAAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/5RoCksIhZSMAUOUdJRSlIwEaGlnaJRoEiiWIAAAAAAAAAAAAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAf5RoCksIhZRoFXSUUpSMDWJvdW5kZWRfYmVsb3eUaBIolggAAAAAAAAAAAAAAAAAAACUaAeMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLCIWUaBV0lFKUjA1ib3VuZGVkX2Fib3ZllGgSKJYIAAAAAAAAAAAAAAAAAAAAlGghSwiFlGgVdJRSlIwKX25wX3JhbmRvbZROdWIu", "dtype": "float32", "_shape": [8], "low": "[-inf -inf -inf -inf -inf -inf -inf -inf]", "high": "[inf inf inf inf inf inf inf inf]", "bounded_below": "[False False False False False False False False]", "bounded_above": "[False False False False False False False False]", "_np_random": null}, "action_space": {":type:": "<class 'gym.spaces.discrete.Discrete'>", ":serialized:": "gAWVggAAAAAAAACME2d5bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpRLBIwGX3NoYXBllCmMBWR0eXBllIwFbnVtcHmUaAeTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYowKX25wX3JhbmRvbZROdWIu", "n": 4, "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 16, "num_timesteps": 65536, "_total_timesteps": 50000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1651750166.1774747, "learning_rate": 0.0003, "tensorboard_log": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVvwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwNX2J1aWx0aW5fdHlwZZSTlIwKTGFtYmRhVHlwZZSFlFKUKGgCjAhDb2RlVHlwZZSFlFKUKEsBSwBLAUsBSxNDBIgAUwCUToWUKYwBX5SFlIxIL3Vzci9sb2NhbC9saWIvcHl0aG9uMy43L2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5RLgEMCAAGUjAN2YWyUhZQpdJRSlH2UKIwLX19wYWNrYWdlX1+UjBhzdGFibGVfYmFzZWxpbmVzMy5jb21tb26UjAhfX25hbWVfX5SMHnN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi51dGlsc5SMCF9fZmlsZV9flIxIL3Vzci9sb2NhbC9saWIvcHl0aG9uMy43L2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaCB9lH2UKGgXaA6MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgYjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz8zqSowVTJhhZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAACbLSr6MS00/ShTdPAIGGL9YVYS+ohe1PQAAAAAAAAAAmuVivZxAAbzjvS08gfqQPA3qTL1IonI9AACAPwAAgD9NSIQ9we1TP5zSqLyS1Q6/Y08sPkjj3LwAAAAAAAAAADPy1Ly4WIe75k94PPIbAT3IdEe8zcHftAAAgD8AAIA/5tudvXCavT93DK++wicNvmTV/bw98mW9AAAAAAAAAACmdq29JA+8PWgljD6ppKS+p9ShPXxvEj4AAAAAAAAAAADoc7wc6Qi8bUCivDlhxzxupUU91RXuuwAAgD8AAIA/zZkYPqVulT/PzsA+AW4Ov8vbpz5qiX4+AAAAAAAAAACNDVI+f7iWP8IDzT7G5gO/yCTVPg0eMT4AAAAAAAAAAJqpQbwbZZK8GVofve9Skrt1M549YjO6vQAAgD8AAIA/ZnWOvBSHkD3MFQu93nTgvhx6CL6iSJ67AAAAAAAAAACAlC09O6+IvCggJL65Mkg9YacvPcpDp7sAAIA/AACAPzOj5j3zdnk/5S4XPTrwD79cTYE+DZN2vQAAAAAAAAAAgNgPvSiR4z0TK1I+FPPQvkNL9zwVpdM9AAAAAAAAAAAzDIQ8lDCiPzvY0j0jbBW/BSk/PZsNuz0AAAAAAAAAADNLyju79JY/6nGYPO29L7/2pSQ9ZJqYPQAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.3107200000000001, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVHRAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMI/I123DDfc0CUhpRSlIwBbJRL04wBdJRHQGMWsmOU+s51fZQoaAZoCWgPQwjuIeF7/7FwQJSGlFKUaBVLxmgWR0BjG3/DLr5ZdX2UKGgGaAloD0MImkNSC6X5ckCUhpRSlGgVS8ZoFkdAYyHM/yGzr3V9lChoBmgJaA9DCNlAuth0HXRAlIaUUpRoFUvcaBZHQGMnI0hvBJt1fZQoaAZoCWgPQwh48umx7bVxQJSGlFKUaBVL4GgWR0BjKSF9KEnLdX2UKGgGaAloD0MIMLsnD8v1ckCUhpRSlGgVS9BoFkdAYynxLCemN3V9lChoBmgJaA9DCPrxlxY1qnNAlIaUUpRoFUvnaBZHQGMqZUT+NtJ1fZQoaAZoCWgPQwjt1jIZzgZyQJSGlFKUaBVL3WgWR0BjLN1wHZ9NdX2UKGgGaAloD0MIXW+bqRC9cUCUhpRSlGgVS8xoFkdAYy5h4t6HCXV9lChoBmgJaA9DCKBuoMC7Y3NAlIaUUpRoFUu/aBZHQGMupSBK+SN1fZQoaAZoCWgPQwilLa7xWZtzQJSGlFKUaBVLwWgWR0BjM2P91loUdX2UKGgGaAloD0MI0XR2MrjlcECUhpRSlGgVS8BoFkdAYzefs/pt8HV9lChoBmgJaA9DCAAAAADAtXFAlIaUUpRoFUvCaBZHQGM3zC1qnFZ1fZQoaAZoCWgPQwjZ7h6ge+ZyQJSGlFKUaBVLuWgWR0BjN7lcQiA2dX2UKGgGaAloD0MIXYjVH2HfcECUhpRSlGgVS9NoFkdAYzoIUJv5xnV9lChoBmgJaA9DCL7Z5sa05XFAlIaUUpRoFUvUaBZHQGM7a1kUbkx1fZQoaAZoCWgPQwiuZMdGoG1xQJSGlFKUaBVLwWgWR0BjRWkk8ifQdX2UKGgGaAloD0MI2xZlNsi6cUCUhpRSlGgVS9ZoFkdAY0VScbzbvnV9lChoBmgJaA9DCAvRIXBkS3JAlIaUUpRoFUvKaBZHQGRX2sA/9pB1fZQoaAZoCWgPQwgujspNFJRxQJSGlFKUaBVLsWgWR0BkWP8O09hadX2UKGgGaAloD0MINNWT+YebcUCUhpRSlGgVS85oFkdAZGBr7fpD/nV9lChoBmgJaA9DCHNJ1XYT125AlIaUUpRoFUvDaBZHQGRg29cry2B1fZQoaAZoCWgPQwjdJXFWxNJvQJSGlFKUaBVLvWgWR0BkYY0hvBJqdX2UKGgGaAloD0MIlj50QX1kcECUhpRSlGgVS8loFkdAZGQsRQJokHV9lChoBmgJaA9DCAGG5c83ZXFAlIaUUpRoFUvraBZHQGRkp9ZzPrx1fZQoaAZoCWgPQwiJC0CjNONzQJSGlFKUaBVL3WgWR0BkZINVinYQdX2UKGgGaAloD0MI9HAC02nRc0CUhpRSlGgVS8toFkdAZG5lHSWqtHV9lChoBmgJaA9DCJZBtcEJiXFAlIaUUpRoFUvdaBZHQGRyuIhyKel1fZQoaAZoCWgPQwhoB1xXDD9zQJSGlFKUaBVL4WgWR0Bkc8X3xnWbdX2UKGgGaAloD0MI93ZLcsDQcUCUhpRSlGgVS9RoFkdAZHOf0VafSXV9lChoBmgJaA9DCH9Ma9OYH3NAlIaUUpRoFUv4aBZHQGR0F8PWhAZ1fZQoaAZoCWgPQwjE6LmFrjRzQJSGlFKUaBVL0GgWR0BkdFZNfw7UdX2UKGgGaAloD0MID9Qpjy7DcUCUhpRSlGgVS71oFkdAZHlBFd9lVnV9lChoBmgJaA9DCKhxb37D8m9AlIaUUpRoFUvOaBZHQGR83cHnln11fZQoaAZoCWgPQwi/KaxUEGpzQJSGlFKUaBVLvWgWR0Bkga925hBrdX2UKGgGaAloD0MIeLeyRCcYcUCUhpRSlGgVS8poFkdAZIM56t1ZDHV9lChoBmgJaA9DCFZl3xXB9XFAlIaUUpRoFUuqaBZHQGSE974SHuZ1fZQoaAZoCWgPQwj6QzNPLjBxQJSGlFKUaBVLsmgWR0Bkhiohpxm1dX2UKGgGaAloD0MIsW8nESHtckCUhpRSlGgVS8poFkdAZIvpN9H+ZXV9lChoBmgJaA9DCDPFHARdj3NAlIaUUpRoFUvDaBZHQGSNHoouwot1fZQoaAZoCWgPQwj0bFZ9rk9uQJSGlFKUaBVLxmgWR0BkjVBa9sabdX2UKGgGaAloD0MITYHMzqKLUECUhpRSlGgVS35oFkdAZI2u14Pf9HV9lChoBmgJaA9DCByastMPBm9AlIaUUpRoFUvNaBZHQGSPEQwsXi11fZQoaAZoCWgPQwjG/NzQFJ9xQJSGlFKUaBVL0WgWR0BkmVdmg8KYdX2UKGgGaAloD0MI4gD6fX/xcECUhpRSlGgVS79oFkdAZJpqC6H0snV9lChoBmgJaA9DCNDtJY0RDHBAlIaUUpRoFUu+aBZHQGSaiqp97Wx1fZQoaAZoCWgPQwg8SiU8IVJwQJSGlFKUaBVL2mgWR0BknxnezlcRdX2UKGgGaAloD0MI5IV0eMjYcECUhpRSlGgVS79oFkdAZKB6Q/5cknV9lChoBmgJaA9DCHKo34Vts3BAlIaUUpRoFUveaBZHQGSgt5le4Td1fZQoaAZoCWgPQwi5NlSMM0txQJSGlFKUaBVL1GgWR0BkqIG6f8MvdX2UKGgGaAloD0MIHogs0sRHSUCUhpRSlGgVS4VoFkdAZKp7sOXmeXV9lChoBmgJaA9DCGhAvRm1fXFAlIaUUpRoFUvWaBZHQGStxTjvNNd1fZQoaAZoCWgPQwiUS+MXHhJyQJSGlFKUaBVL0mgWR0BkroK6WgOCdX2UKGgGaAloD0MIcHztmaU1ckCUhpRSlGgVS8toFkdAZK6TIvJzUHV9lChoBmgJaA9DCPUUOUQcT3FAlIaUUpRoFUu2aBZHQGSykU9IPLB1fZQoaAZoCWgPQwgWbY5zW9hxQJSGlFKUaBVL3mgWR0Bks6jJuEVWdX2UKGgGaAloD0MIZFjFGxl7ckCUhpRSlGgVS8xoFkdAZLXhrFfiP3V9lChoBmgJaA9DCJNUppiDsG5AlIaUUpRoFUvJaBZHQGS281n/T9d1fZQoaAZoCWgPQwjHgOz1rmxxQJSGlFKUaBVL0WgWR0BkuDxEv0yydX2UKGgGaAloD0MIj4r/O2IWcUCUhpRSlGgVS61oFkdAZMKWmgrYoXV9lChoBmgJaA9DCMJQhxVurXBAlIaUUpRoFUvFaBZHQGTDCbDuSfV1fZQoaAZoCWgPQwhK7UW03SRzQJSGlFKUaBVL1WgWR0BkxUP8Q7LddX2UKGgGaAloD0MImpguxOr0cUCUhpRSlGgVS+FoFkdAZMkf29L6DXV9lChoBmgJaA9DCHEfuTUpJHFAlIaUUpRoFUveaBZHQGTO4Glhw2l1fZQoaAZoCWgPQwiTpkHRfKBxQJSGlFKUaBVLvmgWR0Bk0BbGFSKndX2UKGgGaAloD0MIchQgCuYcc0CUhpRSlGgVS+VoFkdAZNA1sLv1DnV9lChoBmgJaA9DCMAjKlR3zHJAlIaUUpRoFUu8aBZHQGTV+2/i5ut1fZQoaAZoCWgPQwhdFajFoKRxQJSGlFKUaBVL0mgWR0Bk1nP7el9CdX2UKGgGaAloD0MIC9P3GkI0cECUhpRSlGgVS8xoFkdAZNh3TNMXanV9lChoBmgJaA9DCHbicrwC53NAlIaUUpRoFUvNaBZHQGTZaE8JUo91fZQoaAZoCWgPQwiCixU1mO5wQJSGlFKUaBVL0mgWR0Bk3pK15Sm7dX2UKGgGaAloD0MICRUcXlDWckCUhpRSlGgVS7xoFkdAZN+8+RoysXV9lChoBmgJaA9DCNP1RNfFF3FAlIaUUpRoFUvJaBZHQGThF23azu51fZQoaAZoCWgPQwhJ2SJpN29xQJSGlFKUaBVL2WgWR0Bk4RwEQoTgdX2UKGgGaAloD0MIHLeYn9v1cUCUhpRSlGgVS95oFkdAZOQ5o4+8oXV9lChoBmgJaA9DCM5Q3PEmXU1AlIaUUpRoFUujaBZHQGTk5n13+uN1fZQoaAZoCWgPQwgSL0/nysJwQJSGlFKUaBVLxmgWR0Bk7rfWMCLddX2UKGgGaAloD0MIjWDj+ndHckCUhpRSlGgVS9RoFkdAZO9xRVIZqHV9lChoBmgJaA9DCD6w478AEXNAlIaUUpRoFUvNaBZHQGTz8BMi8nN1fZQoaAZoCWgPQwiES8ecJyJxQJSGlFKUaBVLxGgWR0Bk+SlxffGddX2UKGgGaAloD0MIflLt03EnckCUhpRSlGgVS8loFkdAZPkgSOBDonV9lChoBmgJaA9DCDsBTYRN/3BAlIaUUpRoFUvKaBZHQGT6kv9LpRp1fZQoaAZoCWgPQwgfEr73t1lxQJSGlFKUaBVLuGgWR0Bk/OgxrSE2dX2UKGgGaAloD0MIgIEgQIZAckCUhpRSlGgVS8JoFkdAZP5xwQ176nV9lChoBmgJaA9DCOj0vBtLWHFAlIaUUpRoFUu+aBZHQGUBDASFoL51fZQoaAZoCWgPQwgtW+uLROpwQJSGlFKUaBVLumgWR0BlBYnH/95ydX2UKGgGaAloD0MIrd9MTFcfc0CUhpRSlGgVS9poFkdAZQYB3A2ycHV9lChoBmgJaA9DCKuVCb/UHXNAlIaUUpRoFUvAaBZHQGUJmmk30f51fZQoaAZoCWgPQwiHNCpwcvJyQJSGlFKUaBVL3WgWR0BlDlQj2SMcdX2UKGgGaAloD0MIkXu6uiMccUCUhpRSlGgVS9hoFkdAZQ61YyO7x3V9lChoBmgJaA9DCIguqG/ZV3JAlIaUUpRoFUvTaBZHQGURpyhi9Zl1fZQoaAZoCWgPQwh5AmGnGKdzQJSGlFKUaBVL2mgWR0BlEm4Cp3otdX2UKGgGaAloD0MI/0C5bV/3ckCUhpRSlGgVS8hoFkdAZRlFRYRuj3V9lChoBmgJaA9DCJ6ayw2GCHNAlIaUUpRoFUvgaBZHQGUfF8G9pRJ1fZQoaAZoCWgPQwjBjv8CwWpxQJSGlFKUaBVLzmgWR0BlH6gh8pkPdX2UKGgGaAloD0MIVK2FWSjDckCUhpRSlGgVS7loFkdAZSHVp9JBgXV9lChoBmgJaA9DCLU1IhgH0XJAlIaUUpRoFUvHaBZHQGUjWbobGWF1fZQoaAZoCWgPQwhi2jf3V5B0QJSGlFKUaBVLz2gWR0BlJcX7+DODdX2UKGgGaAloD0MII4eIm9P6ckCUhpRSlGgVS7hoFkdAZSZcVQAMlXV9lChoBmgJaA9DCPorZK7MhXFAlIaUUpRoFUvGaBZHQGUn4tHxz7x1ZS4="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 1300, "n_steps": 1024, "gamma": 0.999, "gae_lambda": 0.999, "ent_coef": 0.01, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 4, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWVvwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwNX2J1aWx0aW5fdHlwZZSTlIwKTGFtYmRhVHlwZZSFlFKUKGgCjAhDb2RlVHlwZZSFlFKUKEsBSwBLAUsBSxNDBIgAUwCUToWUKYwBX5SFlIxIL3Vzci9sb2NhbC9saWIvcHl0aG9uMy43L2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5RLgEMCAAGUjAN2YWyUhZQpdJRSlH2UKIwLX19wYWNrYWdlX1+UjBhzdGFibGVfYmFzZWxpbmVzMy5jb21tb26UjAhfX25hbWVfX5SMHnN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi51dGlsc5SMCF9fZmlsZV9flIxIL3Vzci9sb2NhbC9saWIvcHl0aG9uMy43L2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaCB9lH2UKGgXaA6MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgYjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz+5mZmZmZmahZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "clip_range_vf": null, "normalize_advantage": false, "target_kl": null, "system_info": {"OS": "Linux-5.4.188+-x86_64-with-Ubuntu-18.04-bionic #1 SMP Sun Apr 24 10:03:06 PDT 2022", "Python": "3.7.13", "Stable-Baselines3": "1.5.0", "PyTorch": "1.11.0+cu113", "GPU Enabled": "True", "Numpy": "1.21.6", "Gym": "0.21.0"}}
ppo-LunarLander-v2.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:45fc575a92654c583182e04308ee7e99023d6006f67a129e76ed289496afdebc
3
- size 143977
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1fab80b2ce79dbf9e10329dec20baaae8c26cd93585e51bb6e3cf662907769f2
3
+ size 143979
ppo-LunarLander-v2/data CHANGED
@@ -4,19 +4,19 @@
4
  ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
5
  "__module__": "stable_baselines3.common.policies",
6
  "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param sde_net_arch: Network architecture for extracting features\n when using gSDE. If None, the latent features from the policy will be used.\n Pass an empty list to use the states as features.\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
7
- "__init__": "<function ActorCriticPolicy.__init__ at 0x7f6a47db93b0>",
8
- "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f6a47db9440>",
9
- "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f6a47db94d0>",
10
- "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f6a47db9560>",
11
- "_build": "<function ActorCriticPolicy._build at 0x7f6a47db95f0>",
12
- "forward": "<function ActorCriticPolicy.forward at 0x7f6a47db9680>",
13
- "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f6a47db9710>",
14
- "_predict": "<function ActorCriticPolicy._predict at 0x7f6a47db97a0>",
15
- "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f6a47db9830>",
16
- "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f6a47db98c0>",
17
- "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f6a47db9950>",
18
  "__abstractmethods__": "frozenset()",
19
- "_abc_impl": "<_abc_data object at 0x7f6a47e0b480>"
20
  },
21
  "verbose": 1,
22
  "policy_kwargs": {},
@@ -42,12 +42,12 @@
42
  "_np_random": null
43
  },
44
  "n_envs": 16,
45
- "num_timesteps": 49152,
46
- "_total_timesteps": 40000,
47
  "_num_timesteps_at_start": 0,
48
  "seed": null,
49
  "action_noise": null,
50
- "start_time": 1651747358.8787131,
51
  "learning_rate": 0.0003,
52
  "tensorboard_log": null,
53
  "lr_schedule": {
@@ -56,29 +56,29 @@
56
  },
57
  "_last_obs": {
58
  ":type:": "<class 'numpy.ndarray'>",
59
- ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAFP7A74TbYM/tF6DvlNoIr9Fv4e+IekrvgAAAAAAAAAAsy4kvhCNjj6BtI0+EgTtvo6qe730VRI+AAAAAAAAAACAZxq+H3gDP25IjT7luu2++q2hvWJ56T0AAAAAAAAAAFPGqb65Xz4/tbssPswFBr81lsy+pq9PPgAAAAAAAAAAmnnvuky0tD/XhT2+7H0XPckxCzsUuCs9AAAAAAAAAAAA/G69KRM6vIaRXz0caXs89umbvdo4UD0AAIA/AACAPwCAeDyPqim6HHQcs13L8a7CYnG77tvBMwAAgD8AAIA/MzgDPoR6gj7uA+W+t0gHv0ZiYrwuTKW+AAAAAAAAAADAUYO9lwpyP/Ou8L1Jayu/SEGrvWBKlb0AAAAAAAAAADOTj72yn5w/AAqqvllgK7+twPW9pVYsvgAAAAAAAAAAM438vOHVnTt+zJc+v2eOviu1/D0rMBq/AAAAAAAAgD/NLV4+skSEPx2kID6/dRO/857bPjFnrTwAAAAAAAAAAKarAb62LwA/EFA+Ppzu6b4F/7S9E8/5PQAAAAAAAAAAzUxHORbqtD/8rp080yfhPfzvX7nH3o67AAAAAAAAAADNrQS+w9kKun5Avjvybx02wRXJuxVsvjgAAAAAAAAAAGYS67sk0Xw8Ypq/PP4r274SGs+7eR6bPAAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="
60
  },
61
  "_last_episode_starts": {
62
  ":type:": "<class 'numpy.ndarray'>",
63
- ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAABAAAAAAAAAAABAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="
64
  },
65
  "_last_original_obs": null,
66
  "_episode_num": 0,
67
  "use_sde": false,
68
  "sde_sample_freq": -1,
69
- "_current_progress_remaining": -0.2287999999999999,
70
  "ep_info_buffer": {
71
  ":type:": "<class 'collections.deque'>",
72
- ":serialized:": "gAWVHRAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIP1OvW4TtcECUhpRSlIwBbJRLxIwBdJRHQFqyiJfpljF1fZQoaAZoCWgPQwhPWU3X02dyQJSGlFKUaBVL5WgWR0BauHTI/7iydX2UKGgGaAloD0MIKqkT0IQDckCUhpRSlGgVS8BoFkdAWri4EwFkhHV9lChoBmgJaA9DCBegbTWrLHFAlIaUUpRoFUvaaBZHQFq5pTMqz7d1fZQoaAZoCWgPQwheRxyygZhyQJSGlFKUaBVLumgWR0BaveGXXyy2dX2UKGgGaAloD0MIK/uuCH6NcUCUhpRSlGgVS8xoFkdAWsa4Wk8A73V9lChoBmgJaA9DCB/Xhopx/HBAlIaUUpRoFUu9aBZHQFrKeumrKeV1fZQoaAZoCWgPQwgSSl8IueBxQJSGlFKUaBVLxGgWR0BayxyKekHldX2UKGgGaAloD0MIIT1FDtEJdECUhpRSlGgVS8JoFkdAWvI6xPfsNXV9lChoBmgJaA9DCHO4VntYrXBAlIaUUpRoFUu9aBZHQFr0ev6j3251fZQoaAZoCWgPQwj5SiAlNrRyQJSGlFKUaBVLz2gWR0BbANelbeMydX2UKGgGaAloD0MIoYMu4ZBicECUhpRSlGgVS8VoFkdAWwKfywwCbXV9lChoBmgJaA9DCCEdHsL44nJAlIaUUpRoFUu8aBZHQFsEV4X40uV1fZQoaAZoCWgPQwgKgse3t2pyQJSGlFKUaBVL7mgWR0BbB0nw5NoKdX2UKGgGaAloD0MIIPEr1jASdECUhpRSlGgVS9JoFkdAWw3Eehf0E3V9lChoBmgJaA9DCDVCP1PvmHNAlIaUUpRoFUvuaBZHQFsO9Ujs2Nx1fZQoaAZoCWgPQwilFd9QOAtyQJSGlFKUaBVL12gWR0BbECGvfTCtdX2UKGgGaAloD0MIEeSghJmBc0CUhpRSlGgVS7poFkdAWw/101ZTynV9lChoBmgJaA9DCEuxo3Gow3JAlIaUUpRoFUvOaBZHQFsSU9ZA6dV1fZQoaAZoCWgPQwgXnMHf73NyQJSGlFKUaBVL0GgWR0BbE3gtOEdvdX2UKGgGaAloD0MI0a5Cys/nckCUhpRSlGgVS+RoFkdAWxyRbKRuCXV9lChoBmgJaA9DCOxnsRTJ2HFAlIaUUpRoFUvKaBZHQF00mjj7yhB1fZQoaAZoCWgPQwgQlNv2vXNyQJSGlFKUaBVLwmgWR0BdNakAPuohdX2UKGgGaAloD0MIGw5LA380c0CUhpRSlGgVS89oFkdAXToQL/jsEHV9lChoBmgJaA9DCGVQbXDiVnNAlIaUUpRoFUvMaBZHQF1jDCxeLNx1fZQoaAZoCWgPQwinPLoRFoRxQJSGlFKUaBVLtmgWR0BdZVafSQYDdX2UKGgGaAloD0MIj1Tf+UV5TkCUhpRSlGgVS5toFkdAXWep84Pwu3V9lChoBmgJaA9DCGqiz0cZtXFAlIaUUpRoFUu2aBZHQF1pOe8PFvR1fZQoaAZoCWgPQwis5c5M8M1yQJSGlFKUaBVLv2gWR0BdbBDohY/3dX2UKGgGaAloD0MI28NeKGBDckCUhpRSlGgVS7doFkdAXW1Gqgh8pnV9lChoBmgJaA9DCILhXMPM7XFAlIaUUpRoFUvlaBZHQF1t2itaIN51fZQoaAZoCWgPQwgr+kMzj+pwQJSGlFKUaBVLxGgWR0BdeoBeXzDodX2UKGgGaAloD0MI7rCJzFyAckCUhpRSlGgVS8ZoFkdAXXsyuZCv5nV9lChoBmgJaA9DCI1HqYSnU3JAlIaUUpRoFUvFaBZHQF19QnhKlHl1fZQoaAZoCWgPQwhwzR39L8xxQJSGlFKUaBVL12gWR0BdgTTSb6P9dX2UKGgGaAloD0MIBWoxeBjicUCUhpRSlGgVS8BoFkdAXYaunuRcNnV9lChoBmgJaA9DCGVwlLx6GXJAlIaUUpRoFUvGaBZHQF2N7JGOMl11fZQoaAZoCWgPQwiSsG8n0ZhxQJSGlFKUaBVL0mgWR0BdkeAy2x6fdX2UKGgGaAloD0MIjKAxk2izc0CUhpRSlGgVS/VoFkdAXZRLdvbXYnV9lChoBmgJaA9DCEJ4tHFEBHNAlIaUUpRoFUvIaBZHQF2UBZIQOFx1fZQoaAZoCWgPQwg9t9CVCFFzQJSGlFKUaBVLyGgWR0Bdv/Cl7+kydX2UKGgGaAloD0MIu7ciMcFFckCUhpRSlGgVS8FoFkdAXcLgflp48nV9lChoBmgJaA9DCMWPMXctO3RAlIaUUpRoFUvRaBZHQF3C6P8yeqd1fZQoaAZoCWgPQwhtrS8SWgF0QJSGlFKUaBVLxGgWR0Bdw98Rcu8LdX2UKGgGaAloD0MIvf25aEgNcUCUhpRSlGgVS8doFkdAXcQ91U2kz3V9lChoBmgJaA9DCH+FzJXBQXJAlIaUUpRoFUvNaBZHQF3EpzcRDkV1fZQoaAZoCWgPQwgk7UYfMz5zQJSGlFKUaBVL52gWR0BdyjgqEvkBdX2UKGgGaAloD0MIceSByKKCc0CUhpRSlGgVS7poFkdAXc/2TPjXF3V9lChoBmgJaA9DCLx2acOhz3JAlIaUUpRoFUvEaBZHQF3SBRyfcvd1fZQoaAZoCWgPQwjjwRa7/Q10QJSGlFKUaBVLz2gWR0Bd1fms/6frdX2UKGgGaAloD0MIroBCPf3dcUCUhpRSlGgVS8FoFkdAXdX15B1LanV9lChoBmgJaA9DCKiMf59xG3BAlIaUUpRoFUvHaBZHQF3j/jsD4g11fZQoaAZoCWgPQwjQ8GYNHuVwQJSGlFKUaBVL0GgWR0Bd7ADeTFERdX2UKGgGaAloD0MIAyMva2Iwc0CUhpRSlGgVS+toFkdAXezWSU1Q7HV9lChoBmgJaA9DCA2K5gHsv3FAlIaUUpRoFUvZaBZHQF3yKR+z+m51fZQoaAZoCWgPQwihuyTOyltzQJSGlFKUaBVL7WgWR0Bd+hXGOuJUdX2UKGgGaAloD0MIVYSbjCozOUCUhpRSlGgVS41oFkdAXf9fTkQwsXV9lChoBmgJaA9DCJ87wf7rUnBAlIaUUpRoFUu9aBZHQF4VCbtqpLp1fZQoaAZoCWgPQwhruwm+aaBxQJSGlFKUaBVLz2gWR0BeHKcEvCdjdX2UKGgGaAloD0MIIk+Srtk5cECUhpRSlGgVS81oFkdAXhyuA7Ppp3V9lChoBmgJaA9DCBQEj28v3HBAlIaUUpRoFUvaaBZHQF4hq4pc5bR1fZQoaAZoCWgPQwhEMuTY+g5yQJSGlFKUaBVL4GgWR0BeIjUVi4KAdX2UKGgGaAloD0MI9kVCW46OcUCUhpRSlGgVS7hoFkdAXia4Cp3otHV9lChoBmgJaA9DCIZVvJE5t3BAlIaUUpRoFUvLaBZHQF4oogFHJ911fZQoaAZoCWgPQwitGK4OAE1zQJSGlFKUaBVL2mgWR0BeKSAtnPE9dX2UKGgGaAloD0MImBb1SW6ockCUhpRSlGgVS8xoFkdAXi8Svkili3V9lChoBmgJaA9DCPZBlgVTm3NAlIaUUpRoFUvfaBZHQF4y4TK1XvJ1fZQoaAZoCWgPQwjlZOJWQfJxQJSGlFKUaBVLu2gWR0BeNhKlHjIadX2UKGgGaAloD0MI1Em2utxicECUhpRSlGgVS7RoFkdAXkBvm5lOGnV9lChoBmgJaA9DCNlcNc8R2HBAlIaUUpRoFUvHaBZHQF5Csyi22G91fZQoaAZoCWgPQwgsZ++MdstwQJSGlFKUaBVLymgWR0BeRUpNKyv+dX2UKGgGaAloD0MIbTmX4upyc0CUhpRSlGgVS9NoFkdAXlbbblA/s3V9lChoBmgJaA9DCA5o6Qp2DHNAlIaUUpRoFUvmaBZHQF5kXhOxjax1fZQoaAZoCWgPQwgwKqkTUN5xQJSGlFKUaBVLtWgWR0BeaqzqrzXjdX2UKGgGaAloD0MIIHu9++OCckCUhpRSlGgVS8loFkdAXm1Htnf2snV9lChoBmgJaA9DCHIUIApm63JAlIaUUpRoFUuyaBZHQF5uvlEJBxB1fZQoaAZoCWgPQwgN/+kGCn9xQJSGlFKUaBVLymgWR0BedCUs4DLbdX2UKGgGaAloD0MISgosgKmEcUCUhpRSlGgVS8VoFkdAXn67SRbKR3V9lChoBmgJaA9DCM2RlV8GWHNAlIaUUpRoFUvaaBZHQF6BD/VAiV11fZQoaAZoCWgPQwjhYkUNZt9xQJSGlFKUaBVLv2gWR0Beh8ENe+mFdX2UKGgGaAloD0MIKQXdXpJIc0CUhpRSlGgVS8poFkdAXohd5Y5ksnV9lChoBmgJaA9DCJtUNNZ+nHFAlIaUUpRoFUvcaBZHQF6JenQ6ZIB1fZQoaAZoCWgPQwgqyM9G7tFxQJSGlFKUaBVL5GgWR0BeiwxrSE13dX2UKGgGaAloD0MIgsgiTfwLckCUhpRSlGgVS91oFkdAXpiB9Tgl4XV9lChoBmgJaA9DCPDbEOM16XJAlIaUUpRoFUu/aBZHQF6apzcRDkV1fZQoaAZoCWgPQwj5wI7/QgRzQJSGlFKUaBVLy2gWR0BeniHM2WIHdX2UKGgGaAloD0MIpTDvcWYbcUCUhpRSlGgVS95oFkdAXqRu63AmA3V9lChoBmgJaA9DCLRXHw+913BAlIaUUpRoFUvJaBZHQF6w0gr6LwZ1fZQoaAZoCWgPQwie0OtPogxzQJSGlFKUaBVLy2gWR0Bevw2dd3SsdX2UKGgGaAloD0MIc4V3uYgKc0CUhpRSlGgVS8toFkdAXsV9G7SRbXV9lChoBmgJaA9DCA+byMyFgnFAlIaUUpRoFUvHaBZHQF7H6FM7EHd1fZQoaAZoCWgPQwhLzLOS1hVwQJSGlFKUaBVLzmgWR0BeyZ4W1twadX2UKGgGaAloD0MI4C77deebckCUhpRSlGgVS7FoFkdAXs4uvllsg3V9lChoBmgJaA9DCI2XbhKDvm5AlIaUUpRoFUvTaBZHQF7Swob4rSV1fZQoaAZoCWgPQwhyi/m5oaRzQJSGlFKUaBVLwGgWR0Be3M495hScdX2UKGgGaAloD0MI8NqlDccYc0CUhpRSlGgVS8poFkdAXuJsdkrf+HV9lChoBmgJaA9DCGvxKQAGxnBAlIaUUpRoFUvRaBZHQF7mldTo+wF1fZQoaAZoCWgPQwgAOzdtRmZwQJSGlFKUaBVLvmgWR0Be7aya/h2odX2UKGgGaAloD0MI6J/gYoUUckCUhpRSlGgVS/BoFkdAXvbyNGViWnV9lChoBmgJaA9DCAjIl1BBcnNAlIaUUpRoFUvMaBZHQF72vxH5Jsh1ZS4="
73
  },
74
  "ep_success_buffer": {
75
  ":type:": "<class 'collections.deque'>",
76
  ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
77
  },
78
- "_n_updates": 1284,
79
  "n_steps": 1024,
80
  "gamma": 0.999,
81
- "gae_lambda": 0.98,
82
  "ent_coef": 0.01,
83
  "vf_coef": 0.5,
84
  "max_grad_norm": 0.5,
@@ -86,9 +86,9 @@
86
  "n_epochs": 4,
87
  "clip_range": {
88
  ":type:": "<class 'function'>",
89
- ":serialized:": "gAWVvwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwNX2J1aWx0aW5fdHlwZZSTlIwKTGFtYmRhVHlwZZSFlFKUKGgCjAhDb2RlVHlwZZSFlFKUKEsBSwBLAUsBSxNDBIgAUwCUToWUKYwBX5SFlIxIL3Vzci9sb2NhbC9saWIvcHl0aG9uMy43L2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5RLgEMCAAGUjAN2YWyUhZQpdJRSlH2UKIwLX19wYWNrYWdlX1+UjBhzdGFibGVfYmFzZWxpbmVzMy5jb21tb26UjAhfX25hbWVfX5SMHnN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi51dGlsc5SMCF9fZmlsZV9flIxIL3Vzci9sb2NhbC9saWIvcHl0aG9uMy43L2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaCB9lH2UKGgXaA6MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgYjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz/JmZmZmZmahZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"
90
  },
91
  "clip_range_vf": null,
92
- "normalize_advantage": true,
93
  "target_kl": null
94
  }
 
4
  ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
5
  "__module__": "stable_baselines3.common.policies",
6
  "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param sde_net_arch: Network architecture for extracting features\n when using gSDE. If None, the latent features from the policy will be used.\n Pass an empty list to use the states as features.\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
7
+ "__init__": "<function ActorCriticPolicy.__init__ at 0x7fce41ef1b00>",
8
+ "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7fce41ef1b90>",
9
+ "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7fce41ef1c20>",
10
+ "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7fce41ef1cb0>",
11
+ "_build": "<function ActorCriticPolicy._build at 0x7fce41ef1d40>",
12
+ "forward": "<function ActorCriticPolicy.forward at 0x7fce41ef1dd0>",
13
+ "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7fce41ef1e60>",
14
+ "_predict": "<function ActorCriticPolicy._predict at 0x7fce41ef1ef0>",
15
+ "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7fce41ef1f80>",
16
+ "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7fce41ef7050>",
17
+ "predict_values": "<function ActorCriticPolicy.predict_values at 0x7fce41ef70e0>",
18
  "__abstractmethods__": "frozenset()",
19
+ "_abc_impl": "<_abc_data object at 0x7fce41f463f0>"
20
  },
21
  "verbose": 1,
22
  "policy_kwargs": {},
 
42
  "_np_random": null
43
  },
44
  "n_envs": 16,
45
+ "num_timesteps": 65536,
46
+ "_total_timesteps": 50000,
47
  "_num_timesteps_at_start": 0,
48
  "seed": null,
49
  "action_noise": null,
50
+ "start_time": 1651750166.1774747,
51
  "learning_rate": 0.0003,
52
  "tensorboard_log": null,
53
  "lr_schedule": {
 
56
  },
57
  "_last_obs": {
58
  ":type:": "<class 'numpy.ndarray'>",
59
+ ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAACbLSr6MS00/ShTdPAIGGL9YVYS+ohe1PQAAAAAAAAAAmuVivZxAAbzjvS08gfqQPA3qTL1IonI9AACAPwAAgD9NSIQ9we1TP5zSqLyS1Q6/Y08sPkjj3LwAAAAAAAAAADPy1Ly4WIe75k94PPIbAT3IdEe8zcHftAAAgD8AAIA/5tudvXCavT93DK++wicNvmTV/bw98mW9AAAAAAAAAACmdq29JA+8PWgljD6ppKS+p9ShPXxvEj4AAAAAAAAAAADoc7wc6Qi8bUCivDlhxzxupUU91RXuuwAAgD8AAIA/zZkYPqVulT/PzsA+AW4Ov8vbpz5qiX4+AAAAAAAAAACNDVI+f7iWP8IDzT7G5gO/yCTVPg0eMT4AAAAAAAAAAJqpQbwbZZK8GVofve9Skrt1M549YjO6vQAAgD8AAIA/ZnWOvBSHkD3MFQu93nTgvhx6CL6iSJ67AAAAAAAAAACAlC09O6+IvCggJL65Mkg9YacvPcpDp7sAAIA/AACAPzOj5j3zdnk/5S4XPTrwD79cTYE+DZN2vQAAAAAAAAAAgNgPvSiR4z0TK1I+FPPQvkNL9zwVpdM9AAAAAAAAAAAzDIQ8lDCiPzvY0j0jbBW/BSk/PZsNuz0AAAAAAAAAADNLyju79JY/6nGYPO29L7/2pSQ9ZJqYPQAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="
60
  },
61
  "_last_episode_starts": {
62
  ":type:": "<class 'numpy.ndarray'>",
63
+ ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="
64
  },
65
  "_last_original_obs": null,
66
  "_episode_num": 0,
67
  "use_sde": false,
68
  "sde_sample_freq": -1,
69
+ "_current_progress_remaining": -0.3107200000000001,
70
  "ep_info_buffer": {
71
  ":type:": "<class 'collections.deque'>",
72
+ ":serialized:": "gAWVHRAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMI/I123DDfc0CUhpRSlIwBbJRL04wBdJRHQGMWsmOU+s51fZQoaAZoCWgPQwjuIeF7/7FwQJSGlFKUaBVLxmgWR0BjG3/DLr5ZdX2UKGgGaAloD0MImkNSC6X5ckCUhpRSlGgVS8ZoFkdAYyHM/yGzr3V9lChoBmgJaA9DCNlAuth0HXRAlIaUUpRoFUvcaBZHQGMnI0hvBJt1fZQoaAZoCWgPQwh48umx7bVxQJSGlFKUaBVL4GgWR0BjKSF9KEnLdX2UKGgGaAloD0MIMLsnD8v1ckCUhpRSlGgVS9BoFkdAYynxLCemN3V9lChoBmgJaA9DCPrxlxY1qnNAlIaUUpRoFUvnaBZHQGMqZUT+NtJ1fZQoaAZoCWgPQwjt1jIZzgZyQJSGlFKUaBVL3WgWR0BjLN1wHZ9NdX2UKGgGaAloD0MIXW+bqRC9cUCUhpRSlGgVS8xoFkdAYy5h4t6HCXV9lChoBmgJaA9DCKBuoMC7Y3NAlIaUUpRoFUu/aBZHQGMupSBK+SN1fZQoaAZoCWgPQwilLa7xWZtzQJSGlFKUaBVLwWgWR0BjM2P91loUdX2UKGgGaAloD0MI0XR2MrjlcECUhpRSlGgVS8BoFkdAYzefs/pt8HV9lChoBmgJaA9DCAAAAADAtXFAlIaUUpRoFUvCaBZHQGM3zC1qnFZ1fZQoaAZoCWgPQwjZ7h6ge+ZyQJSGlFKUaBVLuWgWR0BjN7lcQiA2dX2UKGgGaAloD0MIXYjVH2HfcECUhpRSlGgVS9NoFkdAYzoIUJv5xnV9lChoBmgJaA9DCL7Z5sa05XFAlIaUUpRoFUvUaBZHQGM7a1kUbkx1fZQoaAZoCWgPQwiuZMdGoG1xQJSGlFKUaBVLwWgWR0BjRWkk8ifQdX2UKGgGaAloD0MI2xZlNsi6cUCUhpRSlGgVS9ZoFkdAY0VScbzbvnV9lChoBmgJaA9DCAvRIXBkS3JAlIaUUpRoFUvKaBZHQGRX2sA/9pB1fZQoaAZoCWgPQwgujspNFJRxQJSGlFKUaBVLsWgWR0BkWP8O09hadX2UKGgGaAloD0MINNWT+YebcUCUhpRSlGgVS85oFkdAZGBr7fpD/nV9lChoBmgJaA9DCHNJ1XYT125AlIaUUpRoFUvDaBZHQGRg29cry2B1fZQoaAZoCWgPQwjdJXFWxNJvQJSGlFKUaBVLvWgWR0BkYY0hvBJqdX2UKGgGaAloD0MIlj50QX1kcECUhpRSlGgVS8loFkdAZGQsRQJokHV9lChoBmgJaA9DCAGG5c83ZXFAlIaUUpRoFUvraBZHQGRkp9ZzPrx1fZQoaAZoCWgPQwiJC0CjNONzQJSGlFKUaBVL3WgWR0BkZINVinYQdX2UKGgGaAloD0MI9HAC02nRc0CUhpRSlGgVS8toFkdAZG5lHSWqtHV9lChoBmgJaA9DCJZBtcEJiXFAlIaUUpRoFUvdaBZHQGRyuIhyKel1fZQoaAZoCWgPQwhoB1xXDD9zQJSGlFKUaBVL4WgWR0Bkc8X3xnWbdX2UKGgGaAloD0MI93ZLcsDQcUCUhpRSlGgVS9RoFkdAZHOf0VafSXV9lChoBmgJaA9DCH9Ma9OYH3NAlIaUUpRoFUv4aBZHQGR0F8PWhAZ1fZQoaAZoCWgPQwjE6LmFrjRzQJSGlFKUaBVL0GgWR0BkdFZNfw7UdX2UKGgGaAloD0MID9Qpjy7DcUCUhpRSlGgVS71oFkdAZHlBFd9lVnV9lChoBmgJaA9DCKhxb37D8m9AlIaUUpRoFUvOaBZHQGR83cHnln11fZQoaAZoCWgPQwi/KaxUEGpzQJSGlFKUaBVLvWgWR0Bkga925hBrdX2UKGgGaAloD0MIeLeyRCcYcUCUhpRSlGgVS8poFkdAZIM56t1ZDHV9lChoBmgJaA9DCFZl3xXB9XFAlIaUUpRoFUuqaBZHQGSE974SHuZ1fZQoaAZoCWgPQwj6QzNPLjBxQJSGlFKUaBVLsmgWR0Bkhiohpxm1dX2UKGgGaAloD0MIsW8nESHtckCUhpRSlGgVS8poFkdAZIvpN9H+ZXV9lChoBmgJaA9DCDPFHARdj3NAlIaUUpRoFUvDaBZHQGSNHoouwot1fZQoaAZoCWgPQwj0bFZ9rk9uQJSGlFKUaBVLxmgWR0BkjVBa9sabdX2UKGgGaAloD0MITYHMzqKLUECUhpRSlGgVS35oFkdAZI2u14Pf9HV9lChoBmgJaA9DCByastMPBm9AlIaUUpRoFUvNaBZHQGSPEQwsXi11fZQoaAZoCWgPQwjG/NzQFJ9xQJSGlFKUaBVL0WgWR0BkmVdmg8KYdX2UKGgGaAloD0MI4gD6fX/xcECUhpRSlGgVS79oFkdAZJpqC6H0snV9lChoBmgJaA9DCNDtJY0RDHBAlIaUUpRoFUu+aBZHQGSaiqp97Wx1fZQoaAZoCWgPQwg8SiU8IVJwQJSGlFKUaBVL2mgWR0BknxnezlcRdX2UKGgGaAloD0MI5IV0eMjYcECUhpRSlGgVS79oFkdAZKB6Q/5cknV9lChoBmgJaA9DCHKo34Vts3BAlIaUUpRoFUveaBZHQGSgt5le4Td1fZQoaAZoCWgPQwi5NlSMM0txQJSGlFKUaBVL1GgWR0BkqIG6f8MvdX2UKGgGaAloD0MIHogs0sRHSUCUhpRSlGgVS4VoFkdAZKp7sOXmeXV9lChoBmgJaA9DCGhAvRm1fXFAlIaUUpRoFUvWaBZHQGStxTjvNNd1fZQoaAZoCWgPQwiUS+MXHhJyQJSGlFKUaBVL0mgWR0BkroK6WgOCdX2UKGgGaAloD0MIcHztmaU1ckCUhpRSlGgVS8toFkdAZK6TIvJzUHV9lChoBmgJaA9DCPUUOUQcT3FAlIaUUpRoFUu2aBZHQGSykU9IPLB1fZQoaAZoCWgPQwgWbY5zW9hxQJSGlFKUaBVL3mgWR0Bks6jJuEVWdX2UKGgGaAloD0MIZFjFGxl7ckCUhpRSlGgVS8xoFkdAZLXhrFfiP3V9lChoBmgJaA9DCJNUppiDsG5AlIaUUpRoFUvJaBZHQGS281n/T9d1fZQoaAZoCWgPQwjHgOz1rmxxQJSGlFKUaBVL0WgWR0BkuDxEv0yydX2UKGgGaAloD0MIj4r/O2IWcUCUhpRSlGgVS61oFkdAZMKWmgrYoXV9lChoBmgJaA9DCMJQhxVurXBAlIaUUpRoFUvFaBZHQGTDCbDuSfV1fZQoaAZoCWgPQwhK7UW03SRzQJSGlFKUaBVL1WgWR0BkxUP8Q7LddX2UKGgGaAloD0MImpguxOr0cUCUhpRSlGgVS+FoFkdAZMkf29L6DXV9lChoBmgJaA9DCHEfuTUpJHFAlIaUUpRoFUveaBZHQGTO4Glhw2l1fZQoaAZoCWgPQwiTpkHRfKBxQJSGlFKUaBVLvmgWR0Bk0BbGFSKndX2UKGgGaAloD0MIchQgCuYcc0CUhpRSlGgVS+VoFkdAZNA1sLv1DnV9lChoBmgJaA9DCMAjKlR3zHJAlIaUUpRoFUu8aBZHQGTV+2/i5ut1fZQoaAZoCWgPQwhdFajFoKRxQJSGlFKUaBVL0mgWR0Bk1nP7el9CdX2UKGgGaAloD0MIC9P3GkI0cECUhpRSlGgVS8xoFkdAZNh3TNMXanV9lChoBmgJaA9DCHbicrwC53NAlIaUUpRoFUvNaBZHQGTZaE8JUo91fZQoaAZoCWgPQwiCixU1mO5wQJSGlFKUaBVL0mgWR0Bk3pK15Sm7dX2UKGgGaAloD0MICRUcXlDWckCUhpRSlGgVS7xoFkdAZN+8+RoysXV9lChoBmgJaA9DCNP1RNfFF3FAlIaUUpRoFUvJaBZHQGThF23azu51fZQoaAZoCWgPQwhJ2SJpN29xQJSGlFKUaBVL2WgWR0Bk4RwEQoTgdX2UKGgGaAloD0MIHLeYn9v1cUCUhpRSlGgVS95oFkdAZOQ5o4+8oXV9lChoBmgJaA9DCM5Q3PEmXU1AlIaUUpRoFUujaBZHQGTk5n13+uN1fZQoaAZoCWgPQwgSL0/nysJwQJSGlFKUaBVLxmgWR0Bk7rfWMCLddX2UKGgGaAloD0MIjWDj+ndHckCUhpRSlGgVS9RoFkdAZO9xRVIZqHV9lChoBmgJaA9DCD6w478AEXNAlIaUUpRoFUvNaBZHQGTz8BMi8nN1fZQoaAZoCWgPQwiES8ecJyJxQJSGlFKUaBVLxGgWR0Bk+SlxffGddX2UKGgGaAloD0MIflLt03EnckCUhpRSlGgVS8loFkdAZPkgSOBDonV9lChoBmgJaA9DCDsBTYRN/3BAlIaUUpRoFUvKaBZHQGT6kv9LpRp1fZQoaAZoCWgPQwgfEr73t1lxQJSGlFKUaBVLuGgWR0Bk/OgxrSE2dX2UKGgGaAloD0MIgIEgQIZAckCUhpRSlGgVS8JoFkdAZP5xwQ176nV9lChoBmgJaA9DCOj0vBtLWHFAlIaUUpRoFUu+aBZHQGUBDASFoL51fZQoaAZoCWgPQwgtW+uLROpwQJSGlFKUaBVLumgWR0BlBYnH/95ydX2UKGgGaAloD0MIrd9MTFcfc0CUhpRSlGgVS9poFkdAZQYB3A2ycHV9lChoBmgJaA9DCKuVCb/UHXNAlIaUUpRoFUvAaBZHQGUJmmk30f51fZQoaAZoCWgPQwiHNCpwcvJyQJSGlFKUaBVL3WgWR0BlDlQj2SMcdX2UKGgGaAloD0MIkXu6uiMccUCUhpRSlGgVS9hoFkdAZQ61YyO7x3V9lChoBmgJaA9DCIguqG/ZV3JAlIaUUpRoFUvTaBZHQGURpyhi9Zl1fZQoaAZoCWgPQwh5AmGnGKdzQJSGlFKUaBVL2mgWR0BlEm4Cp3otdX2UKGgGaAloD0MI/0C5bV/3ckCUhpRSlGgVS8hoFkdAZRlFRYRuj3V9lChoBmgJaA9DCJ6ayw2GCHNAlIaUUpRoFUvgaBZHQGUfF8G9pRJ1fZQoaAZoCWgPQwjBjv8CwWpxQJSGlFKUaBVLzmgWR0BlH6gh8pkPdX2UKGgGaAloD0MIVK2FWSjDckCUhpRSlGgVS7loFkdAZSHVp9JBgXV9lChoBmgJaA9DCLU1IhgH0XJAlIaUUpRoFUvHaBZHQGUjWbobGWF1fZQoaAZoCWgPQwhi2jf3V5B0QJSGlFKUaBVLz2gWR0BlJcX7+DODdX2UKGgGaAloD0MII4eIm9P6ckCUhpRSlGgVS7hoFkdAZSZcVQAMlXV9lChoBmgJaA9DCPorZK7MhXFAlIaUUpRoFUvGaBZHQGUn4tHxz7x1ZS4="
73
  },
74
  "ep_success_buffer": {
75
  ":type:": "<class 'collections.deque'>",
76
  ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
77
  },
78
+ "_n_updates": 1300,
79
  "n_steps": 1024,
80
  "gamma": 0.999,
81
+ "gae_lambda": 0.999,
82
  "ent_coef": 0.01,
83
  "vf_coef": 0.5,
84
  "max_grad_norm": 0.5,
 
86
  "n_epochs": 4,
87
  "clip_range": {
88
  ":type:": "<class 'function'>",
89
+ ":serialized:": "gAWVvwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwNX2J1aWx0aW5fdHlwZZSTlIwKTGFtYmRhVHlwZZSFlFKUKGgCjAhDb2RlVHlwZZSFlFKUKEsBSwBLAUsBSxNDBIgAUwCUToWUKYwBX5SFlIxIL3Vzci9sb2NhbC9saWIvcHl0aG9uMy43L2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5RLgEMCAAGUjAN2YWyUhZQpdJRSlH2UKIwLX19wYWNrYWdlX1+UjBhzdGFibGVfYmFzZWxpbmVzMy5jb21tb26UjAhfX25hbWVfX5SMHnN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi51dGlsc5SMCF9fZmlsZV9flIxIL3Vzci9sb2NhbC9saWIvcHl0aG9uMy43L2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaCB9lH2UKGgXaA6MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgYjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz+5mZmZmZmahZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"
90
  },
91
  "clip_range_vf": null,
92
+ "normalize_advantage": false,
93
  "target_kl": null
94
  }
ppo-LunarLander-v2/policy.optimizer.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e5fc6044145949a07211b1b357eeb7976be72f5a95856f9ae2fc031e9982ec1e
3
  size 84893
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ab56f4caf59c97ad8139fb9dacaba44adc4d1c74ae53323f927855bb4f770a7d
3
  size 84893
ppo-LunarLander-v2/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b725eeb70265f746106b740a1b7e08681c6bf5e8d9adc23aaf2bb8d2c9306cc1
3
  size 43201
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cc0d5ea822f8f3d70e76c7929e990831093fef67cad6ff19bc62f3e433e1d1ba
3
  size 43201
replay.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:32f9b84b2c5cb8d406dd40abe7d0bfa823ebf869046aa1481c12460883708620
3
- size 175078
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:118122b74db75a232a9759bf566e63c5466a636a640822b8fba88ebcf348fbfd
3
+ size 180076
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 293.20748935316885, "std_reward": 12.61962443813718, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2022-05-05T10:44:15.034479"}
 
1
+ {"mean_reward": 282.02283071796126, "std_reward": 22.455474163386626, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2022-05-05T11:31:08.792742"}