nkt32 commited on
Commit
a5d5033
1 Parent(s): ca50aa8

Upload PPO LunarLander-v2 trained agent

Browse files
README.md CHANGED
@@ -10,7 +10,7 @@ model-index:
10
  results:
11
  - metrics:
12
  - type: mean_reward
13
- value: 265.08 +/- 15.39
14
  name: mean_reward
15
  task:
16
  type: reinforcement-learning
10
  results:
11
  - metrics:
12
  - type: mean_reward
13
+ value: 265.99 +/- 20.58
14
  name: mean_reward
15
  task:
16
  type: reinforcement-learning
config.json CHANGED
@@ -1 +1 @@
1
- {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param sde_net_arch: Network architecture for extracting features\n when using gSDE. If None, the latent features from the policy will be used.\n Pass an empty list to use the states as features.\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7f4977a5ce50>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f4977a5cee0>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f4977a5cf70>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f4977a5b040>", "_build": "<function ActorCriticPolicy._build at 0x7f4977a5b0d0>", "forward": "<function ActorCriticPolicy.forward at 0x7f4977a5b160>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f4977a5b1f0>", "_predict": "<function ActorCriticPolicy._predict at 0x7f4977a5b280>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f4977a5b310>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f4977a5b3a0>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f4977a5b430>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc_data object at 0x7f49779df0f0>"}, "verbose": 1, "policy_kwargs": {}, "observation_space": {":type:": "<class 'gym.spaces.box.Box'>", ":serialized:": "gAWVnwEAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLCIWUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWIAAAAAAAAAAAAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/5RoCksIhZSMAUOUdJRSlIwEaGlnaJRoEiiWIAAAAAAAAAAAAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAf5RoCksIhZRoFXSUUpSMDWJvdW5kZWRfYmVsb3eUaBIolggAAAAAAAAAAAAAAAAAAACUaAeMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLCIWUaBV0lFKUjA1ib3VuZGVkX2Fib3ZllGgSKJYIAAAAAAAAAAAAAAAAAAAAlGghSwiFlGgVdJRSlIwKX25wX3JhbmRvbZROdWIu", "dtype": "float32", "_shape": [8], "low": "[-inf -inf -inf -inf -inf -inf -inf -inf]", "high": "[inf inf inf inf inf inf inf inf]", "bounded_below": "[False False False False False False False False]", "bounded_above": "[False False False False False False False False]", "_np_random": null}, "action_space": {":type:": "<class 'gym.spaces.discrete.Discrete'>", ":serialized:": "gAWVggAAAAAAAACME2d5bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpRLBIwGX3NoYXBllCmMBWR0eXBllIwFbnVtcHmUaAeTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYowKX25wX3JhbmRvbZROdWIu", "n": 4, "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 32, "num_timesteps": 2031616, "_total_timesteps": 2000000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1652215080.7988598, "learning_rate": 0.0003, "tensorboard_log": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVfgIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwNX2J1aWx0aW5fdHlwZZSTlIwKTGFtYmRhVHlwZZSFlFKUKGgCjAhDb2RlVHlwZZSFlFKUKEsBSwBLAEsBSwFLE0MEiABTAJROhZQpjAFflIWUjE4vaG9tZS9ua3QvLmxvY2FsL2xpYi9weXRob24zLjgvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuAQwIAAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UaA11Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoF2gOjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoGIwHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/M6kqMFUyYYWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="}, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQQAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYABAAAAAAAALNueb5AvEw/8kAKvm+xyb4cYIO+veWnPQAAAAAAAAAAzf4fvODZtD/TcEK+o3QRvTc8N7pCAca8AAAAAAAAAABm/5e9XMNmuua+RzxzPSY8dHq7uhEZPDwAAAAAAACAP4Atfz6GtxI/HWKVvlINqr5TKrg9+oLjvQAAAAAAAAAA87oZvi6uhz51THA8Ib54vp28mL1gWhk7AAAAAAAAAABmlU093ZSVPy+zvj3B9Oa+o4abPaM20jwAAAAAAAAAAJocNT3Gzqo/+pPoPjWt976j6kg8BnYuPgAAAAAAAAAAZijTPFxfCrwx88S8fNLqPEfIYj3Wc7+9AACAPwAAgD9NUEA+noPAPssRRr4aDZm+nfgnPfHbE70AAAAAAAAAACO6er535iK9ynNPNluyK7TR9ow+nouHtQAAgD8AAIA/zQoSvOwQoj9P7iS9Cn/uvsM6Gr31QU68AAAAAAAAAAAAp0i9v5PlPlFfJ74oTYa+ieiZvd63jr0AAAAAAAAAAACO0LwP/D49gFhyPVo/Rb7gzHU4mLLpuwAAAAAAAAAA0zSUPrHlTT+usaU+a+LQvv121z4csL49AAAAAAAAAADAw4+9dtpcP7ZIO70rTue+6lG9vaKqSDsAAAAAAAAAAJrO4L2rrRI/2jacPKoulb5NGBq9EKV7vQAAAAAAAAAABkeCvg/WKj+6Lh89pe3UvuHfPr6amec9AAAAAAAAAAAzc94511MxuzYT3zv/CoM8aSszvHILYz0AAIA/AACAP1r/ij5aaxc/kqJCvu6xor7M5N09Qyr6vQAAAAAAAAAAzQCaPK7Jnrodjd006YCZL/rIITpR/SS0AACAPwAAgD9mYrq8KQh1ul38KLSsip6v5eLvOObiqjMAAIA/AACAP9oyy73ETJc/Hm0wvsHU7b4BNQ++VTYEvQAAAAAAAAAA5hthvejgcD91rsO9z0LJvn0olL1DSgA9AAAAAAAAAAAA7kW+FEOIvIXk5LsctCS6ff7pPYUQBDsAAIA/AACAP5phMjvv5O4+9w8pvOo8ob5RmJc8/gW7uwAAAAAAAAAAzVJUPJtQKj8y0iC+grXRvqCs/byVviW9AAAAAAAAAACalb87PFARPXMq/jywQ3C+FeqMvP7hHL0AAAAAAAAAAJp5KjopxAG6y91Mtrw9XDB6PyK7RRZ4NQAAgD8AAIA/AEeJvVxLTrrDQNQ6cXOINXr8QToWZ/q5AACAPwAAgD/N+5u8rqOUuvpOqL01jD2+09ltvEJ3wT4AAIA/AAAAABr9XD0lwXk+iQ25vb3wlr6kpAq9wvaCvQAAAAAAAAAAxjoKPoElcT+We96902rdvj4Z9j314ae9AAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJmNJSJiIeUUpQoSwOMATyUTk5OSv////9K/////0sAdJRiSyBLCIaUjAFDlHSUUpQu"}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVkwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYgAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksghZSMAUOUdJRSlC4="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.015808000000000044, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVZhAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIBcHj2zujcECUhpRSlIwBbJRNBQGMAXSUR0CWstFxGUfQdX2UKGgGaAloD0MIsd8T61TKckCUhpRSlGgVTRIBaBZHQJayzOcDr7h1fZQoaAZoCWgPQwi0BBkB1adxQJSGlFKUaBVL9WgWR0CWsswtrbg1dX2UKGgGaAloD0MI5GVNLPAIcUCUhpRSlGgVS/FoFkdAlrLTm8ujAXV9lChoBmgJaA9DCInsgyzLknFAlIaUUpRoFUv4aBZHQJay+FfzBhx1fZQoaAZoCWgPQwiKx0W1iLJtQJSGlFKUaBVNBAFoFkdAlrNTSG8Em3V9lChoBmgJaA9DCECmtWksV3FAlIaUUpRoFU0zAWgWR0CWs26STyJ9dX2UKGgGaAloD0MIOV6B6Mk+c0CUhpRSlGgVS/FoFkdAlrP4O6NEPXV9lChoBmgJaA9DCE7RkVx+vm5AlIaUUpRoFUvwaBZHQJa1EPWhAW11fZQoaAZoCWgPQwhbCd0lsXxwQJSGlFKUaBVNDwFoFkdAlrUy5I6KcnV9lChoBmgJaA9DCM8SZASUsXFAlIaUUpRoFU0lAWgWR0CWtVJ7b+LndX2UKGgGaAloD0MI2T7kLdcwcUCUhpRSlGgVTTQBaBZHQJa1V9v0h/11fZQoaAZoCWgPQwgudZDXg2xyQJSGlFKUaBVNBwFoFkdAlrY2CiAUcnV9lChoBmgJaA9DCOfib3vC6HFAlIaUUpRoFUv3aBZHQJa2NDNQj2V1fZQoaAZoCWgPQwjaU3JOrG9xQJSGlFKUaBVNIQFoFkdAlraR6By0bHV9lChoBmgJaA9DCJVE9kEWX25AlIaUUpRoFUvyaBZHQJa2oyBTXJ51fZQoaAZoCWgPQwhVoBaDh8htQJSGlFKUaBVNFQFoFkdAlrbETHsC1nV9lChoBmgJaA9DCL5qZcIvsHBAlIaUUpRoFU0tAWgWR0CWtvNmDlHSdX2UKGgGaAloD0MIQ3QIHMmscUCUhpRSlGgVTQEBaBZHQJa2/K1XvH91fZQoaAZoCWgPQwgRcAhVqq1yQJSGlFKUaBVNHAFoFkdAlrcn3cpLEnV9lChoBmgJaA9DCB0B3Cze8nJAlIaUUpRoFU0KAWgWR0CWt+3SKFZgdX2UKGgGaAloD0MIKV36l6QMcUCUhpRSlGgVTQABaBZHQJa3+qS5iEx1fZQoaAZoCWgPQwicTrLVJTNyQJSGlFKUaBVNGwFoFkdAlrjTkZJkG3V9lChoBmgJaA9DCCDsFKsGgXJAlIaUUpRoFU0HAWgWR0CWuPBYFJQMdX2UKGgGaAloD0MIy9k7oy1OcECUhpRSlGgVTRQBaBZHQJa5MBcRlH11fZQoaAZoCWgPQwgUBmUazfBxQJSGlFKUaBVNMgFoFkdAlrlPhddE9nV9lChoBmgJaA9DCMOC+wFPfnNAlIaUUpRoFU0MAWgWR0CWuV4u9OARdX2UKGgGaAloD0MINq/qrNbZcUCUhpRSlGgVTRwBaBZHQJa5dMbm2b51fZQoaAZoCWgPQwjs2t5uSWtxQJSGlFKUaBVL62gWR0CWucd/axoqdX2UKGgGaAloD0MIbAVNS2wqc0CUhpRSlGgVTRQBaBZHQJa52tga3ql1fZQoaAZoCWgPQwgfaAWGbENyQJSGlFKUaBVL+WgWR0CWulbKRuCPdX2UKGgGaAloD0MIUn5S7VOycECUhpRSlGgVTQUBaBZHQJa6rJcPe551fZQoaAZoCWgPQwh47dKGw1NyQJSGlFKUaBVNHAFoFkdAlrtujIq9XnV9lChoBmgJaA9DCO9YbJMKHW5AlIaUUpRoFU0nAWgWR0CWu48rI5o5dX2UKGgGaAloD0MIJXUCmoj8b0CUhpRSlGgVTScBaBZHQJa7yGfwqiJ1fZQoaAZoCWgPQwjRArSt5rtuQJSGlFKUaBVNEAFoFkdAlrvQEpy6tnV9lChoBmgJaA9DCNXrFoFxU3BAlIaUUpRoFU0FAWgWR0CWvBm03Ov/dX2UKGgGaAloD0MInbryWd6fcECUhpRSlGgVTS0BaBZHQJa8LJDE3sJ1fZQoaAZoCWgPQwg74SU4NQdyQJSGlFKUaBVL62gWR0CWvKU+LWI5dX2UKGgGaAloD0MIXvOqzqo7cUCUhpRSlGgVS/ZoFkdAlrzfI8yN43V9lChoBmgJaA9DCGtj7IQXb3JAlIaUUpRoFU0/AWgWR0CWvSjiGWUsdX2UKGgGaAloD0MIn1p9ddUkbUCUhpRSlGgVTQ4BaBZHQJa9fEpAlfJ1fZQoaAZoCWgPQwjY8sr1dkhxQJSGlFKUaBVL7mgWR0CWve0zCUHIdX2UKGgGaAloD0MIMT83NGU3cECUhpRSlGgVTRcBaBZHQJa+Bn003wV1fZQoaAZoCWgPQwgtQxzr4s1wQJSGlFKUaBVL7WgWR0CWvhWHDaXbdX2UKGgGaAloD0MIxqUqbTERcECUhpRSlGgVS/hoFkdAlr5KbSZ0CHV9lChoBmgJaA9DCMVwdQDEWXFAlIaUUpRoFU0MAWgWR0CWvn5vtMPCdX2UKGgGaAloD0MIOJ86VqmmcUCUhpRSlGgVTR0BaBZHQJa/AZOzpot1fZQoaAZoCWgPQwhJ88e09slyQJSGlFKUaBVNDAFoFkdAlr9kYsNDt3V9lChoBmgJaA9DCPUu3o+bI3FAlIaUUpRoFU0XAWgWR0CWv469TP0JdX2UKGgGaAloD0MIqFFIMqsTQ0CUhpRSlGgVS8BoFkdAlsCxUedTYXV9lChoBmgJaA9DCET5ghaSA3NAlIaUUpRoFU08AWgWR0CWwLrPdEb6dX2UKGgGaAloD0MI16GakqzEbUCUhpRSlGgVTQABaBZHQJbA4E9t/F11fZQoaAZoCWgPQwiVtU3xuM5wQJSGlFKUaBVL9mgWR0CWwPzmfXf7dX2UKGgGaAloD0MIPN154nmocUCUhpRSlGgVTSUBaBZHQJbBDfbblBB1fZQoaAZoCWgPQwjT+lsCcBVyQJSGlFKUaBVNKAFoFkdAlsExmTTvzHV9lChoBmgJaA9DCAnf+xs0OXFAlIaUUpRoFUv5aBZHQJbBmYRdyDJ1fZQoaAZoCWgPQwjsvmN4bAdyQJSGlFKUaBVNBAFoFkdAlsHbg0j1PHV9lChoBmgJaA9DCI51cRvNV3BAlIaUUpRoFU0iAWgWR0CWwitIClrNdX2UKGgGaAloD0MIr0LKT2qmcUCUhpRSlGgVTT0BaBZHQJbCrLyMDOl1fZQoaAZoCWgPQwiCjla1ZLdwQJSGlFKUaBVNGAFoFkdAlsMkRaouPHV9lChoBmgJaA9DCK4NFeN8yHFAlIaUUpRoFUv3aBZHQJbDMnYxtYV1fZQoaAZoCWgPQwjaklURLvpwQJSGlFKUaBVL7GgWR0CWwzY5T6zmdX2UKGgGaAloD0MIXHFxVK4xcECUhpRSlGgVTUUBaBZHQJbDb6wdKdx1fZQoaAZoCWgPQwhaKQRySXJxQJSGlFKUaBVNCAFoFkdAlsPZNTLntHV9lChoBmgJaA9DCGA7GLFPgC9AlIaUUpRoFUuRaBZHQJbEBVQyhzx1fZQoaAZoCWgPQwjI0LGDildwQJSGlFKUaBVNDAFoFkdAlsQu6unuRnV9lChoBmgJaA9DCMfZdAQwfHFAlIaUUpRoFU0SAWgWR0CWxMDRtxdZdX2UKGgGaAloD0MIY7fPKvMOcUCUhpRSlGgVTRYBaBZHQJbEz2/SH/N1fZQoaAZoCWgPQwjTM73EWKBsQJSGlFKUaBVNCQFoFkdAlsTzHwPRRnV9lChoBmgJaA9DCIIDWrrCxHJAlIaUUpRoFUvvaBZHQJbE/RzBAOd1fZQoaAZoCWgPQwj8Gd6sQU1wQJSGlFKUaBVNCgFoFkdAlsV3BxgiNnV9lChoBmgJaA9DCCRkIM/uJ3FAlIaUUpRoFU0YAWgWR0CWxZrq+rU9dX2UKGgGaAloD0MIbt3NU52Fb0CUhpRSlGgVS/VoFkdAlsXwmiQDFXV9lChoBmgJaA9DCLlTOlg/KnFAlIaUUpRoFU0IAWgWR0CWxia1kUbldX2UKGgGaAloD0MI3LdaJy5LRUCUhpRSlGgVS69oFkdAlsYnlOoHcHV9lChoBmgJaA9DCK+XpgiwznFAlIaUUpRoFUvvaBZHQJbHCa1Cw8p1fZQoaAZoCWgPQwgewCK//nxxQJSGlFKUaBVNAwFoFkdAlsccDOkcj3V9lChoBmgJaA9DCKSJd4DnTnJAlIaUUpRoFU0uAWgWR0CWx3jNIK+jdX2UKGgGaAloD0MIdCmuKjtxckCUhpRSlGgVTScBaBZHQJbHse7tiQV1fZQoaAZoCWgPQwgEdjV5CmRyQJSGlFKUaBVL62gWR0CWyEr/bTMJdX2UKGgGaAloD0MIIlD9gwiFcUCUhpRSlGgVTQkBaBZHQJbJKXa8HwB1fZQoaAZoCWgPQwgh5SfVfn5yQJSGlFKUaBVNJwFoFkdAlsoShJyyU3V9lChoBmgJaA9DCHfWbrtQ/HFAlIaUUpRoFUv7aBZHQJbKJl6JIlN1fZQoaAZoCWgPQwhl3qrrEGNyQJSGlFKUaBVNgAFoFkdAlsol0knkUHV9lChoBmgJaA9DCGIRww4jUnFAlIaUUpRoFU0IAWgWR0CWykGPPszEdX2UKGgGaAloD0MIotXJGcoxc0CUhpRSlGgVTSQBaBZHQJbKT8ZUDMh1fZQoaAZoCWgPQwjoE3mS9PFwQJSGlFKUaBVNFgFoFkdAlspwSnLq2XV9lChoBmgJaA9DCGe3lsmwd3JAlIaUUpRoFU0mAWgWR0CWyoS0BwMqdX2UKGgGaAloD0MIecpqup6lc0CUhpRSlGgVTQsBaBZHQJbLJM6BAfN1fZQoaAZoCWgPQwg51VqYBS5vQJSGlFKUaBVNBwFoFkdAlst40dilSHV9lChoBmgJaA9DCBr8/WL2p3JAlIaUUpRoFU0LAWgWR0CWy6gsK9f1dX2UKGgGaAloD0MIwXRatwGOckCUhpRSlGgVTQgBaBZHQJbLzpQk5ZN1fZQoaAZoCWgPQwhZiA6BY4dwQJSGlFKUaBVNEQFoFkdAlsvefdyksXV9lChoBmgJaA9DCGiXb31YAnBAlIaUUpRoFUv4aBZHQJbMD3SKFZh1fZQoaAZoCWgPQwi6S+KsCNRuQJSGlFKUaBVNAgFoFkdAlsw03S8aoHV9lChoBmgJaA9DCMSZX82B43BAlIaUUpRoFU0WAWgWR0CWzKT72tdSdX2UKGgGaAloD0MIkuo7v+iZcECUhpRSlGgVTQoBaBZHQJbNLUYsNDt1fZQoaAZoCWgPQwgGZ/D3S5pyQJSGlFKUaBVNDAFoFkdAls1yQkona3V9lChoBmgJaA9DCBhEpKZd/nBAlIaUUpRoFU0PAWgWR0CWzZUz9CNTdWUu"}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 248, "n_steps": 1024, "gamma": 0.999, "gae_lambda": 0.98, "ent_coef": 0.01, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 4, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWVfgIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwNX2J1aWx0aW5fdHlwZZSTlIwKTGFtYmRhVHlwZZSFlFKUKGgCjAhDb2RlVHlwZZSFlFKUKEsBSwBLAEsBSwFLE0MEiABTAJROhZQpjAFflIWUjE4vaG9tZS9ua3QvLmxvY2FsL2xpYi9weXRob24zLjgvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuAQwIAAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UaA11Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoF2gOjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoGIwHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/yZmZmZmZmoWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "system_info": {"OS": "Linux-5.4.0-109-generic-x86_64-with-glibc2.29 #123-Ubuntu SMP Fri Apr 8 09:10:54 UTC 2022", "Python": "3.8.10", "Stable-Baselines3": "1.5.0", "PyTorch": "1.11.0+cu113", "GPU Enabled": "True", "Numpy": "1.21.2", "Gym": "0.21.0"}}
1
+ {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param sde_net_arch: Network architecture for extracting features\n when using gSDE. If None, the latent features from the policy will be used.\n Pass an empty list to use the states as features.\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7f4996344c10>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f4996344ca0>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f4996344d30>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f4996344dc0>", "_build": "<function ActorCriticPolicy._build at 0x7f4996344e50>", "forward": "<function ActorCriticPolicy.forward at 0x7f4996344ee0>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f4996344f70>", "_predict": "<function ActorCriticPolicy._predict at 0x7f49962c7040>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f49962c70d0>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f49962c7160>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f49962c71f0>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc_data object at 0x7f4996336f90>"}, "verbose": 1, "policy_kwargs": {}, "observation_space": {":type:": "<class 'gym.spaces.box.Box'>", ":serialized:": "gAWVnwEAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLCIWUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWIAAAAAAAAAAAAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/5RoCksIhZSMAUOUdJRSlIwEaGlnaJRoEiiWIAAAAAAAAAAAAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAf5RoCksIhZRoFXSUUpSMDWJvdW5kZWRfYmVsb3eUaBIolggAAAAAAAAAAAAAAAAAAACUaAeMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLCIWUaBV0lFKUjA1ib3VuZGVkX2Fib3ZllGgSKJYIAAAAAAAAAAAAAAAAAAAAlGghSwiFlGgVdJRSlIwKX25wX3JhbmRvbZROdWIu", "dtype": "float32", "_shape": [8], "low": "[-inf -inf -inf -inf -inf -inf -inf -inf]", "high": "[inf inf inf inf inf inf inf inf]", "bounded_below": "[False False False False False False False False]", "bounded_above": "[False False False False False False False False]", "_np_random": null}, "action_space": {":type:": "<class 'gym.spaces.discrete.Discrete'>", ":serialized:": "gAWVggAAAAAAAACME2d5bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpRLBIwGX3NoYXBllCmMBWR0eXBllIwFbnVtcHmUaAeTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYowKX25wX3JhbmRvbZROdWIu", "n": 4, "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 32, "num_timesteps": 2031616, "_total_timesteps": 2000000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1652216888.4359014, "learning_rate": 0.0003, "tensorboard_log": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVfgIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwNX2J1aWx0aW5fdHlwZZSTlIwKTGFtYmRhVHlwZZSFlFKUKGgCjAhDb2RlVHlwZZSFlFKUKEsBSwBLAEsBSwFLE0MEiABTAJROhZQpjAFflIWUjE4vaG9tZS9ua3QvLmxvY2FsL2xpYi9weXRob24zLjgvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuAQwIAAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UaA11Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoF2gOjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoGIwHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/M6kqMFUyYYWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="}, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQQAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYABAAAAAAAALO5rz2PZlW6wHd0uje8b7WScMY6cBuOOQAAgD8AAIA/mtQxPR+dmbmKAV26tvscvXohR7smGT29AAAAAAAAAABm9tW6XPNjuh1hGLokqAm1NSdeOjD0MjkAAIA/AACAP5ot8rx5TG8+zsQyu8CDl77VMM68NfRVPQAAAAAAAAAAZt4xPK7dkLrO2CK6ZJhHNd/9zLobNTk5AACAPwAAgD+zQS499uwZuptFcrkJf/Gz6aOYuWb5jDgAAIA/AACAPzMJ5rwppB66eqFzOrf6MDXBJPu6xdaQuQAAgD8AAIA/Gjk2vfboPrp7r+Y54tpZNdwW6DoPjwe5AACAPwAAgD8zk3E7hcOrueTfpDtDSf03vZ6kumAPg7UAAIA/AACAPzNgLD1y35o/FmP2PaCo6L66/lU8H2oFPAAAAAAAAAAAM0j6vI++crq+3NW3Nhwhs5S2YjpWpPc2AACAPwAAgD8AIQQ9cdQgu3v2RD4lIJ88SrlOvApbiD0AAIA/AACAPzMD5ropYEq64wlgumY7Krar8GU6/JCDOQAAgD8AAIA/zajrvMOpHLptYY27EAqPOBPhvLrYJwY6AACAPwAAgD9myt48KXgyuqXx6bnmePC04jDEOQDaBTkAAIA/AACAPwAHgb2Fi5W54ibfunPuCjV5RHy78aIEOgAAgD8AAIA/zSQhO0iVoLqKRhK6IJIgurlag7sW1p86AACAPwAAgD/NVJc9PRooud61hLqNA0CzdacmOpC4ADMAAIA/AACAP2aylztcAy26MrMbOrwcADVfQFM7f002uQAAgD8AAIA/AFlkPY+eZboIuw84rv1qtvnmLrpS5By3AAAAAAAAgD/mSDE9XCNJuhKlmrXzl8iwEjoLOR/urDQAAIA/AACAPw0EB7640yw/WpfPPYGsrL4G/J68spQGvQAAAAAAAAAAbRRMvgEJtrzmR8W7cqA1unCcHT6EZQ47AACAPwAAgD/myEu9HqeDPtghXT3E8XW+oCxKPD5kHb0AAAAAAAAAADNJUj1xXUC5GPfcOoaGnDVC1xw7YD8BugAAgD8AAIA/AHyiPKIbsT/yuog+U4GBvptzhrtgGWY9AAAAAAAAAACzS5M9SJuRumVwNDgcWxwzrYBNupAPUbcAAIA/AAAAAObwoT3DKQO6H2WGOyRepjYny6U6mCahugAAgD8AAAAAM+mYvMN5fLpkFaE7NaFOOHpsarntIhe4AACAPwAAgD8zZPe8XI9zutIzhDkyxA81myttO3NKl7gAAIA/AACAPzPkmbwUXK66MJvpuND9JTarlgw4ro8EOAAAgD8AAIA/ZpqTOx41mT8yEbw8dBShvsB/hLxOfmK9AAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJmNJSJiIeUUpQoSwOMATyUTk5OSv////9K/////0sAdJRiSyBLCIaUjAFDlHSUUpQu"}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVkwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYgAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksghZSMAUOUdJRSlC4="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.015808000000000044, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVgRAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIlWOyuH+7bkCUhpRSlIwBbJRNnwGMAXSUR0CUU4bfP5YYdX2UKGgGaAloD0MIIm5OJYMiaECUhpRSlGgVTegDaBZHQJRT0ry1/lR1fZQoaAZoCWgPQwgGSgosAMBlQJSGlFKUaBVN6ANoFkdAlFiDlHSWq3V9lChoBmgJaA9DCO2fpwED7GZAlIaUUpRoFU3oA2gWR0CUWWO2RaHLdX2UKGgGaAloD0MI7X4V4Pt/cUCUhpRSlGgVTccBaBZHQJRdzthNM491fZQoaAZoCWgPQwinsFJBRWVjQJSGlFKUaBVN6ANoFkdAlF3f3ztkWnV9lChoBmgJaA9DCEMCRpc3RmJAlIaUUpRoFU3oA2gWR0CUXfEidJ8OdX2UKGgGaAloD0MIF9nO99OsZECUhpRSlGgVTegDaBZHQJReEEIPbwl1fZQoaAZoCWgPQwgK3LqbJ0NgQJSGlFKUaBVN6ANoFkdAlGEC/wiJO3V9lChoBmgJaA9DCATnjCjtHmdAlIaUUpRoFU3oA2gWR0CUYoD/lyR0dX2UKGgGaAloD0MIFJhO67YDaUCUhpRSlGgVTegDaBZHQJRi4jRlYlp1fZQoaAZoCWgPQwiDUrRyL9pnQJSGlFKUaBVN6ANoFkdAlGS9gfEGaHV9lChoBmgJaA9DCPje36A9R2RAlIaUUpRoFU3oA2gWR0CUafO3lS0jdX2UKGgGaAloD0MIQZ5dvnWabUCUhpRSlGgVTeABaBZHQJRrOU/wAlx1fZQoaAZoCWgPQwgHRIgrZ3hxQJSGlFKUaBVN6AJoFkdAlGzRq0tyxXV9lChoBmgJaA9DCEYL0LYaamNAlIaUUpRoFU3oA2gWR0CUbfgnMMZxdX2UKGgGaAloD0MIHGDmO3jlbkCUhpRSlGgVTVwBaBZHQJRuOYnfEXN1fZQoaAZoCWgPQwhwI2WLJCplQJSGlFKUaBVN6ANoFkdAlHFOOKfnOnV9lChoBmgJaA9DCF8oYDsYLWNAlIaUUpRoFU3oA2gWR0CUcV8WbgCPdX2UKGgGaAloD0MIGLDkKhYlZECUhpRSlGgVTegDaBZHQJRxb8m8dxR1fZQoaAZoCWgPQwgNi1HX2hBoQJSGlFKUaBVN6ANoFkdAlHLCm/FirnV9lChoBmgJaA9DCFEU6BN5g2dAlIaUUpRoFU3oA2gWR0CUd17EHdGidX2UKGgGaAloD0MI0NIVbKNdcUCUhpRSlGgVTWkBaBZHQJSoaJcgQpZ1fZQoaAZoCWgPQwg1ejVA6bdkQJSGlFKUaBVN6ANoFkdAlKhqJQ+EAnV9lChoBmgJaA9DCDVAaagRlXJAlIaUUpRoFU3OAmgWR0CUqTd4FA3UdX2UKGgGaAloD0MIzNQkeAMKcUCUhpRSlGgVTaoDaBZHQJSresQumJp1fZQoaAZoCWgPQwgDQBU37lRhQJSGlFKUaBVN6ANoFkdAlKt71/Ue+3V9lChoBmgJaA9DCHWRQll4bmFAlIaUUpRoFU3oA2gWR0CUq3zS1E3LdX2UKGgGaAloD0MIqmOV0rNhY0CUhpRSlGgVTegDaBZHQJSrjKJVKf51fZQoaAZoCWgPQwilZ3qJsRxhQJSGlFKUaBVN6ANoFkdAlLB5PVNHpnV9lChoBmgJaA9DCN1ELc3tGHBAlIaUUpRoFU22AWgWR0CUs+N+so2GdX2UKGgGaAloD0MIyVaXU4JhcECUhpRSlGgVTasBaBZHQJS0bopx3mp1fZQoaAZoCWgPQwiYMQVr3LhyQJSGlFKUaBVNhAJoFkdAlLRwZGax5nV9lChoBmgJaA9DCB6lEp7QfmBAlIaUUpRoFU3oA2gWR0CUtkEy+HrRdX2UKGgGaAloD0MIiUFg5dAbaECUhpRSlGgVTegDaBZHQJS2yxkd3jd1fZQoaAZoCWgPQwg0uoPYmUtzQJSGlFKUaBVNCAFoFkdAlLfNg0CRwXV9lChoBmgJaA9DCAG9cOcCgnBAlIaUUpRoFU2JAWgWR0CUuEYcebNKdX2UKGgGaAloD0MIsoLfhhhoYUCUhpRSlGgVTegDaBZHQJS4zJGOMl11fZQoaAZoCWgPQwibyMwFLtRsQJSGlFKUaBVNdgNoFkdAlLjbiADq4nV9lChoBmgJaA9DCJpd91ZkU3BAlIaUUpRoFU3vAmgWR0CUusCrcTJydX2UKGgGaAloD0MINWH7yRgxYkCUhpRSlGgVTegDaBZHQJS85foicG11fZQoaAZoCWgPQwjUu3g/bpVvQJSGlFKUaBVNAgNoFkdAlL72OEM9bHV9lChoBmgJaA9DCPaaHhSUZWdAlIaUUpRoFU3oA2gWR0CUv/HVf/m1dX2UKGgGaAloD0MIuyh64GMxY0CUhpRSlGgVTegDaBZHQJTF5vddmg91fZQoaAZoCWgPQwgrFr8p7ARxQJSGlFKUaBVN1AFoFkdAlMfXAZbY9XV9lChoBmgJaA9DCNp1b0Viq1hAlIaUUpRoFU3oA2gWR0CUyrLs8gZCdX2UKGgGaAloD0MIMV2I1R9AZ0CUhpRSlGgVTegDaBZHQJTK08W9DhN1fZQoaAZoCWgPQwivzjEg+2pxQJSGlFKUaBVNSgFoFkdAlMyc5CF9KHV9lChoBmgJaA9DCG+70FwnFHFAlIaUUpRoFU27A2gWR0CUzP+cH4XXdX2UKGgGaAloD0MIol2FlF/ucECUhpRSlGgVTcgCaBZHQJTN4vg3tKJ1fZQoaAZoCWgPQwjnGJC93rlxQJSGlFKUaBVNUQFoFkdAlM4iWu5jIHV9lChoBmgJaA9DCAD+KVWiyWZAlIaUUpRoFU3oA2gWR0CU0ZuJ1q33dX2UKGgGaAloD0MI+3WnO8/1cUCUhpRSlGgVTdkBaBZHQJTR2fChvit1fZQoaAZoCWgPQwhfXKrSFtJxQJSGlFKUaBVN1gJoFkdAlNSIvrWy1XV9lChoBmgJaA9DCOavkLkyhHBAlIaUUpRoFU21AmgWR0CU1b4qwyIpdX2UKGgGaAloD0MIlwM91DZQY0CUhpRSlGgVTegDaBZHQJTZA90Rvm51fZQoaAZoCWgPQwh5Iojz8PVoQJSGlFKUaBVN6ANoFkdAlNoJyMkyDnV9lChoBmgJaA9DCJT3cTTHF2FAlIaUUpRoFU3oA2gWR0CU2kOtW+49dX2UKGgGaAloD0MINE3YfrIyY0CUhpRSlGgVTegDaBZHQJTdHCTEBKd1fZQoaAZoCWgPQwgEHhhA+NpgQJSGlFKUaBVN6ANoFkdAlN0sURFqjHV9lChoBmgJaA9DCNDv+zdvDnBAlIaUUpRoFU2aA2gWR0CU4Gz7/GVBdX2UKGgGaAloD0MIWrxYGKLwZUCUhpRSlGgVTegDaBZHQJTi9RFZxJd1fZQoaAZoCWgPQwhIN8KiIklhQJSGlFKUaBVN6ANoFkdAlOd+KoAGS3V9lChoBmgJaA9DCJZdMLjml2VAlIaUUpRoFU3oA2gWR0CU548274BWdX2UKGgGaAloD0MIMV7zqs7Vb0CUhpRSlGgVTcYDaBZHQJTqu/KyOaR1fZQoaAZoCWgPQwipvYi2YxBwQJSGlFKUaBVNYwNoFkdAlOso150KZ3V9lChoBmgJaA9DCNxkVBlGy25AlIaUUpRoFU3RAmgWR0CU66DtPYWddX2UKGgGaAloD0MI8DZvnBTrYkCUhpRSlGgVTegDaBZHQJTwG8kD6nB1fZQoaAZoCWgPQwieQUP/hBlmQJSGlFKUaBVN6ANoFkdAlPCjqW1MNHV9lChoBmgJaA9DCKBTkJ+NjW9AlIaUUpRoFU2+AmgWR0CU8aJvo/zKdX2UKGgGaAloD0MIh/2eWKfJZECUhpRSlGgVTegDaBZHQJTyb5O8Cgd1fZQoaAZoCWgPQwgpWrkXGIFtQJSGlFKUaBVNtAFoFkdAlPKcyFfzBnV9lChoBmgJaA9DCIyDS8cctWRAlIaUUpRoFU3oA2gWR0CU9Fhb4agmdX2UKGgGaAloD0MIODEkJxNzY0CUhpRSlGgVTegDaBZHQJT06LNwBHV1fZQoaAZoCWgPQwhsy4CzlBNvQJSGlFKUaBVNqwFoFkdAlPYzAeq7y3V9lChoBmgJaA9DCBWL3xTW8WdAlIaUUpRoFU3oA2gWR0CU9sI5YHPedX2UKGgGaAloD0MIflLt03EfaECUhpRSlGgVTegDaBZHQJT4xPfsNUh1fZQoaAZoCWgPQwjZBu5A3bZwQJSGlFKUaBVN6gJoFkdAlPl/XPJJXnV9lChoBmgJaA9DCKEQAYdQcGVAlIaUUpRoFU3oA2gWR0CU+qPbO/tZdX2UKGgGaAloD0MI9HAC02kKaECUhpRSlGgVTegDaBZHQJUA6hxo7FN1fZQoaAZoCWgPQwg9YvTcQmBuQJSGlFKUaBVNxQFoFkdAlQHGWIGhVXV9lChoBmgJaA9DCCBGCI92hHFAlIaUUpRoFU23A2gWR0CVAm7/n4fwdX2UKGgGaAloD0MIyeU/pJ9ycECUhpRSlGgVTUYBaBZHQJUDTsD4gzR1fZQoaAZoCWgPQwgtX5fhPwdoQJSGlFKUaBVN6ANoFkdAlQUtgWrOq3V9lChoBmgJaA9DCNY6cTleiGFAlIaUUpRoFU3oA2gWR0CVBulfJFLGdX2UKGgGaAloD0MIuHNhpBdNZ0CUhpRSlGgVTegDaBZHQJUHRON5t3x1fZQoaAZoCWgPQwipoKLqV3NoQJSGlFKUaBVN6ANoFkdAlQgZA+pwTHV9lChoBmgJaA9DCK6gaYnVD3BAlIaUUpRoFU0HAmgWR0CVCa2fkFOgdX2UKGgGaAloD0MIFkuRfCUKWkCUhpRSlGgVTegDaBZHQJULum3vx6R1fZQoaAZoCWgPQwhM4UGz64hkQJSGlFKUaBVN6ANoFkdAlQv44hllLHV9lChoBmgJaA9DCNfbZipEA3FAlIaUUpRoFU1tA2gWR0CVDVplSS/1dX2UKGgGaAloD0MIo3iVtc2dYUCUhpRSlGgVTegDaBZHQJUOoNI9TxZ1fZQoaAZoCWgPQwi0W8tkOKxoQJSGlFKUaBVN6ANoFkdAlQ/aEWZZ0XV9lChoBmgJaA9DCHV1x2Ib7GRAlIaUUpRoFU3oA2gWR0CVFHCPp6hQdX2UKGgGaAloD0MIpS4Zx8iaZECUhpRSlGgVTegDaBZHQJUXzFQ2uPp1fZQoaAZoCWgPQwgzp8ti4vRwQJSGlFKUaBVN/QJoFkdAlRfsOskpqnV9lChoBmgJaA9DCPevrDQpd2dAlIaUUpRoFU3oA2gWR0CVG4KpkwvhdX2UKGgGaAloD0MIGAXB41srYkCUhpRSlGgVTegDaBZHQJUeRiKBNEh1fZQoaAZoCWgPQwiHhzB+Gl5zQJSGlFKUaBVNFANoFkdAlSBtw71ZknV9lChoBmgJaA9DCN46/3bZ4W9AlIaUUpRoFU3SAWgWR0CVIabWVeKLdWUu"}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 186, "n_steps": 2048, "gamma": 0.999, "gae_lambda": 0.98, "ent_coef": 0.01, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 128, "n_epochs": 6, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWVfgIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwNX2J1aWx0aW5fdHlwZZSTlIwKTGFtYmRhVHlwZZSFlFKUKGgCjAhDb2RlVHlwZZSFlFKUKEsBSwBLAEsBSwFLE0MEiABTAJROhZQpjAFflIWUjE4vaG9tZS9ua3QvLmxvY2FsL2xpYi9weXRob24zLjgvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuAQwIAAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UaA11Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoF2gOjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoGIwHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/yZmZmZmZmoWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "system_info": {"OS": "Linux-5.4.0-109-generic-x86_64-with-glibc2.29 #123-Ubuntu SMP Fri Apr 8 09:10:54 UTC 2022", "Python": "3.8.10", "Stable-Baselines3": "1.5.0", "PyTorch": "1.11.0+cu113", "GPU Enabled": "True", "Numpy": "1.21.2", "Gym": "0.21.0"}}
nkt32/PPO-LunarLander-v2-T2.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bc68009f3ebb60f11aefe2c91fb380fb1499db28948b1c70a0a2c646d2d5dc02
3
- size 144617
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5ecb9dd220062c045cbc8c764bea7a7ef74bd2adda5179c880551a9abf7be533
3
+ size 144654
nkt32/PPO-LunarLander-v2-T2/data CHANGED
@@ -4,19 +4,19 @@
4
  ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
5
  "__module__": "stable_baselines3.common.policies",
6
  "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param sde_net_arch: Network architecture for extracting features\n when using gSDE. If None, the latent features from the policy will be used.\n Pass an empty list to use the states as features.\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
7
- "__init__": "<function ActorCriticPolicy.__init__ at 0x7f4977a5ce50>",
8
- "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f4977a5cee0>",
9
- "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f4977a5cf70>",
10
- "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f4977a5b040>",
11
- "_build": "<function ActorCriticPolicy._build at 0x7f4977a5b0d0>",
12
- "forward": "<function ActorCriticPolicy.forward at 0x7f4977a5b160>",
13
- "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f4977a5b1f0>",
14
- "_predict": "<function ActorCriticPolicy._predict at 0x7f4977a5b280>",
15
- "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f4977a5b310>",
16
- "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f4977a5b3a0>",
17
- "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f4977a5b430>",
18
  "__abstractmethods__": "frozenset()",
19
- "_abc_impl": "<_abc_data object at 0x7f49779df0f0>"
20
  },
21
  "verbose": 1,
22
  "policy_kwargs": {},
@@ -47,7 +47,7 @@
47
  "_num_timesteps_at_start": 0,
48
  "seed": null,
49
  "action_noise": null,
50
- "start_time": 1652215080.7988598,
51
  "learning_rate": 0.0003,
52
  "tensorboard_log": null,
53
  "lr_schedule": {
@@ -56,7 +56,7 @@
56
  },
57
  "_last_obs": {
58
  ":type:": "<class 'numpy.ndarray'>",
59
- ":serialized:": "gAWVdQQAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYABAAAAAAAALNueb5AvEw/8kAKvm+xyb4cYIO+veWnPQAAAAAAAAAAzf4fvODZtD/TcEK+o3QRvTc8N7pCAca8AAAAAAAAAABm/5e9XMNmuua+RzxzPSY8dHq7uhEZPDwAAAAAAACAP4Atfz6GtxI/HWKVvlINqr5TKrg9+oLjvQAAAAAAAAAA87oZvi6uhz51THA8Ib54vp28mL1gWhk7AAAAAAAAAABmlU093ZSVPy+zvj3B9Oa+o4abPaM20jwAAAAAAAAAAJocNT3Gzqo/+pPoPjWt976j6kg8BnYuPgAAAAAAAAAAZijTPFxfCrwx88S8fNLqPEfIYj3Wc7+9AACAPwAAgD9NUEA+noPAPssRRr4aDZm+nfgnPfHbE70AAAAAAAAAACO6er535iK9ynNPNluyK7TR9ow+nouHtQAAgD8AAIA/zQoSvOwQoj9P7iS9Cn/uvsM6Gr31QU68AAAAAAAAAAAAp0i9v5PlPlFfJ74oTYa+ieiZvd63jr0AAAAAAAAAAACO0LwP/D49gFhyPVo/Rb7gzHU4mLLpuwAAAAAAAAAA0zSUPrHlTT+usaU+a+LQvv121z4csL49AAAAAAAAAADAw4+9dtpcP7ZIO70rTue+6lG9vaKqSDsAAAAAAAAAAJrO4L2rrRI/2jacPKoulb5NGBq9EKV7vQAAAAAAAAAABkeCvg/WKj+6Lh89pe3UvuHfPr6amec9AAAAAAAAAAAzc94511MxuzYT3zv/CoM8aSszvHILYz0AAIA/AACAP1r/ij5aaxc/kqJCvu6xor7M5N09Qyr6vQAAAAAAAAAAzQCaPK7Jnrodjd006YCZL/rIITpR/SS0AACAPwAAgD9mYrq8KQh1ul38KLSsip6v5eLvOObiqjMAAIA/AACAP9oyy73ETJc/Hm0wvsHU7b4BNQ++VTYEvQAAAAAAAAAA5hthvejgcD91rsO9z0LJvn0olL1DSgA9AAAAAAAAAAAA7kW+FEOIvIXk5LsctCS6ff7pPYUQBDsAAIA/AACAP5phMjvv5O4+9w8pvOo8ob5RmJc8/gW7uwAAAAAAAAAAzVJUPJtQKj8y0iC+grXRvqCs/byVviW9AAAAAAAAAACalb87PFARPXMq/jywQ3C+FeqMvP7hHL0AAAAAAAAAAJp5KjopxAG6y91Mtrw9XDB6PyK7RRZ4NQAAgD8AAIA/AEeJvVxLTrrDQNQ6cXOINXr8QToWZ/q5AACAPwAAgD/N+5u8rqOUuvpOqL01jD2+09ltvEJ3wT4AAIA/AAAAABr9XD0lwXk+iQ25vb3wlr6kpAq9wvaCvQAAAAAAAAAAxjoKPoElcT+We96902rdvj4Z9j314ae9AAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJmNJSJiIeUUpQoSwOMATyUTk5OSv////9K/////0sAdJRiSyBLCIaUjAFDlHSUUpQu"
60
  },
61
  "_last_episode_starts": {
62
  ":type:": "<class 'numpy.ndarray'>",
@@ -69,21 +69,21 @@
69
  "_current_progress_remaining": -0.015808000000000044,
70
  "ep_info_buffer": {
71
  ":type:": "<class 'collections.deque'>",
72
- ":serialized:": "gAWVZhAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIBcHj2zujcECUhpRSlIwBbJRNBQGMAXSUR0CWstFxGUfQdX2UKGgGaAloD0MIsd8T61TKckCUhpRSlGgVTRIBaBZHQJayzOcDr7h1fZQoaAZoCWgPQwi0BBkB1adxQJSGlFKUaBVL9WgWR0CWsswtrbg1dX2UKGgGaAloD0MI5GVNLPAIcUCUhpRSlGgVS/FoFkdAlrLTm8ujAXV9lChoBmgJaA9DCInsgyzLknFAlIaUUpRoFUv4aBZHQJay+FfzBhx1fZQoaAZoCWgPQwiKx0W1iLJtQJSGlFKUaBVNBAFoFkdAlrNTSG8Em3V9lChoBmgJaA9DCECmtWksV3FAlIaUUpRoFU0zAWgWR0CWs26STyJ9dX2UKGgGaAloD0MIOV6B6Mk+c0CUhpRSlGgVS/FoFkdAlrP4O6NEPXV9lChoBmgJaA9DCE7RkVx+vm5AlIaUUpRoFUvwaBZHQJa1EPWhAW11fZQoaAZoCWgPQwhbCd0lsXxwQJSGlFKUaBVNDwFoFkdAlrUy5I6KcnV9lChoBmgJaA9DCM8SZASUsXFAlIaUUpRoFU0lAWgWR0CWtVJ7b+LndX2UKGgGaAloD0MI2T7kLdcwcUCUhpRSlGgVTTQBaBZHQJa1V9v0h/11fZQoaAZoCWgPQwgudZDXg2xyQJSGlFKUaBVNBwFoFkdAlrY2CiAUcnV9lChoBmgJaA9DCOfib3vC6HFAlIaUUpRoFUv3aBZHQJa2NDNQj2V1fZQoaAZoCWgPQwjaU3JOrG9xQJSGlFKUaBVNIQFoFkdAlraR6By0bHV9lChoBmgJaA9DCJVE9kEWX25AlIaUUpRoFUvyaBZHQJa2oyBTXJ51fZQoaAZoCWgPQwhVoBaDh8htQJSGlFKUaBVNFQFoFkdAlrbETHsC1nV9lChoBmgJaA9DCL5qZcIvsHBAlIaUUpRoFU0tAWgWR0CWtvNmDlHSdX2UKGgGaAloD0MIQ3QIHMmscUCUhpRSlGgVTQEBaBZHQJa2/K1XvH91fZQoaAZoCWgPQwgRcAhVqq1yQJSGlFKUaBVNHAFoFkdAlrcn3cpLEnV9lChoBmgJaA9DCB0B3Cze8nJAlIaUUpRoFU0KAWgWR0CWt+3SKFZgdX2UKGgGaAloD0MIKV36l6QMcUCUhpRSlGgVTQABaBZHQJa3+qS5iEx1fZQoaAZoCWgPQwicTrLVJTNyQJSGlFKUaBVNGwFoFkdAlrjTkZJkG3V9lChoBmgJaA9DCCDsFKsGgXJAlIaUUpRoFU0HAWgWR0CWuPBYFJQMdX2UKGgGaAloD0MIy9k7oy1OcECUhpRSlGgVTRQBaBZHQJa5MBcRlH11fZQoaAZoCWgPQwgUBmUazfBxQJSGlFKUaBVNMgFoFkdAlrlPhddE9nV9lChoBmgJaA9DCMOC+wFPfnNAlIaUUpRoFU0MAWgWR0CWuV4u9OARdX2UKGgGaAloD0MINq/qrNbZcUCUhpRSlGgVTRwBaBZHQJa5dMbm2b51fZQoaAZoCWgPQwjs2t5uSWtxQJSGlFKUaBVL62gWR0CWucd/axoqdX2UKGgGaAloD0MIbAVNS2wqc0CUhpRSlGgVTRQBaBZHQJa52tga3ql1fZQoaAZoCWgPQwgfaAWGbENyQJSGlFKUaBVL+WgWR0CWulbKRuCPdX2UKGgGaAloD0MIUn5S7VOycECUhpRSlGgVTQUBaBZHQJa6rJcPe551fZQoaAZoCWgPQwh47dKGw1NyQJSGlFKUaBVNHAFoFkdAlrtujIq9XnV9lChoBmgJaA9DCO9YbJMKHW5AlIaUUpRoFU0nAWgWR0CWu48rI5o5dX2UKGgGaAloD0MIJXUCmoj8b0CUhpRSlGgVTScBaBZHQJa7yGfwqiJ1fZQoaAZoCWgPQwjRArSt5rtuQJSGlFKUaBVNEAFoFkdAlrvQEpy6tnV9lChoBmgJaA9DCNXrFoFxU3BAlIaUUpRoFU0FAWgWR0CWvBm03Ov/dX2UKGgGaAloD0MInbryWd6fcECUhpRSlGgVTS0BaBZHQJa8LJDE3sJ1fZQoaAZoCWgPQwg74SU4NQdyQJSGlFKUaBVL62gWR0CWvKU+LWI5dX2UKGgGaAloD0MIXvOqzqo7cUCUhpRSlGgVS/ZoFkdAlrzfI8yN43V9lChoBmgJaA9DCGtj7IQXb3JAlIaUUpRoFU0/AWgWR0CWvSjiGWUsdX2UKGgGaAloD0MIn1p9ddUkbUCUhpRSlGgVTQ4BaBZHQJa9fEpAlfJ1fZQoaAZoCWgPQwjY8sr1dkhxQJSGlFKUaBVL7mgWR0CWve0zCUHIdX2UKGgGaAloD0MIMT83NGU3cECUhpRSlGgVTRcBaBZHQJa+Bn003wV1fZQoaAZoCWgPQwgtQxzr4s1wQJSGlFKUaBVL7WgWR0CWvhWHDaXbdX2UKGgGaAloD0MIxqUqbTERcECUhpRSlGgVS/hoFkdAlr5KbSZ0CHV9lChoBmgJaA9DCMVwdQDEWXFAlIaUUpRoFU0MAWgWR0CWvn5vtMPCdX2UKGgGaAloD0MIOJ86VqmmcUCUhpRSlGgVTR0BaBZHQJa/AZOzpot1fZQoaAZoCWgPQwhJ88e09slyQJSGlFKUaBVNDAFoFkdAlr9kYsNDt3V9lChoBmgJaA9DCPUu3o+bI3FAlIaUUpRoFU0XAWgWR0CWv469TP0JdX2UKGgGaAloD0MIqFFIMqsTQ0CUhpRSlGgVS8BoFkdAlsCxUedTYXV9lChoBmgJaA9DCET5ghaSA3NAlIaUUpRoFU08AWgWR0CWwLrPdEb6dX2UKGgGaAloD0MI16GakqzEbUCUhpRSlGgVTQABaBZHQJbA4E9t/F11fZQoaAZoCWgPQwiVtU3xuM5wQJSGlFKUaBVL9mgWR0CWwPzmfXf7dX2UKGgGaAloD0MIPN154nmocUCUhpRSlGgVTSUBaBZHQJbBDfbblBB1fZQoaAZoCWgPQwjT+lsCcBVyQJSGlFKUaBVNKAFoFkdAlsExmTTvzHV9lChoBmgJaA9DCAnf+xs0OXFAlIaUUpRoFUv5aBZHQJbBmYRdyDJ1fZQoaAZoCWgPQwjsvmN4bAdyQJSGlFKUaBVNBAFoFkdAlsHbg0j1PHV9lChoBmgJaA9DCI51cRvNV3BAlIaUUpRoFU0iAWgWR0CWwitIClrNdX2UKGgGaAloD0MIr0LKT2qmcUCUhpRSlGgVTT0BaBZHQJbCrLyMDOl1fZQoaAZoCWgPQwiCjla1ZLdwQJSGlFKUaBVNGAFoFkdAlsMkRaouPHV9lChoBmgJaA9DCK4NFeN8yHFAlIaUUpRoFUv3aBZHQJbDMnYxtYV1fZQoaAZoCWgPQwjaklURLvpwQJSGlFKUaBVL7GgWR0CWwzY5T6zmdX2UKGgGaAloD0MIXHFxVK4xcECUhpRSlGgVTUUBaBZHQJbDb6wdKdx1fZQoaAZoCWgPQwhaKQRySXJxQJSGlFKUaBVNCAFoFkdAlsPZNTLntHV9lChoBmgJaA9DCGA7GLFPgC9AlIaUUpRoFUuRaBZHQJbEBVQyhzx1fZQoaAZoCWgPQwjI0LGDildwQJSGlFKUaBVNDAFoFkdAlsQu6unuRnV9lChoBmgJaA9DCMfZdAQwfHFAlIaUUpRoFU0SAWgWR0CWxMDRtxdZdX2UKGgGaAloD0MIY7fPKvMOcUCUhpRSlGgVTRYBaBZHQJbEz2/SH/N1fZQoaAZoCWgPQwjTM73EWKBsQJSGlFKUaBVNCQFoFkdAlsTzHwPRRnV9lChoBmgJaA9DCIIDWrrCxHJAlIaUUpRoFUvvaBZHQJbE/RzBAOd1fZQoaAZoCWgPQwj8Gd6sQU1wQJSGlFKUaBVNCgFoFkdAlsV3BxgiNnV9lChoBmgJaA9DCCRkIM/uJ3FAlIaUUpRoFU0YAWgWR0CWxZrq+rU9dX2UKGgGaAloD0MIbt3NU52Fb0CUhpRSlGgVS/VoFkdAlsXwmiQDFXV9lChoBmgJaA9DCLlTOlg/KnFAlIaUUpRoFU0IAWgWR0CWxia1kUbldX2UKGgGaAloD0MI3LdaJy5LRUCUhpRSlGgVS69oFkdAlsYnlOoHcHV9lChoBmgJaA9DCK+XpgiwznFAlIaUUpRoFUvvaBZHQJbHCa1Cw8p1fZQoaAZoCWgPQwgewCK//nxxQJSGlFKUaBVNAwFoFkdAlsccDOkcj3V9lChoBmgJaA9DCKSJd4DnTnJAlIaUUpRoFU0uAWgWR0CWx3jNIK+jdX2UKGgGaAloD0MIdCmuKjtxckCUhpRSlGgVTScBaBZHQJbHse7tiQV1fZQoaAZoCWgPQwgEdjV5CmRyQJSGlFKUaBVL62gWR0CWyEr/bTMJdX2UKGgGaAloD0MIIlD9gwiFcUCUhpRSlGgVTQkBaBZHQJbJKXa8HwB1fZQoaAZoCWgPQwgh5SfVfn5yQJSGlFKUaBVNJwFoFkdAlsoShJyyU3V9lChoBmgJaA9DCHfWbrtQ/HFAlIaUUpRoFUv7aBZHQJbKJl6JIlN1fZQoaAZoCWgPQwhl3qrrEGNyQJSGlFKUaBVNgAFoFkdAlsol0knkUHV9lChoBmgJaA9DCGIRww4jUnFAlIaUUpRoFU0IAWgWR0CWykGPPszEdX2UKGgGaAloD0MIotXJGcoxc0CUhpRSlGgVTSQBaBZHQJbKT8ZUDMh1fZQoaAZoCWgPQwjoE3mS9PFwQJSGlFKUaBVNFgFoFkdAlspwSnLq2XV9lChoBmgJaA9DCGe3lsmwd3JAlIaUUpRoFU0mAWgWR0CWyoS0BwMqdX2UKGgGaAloD0MIecpqup6lc0CUhpRSlGgVTQsBaBZHQJbLJM6BAfN1fZQoaAZoCWgPQwg51VqYBS5vQJSGlFKUaBVNBwFoFkdAlst40dilSHV9lChoBmgJaA9DCBr8/WL2p3JAlIaUUpRoFU0LAWgWR0CWy6gsK9f1dX2UKGgGaAloD0MIwXRatwGOckCUhpRSlGgVTQgBaBZHQJbLzpQk5ZN1fZQoaAZoCWgPQwhZiA6BY4dwQJSGlFKUaBVNEQFoFkdAlsvefdyksXV9lChoBmgJaA9DCGiXb31YAnBAlIaUUpRoFUv4aBZHQJbMD3SKFZh1fZQoaAZoCWgPQwi6S+KsCNRuQJSGlFKUaBVNAgFoFkdAlsw03S8aoHV9lChoBmgJaA9DCMSZX82B43BAlIaUUpRoFU0WAWgWR0CWzKT72tdSdX2UKGgGaAloD0MIkuo7v+iZcECUhpRSlGgVTQoBaBZHQJbNLUYsNDt1fZQoaAZoCWgPQwgGZ/D3S5pyQJSGlFKUaBVNDAFoFkdAls1yQkona3V9lChoBmgJaA9DCBhEpKZd/nBAlIaUUpRoFU0PAWgWR0CWzZUz9CNTdWUu"
73
  },
74
  "ep_success_buffer": {
75
  ":type:": "<class 'collections.deque'>",
76
  ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
77
  },
78
- "_n_updates": 248,
79
- "n_steps": 1024,
80
  "gamma": 0.999,
81
  "gae_lambda": 0.98,
82
  "ent_coef": 0.01,
83
  "vf_coef": 0.5,
84
  "max_grad_norm": 0.5,
85
- "batch_size": 64,
86
- "n_epochs": 4,
87
  "clip_range": {
88
  ":type:": "<class 'function'>",
89
  ":serialized:": "gAWVfgIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwNX2J1aWx0aW5fdHlwZZSTlIwKTGFtYmRhVHlwZZSFlFKUKGgCjAhDb2RlVHlwZZSFlFKUKEsBSwBLAEsBSwFLE0MEiABTAJROhZQpjAFflIWUjE4vaG9tZS9ua3QvLmxvY2FsL2xpYi9weXRob24zLjgvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuAQwIAAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UaA11Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoF2gOjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoGIwHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/yZmZmZmZmoWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="
4
  ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
5
  "__module__": "stable_baselines3.common.policies",
6
  "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param sde_net_arch: Network architecture for extracting features\n when using gSDE. If None, the latent features from the policy will be used.\n Pass an empty list to use the states as features.\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
7
+ "__init__": "<function ActorCriticPolicy.__init__ at 0x7f4996344c10>",
8
+ "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f4996344ca0>",
9
+ "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f4996344d30>",
10
+ "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f4996344dc0>",
11
+ "_build": "<function ActorCriticPolicy._build at 0x7f4996344e50>",
12
+ "forward": "<function ActorCriticPolicy.forward at 0x7f4996344ee0>",
13
+ "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f4996344f70>",
14
+ "_predict": "<function ActorCriticPolicy._predict at 0x7f49962c7040>",
15
+ "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f49962c70d0>",
16
+ "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f49962c7160>",
17
+ "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f49962c71f0>",
18
  "__abstractmethods__": "frozenset()",
19
+ "_abc_impl": "<_abc_data object at 0x7f4996336f90>"
20
  },
21
  "verbose": 1,
22
  "policy_kwargs": {},
47
  "_num_timesteps_at_start": 0,
48
  "seed": null,
49
  "action_noise": null,
50
+ "start_time": 1652216888.4359014,
51
  "learning_rate": 0.0003,
52
  "tensorboard_log": null,
53
  "lr_schedule": {
56
  },
57
  "_last_obs": {
58
  ":type:": "<class 'numpy.ndarray'>",
59
+ ":serialized:": "gAWVdQQAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYABAAAAAAAALO5rz2PZlW6wHd0uje8b7WScMY6cBuOOQAAgD8AAIA/mtQxPR+dmbmKAV26tvscvXohR7smGT29AAAAAAAAAABm9tW6XPNjuh1hGLokqAm1NSdeOjD0MjkAAIA/AACAP5ot8rx5TG8+zsQyu8CDl77VMM68NfRVPQAAAAAAAAAAZt4xPK7dkLrO2CK6ZJhHNd/9zLobNTk5AACAPwAAgD+zQS499uwZuptFcrkJf/Gz6aOYuWb5jDgAAIA/AACAPzMJ5rwppB66eqFzOrf6MDXBJPu6xdaQuQAAgD8AAIA/Gjk2vfboPrp7r+Y54tpZNdwW6DoPjwe5AACAPwAAgD8zk3E7hcOrueTfpDtDSf03vZ6kumAPg7UAAIA/AACAPzNgLD1y35o/FmP2PaCo6L66/lU8H2oFPAAAAAAAAAAAM0j6vI++crq+3NW3Nhwhs5S2YjpWpPc2AACAPwAAgD8AIQQ9cdQgu3v2RD4lIJ88SrlOvApbiD0AAIA/AACAPzMD5ropYEq64wlgumY7Krar8GU6/JCDOQAAgD8AAIA/zajrvMOpHLptYY27EAqPOBPhvLrYJwY6AACAPwAAgD9myt48KXgyuqXx6bnmePC04jDEOQDaBTkAAIA/AACAPwAHgb2Fi5W54ibfunPuCjV5RHy78aIEOgAAgD8AAIA/zSQhO0iVoLqKRhK6IJIgurlag7sW1p86AACAPwAAgD/NVJc9PRooud61hLqNA0CzdacmOpC4ADMAAIA/AACAP2aylztcAy26MrMbOrwcADVfQFM7f002uQAAgD8AAIA/AFlkPY+eZboIuw84rv1qtvnmLrpS5By3AAAAAAAAgD/mSDE9XCNJuhKlmrXzl8iwEjoLOR/urDQAAIA/AACAPw0EB7640yw/WpfPPYGsrL4G/J68spQGvQAAAAAAAAAAbRRMvgEJtrzmR8W7cqA1unCcHT6EZQ47AACAPwAAgD/myEu9HqeDPtghXT3E8XW+oCxKPD5kHb0AAAAAAAAAADNJUj1xXUC5GPfcOoaGnDVC1xw7YD8BugAAgD8AAIA/AHyiPKIbsT/yuog+U4GBvptzhrtgGWY9AAAAAAAAAACzS5M9SJuRumVwNDgcWxwzrYBNupAPUbcAAIA/AAAAAObwoT3DKQO6H2WGOyRepjYny6U6mCahugAAgD8AAAAAM+mYvMN5fLpkFaE7NaFOOHpsarntIhe4AACAPwAAgD8zZPe8XI9zutIzhDkyxA81myttO3NKl7gAAIA/AACAPzPkmbwUXK66MJvpuND9JTarlgw4ro8EOAAAgD8AAIA/ZpqTOx41mT8yEbw8dBShvsB/hLxOfmK9AAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJmNJSJiIeUUpQoSwOMATyUTk5OSv////9K/////0sAdJRiSyBLCIaUjAFDlHSUUpQu"
60
  },
61
  "_last_episode_starts": {
62
  ":type:": "<class 'numpy.ndarray'>",
69
  "_current_progress_remaining": -0.015808000000000044,
70
  "ep_info_buffer": {
71
  ":type:": "<class 'collections.deque'>",
72
+ ":serialized:": "gAWVgRAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIlWOyuH+7bkCUhpRSlIwBbJRNnwGMAXSUR0CUU4bfP5YYdX2UKGgGaAloD0MIIm5OJYMiaECUhpRSlGgVTegDaBZHQJRT0ry1/lR1fZQoaAZoCWgPQwgGSgosAMBlQJSGlFKUaBVN6ANoFkdAlFiDlHSWq3V9lChoBmgJaA9DCO2fpwED7GZAlIaUUpRoFU3oA2gWR0CUWWO2RaHLdX2UKGgGaAloD0MI7X4V4Pt/cUCUhpRSlGgVTccBaBZHQJRdzthNM491fZQoaAZoCWgPQwinsFJBRWVjQJSGlFKUaBVN6ANoFkdAlF3f3ztkWnV9lChoBmgJaA9DCEMCRpc3RmJAlIaUUpRoFU3oA2gWR0CUXfEidJ8OdX2UKGgGaAloD0MIF9nO99OsZECUhpRSlGgVTegDaBZHQJReEEIPbwl1fZQoaAZoCWgPQwgK3LqbJ0NgQJSGlFKUaBVN6ANoFkdAlGEC/wiJO3V9lChoBmgJaA9DCATnjCjtHmdAlIaUUpRoFU3oA2gWR0CUYoD/lyR0dX2UKGgGaAloD0MIFJhO67YDaUCUhpRSlGgVTegDaBZHQJRi4jRlYlp1fZQoaAZoCWgPQwiDUrRyL9pnQJSGlFKUaBVN6ANoFkdAlGS9gfEGaHV9lChoBmgJaA9DCPje36A9R2RAlIaUUpRoFU3oA2gWR0CUafO3lS0jdX2UKGgGaAloD0MIQZ5dvnWabUCUhpRSlGgVTeABaBZHQJRrOU/wAlx1fZQoaAZoCWgPQwgHRIgrZ3hxQJSGlFKUaBVN6AJoFkdAlGzRq0tyxXV9lChoBmgJaA9DCEYL0LYaamNAlIaUUpRoFU3oA2gWR0CUbfgnMMZxdX2UKGgGaAloD0MIHGDmO3jlbkCUhpRSlGgVTVwBaBZHQJRuOYnfEXN1fZQoaAZoCWgPQwhwI2WLJCplQJSGlFKUaBVN6ANoFkdAlHFOOKfnOnV9lChoBmgJaA9DCF8oYDsYLWNAlIaUUpRoFU3oA2gWR0CUcV8WbgCPdX2UKGgGaAloD0MIGLDkKhYlZECUhpRSlGgVTegDaBZHQJRxb8m8dxR1fZQoaAZoCWgPQwgNi1HX2hBoQJSGlFKUaBVN6ANoFkdAlHLCm/FirnV9lChoBmgJaA9DCFEU6BN5g2dAlIaUUpRoFU3oA2gWR0CUd17EHdGidX2UKGgGaAloD0MI0NIVbKNdcUCUhpRSlGgVTWkBaBZHQJSoaJcgQpZ1fZQoaAZoCWgPQwg1ejVA6bdkQJSGlFKUaBVN6ANoFkdAlKhqJQ+EAnV9lChoBmgJaA9DCDVAaagRlXJAlIaUUpRoFU3OAmgWR0CUqTd4FA3UdX2UKGgGaAloD0MIzNQkeAMKcUCUhpRSlGgVTaoDaBZHQJSresQumJp1fZQoaAZoCWgPQwgDQBU37lRhQJSGlFKUaBVN6ANoFkdAlKt71/Ue+3V9lChoBmgJaA9DCHWRQll4bmFAlIaUUpRoFU3oA2gWR0CUq3zS1E3LdX2UKGgGaAloD0MIqmOV0rNhY0CUhpRSlGgVTegDaBZHQJSrjKJVKf51fZQoaAZoCWgPQwilZ3qJsRxhQJSGlFKUaBVN6ANoFkdAlLB5PVNHpnV9lChoBmgJaA9DCN1ELc3tGHBAlIaUUpRoFU22AWgWR0CUs+N+so2GdX2UKGgGaAloD0MIyVaXU4JhcECUhpRSlGgVTasBaBZHQJS0bopx3mp1fZQoaAZoCWgPQwiYMQVr3LhyQJSGlFKUaBVNhAJoFkdAlLRwZGax5nV9lChoBmgJaA9DCB6lEp7QfmBAlIaUUpRoFU3oA2gWR0CUtkEy+HrRdX2UKGgGaAloD0MIiUFg5dAbaECUhpRSlGgVTegDaBZHQJS2yxkd3jd1fZQoaAZoCWgPQwg0uoPYmUtzQJSGlFKUaBVNCAFoFkdAlLfNg0CRwXV9lChoBmgJaA9DCAG9cOcCgnBAlIaUUpRoFU2JAWgWR0CUuEYcebNKdX2UKGgGaAloD0MIsoLfhhhoYUCUhpRSlGgVTegDaBZHQJS4zJGOMl11fZQoaAZoCWgPQwibyMwFLtRsQJSGlFKUaBVNdgNoFkdAlLjbiADq4nV9lChoBmgJaA9DCJpd91ZkU3BAlIaUUpRoFU3vAmgWR0CUusCrcTJydX2UKGgGaAloD0MINWH7yRgxYkCUhpRSlGgVTegDaBZHQJS85foicG11fZQoaAZoCWgPQwjUu3g/bpVvQJSGlFKUaBVNAgNoFkdAlL72OEM9bHV9lChoBmgJaA9DCPaaHhSUZWdAlIaUUpRoFU3oA2gWR0CUv/HVf/m1dX2UKGgGaAloD0MIuyh64GMxY0CUhpRSlGgVTegDaBZHQJTF5vddmg91fZQoaAZoCWgPQwgrFr8p7ARxQJSGlFKUaBVN1AFoFkdAlMfXAZbY9XV9lChoBmgJaA9DCNp1b0Viq1hAlIaUUpRoFU3oA2gWR0CUyrLs8gZCdX2UKGgGaAloD0MIMV2I1R9AZ0CUhpRSlGgVTegDaBZHQJTK08W9DhN1fZQoaAZoCWgPQwivzjEg+2pxQJSGlFKUaBVNSgFoFkdAlMyc5CF9KHV9lChoBmgJaA9DCG+70FwnFHFAlIaUUpRoFU27A2gWR0CUzP+cH4XXdX2UKGgGaAloD0MIol2FlF/ucECUhpRSlGgVTcgCaBZHQJTN4vg3tKJ1fZQoaAZoCWgPQwjnGJC93rlxQJSGlFKUaBVNUQFoFkdAlM4iWu5jIHV9lChoBmgJaA9DCAD+KVWiyWZAlIaUUpRoFU3oA2gWR0CU0ZuJ1q33dX2UKGgGaAloD0MI+3WnO8/1cUCUhpRSlGgVTdkBaBZHQJTR2fChvit1fZQoaAZoCWgPQwhfXKrSFtJxQJSGlFKUaBVN1gJoFkdAlNSIvrWy1XV9lChoBmgJaA9DCOavkLkyhHBAlIaUUpRoFU21AmgWR0CU1b4qwyIpdX2UKGgGaAloD0MIlwM91DZQY0CUhpRSlGgVTegDaBZHQJTZA90Rvm51fZQoaAZoCWgPQwh5Iojz8PVoQJSGlFKUaBVN6ANoFkdAlNoJyMkyDnV9lChoBmgJaA9DCJT3cTTHF2FAlIaUUpRoFU3oA2gWR0CU2kOtW+49dX2UKGgGaAloD0MINE3YfrIyY0CUhpRSlGgVTegDaBZHQJTdHCTEBKd1fZQoaAZoCWgPQwgEHhhA+NpgQJSGlFKUaBVN6ANoFkdAlN0sURFqjHV9lChoBmgJaA9DCNDv+zdvDnBAlIaUUpRoFU2aA2gWR0CU4Gz7/GVBdX2UKGgGaAloD0MIWrxYGKLwZUCUhpRSlGgVTegDaBZHQJTi9RFZxJd1fZQoaAZoCWgPQwhIN8KiIklhQJSGlFKUaBVN6ANoFkdAlOd+KoAGS3V9lChoBmgJaA9DCJZdMLjml2VAlIaUUpRoFU3oA2gWR0CU548274BWdX2UKGgGaAloD0MIMV7zqs7Vb0CUhpRSlGgVTcYDaBZHQJTqu/KyOaR1fZQoaAZoCWgPQwipvYi2YxBwQJSGlFKUaBVNYwNoFkdAlOso150KZ3V9lChoBmgJaA9DCNxkVBlGy25AlIaUUpRoFU3RAmgWR0CU66DtPYWddX2UKGgGaAloD0MI8DZvnBTrYkCUhpRSlGgVTegDaBZHQJTwG8kD6nB1fZQoaAZoCWgPQwieQUP/hBlmQJSGlFKUaBVN6ANoFkdAlPCjqW1MNHV9lChoBmgJaA9DCKBTkJ+NjW9AlIaUUpRoFU2+AmgWR0CU8aJvo/zKdX2UKGgGaAloD0MIh/2eWKfJZECUhpRSlGgVTegDaBZHQJTyb5O8Cgd1fZQoaAZoCWgPQwgpWrkXGIFtQJSGlFKUaBVNtAFoFkdAlPKcyFfzBnV9lChoBmgJaA9DCIyDS8cctWRAlIaUUpRoFU3oA2gWR0CU9Fhb4agmdX2UKGgGaAloD0MIODEkJxNzY0CUhpRSlGgVTegDaBZHQJT06LNwBHV1fZQoaAZoCWgPQwhsy4CzlBNvQJSGlFKUaBVNqwFoFkdAlPYzAeq7y3V9lChoBmgJaA9DCBWL3xTW8WdAlIaUUpRoFU3oA2gWR0CU9sI5YHPedX2UKGgGaAloD0MIflLt03EfaECUhpRSlGgVTegDaBZHQJT4xPfsNUh1fZQoaAZoCWgPQwjZBu5A3bZwQJSGlFKUaBVN6gJoFkdAlPl/XPJJXnV9lChoBmgJaA9DCKEQAYdQcGVAlIaUUpRoFU3oA2gWR0CU+qPbO/tZdX2UKGgGaAloD0MI9HAC02kKaECUhpRSlGgVTegDaBZHQJUA6hxo7FN1fZQoaAZoCWgPQwg9YvTcQmBuQJSGlFKUaBVNxQFoFkdAlQHGWIGhVXV9lChoBmgJaA9DCCBGCI92hHFAlIaUUpRoFU23A2gWR0CVAm7/n4fwdX2UKGgGaAloD0MIyeU/pJ9ycECUhpRSlGgVTUYBaBZHQJUDTsD4gzR1fZQoaAZoCWgPQwgtX5fhPwdoQJSGlFKUaBVN6ANoFkdAlQUtgWrOq3V9lChoBmgJaA9DCNY6cTleiGFAlIaUUpRoFU3oA2gWR0CVBulfJFLGdX2UKGgGaAloD0MIuHNhpBdNZ0CUhpRSlGgVTegDaBZHQJUHRON5t3x1fZQoaAZoCWgPQwipoKLqV3NoQJSGlFKUaBVN6ANoFkdAlQgZA+pwTHV9lChoBmgJaA9DCK6gaYnVD3BAlIaUUpRoFU0HAmgWR0CVCa2fkFOgdX2UKGgGaAloD0MIFkuRfCUKWkCUhpRSlGgVTegDaBZHQJULum3vx6R1fZQoaAZoCWgPQwhM4UGz64hkQJSGlFKUaBVN6ANoFkdAlQv44hllLHV9lChoBmgJaA9DCNfbZipEA3FAlIaUUpRoFU1tA2gWR0CVDVplSS/1dX2UKGgGaAloD0MIo3iVtc2dYUCUhpRSlGgVTegDaBZHQJUOoNI9TxZ1fZQoaAZoCWgPQwi0W8tkOKxoQJSGlFKUaBVN6ANoFkdAlQ/aEWZZ0XV9lChoBmgJaA9DCHV1x2Ib7GRAlIaUUpRoFU3oA2gWR0CVFHCPp6hQdX2UKGgGaAloD0MIpS4Zx8iaZECUhpRSlGgVTegDaBZHQJUXzFQ2uPp1fZQoaAZoCWgPQwgzp8ti4vRwQJSGlFKUaBVN/QJoFkdAlRfsOskpqnV9lChoBmgJaA9DCPevrDQpd2dAlIaUUpRoFU3oA2gWR0CVG4KpkwvhdX2UKGgGaAloD0MIGAXB41srYkCUhpRSlGgVTegDaBZHQJUeRiKBNEh1fZQoaAZoCWgPQwiHhzB+Gl5zQJSGlFKUaBVNFANoFkdAlSBtw71ZknV9lChoBmgJaA9DCN46/3bZ4W9AlIaUUpRoFU3SAWgWR0CVIabWVeKLdWUu"
73
  },
74
  "ep_success_buffer": {
75
  ":type:": "<class 'collections.deque'>",
76
  ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
77
  },
78
+ "_n_updates": 186,
79
+ "n_steps": 2048,
80
  "gamma": 0.999,
81
  "gae_lambda": 0.98,
82
  "ent_coef": 0.01,
83
  "vf_coef": 0.5,
84
  "max_grad_norm": 0.5,
85
+ "batch_size": 128,
86
+ "n_epochs": 6,
87
  "clip_range": {
88
  ":type:": "<class 'function'>",
89
  ":serialized:": "gAWVfgIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwNX2J1aWx0aW5fdHlwZZSTlIwKTGFtYmRhVHlwZZSFlFKUKGgCjAhDb2RlVHlwZZSFlFKUKEsBSwBLAEsBSwFLE0MEiABTAJROhZQpjAFflIWUjE4vaG9tZS9ua3QvLmxvY2FsL2xpYi9weXRob24zLjgvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuAQwIAAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UaA11Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoF2gOjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoGIwHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/yZmZmZmZmoWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="
nkt32/PPO-LunarLander-v2-T2/policy.optimizer.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0b7b16451c22e0115541ab62b6d6f70bf992ef6393aef4961eab31d7ce080886
3
  size 84893
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:08d4fd60107a863f5b9daa1ed6187f9794ee6c193afc1b2b0f4df69d8aaf3ca0
3
  size 84893
nkt32/PPO-LunarLander-v2-T2/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1a2200a246a3fd9c7a4bfb1b1376e32d63348d655fcf47163c83b95e52cbf0d9
3
  size 43201
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3dd1c08a8f2af66b74f30af1957dc929bf21b9e9b047d5de05dd6d75868810ac
3
  size 43201
replay.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2e2576a5009b04f3681c9338ea6b692e36bb3e417e3f5fe39ec7422d629eb555
3
- size 202599
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:552c5d6c78fbeadd22b28cde06e828a3cde193400a141651d3e8a871539cfaf4
3
+ size 185664
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 265.07958151306354, "std_reward": 15.390097927125167, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2022-05-10T21:02:35.166278"}
1
+ {"mean_reward": 265.99398732912925, "std_reward": 20.580651168793356, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2022-05-10T21:31:00.599367"}