NathanS-HuggingFace commited on
Commit
3d49f75
1 Parent(s): ec85111

Hyperparameter tuning

Browse files
Files changed (6) hide show
  1. README.md +1 -1
  2. config.json +1 -1
  3. ppo-LunarLander-v2.zip +1 -1
  4. ppo-LunarLander-v2/data +13 -13
  5. replay.mp4 +0 -0
  6. results.json +1 -1
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: LunarLander-v2
17
  metrics:
18
  - type: mean_reward
19
- value: 302.39 +/- 17.32
20
  name: mean_reward
21
  verified: false
22
  ---
 
16
  type: LunarLander-v2
17
  metrics:
18
  - type: mean_reward
19
+ value: 308.50 +/- 11.39
20
  name: mean_reward
21
  verified: false
22
  ---
config.json CHANGED
@@ -1 +1 @@
1
- {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7fb5e4879b40>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7fb5e4879bd0>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7fb5e4879c60>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7fb5e4879cf0>", "_build": "<function ActorCriticPolicy._build at 0x7fb5e4879d80>", "forward": "<function ActorCriticPolicy.forward at 0x7fb5e4879e10>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x7fb5e4879ea0>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7fb5e4879f30>", "_predict": "<function ActorCriticPolicy._predict at 0x7fb5e4879fc0>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7fb5e487a050>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7fb5e487a0e0>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7fb5e487a170>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7fb5e486ef00>"}, "verbose": 1, "policy_kwargs": {}, "observation_space": {":type:": "<class 'gym.spaces.box.Box'>", ":serialized:": "gAWVYAIAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWCAAAAAAAAAABAQEBAQEBAZRoCIwCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoESiWCAAAAAAAAAABAQEBAQEBAZRoFUsIhZRoGXSUUpSMBl9zaGFwZZRLCIWUjANsb3eUaBEoliAAAAAAAAAAAADAvwAAwL8AAKDAAACgwNsPScAAAKDAAAAAgAAAAICUaAtLCIWUaBl0lFKUjARoaWdolGgRKJYgAAAAAAAAAAAAwD8AAMA/AACgQAAAoEDbD0lAAACgQAAAgD8AAIA/lGgLSwiFlGgZdJRSlIwIbG93X3JlcHKUjFNbLTEuNSAgICAgICAtMS41ICAgICAgIC01LiAgICAgICAgLTUuICAgICAgICAtMy4xNDE1OTI3IC01LgogLTAuICAgICAgICAtMC4gICAgICAgXZSMCWhpZ2hfcmVwcpSMS1sxLjUgICAgICAgMS41ICAgICAgIDUuICAgICAgICA1LiAgICAgICAgMy4xNDE1OTI3IDUuICAgICAgICAxLgogMS4gICAgICAgXZSMCl9ucF9yYW5kb22UTnViLg==", "dtype": "float32", "bounded_below": "[ True True True True True True True True]", "bounded_above": "[ True True True True True True True True]", "_shape": [8], "low": "[-1.5 -1.5 -5. -5. -3.1415927 -5.\n -0. -0. ]", "high": "[1.5 1.5 5. 5. 3.1415927 5. 1.\n 1. ]", "low_repr": "[-1.5 -1.5 -5. -5. -3.1415927 -5.\n -0. -0. ]", "high_repr": "[1.5 1.5 5. 5. 3.1415927 5. 1.\n 1. ]", "_np_random": null}, "action_space": {":type:": "<class 'gym.spaces.discrete.Discrete'>", ":serialized:": "gAWVPwsAAAAAAACME2d5bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpRLBIwFc3RhcnSUSwCMBl9zaGFwZZQpjAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmk4lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMCl9ucF9yYW5kb22UjBRudW1weS5yYW5kb20uX3BpY2tsZZSMEl9fcmFuZG9tc3RhdGVfY3RvcpSTlIwHTVQxOTkzN5SFlFKUfZQojA1iaXRfZ2VuZXJhdG9ylGgVjAVzdGF0ZZR9lCiMA2tleZSMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJbACQAAAAAAAAAAAICf5XKN7DKTmDdZTQotIHxHHahuyk5nO+GJphGKxas1v9eEd0G4AMIylRzWxMmzodHDYuqNHj4kVOgihRmvR0Se2XjsfpjkDBgLu3Y0xTSHiaz1NlKp9DyyoMCSSbo6tT51/s5EGTOW1Lvh5Kyrqf4dh2uxX+nHTQ34p6pAPdpLv3MIiMscQdPA/AXkT8nvgKsjd1LPTSczCPi7uErgWLVdSJrZb1x8Z2IfZ6eamvVoUaL4Nirf+atqvM+McX7hCkx92ZIWLHOj546boBNAv+9+JX/RmlaeUKKLhF2XnI75WjCOxCQZ8kcsH1O42WFLsSMPaLAdnznPu58PfNE+c3lKKtWwkInheEI+FezHc3kdcgqnkHDl/d/EsJ7PlUIF/Es9rwU3rrzrWtxoV2tyRkPe+e54WpHl2koxaCuDWCl9MAAVJMC4OnFPZRwQvLHO9sE2lf9jc493BQGqYz+tbvAnCpy28nhBYNkJ2CwlPLbWO+lYD43p3fRc6H46Iu4T3ER6mt2D52yk5aZhzYng7tkA+2E1Y6zR1f2dpEfyPoxf/qJejc23ECg+DisZEZ8Dz8b7Km4hZGv2LfPRCT20HGz2AnWOyjfg37Fs4etSjYfVQtawbegKHEq0N+wfD6TCbnvPcT/dKM3e8UTvbrZBn0/8LeKhR0V/qN0GyUPZx3+TsPNu3WbBPltAF4kaULM8bEeVsj1ZZOgB8c6ZPMiBSrCkXetIcSTqtepWGdA9fi4LYaZzx6xm+Z62BPY9cusjOivRTAq7nk0BOZxxk6jDQx6U9rDIEK2mYCwdzx1qnJ1kOyPjOFkmsDQ1D5OQepOiroUjgoS2dYC+qaA5qnMrpM/FbDopeUYCRRt1XP9/2AnNp4ovmBn/e+1Qzoqg7IpytEZlO07w3aMEfxE3yUiOe7aiMA4/ramPo6F3ZQKptugAc0Ozw0A0OM3uDhvLezal7Fxl+A8QoAQ2ybcvcWsb74M5/SN+0AMIu9vMYrC1rNyS8BoEgYnQkEyJXbaU8Q9tcpn+/p3obMkwcNfx6ZOzYBXhZQgw63ySYx1VYEi/o9f+G1n5oAvB1+X+xPjEmFei4IHNe14B11w2cUSZnvxm2ariciMXLDISho8egNoGZSXUcRt0yLgh8+gZ472KNyg68NmP6UCNnxvIdrebTsTh40ehfTS/uhi0QZIU7gfNpMgC07l5bKXLfpkUvhFaWRPwR5KSvE7Abk/y85bQPgWsvTESBwyRnZ8+TmykdMeyF6TJTB/6aqhkeCRMkX7ZimjY9KZx6bT779ZvxfS8+uwkRGpTuSBukgjxzipSwZL3e3McoCY9rlOLQ9V8KZSBGIaTE+S3w0dNp0p7RIxJ2vFRbIM9R2LPFltqJbBvuQyGcyAwk3mxG2VpiOTxfbLcMbnk0y7iGUmy6/Cxw336Dmp5gzJA+4lZJp1ojb94iVX199g/vxTCF6iiinv3txFcwrsooEEjOhU8g6T18wEIRzgKr1PBPfmm3T00XuHFe+2UJkbYf3q8SCaEkrnUbXLI2x578yBvKJFwrUnetk/Uc6jcv/MaoPjuQmjzNPBhy7JTpPuqRYWJOlaGLvp1L5nmUDoyXTeylrkl+fOrlXUCTOaIQNtOb1za+Bty/a+jIHTVUvrC/QLm9ozZpdWXRK7bGA58akXDZS0XJzgEREgog88QOVEwf1om7911ei0RkBbPb+nL8c7OtTxHRfEl/6CoWT/ZP+cadPDq6MqI7SDaVUFOUHgmkUXlH0YkZpTIyGm5Jsnb9HSCXGbwkI/mljmCbuwwCvCYTiXrqYOIa5EPf/lcph7ogk+4+lAQhU/6uq+8Uxiu5SFjB2fs6R21uUsqjkuyuwT6mbzKIhVbF41dPvr1lVUXdC7WINe+nSG+lXuGcduxfydq56WCcWjPfcgmv/cQQwmmPQ1zL0LkQYJpxOuzGAg05aMsM2EgogujI9VYmwmxnpsBxo8rw3EAX3Xw604tXuV7A1EIGD9GMlFV57jbHpfUyH7rjoAn/mZPUDlAi8Cn5+2k99M/z2TkT05U2H2BPh7QkQ6Ied8BWqXSE2eJN/qga6cCbX9DBe/G7ZmxbkUmS4zhblXke83hdIHpDqJF5BZCFwflJ58oO+oR3acFuqNIbNhni0eG9YZACbqf1S3equ0ueXVTnYMd1/2KYci1/Gnvh7fGz8tah+KKM3OHSDtJHcae68rp/KnwH6mL6GANjPA7LeO95LPFR1VEZVjSXuVHOAMz+g3M8pRKLDmzw/gVldGAaVCvCkEjgyB6V5F3+ggCbb+RfWdEom8tqJvGrFfnPqqW6ysCYSnInqLDv3wbKhb+T2Q2EDA6cPnD8EGrzJL5Qo4EtRPnZ6VDQm8MheNitYXrFXo9+UOvzlApOV02oUsHejdKVFFu1Ug3ch0MEIOEK6RSxBtdRbgviswGRmv46ajDOQRSQHxbKKhSzeRdFBPZ40ma2CXTS3YTaj7+LP+eCKLbFR36yawjQp3kLmGqpYUXHOOgNQXiyd+Dqlq8GcapVS5lCbVGqEG7wXUB8Ho6OFJHNXuQzJ7VEX8pHjH2QnjhefCWg/S62AC4OZH8rd8JqE3MTaZKR8vzpEoSgDi0D6sGUR2caOhSwCG11S+oz3evSj13CrGxRyc+bE9TTru1WpsVNk7AGB7hWWrZa8tb+3/f/CJRdX1NQhgN3ifCAr66Q0QncVvi2sysw7QjhToZMMHZmWdN3Wiv3gOFj4kfWvF7APexHsSQjm88pUxHD/9Erv4wP/6/tiUWirgC1wLxVGovLLtB6pX/CU23k1HLAS6EinZKsOFiP/dEKSYTp/hggID8JWGdmOsp+jhOAxWxJLXi+if49wKypQDhJ/ey6VKg3cm2hzN9s/wyN5y0LVBMYj9iMzdlGBYP34vOhZpa7gs/eizLvBPca7c4La3q787tBPC+aBA11wDLUJFQRSoTVI3evDg0yRbRAf5gRNWdX1E+smb1m/1vErSPr/cBB4OYsEy22htKCPCX+eps1RWm+4ZY787m9nZTW/KvMxXY/+4DO+BWJXm8tlc7gYRMWGhjuaIEX+ybji8VtGm2MwQVkOnMUACMeRlwxqaNlPmDL5XfnJMt7ms/Ev1arLa8KpXVvflByqeZQ5dRfdhWXkbeyNbfJTQ/zGP46W1G9olxnVThoG9uoKuY30f/nW5XPjqoKPX1J2ysRZesqa95OkhMrQ+C+4W4mP2smNBGn9mq1RIl65/k++L0aOduV/E7EXV+fiebtnizezaWPTG2lWmsSHwGKmVPziITTVNjVLDlZviv1CX/OiFsGEP+E1G2uZzy5kRmNmw4+JRoC4wCdTSUiYiHlFKUKEsDaA9OTk5K/////0r/////SwB0lGJNcAKFlIwBQ5R0lFKUjANwb3OUTXACdYwJaGFzX2dhdXNzlEsAjAVnYXVzc5RHAAAAAAAAAAB1YnViLg==", "n": 4, "start": 0, "_shape": [], "dtype": "int64", "_np_random": "RandomState(MT19937)"}, "n_envs": 16, "num_timesteps": 1015808, "_total_timesteps": 1000000, "_num_timesteps_at_start": 0, "seed": 344042492, "action_noise": null, "start_time": 1676230607495514086, "learning_rate": 0.0003, "tensorboard_log": "tensorboard-logs/ppo-LunarLander-v2-stable-reward-penalize-time/LunarLander-v2", "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWV4wIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMWC9ob21lL3RoZWtleW1hc3Rlci8ubG9jYWwvbGliL3B5dGhvbjMuMTAvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuCQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjFgvaG9tZS90aGVrZXltYXN0ZXIvLmxvY2FsL2xpYi9weXRob24zLjEwL3NpdGUtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz8zqSowVTJhhZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAGY707xSwus8kwnBvZF4xb7UzjC+rYHqvQAAAAAAAAAA4CArvv0Jbj5ayqw+6uMlv9cPQr7Cz48+AAAAAAAAAADNJH074rq1P8FGQT6sQjw+OvMWu6pv3LkAAAAAAAAAAEbSNL613SQ/DhJNPFwDXr8E2Lq+jIgHPgAAAAAAAAAA87nrvduijz9msAS/FjkyvwxlGb5uAqq+AAAAAAAAAABDl4O+NBuXPyOVu74vlhO/tlEwv/Z0bL4AAAAAAAAAAJr57rxu6NA+utgwvQJXTL+Spq+8uzSlvAAAAAAAAAAAoCRWPu2+hD/T/S4+Pkbrvp4/Nz/xZAo/AAAAAAAAAADNnDO9KQAmupr38bazM4ayvNfGOkLuDTYAAIA/AACAPwDxuDxbbLI/WI1rPjHaQr7Sxf48Z7ANPgAAAAAAAAAAACAhPIlKwD/ILI09mSUcPl+RMDtqRvc8AAAAAAAAAAAzPue8j3Y8umFLCTr0BiS5ZGqgOlvAD7kAAIA/AACAP9MdEz4ORWA/zCfJPXecIr+mjw8//NgQPgAAAAAAAAAAE+kjvgPMXLym+y063BIlOBaOwD22M2O5AAAAAAAAgD+myBQ+84WEP8gMmT4uVyq/d9PLPiY0xT4AAAAAAAAAALCZab54BAM/mqRxPukgYr9WKau+9ZWTPgAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.015808000000000044, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVHRAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIUI4CRAFOdECUhpRSlIwBbJRLqIwBdJRHQJvheHymQ8x1fZQoaAZoCWgPQwhN2ekHNXpzQJSGlFKUaBVLoGgWR0Cb4erfcer/dX2UKGgGaAloD0MIxOv6BTv1cUCUhpRSlGgVS7toFkdAm+J8r3CbdHV9lChoBmgJaA9DCHR63o0F+XFAlIaUUpRoFUusaBZHQJvi5GKAJ9l1fZQoaAZoCWgPQwgIy9jQjZ1xQJSGlFKUaBVLmmgWR0Cb5E+85CF9dX2UKGgGaAloD0MIJJhqZu3CcUCUhpRSlGgVS65oFkdAm+TGnn+yaHV9lChoBmgJaA9DCOHTnLxI63FAlIaUUpRoFUuQaBZHQJvmDvd/J/51fZQoaAZoCWgPQwjO/kC5LblxQJSGlFKUaBVLjmgWR0Cb5kkTpPhydX2UKGgGaAloD0MI5BQdyaXscECUhpRSlGgVS5BoFkdAm+cFk6Lfk3V9lChoBmgJaA9DCCKnr+drDnJAlIaUUpRoFUueaBZHQJvnotjCpFV1fZQoaAZoCWgPQwg6ArhZfEhwQJSGlFKUaBVLiWgWR0Cb6ASZjQRgdX2UKGgGaAloD0MIcw8J33sUcUCUhpRSlGgVS4NoFkdAm+gvcFhXsHV9lChoBmgJaA9DCOJcwwwNiHBAlIaUUpRoFUucaBZHQJvo39ZRsM11fZQoaAZoCWgPQwgJ/reS3fZyQJSGlFKUaBVL02gWR0Cb6WvoePq+dX2UKGgGaAloD0MIPiR87282c0CUhpRSlGgVS5doFkdAm+noa1kUbnV9lChoBmgJaA9DCDT2JRuPkHFAlIaUUpRoFUuraBZHQJvqF+1Bt1p1fZQoaAZoCWgPQwjhQ4mWfAlzQJSGlFKUaBVLmmgWR0Cb6qjqfOD8dX2UKGgGaAloD0MIysStgphbcECUhpRSlGgVS5toFkdAm+thf4REnnV9lChoBmgJaA9DCNTzbizounNAlIaUUpRoFUuYaBZHQJvrvwI+nqF1fZQoaAZoCWgPQwh/FHXmHs9zQJSGlFKUaBVL4GgWR0Cb7BZTho/SdX2UKGgGaAloD0MIryE4LmO7cECUhpRSlGgVS41oFkdAm+yYxcmjTXV9lChoBmgJaA9DCIDwoURLOkJAlIaUUpRoFUtnaBZHQJvtKK+BYmt1fZQoaAZoCWgPQwj8NVmj3v9xQJSGlFKUaBVLomgWR0Cb7iowmE5AdX2UKGgGaAloD0MIzH7d6U5xc0CUhpRSlGgVS6BoFkdAm++G9pRGdHV9lChoBmgJaA9DCLHfE+vUtnJAlIaUUpRoFUuvaBZHQJvwhovi97F1fZQoaAZoCWgPQwiKIM7DST5zQJSGlFKUaBVLlmgWR0Cb8Mp35eqrdX2UKGgGaAloD0MIFHmSdM2YcUCUhpRSlGgVS5VoFkdAm/IKJ/G2kXV9lChoBmgJaA9DCCdPWU1XMG9AlIaUUpRoFUuiaBZHQJvyOYQarFR1fZQoaAZoCWgPQwhQ/YNIxlJxQJSGlFKUaBVLr2gWR0Cb8kWNm16WdX2UKGgGaAloD0MIPNujN9yxcECUhpRSlGgVS55oFkdAm/LnQUpNK3V9lChoBmgJaA9DCLuZ0Y9G93JAlIaUUpRoFUvKaBZHQJvzPbpNbkh1fZQoaAZoCWgPQwiXVkPinolwQJSGlFKUaBVLi2gWR0Cb838NhE0BdX2UKGgGaAloD0MILbRzmsUrcECUhpRSlGgVS5VoFkdAm/O1xS5y2nV9lChoBmgJaA9DCKZfIt763XJAlIaUUpRoFUuuaBZHQJvz5x6v7nB1fZQoaAZoCWgPQwiOkewRaoFzQJSGlFKUaBVLpmgWR0Cb8/R2r4nGdX2UKGgGaAloD0MIdGA5Qsapc0CUhpRSlGgVS5BoFkdAm/RkuDjBEnV9lChoBmgJaA9DCMsr19vmM3JAlIaUUpRoFUuJaBZHQJv0iSB9Tgl1fZQoaAZoCWgPQwiWQbXByedxQJSGlFKUaBVLnmgWR0Cb9IUPQOWjdX2UKGgGaAloD0MI4jlbQGi+c0CUhpRSlGgVS6NoFkdAm/ZQX668QXV9lChoBmgJaA9DCOS9amUCV3NAlIaUUpRoFUuxaBZHQJv4cV32VVx1fZQoaAZoCWgPQwi4dTdPNdpxQJSGlFKUaBVLhWgWR0Cb+IO+ZgG9dX2UKGgGaAloD0MIey5Tk2ABckCUhpRSlGgVS6doFkdAm/jlK5Cng3V9lChoBmgJaA9DCJs8ZTVdY3FAlIaUUpRoFUulaBZHQJv5JM6BAfN1fZQoaAZoCWgPQwiOB1vs9vlvQJSGlFKUaBVLjmgWR0Cb+c5mh/RWdX2UKGgGaAloD0MIuMg9XZ20cUCUhpRSlGgVS6VoFkdAm/pubRWtEHV9lChoBmgJaA9DCDp6/N7mtnBAlIaUUpRoFUuZaBZHQJv6zXGwRoR1fZQoaAZoCWgPQwj19BH4A0xwQJSGlFKUaBVLlmgWR0Cb+0K6WgOCdX2UKGgGaAloD0MISG+4j1zjcUCUhpRSlGgVS5loFkdAm/tyDAaegHV9lChoBmgJaA9DCEOR7ufUgXFAlIaUUpRoFUucaBZHQJv7aiblRxd1fZQoaAZoCWgPQwi5bd+jfjlyQJSGlFKUaBVLvmgWR0Cb+71DjR2KdX2UKGgGaAloD0MIpMLYQlArcUCUhpRSlGgVS7ZoFkdAm/yFVT72tnV9lChoBmgJaA9DCDKqDONuiXJAlIaUUpRoFUuraBZHQJv89BOYYzl1fZQoaAZoCWgPQwjEQxg/TatzQJSGlFKUaBVLr2gWR0Cb/UgqmTC+dX2UKGgGaAloD0MI06BoHgD3c0CUhpRSlGgVS7doFkdAm/2rlA/s3XV9lChoBmgJaA9DCKbtX1lp0HJAlIaUUpRoFUuHaBZHQJv/iMl1KXh1fZQoaAZoCWgPQwiiJCTSNnZxQJSGlFKUaBVLi2gWR0Cb/6uaF23bdX2UKGgGaAloD0MIoUeMnpsqc0CUhpRSlGgVS6doFkdAnAJxVAAyVXV9lChoBmgJaA9DCOQViJ4UcnJAlIaUUpRoFUusaBZHQJwCkfs/pt91fZQoaAZoCWgPQwje40wTdqVwQJSGlFKUaBVL3GgWR0CcAsXhfjS5dX2UKGgGaAloD0MIQbYsX5cEcUCUhpRSlGgVS5NoFkdAnAPnHvMKTnV9lChoBmgJaA9DCGSV0jM9t3FAlIaUUpRoFUuEaBZHQJwETaxoqTd1fZQoaAZoCWgPQwgp7Q2+sKdwQJSGlFKUaBVLoWgWR0CcBIeF+NLldX2UKGgGaAloD0MI3PKRlPQpcUCUhpRSlGgVS6toFkdAnASjK1XvIHV9lChoBmgJaA9DCPThWYJManNAlIaUUpRoFUuzaBZHQJwE0xmCiAV1fZQoaAZoCWgPQwhYObTItkNxQJSGlFKUaBVLn2gWR0CcBQMvAXVLdX2UKGgGaAloD0MIucFQh9Vic0CUhpRSlGgVS5BoFkdAnAV6asp5NXV9lChoBmgJaA9DCIVefxJfgXNAlIaUUpRoFUuxaBZHQJwFpyIYWLx1fZQoaAZoCWgPQwisqpffabxwQJSGlFKUaBVLk2gWR0CcBg9uxbB5dX2UKGgGaAloD0MI2V4Leq9rc0CUhpRSlGgVS6loFkdAnAfKhcqvvHV9lChoBmgJaA9DCGEyVTDqfnNAlIaUUpRoFUuiaBZHQJwJxWEK3NN1fZQoaAZoCWgPQwi8sgsG1x9yQJSGlFKUaBVLgGgWR0CcCjmXPZ7HdX2UKGgGaAloD0MIHqSnyGEJdECUhpRSlGgVS7loFkdAnAsUofCAMHV9lChoBmgJaA9DCKZ7ndTXFXJAlIaUUpRoFUuVaBZHQJwLa8CgbqB1fZQoaAZoCWgPQwgNjLysiQdzQJSGlFKUaBVLiWgWR0CcDGyH2ys0dX2UKGgGaAloD0MIqYdodIeocUCUhpRSlGgVS4ZoFkdAnA5KlDWsinV9lChoBmgJaA9DCL3faMeN7XJAlIaUUpRoFUu9aBZHQJwOpbiZOSJ1fZQoaAZoCWgPQwjAdjBiX+VxQJSGlFKUaBVLlWgWR0CcDxSJj2BbdX2UKGgGaAloD0MI2GX4T/fVckCUhpRSlGgVS61oFkdAnA9DNdJJ5HV9lChoBmgJaA9DCOup1VcXs3FAlIaUUpRoFUuoaBZHQJwPbWbwz+F1fZQoaAZoCWgPQwj5LqUu2X5yQJSGlFKUaBVLrGgWR0CcD8T5O8CgdX2UKGgGaAloD0MIaB8r+C1ncUCUhpRSlGgVS7RoFkdAnBAWbPQfIXV9lChoBmgJaA9DCMiZJmz/GHRAlIaUUpRoFUu2aBZHQJwQrUjLSu11fZQoaAZoCWgPQwhzucFQh9NxQJSGlFKUaBVLjGgWR0CcES7qIJqqdX2UKGgGaAloD0MIUb6ghQQLdECUhpRSlGgVS7hoFkdAnBIE8aGYbHV9lChoBmgJaA9DCLXf2omSGHNAlIaUUpRoFUuDaBZHQJwSbk1dgOV1fZQoaAZoCWgPQwhiaHVyxgZxQJSGlFKUaBVLiWgWR0CcE/4nF5v+dX2UKGgGaAloD0MIOpZ31UMgc0CUhpRSlGgVS6FoFkdAnBSqS9ugpXV9lChoBmgJaA9DCLPqc7UVq3FAlIaUUpRoFUufaBZHQJwVzctXgcd1fZQoaAZoCWgPQwg3p5IBoP5yQJSGlFKUaBVLqmgWR0CcF0u8scyWdX2UKGgGaAloD0MI5Gn5gavVb0CUhpRSlGgVS5FoFkdAnBfPDpC8e3V9lChoBmgJaA9DCFYrE35pt3JAlIaUUpRoFUukaBZHQJwYwO09hZ11fZQoaAZoCWgPQwgUzJiCdWdxQJSGlFKUaBVLnWgWR0CcGbSW7e2vdX2UKGgGaAloD0MICOdTx6qyc0CUhpRSlGgVS6NoFkdAnBpxJqZc9nV9lChoBmgJaA9DCKx0d51NcnRAlIaUUpRoFUuvaBZHQJwajuF6Avt1fZQoaAZoCWgPQwj0jH3JRnhyQJSGlFKUaBVLs2gWR0CcGo5lOGj9dX2UKGgGaAloD0MIMsnIWRg+cUCUhpRSlGgVS55oFkdAnBs/tD2JznV9lChoBmgJaA9DCJQUWAATQXJAlIaUUpRoFUuwaBZHQJwcCih37k51fZQoaAZoCWgPQwjGFRdHpRBxQJSGlFKUaBVLy2gWR0CcHGlrM1TBdX2UKGgGaAloD0MIPdF14cfIckCUhpRSlGgVS51oFkdAnBygVfu1GHV9lChoBmgJaA9DCBxhURHnB3JAlIaUUpRoFUuKaBZHQJwdFxm03Ox1ZS4="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 12756, "n_steps": 1024, "gamma": 0.999, "gae_lambda": 0.98, "ent_coef": 0.01, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 4, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWVwQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMRy9ob21lL21hcmt1cy9zcmMvYWkvc3RhYmxlLWJhc2VsaW5lczMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5RLgUMCBAGUjAN2YWyUhZQpdJRSlH2UKIwLX19wYWNrYWdlX1+UjBhzdGFibGVfYmFzZWxpbmVzMy5jb21tb26UjAhfX25hbWVfX5SMHnN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi51dGlsc5SMCF9fZmlsZV9flIxHL2hvbWUvbWFya3VzL3NyYy9haS9zdGFibGUtYmFzZWxpbmVzMy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUdU5OaACMEF9tYWtlX2VtcHR5X2NlbGyUk5QpUpSFlHSUUpSMHGNsb3VkcGlja2xlLmNsb3VkcGlja2xlX2Zhc3SUjBJfZnVuY3Rpb25fc2V0c3RhdGWUk5RoH32UfZQoaBZoDYwMX19xdWFsbmFtZV9flIwZY29uc3RhbnRfZm4uPGxvY2Fscz4uZnVuY5SMD19fYW5ub3RhdGlvbnNfX5R9lIwOX19rd2RlZmF1bHRzX1+UTowMX19kZWZhdWx0c19flE6MCl9fbW9kdWxlX1+UaBeMB19fZG9jX1+UTowLX19jbG9zdXJlX1+UaACMCl9tYWtlX2NlbGyUk5RHP8mZmZmZmZqFlFKUhZSMF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "system_info": {"OS": "Linux-5.15.52-gentoo-x86_64-x86_64-AMD_Ryzen_5_1600_Six-Core_Processor-with-glibc2.35 # 1 SMP Thu Jul 21 22:26:07 EDT 2022", "Python": "3.10.6", "Stable-Baselines3": "1.7.0", "PyTorch": "1.13.1+cu117", "GPU Enabled": "True", "Numpy": "1.23.1", "Gym": "0.21.0"}}
 
1
+ {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7f6a55b71b40>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f6a55b71bd0>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f6a55b71c60>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f6a55b71cf0>", "_build": "<function ActorCriticPolicy._build at 0x7f6a55b71d80>", "forward": "<function ActorCriticPolicy.forward at 0x7f6a55b71e10>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x7f6a55b71ea0>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f6a55b71f30>", "_predict": "<function ActorCriticPolicy._predict at 0x7f6a55b71fc0>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f6a55b72050>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f6a55b720e0>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f6a55b72170>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7f6a56194540>"}, "verbose": 1, "policy_kwargs": {}, "observation_space": {":type:": "<class 'gym.spaces.box.Box'>", ":serialized:": "gAWVYAIAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWCAAAAAAAAAABAQEBAQEBAZRoCIwCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoESiWCAAAAAAAAAABAQEBAQEBAZRoFUsIhZRoGXSUUpSMBl9zaGFwZZRLCIWUjANsb3eUaBEoliAAAAAAAAAAAADAvwAAwL8AAKDAAACgwNsPScAAAKDAAAAAgAAAAICUaAtLCIWUaBl0lFKUjARoaWdolGgRKJYgAAAAAAAAAAAAwD8AAMA/AACgQAAAoEDbD0lAAACgQAAAgD8AAIA/lGgLSwiFlGgZdJRSlIwIbG93X3JlcHKUjFNbLTEuNSAgICAgICAtMS41ICAgICAgIC01LiAgICAgICAgLTUuICAgICAgICAtMy4xNDE1OTI3IC01LgogLTAuICAgICAgICAtMC4gICAgICAgXZSMCWhpZ2hfcmVwcpSMS1sxLjUgICAgICAgMS41ICAgICAgIDUuICAgICAgICA1LiAgICAgICAgMy4xNDE1OTI3IDUuICAgICAgICAxLgogMS4gICAgICAgXZSMCl9ucF9yYW5kb22UTnViLg==", "dtype": "float32", "bounded_below": "[ True True True True True True True True]", "bounded_above": "[ True True True True True True True True]", "_shape": [8], "low": "[-1.5 -1.5 -5. -5. -3.1415927 -5.\n -0. -0. ]", "high": "[1.5 1.5 5. 5. 3.1415927 5. 1.\n 1. ]", "low_repr": "[-1.5 -1.5 -5. -5. -3.1415927 -5.\n -0. -0. ]", "high_repr": "[1.5 1.5 5. 5. 3.1415927 5. 1.\n 1. ]", "_np_random": null}, "action_space": {":type:": "<class 'gym.spaces.discrete.Discrete'>", ":serialized:": "gAWVPwsAAAAAAACME2d5bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpRLBIwFc3RhcnSUSwCMBl9zaGFwZZQpjAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmk4lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMCl9ucF9yYW5kb22UjBRudW1weS5yYW5kb20uX3BpY2tsZZSMEl9fcmFuZG9tc3RhdGVfY3RvcpSTlIwHTVQxOTkzN5SFlFKUfZQojA1iaXRfZ2VuZXJhdG9ylGgVjAVzdGF0ZZR9lCiMA2tleZSMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJbACQAAAAAAAAAAAICf5XKN7DKTmDdZTQotIHxHHahuyk5nO+GJphGKxas1v9eEd0G4AMIylRzWxMmzodHDYuqNHj4kVOgihRmvR0Se2XjsfpjkDBgLu3Y0xTSHiaz1NlKp9DyyoMCSSbo6tT51/s5EGTOW1Lvh5Kyrqf4dh2uxX+nHTQ34p6pAPdpLv3MIiMscQdPA/AXkT8nvgKsjd1LPTSczCPi7uErgWLVdSJrZb1x8Z2IfZ6eamvVoUaL4Nirf+atqvM+McX7hCkx92ZIWLHOj546boBNAv+9+JX/RmlaeUKKLhF2XnI75WjCOxCQZ8kcsH1O42WFLsSMPaLAdnznPu58PfNE+c3lKKtWwkInheEI+FezHc3kdcgqnkHDl/d/EsJ7PlUIF/Es9rwU3rrzrWtxoV2tyRkPe+e54WpHl2koxaCuDWCl9MAAVJMC4OnFPZRwQvLHO9sE2lf9jc493BQGqYz+tbvAnCpy28nhBYNkJ2CwlPLbWO+lYD43p3fRc6H46Iu4T3ER6mt2D52yk5aZhzYng7tkA+2E1Y6zR1f2dpEfyPoxf/qJejc23ECg+DisZEZ8Dz8b7Km4hZGv2LfPRCT20HGz2AnWOyjfg37Fs4etSjYfVQtawbegKHEq0N+wfD6TCbnvPcT/dKM3e8UTvbrZBn0/8LeKhR0V/qN0GyUPZx3+TsPNu3WbBPltAF4kaULM8bEeVsj1ZZOgB8c6ZPMiBSrCkXetIcSTqtepWGdA9fi4LYaZzx6xm+Z62BPY9cusjOivRTAq7nk0BOZxxk6jDQx6U9rDIEK2mYCwdzx1qnJ1kOyPjOFkmsDQ1D5OQepOiroUjgoS2dYC+qaA5qnMrpM/FbDopeUYCRRt1XP9/2AnNp4ovmBn/e+1Qzoqg7IpytEZlO07w3aMEfxE3yUiOe7aiMA4/ramPo6F3ZQKptugAc0Ozw0A0OM3uDhvLezal7Fxl+A8QoAQ2ybcvcWsb74M5/SN+0AMIu9vMYrC1rNyS8BoEgYnQkEyJXbaU8Q9tcpn+/p3obMkwcNfx6ZOzYBXhZQgw63ySYx1VYEi/o9f+G1n5oAvB1+X+xPjEmFei4IHNe14B11w2cUSZnvxm2ariciMXLDISho8egNoGZSXUcRt0yLgh8+gZ472KNyg68NmP6UCNnxvIdrebTsTh40ehfTS/uhi0QZIU7gfNpMgC07l5bKXLfpkUvhFaWRPwR5KSvE7Abk/y85bQPgWsvTESBwyRnZ8+TmykdMeyF6TJTB/6aqhkeCRMkX7ZimjY9KZx6bT779ZvxfS8+uwkRGpTuSBukgjxzipSwZL3e3McoCY9rlOLQ9V8KZSBGIaTE+S3w0dNp0p7RIxJ2vFRbIM9R2LPFltqJbBvuQyGcyAwk3mxG2VpiOTxfbLcMbnk0y7iGUmy6/Cxw336Dmp5gzJA+4lZJp1ojb94iVX199g/vxTCF6iiinv3txFcwrsooEEjOhU8g6T18wEIRzgKr1PBPfmm3T00XuHFe+2UJkbYf3q8SCaEkrnUbXLI2x578yBvKJFwrUnetk/Uc6jcv/MaoPjuQmjzNPBhy7JTpPuqRYWJOlaGLvp1L5nmUDoyXTeylrkl+fOrlXUCTOaIQNtOb1za+Bty/a+jIHTVUvrC/QLm9ozZpdWXRK7bGA58akXDZS0XJzgEREgog88QOVEwf1om7911ei0RkBbPb+nL8c7OtTxHRfEl/6CoWT/ZP+cadPDq6MqI7SDaVUFOUHgmkUXlH0YkZpTIyGm5Jsnb9HSCXGbwkI/mljmCbuwwCvCYTiXrqYOIa5EPf/lcph7ogk+4+lAQhU/6uq+8Uxiu5SFjB2fs6R21uUsqjkuyuwT6mbzKIhVbF41dPvr1lVUXdC7WINe+nSG+lXuGcduxfydq56WCcWjPfcgmv/cQQwmmPQ1zL0LkQYJpxOuzGAg05aMsM2EgogujI9VYmwmxnpsBxo8rw3EAX3Xw604tXuV7A1EIGD9GMlFV57jbHpfUyH7rjoAn/mZPUDlAi8Cn5+2k99M/z2TkT05U2H2BPh7QkQ6Ied8BWqXSE2eJN/qga6cCbX9DBe/G7ZmxbkUmS4zhblXke83hdIHpDqJF5BZCFwflJ58oO+oR3acFuqNIbNhni0eG9YZACbqf1S3equ0ueXVTnYMd1/2KYci1/Gnvh7fGz8tah+KKM3OHSDtJHcae68rp/KnwH6mL6GANjPA7LeO95LPFR1VEZVjSXuVHOAMz+g3M8pRKLDmzw/gVldGAaVCvCkEjgyB6V5F3+ggCbb+RfWdEom8tqJvGrFfnPqqW6ysCYSnInqLDv3wbKhb+T2Q2EDA6cPnD8EGrzJL5Qo4EtRPnZ6VDQm8MheNitYXrFXo9+UOvzlApOV02oUsHejdKVFFu1Ug3ch0MEIOEK6RSxBtdRbgviswGRmv46ajDOQRSQHxbKKhSzeRdFBPZ40ma2CXTS3YTaj7+LP+eCKLbFR36yawjQp3kLmGqpYUXHOOgNQXiyd+Dqlq8GcapVS5lCbVGqEG7wXUB8Ho6OFJHNXuQzJ7VEX8pHjH2QnjhefCWg/S62AC4OZH8rd8JqE3MTaZKR8vzpEoSgDi0D6sGUR2caOhSwCG11S+oz3evSj13CrGxRyc+bE9TTru1WpsVNk7AGB7hWWrZa8tb+3/f/CJRdX1NQhgN3ifCAr66Q0QncVvi2sysw7QjhToZMMHZmWdN3Wiv3gOFj4kfWvF7APexHsSQjm88pUxHD/9Erv4wP/6/tiUWirgC1wLxVGovLLtB6pX/CU23k1HLAS6EinZKsOFiP/dEKSYTp/hggID8JWGdmOsp+jhOAxWxJLXi+if49wKypQDhJ/ey6VKg3cm2hzN9s/wyN5y0LVBMYj9iMzdlGBYP34vOhZpa7gs/eizLvBPca7c4La3q787tBPC+aBA11wDLUJFQRSoTVI3evDg0yRbRAf5gRNWdX1E+smb1m/1vErSPr/cBB4OYsEy22htKCPCX+eps1RWm+4ZY787m9nZTW/KvMxXY/+4DO+BWJXm8tlc7gYRMWGhjuaIEX+ybji8VtGm2MwQVkOnMUACMeRlwxqaNlPmDL5XfnJMt7ms/Ev1arLa8KpXVvflByqeZQ5dRfdhWXkbeyNbfJTQ/zGP46W1G9olxnVThoG9uoKuY30f/nW5XPjqoKPX1J2ysRZesqa95OkhMrQ+C+4W4mP2smNBGn9mq1RIl65/k++L0aOduV/E7EXV+fiebtnizezaWPTG2lWmsSHwGKmVPziITTVNjVLDlZviv1CX/OiFsGEP+E1G2uZzy5kRmNmw4+JRoC4wCdTSUiYiHlFKUKEsDaA9OTk5K/////0r/////SwB0lGJNcAKFlIwBQ5R0lFKUjANwb3OUTXACdYwJaGFzX2dhdXNzlEsAjAVnYXVzc5RHAAAAAAAAAAB1YnViLg==", "n": 4, "start": 0, "_shape": [], "dtype": "int64", "_np_random": "RandomState(MT19937)"}, "n_envs": 16, "num_timesteps": 1015808, "_total_timesteps": 1000000, "_num_timesteps_at_start": 0, "seed": 344042492, "action_noise": null, "start_time": 1676230607495514086, "learning_rate": 0.0003, "tensorboard_log": "tensorboard-logs/ppo-LunarLander-v2-stable-reward-penalize-time/LunarLander-v2", "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWV4wIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMWC9ob21lL3RoZWtleW1hc3Rlci8ubG9jYWwvbGliL3B5dGhvbjMuMTAvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuCQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjFgvaG9tZS90aGVrZXltYXN0ZXIvLmxvY2FsL2xpYi9weXRob24zLjEwL3NpdGUtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz8zqSowVTJhhZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAGY707xSwus8kwnBvZF4xb7UzjC+rYHqvQAAAAAAAAAA4CArvv0Jbj5ayqw+6uMlv9cPQr7Cz48+AAAAAAAAAADNJH074rq1P8FGQT6sQjw+OvMWu6pv3LkAAAAAAAAAAEbSNL613SQ/DhJNPFwDXr8E2Lq+jIgHPgAAAAAAAAAA87nrvduijz9msAS/FjkyvwxlGb5uAqq+AAAAAAAAAABDl4O+NBuXPyOVu74vlhO/tlEwv/Z0bL4AAAAAAAAAAJr57rxu6NA+utgwvQJXTL+Spq+8uzSlvAAAAAAAAAAAoCRWPu2+hD/T/S4+Pkbrvp4/Nz/xZAo/AAAAAAAAAADNnDO9KQAmupr38bazM4ayvNfGOkLuDTYAAIA/AACAPwDxuDxbbLI/WI1rPjHaQr7Sxf48Z7ANPgAAAAAAAAAAACAhPIlKwD/ILI09mSUcPl+RMDtqRvc8AAAAAAAAAAAzPue8j3Y8umFLCTr0BiS5ZGqgOlvAD7kAAIA/AACAP9MdEz4ORWA/zCfJPXecIr+mjw8//NgQPgAAAAAAAAAAE+kjvgPMXLym+y063BIlOBaOwD22M2O5AAAAAAAAgD+myBQ+84WEP8gMmT4uVyq/d9PLPiY0xT4AAAAAAAAAALCZab54BAM/mqRxPukgYr9WKau+9ZWTPgAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.015808000000000044, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVHRAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIUI4CRAFOdECUhpRSlIwBbJRLqIwBdJRHQJvheHymQ8x1fZQoaAZoCWgPQwhN2ekHNXpzQJSGlFKUaBVLoGgWR0Cb4erfcer/dX2UKGgGaAloD0MIxOv6BTv1cUCUhpRSlGgVS7toFkdAm+J8r3CbdHV9lChoBmgJaA9DCHR63o0F+XFAlIaUUpRoFUusaBZHQJvi5GKAJ9l1fZQoaAZoCWgPQwgIy9jQjZ1xQJSGlFKUaBVLmmgWR0Cb5E+85CF9dX2UKGgGaAloD0MIJJhqZu3CcUCUhpRSlGgVS65oFkdAm+TGnn+yaHV9lChoBmgJaA9DCOHTnLxI63FAlIaUUpRoFUuQaBZHQJvmDvd/J/51fZQoaAZoCWgPQwjO/kC5LblxQJSGlFKUaBVLjmgWR0Cb5kkTpPhydX2UKGgGaAloD0MI5BQdyaXscECUhpRSlGgVS5BoFkdAm+cFk6Lfk3V9lChoBmgJaA9DCCKnr+drDnJAlIaUUpRoFUueaBZHQJvnotjCpFV1fZQoaAZoCWgPQwg6ArhZfEhwQJSGlFKUaBVLiWgWR0Cb6ASZjQRgdX2UKGgGaAloD0MIcw8J33sUcUCUhpRSlGgVS4NoFkdAm+gvcFhXsHV9lChoBmgJaA9DCOJcwwwNiHBAlIaUUpRoFUucaBZHQJvo39ZRsM11fZQoaAZoCWgPQwgJ/reS3fZyQJSGlFKUaBVL02gWR0Cb6WvoePq+dX2UKGgGaAloD0MIPiR87282c0CUhpRSlGgVS5doFkdAm+noa1kUbnV9lChoBmgJaA9DCDT2JRuPkHFAlIaUUpRoFUuraBZHQJvqF+1Bt1p1fZQoaAZoCWgPQwjhQ4mWfAlzQJSGlFKUaBVLmmgWR0Cb6qjqfOD8dX2UKGgGaAloD0MIysStgphbcECUhpRSlGgVS5toFkdAm+thf4REnnV9lChoBmgJaA9DCNTzbizounNAlIaUUpRoFUuYaBZHQJvrvwI+nqF1fZQoaAZoCWgPQwh/FHXmHs9zQJSGlFKUaBVL4GgWR0Cb7BZTho/SdX2UKGgGaAloD0MIryE4LmO7cECUhpRSlGgVS41oFkdAm+yYxcmjTXV9lChoBmgJaA9DCIDwoURLOkJAlIaUUpRoFUtnaBZHQJvtKK+BYmt1fZQoaAZoCWgPQwj8NVmj3v9xQJSGlFKUaBVLomgWR0Cb7iowmE5AdX2UKGgGaAloD0MIzH7d6U5xc0CUhpRSlGgVS6BoFkdAm++G9pRGdHV9lChoBmgJaA9DCLHfE+vUtnJAlIaUUpRoFUuvaBZHQJvwhovi97F1fZQoaAZoCWgPQwiKIM7DST5zQJSGlFKUaBVLlmgWR0Cb8Mp35eqrdX2UKGgGaAloD0MIFHmSdM2YcUCUhpRSlGgVS5VoFkdAm/IKJ/G2kXV9lChoBmgJaA9DCCdPWU1XMG9AlIaUUpRoFUuiaBZHQJvyOYQarFR1fZQoaAZoCWgPQwhQ/YNIxlJxQJSGlFKUaBVLr2gWR0Cb8kWNm16WdX2UKGgGaAloD0MIPNujN9yxcECUhpRSlGgVS55oFkdAm/LnQUpNK3V9lChoBmgJaA9DCLuZ0Y9G93JAlIaUUpRoFUvKaBZHQJvzPbpNbkh1fZQoaAZoCWgPQwiXVkPinolwQJSGlFKUaBVLi2gWR0Cb838NhE0BdX2UKGgGaAloD0MILbRzmsUrcECUhpRSlGgVS5VoFkdAm/O1xS5y2nV9lChoBmgJaA9DCKZfIt763XJAlIaUUpRoFUuuaBZHQJvz5x6v7nB1fZQoaAZoCWgPQwiOkewRaoFzQJSGlFKUaBVLpmgWR0Cb8/R2r4nGdX2UKGgGaAloD0MIdGA5Qsapc0CUhpRSlGgVS5BoFkdAm/RkuDjBEnV9lChoBmgJaA9DCMsr19vmM3JAlIaUUpRoFUuJaBZHQJv0iSB9Tgl1fZQoaAZoCWgPQwiWQbXByedxQJSGlFKUaBVLnmgWR0Cb9IUPQOWjdX2UKGgGaAloD0MI4jlbQGi+c0CUhpRSlGgVS6NoFkdAm/ZQX668QXV9lChoBmgJaA9DCOS9amUCV3NAlIaUUpRoFUuxaBZHQJv4cV32VVx1fZQoaAZoCWgPQwi4dTdPNdpxQJSGlFKUaBVLhWgWR0Cb+IO+ZgG9dX2UKGgGaAloD0MIey5Tk2ABckCUhpRSlGgVS6doFkdAm/jlK5Cng3V9lChoBmgJaA9DCJs8ZTVdY3FAlIaUUpRoFUulaBZHQJv5JM6BAfN1fZQoaAZoCWgPQwiOB1vs9vlvQJSGlFKUaBVLjmgWR0Cb+c5mh/RWdX2UKGgGaAloD0MIuMg9XZ20cUCUhpRSlGgVS6VoFkdAm/pubRWtEHV9lChoBmgJaA9DCDp6/N7mtnBAlIaUUpRoFUuZaBZHQJv6zXGwRoR1fZQoaAZoCWgPQwj19BH4A0xwQJSGlFKUaBVLlmgWR0Cb+0K6WgOCdX2UKGgGaAloD0MISG+4j1zjcUCUhpRSlGgVS5loFkdAm/tyDAaegHV9lChoBmgJaA9DCEOR7ufUgXFAlIaUUpRoFUucaBZHQJv7aiblRxd1fZQoaAZoCWgPQwi5bd+jfjlyQJSGlFKUaBVLvmgWR0Cb+71DjR2KdX2UKGgGaAloD0MIpMLYQlArcUCUhpRSlGgVS7ZoFkdAm/yFVT72tnV9lChoBmgJaA9DCDKqDONuiXJAlIaUUpRoFUuraBZHQJv89BOYYzl1fZQoaAZoCWgPQwjEQxg/TatzQJSGlFKUaBVLr2gWR0Cb/UgqmTC+dX2UKGgGaAloD0MI06BoHgD3c0CUhpRSlGgVS7doFkdAm/2rlA/s3XV9lChoBmgJaA9DCKbtX1lp0HJAlIaUUpRoFUuHaBZHQJv/iMl1KXh1fZQoaAZoCWgPQwiiJCTSNnZxQJSGlFKUaBVLi2gWR0Cb/6uaF23bdX2UKGgGaAloD0MIoUeMnpsqc0CUhpRSlGgVS6doFkdAnAJxVAAyVXV9lChoBmgJaA9DCOQViJ4UcnJAlIaUUpRoFUusaBZHQJwCkfs/pt91fZQoaAZoCWgPQwje40wTdqVwQJSGlFKUaBVL3GgWR0CcAsXhfjS5dX2UKGgGaAloD0MIQbYsX5cEcUCUhpRSlGgVS5NoFkdAnAPnHvMKTnV9lChoBmgJaA9DCGSV0jM9t3FAlIaUUpRoFUuEaBZHQJwETaxoqTd1fZQoaAZoCWgPQwgp7Q2+sKdwQJSGlFKUaBVLoWgWR0CcBIeF+NLldX2UKGgGaAloD0MI3PKRlPQpcUCUhpRSlGgVS6toFkdAnASjK1XvIHV9lChoBmgJaA9DCPThWYJManNAlIaUUpRoFUuzaBZHQJwE0xmCiAV1fZQoaAZoCWgPQwhYObTItkNxQJSGlFKUaBVLn2gWR0CcBQMvAXVLdX2UKGgGaAloD0MIucFQh9Vic0CUhpRSlGgVS5BoFkdAnAV6asp5NXV9lChoBmgJaA9DCIVefxJfgXNAlIaUUpRoFUuxaBZHQJwFpyIYWLx1fZQoaAZoCWgPQwisqpffabxwQJSGlFKUaBVLk2gWR0CcBg9uxbB5dX2UKGgGaAloD0MI2V4Leq9rc0CUhpRSlGgVS6loFkdAnAfKhcqvvHV9lChoBmgJaA9DCGEyVTDqfnNAlIaUUpRoFUuiaBZHQJwJxWEK3NN1fZQoaAZoCWgPQwi8sgsG1x9yQJSGlFKUaBVLgGgWR0CcCjmXPZ7HdX2UKGgGaAloD0MIHqSnyGEJdECUhpRSlGgVS7loFkdAnAsUofCAMHV9lChoBmgJaA9DCKZ7ndTXFXJAlIaUUpRoFUuVaBZHQJwLa8CgbqB1fZQoaAZoCWgPQwgNjLysiQdzQJSGlFKUaBVLiWgWR0CcDGyH2ys0dX2UKGgGaAloD0MIqYdodIeocUCUhpRSlGgVS4ZoFkdAnA5KlDWsinV9lChoBmgJaA9DCL3faMeN7XJAlIaUUpRoFUu9aBZHQJwOpbiZOSJ1fZQoaAZoCWgPQwjAdjBiX+VxQJSGlFKUaBVLlWgWR0CcDxSJj2BbdX2UKGgGaAloD0MI2GX4T/fVckCUhpRSlGgVS61oFkdAnA9DNdJJ5HV9lChoBmgJaA9DCOup1VcXs3FAlIaUUpRoFUuoaBZHQJwPbWbwz+F1fZQoaAZoCWgPQwj5LqUu2X5yQJSGlFKUaBVLrGgWR0CcD8T5O8CgdX2UKGgGaAloD0MIaB8r+C1ncUCUhpRSlGgVS7RoFkdAnBAWbPQfIXV9lChoBmgJaA9DCMiZJmz/GHRAlIaUUpRoFUu2aBZHQJwQrUjLSu11fZQoaAZoCWgPQwhzucFQh9NxQJSGlFKUaBVLjGgWR0CcES7qIJqqdX2UKGgGaAloD0MIUb6ghQQLdECUhpRSlGgVS7hoFkdAnBIE8aGYbHV9lChoBmgJaA9DCLXf2omSGHNAlIaUUpRoFUuDaBZHQJwSbk1dgOV1fZQoaAZoCWgPQwhiaHVyxgZxQJSGlFKUaBVLiWgWR0CcE/4nF5v+dX2UKGgGaAloD0MIOpZ31UMgc0CUhpRSlGgVS6FoFkdAnBSqS9ugpXV9lChoBmgJaA9DCLPqc7UVq3FAlIaUUpRoFUufaBZHQJwVzctXgcd1fZQoaAZoCWgPQwg3p5IBoP5yQJSGlFKUaBVLqmgWR0CcF0u8scyWdX2UKGgGaAloD0MI5Gn5gavVb0CUhpRSlGgVS5FoFkdAnBfPDpC8e3V9lChoBmgJaA9DCFYrE35pt3JAlIaUUpRoFUukaBZHQJwYwO09hZ11fZQoaAZoCWgPQwgUzJiCdWdxQJSGlFKUaBVLnWgWR0CcGbSW7e2vdX2UKGgGaAloD0MICOdTx6qyc0CUhpRSlGgVS6NoFkdAnBpxJqZc9nV9lChoBmgJaA9DCKx0d51NcnRAlIaUUpRoFUuvaBZHQJwajuF6Avt1fZQoaAZoCWgPQwj0jH3JRnhyQJSGlFKUaBVLs2gWR0CcGo5lOGj9dX2UKGgGaAloD0MIMsnIWRg+cUCUhpRSlGgVS55oFkdAnBs/tD2JznV9lChoBmgJaA9DCJQUWAATQXJAlIaUUpRoFUuwaBZHQJwcCih37k51fZQoaAZoCWgPQwjGFRdHpRBxQJSGlFKUaBVLy2gWR0CcHGlrM1TBdX2UKGgGaAloD0MIPdF14cfIckCUhpRSlGgVS51oFkdAnBygVfu1GHV9lChoBmgJaA9DCBxhURHnB3JAlIaUUpRoFUuKaBZHQJwdFxm03Ox1ZS4="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 12756, "n_steps": 1024, "gamma": 0.999, "gae_lambda": 0.98, "ent_coef": 0.01, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 4, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWVwQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMRy9ob21lL21hcmt1cy9zcmMvYWkvc3RhYmxlLWJhc2VsaW5lczMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5RLgUMCBAGUjAN2YWyUhZQpdJRSlH2UKIwLX19wYWNrYWdlX1+UjBhzdGFibGVfYmFzZWxpbmVzMy5jb21tb26UjAhfX25hbWVfX5SMHnN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi51dGlsc5SMCF9fZmlsZV9flIxHL2hvbWUvbWFya3VzL3NyYy9haS9zdGFibGUtYmFzZWxpbmVzMy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUdU5OaACMEF9tYWtlX2VtcHR5X2NlbGyUk5QpUpSFlHSUUpSMHGNsb3VkcGlja2xlLmNsb3VkcGlja2xlX2Zhc3SUjBJfZnVuY3Rpb25fc2V0c3RhdGWUk5RoH32UfZQoaBZoDYwMX19xdWFsbmFtZV9flIwZY29uc3RhbnRfZm4uPGxvY2Fscz4uZnVuY5SMD19fYW5ub3RhdGlvbnNfX5R9lIwOX19rd2RlZmF1bHRzX1+UTowMX19kZWZhdWx0c19flE6MCl9fbW9kdWxlX1+UaBeMB19fZG9jX1+UTowLX19jbG9zdXJlX1+UaACMCl9tYWtlX2NlbGyUk5RHP8mZmZmZmZqFlFKUhZSMF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "system_info": {"OS": "Linux-5.15.52-gentoo-x86_64-x86_64-AMD_Ryzen_5_1600_Six-Core_Processor-with-glibc2.35 # 1 SMP Thu Jul 21 22:26:07 EDT 2022", "Python": "3.10.6", "Stable-Baselines3": "1.7.0", "PyTorch": "1.13.1+cu117", "GPU Enabled": "True", "Numpy": "1.23.1", "Gym": "0.21.0"}}
ppo-LunarLander-v2.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:54e0ad3ea67519d92cedf13a2d70994678fb0b24e3ffae5847ec09359540e1d8
3
  size 151853
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:87730f9f97bba8a2bb4dcf6b88bf7a5d66cab4f83452dd71deeba3811b6883f3
3
  size 151853
ppo-LunarLander-v2/data CHANGED
@@ -4,20 +4,20 @@
4
  ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
5
  "__module__": "stable_baselines3.common.policies",
6
  "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
7
- "__init__": "<function ActorCriticPolicy.__init__ at 0x7fb5e4879b40>",
8
- "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7fb5e4879bd0>",
9
- "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7fb5e4879c60>",
10
- "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7fb5e4879cf0>",
11
- "_build": "<function ActorCriticPolicy._build at 0x7fb5e4879d80>",
12
- "forward": "<function ActorCriticPolicy.forward at 0x7fb5e4879e10>",
13
- "extract_features": "<function ActorCriticPolicy.extract_features at 0x7fb5e4879ea0>",
14
- "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7fb5e4879f30>",
15
- "_predict": "<function ActorCriticPolicy._predict at 0x7fb5e4879fc0>",
16
- "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7fb5e487a050>",
17
- "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7fb5e487a0e0>",
18
- "predict_values": "<function ActorCriticPolicy.predict_values at 0x7fb5e487a170>",
19
  "__abstractmethods__": "frozenset()",
20
- "_abc_impl": "<_abc._abc_data object at 0x7fb5e486ef00>"
21
  },
22
  "verbose": 1,
23
  "policy_kwargs": {},
 
4
  ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
5
  "__module__": "stable_baselines3.common.policies",
6
  "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
7
+ "__init__": "<function ActorCriticPolicy.__init__ at 0x7f6a55b71b40>",
8
+ "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f6a55b71bd0>",
9
+ "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f6a55b71c60>",
10
+ "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f6a55b71cf0>",
11
+ "_build": "<function ActorCriticPolicy._build at 0x7f6a55b71d80>",
12
+ "forward": "<function ActorCriticPolicy.forward at 0x7f6a55b71e10>",
13
+ "extract_features": "<function ActorCriticPolicy.extract_features at 0x7f6a55b71ea0>",
14
+ "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f6a55b71f30>",
15
+ "_predict": "<function ActorCriticPolicy._predict at 0x7f6a55b71fc0>",
16
+ "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f6a55b72050>",
17
+ "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f6a55b720e0>",
18
+ "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f6a55b72170>",
19
  "__abstractmethods__": "frozenset()",
20
+ "_abc_impl": "<_abc._abc_data object at 0x7f6a56194540>"
21
  },
22
  "verbose": 1,
23
  "policy_kwargs": {},
replay.mp4 CHANGED
Binary files a/replay.mp4 and b/replay.mp4 differ
 
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 302.3929243866677, "std_reward": 17.319132157540256, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2023-02-12T15:12:49.399831"}
 
1
+ {"mean_reward": 308.4969563892229, "std_reward": 11.387259580061457, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2023-02-13T19:29:18.802571"}