HCNMonsch commited on
Commit
dfdb940
1 Parent(s): 7257040

Upload PPO LunarLander-v2 trained agent

Browse files
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: LunarLander-v2
17
  metrics:
18
  - type: mean_reward
19
- value: 207.81 +/- 21.89
20
  name: mean_reward
21
  verified: false
22
  ---
 
16
  type: LunarLander-v2
17
  metrics:
18
  - type: mean_reward
19
+ value: 279.30 +/- 14.01
20
  name: mean_reward
21
  verified: false
22
  ---
config.json CHANGED
@@ -1 +1 @@
1
- {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x783d0040f490>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x783d0040f520>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x783d0040f5b0>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x783d0040f640>", "_build": "<function ActorCriticPolicy._build at 0x783d0040f6d0>", "forward": "<function ActorCriticPolicy.forward at 0x783d0040f760>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x783d0040f7f0>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x783d0040f880>", "_predict": "<function ActorCriticPolicy._predict at 0x783d0040f910>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x783d0040f9a0>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x783d0040fa30>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x783d0040fac0>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x783d003b7f80>"}, "verbose": 1, "policy_kwargs": {}, "num_timesteps": 1001472, "_total_timesteps": 1000000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1694949260147168071, "learning_rate": 0.0003, "tensorboard_log": null, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVlQAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYgAAAAAAAAAEKCrr4tvqY+W4jYPT/cs73orN070AuWvAAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksBSwiGlIwBQ5R0lFKULg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdAAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYBAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSwGFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.0014719999999999178, "_stats_window_size": 100, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVRAwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQGsStwzch1WMAWyUTQgCjAF0lEdApGjKg5BC2XV9lChoBkfAPKeLJjlPrWgHTZ8BaAhHQKRqogDifg91fZQoaAZHQG3mAV45cTtoB00ZAmgIR0CkbFxAbADadX2UKGgGR0BuAWMQ2/BWaAdNswFoCEdApG7sVclgMXV9lChoBkfASheBvrGBF2gHTYsBaAhHQKRwK0fozN51fZQoaAZHQG67qQJXyRVoB03EAWgIR0Ckcapt78ekdX2UKGgGR0BqxvrfLs8gaAdNvQFoCEdApHMRzvJA+3V9lChoBkdAbVs0iyIHkmgHTd8BaAhHQKR1vXcxj8V1fZQoaAZHQG5HoKtxMnJoB02kAWgIR0Ckdw+O4oZydX2UKGgGR8A5eH9WIXTFaAdNeAFoCEdApHhIGyHEdnV9lChoBkdAa4XvBrN4aGgHTbgBaAhHQKR5oYcebNN1fZQoaAZHQG53fEn9ehRoB00JAmgIR0Cke0Rm9QGfdX2UKGgGR0BnMzxG2CumaAdNHgJoCEdApH4xZntfHHV9lChoBkdAay8xk/bCamgHTRICaAhHQKSAVgccU/R1fZQoaAZHQG1taT4cm0FoB03IAWgIR0CkgmBybQTmdX2UKGgGR0BtsqzZ6D5CaAdNMAJoCEdApIUIO4G2TnV9lChoBkdAa0iA93bEgmgHTSICaAhHQKSJJzDGcWl1fZQoaAZHQGUsWq1gH/toB02fAmgIR0Cki05eiSJTdX2UKGgGR0BwVv5KvmozaAdNugFoCEdApIyyjrRjSXV9lChoBkdAbZVTtsvZiGgHTfcBaAhHQKSOSgJ1JUZ1fZQoaAZHwBs8k2P1ct5oB020AWgIR0CkkPE1EVnFdX2UKGgGR0BuE03Mpw0gaAdNpwFoCEdApJJFYU34sXV9lChoBkdAbFar9VFQVWgHTQwCaAhHQKST6zZ6D5F1fZQoaAZHQGgn2ys0YTFoB03TAWgIR0CklXY+bExZdX2UKGgGR0Bpd92A5JbuaAdN+AFoCEdApJg+K8+Ro3V9lChoBkfAJzb2USqU/2gHTYoBaAhHQKSZgGUwBYF1fZQoaAZHwD+q9FnZkCpoB036AWgIR0CkmyPRRdhRdX2UKGgGR0BtlyUVzp5eaAdNHwJoCEdApJ0IIyCWeHV9lChoBkfAOOV+NLlFMWgHTSMCaAhHQKShPYODrZ91fZQoaAZHQG3Omvnr6cloB022AWgIR0Cko1q/ub7TdX2UKGgGR0BuQaMkyDZlaAdNsgFoCEdApKVtY2bXpXV9lChoBkdAbEc6XBxgiWgHTaoBaAhHQKSnDj7yhBZ1fZQoaAZHQGxnfvOQhfVoB03tAWgIR0CkqJ/V7Qb/dX2UKGgGR8A35s9SuQp4aAdNsQFoCEdApKtDsUqQR3V9lChoBkdAZZukIomXxGgHTTACaAhHQKStE9Pk7wN1fZQoaAZHwD5/jrAxi5NoB02cAWgIR0CkrmhJI1+BdX2UKGgGR0BtXg+r2g3+aAdN8QFoCEdApLADhisnzHV9lChoBkfAR8xUipvP1WgHTWsBaAhHQKSycCEHt4R1fZQoaAZHwEpUFHrhR65oB02WAWgIR0Cks7o3irDJdX2UKGgGR0BveIqEvkBCaAdN4gFoCEdApLU/UBnzx3V9lChoBkdAaLCbPQfIS2gHTfsBaAhHQKS23sKLKmt1fZQoaAZHQGwHODzyz5ZoB00RAmgIR0CkudIBzV+adX2UKGgGR0BrHL92ovSMaAdNEAJoCEdApLv/TRYzSHV9lChoBkdAa6TrQgLZz2gHTdIBaAhHQKS+IxKxs2x1fZQoaAZHQGyWFBY3eepoB00cAmgIR0CkwKT1schldX2UKGgGR0Bpgl/SYw7DaAdNOAJoCEdApMTdOKwY+HV9lChoBkdAb/BzQu27WmgHTcMBaAhHQKTGRZGrjo91fZQoaAZHQG39txlxwQ1oB021AWgIR0Ckx6WLP2PDdX2UKGgGR0BrVVhiLEUCaAdNSwJoCEdApMl+98JD3XV9lChoBkdAcCw5wwTM7mgHTcwBaAhHQKTK7wGW2PV1fZQoaAZHQGiw1BMSK3xoB03iAWgIR0CkzbWOhkAhdX2UKGgGR0BsK0CcPOIJaAdNNQJoCEdApM+CGzru6XV9lChoBkdAa+W4BmwqzGgHTeoBaAhHQKTRDSG8Emp1fZQoaAZHQGN9nWBjFydoB00pAmgIR0Ck1AsijcmCdX2UKGgGR0BYH/z8P4EfaAdN6ANoCEdApNc6JVKf4HV9lChoBkdAZ2GpI+W4VmgHTccCaAhHQKTZ5KxLTQV1fZQoaAZHwE21sMy8BdVoB01tAWgIR0Ck3VJYs/Y8dX2UKGgGR0Bvps92X9iuaAdN4wFoCEdApN+UGFBY3nV9lChoBkdAawfoHs1KoWgHTfYBaAhHQKTh/mapgkV1fZQoaAZHQEjE8274BWBoB03oA2gIR0Ck5VUDlo12dX2UKGgGR0BsQAmiQDFIaAdNFAJoCEdApOgxrLyMDXV9lChoBkdAbshHPu5SWWgHTaMBaAhHQKTpgE+Pikx1fZQoaAZHQGfWQ9q1w5xoB03oAWgIR0Ck6xq0MPSVdX2UKGgGR0BrWnGp++dtaAdNKQJoCEdApOzc5U96knV9lChoBkdAboXy7PIGQmgHTcoBaAhHQKTvjJpWV/t1fZQoaAZHQG1bgSnLq2VoB02qAWgIR0Ck8OfIsAeadX2UKGgGR0BswlfiPyTZaAdNlAJoCEdApPL9yvLX+XV9lChoBkdAavucsDnvD2gHTZgBaAhHQKT0R0voNd91fZQoaAZHQGvrDJEH+qBoB03/AWgIR0Ck91qUVzp5dX2UKGgGR0BbSXzlLeyiaAdNVgJoCEdApPndcGC7LHV9lChoBkdAaB5ffGdZq2gHTbwBaAhHQKT79EtNBWx1fZQoaAZHQGtQeJYT0xxoB03WAWgIR0Ck/h++/QBxdX2UKGgGR0BvRX0oScslaAdNjgFoCEdApQFOMyad+XV9lChoBkdAbbVTMqz7dmgHTagBaAhHQKUCpWVeKKp1fZQoaAZHQGyoSf+S8rZoB02qAWgIR0ClA/EleF+NdX2UKGgGR0BuupX8wYceaAdNpgFoCEdApQVEUAT7EnV9lChoBkdAF9D7655JLGgHTUMBaAhHQKUGSKbayrx1fZQoaAZHQHAzH4CZF5RoB02iAWgIR0ClCMZu63AmdX2UKGgGR0BwIuq3mV7haAdNhgFoCEdApQn2O0b963V9lChoBkfAMo+DrZ8KHGgHTUcBaAhHQKUK9/iHZbp1fZQoaAZHQGzVZiuuA7RoB01JAmgIR0ClDM1/DtPYdX2UKGgGR0BwaFQSBbwCaAdNwAFoCEdApQ41V3ljmXV9lChoBkdAavMdRzijtWgHTTICaAhHQKUROpEQXhx1fZQoaAZHQGkRB5HEuQJoB03TAWgIR0ClErwID5j6dX2UKGgGR0Bt2cbiqABlaAdNgwFoCEdApRQHRsuWbHV9lChoBkdAayiJx//ecmgHTZsBaAhHQKUVtbJOnEV1fZQoaAZHwFGJVAAyVOdoB035AWgIR0ClGdLX18LKdX2UKGgGR0Bpl7qSowVTaAdNLQJoCEdApRyJd8iOenV9lChoBkdAbgg4rjHXE2gHTaUBaAhHQKUeil7+kxh1fZQoaAZHQGPiKkM1CPZoB02mA2gIR0ClIs2GIsRQdX2UKGgGR0BwmnHwPRReaAdNpgFoCEdApSQX+ZPVNHV9lChoBkdAa1QUBXCCSWgHTWsCaAhHQKUl/F4LThJ1fZQoaAZHQHALwHqu8sdoB02kAWgIR0ClJ1K9f1HwdX2UKGgGR0BnD9bor4FiaAdN+gFoCEdApSj70J4SpXV9lChoBkdAaeURSP2f02gHTeIBaAhHQKUrsEyLyc11fZQoaAZHQGlp/i5uqFRoB000A2gIR0ClLkhIFvAHdX2UKGgGR0Btx3Vsk6cRaAdNeAJoCEdApTBOUnogWHV9lChoBkdAbIJ21UlzEWgHTZcBaAhHQKUzB+GXXy11fZQoaAZHQHBgXQD3dsVoB02rAWgIR0ClNNJrtVrAdX2UKGgGR0BexxZ+x4Y8aAdN6ANoCEdApTmX6TGHYnVlLg=="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 2152, "observation_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVcAIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWCAAAAAAAAAABAQEBAQEBAZRoB4wCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoECiWCAAAAAAAAAABAQEBAQEBAZRoFEsIhZRoGHSUUpSMBl9zaGFwZZRLCIWUjANsb3eUaBAoliAAAAAAAAAAAAC0wgAAtMIAAKDAAACgwNsPScAAAKDAAAAAgAAAAICUaApLCIWUaBh0lFKUjARoaWdolGgQKJYgAAAAAAAAAAAAtEIAALRCAACgQAAAoEDbD0lAAACgQAAAgD8AAIA/lGgKSwiFlGgYdJRSlIwIbG93X3JlcHKUjFtbLTkwLiAgICAgICAgLTkwLiAgICAgICAgIC01LiAgICAgICAgIC01LiAgICAgICAgIC0zLjE0MTU5MjcgIC01LgogIC0wLiAgICAgICAgIC0wLiAgICAgICBdlIwJaGlnaF9yZXBylIxTWzkwLiAgICAgICAgOTAuICAgICAgICAgNS4gICAgICAgICA1LiAgICAgICAgIDMuMTQxNTkyNyAgNS4KICAxLiAgICAgICAgIDEuICAgICAgIF2UjApfbnBfcmFuZG9tlE51Yi4=", "dtype": "float32", "bounded_below": "[ True True True True True True True True]", "bounded_above": "[ True True True True True True True True]", "_shape": [8], "low": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "low_repr": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high_repr": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "_np_random": null}, "action_space": {":type:": "<class 'gymnasium.spaces.discrete.Discrete'>", ":serialized:": "gAWV1QAAAAAAAACMGWd5bW5hc2l1bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIBAAAAAAAAACUhpRSlIwFc3RhcnSUaAhoDkMIAAAAAAAAAACUhpRSlIwGX3NoYXBllCloCmgOjApfbnBfcmFuZG9tlE51Yi4=", "n": "4", "start": "0", "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 1, "n_steps": 2048, "gamma": 0.999, "gae_lambda": 0.95, "ent_coef": 0.0, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 4, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz/JmZmZmZmahZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz8zqSowVTJhhZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "system_info": {"OS": "Linux-5.15.109+-x86_64-with-glibc2.35 # 1 SMP Fri Jun 9 10:57:30 UTC 2023", "Python": "3.10.12", "Stable-Baselines3": "2.0.0a5", "PyTorch": "2.0.1+cu118", "GPU Enabled": "True", "Numpy": "1.23.5", "Cloudpickle": "2.2.1", "Gymnasium": "0.28.1", "OpenAI Gym": "0.25.2"}}
 
1
+ {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7b01f8e7fe20>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7b01f8e7feb0>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7b01f8e7ff40>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7b01f8e90040>", "_build": "<function ActorCriticPolicy._build at 0x7b01f8e900d0>", "forward": "<function ActorCriticPolicy.forward at 0x7b01f8e90160>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x7b01f8e901f0>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7b01f8e90280>", "_predict": "<function ActorCriticPolicy._predict at 0x7b01f8e90310>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7b01f8e903a0>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7b01f8e90430>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7b01f8e904c0>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7b01f8e94180>"}, "verbose": 1, "policy_kwargs": {}, "num_timesteps": 1507328, "_total_timesteps": 1500000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1697312316969903183, "learning_rate": 0.0003, "tensorboard_log": null, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAM1I9zz4AYE8IUK6vcutg75A3re9oCuqvQAAAAAAAAAA5vVivfZwcbpCPRk5AOxKswfe67pWhy+4AACAPwAAgD8Ax4C9zI9HPwYFiL2C2ta+jQ3BvGdvoTwAAAAAAAAAALqGLr4BDCs+nrk1Pt/3ZL5FKgC9fwYQvQAAAAAAAAAAtSeEvjgbcT+VxuO+52UIv5sPrL4qZwe+AAAAAAAAAAAa3UW++jrmPs40wT11mLK+m/o2vspE4z0AAAAAAAAAAObokD64Glg/AngGPYmE/L5EuGY+JZXNvQAAAAAAAAAAZi1MPi636LwmpJM7Z2Azun81Tb7aagi7AACAPwAAgD8AFyI9KZh+urV/MrRnOAwwVHW6uSZ3nTMAAIA/AACAP5pPDTwrbII9omW7vVcQPr5cCFa9JgL9PAAAAAAAAAAAmhfRPIjEoT09Ztu5cG5DvqdAg7w19is9AAAAAAAAAACjU+O+54M2P3tMBT7D5PS+ykaZvmJSXT4AAAAAAAAAAJbBb75Uf7g+yPF9Pp/3g76I8Za8sCP3PQAAAAAAAAAAQzlUvvGNND7maoE+pzuPvgSPTbyOID49AAAAAAAAAADmkOm9uQzqPgmjqLxSqZu+SIubvURcEb0AAAAAAAAAAJqgvDx9ccQ+TUOqvU2FY763Erw7nYD/OAAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.004885333333333408, "_stats_window_size": 100, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVEQwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQHMMpm/WUbGMAWyUTSEBjAF0lEdAnSsPDxb0OHV9lChoBkdAcHI8+zMRpWgHTRIBaAhHQJ0rOwyIpH91fZQoaAZHQElGnUlRgqpoB0vBaAhHQJ0rsvnKW9l1fZQoaAZHQHEpNOqNp/RoB00IAWgIR0CdK/Rm9QGfdX2UKGgGR0Bx/dffGdZraAdL72gIR0CdLAM98qnWdX2UKGgGR0BxkMJY1YQraAdL8WgIR0CdLQPqs2ehdX2UKGgGR0BSQD/EOy3TaAdLvGgIR0CdLcKzAvcrdX2UKGgGR0ByCcAIY3vQaAdL+2gIR0CdLfqRlpXZdX2UKGgGR0Bvx6Uqx1PnaAdNFAFoCEdAnS4I/Vy3kXV9lChoBkdAcE+ZxrBTGmgHTQ4BaAhHQJ0uR8CxNZh1fZQoaAZHQHD5mh7E5yVoB0vuaAhHQJ0vOMCLdep1fZQoaAZHQFKiCY1He8BoB0vBaAhHQJ0wvVJ+UhV1fZQoaAZHQHGgU0elsP9oB00SAWgIR0CdMRA7xNItdX2UKGgGR0BxP7dXT3IuaAdNCgFoCEdAnTI3mRvFWHV9lChoBkdAcA0mhM8HOmgHTQQBaAhHQJ0ysyZa3Zx1fZQoaAZHQHC8Bc/t6X1oB00XAWgIR0CdMximVJL/dX2UKGgGR0BxDAp3HJcPaAdNJAFoCEdAnTM7f+CK8HV9lChoBkdAcpvooNNJv2gHS/VoCEdAnTOHyup0fnV9lChoBkdAcTcdCE6DG2gHTQIBaAhHQJ0z497ngYR1fZQoaAZHQHEv1hgE2YRoB00oAWgIR0CdM+KaXrt3dX2UKGgGR0Bx4kTIvJzUaAdL4GgIR0CdNEbH6uW9dX2UKGgGR0BzIc/B3zMBaAdNQgFoCEdAnTR0C7sfJXV9lChoBkdAcSpGEf1YhmgHS+poCEdAnTWIGyHEdnV9lChoBkdAb80QRPGhmGgHS/JoCEdAnTYk9t/FznV9lChoBkdAchWoG6f8M2gHS/loCEdAnTZJsGgSOHV9lChoBkdAcWFyVfNRnGgHTRgBaAhHQJ03zv+fh/B1fZQoaAZHQHEVtoSL61toB00UAWgIR0CdOR3iJfpmdX2UKGgGR0BxhMGRmseXaAdNAwFoCEdAnTqJ31SOznV9lChoBkdAcDUnfl6qsGgHS95oCEdAnTr1fE4vOHV9lChoBkdAc8H9y925hGgHTQoBaAhHQJ07K4Ajps51fZQoaAZHQG0T+F10T11oB0vuaAhHQJ07+tjkMkR1fZQoaAZHQHLr3yd4FA5oB00FAWgIR0CdPCcBU70WdX2UKGgGR0Bvqi7Ackt3aAdL32gIR0CdPDsCDEm6dX2UKGgGR0BtZt5nlGPQaAdL/mgIR0CdPQgmqo60dX2UKGgGR0BvyfPiT+vRaAdL+2gIR0CdPU+PzWf9dX2UKGgGR0BVUo4yXUpeaAdL7GgIR0CdPWmrsByTdX2UKGgGR0BzOCF/QSi/aAdNFAFoCEdAnT2WNipeeHV9lChoBkdAcqYHPeHi32gHTQABaAhHQJ095Q9A5aN1fZQoaAZHQG8PhqCYkVxoB0vjaAhHQJ0+2IbfgrJ1fZQoaAZHQHDjzXSSeRRoB0vjaAhHQJ0/AuSOinJ1fZQoaAZHQHDl9K/VRUFoB0v5aAhHQJ0+/v2GqPx1fZQoaAZHQHFvg7gbZOBoB00ZAWgIR0CdU849ovi+dX2UKGgGR0BxZoFRpDeCaAdL6mgIR0CdVF+FUQ05dX2UKGgGR0Bt1IfEGZ/kaAdL+GgIR0CdVRGahHskdX2UKGgGR0BwBwuVX3g2aAdL92gIR0CdVTByjpLVdX2UKGgGR0BxRS6DoQnQaAdNNAFoCEdAnVWcpLEk0XV9lChoBkdAcD316E8JU2gHTQEBaAhHQJ1WLqUu+RJ1fZQoaAZHQG7csspXp4doB00FAWgIR0CdVi8qnWJ8dX2UKGgGR0Bxfoe6qbSaaAdL4mgIR0CdVj5AyEcsdX2UKGgGR0BzLoJ+lTFVaAdNBAFoCEdAnVZRZU1hs3V9lChoBkdAcEJedkJ8fGgHS/ZoCEdAnVaw44p+dHV9lChoBkdAbTzoVVPva2gHTQABaAhHQJ1WwXm/3391fZQoaAZHQG+sxZEDyOJoB0v+aAhHQJ1XRufmLcd1fZQoaAZHQG8BJkGzKLdoB0vjaAhHQJ1XTOKO1fF1fZQoaAZHQHAqXVsk6cRoB0vraAhHQJ1Xi9lEqlR1fZQoaAZHQHCY9q1w5vNoB00GAWgIR0CdWDFgDzRQdX2UKGgGR0BzH1yyUs4DaAdNNwFoCEdAnVhXEQ5FPXV9lChoBkdAbbhS+g13uGgHTQIBaAhHQJ1abX+VC5V1fZQoaAZHQHJdJHNHH3loB00NAWgIR0CdW1Lux8lYdX2UKGgGR0BwN/sF+uvEaAdNAQFoCEdAnVvQOnVG1HV9lChoBkdAb6HZcLSeAmgHTQQBaAhHQJ1cY5n13+x1fZQoaAZHQHFGstsenydoB0vvaAhHQJ1ce8274BV1fZQoaAZHQHDGUAggX/JoB0v3aAhHQJ1clINEw351fZQoaAZHQG8R5dWyTpxoB00mAWgIR0CdXN/A0sOHdX2UKGgGR0Bzj5br1M/RaAdNDgFoCEdAnV1IoZydWnV9lChoBkdAcLzwH7gsLGgHTRQBaAhHQJ1dZudf9gp1fZQoaAZHQHCaoDxLCepoB0vbaAhHQJ1dZlum78N1fZQoaAZHQHIuuHN5dGBoB00JAWgIR0CdXbIeYD1XdX2UKGgGR0ByFWIwdsBRaAdL+mgIR0CdXeRV6u4gdX2UKGgGR0By/swAU+LWaAdNJgFoCEdAnV5OFg2If3V9lChoBkdAcivkrPMSsmgHTRkBaAhHQJ1ej7Ikqtp1fZQoaAZHQHCmlhLGrCFoB00SAWgIR0CdX0xdY4hmdX2UKGgGR0ByTYK/mDDkaAdNDAFoCEdAnV9UK3NLUXV9lChoBkdAcnW/J/5Ly2gHS+JoCEdAnWE2ldkauXV9lChoBkdAcUsq7yxzJmgHS91oCEdAnWGFHWjGk3V9lChoBkdAboE5OJtSAGgHS/ZoCEdAnWLH2dupCXV9lChoBkdAcmh2ZRbbDmgHS/BoCEdAnWLHLRrrPnV9lChoBkdAcZeu3trsSmgHS/1oCEdAnWMVE/jbSXV9lChoBkdAbxXesxO+I2gHS+BoCEdAnWMtxMnJDHV9lChoBkdAce94+KTB7GgHS/1oCEdAnWN6WHDaXnV9lChoBkdAcUi9aEBbOmgHS/toCEdAnWP1DKHO8nV9lChoBkdAcbwuzQeFL2gHS/VoCEdAnWQc6/7BPHV9lChoBkdAb7fw6ySmqGgHS/ZoCEdAnWRhbKRuCXV9lChoBkdAcgMkcS5AhWgHTQ0BaAhHQJ1kX+ee4Cp1fZQoaAZHQGzQQsGxD9hoB0v/aAhHQJ1lAn9ehPF1fZQoaAZHQHAB0jX4CZFoB00FAWgIR0CdZW0Re1KHdX2UKGgGR0ByeHo4dZJTaAdNBAFoCEdAnWYzUd7v5XV9lChoBkdAb/Pu7YkE92gHS/doCEdAnWf4Q4CIUXV9lChoBkdAcINSh8IAwWgHTUoBaAhHQJ1oNmHxjKB1fZQoaAZHQHGO6pLmITJoB00GAWgIR0CdaMDnNgSfdX2UKGgGR0BwpR5v99+gaAdL+mgIR0CdabBtDUmVdX2UKGgGR0By8c4CIUJwaAdL/WgIR0CdacoP07KadX2UKGgGR0Bumjxsl9jPaAdNAwFoCEdAnWpNlNDc/XV9lChoBkdAcQ4t+CsfaGgHTQYBaAhHQJ1qfxRVIZt1fZQoaAZHQHEYQDFId2hoB0v3aAhHQJ1q3jvNNah1fZQoaAZHQHC94yTINmVoB00KAWgIR0CdavGjsUqQdX2UKGgGR0BwCrRplBhQaAdL72gIR0CdawzLOiWWdX2UKGgGR0BwZgJC0F8paAdNAAFoCEdAnWtAEIPbwnV9lChoBkdAc48xvNu+AWgHS+BoCEdAnWtbE9+w1XV9lChoBkdAbpgSZjQRgGgHS/JoCEdAnWw8EA5q/XVlLg=="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 397, "observation_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVcAIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWCAAAAAAAAAABAQEBAQEBAZRoB4wCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoECiWCAAAAAAAAAABAQEBAQEBAZRoFEsIhZRoGHSUUpSMBl9zaGFwZZRLCIWUjANsb3eUaBAoliAAAAAAAAAAAAC0wgAAtMIAAKDAAACgwNsPScAAAKDAAAAAgAAAAICUaApLCIWUaBh0lFKUjARoaWdolGgQKJYgAAAAAAAAAAAAtEIAALRCAACgQAAAoEDbD0lAAACgQAAAgD8AAIA/lGgKSwiFlGgYdJRSlIwIbG93X3JlcHKUjFtbLTkwLiAgICAgICAgLTkwLiAgICAgICAgIC01LiAgICAgICAgIC01LiAgICAgICAgIC0zLjE0MTU5MjcgIC01LgogIC0wLiAgICAgICAgIC0wLiAgICAgICBdlIwJaGlnaF9yZXBylIxTWzkwLiAgICAgICAgOTAuICAgICAgICAgNS4gICAgICAgICA1LiAgICAgICAgIDMuMTQxNTkyNyAgNS4KICAxLiAgICAgICAgIDEuICAgICAgIF2UjApfbnBfcmFuZG9tlE51Yi4=", "dtype": "float32", "bounded_below": "[ True True True True True True True True]", "bounded_above": "[ True True True True True True True True]", "_shape": [8], "low": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "low_repr": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high_repr": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "_np_random": null}, "action_space": {":type:": "<class 'gymnasium.spaces.discrete.Discrete'>", ":serialized:": "gAWV1QAAAAAAAACMGWd5bW5hc2l1bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIBAAAAAAAAACUhpRSlIwFc3RhcnSUaAhoDkMIAAAAAAAAAACUhpRSlIwGX3NoYXBllCloCmgOjApfbnBfcmFuZG9tlE51Yi4=", "n": "4", "start": "0", "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 16, "n_steps": 1024, "gamma": 0.999, "gae_lambda": 0.98, "ent_coef": 0.01, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 4, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz/JmZmZmZmahZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz8zqSowVTJhhZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "system_info": {"OS": "Linux-5.15.120+-x86_64-with-glibc2.35 # 1 SMP Wed Aug 30 11:19:59 UTC 2023", "Python": "3.10.12", "Stable-Baselines3": "2.0.0a5", "PyTorch": "2.0.1+cu118", "GPU Enabled": "True", "Numpy": "1.23.5", "Cloudpickle": "2.2.1", "Gymnasium": "0.28.1", "OpenAI Gym": "0.25.2"}}
ppo-LunarLander-v2.zip ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:963d73f14cc16838fa1b3fef671f64180dda2ac7aaef2e757abae21d16e6efcd
3
+ size 146691
ppo-LunarLander-v2/_stable_baselines3_version ADDED
@@ -0,0 +1 @@
 
 
1
+ 2.0.0a5
ppo-LunarLander-v2/data ADDED
@@ -0,0 +1,99 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "policy_class": {
3
+ ":type:": "<class 'abc.ABCMeta'>",
4
+ ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
5
+ "__module__": "stable_baselines3.common.policies",
6
+ "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
7
+ "__init__": "<function ActorCriticPolicy.__init__ at 0x7b01f8e7fe20>",
8
+ "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7b01f8e7feb0>",
9
+ "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7b01f8e7ff40>",
10
+ "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7b01f8e90040>",
11
+ "_build": "<function ActorCriticPolicy._build at 0x7b01f8e900d0>",
12
+ "forward": "<function ActorCriticPolicy.forward at 0x7b01f8e90160>",
13
+ "extract_features": "<function ActorCriticPolicy.extract_features at 0x7b01f8e901f0>",
14
+ "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7b01f8e90280>",
15
+ "_predict": "<function ActorCriticPolicy._predict at 0x7b01f8e90310>",
16
+ "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7b01f8e903a0>",
17
+ "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7b01f8e90430>",
18
+ "predict_values": "<function ActorCriticPolicy.predict_values at 0x7b01f8e904c0>",
19
+ "__abstractmethods__": "frozenset()",
20
+ "_abc_impl": "<_abc._abc_data object at 0x7b01f8e94180>"
21
+ },
22
+ "verbose": 1,
23
+ "policy_kwargs": {},
24
+ "num_timesteps": 1507328,
25
+ "_total_timesteps": 1500000,
26
+ "_num_timesteps_at_start": 0,
27
+ "seed": null,
28
+ "action_noise": null,
29
+ "start_time": 1697312316969903183,
30
+ "learning_rate": 0.0003,
31
+ "tensorboard_log": null,
32
+ "_last_obs": {
33
+ ":type:": "<class 'numpy.ndarray'>",
34
+ ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAM1I9zz4AYE8IUK6vcutg75A3re9oCuqvQAAAAAAAAAA5vVivfZwcbpCPRk5AOxKswfe67pWhy+4AACAPwAAgD8Ax4C9zI9HPwYFiL2C2ta+jQ3BvGdvoTwAAAAAAAAAALqGLr4BDCs+nrk1Pt/3ZL5FKgC9fwYQvQAAAAAAAAAAtSeEvjgbcT+VxuO+52UIv5sPrL4qZwe+AAAAAAAAAAAa3UW++jrmPs40wT11mLK+m/o2vspE4z0AAAAAAAAAAObokD64Glg/AngGPYmE/L5EuGY+JZXNvQAAAAAAAAAAZi1MPi636LwmpJM7Z2Azun81Tb7aagi7AACAPwAAgD8AFyI9KZh+urV/MrRnOAwwVHW6uSZ3nTMAAIA/AACAP5pPDTwrbII9omW7vVcQPr5cCFa9JgL9PAAAAAAAAAAAmhfRPIjEoT09Ztu5cG5DvqdAg7w19is9AAAAAAAAAACjU+O+54M2P3tMBT7D5PS+ykaZvmJSXT4AAAAAAAAAAJbBb75Uf7g+yPF9Pp/3g76I8Za8sCP3PQAAAAAAAAAAQzlUvvGNND7maoE+pzuPvgSPTbyOID49AAAAAAAAAADmkOm9uQzqPgmjqLxSqZu+SIubvURcEb0AAAAAAAAAAJqgvDx9ccQ+TUOqvU2FY763Erw7nYD/OAAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="
35
+ },
36
+ "_last_episode_starts": {
37
+ ":type:": "<class 'numpy.ndarray'>",
38
+ ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="
39
+ },
40
+ "_last_original_obs": null,
41
+ "_episode_num": 0,
42
+ "use_sde": false,
43
+ "sde_sample_freq": -1,
44
+ "_current_progress_remaining": -0.004885333333333408,
45
+ "_stats_window_size": 100,
46
+ "ep_info_buffer": {
47
+ ":type:": "<class 'collections.deque'>",
48
+ ":serialized:": "gAWVEQwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQHMMpm/WUbGMAWyUTSEBjAF0lEdAnSsPDxb0OHV9lChoBkdAcHI8+zMRpWgHTRIBaAhHQJ0rOwyIpH91fZQoaAZHQElGnUlRgqpoB0vBaAhHQJ0rsvnKW9l1fZQoaAZHQHEpNOqNp/RoB00IAWgIR0CdK/Rm9QGfdX2UKGgGR0Bx/dffGdZraAdL72gIR0CdLAM98qnWdX2UKGgGR0BxkMJY1YQraAdL8WgIR0CdLQPqs2ehdX2UKGgGR0BSQD/EOy3TaAdLvGgIR0CdLcKzAvcrdX2UKGgGR0ByCcAIY3vQaAdL+2gIR0CdLfqRlpXZdX2UKGgGR0Bvx6Uqx1PnaAdNFAFoCEdAnS4I/Vy3kXV9lChoBkdAcE+ZxrBTGmgHTQ4BaAhHQJ0uR8CxNZh1fZQoaAZHQHD5mh7E5yVoB0vuaAhHQJ0vOMCLdep1fZQoaAZHQFKiCY1He8BoB0vBaAhHQJ0wvVJ+UhV1fZQoaAZHQHGgU0elsP9oB00SAWgIR0CdMRA7xNItdX2UKGgGR0BxP7dXT3IuaAdNCgFoCEdAnTI3mRvFWHV9lChoBkdAcA0mhM8HOmgHTQQBaAhHQJ0ysyZa3Zx1fZQoaAZHQHC8Bc/t6X1oB00XAWgIR0CdMximVJL/dX2UKGgGR0BxDAp3HJcPaAdNJAFoCEdAnTM7f+CK8HV9lChoBkdAcpvooNNJv2gHS/VoCEdAnTOHyup0fnV9lChoBkdAcTcdCE6DG2gHTQIBaAhHQJ0z497ngYR1fZQoaAZHQHEv1hgE2YRoB00oAWgIR0CdM+KaXrt3dX2UKGgGR0Bx4kTIvJzUaAdL4GgIR0CdNEbH6uW9dX2UKGgGR0BzIc/B3zMBaAdNQgFoCEdAnTR0C7sfJXV9lChoBkdAcSpGEf1YhmgHS+poCEdAnTWIGyHEdnV9lChoBkdAb80QRPGhmGgHS/JoCEdAnTYk9t/FznV9lChoBkdAchWoG6f8M2gHS/loCEdAnTZJsGgSOHV9lChoBkdAcWFyVfNRnGgHTRgBaAhHQJ03zv+fh/B1fZQoaAZHQHEVtoSL61toB00UAWgIR0CdOR3iJfpmdX2UKGgGR0BxhMGRmseXaAdNAwFoCEdAnTqJ31SOznV9lChoBkdAcDUnfl6qsGgHS95oCEdAnTr1fE4vOHV9lChoBkdAc8H9y925hGgHTQoBaAhHQJ07K4Ajps51fZQoaAZHQG0T+F10T11oB0vuaAhHQJ07+tjkMkR1fZQoaAZHQHLr3yd4FA5oB00FAWgIR0CdPCcBU70WdX2UKGgGR0Bvqi7Ackt3aAdL32gIR0CdPDsCDEm6dX2UKGgGR0BtZt5nlGPQaAdL/mgIR0CdPQgmqo60dX2UKGgGR0BvyfPiT+vRaAdL+2gIR0CdPU+PzWf9dX2UKGgGR0BVUo4yXUpeaAdL7GgIR0CdPWmrsByTdX2UKGgGR0BzOCF/QSi/aAdNFAFoCEdAnT2WNipeeHV9lChoBkdAcqYHPeHi32gHTQABaAhHQJ095Q9A5aN1fZQoaAZHQG8PhqCYkVxoB0vjaAhHQJ0+2IbfgrJ1fZQoaAZHQHDjzXSSeRRoB0vjaAhHQJ0/AuSOinJ1fZQoaAZHQHDl9K/VRUFoB0v5aAhHQJ0+/v2GqPx1fZQoaAZHQHFvg7gbZOBoB00ZAWgIR0CdU849ovi+dX2UKGgGR0BxZoFRpDeCaAdL6mgIR0CdVF+FUQ05dX2UKGgGR0Bt1IfEGZ/kaAdL+GgIR0CdVRGahHskdX2UKGgGR0BwBwuVX3g2aAdL92gIR0CdVTByjpLVdX2UKGgGR0BxRS6DoQnQaAdNNAFoCEdAnVWcpLEk0XV9lChoBkdAcD316E8JU2gHTQEBaAhHQJ1WLqUu+RJ1fZQoaAZHQG7csspXp4doB00FAWgIR0CdVi8qnWJ8dX2UKGgGR0Bxfoe6qbSaaAdL4mgIR0CdVj5AyEcsdX2UKGgGR0BzLoJ+lTFVaAdNBAFoCEdAnVZRZU1hs3V9lChoBkdAcEJedkJ8fGgHS/ZoCEdAnVaw44p+dHV9lChoBkdAbTzoVVPva2gHTQABaAhHQJ1WwXm/3391fZQoaAZHQG+sxZEDyOJoB0v+aAhHQJ1XRufmLcd1fZQoaAZHQG8BJkGzKLdoB0vjaAhHQJ1XTOKO1fF1fZQoaAZHQHAqXVsk6cRoB0vraAhHQJ1Xi9lEqlR1fZQoaAZHQHCY9q1w5vNoB00GAWgIR0CdWDFgDzRQdX2UKGgGR0BzH1yyUs4DaAdNNwFoCEdAnVhXEQ5FPXV9lChoBkdAbbhS+g13uGgHTQIBaAhHQJ1abX+VC5V1fZQoaAZHQHJdJHNHH3loB00NAWgIR0CdW1Lux8lYdX2UKGgGR0BwN/sF+uvEaAdNAQFoCEdAnVvQOnVG1HV9lChoBkdAb6HZcLSeAmgHTQQBaAhHQJ1cY5n13+x1fZQoaAZHQHFGstsenydoB0vvaAhHQJ1ce8274BV1fZQoaAZHQHDGUAggX/JoB0v3aAhHQJ1clINEw351fZQoaAZHQG8R5dWyTpxoB00mAWgIR0CdXN/A0sOHdX2UKGgGR0Bzj5br1M/RaAdNDgFoCEdAnV1IoZydWnV9lChoBkdAcLzwH7gsLGgHTRQBaAhHQJ1dZudf9gp1fZQoaAZHQHCaoDxLCepoB0vbaAhHQJ1dZlum78N1fZQoaAZHQHIuuHN5dGBoB00JAWgIR0CdXbIeYD1XdX2UKGgGR0ByFWIwdsBRaAdL+mgIR0CdXeRV6u4gdX2UKGgGR0By/swAU+LWaAdNJgFoCEdAnV5OFg2If3V9lChoBkdAcivkrPMSsmgHTRkBaAhHQJ1ej7Ikqtp1fZQoaAZHQHCmlhLGrCFoB00SAWgIR0CdX0xdY4hmdX2UKGgGR0ByTYK/mDDkaAdNDAFoCEdAnV9UK3NLUXV9lChoBkdAcnW/J/5Ly2gHS+JoCEdAnWE2ldkauXV9lChoBkdAcUsq7yxzJmgHS91oCEdAnWGFHWjGk3V9lChoBkdAboE5OJtSAGgHS/ZoCEdAnWLH2dupCXV9lChoBkdAcmh2ZRbbDmgHS/BoCEdAnWLHLRrrPnV9lChoBkdAcZeu3trsSmgHS/1oCEdAnWMVE/jbSXV9lChoBkdAbxXesxO+I2gHS+BoCEdAnWMtxMnJDHV9lChoBkdAce94+KTB7GgHS/1oCEdAnWN6WHDaXnV9lChoBkdAcUi9aEBbOmgHS/toCEdAnWP1DKHO8nV9lChoBkdAcbwuzQeFL2gHS/VoCEdAnWQc6/7BPHV9lChoBkdAb7fw6ySmqGgHS/ZoCEdAnWRhbKRuCXV9lChoBkdAcgMkcS5AhWgHTQ0BaAhHQJ1kX+ee4Cp1fZQoaAZHQGzQQsGxD9hoB0v/aAhHQJ1lAn9ehPF1fZQoaAZHQHAB0jX4CZFoB00FAWgIR0CdZW0Re1KHdX2UKGgGR0ByeHo4dZJTaAdNBAFoCEdAnWYzUd7v5XV9lChoBkdAb/Pu7YkE92gHS/doCEdAnWf4Q4CIUXV9lChoBkdAcINSh8IAwWgHTUoBaAhHQJ1oNmHxjKB1fZQoaAZHQHGO6pLmITJoB00GAWgIR0CdaMDnNgSfdX2UKGgGR0BwpR5v99+gaAdL+mgIR0CdabBtDUmVdX2UKGgGR0By8c4CIUJwaAdL/WgIR0CdacoP07KadX2UKGgGR0Bumjxsl9jPaAdNAwFoCEdAnWpNlNDc/XV9lChoBkdAcQ4t+CsfaGgHTQYBaAhHQJ1qfxRVIZt1fZQoaAZHQHEYQDFId2hoB0v3aAhHQJ1q3jvNNah1fZQoaAZHQHC94yTINmVoB00KAWgIR0CdavGjsUqQdX2UKGgGR0BwCrRplBhQaAdL72gIR0CdawzLOiWWdX2UKGgGR0BwZgJC0F8paAdNAAFoCEdAnWtAEIPbwnV9lChoBkdAc48xvNu+AWgHS+BoCEdAnWtbE9+w1XV9lChoBkdAbpgSZjQRgGgHS/JoCEdAnWw8EA5q/XVlLg=="
49
+ },
50
+ "ep_success_buffer": {
51
+ ":type:": "<class 'collections.deque'>",
52
+ ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
53
+ },
54
+ "_n_updates": 397,
55
+ "observation_space": {
56
+ ":type:": "<class 'gymnasium.spaces.box.Box'>",
57
+ ":serialized:": "gAWVcAIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWCAAAAAAAAAABAQEBAQEBAZRoB4wCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoECiWCAAAAAAAAAABAQEBAQEBAZRoFEsIhZRoGHSUUpSMBl9zaGFwZZRLCIWUjANsb3eUaBAoliAAAAAAAAAAAAC0wgAAtMIAAKDAAACgwNsPScAAAKDAAAAAgAAAAICUaApLCIWUaBh0lFKUjARoaWdolGgQKJYgAAAAAAAAAAAAtEIAALRCAACgQAAAoEDbD0lAAACgQAAAgD8AAIA/lGgKSwiFlGgYdJRSlIwIbG93X3JlcHKUjFtbLTkwLiAgICAgICAgLTkwLiAgICAgICAgIC01LiAgICAgICAgIC01LiAgICAgICAgIC0zLjE0MTU5MjcgIC01LgogIC0wLiAgICAgICAgIC0wLiAgICAgICBdlIwJaGlnaF9yZXBylIxTWzkwLiAgICAgICAgOTAuICAgICAgICAgNS4gICAgICAgICA1LiAgICAgICAgIDMuMTQxNTkyNyAgNS4KICAxLiAgICAgICAgIDEuICAgICAgIF2UjApfbnBfcmFuZG9tlE51Yi4=",
58
+ "dtype": "float32",
59
+ "bounded_below": "[ True True True True True True True True]",
60
+ "bounded_above": "[ True True True True True True True True]",
61
+ "_shape": [
62
+ 8
63
+ ],
64
+ "low": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]",
65
+ "high": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]",
66
+ "low_repr": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]",
67
+ "high_repr": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]",
68
+ "_np_random": null
69
+ },
70
+ "action_space": {
71
+ ":type:": "<class 'gymnasium.spaces.discrete.Discrete'>",
72
+ ":serialized:": "gAWV1QAAAAAAAACMGWd5bW5hc2l1bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIBAAAAAAAAACUhpRSlIwFc3RhcnSUaAhoDkMIAAAAAAAAAACUhpRSlIwGX3NoYXBllCloCmgOjApfbnBfcmFuZG9tlE51Yi4=",
73
+ "n": "4",
74
+ "start": "0",
75
+ "_shape": [],
76
+ "dtype": "int64",
77
+ "_np_random": null
78
+ },
79
+ "n_envs": 16,
80
+ "n_steps": 1024,
81
+ "gamma": 0.999,
82
+ "gae_lambda": 0.98,
83
+ "ent_coef": 0.01,
84
+ "vf_coef": 0.5,
85
+ "max_grad_norm": 0.5,
86
+ "batch_size": 64,
87
+ "n_epochs": 4,
88
+ "clip_range": {
89
+ ":type:": "<class 'function'>",
90
+ ":serialized:": "gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz/JmZmZmZmahZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"
91
+ },
92
+ "clip_range_vf": null,
93
+ "normalize_advantage": true,
94
+ "target_kl": null,
95
+ "lr_schedule": {
96
+ ":type:": "<class 'function'>",
97
+ ":serialized:": "gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz8zqSowVTJhhZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"
98
+ }
99
+ }
ppo-LunarLander-v2/policy.optimizer.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:861cad11a6ab82fe60bdc38f096496d9851472b033889cfe3f9ea1853188c187
3
+ size 87929
ppo-LunarLander-v2/policy.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4af7c2629e2472fb049fc8360c664995d1d45458364346ea9adecbf9cc3409b7
3
+ size 43329
ppo-LunarLander-v2/pytorch_variables.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d030ad8db708280fcae77d87e973102039acd23a11bdecc3db8eb6c0ac940ee1
3
+ size 431
ppo-LunarLander-v2/system_info.txt ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ - OS: Linux-5.15.120+-x86_64-with-glibc2.35 # 1 SMP Wed Aug 30 11:19:59 UTC 2023
2
+ - Python: 3.10.12
3
+ - Stable-Baselines3: 2.0.0a5
4
+ - PyTorch: 2.0.1+cu118
5
+ - GPU Enabled: True
6
+ - Numpy: 1.23.5
7
+ - Cloudpickle: 2.2.1
8
+ - Gymnasium: 0.28.1
9
+ - OpenAI Gym: 0.25.2
replay.mp4 CHANGED
Binary files a/replay.mp4 and b/replay.mp4 differ
 
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 207.80544679999997, "std_reward": 21.891140426218445, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2023-09-17T11:58:28.843049"}
 
1
+ {"mean_reward": 279.3005875, "std_reward": 14.008042291136208, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2023-10-14T20:16:46.184867"}