hookzeng commited on
Commit
77daf87
1 Parent(s): ad91b10

Upload PPO LunarLander-v2 trained agent

Browse files
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: LunarLander-v2
17
  metrics:
18
  - type: mean_reward
19
- value: 4.77 +/- 138.58
20
  name: mean_reward
21
  verified: false
22
  ---
 
16
  type: LunarLander-v2
17
  metrics:
18
  - type: mean_reward
19
+ value: 230.21 +/- 17.26
20
  name: mean_reward
21
  verified: false
22
  ---
config.json CHANGED
@@ -1 +1 @@
1
- {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7fe300ffdca0>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7fe300ffdd30>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7fe300ffddc0>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7fe300ffde50>", "_build": "<function ActorCriticPolicy._build at 0x7fe300ffdee0>", "forward": "<function ActorCriticPolicy.forward at 0x7fe300ffdf70>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x7fe300f80040>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7fe300f800d0>", "_predict": "<function ActorCriticPolicy._predict at 0x7fe300f80160>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7fe300f801f0>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7fe300f80280>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7fe300f80310>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc_data object at 0x7fe300ffb360>"}, "verbose": 1, "policy_kwargs": {}, "num_timesteps": 1015808, "_total_timesteps": 1000000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1712321505613798384, "learning_rate": 0.0003, "tensorboard_log": null, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAADPcsbxxg7E/NucGvtGWEb2Dnq08DbcDvQAAAAAAAAAAzYxyOlxssj/rgGc9a7tOvRdtib5tPcM9AAAAAAAAAAC65Cw+9oBzvKjtijzUX4U8jNR9vaY9ab0AAIA/AACAP5rQqTwgzpc/mzMVPmUSur5OkAS/wdm6PgAAAAAAAAAAAHr+PCjvrz/XDCI/i9aKvkFh97wbe/C9AAAAAAAAAADzJ6E95O+gP1WO/D3r/wo9/gChPjUdET8AAAAAAAAAAFpkoT0PBUI/KBjXPgIRYr65dH08YgwuPwAAAAAAAAAAmpFVO6zztT/GhrU8/4F0vIGsfj1AX5U+AAAAAAAAAABdEVO+3jtaP7Zng750UPK+JxsEP91DGb8AAAAAAAAAALJ8g76PfGO86oS9un3fwrin9c091ZzkOQAAgD8AAIA/GqNdvRRUrbrjjSI3PppzMvtAbjpcSzi2AACAPwAAgD/guQo+UrKXu7rdszkamQW3XPzRvPuh4bgAAIA/AACAP5rZdrxGBb8/PeQ7PEZxDDsMHA69Y8hGPQAAAAAAAAAAGAa+vuwf7T5oj+O+IG8Uv1On2T4Sx0K/AAAAAAAAAABNklI+H16mPOl1B75vxcO7qJ0yvRMCIb8AAIA/AAAAAAYhKb6OXXk/6AIBPm/qzziZovc+lRwvPwAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.015808000000000044, "_stats_window_size": 100, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVNQwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHwGbdjeKsMiOMAWyUTS0BjAF0lEdAeIRzQeFL4HV9lChoBkdAakonXNC7b2gHTcUCaAhHQHiGFyaNMoN1fZQoaAZHwErNy5I6KcdoB0vzaAhHQHiGUehf0Ep1fZQoaAZHQER4DHOryUdoB00BAWgIR0B4ikxQBPsSdX2UKGgGR8BoJzu4PPLQaAdNCgFoCEdAeIr9dNWU8nV9lChoBkfAaGl5KODJ2mgHTUIBaAhHQHiLh9G7SRd1fZQoaAZHQF5dWEK3NLVoB03oA2gIR0B4kYt6HCXQdX2UKGgGR0BZprfLs8gZaAdN6ANoCEdAeJPrGBFuvXV9lChoBkfAb4ZAOavzOGgHTSQCaAhHQHipGMS9M9N1fZQoaAZHwG2T7jT8YQ9oB01JAWgIR0B4rgrRSgoPdX2UKGgGR8BEZzf779AHaAdNPgFoCEdAeK6tJnQIEHV9lChoBkdAbBA0waisXGgHTR8CaAhHQHixq8L8aXN1fZQoaAZHwFSiCJGe+VVoB00xAWgIR0B4supT/ACXdX2UKGgGR0BUP8PnSv1UaAdN6ANoCEdAeLNw6hg3LnV9lChoBkdAU8PVFx4pt2gHTegDaAhHQHi0r9AHE/B1fZQoaAZHQDNRfVqesgdoB0vxaAhHQHi07iuMdcV1fZQoaAZHwENKKrq+rU9oB01nAWgIR0B4uBQSBbwCdX2UKGgGR8Btp1ndweeWaAdNiwFoCEdAeMOnKnvUjXV9lChoBkfAZDjqqwQlKWgHS9xoCEdAeNw25xzaK3V9lChoBkdAX+5rYXfqHGgHTegDaAhHQHjfD9n9Nvh1fZQoaAZHQGvrI+fRNRFoB01fAmgIR0B435/I8yN5dX2UKGgGR0Bnr2epXIU8aAdNowJoCEdAeOF8Hv+fiHV9lChoBkfAQP56yB06o2gHS/5oCEdAeORu7pV0cXV9lChoBkfAYvXjMFEApGgHTQ4BaAhHQHjmwY+B6KN1fZQoaAZHwG2Ys/pt78hoB01RAWgIR0B46skLQXyidX2UKGgGR0BqbQ+yJKraaAdNsAJoCEdAeO5/giu+y3V9lChoBkfAUbKbx3FDOWgHTeQBaAhHQHj4DJIUahp1fZQoaAZHwCPl07r9l3BoB0vraAhHQHj4fovBacJ1fZQoaAZHwDL9SBK+SKZoB00/AWgIR0B4/hECvHLidX2UKGgGR8BwAMVBUrCnaAdNFgJoCEdAeQUeiBXjl3V9lChoBkfAaH3H/cWTHWgHTRkBaAhHQHkGVMRHww11fZQoaAZHwGm9aBAfMfRoB00cAWgIR0B5CQaJhvzfdX2UKGgGR8BLQ7ZvkzXSaAdNUwFoCEdAeQoSyt3fRHV9lChoBkdAcbEKQaJhv2gHTWsBaAhHQHkKel9Brvd1fZQoaAZHQFjlPUKArhBoB03oA2gIR0B5C0KBun/DdX2UKGgGR8BncGeFtbcHaAdNPQFoCEdAeROgv114gXV9lChoBkfAay3N2TxG2GgHTQQBaAhHQHkWFzEJjUd1fZQoaAZHQF9QqTr3TNNoB03oA2gIR0B5GHU4JeE7dX2UKGgGR0BsQl89fTkRaAdNpgFoCEdAeRu6jFhod3V9lChoBkfAZAySFGoaUGgHTSsBaAhHQHkfq0QbuMN1fZQoaAZHQGcVRQizLOloB01bAmgIR0B5JZsqJ/G3dX2UKGgGR8Bw9YiW3Sa3aAdNkwFoCEdAeSaisXBP9HV9lChoBkfAaxRVcUuct2gHTSsBaAhHQHkp6EWZZ0V1fZQoaAZHwETtTzd1uBNoB004AWgIR0B5LVHtnf2sdX2UKGgGR8BNWnied07saAdNTAFoCEdAeS6tu1ndwnV9lChoBkdAaR6fK6nR9mgHTZ4BaAhHQHkymVeKKpF1fZQoaAZHQGo/fHggow5oB02fA2gIR0B5NqF49ovjdX2UKGgGR0BCq8Sf16E8aAdN6ANoCEdAeTt7CSA6MnV9lChoBkdAWNKhmGucMGgHTegDaAhHQHk7uaz/p+t1fZQoaAZHwGu6cUVSGahoB00SAWgIR0B5PlMWXTmXdX2UKGgGR8BJp3ZoPCl8aAdNPAFoCEdAeT7AJ9iMHnV9lChoBkfAbI2WszVMEmgHTYsBaAhHQHk/SKR+z+p1fZQoaAZHwGZuqp1ie/ZoB004AWgIR0B5Rq+0w8GLdX2UKGgGR0BpduQZGax5aAdNVgJoCEdAeUdWeYlY2nV9lChoBkfAax/ZaFEiMmgHTUoBaAhHQHlJWx6fJ3h1fZQoaAZHwDVENutOmBRoB00FAWgIR0B5Sik2xY7rdX2UKGgGR0Bncnr6ciGGaAdNcQJoCEdAeV8U1AJLNHV9lChoBkfAa8Uit7rs0GgHS+5oCEdAeWDb2lEZznV9lChoBkdAbUQ4smOU+2gHTR4CaAhHQHlhfrjYI0J1fZQoaAZHwFGAh1Tzd1xoB00LAmgIR0B5YblLeyiVdX2UKGgGR8Bnl4co6S1WaAdNeAFoCEdAeWS+yquKXXV9lChoBkdANbMkMTewcGgHS/BoCEdAeWahOP/7znV9lChoBkfAacGUmD15B2gHTUEBaAhHQHlqjcRDkU91fZQoaAZHwG27zXrdFfBoB01qAWgIR0B5cXLX+VC5dX2UKGgGR8BoYXDUExIraAdNGwFoCEdAeXGsqJ/G2nV9lChoBkfAZNiuU2UB4mgHTTkBaAhHQHl1ioS+QEJ1fZQoaAZHwGL/B8pkPMBoB0v0aAhHQHl2vjfek591fZQoaAZHwGKMJi7TUiJoB0v0aAhHQHl3jPa+N991fZQoaAZHQGTAGhmGucNoB00zAmgIR0B5e5/QSi/PdX2UKGgGR0BtiWgJ1JUYaAdNzQJoCEdAeYOq9GqgiHV9lChoBkfAaOgHmA9V3mgHTTcBaAhHQHmD/8/D+BJ1fZQoaAZHQG9VF23azu5oB01wAWgIR0B5hXPBzmwJdX2UKGgGR0Buqpr30wrUaAdNlQFoCEdAeYYMgU1yenV9lChoBkdAa8p/J/5Ly2gHTdMBaAhHQHmIXgtOEdx1fZQoaAZHwE0elgMMI/toB03rAWgIR0B5i1fTkQwsdX2UKGgGR0Buo6YLLIPtaAdNhAJoCEdAeY4aoMrmQ3V9lChoBkfAbUs78Nx2jmgHTZQBaAhHQHmO8u8K5TZ1fZQoaAZHQGyT66J66atoB03EAmgIR0B5kUPSUkfLdX2UKGgGR8BoEVbor4FiaAdNPQFoCEdAeZGff4yoGnV9lChoBkfAZeCy0rsjV2gHTScBaAhHQHmT/DLr5Zd1fZQoaAZHwGnyYaP0Zm9oB015AWgIR0B5lgXWOIZZdX2UKGgGR8Bnqhmwqy4XaAdNIAFoCEdAeZZmJFb3XnV9lChoBkfAaOKBe5WilGgHTV0BaAhHQHmXheHBUJh1fZQoaAZHQHAgvRVp9JBoB01wAWgIR0B5mBJQLux9dX2UKGgGR8A5/XA/LTx5aAdL7WgIR0B5mPmaH9FXdX2UKGgGR8A3n912aDwpaAdL/GgIR0B5mQxqO939dX2UKGgGR8AS9QCSzPa+aAdNAwFoCEdAeZlPu5SWJXV9lChoBkfAO9nxnWattGgHS/toCEdAeZvEt/WlM3V9lChoBkfAZt7jXFtKqWgHTS8BaAhHQHmiWUjcEeR1fZQoaAZHwGRrgT7EYO5oB0vnaAhHQHmngRsdkrh1fZQoaAZHwGdsSNGViWpoB01CAWgIR0B5p6UOd5IIdX2UKGgGR8BwnCp4rz5HaAdNYAFoCEdAeamhhH9WIXV9lChoBkdAbU+BnSOR1WgHTUEBaAhHQHmqL9If8uV1fZQoaAZHwGZAaTnq3VloB00VAWgIR0B5rFVghKUWdX2UKGgGR8A4tTOPeYUnaAdNOgFoCEdAeazrRjSXt3V9lChoBkfAZmatz0Yj0WgHS/loCEdAea1B0ZFXrHV9lChoBkfAaa9DPWxyGWgHTSUBaAhHQHmv5m29cr11fZQoaAZHwGeLwc5sCT5oB01FAWgIR0B5tBMDfWMCdX2UKGgGR8BjL4YtQKrraAdL42gIR0B5txshxHXmdX2UKGgGR8BqvRRXOnl5aAdNQQFoCEdAebgBCUornXVlLg=="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 248, "observation_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVcAIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWCAAAAAAAAAABAQEBAQEBAZRoB4wCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoECiWCAAAAAAAAAABAQEBAQEBAZRoFEsIhZRoGHSUUpSMBl9zaGFwZZRLCIWUjANsb3eUaBAoliAAAAAAAAAAAAC0wgAAtMIAAKDAAACgwNsPScAAAKDAAAAAgAAAAICUaApLCIWUaBh0lFKUjARoaWdolGgQKJYgAAAAAAAAAAAAtEIAALRCAACgQAAAoEDbD0lAAACgQAAAgD8AAIA/lGgKSwiFlGgYdJRSlIwIbG93X3JlcHKUjFtbLTkwLiAgICAgICAgLTkwLiAgICAgICAgIC01LiAgICAgICAgIC01LiAgICAgICAgIC0zLjE0MTU5MjcgIC01LgogIC0wLiAgICAgICAgIC0wLiAgICAgICBdlIwJaGlnaF9yZXBylIxTWzkwLiAgICAgICAgOTAuICAgICAgICAgNS4gICAgICAgICA1LiAgICAgICAgIDMuMTQxNTkyNyAgNS4KICAxLiAgICAgICAgIDEuICAgICAgIF2UjApfbnBfcmFuZG9tlE51Yi4=", "dtype": "float32", "bounded_below": "[ True True True True True True True True]", "bounded_above": "[ True True True True True True True True]", "_shape": [8], "low": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "low_repr": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high_repr": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "_np_random": null}, "action_space": {":type:": "<class 'gymnasium.spaces.discrete.Discrete'>", ":serialized:": "gAWV1QAAAAAAAACMGWd5bW5hc2l1bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIBAAAAAAAAACUhpRSlIwFc3RhcnSUaAhoDkMIAAAAAAAAAACUhpRSlIwGX3NoYXBllCloCmgOjApfbnBfcmFuZG9tlE51Yi4=", "n": "4", "start": "0", "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 16, "n_steps": 1024, "gamma": 0.6, "gae_lambda": 0.48, "ent_coef": 0.01, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 128, "n_epochs": 4, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWV1gIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMYC9ob21lL2hvb2t6ZW5nL2FuYWNvbmRhMy9lbnZzL3B5MzgvbGliL3B5dGhvbjMuOC9zaXRlLXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS4RDAgABlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMYC9ob21lL2hvb2t6ZW5nL2FuYWNvbmRhMy9lbnZzL3B5MzgvbGliL3B5dGhvbjMuOC9zaXRlLXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlGgAjBJfZnVuY3Rpb25fc2V0c3RhdGWUk5RoH32UfZQoaBZoDYwMX19xdWFsbmFtZV9flIwZY29uc3RhbnRfZm4uPGxvY2Fscz4uZnVuY5SMD19fYW5ub3RhdGlvbnNfX5R9lIwOX19rd2RlZmF1bHRzX1+UTowMX19kZWZhdWx0c19flE6MCl9fbW9kdWxlX1+UaBeMB19fZG9jX1+UTowLX19jbG9zdXJlX1+UaACMCl9tYWtlX2NlbGyUk5RHP8mZmZmZmZqFlFKUhZSMF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWV1gIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMYC9ob21lL2hvb2t6ZW5nL2FuYWNvbmRhMy9lbnZzL3B5MzgvbGliL3B5dGhvbjMuOC9zaXRlLXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS4RDAgABlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMYC9ob21lL2hvb2t6ZW5nL2FuYWNvbmRhMy9lbnZzL3B5MzgvbGliL3B5dGhvbjMuOC9zaXRlLXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlGgAjBJfZnVuY3Rpb25fc2V0c3RhdGWUk5RoH32UfZQoaBZoDYwMX19xdWFsbmFtZV9flIwZY29uc3RhbnRfZm4uPGxvY2Fscz4uZnVuY5SMD19fYW5ub3RhdGlvbnNfX5R9lIwOX19rd2RlZmF1bHRzX1+UTowMX19kZWZhdWx0c19flE6MCl9fbW9kdWxlX1+UaBeMB19fZG9jX1+UTowLX19jbG9zdXJlX1+UaACMCl9tYWtlX2NlbGyUk5RHPzOpKjBVMmGFlFKUhZSMF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="}, "system_info": {"OS": "Linux-6.2.0-39-generic-x86_64-with-glibc2.17 # 40~22.04.1-Ubuntu SMP PREEMPT_DYNAMIC Thu Nov 16 10:53:04 UTC 2", "Python": "3.8.18", "Stable-Baselines3": "2.0.0a5", "PyTorch": "2.2.2+cu121", "GPU Enabled": "False", "Numpy": "1.24.4", "Cloudpickle": "3.0.0", "Gymnasium": "0.28.1"}}
 
1
+ {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7efded27dca0>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7efded27dd30>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7efded27ddc0>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7efded27de50>", "_build": "<function ActorCriticPolicy._build at 0x7efded27dee0>", "forward": "<function ActorCriticPolicy.forward at 0x7efded27df70>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x7efded202040>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7efded2020d0>", "_predict": "<function ActorCriticPolicy._predict at 0x7efded202160>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7efded2021f0>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7efded202280>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7efded202310>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc_data object at 0x7efded27c2d0>"}, "verbose": 1, "policy_kwargs": {}, "num_timesteps": 1015808, "_total_timesteps": 1000000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1712322094998193614, "learning_rate": 0.0003, "tensorboard_log": null, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAGZhhbxSmOG5qtKvObuD9rVEWvy6okrPuAAAgD8AAIA/hsotPnRNhLxOz8Q5MYscuCr05r0ZhQO5AACAPwAAgD/QZqq+l+5KP100Fz7063C+OUeqvUVlvz0AAAAAAAAAAM19M72P3nm6N6OIuYmrg7TS30a7KqOfOAAAgD8AAIA/M5x1PcPtMrqqpjw8bU65NkPBHLvn3K01AACAPwAAgD8z+1S9rnWJuspfnTlSg5G20TNvutAHtrgAAIA/AACAP/O6tj2PxmG69FQzvLVnF7Z0HL+68quLNQAAgD8AAIA/WlGJPTiqwD0zLAC+RURVvvae5rv1oK69AAAAAAAAAAATqjA+D7BlP16BVbz6dZW+nTHVPbplYr0AAAAAAAAAANPvHT6sxpU/aneYPsmswL7Lsuw9pRPHOwAAAAAAAAAAAGwwPXsanrr6CJS7q9wEtWgUTbr0uao6AACAPwAAgD/m0YG93r2ZPcMDRz4zlGG+FGeFPZurKD0AAAAAAAAAAKYnsb0G+Sw/m3PjPXOhiL6xc586eHkkPQAAAAAAAAAAAPg0O7jm5rmJ3Q66VpmLtVFxmLpr1SY5AACAPwAAgD9aMaI9H031uaQaJrtm6++1mJCwOirDPjoAAIA/AACAP5rZ/ToU3sK6VjB1urXLTTuVXAs7MstevAAAgD8AAIA/lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.015808000000000044, "_stats_window_size": 100, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVQQwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQE46o+fRNRGMAWyUS9iMAXSUR0B9G5wjt5UtdX2UKGgGR0BkWQu/UONHaAdN6ANoCEdAfSBwsGxD9nV9lChoBkdAZbcMUh3aBmgHTegDaAhHQH0qTfrKNhp1fZQoaAZHQGLwXjlxOtZoB03oA2gIR0B9MjCbc45tdX2UKGgGR0BgN8xIre67aAdN6ANoCEdAfUBIcinpCHV9lChoBkdAZnzzRQaaTmgHTegDaAhHQH1XYk/r0J51fZQoaAZHQGJF6F/QSjBoB03oA2gIR0B9Y6+Jxeb/dX2UKGgGR0Bk9//95yEMaAdN6ANoCEdAfW6lXzUZvXV9lChoBkdAZkiY+B6KL2gHTegDaAhHQH1wTUAksz51fZQoaAZHQGLLta6jFhpoB03oA2gIR0B9cY7cO9WZdX2UKGgGR0Bc9SUcGTs6aAdN6ANoCEdAfXRVxjriVHV9lChoBkdAYeGplSS/02gHTegDaAhHQH2EYpMHryF1fZQoaAZHQGPq/+sHSndoB03oA2gIR0B9iGaTfR/mdX2UKGgGR0AjM6QvHtF8aAdL9WgIR0B9jxEPUaybdX2UKGgGR0BkvO6d1+y7aAdN6ANoCEdAfY9VLBbfQHV9lChoBkdAY/ipo9LYgGgHTegDaAhHQH2bvc8DB/J1fZQoaAZHQGA3liSaEzxoB03oA2gIR0B9sKr+5vtMdX2UKGgGR0BVwfIOpbUxaAdN6ANoCEdAfbQI55qubXV9lChoBkdAY4/yEtdzGWgHTegDaAhHQH234+B6KLt1fZQoaAZHQGGtnWz4UN9oB03oA2gIR0B9v3di2DxtdX2UKGgGR0BlQdEuxrzoaAdN6ANoCEdAfcWYtQKrrHV9lChoBkdAZdEu5jH4oWgHTegDaAhHQH3Re4oZydZ1fZQoaAZHQGV/nw5NoJ1oB03oA2gIR0B95Do4dZJTdX2UKGgGR0BmLupMpPRBaAdN6ANoCEdAfe3TA31jAnV9lChoBkdAYjpjx0+1SmgHTegDaAhHQH32G47Rv3t1fZQoaAZHQGT8JXp4bCJoB03oA2gIR0B9+EKUmlZYdX2UKGgGR0BlShgiNbTuaAdN6ANoCEdAffpfyf+S83V9lChoBkdAXnHZAY51eWgHTegDaAhHQH4GqgyuZCx1fZQoaAZHQGUYNOEdvKloB03oA2gIR0B+CZntfG+9dX2UKGgGR0BkHnXoTwlTaAdN6ANoCEdAfg7QRPGhmHV9lChoBkdAYLzkWhysCGgHTegDaAhHQH4PBN21Ul11fZQoaAZHQGCpL1/Ue+5oB03oA2gIR0B+GXNY8uBddX2UKGgGR0BjccR6F/QTaAdN6ANoCEdAfhslvZRKpXV9lChoBkdAaOZFKkEcKmgHTegDaAhHQH43WVAzHjp1fZQoaAZHQGA+Wf9P1thoB03oA2gIR0B+Ot3fQ8fWdX2UKGgGR0Bc9qq814xDaAdN6ANoCEdAfkIHU+cH4XV9lChoBkdAYdlYEGJN02gHTegDaAhHQH5IDoUzsQd1fZQoaAZHQGRvT7l7tzFoB03oA2gIR0B+VBxAB1cMdX2UKGgGR0BlfCScLBsRaAdN6ANoCEdAfmhd/J/5L3V9lChoBkdAYp7/jKgZj2gHTegDaAhHQH5zC9EkSmJ1fZQoaAZHQF4l6jWTX8RoB03oA2gIR0B+fDffoA4odX2UKGgGR0BnANm6GxlhaAdN6ANoCEdAfn6qoZQ53nV9lChoBkdAYYtcHGCI12gHTegDaAhHQH6BLKFIuoR1fZQoaAZHQGTT1Ed/8VJoB03oA2gIR0B+kJ4mkWRBdX2UKGgGR0Bfgrns9jgAaAdN6ANoCEdAfpRhXr+o+HV9lChoBkdAXqEfyPMjeWgHTegDaAhHQH6bGEPDpC91fZQoaAZHQGJA7pV0cOtoB03oA2gIR0B+m1iqhlDndX2UKGgGR0Be0JTER8MNaAdN6ANoCEdAfqeyLQ5WBHV9lChoBkdAYUU6qbSZ0GgHTegDaAhHQH6pvQnhKlJ1fZQoaAZHQGC/l+3H7xdoB03oA2gIR0B+rVsLv1DjdX2UKGgGR0BkChrrPdEcaAdN6ANoCEdAfsZmmtQsPXV9lChoBkdAYNVarWAf+2gHTegDaAhHQH7PJTER8MN1fZQoaAZHQFwSiWVu76JoB03oA2gIR0B+1nHaN+9bdX2UKGgGR0Bj+lV/+bVjaAdN6ANoCEdAfuTP0qYqonV9lChoBkdAZQS32EkB0mgHTegDaAhHQH77OdXko4N1fZQoaAZHQGGgjA8B+4NoB03oA2gIR0B/Behf0EowdX2UKGgGR0Bk9RLCemNzaAdN6ANoCEdAfw82xY7q6nV9lChoBkdAZvOK+i8Fp2gHTegDaAhHQH8RjkMkQf91fZQoaAZHQGS2YNqgyuZoB03oA2gIR0B/E/IikftAdX2UKGgGR0BexIXoC+10aAdN6ANoCEdAfyE2M85jpnV9lChoBkdAZiXVhCtzS2gHTegDaAhHQH8kVhoduHh1fZQoaAZHQGNHrxRVIZtoB03oA2gIR0B/KdLxqfvndX2UKGgGR0BkG9fCyhSMaAdN6ANoCEdAfyoMUAT7EnV9lChoBkdAWxUXcgyM1mgHTegDaAhHQH8033UQTVV1fZQoaAZHQGClehGpdbBoB03oA2gIR0B/NrPw/gR9dX2UKGgGR0BldmQ6p5u7aAdN6ANoCEdAfzncy31BdHV9lChoBkdAZNCLiuMdcWgHTegDaAhHQH9Pj1XeWOZ1fZQoaAZHQGWurUkOZstoB03oA2gIR0B/V52eQMhHdX2UKGgGR0Be9L3sXzlLaAdN6ANoCEdAf16UxVQyh3V9lChoBkdAZC9ReC04R2gHTegDaAhHQH9so0IkZ751fZQoaAZHQF20+RYA80VoB03oA2gIR0B/hBcGC7K8dX2UKGgGR0BkzDj94u9OaAdN6ANoCEdAf5CpEhJRO3V9lChoBkdAXdVObiIcimgHTegDaAhHQH+blyaNMoN1fZQoaAZHQF9t6Skj5bhoB03oA2gIR0B/noKLKmsOdX2UKGgGR0BhIjWsijcmaAdN6ANoCEdAf6GFOfukUXV9lChoBkdAYu3b/wRXfmgHTegDaAhHQH+0UNKAavR1fZQoaAZHQGXf2fkFOfxoB03oA2gIR0B/uMytV7x/dX2UKGgGR0BgeByXD3ueaAdN6ANoCEdAf8CS1Vo6CHV9lChoBkdAYzSiO/+Kj2gHTegDaAhHQH/A5SWJJoV1fZQoaAZHQGUEO7QLNOdoB03oA2gIR0B/zyNMoMKDdX2UKGgGR0BnrDTBqKxcaAdN6ANoCEdAf9FugYgq3HV9lChoBkdAYDZs/IKc/mgHTegDaAhHQH/VdOVPepJ1fZQoaAZHQGJ6ml67dzpoB03oA2gIR0B/2hlz2exwdX2UKGgGR0BfMSgTRIBjaAdN6ANoCEdAf/b2HtWuHXV9lChoBkdAXokgzP8htGgHTegDaAhHQH/+K7mMfih1fZQoaAZHQGJaxf4REndoB03oA2gIR0CABdR64UeudX2UKGgGR0BCe1kUbkwOaAdL/WgIR0CADwwTM7lrdX2UKGgGR0BgjRbW3BpIaAdN6ANoCEdAgBAsaCL/CXV9lChoBkdAY4l1Oj7AL2gHTegDaAhHQIAVGkgwGnp1fZQoaAZHQGIHb0e2d/doB03oA2gIR0CAGWMb3oLYdX2UKGgGR0BkMsbtJFspaAdN6ANoCEdAgBp5ZB9kSXV9lChoBkdAYVjEit7rs2gHTegDaAhHQIAblyPuG9J1fZQoaAZHQGbA+VC5VfhoB03oA2gIR0CAIqmVJL/TdX2UKGgGR0BidUUKzAvdaAdN6ANoCEdAgCR1zySV4XV9lChoBkdAYGVTEzfrKWgHTegDaAhHQIAnoq/dqL11fZQoaAZHQGChQVsUIs1oB03oA2gIR0CAJ8NYr8R+dX2UKGgGR0BidtsJpnHvaAdN6ANoCEdAgC3PLHMlknV9lChoBkdAZEN9MsYl6mgHTegDaAhHQIAuzHlwLmZ1fZQoaAZHQGcpHLzPKMhoB03oA2gIR0CAMI9jgAIZdX2UKGgGR0Bg8IKrq+rVaAdN6ANoCEdAgDK9nbqQinVlLg=="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 248, "observation_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVcAIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWCAAAAAAAAAABAQEBAQEBAZRoB4wCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoECiWCAAAAAAAAAABAQEBAQEBAZRoFEsIhZRoGHSUUpSMBl9zaGFwZZRLCIWUjANsb3eUaBAoliAAAAAAAAAAAAC0wgAAtMIAAKDAAACgwNsPScAAAKDAAAAAgAAAAICUaApLCIWUaBh0lFKUjARoaWdolGgQKJYgAAAAAAAAAAAAtEIAALRCAACgQAAAoEDbD0lAAACgQAAAgD8AAIA/lGgKSwiFlGgYdJRSlIwIbG93X3JlcHKUjFtbLTkwLiAgICAgICAgLTkwLiAgICAgICAgIC01LiAgICAgICAgIC01LiAgICAgICAgIC0zLjE0MTU5MjcgIC01LgogIC0wLiAgICAgICAgIC0wLiAgICAgICBdlIwJaGlnaF9yZXBylIxTWzkwLiAgICAgICAgOTAuICAgICAgICAgNS4gICAgICAgICA1LiAgICAgICAgIDMuMTQxNTkyNyAgNS4KICAxLiAgICAgICAgIDEuICAgICAgIF2UjApfbnBfcmFuZG9tlE51Yi4=", "dtype": "float32", "bounded_below": "[ True True True True True True True True]", "bounded_above": "[ True True True True True True True True]", "_shape": [8], "low": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "low_repr": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high_repr": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "_np_random": null}, "action_space": {":type:": "<class 'gymnasium.spaces.discrete.Discrete'>", ":serialized:": "gAWV1QAAAAAAAACMGWd5bW5hc2l1bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIBAAAAAAAAACUhpRSlIwFc3RhcnSUaAhoDkMIAAAAAAAAAACUhpRSlIwGX3NoYXBllCloCmgOjApfbnBfcmFuZG9tlE51Yi4=", "n": "4", "start": "0", "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 16, "n_steps": 1024, "gamma": 0.999, "gae_lambda": 0.98, "ent_coef": 0.01, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 128, "n_epochs": 4, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWV1gIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMYC9ob21lL2hvb2t6ZW5nL2FuYWNvbmRhMy9lbnZzL3B5MzgvbGliL3B5dGhvbjMuOC9zaXRlLXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS4RDAgABlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMYC9ob21lL2hvb2t6ZW5nL2FuYWNvbmRhMy9lbnZzL3B5MzgvbGliL3B5dGhvbjMuOC9zaXRlLXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlGgAjBJfZnVuY3Rpb25fc2V0c3RhdGWUk5RoH32UfZQoaBZoDYwMX19xdWFsbmFtZV9flIwZY29uc3RhbnRfZm4uPGxvY2Fscz4uZnVuY5SMD19fYW5ub3RhdGlvbnNfX5R9lIwOX19rd2RlZmF1bHRzX1+UTowMX19kZWZhdWx0c19flE6MCl9fbW9kdWxlX1+UaBeMB19fZG9jX1+UTowLX19jbG9zdXJlX1+UaACMCl9tYWtlX2NlbGyUk5RHP8mZmZmZmZqFlFKUhZSMF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWV1gIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMYC9ob21lL2hvb2t6ZW5nL2FuYWNvbmRhMy9lbnZzL3B5MzgvbGliL3B5dGhvbjMuOC9zaXRlLXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS4RDAgABlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMYC9ob21lL2hvb2t6ZW5nL2FuYWNvbmRhMy9lbnZzL3B5MzgvbGliL3B5dGhvbjMuOC9zaXRlLXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlGgAjBJfZnVuY3Rpb25fc2V0c3RhdGWUk5RoH32UfZQoaBZoDYwMX19xdWFsbmFtZV9flIwZY29uc3RhbnRfZm4uPGxvY2Fscz4uZnVuY5SMD19fYW5ub3RhdGlvbnNfX5R9lIwOX19rd2RlZmF1bHRzX1+UTowMX19kZWZhdWx0c19flE6MCl9fbW9kdWxlX1+UaBeMB19fZG9jX1+UTowLX19jbG9zdXJlX1+UaACMCl9tYWtlX2NlbGyUk5RHPzOpKjBVMmGFlFKUhZSMF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="}, "system_info": {"OS": "Linux-6.2.0-39-generic-x86_64-with-glibc2.17 # 40~22.04.1-Ubuntu SMP PREEMPT_DYNAMIC Thu Nov 16 10:53:04 UTC 2", "Python": "3.8.18", "Stable-Baselines3": "2.0.0a5", "PyTorch": "2.2.2+cu121", "GPU Enabled": "False", "Numpy": "1.24.4", "Cloudpickle": "3.0.0", "Gymnasium": "0.28.1"}}
ppo-LunarLander-v2.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a7c974677e7b67824e4e0c405e657d97b9b0365fc222e04a043471cfa26aab19
3
- size 147583
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:890c065099b0ddd693a8d4f607420ef1b6761434514aefb7b61eed7e269e553d
3
+ size 147601
ppo-LunarLander-v2/data CHANGED
@@ -4,20 +4,20 @@
4
  ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
5
  "__module__": "stable_baselines3.common.policies",
6
  "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
7
- "__init__": "<function ActorCriticPolicy.__init__ at 0x7fe300ffdca0>",
8
- "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7fe300ffdd30>",
9
- "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7fe300ffddc0>",
10
- "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7fe300ffde50>",
11
- "_build": "<function ActorCriticPolicy._build at 0x7fe300ffdee0>",
12
- "forward": "<function ActorCriticPolicy.forward at 0x7fe300ffdf70>",
13
- "extract_features": "<function ActorCriticPolicy.extract_features at 0x7fe300f80040>",
14
- "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7fe300f800d0>",
15
- "_predict": "<function ActorCriticPolicy._predict at 0x7fe300f80160>",
16
- "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7fe300f801f0>",
17
- "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7fe300f80280>",
18
- "predict_values": "<function ActorCriticPolicy.predict_values at 0x7fe300f80310>",
19
  "__abstractmethods__": "frozenset()",
20
- "_abc_impl": "<_abc_data object at 0x7fe300ffb360>"
21
  },
22
  "verbose": 1,
23
  "policy_kwargs": {},
@@ -26,12 +26,12 @@
26
  "_num_timesteps_at_start": 0,
27
  "seed": null,
28
  "action_noise": null,
29
- "start_time": 1712321505613798384,
30
  "learning_rate": 0.0003,
31
  "tensorboard_log": null,
32
  "_last_obs": {
33
  ":type:": "<class 'numpy.ndarray'>",
34
- ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAADPcsbxxg7E/NucGvtGWEb2Dnq08DbcDvQAAAAAAAAAAzYxyOlxssj/rgGc9a7tOvRdtib5tPcM9AAAAAAAAAAC65Cw+9oBzvKjtijzUX4U8jNR9vaY9ab0AAIA/AACAP5rQqTwgzpc/mzMVPmUSur5OkAS/wdm6PgAAAAAAAAAAAHr+PCjvrz/XDCI/i9aKvkFh97wbe/C9AAAAAAAAAADzJ6E95O+gP1WO/D3r/wo9/gChPjUdET8AAAAAAAAAAFpkoT0PBUI/KBjXPgIRYr65dH08YgwuPwAAAAAAAAAAmpFVO6zztT/GhrU8/4F0vIGsfj1AX5U+AAAAAAAAAABdEVO+3jtaP7Zng750UPK+JxsEP91DGb8AAAAAAAAAALJ8g76PfGO86oS9un3fwrin9c091ZzkOQAAgD8AAIA/GqNdvRRUrbrjjSI3PppzMvtAbjpcSzi2AACAPwAAgD/guQo+UrKXu7rdszkamQW3XPzRvPuh4bgAAIA/AACAP5rZdrxGBb8/PeQ7PEZxDDsMHA69Y8hGPQAAAAAAAAAAGAa+vuwf7T5oj+O+IG8Uv1On2T4Sx0K/AAAAAAAAAABNklI+H16mPOl1B75vxcO7qJ0yvRMCIb8AAIA/AAAAAAYhKb6OXXk/6AIBPm/qzziZovc+lRwvPwAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="
35
  },
36
  "_last_episode_starts": {
37
  ":type:": "<class 'numpy.ndarray'>",
@@ -45,7 +45,7 @@
45
  "_stats_window_size": 100,
46
  "ep_info_buffer": {
47
  ":type:": "<class 'collections.deque'>",
48
- ":serialized:": "gAWVNQwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHwGbdjeKsMiOMAWyUTS0BjAF0lEdAeIRzQeFL4HV9lChoBkdAakonXNC7b2gHTcUCaAhHQHiGFyaNMoN1fZQoaAZHwErNy5I6KcdoB0vzaAhHQHiGUehf0Ep1fZQoaAZHQER4DHOryUdoB00BAWgIR0B4ikxQBPsSdX2UKGgGR8BoJzu4PPLQaAdNCgFoCEdAeIr9dNWU8nV9lChoBkfAaGl5KODJ2mgHTUIBaAhHQHiLh9G7SRd1fZQoaAZHQF5dWEK3NLVoB03oA2gIR0B4kYt6HCXQdX2UKGgGR0BZprfLs8gZaAdN6ANoCEdAeJPrGBFuvXV9lChoBkfAb4ZAOavzOGgHTSQCaAhHQHipGMS9M9N1fZQoaAZHwG2T7jT8YQ9oB01JAWgIR0B4rgrRSgoPdX2UKGgGR8BEZzf779AHaAdNPgFoCEdAeK6tJnQIEHV9lChoBkdAbBA0waisXGgHTR8CaAhHQHixq8L8aXN1fZQoaAZHwFSiCJGe+VVoB00xAWgIR0B4supT/ACXdX2UKGgGR0BUP8PnSv1UaAdN6ANoCEdAeLNw6hg3LnV9lChoBkdAU8PVFx4pt2gHTegDaAhHQHi0r9AHE/B1fZQoaAZHQDNRfVqesgdoB0vxaAhHQHi07iuMdcV1fZQoaAZHwENKKrq+rU9oB01nAWgIR0B4uBQSBbwCdX2UKGgGR8Btp1ndweeWaAdNiwFoCEdAeMOnKnvUjXV9lChoBkfAZDjqqwQlKWgHS9xoCEdAeNw25xzaK3V9lChoBkdAX+5rYXfqHGgHTegDaAhHQHjfD9n9Nvh1fZQoaAZHQGvrI+fRNRFoB01fAmgIR0B435/I8yN5dX2UKGgGR0Bnr2epXIU8aAdNowJoCEdAeOF8Hv+fiHV9lChoBkfAQP56yB06o2gHS/5oCEdAeORu7pV0cXV9lChoBkfAYvXjMFEApGgHTQ4BaAhHQHjmwY+B6KN1fZQoaAZHwG2Ys/pt78hoB01RAWgIR0B46skLQXyidX2UKGgGR0BqbQ+yJKraaAdNsAJoCEdAeO5/giu+y3V9lChoBkfAUbKbx3FDOWgHTeQBaAhHQHj4DJIUahp1fZQoaAZHwCPl07r9l3BoB0vraAhHQHj4fovBacJ1fZQoaAZHwDL9SBK+SKZoB00/AWgIR0B4/hECvHLidX2UKGgGR8BwAMVBUrCnaAdNFgJoCEdAeQUeiBXjl3V9lChoBkfAaH3H/cWTHWgHTRkBaAhHQHkGVMRHww11fZQoaAZHwGm9aBAfMfRoB00cAWgIR0B5CQaJhvzfdX2UKGgGR8BLQ7ZvkzXSaAdNUwFoCEdAeQoSyt3fRHV9lChoBkdAcbEKQaJhv2gHTWsBaAhHQHkKel9Brvd1fZQoaAZHQFjlPUKArhBoB03oA2gIR0B5C0KBun/DdX2UKGgGR8BncGeFtbcHaAdNPQFoCEdAeROgv114gXV9lChoBkfAay3N2TxG2GgHTQQBaAhHQHkWFzEJjUd1fZQoaAZHQF9QqTr3TNNoB03oA2gIR0B5GHU4JeE7dX2UKGgGR0BsQl89fTkRaAdNpgFoCEdAeRu6jFhod3V9lChoBkfAZAySFGoaUGgHTSsBaAhHQHkfq0QbuMN1fZQoaAZHQGcVRQizLOloB01bAmgIR0B5JZsqJ/G3dX2UKGgGR8Bw9YiW3Sa3aAdNkwFoCEdAeSaisXBP9HV9lChoBkfAaxRVcUuct2gHTSsBaAhHQHkp6EWZZ0V1fZQoaAZHwETtTzd1uBNoB004AWgIR0B5LVHtnf2sdX2UKGgGR8BNWnied07saAdNTAFoCEdAeS6tu1ndwnV9lChoBkdAaR6fK6nR9mgHTZ4BaAhHQHkymVeKKpF1fZQoaAZHQGo/fHggow5oB02fA2gIR0B5NqF49ovjdX2UKGgGR0BCq8Sf16E8aAdN6ANoCEdAeTt7CSA6MnV9lChoBkdAWNKhmGucMGgHTegDaAhHQHk7uaz/p+t1fZQoaAZHwGu6cUVSGahoB00SAWgIR0B5PlMWXTmXdX2UKGgGR8BJp3ZoPCl8aAdNPAFoCEdAeT7AJ9iMHnV9lChoBkfAbI2WszVMEmgHTYsBaAhHQHk/SKR+z+p1fZQoaAZHwGZuqp1ie/ZoB004AWgIR0B5Rq+0w8GLdX2UKGgGR0BpduQZGax5aAdNVgJoCEdAeUdWeYlY2nV9lChoBkfAax/ZaFEiMmgHTUoBaAhHQHlJWx6fJ3h1fZQoaAZHwDVENutOmBRoB00FAWgIR0B5Sik2xY7rdX2UKGgGR0Bncnr6ciGGaAdNcQJoCEdAeV8U1AJLNHV9lChoBkfAa8Uit7rs0GgHS+5oCEdAeWDb2lEZznV9lChoBkdAbUQ4smOU+2gHTR4CaAhHQHlhfrjYI0J1fZQoaAZHwFGAh1Tzd1xoB00LAmgIR0B5YblLeyiVdX2UKGgGR8Bnl4co6S1WaAdNeAFoCEdAeWS+yquKXXV9lChoBkdANbMkMTewcGgHS/BoCEdAeWahOP/7znV9lChoBkfAacGUmD15B2gHTUEBaAhHQHlqjcRDkU91fZQoaAZHwG27zXrdFfBoB01qAWgIR0B5cXLX+VC5dX2UKGgGR8BoYXDUExIraAdNGwFoCEdAeXGsqJ/G2nV9lChoBkfAZNiuU2UB4mgHTTkBaAhHQHl1ioS+QEJ1fZQoaAZHwGL/B8pkPMBoB0v0aAhHQHl2vjfek591fZQoaAZHwGKMJi7TUiJoB0v0aAhHQHl3jPa+N991fZQoaAZHQGTAGhmGucNoB00zAmgIR0B5e5/QSi/PdX2UKGgGR0BtiWgJ1JUYaAdNzQJoCEdAeYOq9GqgiHV9lChoBkfAaOgHmA9V3mgHTTcBaAhHQHmD/8/D+BJ1fZQoaAZHQG9VF23azu5oB01wAWgIR0B5hXPBzmwJdX2UKGgGR0Buqpr30wrUaAdNlQFoCEdAeYYMgU1yenV9lChoBkdAa8p/J/5Ly2gHTdMBaAhHQHmIXgtOEdx1fZQoaAZHwE0elgMMI/toB03rAWgIR0B5i1fTkQwsdX2UKGgGR0Buo6YLLIPtaAdNhAJoCEdAeY4aoMrmQ3V9lChoBkfAbUs78Nx2jmgHTZQBaAhHQHmO8u8K5TZ1fZQoaAZHQGyT66J66atoB03EAmgIR0B5kUPSUkfLdX2UKGgGR8BoEVbor4FiaAdNPQFoCEdAeZGff4yoGnV9lChoBkfAZeCy0rsjV2gHTScBaAhHQHmT/DLr5Zd1fZQoaAZHwGnyYaP0Zm9oB015AWgIR0B5lgXWOIZZdX2UKGgGR8Bnqhmwqy4XaAdNIAFoCEdAeZZmJFb3XnV9lChoBkfAaOKBe5WilGgHTV0BaAhHQHmXheHBUJh1fZQoaAZHQHAgvRVp9JBoB01wAWgIR0B5mBJQLux9dX2UKGgGR8A5/XA/LTx5aAdL7WgIR0B5mPmaH9FXdX2UKGgGR8A3n912aDwpaAdL/GgIR0B5mQxqO939dX2UKGgGR8AS9QCSzPa+aAdNAwFoCEdAeZlPu5SWJXV9lChoBkfAO9nxnWattGgHS/toCEdAeZvEt/WlM3V9lChoBkfAZt7jXFtKqWgHTS8BaAhHQHmiWUjcEeR1fZQoaAZHwGRrgT7EYO5oB0vnaAhHQHmngRsdkrh1fZQoaAZHwGdsSNGViWpoB01CAWgIR0B5p6UOd5IIdX2UKGgGR8BwnCp4rz5HaAdNYAFoCEdAeamhhH9WIXV9lChoBkdAbU+BnSOR1WgHTUEBaAhHQHmqL9If8uV1fZQoaAZHwGZAaTnq3VloB00VAWgIR0B5rFVghKUWdX2UKGgGR8A4tTOPeYUnaAdNOgFoCEdAeazrRjSXt3V9lChoBkfAZmatz0Yj0WgHS/loCEdAea1B0ZFXrHV9lChoBkfAaa9DPWxyGWgHTSUBaAhHQHmv5m29cr11fZQoaAZHwGeLwc5sCT5oB01FAWgIR0B5tBMDfWMCdX2UKGgGR8BjL4YtQKrraAdL42gIR0B5txshxHXmdX2UKGgGR8BqvRRXOnl5aAdNQQFoCEdAebgBCUornXVlLg=="
49
  },
50
  "ep_success_buffer": {
51
  ":type:": "<class 'collections.deque'>",
@@ -78,8 +78,8 @@
78
  },
79
  "n_envs": 16,
80
  "n_steps": 1024,
81
- "gamma": 0.6,
82
- "gae_lambda": 0.48,
83
  "ent_coef": 0.01,
84
  "vf_coef": 0.5,
85
  "max_grad_norm": 0.5,
 
4
  ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
5
  "__module__": "stable_baselines3.common.policies",
6
  "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
7
+ "__init__": "<function ActorCriticPolicy.__init__ at 0x7efded27dca0>",
8
+ "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7efded27dd30>",
9
+ "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7efded27ddc0>",
10
+ "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7efded27de50>",
11
+ "_build": "<function ActorCriticPolicy._build at 0x7efded27dee0>",
12
+ "forward": "<function ActorCriticPolicy.forward at 0x7efded27df70>",
13
+ "extract_features": "<function ActorCriticPolicy.extract_features at 0x7efded202040>",
14
+ "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7efded2020d0>",
15
+ "_predict": "<function ActorCriticPolicy._predict at 0x7efded202160>",
16
+ "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7efded2021f0>",
17
+ "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7efded202280>",
18
+ "predict_values": "<function ActorCriticPolicy.predict_values at 0x7efded202310>",
19
  "__abstractmethods__": "frozenset()",
20
+ "_abc_impl": "<_abc_data object at 0x7efded27c2d0>"
21
  },
22
  "verbose": 1,
23
  "policy_kwargs": {},
 
26
  "_num_timesteps_at_start": 0,
27
  "seed": null,
28
  "action_noise": null,
29
+ "start_time": 1712322094998193614,
30
  "learning_rate": 0.0003,
31
  "tensorboard_log": null,
32
  "_last_obs": {
33
  ":type:": "<class 'numpy.ndarray'>",
34
+ ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAGZhhbxSmOG5qtKvObuD9rVEWvy6okrPuAAAgD8AAIA/hsotPnRNhLxOz8Q5MYscuCr05r0ZhQO5AACAPwAAgD/QZqq+l+5KP100Fz7063C+OUeqvUVlvz0AAAAAAAAAAM19M72P3nm6N6OIuYmrg7TS30a7KqOfOAAAgD8AAIA/M5x1PcPtMrqqpjw8bU65NkPBHLvn3K01AACAPwAAgD8z+1S9rnWJuspfnTlSg5G20TNvutAHtrgAAIA/AACAP/O6tj2PxmG69FQzvLVnF7Z0HL+68quLNQAAgD8AAIA/WlGJPTiqwD0zLAC+RURVvvae5rv1oK69AAAAAAAAAAATqjA+D7BlP16BVbz6dZW+nTHVPbplYr0AAAAAAAAAANPvHT6sxpU/aneYPsmswL7Lsuw9pRPHOwAAAAAAAAAAAGwwPXsanrr6CJS7q9wEtWgUTbr0uao6AACAPwAAgD/m0YG93r2ZPcMDRz4zlGG+FGeFPZurKD0AAAAAAAAAAKYnsb0G+Sw/m3PjPXOhiL6xc586eHkkPQAAAAAAAAAAAPg0O7jm5rmJ3Q66VpmLtVFxmLpr1SY5AACAPwAAgD9aMaI9H031uaQaJrtm6++1mJCwOirDPjoAAIA/AACAP5rZ/ToU3sK6VjB1urXLTTuVXAs7MstevAAAgD8AAIA/lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="
35
  },
36
  "_last_episode_starts": {
37
  ":type:": "<class 'numpy.ndarray'>",
 
45
  "_stats_window_size": 100,
46
  "ep_info_buffer": {
47
  ":type:": "<class 'collections.deque'>",
48
+ ":serialized:": "gAWVQQwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQE46o+fRNRGMAWyUS9iMAXSUR0B9G5wjt5UtdX2UKGgGR0BkWQu/UONHaAdN6ANoCEdAfSBwsGxD9nV9lChoBkdAZbcMUh3aBmgHTegDaAhHQH0qTfrKNhp1fZQoaAZHQGLwXjlxOtZoB03oA2gIR0B9MjCbc45tdX2UKGgGR0BgN8xIre67aAdN6ANoCEdAfUBIcinpCHV9lChoBkdAZnzzRQaaTmgHTegDaAhHQH1XYk/r0J51fZQoaAZHQGJF6F/QSjBoB03oA2gIR0B9Y6+Jxeb/dX2UKGgGR0Bk9//95yEMaAdN6ANoCEdAfW6lXzUZvXV9lChoBkdAZkiY+B6KL2gHTegDaAhHQH1wTUAksz51fZQoaAZHQGLLta6jFhpoB03oA2gIR0B9cY7cO9WZdX2UKGgGR0Bc9SUcGTs6aAdN6ANoCEdAfXRVxjriVHV9lChoBkdAYeGplSS/02gHTegDaAhHQH2EYpMHryF1fZQoaAZHQGPq/+sHSndoB03oA2gIR0B9iGaTfR/mdX2UKGgGR0AjM6QvHtF8aAdL9WgIR0B9jxEPUaybdX2UKGgGR0BkvO6d1+y7aAdN6ANoCEdAfY9VLBbfQHV9lChoBkdAY/ipo9LYgGgHTegDaAhHQH2bvc8DB/J1fZQoaAZHQGA3liSaEzxoB03oA2gIR0B9sKr+5vtMdX2UKGgGR0BVwfIOpbUxaAdN6ANoCEdAfbQI55qubXV9lChoBkdAY4/yEtdzGWgHTegDaAhHQH234+B6KLt1fZQoaAZHQGGtnWz4UN9oB03oA2gIR0B9v3di2DxtdX2UKGgGR0BlQdEuxrzoaAdN6ANoCEdAfcWYtQKrrHV9lChoBkdAZdEu5jH4oWgHTegDaAhHQH3Re4oZydZ1fZQoaAZHQGV/nw5NoJ1oB03oA2gIR0B95Do4dZJTdX2UKGgGR0BmLupMpPRBaAdN6ANoCEdAfe3TA31jAnV9lChoBkdAYjpjx0+1SmgHTegDaAhHQH32G47Rv3t1fZQoaAZHQGT8JXp4bCJoB03oA2gIR0B9+EKUmlZYdX2UKGgGR0BlShgiNbTuaAdN6ANoCEdAffpfyf+S83V9lChoBkdAXnHZAY51eWgHTegDaAhHQH4GqgyuZCx1fZQoaAZHQGUYNOEdvKloB03oA2gIR0B+CZntfG+9dX2UKGgGR0BkHnXoTwlTaAdN6ANoCEdAfg7QRPGhmHV9lChoBkdAYLzkWhysCGgHTegDaAhHQH4PBN21Ul11fZQoaAZHQGCpL1/Ue+5oB03oA2gIR0B+GXNY8uBddX2UKGgGR0BjccR6F/QTaAdN6ANoCEdAfhslvZRKpXV9lChoBkdAaOZFKkEcKmgHTegDaAhHQH43WVAzHjp1fZQoaAZHQGA+Wf9P1thoB03oA2gIR0B+Ot3fQ8fWdX2UKGgGR0Bc9qq814xDaAdN6ANoCEdAfkIHU+cH4XV9lChoBkdAYdlYEGJN02gHTegDaAhHQH5IDoUzsQd1fZQoaAZHQGRvT7l7tzFoB03oA2gIR0B+VBxAB1cMdX2UKGgGR0BlfCScLBsRaAdN6ANoCEdAfmhd/J/5L3V9lChoBkdAYp7/jKgZj2gHTegDaAhHQH5zC9EkSmJ1fZQoaAZHQF4l6jWTX8RoB03oA2gIR0B+fDffoA4odX2UKGgGR0BnANm6GxlhaAdN6ANoCEdAfn6qoZQ53nV9lChoBkdAYYtcHGCI12gHTegDaAhHQH6BLKFIuoR1fZQoaAZHQGTT1Ed/8VJoB03oA2gIR0B+kJ4mkWRBdX2UKGgGR0Bfgrns9jgAaAdN6ANoCEdAfpRhXr+o+HV9lChoBkdAXqEfyPMjeWgHTegDaAhHQH6bGEPDpC91fZQoaAZHQGJA7pV0cOtoB03oA2gIR0B+m1iqhlDndX2UKGgGR0Be0JTER8MNaAdN6ANoCEdAfqeyLQ5WBHV9lChoBkdAYUU6qbSZ0GgHTegDaAhHQH6pvQnhKlJ1fZQoaAZHQGC/l+3H7xdoB03oA2gIR0B+rVsLv1DjdX2UKGgGR0BkChrrPdEcaAdN6ANoCEdAfsZmmtQsPXV9lChoBkdAYNVarWAf+2gHTegDaAhHQH7PJTER8MN1fZQoaAZHQFwSiWVu76JoB03oA2gIR0B+1nHaN+9bdX2UKGgGR0Bj+lV/+bVjaAdN6ANoCEdAfuTP0qYqonV9lChoBkdAZQS32EkB0mgHTegDaAhHQH77OdXko4N1fZQoaAZHQGGgjA8B+4NoB03oA2gIR0B/Behf0EowdX2UKGgGR0Bk9RLCemNzaAdN6ANoCEdAfw82xY7q6nV9lChoBkdAZvOK+i8Fp2gHTegDaAhHQH8RjkMkQf91fZQoaAZHQGS2YNqgyuZoB03oA2gIR0B/E/IikftAdX2UKGgGR0BexIXoC+10aAdN6ANoCEdAfyE2M85jpnV9lChoBkdAZiXVhCtzS2gHTegDaAhHQH8kVhoduHh1fZQoaAZHQGNHrxRVIZtoB03oA2gIR0B/KdLxqfvndX2UKGgGR0BkG9fCyhSMaAdN6ANoCEdAfyoMUAT7EnV9lChoBkdAWxUXcgyM1mgHTegDaAhHQH8033UQTVV1fZQoaAZHQGClehGpdbBoB03oA2gIR0B/NrPw/gR9dX2UKGgGR0BldmQ6p5u7aAdN6ANoCEdAfzncy31BdHV9lChoBkdAZNCLiuMdcWgHTegDaAhHQH9Pj1XeWOZ1fZQoaAZHQGWurUkOZstoB03oA2gIR0B/V52eQMhHdX2UKGgGR0Be9L3sXzlLaAdN6ANoCEdAf16UxVQyh3V9lChoBkdAZC9ReC04R2gHTegDaAhHQH9so0IkZ751fZQoaAZHQF20+RYA80VoB03oA2gIR0B/hBcGC7K8dX2UKGgGR0BkzDj94u9OaAdN6ANoCEdAf5CpEhJRO3V9lChoBkdAXdVObiIcimgHTegDaAhHQH+blyaNMoN1fZQoaAZHQF9t6Skj5bhoB03oA2gIR0B/noKLKmsOdX2UKGgGR0BhIjWsijcmaAdN6ANoCEdAf6GFOfukUXV9lChoBkdAYu3b/wRXfmgHTegDaAhHQH+0UNKAavR1fZQoaAZHQGXf2fkFOfxoB03oA2gIR0B/uMytV7x/dX2UKGgGR0BgeByXD3ueaAdN6ANoCEdAf8CS1Vo6CHV9lChoBkdAYzSiO/+Kj2gHTegDaAhHQH/A5SWJJoV1fZQoaAZHQGUEO7QLNOdoB03oA2gIR0B/zyNMoMKDdX2UKGgGR0BnrDTBqKxcaAdN6ANoCEdAf9FugYgq3HV9lChoBkdAYDZs/IKc/mgHTegDaAhHQH/VdOVPepJ1fZQoaAZHQGJ6ml67dzpoB03oA2gIR0B/2hlz2exwdX2UKGgGR0BfMSgTRIBjaAdN6ANoCEdAf/b2HtWuHXV9lChoBkdAXokgzP8htGgHTegDaAhHQH/+K7mMfih1fZQoaAZHQGJaxf4REndoB03oA2gIR0CABdR64UeudX2UKGgGR0BCe1kUbkwOaAdL/WgIR0CADwwTM7lrdX2UKGgGR0BgjRbW3BpIaAdN6ANoCEdAgBAsaCL/CXV9lChoBkdAY4l1Oj7AL2gHTegDaAhHQIAVGkgwGnp1fZQoaAZHQGIHb0e2d/doB03oA2gIR0CAGWMb3oLYdX2UKGgGR0BkMsbtJFspaAdN6ANoCEdAgBp5ZB9kSXV9lChoBkdAYVjEit7rs2gHTegDaAhHQIAblyPuG9J1fZQoaAZHQGbA+VC5VfhoB03oA2gIR0CAIqmVJL/TdX2UKGgGR0BidUUKzAvdaAdN6ANoCEdAgCR1zySV4XV9lChoBkdAYGVTEzfrKWgHTegDaAhHQIAnoq/dqL11fZQoaAZHQGChQVsUIs1oB03oA2gIR0CAJ8NYr8R+dX2UKGgGR0BidtsJpnHvaAdN6ANoCEdAgC3PLHMlknV9lChoBkdAZEN9MsYl6mgHTegDaAhHQIAuzHlwLmZ1fZQoaAZHQGcpHLzPKMhoB03oA2gIR0CAMI9jgAIZdX2UKGgGR0Bg8IKrq+rVaAdN6ANoCEdAgDK9nbqQinVlLg=="
49
  },
50
  "ep_success_buffer": {
51
  ":type:": "<class 'collections.deque'>",
 
78
  },
79
  "n_envs": 16,
80
  "n_steps": 1024,
81
+ "gamma": 0.999,
82
+ "gae_lambda": 0.98,
83
  "ent_coef": 0.01,
84
  "vf_coef": 0.5,
85
  "max_grad_norm": 0.5,
ppo-LunarLander-v2/policy.optimizer.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:eb8729bad0d8afa9ac2d6eba4cc7a7580f0e6f6c0b7a6c5e8261ba6b14ab06ba
3
  size 87978
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:071ebaa3cc3626b31dff97224b73ddd608e60936def0e5f1e9de8809ef1afd8d
3
  size 87978
ppo-LunarLander-v2/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e2cb2371ec5f31a8f5196323d2b194f832125fb54ee4d79974de9eb760d4368c
3
  size 43634
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:08c8af57f5b771a90f5dfebe93c8b387b828ae0d88f0862b6e2691ed4bc6cc76
3
  size 43634
replay.mp4 CHANGED
Binary files a/replay.mp4 and b/replay.mp4 differ
 
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 4.774459000000002, "std_reward": 138.5829294597152, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2024-04-05T20:58:44.065071"}
 
1
+ {"mean_reward": 230.2089746, "std_reward": 17.25921101590976, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2024-04-05T21:10:19.568394"}