tung491 commited on
Commit
b297e43
1 Parent(s): b852169

Upload PPO LunarLander-v2 trained agent

Browse files
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: LunarLander-v2
17
  metrics:
18
  - type: mean_reward
19
- value: 229.49 +/- 55.46
20
  name: mean_reward
21
  verified: false
22
  ---
 
16
  type: LunarLander-v2
17
  metrics:
18
  - type: mean_reward
19
+ value: 260.72 +/- 19.36
20
  name: mean_reward
21
  verified: false
22
  ---
config.json CHANGED
@@ -1 +1 @@
1
- {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7a9bdf53e560>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7a9bdf53e5f0>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7a9bdf53e680>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7a9bdf53e710>", "_build": "<function ActorCriticPolicy._build at 0x7a9bdf53e7a0>", "forward": "<function ActorCriticPolicy.forward at 0x7a9bdf53e830>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x7a9bdf53e8c0>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7a9bdf53e950>", "_predict": "<function ActorCriticPolicy._predict at 0x7a9bdf53e9e0>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7a9bdf53ea70>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7a9bdf53eb00>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7a9bdf53eb90>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7a9bdf6d9e80>"}, "verbose": true, "policy_kwargs": {}, "num_timesteps": 1015808, "_total_timesteps": 1000000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1711106625402709981, "learning_rate": 0.0003, "tensorboard_log": null, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAAZtjj7FZhc/UgjZPc845r4AME8+0oywvQAAAAAAAAAAWod/Puh94T4iF5u9M5iuvlg2oD0zhNW9AAAAAAAAAAAz+py8S5ySP+syUr1FcR2/QITivMkpgjwAAAAAAAAAAA3VnL32OGe6tbdXulfH4DVb3xw7lVR3OQAAAAAAAAAAnVhrvq+tUD9Kwqu+1O3nvkaqib5Fzi69AAAAAAAAAACaJyO+XH9cvJ07xLrmv/i40v/BPf5LBDoAAIA/AACAPwNnuT62wig/pxAtPZGj074CK0Y+Ng8qvgAAAAAAAAAA0z48Pg5yjbytXw87qzxkueib9L26skK6AACAPwAAgD+zKUC+0F/LPmBTU726I5C+nnzKvf6GpDwAAAAAAAAAABovrT1xHM4+cx/WPGvls77aZAk94vk+vQAAAAAAAAAA03d/PpGD6z2nCMu9iR2DvtvfHz2iJaq8AAAAAAAAAADN9B++D1NevOGXBrv56C+59NbGPXJmOToAAIA/AACAPwCwELtTdb8/CiWdvGqDVj4AVS88tXJCPAAAAAAAAAAAoMMFPly+ZDuiiDm+BYUVvNH8iT01zhm+AACAPwAAgD9TxTk+tMGuvFKM1bppvaI5NgwYvk6dPjoAAIA/AACAPxNAIL5PXkC8IKf7upfXCbnc6qY95isjOgAAgD8AAIA/lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.015808000000000044, "_stats_window_size": 100, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWV9gsAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQGzJ5dWyTpyMAWyUS9yMAXSUR0Ce2QhW5paidX2UKGgGR0By4UlXzUZvaAdL3WgIR0Ce2SqlxffGdX2UKGgGR0BxyAihWYF8aAdL82gIR0CfNo384xUOdX2UKGgGR0BuZng75mAcaAdLyWgIR0CfNplzEJjUdX2UKGgGR0BvZT3AVO9GaAdLyGgIR0CfNzk7wKBvdX2UKGgGR0BzWFvYODraaAdL1GgIR0CfOVkWAPNFdX2UKGgGR0BvLZaRp1zRaAdL2WgIR0CfOp8nNPgvdX2UKGgGR0BwMqKP4mCzaAdL0GgIR0CfO3SL61stdX2UKGgGR0ByxOd9Ujs2aAdLzmgIR0CfO9a1TisGdX2UKGgGR0ByDtTyauwHaAdL1WgIR0CfPWp+tr9EdX2UKGgGR0Bk0MFKTSssaAdN6ANoCEdAnz23+6y0KXV9lChoBkdAcPJvoNd7fGgHS8ZoCEdAnz68lPacqnV9lChoBkdAcikz7uUliWgHS91oCEdAnz/y08eS0XV9lChoBkdAcEw/keZG8WgHTQwBaAhHQJ9DZyWAwwl1fZQoaAZHQGqojI7vG6xoB03gAmgIR0CfQ+jZL7GedX2UKGgGR0BwimXfIjnnaAdL4mgIR0CfRDw8nuzAdX2UKGgGR0BxgR1r6+FlaAdL12gIR0CfRg30f5k9dX2UKGgGR0BvvVSVGCqZaAdL5GgIR0CfRtzj3mFKdX2UKGgGR0BzJIm3OObRaAdNAAFoCEdAn0lGNWEK3XV9lChoBkdAc2oLThHby2gHTQkBaAhHQJ9Jbs5XEIh1fZQoaAZHQHEkc3hn8KpoB0vcaAhHQJ9JofLcKw91fZQoaAZHQHEIUHD7655oB00LAWgIR0CfSnbTMJQddX2UKGgGR0BjLpF5OafBaAdN6ANoCEdAn0tl6E8JU3V9lChoBkdAcdrrupjtomgHS+1oCEdAn0x+ogmqpHV9lChoBkdAcX6OZLIxQGgHS+VoCEdAn0y7EUCaJHV9lChoBkdARGacwxnFpGgHS6hoCEdAn0zqcy31BnV9lChoBkdAcIgQg9vCM2gHS/loCEdAn00x8UmD2HV9lChoBkdAYo6qYqoZRGgHTegDaAhHQJ9NkMqjJuF1fZQoaAZHQHCyhg7YChhoB0vhaAhHQJ9OA77sOXp1fZQoaAZHQHCKQyqMm4RoB0vSaAhHQJ9QmRB/qgR1fZQoaAZHQG0+Dwpe/pNoB0vQaAhHQJ9RToGIKtx1fZQoaAZHQHC13zxwyZdoB0vsaAhHQJ9RV2St/4J1fZQoaAZHQHEF2KdhAnloB0v6aAhHQJ9RsLH+6y11fZQoaAZHQHBv+1Bt1p1oB0vSaAhHQJ9SQ3bVSXN1fZQoaAZHQGZAqHoHLRtoB03oA2gIR0CfUlLiuMdcdX2UKGgGR0BvnZFb3XZoaAdLw2gIR0CfUslOoHcDdX2UKGgGR0BtXMDMeOn3aAdL22gIR0CfU7WyTpxFdX2UKGgGR0BveI/xDst1aAdL12gIR0CfU8R15jYqdX2UKGgGR0BwjkvBacI7aAdL32gIR0CfVDYK6WgOdX2UKGgGR0BfsA8SwnpjaAdN6ANoCEdAn1TKYJE6UHV9lChoBkdAcXEGzKLbYmgHS+ZoCEdAn1UbNB4UvnV9lChoBkdAch8MA3kxRGgHS9FoCEdAn1bZ+MIeHXV9lChoBkdAZI20svqTr2gHTegDaAhHQJ9XCeYlY2d1fZQoaAZHQHF36HXVbzNoB0vKaAhHQJ9YIacZtN11fZQoaAZHQHIkh/EwWWRoB0vyaAhHQJ9YeZZ0Syt1fZQoaAZHQHFtSZKFqSJoB0v3aAhHQJ9YmXMQmNR1fZQoaAZHQG6Mbvw3HaNoB0vPaAhHQJ9YyKUFB6d1fZQoaAZHQHDTyr5qM3toB0vzaAhHQJ9ZVa8pTdd1fZQoaAZHQFoXtO2y9mJoB03oA2gIR0CfWbVtXPqtdX2UKGgGR0BuFx1vES/TaAdNEgFoCEdAn1nE9ECvHXV9lChoBkdAbmKOUdJaq2gHS9xoCEdAn1o0XpGFz3V9lChoBkdAcHW0SAYpD2gHS/BoCEdAn1qxB7eEZnV9lChoBkdAcaawBHTZx2gHS+JoCEdAn1tgJswcpHV9lChoBkdAcqlsFdLQHGgHTRIBaAhHQJ9dIFotcwB1fZQoaAZHQHCdWACnxaxoB0vVaAhHQJ9dSt3fQ8h1fZQoaAZHQHJEWLHdXT5oB0voaAhHQJ9dsKTjebd1fZQoaAZHQHDokka/ATJoB0vBaAhHQJ9d1gy/KyR1fZQoaAZHQGS2BIOH311oB03oA2gIR0CfXjX9zfaYdX2UKGgGR0Bv9dsxfv4NaAdLz2gIR0CfXpIrvsqsdX2UKGgGR0Bv0aDsdDIBaAdLzGgIR0CfX7Hh0hePdX2UKGgGR0BwYGV7hNucaAdL22gIR0CfX7vCMxXXdX2UKGgGR0BxOrlLeyiVaAdL32gIR0CfYDBtk4FSdX2UKGgGR0ByZYa1kUblaAdNBQFoCEdAn2A94Z/CqXV9lChoBkdAbtbrMTviLmgHS9xoCEdAn2EGETQE6nV9lChoBkdAcicTKDCgsmgHTQ4BaAhHQJ9h78Muvll1fZQoaAZHQHEH+UY8+zNoB0v1aAhHQJ9ifAFgUlB1fZQoaAZHQG95ZfdAPd5oB0veaAhHQJ9ji3+dbxF1fZQoaAZHQG9atXPqs2hoB0vSaAhHQJ9jujM3ZPF1fZQoaAZHQHF6Itcv/R5oB0vWaAhHQJ9kWZw4sEt1fZQoaAZHQHD6sVQAMlVoB0vnaAhHQJ9kgQVbiZR1fZQoaAZHQHJaQ6ltTDRoB0vUaAhHQJ9krIbOu7p1fZQoaAZHQHAIcJlar3loB0vQaAhHQJ9lqwcHWz51fZQoaAZHQHFZcYEW69VoB0voaAhHQJ9nDZuhsZZ1fZQoaAZHQHF805uIhyNoB0v7aAhHQJ9nF1ZDArR1fZQoaAZHQHEBWKZUkv9oB0vXaAhHQJ9ofyMDOkd1fZQoaAZHQG/VQRGtp25oB0vgaAhHQJ9pbgk1Muh1fZQoaAZHQG4gPnr6ciJoB0vTaAhHQJ9qSnzg/C91fZQoaAZHQHC6MGxD9floB0vRaAhHQJ9qeB8QZoB1fZQoaAZHQGPvRYJVsDZoB03oA2gIR0CfbBunMt9QdX2UKGgGR0ByCdufmLccaAdL72gIR0CfbHyWAwwkdX2UKGgGR0Bx5z3L3bmEaAdL4GgIR0CfbadonKGMdX2UKGgGR0Bw5r3FkxyoaAdL4WgIR0Cfb/E8aGYbdX2UKGgGR0BvKAZuQ6p6aAdN4wFoCEdAn3MB9LHuJHV9lChoBkdAbVSADJU5uWgHTR4BaAhHQJ9zZSR8twt1fZQoaAZHQHIz0Aksz2xoB0v7aAhHQJ9zzc580DV1fZQoaAZHQHGj68g6ltVoB0vbaAhHQJ90tcyFfzB1fZQoaAZHQHIZNK28Zk1oB0v3aAhHQJ906JKraM91fZQoaAZHQHM2XKB/ZuhoB0vhaAhHQJ91NC7btZ51fZQoaAZHQGWlaisXBP9oB03oA2gIR0CfdoMuOCGvdX2UKGgGR0BwF+V5a/yoaAdL7WgIR0Cfd8RLsa86dX2UKGgGR0Bwws2R7qptaAdL8GgIR0CfeLRsdkrgdX2UKGgGR0Bx6/ktEofCaAdL0WgIR0CfeSJQ+EAYdX2UKGgGR0BxB/LwF1SwaAdL42gIR0Cfe7VLzwtrdX2UKGgGR0BkmjtqpLmIaAdN6ANoCEdAn3vtJrcj7nV9lChoBkdAbuQz+FUQ1GgHS85oCEdAn3wpOWSlnHV9lChoBkdAcFq1UEPlMmgHS+toCEdAn3w6n3ta6nV9lChoBkdAcsg7e2uxKWgHS95oCEdAn3zF63RXwXV9lChoBkdAcErcJ+lTFWgHS+9oCEdAn317drO7hHV9lChoBkdAcQFyRjjJdWgHS95oCEdAn33pM6BAfXV9lChoBkdAcRIjghr302gHS81oCEdAn36Fyq+8G3VlLg=="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 380, "observation_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVdgIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWCAAAAAAAAAABAQEBAQEBAZRoCIwCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoESiWCAAAAAAAAAABAQEBAQEBAZRoFUsIhZRoGXSUUpSMBl9zaGFwZZRLCIWUjANsb3eUaBEoliAAAAAAAAAAAAC0wgAAtMIAAKDAAACgwNsPScAAAKDAAAAAgAAAAICUaAtLCIWUaBl0lFKUjARoaWdolGgRKJYgAAAAAAAAAAAAtEIAALRCAACgQAAAoEDbD0lAAACgQAAAgD8AAIA/lGgLSwiFlGgZdJRSlIwIbG93X3JlcHKUjFtbLTkwLiAgICAgICAgLTkwLiAgICAgICAgIC01LiAgICAgICAgIC01LiAgICAgICAgIC0zLjE0MTU5MjcgIC01LgogIC0wLiAgICAgICAgIC0wLiAgICAgICBdlIwJaGlnaF9yZXBylIxTWzkwLiAgICAgICAgOTAuICAgICAgICAgNS4gICAgICAgICA1LiAgICAgICAgIDMuMTQxNTkyNyAgNS4KICAxLiAgICAgICAgIDEuICAgICAgIF2UjApfbnBfcmFuZG9tlE51Yi4=", "dtype": "float32", "bounded_below": "[ True True True True True True True True]", "bounded_above": "[ True True True True True True True True]", "_shape": [8], "low": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "low_repr": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high_repr": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "_np_random": null}, "action_space": {":type:": "<class 'gymnasium.spaces.discrete.Discrete'>", ":serialized:": "gAWV2wAAAAAAAACMGWd5bW5hc2l1bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIBAAAAAAAAACUhpRSlIwFc3RhcnSUaAhoDkMIAAAAAAAAAACUhpRSlIwGX3NoYXBllCmMBWR0eXBllGgOjApfbnBfcmFuZG9tlE51Yi4=", "n": "4", "start": "0", "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 16, "n_steps": 2048, "gamma": 0.99, "gae_lambda": 0.95, "ent_coef": 0.0, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 10, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz/JmZmZmZmahZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz8zqSowVTJhhZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "system_info": {"OS": "Linux-6.1.58+-x86_64-with-glibc2.35 # 1 SMP PREEMPT_DYNAMIC Sat Nov 18 15:31:17 UTC 2023", "Python": "3.10.12", "Stable-Baselines3": "2.0.0a5", "PyTorch": "2.2.1+cu121", "GPU Enabled": "True", "Numpy": "1.25.2", "Cloudpickle": "2.2.1", "Gymnasium": "0.28.1", "OpenAI Gym": "0.25.2"}}
 
1
+ {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7c5f53a89630>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7c5f53a896c0>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7c5f53a89750>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7c5f53a897e0>", "_build": "<function ActorCriticPolicy._build at 0x7c5f53a89870>", "forward": "<function ActorCriticPolicy.forward at 0x7c5f53a89900>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x7c5f53a89990>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7c5f53a89a20>", "_predict": "<function ActorCriticPolicy._predict at 0x7c5f53a89ab0>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7c5f53a89b40>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7c5f53a89bd0>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7c5f53a89c60>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7c5f53a8cb40>"}, "verbose": 1, "policy_kwargs": {}, "num_timesteps": 1507328, "_total_timesteps": 1500000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1711526485592841125, "learning_rate": 0.0003, "tensorboard_log": null, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAACbLmr24l5C7Z2CGuyqOsjzMBu68Q0qWPQAAgD8AAIA/Bhg1vn2GUz5aYK89/i5TvjYpnLzSyL27AAAAAAAAAADmh6+9ubOXP+Ib5b6FcxS/Yze0vQ9TQb4AAAAAAAAAAOalMT1Iv5G6i379NES4Li1S5cQ6iFVqtAAAgD8AAIA/gE9tvQV5oLs3u0c8tEEXPH5L37xezgU9AACAPwAAgD9Apgu+pwFPPjRWwj3HiTG+KrmVvB+1tDwAAAAAAAAAAJr3n71NW1c/sqJevZm47b4jIBK9m8EfvAAAAAAAAAAAM20EPOwv6D7Er5S82QeevnB/fjxh7ii9AAAAAAAAAACNwC6+ewuGvFU2druMWa+5DHP5Peo1pDoAAIA/AACAP5oOnDxIEo0/qp4aPeaYCL867+08lpI5vQAAAAAAAAAA03Ayvu7PnbzC/ii8rVO7uqu1Bz64LZQ7AACAPwAAgD8aBjU9xabvPG4LV70SMy6+drqkO5/ZHjwAAAAAAAAAAJrsib6tb+0+aKJhPkqEvL6oZq69Jls+PgAAAAAAAAAAzZRrPSecvj8YUQA/byI7Ptgv5jyaawI+AAAAAAAAAABNWRC+gbUjP6pVfTzVkdm+t4g+vYp/Kj0AAAAAAAAAAEDhI76cZUi8wwmzOraBajloTqk9ulAcugAAgD8AAIA/lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.004885333333333408, "_stats_window_size": 100, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWV/wsAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQHCDcafjCHiMAWyUS/6MAXSUR0CgIcodMj/udX2UKGgGR0Bw+Bvze40/aAdL+GgIR0CgIeFXJYDDdX2UKGgGR0BwRfY+Sr5qaAdL4WgIR0CgIfIsZpBYdX2UKGgGR0BupV43WFviaAdL4mgIR0CgIfki2UjcdX2UKGgGR0Bya8XvYvnKaAdL7mgIR0CgIkzK9wm3dX2UKGgGR0Bxy5V94NZvaAdL/2gIR0CgIl6hxo7FdX2UKGgGR0BwGtPDYRNAaAdL5mgIR0CgIoG0/nnudX2UKGgGR0BvbimoBJZoaAdL7WgIR0CgI15s0pEydX2UKGgGR0BwiMiJO32FaAdL/mgIR0CgI3ZSeiBYdX2UKGgGR0BylxESdvsJaAdL/2gIR0CgI4mmce8xdX2UKGgGR0BvWJh+fAbiaAdL5GgIR0CgI+EGZ/kOdX2UKGgGR0ByUh0q6OHWaAdL9mgIR0CgJDGGdqcmdX2UKGgGR0BxWkyyleniaAdL72gIR0CgJOZz5oGqdX2UKGgGR0BxTF1bJOnEaAdL2WgIR0CgJPI/7iyZdX2UKGgGR0BwUPfAKv3baAdL12gIR0CgJPzEaVD8dX2UKGgGR0BfffrfLs8gaAdN6ANoCEdAoCUhEfDDTHV9lChoBkdAbyfokAxSHmgHTQMBaAhHQKAlcPsAvL51fZQoaAZHQG8VgI6bONZoB0v/aAhHQKAljXSSeRR1fZQoaAZHQHHsNgSeyzJoB0v7aAhHQKAl0M5wOvt1fZQoaAZHQHHUBrJr+HdoB0v4aAhHQKAl2K/mDDl1fZQoaAZHQG4akHt4RmNoB0v6aAhHQKAmAm1pj+d1fZQoaAZHQHDG8zZYgaFoB0v3aAhHQKAm1CPZIxx1fZQoaAZHQHDr1uR9w3poB0v1aAhHQKAm4sTWXkZ1fZQoaAZHQGxPVr6+FlFoB0v9aAhHQKAnFKSxJNF1fZQoaAZHQHLbRUm2LHdoB00SAWgIR0CgKBanzg/DdX2UKGgGR0Bx7V8gIQe4aAdL+2gIR0CgKIIIF/x2dX2UKGgGR0BxECX9itq6aAdNBgFoCEdAoCi/ymQ8wHV9lChoBkdAcd/XtjTa02gHTQQBaAhHQKAoxElVtGd1fZQoaAZHQG4mx2St/4JoB0vqaAhHQKApBhAnlXB1fZQoaAZHQHIzNwJgLJFoB00VAWgIR0CgKTPh60IDdX2UKGgGR0Bxb81k1/DtaAdL6WgIR0CgKVy8J2MbdX2UKGgGR0Bw/jgm7aqTaAdL62gIR0CgKV0FKTStdX2UKGgGR0BytbjIaLn+aAdNgQFoCEdAoCmPN3W4E3V9lChoBkdAbkMK3uuzQmgHS+poCEdAoCmT6P8ye3V9lChoBkdAcOnHavicXmgHS/BoCEdAoCpvn2ZiNXV9lChoBkdAbJM+JP69CmgHS/ZoCEdAoCqUygwoLHV9lChoBkdAbwy5EMLF42gHS/JoCEdAoCq2R7qptXV9lChoBkdAcwPlSS/0umgHS/NoCEdAoCuuM4tHx3V9lChoBkdAcLVXyiEg4mgHS+xoCEdAoCv64SYgJXV9lChoBkdAcbuvwmVqvmgHS+loCEdAoCwr6N2ki3V9lChoBkdAcOq+L3sXzmgHS9hoCEdAoCyDreIl+nV9lChoBkdAcljNJvo/zWgHS+5oCEdAoCyHgUDdQHV9lChoBkdAckbAood+5WgHS+loCEdAoCzGqioKlnV9lChoBkdAceI7Qb+98WgHS/FoCEdAoC0ZC8e0X3V9lChoBkdAchEN21UlzGgHTRsBaAhHQKAtW6U7jkx1fZQoaAZHQHBDYIKMNttoB00HAWgIR0CgLWZavA45dX2UKGgGR0Bw5xKODJ2daAdNRgFoCEdAoC2RJNCZ4XV9lChoBkdATh2AEt/WlWgHS9loCEdAoC3tpTMq0HV9lChoBkdAbrP8cdYGMWgHS/poCEdAoC5Ho1UEPnV9lChoBkdAYcsHZ9NN8GgHTegDaAhHQKAuUENe+mF1fZQoaAZHQHDjx15jYqZoB00KAWgIR0CgLmXsw+MZdX2UKGgGR0BwsNdhRZU2aAdL7GgIR0CgLzL1EmY0dX2UKGgGR0Bu8ZfOUt7KaAdL8mgIR0CgL4w2VE/jdX2UKGgGR0BwGY1xbSqmaAdL+2gIR0CgL99ycTakdX2UKGgGR0BuFT7XQMQVaAdL52gIR0CgL9/WDpTudX2UKGgGR0BcxU4JeE7GaAdN6ANoCEdAoDAbDKoybnV9lChoBkdAcU17kXDWLGgHTRwBaAhHQKAwrQ5WBBl1fZQoaAZHQHMqnZXdTHdoB00NAWgIR0CgMLLTH80ldX2UKGgGR0BwcXmW+oLoaAdNAAFoCEdAoDDaCg9Ne3V9lChoBkdAbMfyJbdJrmgHS/RoCEdAoDDw0EX+EXV9lChoBkdAcHfJhfBvaWgHS+doCEdAoDD4DzRQanV9lChoBkdAcM4DlHSWq2gHS9poCEdAoDF5JiAlOXV9lChoBkdAckmBYFJQL2gHS/poCEdAoDGWQGOdXnV9lChoBkdAcmNPppvgnGgHTSMBaAhHQKAxn1q33Ht1fZQoaAZHQHDmupS75EdoB0v7aAhHQKAx+/pt78h1fZQoaAZHQHFNR15jYqZoB00QAWgIR0CgMjILgGbDdX2UKGgGR0A+hqp97WupaAdLg2gIR0CgMoXC0ngHdX2UKGgGR0BxzF63RXwLaAdL8GgIR0CgMrHYxtYTdX2UKGgGR0ByOvHyVfNSaAdL5mgIR0CgMvQdS2pidX2UKGgGR0BwrLyvs7dSaAdL52gIR0CgM1b3fyf+dX2UKGgGR0BzUxC9h7VsaAdLyWgIR0CgM/MKb8WLdX2UKGgGR0ByPbFaSs8xaAdNDQFoCEdAoDQGr8zhxnV9lChoBkdAZHU11GLDRGgHTegDaAhHQKA0Zgnc+JR1fZQoaAZHQG88ubAk9lpoB0vxaAhHQKA0gRFI/aB1fZQoaAZHQHG11abF0gdoB00kAWgIR0CgNMEyULUkdX2UKGgGR0Bw3a+evpyIaAdL7mgIR0CgNMoMjNY9dX2UKGgGR0Bx99Ukv9LpaAdNDQFoCEdAoDVOu9vjwXV9lChoBkdAcO/fKp1ifGgHS+poCEdAoDWTT+ee4HV9lChoBkdAcEE9uP3i72gHTQIBaAhHQKA2AYqG1x91fZQoaAZHQHFDL2L5ylxoB0vhaAhHQKA2qgAZKnN1fZQoaAZHQHJYcPatcOdoB00NAWgIR0CgNwLVvuPWdX2UKGgGR0Bwno8aGYa6aAdNEQFoCEdAoDeEcXFcZHV9lChoBkdAcUxNBWxQi2gHS+9oCEdAoDeMxTKkmHV9lChoBkdAcU+/3WWhRWgHTQgBaAhHQKA3mKXOW0J1fZQoaAZHQHFky0KJEYxoB0vvaAhHQKA4F8jzI3l1fZQoaAZHQHAv1WS2Yv5oB0v0aAhHQKA4eK8+Ro11fZQoaAZHQHKfeRT0g8toB00OAWgIR0CgOIIZIg/1dX2UKGgGR0Bxom8oQWepaAdL+2gIR0CgOOXCTEBKdX2UKGgGR0Bwwxk+X7cgaAdL6WgIR0CgORC22G7BdX2UKGgGR0BvN4t6HCXQaAdNrgFoCEdAoDkn9YOlPHV9lChoBkdAcEXgBcRlH2gHTQABaAhHQKA5m6RQrMF1fZQoaAZHQG/ZTgVGkN5oB0v1aAhHQKA5wjDbah91fZQoaAZHQHJ0KRZEDyRoB0vhaAhHQKA5/CLuQZJ1fZQoaAZHQG5PFJQLux9oB0vyaAhHQKA6lriVB2R1fZQoaAZHQGxa7Z39rGloB0vpaAhHQKA7C1JlJ6J1fZQoaAZHQG/fG7BfrrxoB0vyaAhHQKA7KoddVvN1fZQoaAZHQHCToqwyIpJoB00DAWgIR0CgO4G5UcXFdX2UKGgGR0BvQQF1SwW4aAdL52gIR0CgPAPz4DcNdX2UKGgGR0BylrBCUornaAdL62gIR0CgPB1zIV/MdX2UKGgGR0BwqJJZntfHaAdNDAFoCEdAoDw1Jaq0dHVlLg=="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 460, "observation_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVdgIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWCAAAAAAAAAABAQEBAQEBAZRoCIwCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoESiWCAAAAAAAAAABAQEBAQEBAZRoFUsIhZRoGXSUUpSMBl9zaGFwZZRLCIWUjANsb3eUaBEoliAAAAAAAAAAAAC0wgAAtMIAAKDAAACgwNsPScAAAKDAAAAAgAAAAICUaAtLCIWUaBl0lFKUjARoaWdolGgRKJYgAAAAAAAAAAAAtEIAALRCAACgQAAAoEDbD0lAAACgQAAAgD8AAIA/lGgLSwiFlGgZdJRSlIwIbG93X3JlcHKUjFtbLTkwLiAgICAgICAgLTkwLiAgICAgICAgIC01LiAgICAgICAgIC01LiAgICAgICAgIC0zLjE0MTU5MjcgIC01LgogIC0wLiAgICAgICAgIC0wLiAgICAgICBdlIwJaGlnaF9yZXBylIxTWzkwLiAgICAgICAgOTAuICAgICAgICAgNS4gICAgICAgICA1LiAgICAgICAgIDMuMTQxNTkyNyAgNS4KICAxLiAgICAgICAgIDEuICAgICAgIF2UjApfbnBfcmFuZG9tlE51Yi4=", "dtype": "float32", "bounded_below": "[ True True True True True True True True]", "bounded_above": "[ True True True True True True True True]", "_shape": [8], "low": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "low_repr": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high_repr": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "_np_random": null}, "action_space": {":type:": "<class 'gymnasium.spaces.discrete.Discrete'>", ":serialized:": "gAWV2wAAAAAAAACMGWd5bW5hc2l1bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIBAAAAAAAAACUhpRSlIwFc3RhcnSUaAhoDkMIAAAAAAAAAACUhpRSlIwGX3NoYXBllCmMBWR0eXBllGgOjApfbnBfcmFuZG9tlE51Yi4=", "n": "4", "start": "0", "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 16, "n_steps": 2048, "gamma": 0.99, "gae_lambda": 0.95, "ent_coef": 0.0, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 10, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz/JmZmZmZmahZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz8zqSowVTJhhZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "system_info": {"OS": "Linux-6.1.58+-x86_64-with-glibc2.35 # 1 SMP PREEMPT_DYNAMIC Sat Nov 18 15:31:17 UTC 2023", "Python": "3.10.12", "Stable-Baselines3": "2.0.0a5", "PyTorch": "2.2.1+cu121", "GPU Enabled": "True", "Numpy": "1.25.2", "Cloudpickle": "2.2.1", "Gymnasium": "0.28.1", "OpenAI Gym": "0.25.2"}}
ppo-LunarLander-v2.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f9d2d527e1b889eb822cbd333376de146bf1a55bb6c0770eae1c30629134160a
3
- size 147986
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:214052fbaad774ff9a82075ec9a7200500332bc73d1d77d2a86d33711a887c03
3
+ size 147995
ppo-LunarLander-v2/data CHANGED
@@ -4,34 +4,34 @@
4
  ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
5
  "__module__": "stable_baselines3.common.policies",
6
  "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
7
- "__init__": "<function ActorCriticPolicy.__init__ at 0x7a9bdf53e560>",
8
- "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7a9bdf53e5f0>",
9
- "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7a9bdf53e680>",
10
- "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7a9bdf53e710>",
11
- "_build": "<function ActorCriticPolicy._build at 0x7a9bdf53e7a0>",
12
- "forward": "<function ActorCriticPolicy.forward at 0x7a9bdf53e830>",
13
- "extract_features": "<function ActorCriticPolicy.extract_features at 0x7a9bdf53e8c0>",
14
- "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7a9bdf53e950>",
15
- "_predict": "<function ActorCriticPolicy._predict at 0x7a9bdf53e9e0>",
16
- "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7a9bdf53ea70>",
17
- "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7a9bdf53eb00>",
18
- "predict_values": "<function ActorCriticPolicy.predict_values at 0x7a9bdf53eb90>",
19
  "__abstractmethods__": "frozenset()",
20
- "_abc_impl": "<_abc._abc_data object at 0x7a9bdf6d9e80>"
21
  },
22
- "verbose": true,
23
  "policy_kwargs": {},
24
- "num_timesteps": 1015808,
25
- "_total_timesteps": 1000000,
26
  "_num_timesteps_at_start": 0,
27
  "seed": null,
28
  "action_noise": null,
29
- "start_time": 1711106625402709981,
30
  "learning_rate": 0.0003,
31
  "tensorboard_log": null,
32
  "_last_obs": {
33
  ":type:": "<class 'numpy.ndarray'>",
34
- ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAAZtjj7FZhc/UgjZPc845r4AME8+0oywvQAAAAAAAAAAWod/Puh94T4iF5u9M5iuvlg2oD0zhNW9AAAAAAAAAAAz+py8S5ySP+syUr1FcR2/QITivMkpgjwAAAAAAAAAAA3VnL32OGe6tbdXulfH4DVb3xw7lVR3OQAAAAAAAAAAnVhrvq+tUD9Kwqu+1O3nvkaqib5Fzi69AAAAAAAAAACaJyO+XH9cvJ07xLrmv/i40v/BPf5LBDoAAIA/AACAPwNnuT62wig/pxAtPZGj074CK0Y+Ng8qvgAAAAAAAAAA0z48Pg5yjbytXw87qzxkueib9L26skK6AACAPwAAgD+zKUC+0F/LPmBTU726I5C+nnzKvf6GpDwAAAAAAAAAABovrT1xHM4+cx/WPGvls77aZAk94vk+vQAAAAAAAAAA03d/PpGD6z2nCMu9iR2DvtvfHz2iJaq8AAAAAAAAAADN9B++D1NevOGXBrv56C+59NbGPXJmOToAAIA/AACAPwCwELtTdb8/CiWdvGqDVj4AVS88tXJCPAAAAAAAAAAAoMMFPly+ZDuiiDm+BYUVvNH8iT01zhm+AACAPwAAgD9TxTk+tMGuvFKM1bppvaI5NgwYvk6dPjoAAIA/AACAPxNAIL5PXkC8IKf7upfXCbnc6qY95isjOgAAgD8AAIA/lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="
35
  },
36
  "_last_episode_starts": {
37
  ":type:": "<class 'numpy.ndarray'>",
@@ -41,17 +41,17 @@
41
  "_episode_num": 0,
42
  "use_sde": false,
43
  "sde_sample_freq": -1,
44
- "_current_progress_remaining": -0.015808000000000044,
45
  "_stats_window_size": 100,
46
  "ep_info_buffer": {
47
  ":type:": "<class 'collections.deque'>",
48
- ":serialized:": "gAWV9gsAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQGzJ5dWyTpyMAWyUS9yMAXSUR0Ce2QhW5paidX2UKGgGR0By4UlXzUZvaAdL3WgIR0Ce2SqlxffGdX2UKGgGR0BxyAihWYF8aAdL82gIR0CfNo384xUOdX2UKGgGR0BuZng75mAcaAdLyWgIR0CfNplzEJjUdX2UKGgGR0BvZT3AVO9GaAdLyGgIR0CfNzk7wKBvdX2UKGgGR0BzWFvYODraaAdL1GgIR0CfOVkWAPNFdX2UKGgGR0BvLZaRp1zRaAdL2WgIR0CfOp8nNPgvdX2UKGgGR0BwMqKP4mCzaAdL0GgIR0CfO3SL61stdX2UKGgGR0ByxOd9Ujs2aAdLzmgIR0CfO9a1TisGdX2UKGgGR0ByDtTyauwHaAdL1WgIR0CfPWp+tr9EdX2UKGgGR0Bk0MFKTSssaAdN6ANoCEdAnz23+6y0KXV9lChoBkdAcPJvoNd7fGgHS8ZoCEdAnz68lPacqnV9lChoBkdAcikz7uUliWgHS91oCEdAnz/y08eS0XV9lChoBkdAcEw/keZG8WgHTQwBaAhHQJ9DZyWAwwl1fZQoaAZHQGqojI7vG6xoB03gAmgIR0CfQ+jZL7GedX2UKGgGR0BwimXfIjnnaAdL4mgIR0CfRDw8nuzAdX2UKGgGR0BxgR1r6+FlaAdL12gIR0CfRg30f5k9dX2UKGgGR0BvvVSVGCqZaAdL5GgIR0CfRtzj3mFKdX2UKGgGR0BzJIm3OObRaAdNAAFoCEdAn0lGNWEK3XV9lChoBkdAc2oLThHby2gHTQkBaAhHQJ9Jbs5XEIh1fZQoaAZHQHEkc3hn8KpoB0vcaAhHQJ9JofLcKw91fZQoaAZHQHEIUHD7655oB00LAWgIR0CfSnbTMJQddX2UKGgGR0BjLpF5OafBaAdN6ANoCEdAn0tl6E8JU3V9lChoBkdAcdrrupjtomgHS+1oCEdAn0x+ogmqpHV9lChoBkdAcX6OZLIxQGgHS+VoCEdAn0y7EUCaJHV9lChoBkdARGacwxnFpGgHS6hoCEdAn0zqcy31BnV9lChoBkdAcIgQg9vCM2gHS/loCEdAn00x8UmD2HV9lChoBkdAYo6qYqoZRGgHTegDaAhHQJ9NkMqjJuF1fZQoaAZHQHCyhg7YChhoB0vhaAhHQJ9OA77sOXp1fZQoaAZHQHCKQyqMm4RoB0vSaAhHQJ9QmRB/qgR1fZQoaAZHQG0+Dwpe/pNoB0vQaAhHQJ9RToGIKtx1fZQoaAZHQHC13zxwyZdoB0vsaAhHQJ9RV2St/4J1fZQoaAZHQHEF2KdhAnloB0v6aAhHQJ9RsLH+6y11fZQoaAZHQHBv+1Bt1p1oB0vSaAhHQJ9SQ3bVSXN1fZQoaAZHQGZAqHoHLRtoB03oA2gIR0CfUlLiuMdcdX2UKGgGR0BvnZFb3XZoaAdLw2gIR0CfUslOoHcDdX2UKGgGR0BtXMDMeOn3aAdL22gIR0CfU7WyTpxFdX2UKGgGR0BveI/xDst1aAdL12gIR0CfU8R15jYqdX2UKGgGR0BwjkvBacI7aAdL32gIR0CfVDYK6WgOdX2UKGgGR0BfsA8SwnpjaAdN6ANoCEdAn1TKYJE6UHV9lChoBkdAcXEGzKLbYmgHS+ZoCEdAn1UbNB4UvnV9lChoBkdAch8MA3kxRGgHS9FoCEdAn1bZ+MIeHXV9lChoBkdAZI20svqTr2gHTegDaAhHQJ9XCeYlY2d1fZQoaAZHQHF36HXVbzNoB0vKaAhHQJ9YIacZtN11fZQoaAZHQHIkh/EwWWRoB0vyaAhHQJ9YeZZ0Syt1fZQoaAZHQHFtSZKFqSJoB0v3aAhHQJ9YmXMQmNR1fZQoaAZHQG6Mbvw3HaNoB0vPaAhHQJ9YyKUFB6d1fZQoaAZHQHDTyr5qM3toB0vzaAhHQJ9ZVa8pTdd1fZQoaAZHQFoXtO2y9mJoB03oA2gIR0CfWbVtXPqtdX2UKGgGR0BuFx1vES/TaAdNEgFoCEdAn1nE9ECvHXV9lChoBkdAbmKOUdJaq2gHS9xoCEdAn1o0XpGFz3V9lChoBkdAcHW0SAYpD2gHS/BoCEdAn1qxB7eEZnV9lChoBkdAcaawBHTZx2gHS+JoCEdAn1tgJswcpHV9lChoBkdAcqlsFdLQHGgHTRIBaAhHQJ9dIFotcwB1fZQoaAZHQHCdWACnxaxoB0vVaAhHQJ9dSt3fQ8h1fZQoaAZHQHJEWLHdXT5oB0voaAhHQJ9dsKTjebd1fZQoaAZHQHDokka/ATJoB0vBaAhHQJ9d1gy/KyR1fZQoaAZHQGS2BIOH311oB03oA2gIR0CfXjX9zfaYdX2UKGgGR0Bv9dsxfv4NaAdLz2gIR0CfXpIrvsqsdX2UKGgGR0Bv0aDsdDIBaAdLzGgIR0CfX7Hh0hePdX2UKGgGR0BwYGV7hNucaAdL22gIR0CfX7vCMxXXdX2UKGgGR0BxOrlLeyiVaAdL32gIR0CfYDBtk4FSdX2UKGgGR0ByZYa1kUblaAdNBQFoCEdAn2A94Z/CqXV9lChoBkdAbtbrMTviLmgHS9xoCEdAn2EGETQE6nV9lChoBkdAcicTKDCgsmgHTQ4BaAhHQJ9h78Muvll1fZQoaAZHQHEH+UY8+zNoB0v1aAhHQJ9ifAFgUlB1fZQoaAZHQG95ZfdAPd5oB0veaAhHQJ9ji3+dbxF1fZQoaAZHQG9atXPqs2hoB0vSaAhHQJ9jujM3ZPF1fZQoaAZHQHF6Itcv/R5oB0vWaAhHQJ9kWZw4sEt1fZQoaAZHQHD6sVQAMlVoB0vnaAhHQJ9kgQVbiZR1fZQoaAZHQHJaQ6ltTDRoB0vUaAhHQJ9krIbOu7p1fZQoaAZHQHAIcJlar3loB0vQaAhHQJ9lqwcHWz51fZQoaAZHQHFZcYEW69VoB0voaAhHQJ9nDZuhsZZ1fZQoaAZHQHF805uIhyNoB0v7aAhHQJ9nF1ZDArR1fZQoaAZHQHEBWKZUkv9oB0vXaAhHQJ9ofyMDOkd1fZQoaAZHQG/VQRGtp25oB0vgaAhHQJ9pbgk1Muh1fZQoaAZHQG4gPnr6ciJoB0vTaAhHQJ9qSnzg/C91fZQoaAZHQHC6MGxD9floB0vRaAhHQJ9qeB8QZoB1fZQoaAZHQGPvRYJVsDZoB03oA2gIR0CfbBunMt9QdX2UKGgGR0ByCdufmLccaAdL72gIR0CfbHyWAwwkdX2UKGgGR0Bx5z3L3bmEaAdL4GgIR0CfbadonKGMdX2UKGgGR0Bw5r3FkxyoaAdL4WgIR0Cfb/E8aGYbdX2UKGgGR0BvKAZuQ6p6aAdN4wFoCEdAn3MB9LHuJHV9lChoBkdAbVSADJU5uWgHTR4BaAhHQJ9zZSR8twt1fZQoaAZHQHIz0Aksz2xoB0v7aAhHQJ9zzc580DV1fZQoaAZHQHGj68g6ltVoB0vbaAhHQJ90tcyFfzB1fZQoaAZHQHIZNK28Zk1oB0v3aAhHQJ906JKraM91fZQoaAZHQHM2XKB/ZuhoB0vhaAhHQJ91NC7btZ51fZQoaAZHQGWlaisXBP9oB03oA2gIR0CfdoMuOCGvdX2UKGgGR0BwF+V5a/yoaAdL7WgIR0Cfd8RLsa86dX2UKGgGR0Bwws2R7qptaAdL8GgIR0CfeLRsdkrgdX2UKGgGR0Bx6/ktEofCaAdL0WgIR0CfeSJQ+EAYdX2UKGgGR0BxB/LwF1SwaAdL42gIR0Cfe7VLzwtrdX2UKGgGR0BkmjtqpLmIaAdN6ANoCEdAn3vtJrcj7nV9lChoBkdAbuQz+FUQ1GgHS85oCEdAn3wpOWSlnHV9lChoBkdAcFq1UEPlMmgHS+toCEdAn3w6n3ta6nV9lChoBkdAcsg7e2uxKWgHS95oCEdAn3zF63RXwXV9lChoBkdAcErcJ+lTFWgHS+9oCEdAn317drO7hHV9lChoBkdAcQFyRjjJdWgHS95oCEdAn33pM6BAfXV9lChoBkdAcRIjghr302gHS81oCEdAn36Fyq+8G3VlLg=="
49
  },
50
  "ep_success_buffer": {
51
  ":type:": "<class 'collections.deque'>",
52
  ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
53
  },
54
- "_n_updates": 380,
55
  "observation_space": {
56
  ":type:": "<class 'gymnasium.spaces.box.Box'>",
57
  ":serialized:": "gAWVdgIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWCAAAAAAAAAABAQEBAQEBAZRoCIwCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoESiWCAAAAAAAAAABAQEBAQEBAZRoFUsIhZRoGXSUUpSMBl9zaGFwZZRLCIWUjANsb3eUaBEoliAAAAAAAAAAAAC0wgAAtMIAAKDAAACgwNsPScAAAKDAAAAAgAAAAICUaAtLCIWUaBl0lFKUjARoaWdolGgRKJYgAAAAAAAAAAAAtEIAALRCAACgQAAAoEDbD0lAAACgQAAAgD8AAIA/lGgLSwiFlGgZdJRSlIwIbG93X3JlcHKUjFtbLTkwLiAgICAgICAgLTkwLiAgICAgICAgIC01LiAgICAgICAgIC01LiAgICAgICAgIC0zLjE0MTU5MjcgIC01LgogIC0wLiAgICAgICAgIC0wLiAgICAgICBdlIwJaGlnaF9yZXBylIxTWzkwLiAgICAgICAgOTAuICAgICAgICAgNS4gICAgICAgICA1LiAgICAgICAgIDMuMTQxNTkyNyAgNS4KICAxLiAgICAgICAgIDEuICAgICAgIF2UjApfbnBfcmFuZG9tlE51Yi4=",
 
4
  ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
5
  "__module__": "stable_baselines3.common.policies",
6
  "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
7
+ "__init__": "<function ActorCriticPolicy.__init__ at 0x7c5f53a89630>",
8
+ "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7c5f53a896c0>",
9
+ "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7c5f53a89750>",
10
+ "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7c5f53a897e0>",
11
+ "_build": "<function ActorCriticPolicy._build at 0x7c5f53a89870>",
12
+ "forward": "<function ActorCriticPolicy.forward at 0x7c5f53a89900>",
13
+ "extract_features": "<function ActorCriticPolicy.extract_features at 0x7c5f53a89990>",
14
+ "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7c5f53a89a20>",
15
+ "_predict": "<function ActorCriticPolicy._predict at 0x7c5f53a89ab0>",
16
+ "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7c5f53a89b40>",
17
+ "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7c5f53a89bd0>",
18
+ "predict_values": "<function ActorCriticPolicy.predict_values at 0x7c5f53a89c60>",
19
  "__abstractmethods__": "frozenset()",
20
+ "_abc_impl": "<_abc._abc_data object at 0x7c5f53a8cb40>"
21
  },
22
+ "verbose": 1,
23
  "policy_kwargs": {},
24
+ "num_timesteps": 1507328,
25
+ "_total_timesteps": 1500000,
26
  "_num_timesteps_at_start": 0,
27
  "seed": null,
28
  "action_noise": null,
29
+ "start_time": 1711526485592841125,
30
  "learning_rate": 0.0003,
31
  "tensorboard_log": null,
32
  "_last_obs": {
33
  ":type:": "<class 'numpy.ndarray'>",
34
+ ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAACbLmr24l5C7Z2CGuyqOsjzMBu68Q0qWPQAAgD8AAIA/Bhg1vn2GUz5aYK89/i5TvjYpnLzSyL27AAAAAAAAAADmh6+9ubOXP+Ib5b6FcxS/Yze0vQ9TQb4AAAAAAAAAAOalMT1Iv5G6i379NES4Li1S5cQ6iFVqtAAAgD8AAIA/gE9tvQV5oLs3u0c8tEEXPH5L37xezgU9AACAPwAAgD9Apgu+pwFPPjRWwj3HiTG+KrmVvB+1tDwAAAAAAAAAAJr3n71NW1c/sqJevZm47b4jIBK9m8EfvAAAAAAAAAAAM20EPOwv6D7Er5S82QeevnB/fjxh7ii9AAAAAAAAAACNwC6+ewuGvFU2druMWa+5DHP5Peo1pDoAAIA/AACAP5oOnDxIEo0/qp4aPeaYCL867+08lpI5vQAAAAAAAAAA03Ayvu7PnbzC/ii8rVO7uqu1Bz64LZQ7AACAPwAAgD8aBjU9xabvPG4LV70SMy6+drqkO5/ZHjwAAAAAAAAAAJrsib6tb+0+aKJhPkqEvL6oZq69Jls+PgAAAAAAAAAAzZRrPSecvj8YUQA/byI7Ptgv5jyaawI+AAAAAAAAAABNWRC+gbUjP6pVfTzVkdm+t4g+vYp/Kj0AAAAAAAAAAEDhI76cZUi8wwmzOraBajloTqk9ulAcugAAgD8AAIA/lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="
35
  },
36
  "_last_episode_starts": {
37
  ":type:": "<class 'numpy.ndarray'>",
 
41
  "_episode_num": 0,
42
  "use_sde": false,
43
  "sde_sample_freq": -1,
44
+ "_current_progress_remaining": -0.004885333333333408,
45
  "_stats_window_size": 100,
46
  "ep_info_buffer": {
47
  ":type:": "<class 'collections.deque'>",
48
+ ":serialized:": "gAWV/wsAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQHCDcafjCHiMAWyUS/6MAXSUR0CgIcodMj/udX2UKGgGR0Bw+Bvze40/aAdL+GgIR0CgIeFXJYDDdX2UKGgGR0BwRfY+Sr5qaAdL4WgIR0CgIfIsZpBYdX2UKGgGR0BupV43WFviaAdL4mgIR0CgIfki2UjcdX2UKGgGR0Bya8XvYvnKaAdL7mgIR0CgIkzK9wm3dX2UKGgGR0Bxy5V94NZvaAdL/2gIR0CgIl6hxo7FdX2UKGgGR0BwGtPDYRNAaAdL5mgIR0CgIoG0/nnudX2UKGgGR0BvbimoBJZoaAdL7WgIR0CgI15s0pEydX2UKGgGR0BwiMiJO32FaAdL/mgIR0CgI3ZSeiBYdX2UKGgGR0BylxESdvsJaAdL/2gIR0CgI4mmce8xdX2UKGgGR0BvWJh+fAbiaAdL5GgIR0CgI+EGZ/kOdX2UKGgGR0ByUh0q6OHWaAdL9mgIR0CgJDGGdqcmdX2UKGgGR0BxWkyyleniaAdL72gIR0CgJOZz5oGqdX2UKGgGR0BxTF1bJOnEaAdL2WgIR0CgJPI/7iyZdX2UKGgGR0BwUPfAKv3baAdL12gIR0CgJPzEaVD8dX2UKGgGR0BfffrfLs8gaAdN6ANoCEdAoCUhEfDDTHV9lChoBkdAbyfokAxSHmgHTQMBaAhHQKAlcPsAvL51fZQoaAZHQG8VgI6bONZoB0v/aAhHQKAljXSSeRR1fZQoaAZHQHHsNgSeyzJoB0v7aAhHQKAl0M5wOvt1fZQoaAZHQHHUBrJr+HdoB0v4aAhHQKAl2K/mDDl1fZQoaAZHQG4akHt4RmNoB0v6aAhHQKAmAm1pj+d1fZQoaAZHQHDG8zZYgaFoB0v3aAhHQKAm1CPZIxx1fZQoaAZHQHDr1uR9w3poB0v1aAhHQKAm4sTWXkZ1fZQoaAZHQGxPVr6+FlFoB0v9aAhHQKAnFKSxJNF1fZQoaAZHQHLbRUm2LHdoB00SAWgIR0CgKBanzg/DdX2UKGgGR0Bx7V8gIQe4aAdL+2gIR0CgKIIIF/x2dX2UKGgGR0BxECX9itq6aAdNBgFoCEdAoCi/ymQ8wHV9lChoBkdAcd/XtjTa02gHTQQBaAhHQKAoxElVtGd1fZQoaAZHQG4mx2St/4JoB0vqaAhHQKApBhAnlXB1fZQoaAZHQHIzNwJgLJFoB00VAWgIR0CgKTPh60IDdX2UKGgGR0Bxb81k1/DtaAdL6WgIR0CgKVy8J2MbdX2UKGgGR0Bw/jgm7aqTaAdL62gIR0CgKV0FKTStdX2UKGgGR0BytbjIaLn+aAdNgQFoCEdAoCmPN3W4E3V9lChoBkdAbkMK3uuzQmgHS+poCEdAoCmT6P8ye3V9lChoBkdAcOnHavicXmgHS/BoCEdAoCpvn2ZiNXV9lChoBkdAbJM+JP69CmgHS/ZoCEdAoCqUygwoLHV9lChoBkdAbwy5EMLF42gHS/JoCEdAoCq2R7qptXV9lChoBkdAcwPlSS/0umgHS/NoCEdAoCuuM4tHx3V9lChoBkdAcLVXyiEg4mgHS+xoCEdAoCv64SYgJXV9lChoBkdAcbuvwmVqvmgHS+loCEdAoCwr6N2ki3V9lChoBkdAcOq+L3sXzmgHS9hoCEdAoCyDreIl+nV9lChoBkdAcljNJvo/zWgHS+5oCEdAoCyHgUDdQHV9lChoBkdAckbAood+5WgHS+loCEdAoCzGqioKlnV9lChoBkdAceI7Qb+98WgHS/FoCEdAoC0ZC8e0X3V9lChoBkdAchEN21UlzGgHTRsBaAhHQKAtW6U7jkx1fZQoaAZHQHBDYIKMNttoB00HAWgIR0CgLWZavA45dX2UKGgGR0Bw5xKODJ2daAdNRgFoCEdAoC2RJNCZ4XV9lChoBkdATh2AEt/WlWgHS9loCEdAoC3tpTMq0HV9lChoBkdAbrP8cdYGMWgHS/poCEdAoC5Ho1UEPnV9lChoBkdAYcsHZ9NN8GgHTegDaAhHQKAuUENe+mF1fZQoaAZHQHDjx15jYqZoB00KAWgIR0CgLmXsw+MZdX2UKGgGR0BwsNdhRZU2aAdL7GgIR0CgLzL1EmY0dX2UKGgGR0Bu8ZfOUt7KaAdL8mgIR0CgL4w2VE/jdX2UKGgGR0BwGY1xbSqmaAdL+2gIR0CgL99ycTakdX2UKGgGR0BuFT7XQMQVaAdL52gIR0CgL9/WDpTudX2UKGgGR0BcxU4JeE7GaAdN6ANoCEdAoDAbDKoybnV9lChoBkdAcU17kXDWLGgHTRwBaAhHQKAwrQ5WBBl1fZQoaAZHQHMqnZXdTHdoB00NAWgIR0CgMLLTH80ldX2UKGgGR0BwcXmW+oLoaAdNAAFoCEdAoDDaCg9Ne3V9lChoBkdAbMfyJbdJrmgHS/RoCEdAoDDw0EX+EXV9lChoBkdAcHfJhfBvaWgHS+doCEdAoDD4DzRQanV9lChoBkdAcM4DlHSWq2gHS9poCEdAoDF5JiAlOXV9lChoBkdAckmBYFJQL2gHS/poCEdAoDGWQGOdXnV9lChoBkdAcmNPppvgnGgHTSMBaAhHQKAxn1q33Ht1fZQoaAZHQHDmupS75EdoB0v7aAhHQKAx+/pt78h1fZQoaAZHQHFNR15jYqZoB00QAWgIR0CgMjILgGbDdX2UKGgGR0A+hqp97WupaAdLg2gIR0CgMoXC0ngHdX2UKGgGR0BxzF63RXwLaAdL8GgIR0CgMrHYxtYTdX2UKGgGR0ByOvHyVfNSaAdL5mgIR0CgMvQdS2pidX2UKGgGR0BwrLyvs7dSaAdL52gIR0CgM1b3fyf+dX2UKGgGR0BzUxC9h7VsaAdLyWgIR0CgM/MKb8WLdX2UKGgGR0ByPbFaSs8xaAdNDQFoCEdAoDQGr8zhxnV9lChoBkdAZHU11GLDRGgHTegDaAhHQKA0Zgnc+JR1fZQoaAZHQG88ubAk9lpoB0vxaAhHQKA0gRFI/aB1fZQoaAZHQHG11abF0gdoB00kAWgIR0CgNMEyULUkdX2UKGgGR0Bw3a+evpyIaAdL7mgIR0CgNMoMjNY9dX2UKGgGR0Bx99Ukv9LpaAdNDQFoCEdAoDVOu9vjwXV9lChoBkdAcO/fKp1ifGgHS+poCEdAoDWTT+ee4HV9lChoBkdAcEE9uP3i72gHTQIBaAhHQKA2AYqG1x91fZQoaAZHQHFDL2L5ylxoB0vhaAhHQKA2qgAZKnN1fZQoaAZHQHJYcPatcOdoB00NAWgIR0CgNwLVvuPWdX2UKGgGR0Bwno8aGYa6aAdNEQFoCEdAoDeEcXFcZHV9lChoBkdAcUxNBWxQi2gHS+9oCEdAoDeMxTKkmHV9lChoBkdAcU+/3WWhRWgHTQgBaAhHQKA3mKXOW0J1fZQoaAZHQHFky0KJEYxoB0vvaAhHQKA4F8jzI3l1fZQoaAZHQHAv1WS2Yv5oB0v0aAhHQKA4eK8+Ro11fZQoaAZHQHKfeRT0g8toB00OAWgIR0CgOIIZIg/1dX2UKGgGR0Bxom8oQWepaAdL+2gIR0CgOOXCTEBKdX2UKGgGR0Bwwxk+X7cgaAdL6WgIR0CgORC22G7BdX2UKGgGR0BvN4t6HCXQaAdNrgFoCEdAoDkn9YOlPHV9lChoBkdAcEXgBcRlH2gHTQABaAhHQKA5m6RQrMF1fZQoaAZHQG/ZTgVGkN5oB0v1aAhHQKA5wjDbah91fZQoaAZHQHJ0KRZEDyRoB0vhaAhHQKA5/CLuQZJ1fZQoaAZHQG5PFJQLux9oB0vyaAhHQKA6lriVB2R1fZQoaAZHQGxa7Z39rGloB0vpaAhHQKA7C1JlJ6J1fZQoaAZHQG/fG7BfrrxoB0vyaAhHQKA7KoddVvN1fZQoaAZHQHCToqwyIpJoB00DAWgIR0CgO4G5UcXFdX2UKGgGR0BvQQF1SwW4aAdL52gIR0CgPAPz4DcNdX2UKGgGR0BylrBCUornaAdL62gIR0CgPB1zIV/MdX2UKGgGR0BwqJJZntfHaAdNDAFoCEdAoDw1Jaq0dHVlLg=="
49
  },
50
  "ep_success_buffer": {
51
  ":type:": "<class 'collections.deque'>",
52
  ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
53
  },
54
+ "_n_updates": 460,
55
  "observation_space": {
56
  ":type:": "<class 'gymnasium.spaces.box.Box'>",
57
  ":serialized:": "gAWVdgIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWCAAAAAAAAAABAQEBAQEBAZRoCIwCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoESiWCAAAAAAAAAABAQEBAQEBAZRoFUsIhZRoGXSUUpSMBl9zaGFwZZRLCIWUjANsb3eUaBEoliAAAAAAAAAAAAC0wgAAtMIAAKDAAACgwNsPScAAAKDAAAAAgAAAAICUaAtLCIWUaBl0lFKUjARoaWdolGgRKJYgAAAAAAAAAAAAtEIAALRCAACgQAAAoEDbD0lAAACgQAAAgD8AAIA/lGgLSwiFlGgZdJRSlIwIbG93X3JlcHKUjFtbLTkwLiAgICAgICAgLTkwLiAgICAgICAgIC01LiAgICAgICAgIC01LiAgICAgICAgIC0zLjE0MTU5MjcgIC01LgogIC0wLiAgICAgICAgIC0wLiAgICAgICBdlIwJaGlnaF9yZXBylIxTWzkwLiAgICAgICAgOTAuICAgICAgICAgNS4gICAgICAgICA1LiAgICAgICAgIDMuMTQxNTkyNyAgNS4KICAxLiAgICAgICAgIDEuICAgICAgIF2UjApfbnBfcmFuZG9tlE51Yi4=",
ppo-LunarLander-v2/policy.optimizer.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6882b9adc455d7990be81def618d86566d7b6f87970ce88db00affd9c5c4e293
3
  size 88362
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ef1939840e3bfaa6070a7e7d081c0c7cc25ecfa165e2008006a10f115ca93e9e
3
  size 88362
ppo-LunarLander-v2/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d153b7946bb2010952c00bb5232382758151c382ddbc2552dc1c82325cd26366
3
  size 43762
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aca183006757871e1b9905993aa53300ca461c3b20a027b500d03c956a65047f
3
  size 43762
replay.mp4 CHANGED
Binary files a/replay.mp4 and b/replay.mp4 differ
 
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 229.4870018, "std_reward": 55.459437173393965, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2024-03-22T11:55:20.039660"}
 
1
+ {"mean_reward": 260.72180706618326, "std_reward": 19.360104937819813, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2024-03-27T08:35:58.861285"}