Upload PPO LunarLander-v2 trained agent
Browse files- README.md +1 -1
- config.json +1 -1
- ppo-LunarLander-v2.zip +2 -2
- ppo-LunarLander-v2/data +21 -21
- ppo-LunarLander-v2/policy.optimizer.pth +1 -1
- ppo-LunarLander-v2/policy.pth +1 -1
- replay.mp4 +0 -0
- results.json +1 -1
README.md
CHANGED
@@ -16,7 +16,7 @@ model-index:
|
|
16 |
type: LunarLander-v2
|
17 |
metrics:
|
18 |
- type: mean_reward
|
19 |
-
value:
|
20 |
name: mean_reward
|
21 |
verified: false
|
22 |
---
|
|
|
16 |
type: LunarLander-v2
|
17 |
metrics:
|
18 |
- type: mean_reward
|
19 |
+
value: 260.72 +/- 19.36
|
20 |
name: mean_reward
|
21 |
verified: false
|
22 |
---
|
config.json
CHANGED
@@ -1 +1 @@
|
|
1 |
-
{"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7a9bdf53e560>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7a9bdf53e5f0>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7a9bdf53e680>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7a9bdf53e710>", "_build": "<function ActorCriticPolicy._build at 0x7a9bdf53e7a0>", "forward": "<function ActorCriticPolicy.forward at 0x7a9bdf53e830>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x7a9bdf53e8c0>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7a9bdf53e950>", "_predict": "<function ActorCriticPolicy._predict at 0x7a9bdf53e9e0>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7a9bdf53ea70>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7a9bdf53eb00>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7a9bdf53eb90>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7a9bdf6d9e80>"}, "verbose": true, "policy_kwargs": {}, "num_timesteps": 1015808, "_total_timesteps": 1000000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1711106625402709981, "learning_rate": 0.0003, "tensorboard_log": null, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAAZtjj7FZhc/UgjZPc845r4AME8+0oywvQAAAAAAAAAAWod/Puh94T4iF5u9M5iuvlg2oD0zhNW9AAAAAAAAAAAz+py8S5ySP+syUr1FcR2/QITivMkpgjwAAAAAAAAAAA3VnL32OGe6tbdXulfH4DVb3xw7lVR3OQAAAAAAAAAAnVhrvq+tUD9Kwqu+1O3nvkaqib5Fzi69AAAAAAAAAACaJyO+XH9cvJ07xLrmv/i40v/BPf5LBDoAAIA/AACAPwNnuT62wig/pxAtPZGj074CK0Y+Ng8qvgAAAAAAAAAA0z48Pg5yjbytXw87qzxkueib9L26skK6AACAPwAAgD+zKUC+0F/LPmBTU726I5C+nnzKvf6GpDwAAAAAAAAAABovrT1xHM4+cx/WPGvls77aZAk94vk+vQAAAAAAAAAA03d/PpGD6z2nCMu9iR2DvtvfHz2iJaq8AAAAAAAAAADN9B++D1NevOGXBrv56C+59NbGPXJmOToAAIA/AACAPwCwELtTdb8/CiWdvGqDVj4AVS88tXJCPAAAAAAAAAAAoMMFPly+ZDuiiDm+BYUVvNH8iT01zhm+AACAPwAAgD9TxTk+tMGuvFKM1bppvaI5NgwYvk6dPjoAAIA/AACAPxNAIL5PXkC8IKf7upfXCbnc6qY95isjOgAAgD8AAIA/lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.015808000000000044, "_stats_window_size": 100, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWV9gsAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQGzJ5dWyTpyMAWyUS9yMAXSUR0Ce2QhW5paidX2UKGgGR0By4UlXzUZvaAdL3WgIR0Ce2SqlxffGdX2UKGgGR0BxyAihWYF8aAdL82gIR0CfNo384xUOdX2UKGgGR0BuZng75mAcaAdLyWgIR0CfNplzEJjUdX2UKGgGR0BvZT3AVO9GaAdLyGgIR0CfNzk7wKBvdX2UKGgGR0BzWFvYODraaAdL1GgIR0CfOVkWAPNFdX2UKGgGR0BvLZaRp1zRaAdL2WgIR0CfOp8nNPgvdX2UKGgGR0BwMqKP4mCzaAdL0GgIR0CfO3SL61stdX2UKGgGR0ByxOd9Ujs2aAdLzmgIR0CfO9a1TisGdX2UKGgGR0ByDtTyauwHaAdL1WgIR0CfPWp+tr9EdX2UKGgGR0Bk0MFKTSssaAdN6ANoCEdAnz23+6y0KXV9lChoBkdAcPJvoNd7fGgHS8ZoCEdAnz68lPacqnV9lChoBkdAcikz7uUliWgHS91oCEdAnz/y08eS0XV9lChoBkdAcEw/keZG8WgHTQwBaAhHQJ9DZyWAwwl1fZQoaAZHQGqojI7vG6xoB03gAmgIR0CfQ+jZL7GedX2UKGgGR0BwimXfIjnnaAdL4mgIR0CfRDw8nuzAdX2UKGgGR0BxgR1r6+FlaAdL12gIR0CfRg30f5k9dX2UKGgGR0BvvVSVGCqZaAdL5GgIR0CfRtzj3mFKdX2UKGgGR0BzJIm3OObRaAdNAAFoCEdAn0lGNWEK3XV9lChoBkdAc2oLThHby2gHTQkBaAhHQJ9Jbs5XEIh1fZQoaAZHQHEkc3hn8KpoB0vcaAhHQJ9JofLcKw91fZQoaAZHQHEIUHD7655oB00LAWgIR0CfSnbTMJQddX2UKGgGR0BjLpF5OafBaAdN6ANoCEdAn0tl6E8JU3V9lChoBkdAcdrrupjtomgHS+1oCEdAn0x+ogmqpHV9lChoBkdAcX6OZLIxQGgHS+VoCEdAn0y7EUCaJHV9lChoBkdARGacwxnFpGgHS6hoCEdAn0zqcy31BnV9lChoBkdAcIgQg9vCM2gHS/loCEdAn00x8UmD2HV9lChoBkdAYo6qYqoZRGgHTegDaAhHQJ9NkMqjJuF1fZQoaAZHQHCyhg7YChhoB0vhaAhHQJ9OA77sOXp1fZQoaAZHQHCKQyqMm4RoB0vSaAhHQJ9QmRB/qgR1fZQoaAZHQG0+Dwpe/pNoB0vQaAhHQJ9RToGIKtx1fZQoaAZHQHC13zxwyZdoB0vsaAhHQJ9RV2St/4J1fZQoaAZHQHEF2KdhAnloB0v6aAhHQJ9RsLH+6y11fZQoaAZHQHBv+1Bt1p1oB0vSaAhHQJ9SQ3bVSXN1fZQoaAZHQGZAqHoHLRtoB03oA2gIR0CfUlLiuMdcdX2UKGgGR0BvnZFb3XZoaAdLw2gIR0CfUslOoHcDdX2UKGgGR0BtXMDMeOn3aAdL22gIR0CfU7WyTpxFdX2UKGgGR0BveI/xDst1aAdL12gIR0CfU8R15jYqdX2UKGgGR0BwjkvBacI7aAdL32gIR0CfVDYK6WgOdX2UKGgGR0BfsA8SwnpjaAdN6ANoCEdAn1TKYJE6UHV9lChoBkdAcXEGzKLbYmgHS+ZoCEdAn1UbNB4UvnV9lChoBkdAch8MA3kxRGgHS9FoCEdAn1bZ+MIeHXV9lChoBkdAZI20svqTr2gHTegDaAhHQJ9XCeYlY2d1fZQoaAZHQHF36HXVbzNoB0vKaAhHQJ9YIacZtN11fZQoaAZHQHIkh/EwWWRoB0vyaAhHQJ9YeZZ0Syt1fZQoaAZHQHFtSZKFqSJoB0v3aAhHQJ9YmXMQmNR1fZQoaAZHQG6Mbvw3HaNoB0vPaAhHQJ9YyKUFB6d1fZQoaAZHQHDTyr5qM3toB0vzaAhHQJ9ZVa8pTdd1fZQoaAZHQFoXtO2y9mJoB03oA2gIR0CfWbVtXPqtdX2UKGgGR0BuFx1vES/TaAdNEgFoCEdAn1nE9ECvHXV9lChoBkdAbmKOUdJaq2gHS9xoCEdAn1o0XpGFz3V9lChoBkdAcHW0SAYpD2gHS/BoCEdAn1qxB7eEZnV9lChoBkdAcaawBHTZx2gHS+JoCEdAn1tgJswcpHV9lChoBkdAcqlsFdLQHGgHTRIBaAhHQJ9dIFotcwB1fZQoaAZHQHCdWACnxaxoB0vVaAhHQJ9dSt3fQ8h1fZQoaAZHQHJEWLHdXT5oB0voaAhHQJ9dsKTjebd1fZQoaAZHQHDokka/ATJoB0vBaAhHQJ9d1gy/KyR1fZQoaAZHQGS2BIOH311oB03oA2gIR0CfXjX9zfaYdX2UKGgGR0Bv9dsxfv4NaAdLz2gIR0CfXpIrvsqsdX2UKGgGR0Bv0aDsdDIBaAdLzGgIR0CfX7Hh0hePdX2UKGgGR0BwYGV7hNucaAdL22gIR0CfX7vCMxXXdX2UKGgGR0BxOrlLeyiVaAdL32gIR0CfYDBtk4FSdX2UKGgGR0ByZYa1kUblaAdNBQFoCEdAn2A94Z/CqXV9lChoBkdAbtbrMTviLmgHS9xoCEdAn2EGETQE6nV9lChoBkdAcicTKDCgsmgHTQ4BaAhHQJ9h78Muvll1fZQoaAZHQHEH+UY8+zNoB0v1aAhHQJ9ifAFgUlB1fZQoaAZHQG95ZfdAPd5oB0veaAhHQJ9ji3+dbxF1fZQoaAZHQG9atXPqs2hoB0vSaAhHQJ9jujM3ZPF1fZQoaAZHQHF6Itcv/R5oB0vWaAhHQJ9kWZw4sEt1fZQoaAZHQHD6sVQAMlVoB0vnaAhHQJ9kgQVbiZR1fZQoaAZHQHJaQ6ltTDRoB0vUaAhHQJ9krIbOu7p1fZQoaAZHQHAIcJlar3loB0vQaAhHQJ9lqwcHWz51fZQoaAZHQHFZcYEW69VoB0voaAhHQJ9nDZuhsZZ1fZQoaAZHQHF805uIhyNoB0v7aAhHQJ9nF1ZDArR1fZQoaAZHQHEBWKZUkv9oB0vXaAhHQJ9ofyMDOkd1fZQoaAZHQG/VQRGtp25oB0vgaAhHQJ9pbgk1Muh1fZQoaAZHQG4gPnr6ciJoB0vTaAhHQJ9qSnzg/C91fZQoaAZHQHC6MGxD9floB0vRaAhHQJ9qeB8QZoB1fZQoaAZHQGPvRYJVsDZoB03oA2gIR0CfbBunMt9QdX2UKGgGR0ByCdufmLccaAdL72gIR0CfbHyWAwwkdX2UKGgGR0Bx5z3L3bmEaAdL4GgIR0CfbadonKGMdX2UKGgGR0Bw5r3FkxyoaAdL4WgIR0Cfb/E8aGYbdX2UKGgGR0BvKAZuQ6p6aAdN4wFoCEdAn3MB9LHuJHV9lChoBkdAbVSADJU5uWgHTR4BaAhHQJ9zZSR8twt1fZQoaAZHQHIz0Aksz2xoB0v7aAhHQJ9zzc580DV1fZQoaAZHQHGj68g6ltVoB0vbaAhHQJ90tcyFfzB1fZQoaAZHQHIZNK28Zk1oB0v3aAhHQJ906JKraM91fZQoaAZHQHM2XKB/ZuhoB0vhaAhHQJ91NC7btZ51fZQoaAZHQGWlaisXBP9oB03oA2gIR0CfdoMuOCGvdX2UKGgGR0BwF+V5a/yoaAdL7WgIR0Cfd8RLsa86dX2UKGgGR0Bwws2R7qptaAdL8GgIR0CfeLRsdkrgdX2UKGgGR0Bx6/ktEofCaAdL0WgIR0CfeSJQ+EAYdX2UKGgGR0BxB/LwF1SwaAdL42gIR0Cfe7VLzwtrdX2UKGgGR0BkmjtqpLmIaAdN6ANoCEdAn3vtJrcj7nV9lChoBkdAbuQz+FUQ1GgHS85oCEdAn3wpOWSlnHV9lChoBkdAcFq1UEPlMmgHS+toCEdAn3w6n3ta6nV9lChoBkdAcsg7e2uxKWgHS95oCEdAn3zF63RXwXV9lChoBkdAcErcJ+lTFWgHS+9oCEdAn317drO7hHV9lChoBkdAcQFyRjjJdWgHS95oCEdAn33pM6BAfXV9lChoBkdAcRIjghr302gHS81oCEdAn36Fyq+8G3VlLg=="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 380, "observation_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVdgIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWCAAAAAAAAAABAQEBAQEBAZRoCIwCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoESiWCAAAAAAAAAABAQEBAQEBAZRoFUsIhZRoGXSUUpSMBl9zaGFwZZRLCIWUjANsb3eUaBEoliAAAAAAAAAAAAC0wgAAtMIAAKDAAACgwNsPScAAAKDAAAAAgAAAAICUaAtLCIWUaBl0lFKUjARoaWdolGgRKJYgAAAAAAAAAAAAtEIAALRCAACgQAAAoEDbD0lAAACgQAAAgD8AAIA/lGgLSwiFlGgZdJRSlIwIbG93X3JlcHKUjFtbLTkwLiAgICAgICAgLTkwLiAgICAgICAgIC01LiAgICAgICAgIC01LiAgICAgICAgIC0zLjE0MTU5MjcgIC01LgogIC0wLiAgICAgICAgIC0wLiAgICAgICBdlIwJaGlnaF9yZXBylIxTWzkwLiAgICAgICAgOTAuICAgICAgICAgNS4gICAgICAgICA1LiAgICAgICAgIDMuMTQxNTkyNyAgNS4KICAxLiAgICAgICAgIDEuICAgICAgIF2UjApfbnBfcmFuZG9tlE51Yi4=", "dtype": "float32", "bounded_below": "[ True True True True True True True True]", "bounded_above": "[ True True True True True True True True]", "_shape": [8], "low": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "low_repr": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high_repr": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "_np_random": null}, "action_space": {":type:": "<class 'gymnasium.spaces.discrete.Discrete'>", ":serialized:": "gAWV2wAAAAAAAACMGWd5bW5hc2l1bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIBAAAAAAAAACUhpRSlIwFc3RhcnSUaAhoDkMIAAAAAAAAAACUhpRSlIwGX3NoYXBllCmMBWR0eXBllGgOjApfbnBfcmFuZG9tlE51Yi4=", "n": "4", "start": "0", "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 16, "n_steps": 2048, "gamma": 0.99, "gae_lambda": 0.95, "ent_coef": 0.0, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 10, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz/JmZmZmZmahZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz8zqSowVTJhhZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "system_info": {"OS": "Linux-6.1.58+-x86_64-with-glibc2.35 # 1 SMP PREEMPT_DYNAMIC Sat Nov 18 15:31:17 UTC 2023", "Python": "3.10.12", "Stable-Baselines3": "2.0.0a5", "PyTorch": "2.2.1+cu121", "GPU Enabled": "True", "Numpy": "1.25.2", "Cloudpickle": "2.2.1", "Gymnasium": "0.28.1", "OpenAI Gym": "0.25.2"}}
|
|
|
1 |
+
{"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7c5f53a89630>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7c5f53a896c0>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7c5f53a89750>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7c5f53a897e0>", "_build": "<function ActorCriticPolicy._build at 0x7c5f53a89870>", "forward": "<function ActorCriticPolicy.forward at 0x7c5f53a89900>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x7c5f53a89990>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7c5f53a89a20>", "_predict": "<function ActorCriticPolicy._predict at 0x7c5f53a89ab0>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7c5f53a89b40>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7c5f53a89bd0>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7c5f53a89c60>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7c5f53a8cb40>"}, "verbose": 1, "policy_kwargs": {}, "num_timesteps": 1507328, "_total_timesteps": 1500000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1711526485592841125, "learning_rate": 0.0003, "tensorboard_log": null, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAACbLmr24l5C7Z2CGuyqOsjzMBu68Q0qWPQAAgD8AAIA/Bhg1vn2GUz5aYK89/i5TvjYpnLzSyL27AAAAAAAAAADmh6+9ubOXP+Ib5b6FcxS/Yze0vQ9TQb4AAAAAAAAAAOalMT1Iv5G6i379NES4Li1S5cQ6iFVqtAAAgD8AAIA/gE9tvQV5oLs3u0c8tEEXPH5L37xezgU9AACAPwAAgD9Apgu+pwFPPjRWwj3HiTG+KrmVvB+1tDwAAAAAAAAAAJr3n71NW1c/sqJevZm47b4jIBK9m8EfvAAAAAAAAAAAM20EPOwv6D7Er5S82QeevnB/fjxh7ii9AAAAAAAAAACNwC6+ewuGvFU2druMWa+5DHP5Peo1pDoAAIA/AACAP5oOnDxIEo0/qp4aPeaYCL867+08lpI5vQAAAAAAAAAA03Ayvu7PnbzC/ii8rVO7uqu1Bz64LZQ7AACAPwAAgD8aBjU9xabvPG4LV70SMy6+drqkO5/ZHjwAAAAAAAAAAJrsib6tb+0+aKJhPkqEvL6oZq69Jls+PgAAAAAAAAAAzZRrPSecvj8YUQA/byI7Ptgv5jyaawI+AAAAAAAAAABNWRC+gbUjP6pVfTzVkdm+t4g+vYp/Kj0AAAAAAAAAAEDhI76cZUi8wwmzOraBajloTqk9ulAcugAAgD8AAIA/lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.004885333333333408, "_stats_window_size": 100, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWV/wsAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQHCDcafjCHiMAWyUS/6MAXSUR0CgIcodMj/udX2UKGgGR0Bw+Bvze40/aAdL+GgIR0CgIeFXJYDDdX2UKGgGR0BwRfY+Sr5qaAdL4WgIR0CgIfIsZpBYdX2UKGgGR0BupV43WFviaAdL4mgIR0CgIfki2UjcdX2UKGgGR0Bya8XvYvnKaAdL7mgIR0CgIkzK9wm3dX2UKGgGR0Bxy5V94NZvaAdL/2gIR0CgIl6hxo7FdX2UKGgGR0BwGtPDYRNAaAdL5mgIR0CgIoG0/nnudX2UKGgGR0BvbimoBJZoaAdL7WgIR0CgI15s0pEydX2UKGgGR0BwiMiJO32FaAdL/mgIR0CgI3ZSeiBYdX2UKGgGR0BylxESdvsJaAdL/2gIR0CgI4mmce8xdX2UKGgGR0BvWJh+fAbiaAdL5GgIR0CgI+EGZ/kOdX2UKGgGR0ByUh0q6OHWaAdL9mgIR0CgJDGGdqcmdX2UKGgGR0BxWkyyleniaAdL72gIR0CgJOZz5oGqdX2UKGgGR0BxTF1bJOnEaAdL2WgIR0CgJPI/7iyZdX2UKGgGR0BwUPfAKv3baAdL12gIR0CgJPzEaVD8dX2UKGgGR0BfffrfLs8gaAdN6ANoCEdAoCUhEfDDTHV9lChoBkdAbyfokAxSHmgHTQMBaAhHQKAlcPsAvL51fZQoaAZHQG8VgI6bONZoB0v/aAhHQKAljXSSeRR1fZQoaAZHQHHsNgSeyzJoB0v7aAhHQKAl0M5wOvt1fZQoaAZHQHHUBrJr+HdoB0v4aAhHQKAl2K/mDDl1fZQoaAZHQG4akHt4RmNoB0v6aAhHQKAmAm1pj+d1fZQoaAZHQHDG8zZYgaFoB0v3aAhHQKAm1CPZIxx1fZQoaAZHQHDr1uR9w3poB0v1aAhHQKAm4sTWXkZ1fZQoaAZHQGxPVr6+FlFoB0v9aAhHQKAnFKSxJNF1fZQoaAZHQHLbRUm2LHdoB00SAWgIR0CgKBanzg/DdX2UKGgGR0Bx7V8gIQe4aAdL+2gIR0CgKIIIF/x2dX2UKGgGR0BxECX9itq6aAdNBgFoCEdAoCi/ymQ8wHV9lChoBkdAcd/XtjTa02gHTQQBaAhHQKAoxElVtGd1fZQoaAZHQG4mx2St/4JoB0vqaAhHQKApBhAnlXB1fZQoaAZHQHIzNwJgLJFoB00VAWgIR0CgKTPh60IDdX2UKGgGR0Bxb81k1/DtaAdL6WgIR0CgKVy8J2MbdX2UKGgGR0Bw/jgm7aqTaAdL62gIR0CgKV0FKTStdX2UKGgGR0BytbjIaLn+aAdNgQFoCEdAoCmPN3W4E3V9lChoBkdAbkMK3uuzQmgHS+poCEdAoCmT6P8ye3V9lChoBkdAcOnHavicXmgHS/BoCEdAoCpvn2ZiNXV9lChoBkdAbJM+JP69CmgHS/ZoCEdAoCqUygwoLHV9lChoBkdAbwy5EMLF42gHS/JoCEdAoCq2R7qptXV9lChoBkdAcwPlSS/0umgHS/NoCEdAoCuuM4tHx3V9lChoBkdAcLVXyiEg4mgHS+xoCEdAoCv64SYgJXV9lChoBkdAcbuvwmVqvmgHS+loCEdAoCwr6N2ki3V9lChoBkdAcOq+L3sXzmgHS9hoCEdAoCyDreIl+nV9lChoBkdAcljNJvo/zWgHS+5oCEdAoCyHgUDdQHV9lChoBkdAckbAood+5WgHS+loCEdAoCzGqioKlnV9lChoBkdAceI7Qb+98WgHS/FoCEdAoC0ZC8e0X3V9lChoBkdAchEN21UlzGgHTRsBaAhHQKAtW6U7jkx1fZQoaAZHQHBDYIKMNttoB00HAWgIR0CgLWZavA45dX2UKGgGR0Bw5xKODJ2daAdNRgFoCEdAoC2RJNCZ4XV9lChoBkdATh2AEt/WlWgHS9loCEdAoC3tpTMq0HV9lChoBkdAbrP8cdYGMWgHS/poCEdAoC5Ho1UEPnV9lChoBkdAYcsHZ9NN8GgHTegDaAhHQKAuUENe+mF1fZQoaAZHQHDjx15jYqZoB00KAWgIR0CgLmXsw+MZdX2UKGgGR0BwsNdhRZU2aAdL7GgIR0CgLzL1EmY0dX2UKGgGR0Bu8ZfOUt7KaAdL8mgIR0CgL4w2VE/jdX2UKGgGR0BwGY1xbSqmaAdL+2gIR0CgL99ycTakdX2UKGgGR0BuFT7XQMQVaAdL52gIR0CgL9/WDpTudX2UKGgGR0BcxU4JeE7GaAdN6ANoCEdAoDAbDKoybnV9lChoBkdAcU17kXDWLGgHTRwBaAhHQKAwrQ5WBBl1fZQoaAZHQHMqnZXdTHdoB00NAWgIR0CgMLLTH80ldX2UKGgGR0BwcXmW+oLoaAdNAAFoCEdAoDDaCg9Ne3V9lChoBkdAbMfyJbdJrmgHS/RoCEdAoDDw0EX+EXV9lChoBkdAcHfJhfBvaWgHS+doCEdAoDD4DzRQanV9lChoBkdAcM4DlHSWq2gHS9poCEdAoDF5JiAlOXV9lChoBkdAckmBYFJQL2gHS/poCEdAoDGWQGOdXnV9lChoBkdAcmNPppvgnGgHTSMBaAhHQKAxn1q33Ht1fZQoaAZHQHDmupS75EdoB0v7aAhHQKAx+/pt78h1fZQoaAZHQHFNR15jYqZoB00QAWgIR0CgMjILgGbDdX2UKGgGR0A+hqp97WupaAdLg2gIR0CgMoXC0ngHdX2UKGgGR0BxzF63RXwLaAdL8GgIR0CgMrHYxtYTdX2UKGgGR0ByOvHyVfNSaAdL5mgIR0CgMvQdS2pidX2UKGgGR0BwrLyvs7dSaAdL52gIR0CgM1b3fyf+dX2UKGgGR0BzUxC9h7VsaAdLyWgIR0CgM/MKb8WLdX2UKGgGR0ByPbFaSs8xaAdNDQFoCEdAoDQGr8zhxnV9lChoBkdAZHU11GLDRGgHTegDaAhHQKA0Zgnc+JR1fZQoaAZHQG88ubAk9lpoB0vxaAhHQKA0gRFI/aB1fZQoaAZHQHG11abF0gdoB00kAWgIR0CgNMEyULUkdX2UKGgGR0Bw3a+evpyIaAdL7mgIR0CgNMoMjNY9dX2UKGgGR0Bx99Ukv9LpaAdNDQFoCEdAoDVOu9vjwXV9lChoBkdAcO/fKp1ifGgHS+poCEdAoDWTT+ee4HV9lChoBkdAcEE9uP3i72gHTQIBaAhHQKA2AYqG1x91fZQoaAZHQHFDL2L5ylxoB0vhaAhHQKA2qgAZKnN1fZQoaAZHQHJYcPatcOdoB00NAWgIR0CgNwLVvuPWdX2UKGgGR0Bwno8aGYa6aAdNEQFoCEdAoDeEcXFcZHV9lChoBkdAcUxNBWxQi2gHS+9oCEdAoDeMxTKkmHV9lChoBkdAcU+/3WWhRWgHTQgBaAhHQKA3mKXOW0J1fZQoaAZHQHFky0KJEYxoB0vvaAhHQKA4F8jzI3l1fZQoaAZHQHAv1WS2Yv5oB0v0aAhHQKA4eK8+Ro11fZQoaAZHQHKfeRT0g8toB00OAWgIR0CgOIIZIg/1dX2UKGgGR0Bxom8oQWepaAdL+2gIR0CgOOXCTEBKdX2UKGgGR0Bwwxk+X7cgaAdL6WgIR0CgORC22G7BdX2UKGgGR0BvN4t6HCXQaAdNrgFoCEdAoDkn9YOlPHV9lChoBkdAcEXgBcRlH2gHTQABaAhHQKA5m6RQrMF1fZQoaAZHQG/ZTgVGkN5oB0v1aAhHQKA5wjDbah91fZQoaAZHQHJ0KRZEDyRoB0vhaAhHQKA5/CLuQZJ1fZQoaAZHQG5PFJQLux9oB0vyaAhHQKA6lriVB2R1fZQoaAZHQGxa7Z39rGloB0vpaAhHQKA7C1JlJ6J1fZQoaAZHQG/fG7BfrrxoB0vyaAhHQKA7KoddVvN1fZQoaAZHQHCToqwyIpJoB00DAWgIR0CgO4G5UcXFdX2UKGgGR0BvQQF1SwW4aAdL52gIR0CgPAPz4DcNdX2UKGgGR0BylrBCUornaAdL62gIR0CgPB1zIV/MdX2UKGgGR0BwqJJZntfHaAdNDAFoCEdAoDw1Jaq0dHVlLg=="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 460, "observation_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVdgIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWCAAAAAAAAAABAQEBAQEBAZRoCIwCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoESiWCAAAAAAAAAABAQEBAQEBAZRoFUsIhZRoGXSUUpSMBl9zaGFwZZRLCIWUjANsb3eUaBEoliAAAAAAAAAAAAC0wgAAtMIAAKDAAACgwNsPScAAAKDAAAAAgAAAAICUaAtLCIWUaBl0lFKUjARoaWdolGgRKJYgAAAAAAAAAAAAtEIAALRCAACgQAAAoEDbD0lAAACgQAAAgD8AAIA/lGgLSwiFlGgZdJRSlIwIbG93X3JlcHKUjFtbLTkwLiAgICAgICAgLTkwLiAgICAgICAgIC01LiAgICAgICAgIC01LiAgICAgICAgIC0zLjE0MTU5MjcgIC01LgogIC0wLiAgICAgICAgIC0wLiAgICAgICBdlIwJaGlnaF9yZXBylIxTWzkwLiAgICAgICAgOTAuICAgICAgICAgNS4gICAgICAgICA1LiAgICAgICAgIDMuMTQxNTkyNyAgNS4KICAxLiAgICAgICAgIDEuICAgICAgIF2UjApfbnBfcmFuZG9tlE51Yi4=", "dtype": "float32", "bounded_below": "[ True True True True True True True True]", "bounded_above": "[ True True True True True True True True]", "_shape": [8], "low": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "low_repr": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high_repr": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "_np_random": null}, "action_space": {":type:": "<class 'gymnasium.spaces.discrete.Discrete'>", ":serialized:": "gAWV2wAAAAAAAACMGWd5bW5hc2l1bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIBAAAAAAAAACUhpRSlIwFc3RhcnSUaAhoDkMIAAAAAAAAAACUhpRSlIwGX3NoYXBllCmMBWR0eXBllGgOjApfbnBfcmFuZG9tlE51Yi4=", "n": "4", "start": "0", "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 16, "n_steps": 2048, "gamma": 0.99, "gae_lambda": 0.95, "ent_coef": 0.0, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 10, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz/JmZmZmZmahZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz8zqSowVTJhhZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "system_info": {"OS": "Linux-6.1.58+-x86_64-with-glibc2.35 # 1 SMP PREEMPT_DYNAMIC Sat Nov 18 15:31:17 UTC 2023", "Python": "3.10.12", "Stable-Baselines3": "2.0.0a5", "PyTorch": "2.2.1+cu121", "GPU Enabled": "True", "Numpy": "1.25.2", "Cloudpickle": "2.2.1", "Gymnasium": "0.28.1", "OpenAI Gym": "0.25.2"}}
|
ppo-LunarLander-v2.zip
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:214052fbaad774ff9a82075ec9a7200500332bc73d1d77d2a86d33711a887c03
|
3 |
+
size 147995
|
ppo-LunarLander-v2/data
CHANGED
@@ -4,34 +4,34 @@
|
|
4 |
":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
|
5 |
"__module__": "stable_baselines3.common.policies",
|
6 |
"__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
|
7 |
-
"__init__": "<function ActorCriticPolicy.__init__ at
|
8 |
-
"_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at
|
9 |
-
"reset_noise": "<function ActorCriticPolicy.reset_noise at
|
10 |
-
"_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at
|
11 |
-
"_build": "<function ActorCriticPolicy._build at
|
12 |
-
"forward": "<function ActorCriticPolicy.forward at
|
13 |
-
"extract_features": "<function ActorCriticPolicy.extract_features at
|
14 |
-
"_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at
|
15 |
-
"_predict": "<function ActorCriticPolicy._predict at
|
16 |
-
"evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at
|
17 |
-
"get_distribution": "<function ActorCriticPolicy.get_distribution at
|
18 |
-
"predict_values": "<function ActorCriticPolicy.predict_values at
|
19 |
"__abstractmethods__": "frozenset()",
|
20 |
-
"_abc_impl": "<_abc._abc_data object at
|
21 |
},
|
22 |
-
"verbose":
|
23 |
"policy_kwargs": {},
|
24 |
-
"num_timesteps":
|
25 |
-
"_total_timesteps":
|
26 |
"_num_timesteps_at_start": 0,
|
27 |
"seed": null,
|
28 |
"action_noise": null,
|
29 |
-
"start_time":
|
30 |
"learning_rate": 0.0003,
|
31 |
"tensorboard_log": null,
|
32 |
"_last_obs": {
|
33 |
":type:": "<class 'numpy.ndarray'>",
|
34 |
-
":serialized:": "
|
35 |
},
|
36 |
"_last_episode_starts": {
|
37 |
":type:": "<class 'numpy.ndarray'>",
|
@@ -41,17 +41,17 @@
|
|
41 |
"_episode_num": 0,
|
42 |
"use_sde": false,
|
43 |
"sde_sample_freq": -1,
|
44 |
-
"_current_progress_remaining": -0.
|
45 |
"_stats_window_size": 100,
|
46 |
"ep_info_buffer": {
|
47 |
":type:": "<class 'collections.deque'>",
|
48 |
-
":serialized:": "
|
49 |
},
|
50 |
"ep_success_buffer": {
|
51 |
":type:": "<class 'collections.deque'>",
|
52 |
":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
|
53 |
},
|
54 |
-
"_n_updates":
|
55 |
"observation_space": {
|
56 |
":type:": "<class 'gymnasium.spaces.box.Box'>",
|
57 |
":serialized:": "gAWVdgIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWCAAAAAAAAAABAQEBAQEBAZRoCIwCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoESiWCAAAAAAAAAABAQEBAQEBAZRoFUsIhZRoGXSUUpSMBl9zaGFwZZRLCIWUjANsb3eUaBEoliAAAAAAAAAAAAC0wgAAtMIAAKDAAACgwNsPScAAAKDAAAAAgAAAAICUaAtLCIWUaBl0lFKUjARoaWdolGgRKJYgAAAAAAAAAAAAtEIAALRCAACgQAAAoEDbD0lAAACgQAAAgD8AAIA/lGgLSwiFlGgZdJRSlIwIbG93X3JlcHKUjFtbLTkwLiAgICAgICAgLTkwLiAgICAgICAgIC01LiAgICAgICAgIC01LiAgICAgICAgIC0zLjE0MTU5MjcgIC01LgogIC0wLiAgICAgICAgIC0wLiAgICAgICBdlIwJaGlnaF9yZXBylIxTWzkwLiAgICAgICAgOTAuICAgICAgICAgNS4gICAgICAgICA1LiAgICAgICAgIDMuMTQxNTkyNyAgNS4KICAxLiAgICAgICAgIDEuICAgICAgIF2UjApfbnBfcmFuZG9tlE51Yi4=",
|
|
|
4 |
":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
|
5 |
"__module__": "stable_baselines3.common.policies",
|
6 |
"__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
|
7 |
+
"__init__": "<function ActorCriticPolicy.__init__ at 0x7c5f53a89630>",
|
8 |
+
"_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7c5f53a896c0>",
|
9 |
+
"reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7c5f53a89750>",
|
10 |
+
"_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7c5f53a897e0>",
|
11 |
+
"_build": "<function ActorCriticPolicy._build at 0x7c5f53a89870>",
|
12 |
+
"forward": "<function ActorCriticPolicy.forward at 0x7c5f53a89900>",
|
13 |
+
"extract_features": "<function ActorCriticPolicy.extract_features at 0x7c5f53a89990>",
|
14 |
+
"_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7c5f53a89a20>",
|
15 |
+
"_predict": "<function ActorCriticPolicy._predict at 0x7c5f53a89ab0>",
|
16 |
+
"evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7c5f53a89b40>",
|
17 |
+
"get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7c5f53a89bd0>",
|
18 |
+
"predict_values": "<function ActorCriticPolicy.predict_values at 0x7c5f53a89c60>",
|
19 |
"__abstractmethods__": "frozenset()",
|
20 |
+
"_abc_impl": "<_abc._abc_data object at 0x7c5f53a8cb40>"
|
21 |
},
|
22 |
+
"verbose": 1,
|
23 |
"policy_kwargs": {},
|
24 |
+
"num_timesteps": 1507328,
|
25 |
+
"_total_timesteps": 1500000,
|
26 |
"_num_timesteps_at_start": 0,
|
27 |
"seed": null,
|
28 |
"action_noise": null,
|
29 |
+
"start_time": 1711526485592841125,
|
30 |
"learning_rate": 0.0003,
|
31 |
"tensorboard_log": null,
|
32 |
"_last_obs": {
|
33 |
":type:": "<class 'numpy.ndarray'>",
|
34 |
+
":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAACbLmr24l5C7Z2CGuyqOsjzMBu68Q0qWPQAAgD8AAIA/Bhg1vn2GUz5aYK89/i5TvjYpnLzSyL27AAAAAAAAAADmh6+9ubOXP+Ib5b6FcxS/Yze0vQ9TQb4AAAAAAAAAAOalMT1Iv5G6i379NES4Li1S5cQ6iFVqtAAAgD8AAIA/gE9tvQV5oLs3u0c8tEEXPH5L37xezgU9AACAPwAAgD9Apgu+pwFPPjRWwj3HiTG+KrmVvB+1tDwAAAAAAAAAAJr3n71NW1c/sqJevZm47b4jIBK9m8EfvAAAAAAAAAAAM20EPOwv6D7Er5S82QeevnB/fjxh7ii9AAAAAAAAAACNwC6+ewuGvFU2druMWa+5DHP5Peo1pDoAAIA/AACAP5oOnDxIEo0/qp4aPeaYCL867+08lpI5vQAAAAAAAAAA03Ayvu7PnbzC/ii8rVO7uqu1Bz64LZQ7AACAPwAAgD8aBjU9xabvPG4LV70SMy6+drqkO5/ZHjwAAAAAAAAAAJrsib6tb+0+aKJhPkqEvL6oZq69Jls+PgAAAAAAAAAAzZRrPSecvj8YUQA/byI7Ptgv5jyaawI+AAAAAAAAAABNWRC+gbUjP6pVfTzVkdm+t4g+vYp/Kj0AAAAAAAAAAEDhI76cZUi8wwmzOraBajloTqk9ulAcugAAgD8AAIA/lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="
|
35 |
},
|
36 |
"_last_episode_starts": {
|
37 |
":type:": "<class 'numpy.ndarray'>",
|
|
|
41 |
"_episode_num": 0,
|
42 |
"use_sde": false,
|
43 |
"sde_sample_freq": -1,
|
44 |
+
"_current_progress_remaining": -0.004885333333333408,
|
45 |
"_stats_window_size": 100,
|
46 |
"ep_info_buffer": {
|
47 |
":type:": "<class 'collections.deque'>",
|
48 |
+
":serialized:": "gAWV/wsAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQHCDcafjCHiMAWyUS/6MAXSUR0CgIcodMj/udX2UKGgGR0Bw+Bvze40/aAdL+GgIR0CgIeFXJYDDdX2UKGgGR0BwRfY+Sr5qaAdL4WgIR0CgIfIsZpBYdX2UKGgGR0BupV43WFviaAdL4mgIR0CgIfki2UjcdX2UKGgGR0Bya8XvYvnKaAdL7mgIR0CgIkzK9wm3dX2UKGgGR0Bxy5V94NZvaAdL/2gIR0CgIl6hxo7FdX2UKGgGR0BwGtPDYRNAaAdL5mgIR0CgIoG0/nnudX2UKGgGR0BvbimoBJZoaAdL7WgIR0CgI15s0pEydX2UKGgGR0BwiMiJO32FaAdL/mgIR0CgI3ZSeiBYdX2UKGgGR0BylxESdvsJaAdL/2gIR0CgI4mmce8xdX2UKGgGR0BvWJh+fAbiaAdL5GgIR0CgI+EGZ/kOdX2UKGgGR0ByUh0q6OHWaAdL9mgIR0CgJDGGdqcmdX2UKGgGR0BxWkyyleniaAdL72gIR0CgJOZz5oGqdX2UKGgGR0BxTF1bJOnEaAdL2WgIR0CgJPI/7iyZdX2UKGgGR0BwUPfAKv3baAdL12gIR0CgJPzEaVD8dX2UKGgGR0BfffrfLs8gaAdN6ANoCEdAoCUhEfDDTHV9lChoBkdAbyfokAxSHmgHTQMBaAhHQKAlcPsAvL51fZQoaAZHQG8VgI6bONZoB0v/aAhHQKAljXSSeRR1fZQoaAZHQHHsNgSeyzJoB0v7aAhHQKAl0M5wOvt1fZQoaAZHQHHUBrJr+HdoB0v4aAhHQKAl2K/mDDl1fZQoaAZHQG4akHt4RmNoB0v6aAhHQKAmAm1pj+d1fZQoaAZHQHDG8zZYgaFoB0v3aAhHQKAm1CPZIxx1fZQoaAZHQHDr1uR9w3poB0v1aAhHQKAm4sTWXkZ1fZQoaAZHQGxPVr6+FlFoB0v9aAhHQKAnFKSxJNF1fZQoaAZHQHLbRUm2LHdoB00SAWgIR0CgKBanzg/DdX2UKGgGR0Bx7V8gIQe4aAdL+2gIR0CgKIIIF/x2dX2UKGgGR0BxECX9itq6aAdNBgFoCEdAoCi/ymQ8wHV9lChoBkdAcd/XtjTa02gHTQQBaAhHQKAoxElVtGd1fZQoaAZHQG4mx2St/4JoB0vqaAhHQKApBhAnlXB1fZQoaAZHQHIzNwJgLJFoB00VAWgIR0CgKTPh60IDdX2UKGgGR0Bxb81k1/DtaAdL6WgIR0CgKVy8J2MbdX2UKGgGR0Bw/jgm7aqTaAdL62gIR0CgKV0FKTStdX2UKGgGR0BytbjIaLn+aAdNgQFoCEdAoCmPN3W4E3V9lChoBkdAbkMK3uuzQmgHS+poCEdAoCmT6P8ye3V9lChoBkdAcOnHavicXmgHS/BoCEdAoCpvn2ZiNXV9lChoBkdAbJM+JP69CmgHS/ZoCEdAoCqUygwoLHV9lChoBkdAbwy5EMLF42gHS/JoCEdAoCq2R7qptXV9lChoBkdAcwPlSS/0umgHS/NoCEdAoCuuM4tHx3V9lChoBkdAcLVXyiEg4mgHS+xoCEdAoCv64SYgJXV9lChoBkdAcbuvwmVqvmgHS+loCEdAoCwr6N2ki3V9lChoBkdAcOq+L3sXzmgHS9hoCEdAoCyDreIl+nV9lChoBkdAcljNJvo/zWgHS+5oCEdAoCyHgUDdQHV9lChoBkdAckbAood+5WgHS+loCEdAoCzGqioKlnV9lChoBkdAceI7Qb+98WgHS/FoCEdAoC0ZC8e0X3V9lChoBkdAchEN21UlzGgHTRsBaAhHQKAtW6U7jkx1fZQoaAZHQHBDYIKMNttoB00HAWgIR0CgLWZavA45dX2UKGgGR0Bw5xKODJ2daAdNRgFoCEdAoC2RJNCZ4XV9lChoBkdATh2AEt/WlWgHS9loCEdAoC3tpTMq0HV9lChoBkdAbrP8cdYGMWgHS/poCEdAoC5Ho1UEPnV9lChoBkdAYcsHZ9NN8GgHTegDaAhHQKAuUENe+mF1fZQoaAZHQHDjx15jYqZoB00KAWgIR0CgLmXsw+MZdX2UKGgGR0BwsNdhRZU2aAdL7GgIR0CgLzL1EmY0dX2UKGgGR0Bu8ZfOUt7KaAdL8mgIR0CgL4w2VE/jdX2UKGgGR0BwGY1xbSqmaAdL+2gIR0CgL99ycTakdX2UKGgGR0BuFT7XQMQVaAdL52gIR0CgL9/WDpTudX2UKGgGR0BcxU4JeE7GaAdN6ANoCEdAoDAbDKoybnV9lChoBkdAcU17kXDWLGgHTRwBaAhHQKAwrQ5WBBl1fZQoaAZHQHMqnZXdTHdoB00NAWgIR0CgMLLTH80ldX2UKGgGR0BwcXmW+oLoaAdNAAFoCEdAoDDaCg9Ne3V9lChoBkdAbMfyJbdJrmgHS/RoCEdAoDDw0EX+EXV9lChoBkdAcHfJhfBvaWgHS+doCEdAoDD4DzRQanV9lChoBkdAcM4DlHSWq2gHS9poCEdAoDF5JiAlOXV9lChoBkdAckmBYFJQL2gHS/poCEdAoDGWQGOdXnV9lChoBkdAcmNPppvgnGgHTSMBaAhHQKAxn1q33Ht1fZQoaAZHQHDmupS75EdoB0v7aAhHQKAx+/pt78h1fZQoaAZHQHFNR15jYqZoB00QAWgIR0CgMjILgGbDdX2UKGgGR0A+hqp97WupaAdLg2gIR0CgMoXC0ngHdX2UKGgGR0BxzF63RXwLaAdL8GgIR0CgMrHYxtYTdX2UKGgGR0ByOvHyVfNSaAdL5mgIR0CgMvQdS2pidX2UKGgGR0BwrLyvs7dSaAdL52gIR0CgM1b3fyf+dX2UKGgGR0BzUxC9h7VsaAdLyWgIR0CgM/MKb8WLdX2UKGgGR0ByPbFaSs8xaAdNDQFoCEdAoDQGr8zhxnV9lChoBkdAZHU11GLDRGgHTegDaAhHQKA0Zgnc+JR1fZQoaAZHQG88ubAk9lpoB0vxaAhHQKA0gRFI/aB1fZQoaAZHQHG11abF0gdoB00kAWgIR0CgNMEyULUkdX2UKGgGR0Bw3a+evpyIaAdL7mgIR0CgNMoMjNY9dX2UKGgGR0Bx99Ukv9LpaAdNDQFoCEdAoDVOu9vjwXV9lChoBkdAcO/fKp1ifGgHS+poCEdAoDWTT+ee4HV9lChoBkdAcEE9uP3i72gHTQIBaAhHQKA2AYqG1x91fZQoaAZHQHFDL2L5ylxoB0vhaAhHQKA2qgAZKnN1fZQoaAZHQHJYcPatcOdoB00NAWgIR0CgNwLVvuPWdX2UKGgGR0Bwno8aGYa6aAdNEQFoCEdAoDeEcXFcZHV9lChoBkdAcUxNBWxQi2gHS+9oCEdAoDeMxTKkmHV9lChoBkdAcU+/3WWhRWgHTQgBaAhHQKA3mKXOW0J1fZQoaAZHQHFky0KJEYxoB0vvaAhHQKA4F8jzI3l1fZQoaAZHQHAv1WS2Yv5oB0v0aAhHQKA4eK8+Ro11fZQoaAZHQHKfeRT0g8toB00OAWgIR0CgOIIZIg/1dX2UKGgGR0Bxom8oQWepaAdL+2gIR0CgOOXCTEBKdX2UKGgGR0Bwwxk+X7cgaAdL6WgIR0CgORC22G7BdX2UKGgGR0BvN4t6HCXQaAdNrgFoCEdAoDkn9YOlPHV9lChoBkdAcEXgBcRlH2gHTQABaAhHQKA5m6RQrMF1fZQoaAZHQG/ZTgVGkN5oB0v1aAhHQKA5wjDbah91fZQoaAZHQHJ0KRZEDyRoB0vhaAhHQKA5/CLuQZJ1fZQoaAZHQG5PFJQLux9oB0vyaAhHQKA6lriVB2R1fZQoaAZHQGxa7Z39rGloB0vpaAhHQKA7C1JlJ6J1fZQoaAZHQG/fG7BfrrxoB0vyaAhHQKA7KoddVvN1fZQoaAZHQHCToqwyIpJoB00DAWgIR0CgO4G5UcXFdX2UKGgGR0BvQQF1SwW4aAdL52gIR0CgPAPz4DcNdX2UKGgGR0BylrBCUornaAdL62gIR0CgPB1zIV/MdX2UKGgGR0BwqJJZntfHaAdNDAFoCEdAoDw1Jaq0dHVlLg=="
|
49 |
},
|
50 |
"ep_success_buffer": {
|
51 |
":type:": "<class 'collections.deque'>",
|
52 |
":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
|
53 |
},
|
54 |
+
"_n_updates": 460,
|
55 |
"observation_space": {
|
56 |
":type:": "<class 'gymnasium.spaces.box.Box'>",
|
57 |
":serialized:": "gAWVdgIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWCAAAAAAAAAABAQEBAQEBAZRoCIwCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoESiWCAAAAAAAAAABAQEBAQEBAZRoFUsIhZRoGXSUUpSMBl9zaGFwZZRLCIWUjANsb3eUaBEoliAAAAAAAAAAAAC0wgAAtMIAAKDAAACgwNsPScAAAKDAAAAAgAAAAICUaAtLCIWUaBl0lFKUjARoaWdolGgRKJYgAAAAAAAAAAAAtEIAALRCAACgQAAAoEDbD0lAAACgQAAAgD8AAIA/lGgLSwiFlGgZdJRSlIwIbG93X3JlcHKUjFtbLTkwLiAgICAgICAgLTkwLiAgICAgICAgIC01LiAgICAgICAgIC01LiAgICAgICAgIC0zLjE0MTU5MjcgIC01LgogIC0wLiAgICAgICAgIC0wLiAgICAgICBdlIwJaGlnaF9yZXBylIxTWzkwLiAgICAgICAgOTAuICAgICAgICAgNS4gICAgICAgICA1LiAgICAgICAgIDMuMTQxNTkyNyAgNS4KICAxLiAgICAgICAgIDEuICAgICAgIF2UjApfbnBfcmFuZG9tlE51Yi4=",
|
ppo-LunarLander-v2/policy.optimizer.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 88362
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ef1939840e3bfaa6070a7e7d081c0c7cc25ecfa165e2008006a10f115ca93e9e
|
3 |
size 88362
|
ppo-LunarLander-v2/policy.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 43762
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aca183006757871e1b9905993aa53300ca461c3b20a027b500d03c956a65047f
|
3 |
size 43762
|
replay.mp4
CHANGED
Binary files a/replay.mp4 and b/replay.mp4 differ
|
|
results.json
CHANGED
@@ -1 +1 @@
|
|
1 |
-
{"mean_reward":
|
|
|
1 |
+
{"mean_reward": 260.72180706618326, "std_reward": 19.360104937819813, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2024-03-27T08:35:58.861285"}
|