hookzeng commited on
Commit
b7e7c3d
1 Parent(s): 77daf87

Upload PPO LunarLander-v2 trained agent

Browse files
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: LunarLander-v2
17
  metrics:
18
  - type: mean_reward
19
- value: 230.21 +/- 17.26
20
  name: mean_reward
21
  verified: false
22
  ---
 
16
  type: LunarLander-v2
17
  metrics:
18
  - type: mean_reward
19
+ value: 229.02 +/- 28.04
20
  name: mean_reward
21
  verified: false
22
  ---
config.json CHANGED
@@ -1 +1 @@
1
- {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7efded27dca0>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7efded27dd30>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7efded27ddc0>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7efded27de50>", "_build": "<function ActorCriticPolicy._build at 0x7efded27dee0>", "forward": "<function ActorCriticPolicy.forward at 0x7efded27df70>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x7efded202040>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7efded2020d0>", "_predict": "<function ActorCriticPolicy._predict at 0x7efded202160>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7efded2021f0>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7efded202280>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7efded202310>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc_data object at 0x7efded27c2d0>"}, "verbose": 1, "policy_kwargs": {}, "num_timesteps": 1015808, "_total_timesteps": 1000000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1712322094998193614, "learning_rate": 0.0003, "tensorboard_log": null, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAGZhhbxSmOG5qtKvObuD9rVEWvy6okrPuAAAgD8AAIA/hsotPnRNhLxOz8Q5MYscuCr05r0ZhQO5AACAPwAAgD/QZqq+l+5KP100Fz7063C+OUeqvUVlvz0AAAAAAAAAAM19M72P3nm6N6OIuYmrg7TS30a7KqOfOAAAgD8AAIA/M5x1PcPtMrqqpjw8bU65NkPBHLvn3K01AACAPwAAgD8z+1S9rnWJuspfnTlSg5G20TNvutAHtrgAAIA/AACAP/O6tj2PxmG69FQzvLVnF7Z0HL+68quLNQAAgD8AAIA/WlGJPTiqwD0zLAC+RURVvvae5rv1oK69AAAAAAAAAAATqjA+D7BlP16BVbz6dZW+nTHVPbplYr0AAAAAAAAAANPvHT6sxpU/aneYPsmswL7Lsuw9pRPHOwAAAAAAAAAAAGwwPXsanrr6CJS7q9wEtWgUTbr0uao6AACAPwAAgD/m0YG93r2ZPcMDRz4zlGG+FGeFPZurKD0AAAAAAAAAAKYnsb0G+Sw/m3PjPXOhiL6xc586eHkkPQAAAAAAAAAAAPg0O7jm5rmJ3Q66VpmLtVFxmLpr1SY5AACAPwAAgD9aMaI9H031uaQaJrtm6++1mJCwOirDPjoAAIA/AACAP5rZ/ToU3sK6VjB1urXLTTuVXAs7MstevAAAgD8AAIA/lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.015808000000000044, "_stats_window_size": 100, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVQQwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQE46o+fRNRGMAWyUS9iMAXSUR0B9G5wjt5UtdX2UKGgGR0BkWQu/UONHaAdN6ANoCEdAfSBwsGxD9nV9lChoBkdAZbcMUh3aBmgHTegDaAhHQH0qTfrKNhp1fZQoaAZHQGLwXjlxOtZoB03oA2gIR0B9MjCbc45tdX2UKGgGR0BgN8xIre67aAdN6ANoCEdAfUBIcinpCHV9lChoBkdAZnzzRQaaTmgHTegDaAhHQH1XYk/r0J51fZQoaAZHQGJF6F/QSjBoB03oA2gIR0B9Y6+Jxeb/dX2UKGgGR0Bk9//95yEMaAdN6ANoCEdAfW6lXzUZvXV9lChoBkdAZkiY+B6KL2gHTegDaAhHQH1wTUAksz51fZQoaAZHQGLLta6jFhpoB03oA2gIR0B9cY7cO9WZdX2UKGgGR0Bc9SUcGTs6aAdN6ANoCEdAfXRVxjriVHV9lChoBkdAYeGplSS/02gHTegDaAhHQH2EYpMHryF1fZQoaAZHQGPq/+sHSndoB03oA2gIR0B9iGaTfR/mdX2UKGgGR0AjM6QvHtF8aAdL9WgIR0B9jxEPUaybdX2UKGgGR0BkvO6d1+y7aAdN6ANoCEdAfY9VLBbfQHV9lChoBkdAY/ipo9LYgGgHTegDaAhHQH2bvc8DB/J1fZQoaAZHQGA3liSaEzxoB03oA2gIR0B9sKr+5vtMdX2UKGgGR0BVwfIOpbUxaAdN6ANoCEdAfbQI55qubXV9lChoBkdAY4/yEtdzGWgHTegDaAhHQH234+B6KLt1fZQoaAZHQGGtnWz4UN9oB03oA2gIR0B9v3di2DxtdX2UKGgGR0BlQdEuxrzoaAdN6ANoCEdAfcWYtQKrrHV9lChoBkdAZdEu5jH4oWgHTegDaAhHQH3Re4oZydZ1fZQoaAZHQGV/nw5NoJ1oB03oA2gIR0B95Do4dZJTdX2UKGgGR0BmLupMpPRBaAdN6ANoCEdAfe3TA31jAnV9lChoBkdAYjpjx0+1SmgHTegDaAhHQH32G47Rv3t1fZQoaAZHQGT8JXp4bCJoB03oA2gIR0B9+EKUmlZYdX2UKGgGR0BlShgiNbTuaAdN6ANoCEdAffpfyf+S83V9lChoBkdAXnHZAY51eWgHTegDaAhHQH4GqgyuZCx1fZQoaAZHQGUYNOEdvKloB03oA2gIR0B+CZntfG+9dX2UKGgGR0BkHnXoTwlTaAdN6ANoCEdAfg7QRPGhmHV9lChoBkdAYLzkWhysCGgHTegDaAhHQH4PBN21Ul11fZQoaAZHQGCpL1/Ue+5oB03oA2gIR0B+GXNY8uBddX2UKGgGR0BjccR6F/QTaAdN6ANoCEdAfhslvZRKpXV9lChoBkdAaOZFKkEcKmgHTegDaAhHQH43WVAzHjp1fZQoaAZHQGA+Wf9P1thoB03oA2gIR0B+Ot3fQ8fWdX2UKGgGR0Bc9qq814xDaAdN6ANoCEdAfkIHU+cH4XV9lChoBkdAYdlYEGJN02gHTegDaAhHQH5IDoUzsQd1fZQoaAZHQGRvT7l7tzFoB03oA2gIR0B+VBxAB1cMdX2UKGgGR0BlfCScLBsRaAdN6ANoCEdAfmhd/J/5L3V9lChoBkdAYp7/jKgZj2gHTegDaAhHQH5zC9EkSmJ1fZQoaAZHQF4l6jWTX8RoB03oA2gIR0B+fDffoA4odX2UKGgGR0BnANm6GxlhaAdN6ANoCEdAfn6qoZQ53nV9lChoBkdAYYtcHGCI12gHTegDaAhHQH6BLKFIuoR1fZQoaAZHQGTT1Ed/8VJoB03oA2gIR0B+kJ4mkWRBdX2UKGgGR0Bfgrns9jgAaAdN6ANoCEdAfpRhXr+o+HV9lChoBkdAXqEfyPMjeWgHTegDaAhHQH6bGEPDpC91fZQoaAZHQGJA7pV0cOtoB03oA2gIR0B+m1iqhlDndX2UKGgGR0Be0JTER8MNaAdN6ANoCEdAfqeyLQ5WBHV9lChoBkdAYUU6qbSZ0GgHTegDaAhHQH6pvQnhKlJ1fZQoaAZHQGC/l+3H7xdoB03oA2gIR0B+rVsLv1DjdX2UKGgGR0BkChrrPdEcaAdN6ANoCEdAfsZmmtQsPXV9lChoBkdAYNVarWAf+2gHTegDaAhHQH7PJTER8MN1fZQoaAZHQFwSiWVu76JoB03oA2gIR0B+1nHaN+9bdX2UKGgGR0Bj+lV/+bVjaAdN6ANoCEdAfuTP0qYqonV9lChoBkdAZQS32EkB0mgHTegDaAhHQH77OdXko4N1fZQoaAZHQGGgjA8B+4NoB03oA2gIR0B/Behf0EowdX2UKGgGR0Bk9RLCemNzaAdN6ANoCEdAfw82xY7q6nV9lChoBkdAZvOK+i8Fp2gHTegDaAhHQH8RjkMkQf91fZQoaAZHQGS2YNqgyuZoB03oA2gIR0B/E/IikftAdX2UKGgGR0BexIXoC+10aAdN6ANoCEdAfyE2M85jpnV9lChoBkdAZiXVhCtzS2gHTegDaAhHQH8kVhoduHh1fZQoaAZHQGNHrxRVIZtoB03oA2gIR0B/KdLxqfvndX2UKGgGR0BkG9fCyhSMaAdN6ANoCEdAfyoMUAT7EnV9lChoBkdAWxUXcgyM1mgHTegDaAhHQH8033UQTVV1fZQoaAZHQGClehGpdbBoB03oA2gIR0B/NrPw/gR9dX2UKGgGR0BldmQ6p5u7aAdN6ANoCEdAfzncy31BdHV9lChoBkdAZNCLiuMdcWgHTegDaAhHQH9Pj1XeWOZ1fZQoaAZHQGWurUkOZstoB03oA2gIR0B/V52eQMhHdX2UKGgGR0Be9L3sXzlLaAdN6ANoCEdAf16UxVQyh3V9lChoBkdAZC9ReC04R2gHTegDaAhHQH9so0IkZ751fZQoaAZHQF20+RYA80VoB03oA2gIR0B/hBcGC7K8dX2UKGgGR0BkzDj94u9OaAdN6ANoCEdAf5CpEhJRO3V9lChoBkdAXdVObiIcimgHTegDaAhHQH+blyaNMoN1fZQoaAZHQF9t6Skj5bhoB03oA2gIR0B/noKLKmsOdX2UKGgGR0BhIjWsijcmaAdN6ANoCEdAf6GFOfukUXV9lChoBkdAYu3b/wRXfmgHTegDaAhHQH+0UNKAavR1fZQoaAZHQGXf2fkFOfxoB03oA2gIR0B/uMytV7x/dX2UKGgGR0BgeByXD3ueaAdN6ANoCEdAf8CS1Vo6CHV9lChoBkdAYzSiO/+Kj2gHTegDaAhHQH/A5SWJJoV1fZQoaAZHQGUEO7QLNOdoB03oA2gIR0B/zyNMoMKDdX2UKGgGR0BnrDTBqKxcaAdN6ANoCEdAf9FugYgq3HV9lChoBkdAYDZs/IKc/mgHTegDaAhHQH/VdOVPepJ1fZQoaAZHQGJ6ml67dzpoB03oA2gIR0B/2hlz2exwdX2UKGgGR0BfMSgTRIBjaAdN6ANoCEdAf/b2HtWuHXV9lChoBkdAXokgzP8htGgHTegDaAhHQH/+K7mMfih1fZQoaAZHQGJaxf4REndoB03oA2gIR0CABdR64UeudX2UKGgGR0BCe1kUbkwOaAdL/WgIR0CADwwTM7lrdX2UKGgGR0BgjRbW3BpIaAdN6ANoCEdAgBAsaCL/CXV9lChoBkdAY4l1Oj7AL2gHTegDaAhHQIAVGkgwGnp1fZQoaAZHQGIHb0e2d/doB03oA2gIR0CAGWMb3oLYdX2UKGgGR0BkMsbtJFspaAdN6ANoCEdAgBp5ZB9kSXV9lChoBkdAYVjEit7rs2gHTegDaAhHQIAblyPuG9J1fZQoaAZHQGbA+VC5VfhoB03oA2gIR0CAIqmVJL/TdX2UKGgGR0BidUUKzAvdaAdN6ANoCEdAgCR1zySV4XV9lChoBkdAYGVTEzfrKWgHTegDaAhHQIAnoq/dqL11fZQoaAZHQGChQVsUIs1oB03oA2gIR0CAJ8NYr8R+dX2UKGgGR0BidtsJpnHvaAdN6ANoCEdAgC3PLHMlknV9lChoBkdAZEN9MsYl6mgHTegDaAhHQIAuzHlwLmZ1fZQoaAZHQGcpHLzPKMhoB03oA2gIR0CAMI9jgAIZdX2UKGgGR0Bg8IKrq+rVaAdN6ANoCEdAgDK9nbqQinVlLg=="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 248, "observation_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVcAIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWCAAAAAAAAAABAQEBAQEBAZRoB4wCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoECiWCAAAAAAAAAABAQEBAQEBAZRoFEsIhZRoGHSUUpSMBl9zaGFwZZRLCIWUjANsb3eUaBAoliAAAAAAAAAAAAC0wgAAtMIAAKDAAACgwNsPScAAAKDAAAAAgAAAAICUaApLCIWUaBh0lFKUjARoaWdolGgQKJYgAAAAAAAAAAAAtEIAALRCAACgQAAAoEDbD0lAAACgQAAAgD8AAIA/lGgKSwiFlGgYdJRSlIwIbG93X3JlcHKUjFtbLTkwLiAgICAgICAgLTkwLiAgICAgICAgIC01LiAgICAgICAgIC01LiAgICAgICAgIC0zLjE0MTU5MjcgIC01LgogIC0wLiAgICAgICAgIC0wLiAgICAgICBdlIwJaGlnaF9yZXBylIxTWzkwLiAgICAgICAgOTAuICAgICAgICAgNS4gICAgICAgICA1LiAgICAgICAgIDMuMTQxNTkyNyAgNS4KICAxLiAgICAgICAgIDEuICAgICAgIF2UjApfbnBfcmFuZG9tlE51Yi4=", "dtype": "float32", "bounded_below": "[ True True True True True True True True]", "bounded_above": "[ True True True True True True True True]", "_shape": [8], "low": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "low_repr": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high_repr": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "_np_random": null}, "action_space": {":type:": "<class 'gymnasium.spaces.discrete.Discrete'>", ":serialized:": "gAWV1QAAAAAAAACMGWd5bW5hc2l1bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIBAAAAAAAAACUhpRSlIwFc3RhcnSUaAhoDkMIAAAAAAAAAACUhpRSlIwGX3NoYXBllCloCmgOjApfbnBfcmFuZG9tlE51Yi4=", "n": "4", "start": "0", "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 16, "n_steps": 1024, "gamma": 0.999, "gae_lambda": 0.98, "ent_coef": 0.01, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 128, "n_epochs": 4, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWV1gIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMYC9ob21lL2hvb2t6ZW5nL2FuYWNvbmRhMy9lbnZzL3B5MzgvbGliL3B5dGhvbjMuOC9zaXRlLXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS4RDAgABlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMYC9ob21lL2hvb2t6ZW5nL2FuYWNvbmRhMy9lbnZzL3B5MzgvbGliL3B5dGhvbjMuOC9zaXRlLXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlGgAjBJfZnVuY3Rpb25fc2V0c3RhdGWUk5RoH32UfZQoaBZoDYwMX19xdWFsbmFtZV9flIwZY29uc3RhbnRfZm4uPGxvY2Fscz4uZnVuY5SMD19fYW5ub3RhdGlvbnNfX5R9lIwOX19rd2RlZmF1bHRzX1+UTowMX19kZWZhdWx0c19flE6MCl9fbW9kdWxlX1+UaBeMB19fZG9jX1+UTowLX19jbG9zdXJlX1+UaACMCl9tYWtlX2NlbGyUk5RHP8mZmZmZmZqFlFKUhZSMF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWV1gIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMYC9ob21lL2hvb2t6ZW5nL2FuYWNvbmRhMy9lbnZzL3B5MzgvbGliL3B5dGhvbjMuOC9zaXRlLXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS4RDAgABlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMYC9ob21lL2hvb2t6ZW5nL2FuYWNvbmRhMy9lbnZzL3B5MzgvbGliL3B5dGhvbjMuOC9zaXRlLXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlGgAjBJfZnVuY3Rpb25fc2V0c3RhdGWUk5RoH32UfZQoaBZoDYwMX19xdWFsbmFtZV9flIwZY29uc3RhbnRfZm4uPGxvY2Fscz4uZnVuY5SMD19fYW5ub3RhdGlvbnNfX5R9lIwOX19rd2RlZmF1bHRzX1+UTowMX19kZWZhdWx0c19flE6MCl9fbW9kdWxlX1+UaBeMB19fZG9jX1+UTowLX19jbG9zdXJlX1+UaACMCl9tYWtlX2NlbGyUk5RHPzOpKjBVMmGFlFKUhZSMF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="}, "system_info": {"OS": "Linux-6.2.0-39-generic-x86_64-with-glibc2.17 # 40~22.04.1-Ubuntu SMP PREEMPT_DYNAMIC Thu Nov 16 10:53:04 UTC 2", "Python": "3.8.18", "Stable-Baselines3": "2.0.0a5", "PyTorch": "2.2.2+cu121", "GPU Enabled": "False", "Numpy": "1.24.4", "Cloudpickle": "3.0.0", "Gymnasium": "0.28.1"}}
 
1
+ {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7fb26a67dca0>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7fb26a67dd30>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7fb26a67ddc0>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7fb26a67de50>", "_build": "<function ActorCriticPolicy._build at 0x7fb26a67dee0>", "forward": "<function ActorCriticPolicy.forward at 0x7fb26a67df70>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x7fb26a602040>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7fb26a6020d0>", "_predict": "<function ActorCriticPolicy._predict at 0x7fb26a602160>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7fb26a6021f0>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7fb26a602280>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7fb26a602310>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc_data object at 0x7fb26a67c2a0>"}, "verbose": 1, "policy_kwargs": {}, "num_timesteps": 1015808, "_total_timesteps": 1000000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1712322867214142034, "learning_rate": 0.0003, "tensorboard_log": null, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAM2mDrz2/Cq6gORtO4Gbyzbwieo5Wj6JugAAgD8AAIA/U5AIvq7RhLr3hjU9u3phOfLNyDvlM0S6AACAPwAAgD+zspk99nxBujrOP7kDX5U248BMugajWTgAAIA/AACAP9rZ9z09hyG7YUkFupfWrTfPkWG8wnY7OQAAgD8AAIA/WmctvjjC67vOgCw8nDcbOt95Xz2j9QG7AACAPwAAgD9q9LI+xJM5P1EWnby3Q6O+M2oLvKsOBT0AAAAAAAAAAPrWEr5PkUo+FJAgPTMIV76ffae6/cocvQAAAAAAAAAAzctEPfaIGrpQweQ6PoyoNZ+MfDtmpwe6AACAPwAAgD8A6NY7cDCAP1CbKzyTZYa+ymI8vXZtNj0AAAAAAAAAAM3z1LwpOD+6tbx/vIfyxDXfEbg5Su4wtQAAgD8AAIA/gEMBPY9CVbiAlOq5Q3oWtkZ5dDv7VAo5AACAPwAAgD9QsH2+y/MpP9pOqztdZHO+WSFtvSD7sb0AAAAAAAAAAGa7/zyPHiK6LZvWOcmyBjXgdMs68HH4uAAAgD8AAIA/AFSwO4+eTbqSquk7pBi5NiagkrvcDrM1AACAPwAAgD+z61i9rSBHP4oh9Lwp4lG+W6hEvB0P37wAAAAAAAAAAABlsjxc6zK66NTWOlzykDXCIey5QCX5uQAAgD8AAIA/lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.015808000000000044, "_stats_window_size": 100, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVQwwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQGRHdNvfj0eMAWyUTegDjAF0lEdAe04qzZ6D5HV9lChoBkdAYLHOymhufmgHTegDaAhHQHtU98zAN5N1fZQoaAZHQGL143m3fANoB03oA2gIR0B7Vr3ai9IxdX2UKGgGR0BazbnLaEi/aAdN6ANoCEdAe1i6xPfsNXV9lChoBkdAYdFRQaaTfWgHTegDaAhHQHtcUc4o7V91fZQoaAZHQFy3rQPZqVRoB03oA2gIR0B7YAx59mYjdX2UKGgGR0Bg5M5jpcHGaAdN6ANoCEdAe2fkC3gDR3V9lChoBkdAZQQDUVi4KGgHTegDaAhHQHt2ZB5X2dx1fZQoaAZHwCl9KkEcKgJoB006AWgIR0B7fN7kXDWLdX2UKGgGR0Bb3J9E1EVnaAdN6ANoCEdAe4YEk0JnhHV9lChoBkdAQUsGC7K7qmgHTSIBaAhHQHuHEUO/cnF1fZQoaAZHQGFdXr2QGOdoB03oA2gIR0B7rHTgEU0vdX2UKGgGR0BdlX9itq59aAdN6ANoCEdAe68IhQm/nHV9lChoBkdAYoUwX668QWgHTegDaAhHQHuyPEn9ehR1fZQoaAZHQGB65Gz8gp1oB03oA2gIR0B7yIVj7Q9idX2UKGgGR0BessjNY8uBaAdN6ANoCEdAe8p5dGAkLXV9lChoBkdAYRmIMSbpeWgHTegDaAhHQHvMKvNeMQ51fZQoaAZHQF0HqubI91VoB03oA2gIR0B72by9VWCFdX2UKGgGR0BcuGQOnVG1aAdN6ANoCEdAe92D0UXYUXV9lChoBkdAZJxKyv9tM2gHTegDaAhHQHvllkMCtA91fZQoaAZHQFy/ztkWhytoB03oA2gIR0B754DZDiOvdX2UKGgGR0BrL+WnjyWiaAdNzANoCEdAe+eqYJE6UHV9lChoBkdAZJ0fHxSYPWgHTegDaAhHQHv20XLvCuV1fZQoaAZHQGJVBb4agmJoB03oA2gIR0B8Bio2n88+dX2UKGgGR0BsIFgfEGaAaAdN7AFoCEdAfAu1vl2eQXV9lChoBkdAYBoerdWQwWgHTegDaAhHQHwMn+ERJ3B1fZQoaAZHQFh6URFqi49oB03oA2gIR0B8FXryDqW1dX2UKGgGR0BgHz9hqj8DaAdN6ANoCEdAfBaRGMGX5XV9lChoBkfAJVRWtEG7jGgHTTkBaAhHQHwjUgSvkil1fZQoaAZHQFtOigTRIBloB03oA2gIR0B8M/EOy3TedX2UKGgGR0BeqmBvrGBGaAdN6ANoCEdAfD6neizsyHV9lChoBkdAY0csAeaKDWgHTegDaAhHQHxB7xmTTv11fZQoaAZHQFrhktEofCBoB03oA2gIR0B8WeNNrTH9dX2UKGgGR0BhytaB7NSqaAdN6ANoCEdAfFwaisXBQHV9lChoBkdAYtAL+glF+mgHTegDaAhHQHxtrQw9JSR1fZQoaAZHQGFMECeVcD9oB03oA2gIR0B8cckC3gDSdX2UKGgGR0BheAkqtozvaAdN6ANoCEdAfHsAAQxvenV9lChoBkdAXw6fSQYDT2gHTegDaAhHQHx9JvkzXSV1fZQoaAZHQGJzXuuzQeFoB03oA2gIR0B8fVX6qKgqdX2UKGgGR0BhqEtXgccVaAdN6ANoCEdAfJ0AE+xGD3V9lChoBkdAYxoyLQ5WBGgHTegDaAhHQHyizuv2XcB1fZQoaAZHQFwgrKeTV2BoB03oA2gIR0B8o7/5tWMkdX2UKGgGR0BhcbGaQV9GaAdN6ANoCEdAfKxctXgccXV9lChoBkdAYdxIT4+KTGgHTegDaAhHQHytYqPOpsJ1fZQoaAZHQGPJoikfs/poB03oA2gIR0B8uuj7ALy+dX2UKGgGR0A8dJ2+wkgPaAdL+2gIR0B8x6RvFWGRdX2UKGgGR0BaaDXnQpnZaAdN6ANoCEdAfMn+10DEFXV9lChoBkdAYOkDJ2dNFmgHTegDaAhHQHzMThLoOhF1fZQoaAZHQFsusSCe2/loB03oA2gIR0B815IsiB5HdX2UKGgGR0Bk7Y2GZeAvaAdN6ANoCEdAfOvpyIYWL3V9lChoBkdAY8uMqjJuEWgHTegDaAhHQHztoeLehwl1fZQoaAZHQF/i4QBgeBBoB03oA2gIR0B8+47tAs06dX2UKGgGR0Bb+9OVPepGaAdN6ANoCEdAfP8MpgCwKXV9lChoBkdAXhNNGmUGFGgHTegDaAhHQH0G9a6jFhp1fZQoaAZHQFoEVN5+pfhoB03oA2gIR0B9COfYjB2wdX2UKGgGR0BgAKij+JgtaAdN6ANoCEdAfQkQTmGM43V9lChoBkdAGV/N7jT8YWgHTRgBaAhHQH0O2d3B55Z1fZQoaAZHQGNAGyPdVNpoB03oA2gIR0B9JRrhzeXSdX2UKGgGR0BiXX7aZhKEaAdN6ANoCEdAfSoHuZ1FIHV9lChoBkdAW+YSamXPaGgHTegDaAhHQH0y0zCUHIJ1fZQoaAZHQGHAqmTC+DhoB03oA2gIR0B9M8LXtjTbdX2UKGgGR0Bi4bUmUnogaAdN6ANoCEdAfT+5tWMjvHV9lChoBkdAYL87MgU1ymgHTegDaAhHQH1MMBp5/sp1fZQoaAZHQAGt9QXQ+lloB00IAWgIR0B9TSA5Jbt7dX2UKGgGR0BaqUbkwN9ZaAdN6ANoCEdAfU55Dqnm73V9lChoBkdAYivnwob4rWgHTegDaAhHQH1QjufEn9h1fZQoaAZHQFs5doWYWtVoB03oA2gIR0B9U0Pf8/D+dX2UKGgGR0BdQnE61b7kaAdN6ANoCEdAfW8bbUPQOXV9lChoBkdAWJnmmtQsPWgHTegDaAhHQH2CWj0th/l1fZQoaAZHQGMaBq0tyxRoB03oA2gIR0B9htVNpM6BdX2UKGgGR0BiVbYXfqHHaAdN6ANoCEdAfZFL3sXzlXV9lChoBkdAWq0Rbr1M/WgHTegDaAhHQH2T6/20zCV1fZQoaAZHQGCf7dJrcj9oB03oA2gIR0B9lCInBtUGdX2UKGgGR0BiGI9ovi97aAdN6ANoCEdAfZtoTwlSj3V9lChoBkdAXoNAu7HyVmgHTegDaAhHQH221EVnEl51fZQoaAZHQGHbDopx3mpoB03oA2gIR0B9yFFUhmoSdX2UKGgGR0BhOo+0PYnOaAdN6ANoCEdAfcmIWP91l3V9lChoBkdAYF3sqrilzmgHTegDaAhHQH3ZFwHZ9NN1fZQoaAZHQFm+xaPjn3doB03oA2gIR0B96QUYbbUPdX2UKGgGR0BgIYywfQruaAdN6ANoCEdAfeoa6z3RHHV9lChoBkdAYwCs4ku6E2gHTegDaAhHQH3rsWoFV1h1fZQoaAZHQGQGnSv1UVBoB03oA2gIR0B97jC2tuDSdX2UKGgGR0BhjdhsqJ/HaAdN6ANoCEdAffFv/BFd9nV9lChoBkdAYKyIsyzolmgHTegDaAhHQH4RzmSyMUB1fZQoaAZHQGOylum78NxoB03oA2gIR0B+J0ySFGoadX2UKGgGR0A4CRDkU9IPaAdNQgFoCEdAfiuJk5IYnHV9lChoBkdAX95Q3xWkrWgHTegDaAhHQH4r7hvR7Z51fZQoaAZHQFt4SW7e2uxoB03oA2gIR0B+NeH+IdlvdX2UKGgGR0BiMUTHsC1aaAdN6ANoCEdAfjg16mfoR3V9lChoBkdAZL+vxH5JsmgHTegDaAhHQH44aBNEgGN1fZQoaAZHQGEcCcoYvWZoB03oA2gIR0B+P1X1anrIdX2UKGgGR0Bcv4SQHRkVaAdN6ANoCEdAflkFt8/lhnV9lChoBkdAJIdSMtK7I2gHTSIBaAhHQH5grI91U2l1fZQoaAZHQGLwifQKKHhoB03oA2gIR0B+aMvrWy1NdX2UKGgGR0Bg4K2tuDSPaAdN6ANoCEdAfmnTIeYD1XV9lChoBkdAXifRv3rUsmgHTegDaAhHQH52P/m1YyR1fZQoaAZHQGXlmvnr6cloB03oA2gIR0B+g0Kx9oexdX2UKGgGR0BeUvT1CgK4aAdN6ANoCEdAfoQ371qWT3V9lChoBkdAYC4Z88cMmWgHTegDaAhHQH6FlU6xPft1fZQoaAZHQGQCFxXGOuJoB03oA2gIR0B+h9lg+hXbdWUu"}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 248, "observation_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVcAIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWCAAAAAAAAAABAQEBAQEBAZRoB4wCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoECiWCAAAAAAAAAABAQEBAQEBAZRoFEsIhZRoGHSUUpSMBl9zaGFwZZRLCIWUjANsb3eUaBAoliAAAAAAAAAAAAC0wgAAtMIAAKDAAACgwNsPScAAAKDAAAAAgAAAAICUaApLCIWUaBh0lFKUjARoaWdolGgQKJYgAAAAAAAAAAAAtEIAALRCAACgQAAAoEDbD0lAAACgQAAAgD8AAIA/lGgKSwiFlGgYdJRSlIwIbG93X3JlcHKUjFtbLTkwLiAgICAgICAgLTkwLiAgICAgICAgIC01LiAgICAgICAgIC01LiAgICAgICAgIC0zLjE0MTU5MjcgIC01LgogIC0wLiAgICAgICAgIC0wLiAgICAgICBdlIwJaGlnaF9yZXBylIxTWzkwLiAgICAgICAgOTAuICAgICAgICAgNS4gICAgICAgICA1LiAgICAgICAgIDMuMTQxNTkyNyAgNS4KICAxLiAgICAgICAgIDEuICAgICAgIF2UjApfbnBfcmFuZG9tlE51Yi4=", "dtype": "float32", "bounded_below": "[ True True True True True True True True]", "bounded_above": "[ True True True True True True True True]", "_shape": [8], "low": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "low_repr": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high_repr": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "_np_random": null}, "action_space": {":type:": "<class 'gymnasium.spaces.discrete.Discrete'>", ":serialized:": "gAWV1QAAAAAAAACMGWd5bW5hc2l1bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIBAAAAAAAAACUhpRSlIwFc3RhcnSUaAhoDkMIAAAAAAAAAACUhpRSlIwGX3NoYXBllCloCmgOjApfbnBfcmFuZG9tlE51Yi4=", "n": "4", "start": "0", "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 16, "n_steps": 1024, "gamma": 0.999, "gae_lambda": 0.98, "ent_coef": 0.01, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 256, "n_epochs": 4, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWV1gIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMYC9ob21lL2hvb2t6ZW5nL2FuYWNvbmRhMy9lbnZzL3B5MzgvbGliL3B5dGhvbjMuOC9zaXRlLXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS4RDAgABlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMYC9ob21lL2hvb2t6ZW5nL2FuYWNvbmRhMy9lbnZzL3B5MzgvbGliL3B5dGhvbjMuOC9zaXRlLXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlGgAjBJfZnVuY3Rpb25fc2V0c3RhdGWUk5RoH32UfZQoaBZoDYwMX19xdWFsbmFtZV9flIwZY29uc3RhbnRfZm4uPGxvY2Fscz4uZnVuY5SMD19fYW5ub3RhdGlvbnNfX5R9lIwOX19rd2RlZmF1bHRzX1+UTowMX19kZWZhdWx0c19flE6MCl9fbW9kdWxlX1+UaBeMB19fZG9jX1+UTowLX19jbG9zdXJlX1+UaACMCl9tYWtlX2NlbGyUk5RHP8mZmZmZmZqFlFKUhZSMF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWV1gIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMYC9ob21lL2hvb2t6ZW5nL2FuYWNvbmRhMy9lbnZzL3B5MzgvbGliL3B5dGhvbjMuOC9zaXRlLXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS4RDAgABlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMYC9ob21lL2hvb2t6ZW5nL2FuYWNvbmRhMy9lbnZzL3B5MzgvbGliL3B5dGhvbjMuOC9zaXRlLXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlGgAjBJfZnVuY3Rpb25fc2V0c3RhdGWUk5RoH32UfZQoaBZoDYwMX19xdWFsbmFtZV9flIwZY29uc3RhbnRfZm4uPGxvY2Fscz4uZnVuY5SMD19fYW5ub3RhdGlvbnNfX5R9lIwOX19rd2RlZmF1bHRzX1+UTowMX19kZWZhdWx0c19flE6MCl9fbW9kdWxlX1+UaBeMB19fZG9jX1+UTowLX19jbG9zdXJlX1+UaACMCl9tYWtlX2NlbGyUk5RHPzOpKjBVMmGFlFKUhZSMF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="}, "system_info": {"OS": "Linux-6.2.0-39-generic-x86_64-with-glibc2.17 # 40~22.04.1-Ubuntu SMP PREEMPT_DYNAMIC Thu Nov 16 10:53:04 UTC 2", "Python": "3.8.18", "Stable-Baselines3": "2.0.0a5", "PyTorch": "2.2.2+cu121", "GPU Enabled": "False", "Numpy": "1.24.4", "Cloudpickle": "3.0.0", "Gymnasium": "0.28.1"}}
ppo-LunarLander-v2.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:890c065099b0ddd693a8d4f607420ef1b6761434514aefb7b61eed7e269e553d
3
  size 147601
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a0b2c2670c646e9adb567ee37983c5a2347e6f9c0bd879a5c5c76caf2a92bd30
3
  size 147601
ppo-LunarLander-v2/data CHANGED
@@ -4,20 +4,20 @@
4
  ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
5
  "__module__": "stable_baselines3.common.policies",
6
  "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
7
- "__init__": "<function ActorCriticPolicy.__init__ at 0x7efded27dca0>",
8
- "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7efded27dd30>",
9
- "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7efded27ddc0>",
10
- "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7efded27de50>",
11
- "_build": "<function ActorCriticPolicy._build at 0x7efded27dee0>",
12
- "forward": "<function ActorCriticPolicy.forward at 0x7efded27df70>",
13
- "extract_features": "<function ActorCriticPolicy.extract_features at 0x7efded202040>",
14
- "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7efded2020d0>",
15
- "_predict": "<function ActorCriticPolicy._predict at 0x7efded202160>",
16
- "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7efded2021f0>",
17
- "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7efded202280>",
18
- "predict_values": "<function ActorCriticPolicy.predict_values at 0x7efded202310>",
19
  "__abstractmethods__": "frozenset()",
20
- "_abc_impl": "<_abc_data object at 0x7efded27c2d0>"
21
  },
22
  "verbose": 1,
23
  "policy_kwargs": {},
@@ -26,12 +26,12 @@
26
  "_num_timesteps_at_start": 0,
27
  "seed": null,
28
  "action_noise": null,
29
- "start_time": 1712322094998193614,
30
  "learning_rate": 0.0003,
31
  "tensorboard_log": null,
32
  "_last_obs": {
33
  ":type:": "<class 'numpy.ndarray'>",
34
- ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAGZhhbxSmOG5qtKvObuD9rVEWvy6okrPuAAAgD8AAIA/hsotPnRNhLxOz8Q5MYscuCr05r0ZhQO5AACAPwAAgD/QZqq+l+5KP100Fz7063C+OUeqvUVlvz0AAAAAAAAAAM19M72P3nm6N6OIuYmrg7TS30a7KqOfOAAAgD8AAIA/M5x1PcPtMrqqpjw8bU65NkPBHLvn3K01AACAPwAAgD8z+1S9rnWJuspfnTlSg5G20TNvutAHtrgAAIA/AACAP/O6tj2PxmG69FQzvLVnF7Z0HL+68quLNQAAgD8AAIA/WlGJPTiqwD0zLAC+RURVvvae5rv1oK69AAAAAAAAAAATqjA+D7BlP16BVbz6dZW+nTHVPbplYr0AAAAAAAAAANPvHT6sxpU/aneYPsmswL7Lsuw9pRPHOwAAAAAAAAAAAGwwPXsanrr6CJS7q9wEtWgUTbr0uao6AACAPwAAgD/m0YG93r2ZPcMDRz4zlGG+FGeFPZurKD0AAAAAAAAAAKYnsb0G+Sw/m3PjPXOhiL6xc586eHkkPQAAAAAAAAAAAPg0O7jm5rmJ3Q66VpmLtVFxmLpr1SY5AACAPwAAgD9aMaI9H031uaQaJrtm6++1mJCwOirDPjoAAIA/AACAP5rZ/ToU3sK6VjB1urXLTTuVXAs7MstevAAAgD8AAIA/lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="
35
  },
36
  "_last_episode_starts": {
37
  ":type:": "<class 'numpy.ndarray'>",
@@ -45,7 +45,7 @@
45
  "_stats_window_size": 100,
46
  "ep_info_buffer": {
47
  ":type:": "<class 'collections.deque'>",
48
- ":serialized:": "gAWVQQwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQE46o+fRNRGMAWyUS9iMAXSUR0B9G5wjt5UtdX2UKGgGR0BkWQu/UONHaAdN6ANoCEdAfSBwsGxD9nV9lChoBkdAZbcMUh3aBmgHTegDaAhHQH0qTfrKNhp1fZQoaAZHQGLwXjlxOtZoB03oA2gIR0B9MjCbc45tdX2UKGgGR0BgN8xIre67aAdN6ANoCEdAfUBIcinpCHV9lChoBkdAZnzzRQaaTmgHTegDaAhHQH1XYk/r0J51fZQoaAZHQGJF6F/QSjBoB03oA2gIR0B9Y6+Jxeb/dX2UKGgGR0Bk9//95yEMaAdN6ANoCEdAfW6lXzUZvXV9lChoBkdAZkiY+B6KL2gHTegDaAhHQH1wTUAksz51fZQoaAZHQGLLta6jFhpoB03oA2gIR0B9cY7cO9WZdX2UKGgGR0Bc9SUcGTs6aAdN6ANoCEdAfXRVxjriVHV9lChoBkdAYeGplSS/02gHTegDaAhHQH2EYpMHryF1fZQoaAZHQGPq/+sHSndoB03oA2gIR0B9iGaTfR/mdX2UKGgGR0AjM6QvHtF8aAdL9WgIR0B9jxEPUaybdX2UKGgGR0BkvO6d1+y7aAdN6ANoCEdAfY9VLBbfQHV9lChoBkdAY/ipo9LYgGgHTegDaAhHQH2bvc8DB/J1fZQoaAZHQGA3liSaEzxoB03oA2gIR0B9sKr+5vtMdX2UKGgGR0BVwfIOpbUxaAdN6ANoCEdAfbQI55qubXV9lChoBkdAY4/yEtdzGWgHTegDaAhHQH234+B6KLt1fZQoaAZHQGGtnWz4UN9oB03oA2gIR0B9v3di2DxtdX2UKGgGR0BlQdEuxrzoaAdN6ANoCEdAfcWYtQKrrHV9lChoBkdAZdEu5jH4oWgHTegDaAhHQH3Re4oZydZ1fZQoaAZHQGV/nw5NoJ1oB03oA2gIR0B95Do4dZJTdX2UKGgGR0BmLupMpPRBaAdN6ANoCEdAfe3TA31jAnV9lChoBkdAYjpjx0+1SmgHTegDaAhHQH32G47Rv3t1fZQoaAZHQGT8JXp4bCJoB03oA2gIR0B9+EKUmlZYdX2UKGgGR0BlShgiNbTuaAdN6ANoCEdAffpfyf+S83V9lChoBkdAXnHZAY51eWgHTegDaAhHQH4GqgyuZCx1fZQoaAZHQGUYNOEdvKloB03oA2gIR0B+CZntfG+9dX2UKGgGR0BkHnXoTwlTaAdN6ANoCEdAfg7QRPGhmHV9lChoBkdAYLzkWhysCGgHTegDaAhHQH4PBN21Ul11fZQoaAZHQGCpL1/Ue+5oB03oA2gIR0B+GXNY8uBddX2UKGgGR0BjccR6F/QTaAdN6ANoCEdAfhslvZRKpXV9lChoBkdAaOZFKkEcKmgHTegDaAhHQH43WVAzHjp1fZQoaAZHQGA+Wf9P1thoB03oA2gIR0B+Ot3fQ8fWdX2UKGgGR0Bc9qq814xDaAdN6ANoCEdAfkIHU+cH4XV9lChoBkdAYdlYEGJN02gHTegDaAhHQH5IDoUzsQd1fZQoaAZHQGRvT7l7tzFoB03oA2gIR0B+VBxAB1cMdX2UKGgGR0BlfCScLBsRaAdN6ANoCEdAfmhd/J/5L3V9lChoBkdAYp7/jKgZj2gHTegDaAhHQH5zC9EkSmJ1fZQoaAZHQF4l6jWTX8RoB03oA2gIR0B+fDffoA4odX2UKGgGR0BnANm6GxlhaAdN6ANoCEdAfn6qoZQ53nV9lChoBkdAYYtcHGCI12gHTegDaAhHQH6BLKFIuoR1fZQoaAZHQGTT1Ed/8VJoB03oA2gIR0B+kJ4mkWRBdX2UKGgGR0Bfgrns9jgAaAdN6ANoCEdAfpRhXr+o+HV9lChoBkdAXqEfyPMjeWgHTegDaAhHQH6bGEPDpC91fZQoaAZHQGJA7pV0cOtoB03oA2gIR0B+m1iqhlDndX2UKGgGR0Be0JTER8MNaAdN6ANoCEdAfqeyLQ5WBHV9lChoBkdAYUU6qbSZ0GgHTegDaAhHQH6pvQnhKlJ1fZQoaAZHQGC/l+3H7xdoB03oA2gIR0B+rVsLv1DjdX2UKGgGR0BkChrrPdEcaAdN6ANoCEdAfsZmmtQsPXV9lChoBkdAYNVarWAf+2gHTegDaAhHQH7PJTER8MN1fZQoaAZHQFwSiWVu76JoB03oA2gIR0B+1nHaN+9bdX2UKGgGR0Bj+lV/+bVjaAdN6ANoCEdAfuTP0qYqonV9lChoBkdAZQS32EkB0mgHTegDaAhHQH77OdXko4N1fZQoaAZHQGGgjA8B+4NoB03oA2gIR0B/Behf0EowdX2UKGgGR0Bk9RLCemNzaAdN6ANoCEdAfw82xY7q6nV9lChoBkdAZvOK+i8Fp2gHTegDaAhHQH8RjkMkQf91fZQoaAZHQGS2YNqgyuZoB03oA2gIR0B/E/IikftAdX2UKGgGR0BexIXoC+10aAdN6ANoCEdAfyE2M85jpnV9lChoBkdAZiXVhCtzS2gHTegDaAhHQH8kVhoduHh1fZQoaAZHQGNHrxRVIZtoB03oA2gIR0B/KdLxqfvndX2UKGgGR0BkG9fCyhSMaAdN6ANoCEdAfyoMUAT7EnV9lChoBkdAWxUXcgyM1mgHTegDaAhHQH8033UQTVV1fZQoaAZHQGClehGpdbBoB03oA2gIR0B/NrPw/gR9dX2UKGgGR0BldmQ6p5u7aAdN6ANoCEdAfzncy31BdHV9lChoBkdAZNCLiuMdcWgHTegDaAhHQH9Pj1XeWOZ1fZQoaAZHQGWurUkOZstoB03oA2gIR0B/V52eQMhHdX2UKGgGR0Be9L3sXzlLaAdN6ANoCEdAf16UxVQyh3V9lChoBkdAZC9ReC04R2gHTegDaAhHQH9so0IkZ751fZQoaAZHQF20+RYA80VoB03oA2gIR0B/hBcGC7K8dX2UKGgGR0BkzDj94u9OaAdN6ANoCEdAf5CpEhJRO3V9lChoBkdAXdVObiIcimgHTegDaAhHQH+blyaNMoN1fZQoaAZHQF9t6Skj5bhoB03oA2gIR0B/noKLKmsOdX2UKGgGR0BhIjWsijcmaAdN6ANoCEdAf6GFOfukUXV9lChoBkdAYu3b/wRXfmgHTegDaAhHQH+0UNKAavR1fZQoaAZHQGXf2fkFOfxoB03oA2gIR0B/uMytV7x/dX2UKGgGR0BgeByXD3ueaAdN6ANoCEdAf8CS1Vo6CHV9lChoBkdAYzSiO/+Kj2gHTegDaAhHQH/A5SWJJoV1fZQoaAZHQGUEO7QLNOdoB03oA2gIR0B/zyNMoMKDdX2UKGgGR0BnrDTBqKxcaAdN6ANoCEdAf9FugYgq3HV9lChoBkdAYDZs/IKc/mgHTegDaAhHQH/VdOVPepJ1fZQoaAZHQGJ6ml67dzpoB03oA2gIR0B/2hlz2exwdX2UKGgGR0BfMSgTRIBjaAdN6ANoCEdAf/b2HtWuHXV9lChoBkdAXokgzP8htGgHTegDaAhHQH/+K7mMfih1fZQoaAZHQGJaxf4REndoB03oA2gIR0CABdR64UeudX2UKGgGR0BCe1kUbkwOaAdL/WgIR0CADwwTM7lrdX2UKGgGR0BgjRbW3BpIaAdN6ANoCEdAgBAsaCL/CXV9lChoBkdAY4l1Oj7AL2gHTegDaAhHQIAVGkgwGnp1fZQoaAZHQGIHb0e2d/doB03oA2gIR0CAGWMb3oLYdX2UKGgGR0BkMsbtJFspaAdN6ANoCEdAgBp5ZB9kSXV9lChoBkdAYVjEit7rs2gHTegDaAhHQIAblyPuG9J1fZQoaAZHQGbA+VC5VfhoB03oA2gIR0CAIqmVJL/TdX2UKGgGR0BidUUKzAvdaAdN6ANoCEdAgCR1zySV4XV9lChoBkdAYGVTEzfrKWgHTegDaAhHQIAnoq/dqL11fZQoaAZHQGChQVsUIs1oB03oA2gIR0CAJ8NYr8R+dX2UKGgGR0BidtsJpnHvaAdN6ANoCEdAgC3PLHMlknV9lChoBkdAZEN9MsYl6mgHTegDaAhHQIAuzHlwLmZ1fZQoaAZHQGcpHLzPKMhoB03oA2gIR0CAMI9jgAIZdX2UKGgGR0Bg8IKrq+rVaAdN6ANoCEdAgDK9nbqQinVlLg=="
49
  },
50
  "ep_success_buffer": {
51
  ":type:": "<class 'collections.deque'>",
@@ -83,7 +83,7 @@
83
  "ent_coef": 0.01,
84
  "vf_coef": 0.5,
85
  "max_grad_norm": 0.5,
86
- "batch_size": 128,
87
  "n_epochs": 4,
88
  "clip_range": {
89
  ":type:": "<class 'function'>",
 
4
  ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
5
  "__module__": "stable_baselines3.common.policies",
6
  "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
7
+ "__init__": "<function ActorCriticPolicy.__init__ at 0x7fb26a67dca0>",
8
+ "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7fb26a67dd30>",
9
+ "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7fb26a67ddc0>",
10
+ "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7fb26a67de50>",
11
+ "_build": "<function ActorCriticPolicy._build at 0x7fb26a67dee0>",
12
+ "forward": "<function ActorCriticPolicy.forward at 0x7fb26a67df70>",
13
+ "extract_features": "<function ActorCriticPolicy.extract_features at 0x7fb26a602040>",
14
+ "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7fb26a6020d0>",
15
+ "_predict": "<function ActorCriticPolicy._predict at 0x7fb26a602160>",
16
+ "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7fb26a6021f0>",
17
+ "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7fb26a602280>",
18
+ "predict_values": "<function ActorCriticPolicy.predict_values at 0x7fb26a602310>",
19
  "__abstractmethods__": "frozenset()",
20
+ "_abc_impl": "<_abc_data object at 0x7fb26a67c2a0>"
21
  },
22
  "verbose": 1,
23
  "policy_kwargs": {},
 
26
  "_num_timesteps_at_start": 0,
27
  "seed": null,
28
  "action_noise": null,
29
+ "start_time": 1712322867214142034,
30
  "learning_rate": 0.0003,
31
  "tensorboard_log": null,
32
  "_last_obs": {
33
  ":type:": "<class 'numpy.ndarray'>",
34
+ ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAM2mDrz2/Cq6gORtO4Gbyzbwieo5Wj6JugAAgD8AAIA/U5AIvq7RhLr3hjU9u3phOfLNyDvlM0S6AACAPwAAgD+zspk99nxBujrOP7kDX5U248BMugajWTgAAIA/AACAP9rZ9z09hyG7YUkFupfWrTfPkWG8wnY7OQAAgD8AAIA/WmctvjjC67vOgCw8nDcbOt95Xz2j9QG7AACAPwAAgD9q9LI+xJM5P1EWnby3Q6O+M2oLvKsOBT0AAAAAAAAAAPrWEr5PkUo+FJAgPTMIV76ffae6/cocvQAAAAAAAAAAzctEPfaIGrpQweQ6PoyoNZ+MfDtmpwe6AACAPwAAgD8A6NY7cDCAP1CbKzyTZYa+ymI8vXZtNj0AAAAAAAAAAM3z1LwpOD+6tbx/vIfyxDXfEbg5Su4wtQAAgD8AAIA/gEMBPY9CVbiAlOq5Q3oWtkZ5dDv7VAo5AACAPwAAgD9QsH2+y/MpP9pOqztdZHO+WSFtvSD7sb0AAAAAAAAAAGa7/zyPHiK6LZvWOcmyBjXgdMs68HH4uAAAgD8AAIA/AFSwO4+eTbqSquk7pBi5NiagkrvcDrM1AACAPwAAgD+z61i9rSBHP4oh9Lwp4lG+W6hEvB0P37wAAAAAAAAAAABlsjxc6zK66NTWOlzykDXCIey5QCX5uQAAgD8AAIA/lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="
35
  },
36
  "_last_episode_starts": {
37
  ":type:": "<class 'numpy.ndarray'>",
 
45
  "_stats_window_size": 100,
46
  "ep_info_buffer": {
47
  ":type:": "<class 'collections.deque'>",
48
+ ":serialized:": "gAWVQwwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQGRHdNvfj0eMAWyUTegDjAF0lEdAe04qzZ6D5HV9lChoBkdAYLHOymhufmgHTegDaAhHQHtU98zAN5N1fZQoaAZHQGL143m3fANoB03oA2gIR0B7Vr3ai9IxdX2UKGgGR0BazbnLaEi/aAdN6ANoCEdAe1i6xPfsNXV9lChoBkdAYdFRQaaTfWgHTegDaAhHQHtcUc4o7V91fZQoaAZHQFy3rQPZqVRoB03oA2gIR0B7YAx59mYjdX2UKGgGR0Bg5M5jpcHGaAdN6ANoCEdAe2fkC3gDR3V9lChoBkdAZQQDUVi4KGgHTegDaAhHQHt2ZB5X2dx1fZQoaAZHwCl9KkEcKgJoB006AWgIR0B7fN7kXDWLdX2UKGgGR0Bb3J9E1EVnaAdN6ANoCEdAe4YEk0JnhHV9lChoBkdAQUsGC7K7qmgHTSIBaAhHQHuHEUO/cnF1fZQoaAZHQGFdXr2QGOdoB03oA2gIR0B7rHTgEU0vdX2UKGgGR0BdlX9itq59aAdN6ANoCEdAe68IhQm/nHV9lChoBkdAYoUwX668QWgHTegDaAhHQHuyPEn9ehR1fZQoaAZHQGB65Gz8gp1oB03oA2gIR0B7yIVj7Q9idX2UKGgGR0BessjNY8uBaAdN6ANoCEdAe8p5dGAkLXV9lChoBkdAYRmIMSbpeWgHTegDaAhHQHvMKvNeMQ51fZQoaAZHQF0HqubI91VoB03oA2gIR0B72by9VWCFdX2UKGgGR0BcuGQOnVG1aAdN6ANoCEdAe92D0UXYUXV9lChoBkdAZJxKyv9tM2gHTegDaAhHQHvllkMCtA91fZQoaAZHQFy/ztkWhytoB03oA2gIR0B754DZDiOvdX2UKGgGR0BrL+WnjyWiaAdNzANoCEdAe+eqYJE6UHV9lChoBkdAZJ0fHxSYPWgHTegDaAhHQHv20XLvCuV1fZQoaAZHQGJVBb4agmJoB03oA2gIR0B8Bio2n88+dX2UKGgGR0BsIFgfEGaAaAdN7AFoCEdAfAu1vl2eQXV9lChoBkdAYBoerdWQwWgHTegDaAhHQHwMn+ERJ3B1fZQoaAZHQFh6URFqi49oB03oA2gIR0B8FXryDqW1dX2UKGgGR0BgHz9hqj8DaAdN6ANoCEdAfBaRGMGX5XV9lChoBkfAJVRWtEG7jGgHTTkBaAhHQHwjUgSvkil1fZQoaAZHQFtOigTRIBloB03oA2gIR0B8M/EOy3TedX2UKGgGR0BeqmBvrGBGaAdN6ANoCEdAfD6neizsyHV9lChoBkdAY0csAeaKDWgHTegDaAhHQHxB7xmTTv11fZQoaAZHQFrhktEofCBoB03oA2gIR0B8WeNNrTH9dX2UKGgGR0BhytaB7NSqaAdN6ANoCEdAfFwaisXBQHV9lChoBkdAYtAL+glF+mgHTegDaAhHQHxtrQw9JSR1fZQoaAZHQGFMECeVcD9oB03oA2gIR0B8cckC3gDSdX2UKGgGR0BheAkqtozvaAdN6ANoCEdAfHsAAQxvenV9lChoBkdAXw6fSQYDT2gHTegDaAhHQHx9JvkzXSV1fZQoaAZHQGJzXuuzQeFoB03oA2gIR0B8fVX6qKgqdX2UKGgGR0BhqEtXgccVaAdN6ANoCEdAfJ0AE+xGD3V9lChoBkdAYxoyLQ5WBGgHTegDaAhHQHyizuv2XcB1fZQoaAZHQFwgrKeTV2BoB03oA2gIR0B8o7/5tWMkdX2UKGgGR0BhcbGaQV9GaAdN6ANoCEdAfKxctXgccXV9lChoBkdAYdxIT4+KTGgHTegDaAhHQHytYqPOpsJ1fZQoaAZHQGPJoikfs/poB03oA2gIR0B8uuj7ALy+dX2UKGgGR0A8dJ2+wkgPaAdL+2gIR0B8x6RvFWGRdX2UKGgGR0BaaDXnQpnZaAdN6ANoCEdAfMn+10DEFXV9lChoBkdAYOkDJ2dNFmgHTegDaAhHQHzMThLoOhF1fZQoaAZHQFsusSCe2/loB03oA2gIR0B815IsiB5HdX2UKGgGR0Bk7Y2GZeAvaAdN6ANoCEdAfOvpyIYWL3V9lChoBkdAY8uMqjJuEWgHTegDaAhHQHztoeLehwl1fZQoaAZHQF/i4QBgeBBoB03oA2gIR0B8+47tAs06dX2UKGgGR0Bb+9OVPepGaAdN6ANoCEdAfP8MpgCwKXV9lChoBkdAXhNNGmUGFGgHTegDaAhHQH0G9a6jFhp1fZQoaAZHQFoEVN5+pfhoB03oA2gIR0B9COfYjB2wdX2UKGgGR0BgAKij+JgtaAdN6ANoCEdAfQkQTmGM43V9lChoBkdAGV/N7jT8YWgHTRgBaAhHQH0O2d3B55Z1fZQoaAZHQGNAGyPdVNpoB03oA2gIR0B9JRrhzeXSdX2UKGgGR0BiXX7aZhKEaAdN6ANoCEdAfSoHuZ1FIHV9lChoBkdAW+YSamXPaGgHTegDaAhHQH0y0zCUHIJ1fZQoaAZHQGHAqmTC+DhoB03oA2gIR0B9M8LXtjTbdX2UKGgGR0Bi4bUmUnogaAdN6ANoCEdAfT+5tWMjvHV9lChoBkdAYL87MgU1ymgHTegDaAhHQH1MMBp5/sp1fZQoaAZHQAGt9QXQ+lloB00IAWgIR0B9TSA5Jbt7dX2UKGgGR0BaqUbkwN9ZaAdN6ANoCEdAfU55Dqnm73V9lChoBkdAYivnwob4rWgHTegDaAhHQH1QjufEn9h1fZQoaAZHQFs5doWYWtVoB03oA2gIR0B9U0Pf8/D+dX2UKGgGR0BdQnE61b7kaAdN6ANoCEdAfW8bbUPQOXV9lChoBkdAWJnmmtQsPWgHTegDaAhHQH2CWj0th/l1fZQoaAZHQGMaBq0tyxRoB03oA2gIR0B9htVNpM6BdX2UKGgGR0BiVbYXfqHHaAdN6ANoCEdAfZFL3sXzlXV9lChoBkdAWq0Rbr1M/WgHTegDaAhHQH2T6/20zCV1fZQoaAZHQGCf7dJrcj9oB03oA2gIR0B9lCInBtUGdX2UKGgGR0BiGI9ovi97aAdN6ANoCEdAfZtoTwlSj3V9lChoBkdAXoNAu7HyVmgHTegDaAhHQH221EVnEl51fZQoaAZHQGHbDopx3mpoB03oA2gIR0B9yFFUhmoSdX2UKGgGR0BhOo+0PYnOaAdN6ANoCEdAfcmIWP91l3V9lChoBkdAYF3sqrilzmgHTegDaAhHQH3ZFwHZ9NN1fZQoaAZHQFm+xaPjn3doB03oA2gIR0B96QUYbbUPdX2UKGgGR0BgIYywfQruaAdN6ANoCEdAfeoa6z3RHHV9lChoBkdAYwCs4ku6E2gHTegDaAhHQH3rsWoFV1h1fZQoaAZHQGQGnSv1UVBoB03oA2gIR0B97jC2tuDSdX2UKGgGR0BhjdhsqJ/HaAdN6ANoCEdAffFv/BFd9nV9lChoBkdAYKyIsyzolmgHTegDaAhHQH4RzmSyMUB1fZQoaAZHQGOylum78NxoB03oA2gIR0B+J0ySFGoadX2UKGgGR0A4CRDkU9IPaAdNQgFoCEdAfiuJk5IYnHV9lChoBkdAX95Q3xWkrWgHTegDaAhHQH4r7hvR7Z51fZQoaAZHQFt4SW7e2uxoB03oA2gIR0B+NeH+IdlvdX2UKGgGR0BiMUTHsC1aaAdN6ANoCEdAfjg16mfoR3V9lChoBkdAZL+vxH5JsmgHTegDaAhHQH44aBNEgGN1fZQoaAZHQGEcCcoYvWZoB03oA2gIR0B+P1X1anrIdX2UKGgGR0Bcv4SQHRkVaAdN6ANoCEdAflkFt8/lhnV9lChoBkdAJIdSMtK7I2gHTSIBaAhHQH5grI91U2l1fZQoaAZHQGLwifQKKHhoB03oA2gIR0B+aMvrWy1NdX2UKGgGR0Bg4K2tuDSPaAdN6ANoCEdAfmnTIeYD1XV9lChoBkdAXifRv3rUsmgHTegDaAhHQH52P/m1YyR1fZQoaAZHQGXlmvnr6cloB03oA2gIR0B+g0Kx9oexdX2UKGgGR0BeUvT1CgK4aAdN6ANoCEdAfoQ371qWT3V9lChoBkdAYC4Z88cMmWgHTegDaAhHQH6FlU6xPft1fZQoaAZHQGQCFxXGOuJoB03oA2gIR0B+h9lg+hXbdWUu"
49
  },
50
  "ep_success_buffer": {
51
  ":type:": "<class 'collections.deque'>",
 
83
  "ent_coef": 0.01,
84
  "vf_coef": 0.5,
85
  "max_grad_norm": 0.5,
86
+ "batch_size": 256,
87
  "n_epochs": 4,
88
  "clip_range": {
89
  ":type:": "<class 'function'>",
ppo-LunarLander-v2/policy.optimizer.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:071ebaa3cc3626b31dff97224b73ddd608e60936def0e5f1e9de8809ef1afd8d
3
  size 87978
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8dc3611144be90ec0b759e6a2e899010f1087dc869d805915d2e7687cb160554
3
  size 87978
ppo-LunarLander-v2/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:08c8af57f5b771a90f5dfebe93c8b387b828ae0d88f0862b6e2691ed4bc6cc76
3
  size 43634
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9cd470121d6a6803d49e8f98d556cb68fd0e952ec246b3763beb8964bce5454d
3
  size 43634
replay.mp4 CHANGED
Binary files a/replay.mp4 and b/replay.mp4 differ
 
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 230.2089746, "std_reward": 17.25921101590976, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2024-04-05T21:10:19.568394"}
 
1
+ {"mean_reward": 229.01773050000003, "std_reward": 28.04352246627346, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2024-04-05T21:22:41.639231"}