Upload ppo-LunarLander-v2 model with longer training session
Browse files- README.md +1 -1
- config.json +1 -1
- ppo-LunarLander-v2.zip +2 -2
- ppo-LunarLander-v2/data +20 -20
- ppo-LunarLander-v2/policy.optimizer.pth +1 -1
- ppo-LunarLander-v2/policy.pth +1 -1
- replay.mp4 +2 -2
- results.json +1 -1
README.md
CHANGED
@@ -10,7 +10,7 @@ model-index:
|
|
10 |
results:
|
11 |
- metrics:
|
12 |
- type: mean_reward
|
13 |
-
value:
|
14 |
name: mean_reward
|
15 |
task:
|
16 |
type: reinforcement-learning
|
|
|
10 |
results:
|
11 |
- metrics:
|
12 |
- type: mean_reward
|
13 |
+
value: 263.17 +/- 20.32
|
14 |
name: mean_reward
|
15 |
task:
|
16 |
type: reinforcement-learning
|
config.json
CHANGED
@@ -1 +1 @@
|
|
1 |
-
{"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param sde_net_arch: Network architecture for extracting features\n when using gSDE. If None, the latent features from the policy will be used.\n Pass an empty list to use the states as features.\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7f7c6869fdc0>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f7c6869fe50>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f7c6869fee0>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f7c6869ff70>", "_build": "<function ActorCriticPolicy._build at 0x7f7c686a4040>", "forward": "<function ActorCriticPolicy.forward at 0x7f7c686a40d0>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f7c686a4160>", "_predict": "<function ActorCriticPolicy._predict at 0x7f7c686a41f0>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f7c686a4280>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f7c686a4310>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f7c686a43a0>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7f7c68863300>"}, "verbose": 1, "policy_kwargs": {}, "observation_space": {":type:": "<class 'gym.spaces.box.Box'>", ":serialized:": "gAWVnwEAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLCIWUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWIAAAAAAAAAAAAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/5RoCksIhZSMAUOUdJRSlIwEaGlnaJRoEiiWIAAAAAAAAAAAAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAf5RoCksIhZRoFXSUUpSMDWJvdW5kZWRfYmVsb3eUaBIolggAAAAAAAAAAAAAAAAAAACUaAeMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLCIWUaBV0lFKUjA1ib3VuZGVkX2Fib3ZllGgSKJYIAAAAAAAAAAAAAAAAAAAAlGghSwiFlGgVdJRSlIwKX25wX3JhbmRvbZROdWIu", "dtype": "float32", "_shape": [8], "low": "[-inf -inf -inf -inf -inf -inf -inf -inf]", "high": "[inf inf inf inf inf inf inf inf]", "bounded_below": "[False False False False False False False False]", "bounded_above": "[False False False False False False False False]", "_np_random": null}, "action_space": {":type:": "<class 'gym.spaces.discrete.Discrete'>", ":serialized:": "gAWVggAAAAAAAACME2d5bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpRLBIwGX3NoYXBllCmMBWR0eXBllIwFbnVtcHmUaAeTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYowKX25wX3JhbmRvbZROdWIu", "n": 4, "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 32, "num_timesteps": 524288, "_total_timesteps": 500000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1652398743.131799, "learning_rate": 0.0003, "tensorboard_log": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVAwMAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwNX2J1aWx0aW5fdHlwZZSTlIwKTGFtYmRhVHlwZZSFlFKUKGgCjAhDb2RlVHlwZZSFlFKUKEsBSwBLAEsBSwFLE0MEiABTAJROhZQpjAFflIWUjGkvaG9tZS9pbm5vbS1kdC9tYW1iYWZvcmdlL2VudnMvaGYtZHJsLWNsYXNzL2xpYi9weXRob24zLjkvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuAQwIAAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjGkvaG9tZS9pbm5vbS1kdC9tYW1iYWZvcmdlL2VudnMvaGYtZHJsLWNsYXNzL2xpYi9weXRob24zLjkvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUdU5OaACMEF9tYWtlX2VtcHR5X2NlbGyUk5QpUpSFlHSUUpSMHGNsb3VkcGlja2xlLmNsb3VkcGlja2xlX2Zhc3SUjBJfZnVuY3Rpb25fc2V0c3RhdGWUk5RoIH2UfZQoaBdoDowMX19xdWFsbmFtZV9flIwZY29uc3RhbnRfZm4uPGxvY2Fscz4uZnVuY5SMD19fYW5ub3RhdGlvbnNfX5R9lIwOX19rd2RlZmF1bHRzX1+UTowMX19kZWZhdWx0c19flE6MCl9fbW9kdWxlX1+UaBiMB19fZG9jX1+UTowLX19jbG9zdXJlX1+UaACMCl9tYWtlX2NlbGyUk5RHPzOpKjBVMmGFlFKUhZSMF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="}, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQQAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYABAAAAAAAACYwwb29zJo/a36svnmG074NnXC8xp+vvAAAAAAAAAAAM3AbP8w+gT+w17g+lib1vqnv9D4t6WE+AAAAAAAAAACq45w+wt8UPrbeqj7Erk6/HsA/PbyAoD0AAAAAAAAAAM1A7jtH27w/2t3GvJFeiL6cLdO84gdAvQAAAAAAAAAA5gIovSHvsD/yo92+kL1ivgMjGz3qIaI8AAAAAAAAAACaxIU9FZOnP0Jugj1er6q+rF7kPEuM1D0AAAAAAAAAADNC+D3rQIk/jVEFPtytAr/FI7E92vw3vQAAAAAAAAAA4nYRP7D5Vj8WixM/yeAbv9q06z14xxq9AAAAAAAAAAAmCwE+s9tfP3MTcT5nSCm/wcXjPdo7cb0AAAAAAAAAAGai2zvCDrY/5MstP/vCAT8BR/67UHgdvgAAAAAAAAAADaf7PWTsiT4ug4k9tFIUvxH7wD0m8re9AAAAAAAAAADzM1o+UKggP+691T0TjVu/iNfePv51hb0AAAAAAAAAAJPVCD757qY/Ps87PtsAwr7A6kc+VRr9vQAAAAAAAAAAumEqvuO2PT/qls++vUdsvwbbkr1dM929AAAAAAAAAAA9BvW+z1DqveKWTz1AtDS/s4R3vsuhRj4AAIA/AAAAANP3Q76ymn4/Aj16voMSO78UatW9kUOuPQAAAAAAAAAA5v8+vSXh3D4qr+c9RH9Zv7gULr5NxQk+AAAAAAAAAACaGS88wRy9P4qyBj7yirY+G7/CvMdxh7wAAAAAAAAAAJoKobwblrU/MgDIvtkQfjzZK1U8Wq/8PAAAAAAAAAAAZsgRvAu9wz/zLnG9CxAUPlE0aLzydQI9AAAAAAAAAAANCvM9h45FP27xaz3tuyu/CyQHPgXtK74AAAAAAAAAAJat6T73fpM/5ijmPh5FGr+BwYk+0TCDPQAAAAAAAAAAtn8Wv3QAnD0D0+u+8o9Cv7wt4L14N2k9AAAAAAAAAADBKyq/HAEwvlO+Hj1lbxc9OCPDvgiCwTsAAIA/AACAP4YfpT4B9QQ/Si+4Pp0jXb/3JYw9UpM7vQAAAAAAAAAAk3Y6vp8ovj8IhQG/Bqk2vlbaAr1yX4q9AAAAAAAAAABjeaI+ZvrbPhhwiz7cs0m/u6CFPnP7070AAAAAAAAAAKamAr52vlc/HKlCvsecEL80hiG8H8ilvQAAAAAAAAAAUzg0PnnykT9jsmA+/Ug+v3URaT1HRZC8AAAAAAAAAADNl+A8pDdtPxLV9DzLLM6+vO5Qvoa4kb4AAAAAAAAAAA0Eyj2tXY0/crSRPizSAL8ZXbm93QLWPAAAAAAAAAAAJiP3PR59sD9Fq3I+nz+6vuL2mz3WCwQ9AAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJmNJSJiIeUUpQoSwOMATyUTk5OSv////9K/////0sAdJRiSyBLCIaUjAFDlHSUUpQu"}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVkwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYgAAAAAAAAAAAAAAAAAAAAAAEAAAAAAAAAAAAAAAAAAAAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksghZSMAUOUdJRSlC4="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.04857599999999995, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVHRAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIXrneNlPBKcCUhpRSlIwBbJRLkowBdJRHQG5Trzf779B1fZQoaAZoCWgPQwiH+8itSYZUwJSGlFKUaBVLjGgWR0BuVG3trsSkdX2UKGgGaAloD0MIrJFdaRntVsCUhpRSlGgVS3hoFkdAblUd4FA3UHV9lChoBmgJaA9DCJon1xTI7O+/lIaUUpRoFUvNaBZHQG5VpkPMB6t1fZQoaAZoCWgPQwgErcCQ1T0pwJSGlFKUaBVLY2gWR0BuVfM4cWCVdX2UKGgGaAloD0MItwn3yrx7QsCUhpRSlGgVS65oFkdAblcCBf8dgnV9lChoBmgJaA9DCCiZnNoZbjTAlIaUUpRoFUtaaBZHQG5W/z8P4Eh1fZQoaAZoCWgPQwiJXHAGf35WwJSGlFKUaBVLtWgWR0BuWBFiKBNFdX2UKGgGaAloD0MI2iCTjJyfTsCUhpRSlGgVS3RoFkdAbli2Jiy6c3V9lChoBmgJaA9DCEM50a5CiinAlIaUUpRoFUtfaBZHQG5ZMPJ7sv91fZQoaAZoCWgPQwhQjgJEwYJAwJSGlFKUaBVLe2gWR0BuWXZqVQhwdX2UKGgGaAloD0MIU5W2uMYzOMCUhpRSlGgVS7FoFkdAblpPRArxzHV9lChoBmgJaA9DCMOgTKPJVRxAlIaUUpRoFUtaaBZHQG5amf5DZ151fZQoaAZoCWgPQwiVnBN7aCs1QJSGlFKUaBVLnGgWR0BuWuEPDpC8dX2UKGgGaAloD0MINLvurUgMTcCUhpRSlGgVS5doFkdAblszposZpHV9lChoBmgJaA9DCNaLoZxoxUPAlIaUUpRoFUuVaBZHQG5bmO2iL2p1fZQoaAZoCWgPQwi8eD9uv+wvwJSGlFKUaBVLf2gWR0BuW/cWTHKfdX2UKGgGaAloD0MI9vBloggoUsCUhpRSlGgVS1VoFkdAblwZXMhX83V9lChoBmgJaA9DCArWOJuOgknAlIaUUpRoFUtbaBZHQG5cO4oZydZ1fZQoaAZoCWgPQwj/If32dX1WwJSGlFKUaBVLa2gWR0BuXDUb1h9cdX2UKGgGaAloD0MInL8JhQgEQMCUhpRSlGgVS1FoFkdAbl1gZTAFgXV9lChoBmgJaA9DCPX0EfjDQ0LAlIaUUpRoFUtiaBZHQG5djEFW4mV1fZQoaAZoCWgPQwhWYp6VtO46wJSGlFKUaBVLkWgWR0BuXb0z0pVkdX2UKGgGaAloD0MIRdeFH5xhRcCUhpRSlGgVS1loFkdAbl4w7kn1F3V9lChoBmgJaA9DCLwIU5RLt0HAlIaUUpRoFUuFaBZHQG5eMbFS88N1fZQoaAZoCWgPQwiNmUS94DM+wJSGlFKUaBVLgWgWR0BuYA+fRNRFdX2UKGgGaAloD0MIbFuU2SDPWcCUhpRSlGgVS2JoFkdAbmBONYKYzHV9lChoBmgJaA9DCA1S8BRyh0LAlIaUUpRoFUuSaBZHQG5g9XT3IuJ1fZQoaAZoCWgPQwim0HmNXQpFwJSGlFKUaBVLeGgWR0BuYkVDa4+bdX2UKGgGaAloD0MI7QvohTu1Q8CUhpRSlGgVS0hoFkdAbmNCF9KEnXV9lChoBmgJaA9DCMpskElGLEPAlIaUUpRoFUtZaBZHQG5jdVea8Yh1fZQoaAZoCWgPQwiEgefewwUGwJSGlFKUaBVLaWgWR0BuY8WweNkwdX2UKGgGaAloD0MI0TsVcM9tR8CUhpRSlGgVS5xoFkdAbmQJ+DvmYHV9lChoBmgJaA9DCIgTmE7r0kfAlIaUUpRoFUtkaBZHQG5kOloDgZV1fZQoaAZoCWgPQwjNV8nH7ihHwJSGlFKUaBVLXGgWR0BuZFzIV/MGdX2UKGgGaAloD0MI/+ibNA2IS8CUhpRSlGgVS5BoFkdAbmVSZSeiBXV9lChoBmgJaA9DCIiE7/0NBj7AlIaUUpRoFUtcaBZHQG5mgkka/AV1fZQoaAZoCWgPQwgXtmYrL+tKwJSGlFKUaBVLZGgWR0BuZqaCtihGdX2UKGgGaAloD0MI/u2yX3e6RcCUhpRSlGgVS5xoFkdAbmcMRYigTXV9lChoBmgJaA9DCDwvFRvzUELAlIaUUpRoFUuNaBZHQG5nC4SYgJV1fZQoaAZoCWgPQwiu1/SgoIwnwJSGlFKUaBVLXmgWR0BuZ0OG0u14dX2UKGgGaAloD0MI3uUivhPJR8CUhpRSlGgVS1BoFkdAbmhffoA4oHV9lChoBmgJaA9DCFftmpDWjDvAlIaUUpRoFUtiaBZHQG5ogHVwxWV1fZQoaAZoCWgPQwjJyi+DMcI/wJSGlFKUaBVLoGgWR0BuaQbn5i3HdX2UKGgGaAloD0MIr7K2KR5rNECUhpRSlGgVS2doFkdAbmkgq3EycnV9lChoBmgJaA9DCA/QfTmzVSfAlIaUUpRoFUtiaBZHQG5p/TkQwsZ1fZQoaAZoCWgPQwg/OnXls1ZGwJSGlFKUaBVLaGgWR0BuapBkZrHmdX2UKGgGaAloD0MIwqT4+ISGS8CUhpRSlGgVS6BoFkdAbmsFHrhR7HV9lChoBmgJaA9DCCBFnbmHrE3AlIaUUpRoFUtUaBZHQG5rQemvW6N1fZQoaAZoCWgPQwhWEANd+6o5QJSGlFKUaBVLwmgWR0Bua3nEETxodX2UKGgGaAloD0MIu+1Cc512McCUhpRSlGgVS31oFkdAbmu8IzFdcHV9lChoBmgJaA9DCKispuuJLvG/lIaUUpRoFUuVaBZHQG5sK9oN/fB1fZQoaAZoCWgPQwh3S3LAruYSQJSGlFKUaBVLt2gWR0BubNgKF7D3dX2UKGgGaAloD0MIDHkEN1LcSsCUhpRSlGgVS5FoFkdAbm0eiBXjl3V9lChoBmgJaA9DCIUmiSXlskHAlIaUUpRoFUtRaBZHQG5uo2wV0tB1fZQoaAZoCWgPQwjiPnJr0ldHwJSGlFKUaBVLaWgWR0BubqWgOBlMdX2UKGgGaAloD0MInwJgPINGQsCUhpRSlGgVS4loFkdAbm+zTF2mpHV9lChoBmgJaA9DCHBbW3heai7AlIaUUpRoFUucaBZHQG5v0A93bEh1fZQoaAZoCWgPQwjqQNZTq8JQwJSGlFKUaBVLYGgWR0Bub86JZW7wdX2UKGgGaAloD0MI2gQYlj9vOcCUhpRSlGgVS2JoFkdAbnA7cO9WZXV9lChoBmgJaA9DCNy8cVKYBlDAlIaUUpRoFUuRaBZHQG5wPGyX2M91fZQoaAZoCWgPQwhdGr/wSk47wJSGlFKUaBVLf2gWR0BucHmcOLBLdX2UKGgGaAloD0MIC34bYrzhUcCUhpRSlGgVS0poFkdAbnDDn/1g6XV9lChoBmgJaA9DCLrzxHO2ICHAlIaUUpRoFUtmaBZHQG5w/P5YYBN1fZQoaAZoCWgPQwiMg0vHnFFLwJSGlFKUaBVLZ2gWR0Bucav3ai9JdX2UKGgGaAloD0MICK7yBMI6TMCUhpRSlGgVS3xoFkdAbnJAckt293V9lChoBmgJaA9DCE/LD1zlQ0XAlIaUUpRoFUtaaBZHQG5yihWYF7l1fZQoaAZoCWgPQwgQ5nYv9zFEwJSGlFKUaBVLXGgWR0Bucsv24/eMdX2UKGgGaAloD0MIroIY6Nq1RcCUhpRSlGgVS1loFkdAbnOuAZsKs3V9lChoBmgJaA9DCKYKRiV1ak3AlIaUUpRoFUuHaBZHQG51cL8aXKN1fZQoaAZoCWgPQwiJsUy/RFBNwJSGlFKUaBVLXWgWR0BudrqMWGh3dX2UKGgGaAloD0MIV8wIbw9wQcCUhpRSlGgVS2NoFkdAbne86FM7EHV9lChoBmgJaA9DCMYVF0fldlDAlIaUUpRoFUuJaBZHQG54OdwvQF91fZQoaAZoCWgPQwgqUmFsIUpCwJSGlFKUaBVLjmgWR0BueMwHqu8sdX2UKGgGaAloD0MIYHXkSGcOQMCUhpRSlGgVS2FoFkdAbnmUrTYukHV9lChoBmgJaA9DCIYCtoMRcU7AlIaUUpRoFUtOaBZHQG55vszEaVF1fZQoaAZoCWgPQwiJQPUPIlFCwJSGlFKUaBVLnmgWR0Buebz5GjKxdX2UKGgGaAloD0MIWRe30QB2IkCUhpRSlGgVS4poFkdAbnojMV1wHnV9lChoBmgJaA9DCAxYchWLyzjAlIaUUpRoFUtZaBZHQG56GXXyy2R1fZQoaAZoCWgPQwgDJnDrbh5BwJSGlFKUaBVLdWgWR0BuesNOM2m6dX2UKGgGaAloD0MIR+nSvyThUcCUhpRSlGgVS3doFkdAbnrGHYYixHV9lChoBmgJaA9DCDpXlBKCeTjAlIaUUpRoFUtvaBZHQG57LaufVZt1fZQoaAZoCWgPQwgdO6jEdUQkQJSGlFKUaBVLVGgWR0Bue7a/RE4OdX2UKGgGaAloD0MI2xZlNshkP8CUhpRSlGgVS5VoFkdAbnxcZccENnV9lChoBmgJaA9DCCb8Uj9vLkLAlIaUUpRoFUtjaBZHQG59EAo5PuZ1fZQoaAZoCWgPQwhM/bypSEE+wJSGlFKUaBVLk2gWR0BufQKUmlZYdX2UKGgGaAloD0MIVYSbjCo3SMCUhpRSlGgVS5RoFkdAbn25/b0voXV9lChoBmgJaA9DCDZYOEnzJzTAlIaUUpRoFUuiaBZHQG5994eLehx1fZQoaAZoCWgPQwhPdjOjH30swJSGlFKUaBVLY2gWR0Bufes5n13/dX2UKGgGaAloD0MIVU57Ss5pJsCUhpRSlGgVS3doFkdAbn4O/cnE23V9lChoBmgJaA9DCPkTlQ1rxkbAlIaUUpRoFUuMaBZHQG5+ROclPad1fZQoaAZoCWgPQwgU0ETY8LTyv5SGlFKUaBVLcWgWR0BufuruIAOsdX2UKGgGaAloD0MIu9bep6oWSMCUhpRSlGgVS2VoFkdAbn7qY7aIvnV9lChoBmgJaA9DCJeo3hrYLE/AlIaUUpRoFUt/aBZHQG6AMHbAUL51fZQoaAZoCWgPQwjUD+oihbovQJSGlFKUaBVLbmgWR0BugSBun/DMdX2UKGgGaAloD0MIjUephCfqScCUhpRSlGgVS5BoFkdAboJo6CDmKnV9lChoBmgJaA9DCMuFyr+WF0vAlIaUUpRoFUuCaBZHQG6Df5ckdFR1fZQoaAZoCWgPQwjrq6sCtYJGwJSGlFKUaBVLeWgWR0Bug5jjJdSmdX2UKGgGaAloD0MIyJQPQdU8RsCUhpRSlGgVS4hoFkdAboQCJXQtz3V9lChoBmgJaA9DCMr+eRowSEHAlIaUUpRoFUubaBZHQG6Ej4xk/bF1ZS4="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 80, "n_steps": 2048, "gamma": 0.999, "gae_lambda": 0.95, "ent_coef": 0.0, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 10, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWVAwMAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwNX2J1aWx0aW5fdHlwZZSTlIwKTGFtYmRhVHlwZZSFlFKUKGgCjAhDb2RlVHlwZZSFlFKUKEsBSwBLAEsBSwFLE0MEiABTAJROhZQpjAFflIWUjGkvaG9tZS9pbm5vbS1kdC9tYW1iYWZvcmdlL2VudnMvaGYtZHJsLWNsYXNzL2xpYi9weXRob24zLjkvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuAQwIAAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjGkvaG9tZS9pbm5vbS1kdC9tYW1iYWZvcmdlL2VudnMvaGYtZHJsLWNsYXNzL2xpYi9weXRob24zLjkvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUdU5OaACMEF9tYWtlX2VtcHR5X2NlbGyUk5QpUpSFlHSUUpSMHGNsb3VkcGlja2xlLmNsb3VkcGlja2xlX2Zhc3SUjBJfZnVuY3Rpb25fc2V0c3RhdGWUk5RoIH2UfZQoaBdoDowMX19xdWFsbmFtZV9flIwZY29uc3RhbnRfZm4uPGxvY2Fscz4uZnVuY5SMD19fYW5ub3RhdGlvbnNfX5R9lIwOX19rd2RlZmF1bHRzX1+UTowMX19kZWZhdWx0c19flE6MCl9fbW9kdWxlX1+UaBiMB19fZG9jX1+UTowLX19jbG9zdXJlX1+UaACMCl9tYWtlX2NlbGyUk5RHP7mZmZmZmZqFlFKUhZSMF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "system_info": {"OS": "Linux-5.15.0-27-generic-x86_64-with-glibc2.35 #28-Ubuntu SMP Thu Apr 14 04:55:28 UTC 2022", "Python": "3.9.12", "Stable-Baselines3": "1.5.0", "PyTorch": "1.11.0", "GPU Enabled": "True", "Numpy": "1.22.3", "Gym": "0.21.0"}}
|
|
|
1 |
+
{"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param sde_net_arch: Network architecture for extracting features\n when using gSDE. If None, the latent features from the policy will be used.\n Pass an empty list to use the states as features.\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7f2f489dedc0>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f2f489dee50>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f2f489deee0>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f2f489def70>", "_build": "<function ActorCriticPolicy._build at 0x7f2f489e2040>", "forward": "<function ActorCriticPolicy.forward at 0x7f2f489e20d0>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f2f489e2160>", "_predict": "<function ActorCriticPolicy._predict at 0x7f2f489e21f0>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f2f489e2280>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f2f489e2310>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f2f489e23a0>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7f2f48ba9e40>"}, "verbose": 1, "policy_kwargs": {}, "observation_space": {":type:": "<class 'gym.spaces.box.Box'>", ":serialized:": "gAWVnwEAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLCIWUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWIAAAAAAAAAAAAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/5RoCksIhZSMAUOUdJRSlIwEaGlnaJRoEiiWIAAAAAAAAAAAAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAf5RoCksIhZRoFXSUUpSMDWJvdW5kZWRfYmVsb3eUaBIolggAAAAAAAAAAAAAAAAAAACUaAeMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLCIWUaBV0lFKUjA1ib3VuZGVkX2Fib3ZllGgSKJYIAAAAAAAAAAAAAAAAAAAAlGghSwiFlGgVdJRSlIwKX25wX3JhbmRvbZROdWIu", "dtype": "float32", "_shape": [8], "low": "[-inf -inf -inf -inf -inf -inf -inf -inf]", "high": "[inf inf inf inf inf inf inf inf]", "bounded_below": "[False False False False False False False False]", "bounded_above": "[False False False False False False False False]", "_np_random": null}, "action_space": {":type:": "<class 'gym.spaces.discrete.Discrete'>", ":serialized:": "gAWVggAAAAAAAACME2d5bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpRLBIwGX3NoYXBllCmMBWR0eXBllIwFbnVtcHmUaAeTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYowKX25wX3JhbmRvbZROdWIu", "n": 4, "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 8, "num_timesteps": 507904, "_total_timesteps": 500000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1652399066.091435, "learning_rate": 0.0003, "tensorboard_log": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVAwMAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwNX2J1aWx0aW5fdHlwZZSTlIwKTGFtYmRhVHlwZZSFlFKUKGgCjAhDb2RlVHlwZZSFlFKUKEsBSwBLAEsBSwFLE0MEiABTAJROhZQpjAFflIWUjGkvaG9tZS9pbm5vbS1kdC9tYW1iYWZvcmdlL2VudnMvaGYtZHJsLWNsYXNzL2xpYi9weXRob24zLjkvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuAQwIAAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjGkvaG9tZS9pbm5vbS1kdC9tYW1iYWZvcmdlL2VudnMvaGYtZHJsLWNsYXNzL2xpYi9weXRob24zLjkvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUdU5OaACMEF9tYWtlX2VtcHR5X2NlbGyUk5QpUpSFlHSUUpSMHGNsb3VkcGlja2xlLmNsb3VkcGlja2xlX2Zhc3SUjBJfZnVuY3Rpb25fc2V0c3RhdGWUk5RoIH2UfZQoaBdoDowMX19xdWFsbmFtZV9flIwZY29uc3RhbnRfZm4uPGxvY2Fscz4uZnVuY5SMD19fYW5ub3RhdGlvbnNfX5R9lIwOX19rd2RlZmF1bHRzX1+UTowMX19kZWZhdWx0c19flE6MCl9fbW9kdWxlX1+UaBiMB19fZG9jX1+UTowLX19jbG9zdXJlX1+UaACMCl9tYWtlX2NlbGyUk5RHPzOpKjBVMmGFlFKUhZSMF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="}, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQEAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAQAAAAAAAMY0L749tQ67ojbTO65IpjiQHj48t2ePuQAAgD8AAIA/WogBvvZgXDsvgrg8Y79Guy0vBL2jnzI8AACAPwAAgD8AziQ8uIaGucP3QrqBHIS1Qee3uQjgYjkAAIA/AACAPzPyMr3hqJC6sJJau8rMI7jzTqE6EVCTNwAAgD8AAIA/QH0EvlJQgbnERQ263FLVNtlODby2TiE5AACAPwAAgD+a+bm7e7qCuj4O8LpELgE1QeFhu1rICDoAAIA/AACAP+YEVL1IzYm6lq1hOm/4mrSXije7yAWAuQAAgD8AAIA/gEjBvYWz5bmS7S086vyFNmy6w7onf4Q1AACAPwAAgD+UjAVudW1weZSMBWR0eXBllJOUjAJmNJSJiIeUUpQoSwOMATyUTk5OSv////9K/////0sAdJRiSwhLCIaUjAFDlHSUUpQu"}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVewAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYIAAAAAAAAAAAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZSMAUOUdJRSlC4="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.015808000000000044, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVeBAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIBMqmXOGnTkCUhpRSlIwBbJRN6AOMAXSUR0BzyRUfgaWHdX2UKGgGaAloD0MIw9Zs5SVjRkCUhpRSlGgVS85oFkdAc9SvDxb0OHV9lChoBmgJaA9DCHkfR3PkfWFAlIaUUpRoFU3oA2gWR0Bz1f3i704BdX2UKGgGaAloD0MINxsrMU+7Y0CUhpRSlGgVTegDaBZHQHPeitA9mpV1fZQoaAZoCWgPQwjnNuFemW9EQJSGlFKUaBVLxWgWR0Bz43kKeCkHdX2UKGgGaAloD0MIBRcrajCMXUCUhpRSlGgVTegDaBZHQHPx0qtozvZ1fZQoaAZoCWgPQwjGa17VWWE5QJSGlFKUaBVN6ANoFkdAc/enkkrwv3V9lChoBmgJaA9DCJfGL7yS5N+/lIaUUpRoFUvDaBZHQHQGACr92ox1fZQoaAZoCWgPQwjX+412XGBmQJSGlFKUaBVN6ANoFkdAdAeS8J2MbXV9lChoBmgJaA9DCEJcOXtn8WBAlIaUUpRoFU3oA2gWR0B0DIw22oegdX2UKGgGaAloD0MIEhJpG39MXECUhpRSlGgVTegDaBZHQHQMsTzundh1fZQoaAZoCWgPQwjwNJnxNhRhQJSGlFKUaBVN6ANoFkdAdBh+10DEFXV9lChoBmgJaA9DCFhWmpSC1GBAlIaUUpRoFU3oA2gWR0B0IHMyJsO5dX2UKGgGaAloD0MImbnA5TEAY0CUhpRSlGgVTegDaBZHQHQk55mh/RV1fZQoaAZoCWgPQwiE8dO4tytjQJSGlFKUaBVN6ANoFkdAdJY0g8r7O3V9lChoBmgJaA9DCGr5gas8OV5AlIaUUpRoFU3oA2gWR0B0qmasp5NXdX2UKGgGaAloD0MI/DbEeM1rVUCUhpRSlGgVTegDaBZHQHSsELlV94N1fZQoaAZoCWgPQwjid9MtO0ZiQJSGlFKUaBVN6ANoFkdAdLF6lchTwXV9lChoBmgJaA9DCBy1wvQ9lmVAlIaUUpRoFU3oA2gWR0B0saKtPpIMdX2UKGgGaAloD0MIE0n0MopOYkCUhpRSlGgVTegDaBZHQHS/14gRsdl1fZQoaAZoCWgPQwj2Jobk5HtgQJSGlFKUaBVN6ANoFkdAdMnLux8lX3V9lChoBmgJaA9DCDVG66hq6V5AlIaUUpRoFU3oA2gWR0B0zwsJ6Y3OdX2UKGgGaAloD0MIZVWEm4yqNkCUhpRSlGgVS7NoFkdAdNUtozvZy3V9lChoBmgJaA9DCEIFhxfEQGBAlIaUUpRoFU3oA2gWR0B03Apqh11XdX2UKGgGaAloD0MIforjwKvnTUCUhpRSlGgVS8loFkdAdOqlaKUFCHV9lChoBmgJaA9DCMNF7unqj2VAlIaUUpRoFU3oA2gWR0B08F4dIXj3dX2UKGgGaAloD0MIIO1/gLVYY0CUhpRSlGgVTegDaBZHQHTx9eUpuuR1fZQoaAZoCWgPQwj2B8pt+39kQJSGlFKUaBVN6ANoFkdAdPcTr3TNMXV9lChoBmgJaA9DCDOJesGnzl9AlIaUUpRoFU3oA2gWR0B09zlOoHcDdX2UKGgGaAloD0MIMjogCfu2NECUhpRSlGgVS91oFkdAdP6UzKs+3nV9lChoBmgJaA9DCMLB3sSQ0F5AlIaUUpRoFU3oA2gWR0B1BO+VTrE+dX2UKGgGaAloD0MIIJbNHJIiS0CUhpRSlGgVS9toFkdAdQT0fYBeX3V9lChoBmgJaA9DCLd546QwO15AlIaUUpRoFU3oA2gWR0B1EsGPgeijdX2UKGgGaAloD0MI2jo42BtMYECUhpRSlGgVTegDaBZHQHUZpZSvTw51fZQoaAZoCWgPQwg7jh8qjZpiQJSGlFKUaBVN6ANoFkdAdZT5XEIgNnV9lChoBmgJaA9DCENxx5t8y2NAlIaUUpRoFU3oA2gWR0B1nJYJVsDXdX2UKGgGaAloD0MIgXwJFZxfYECUhpRSlGgVTegDaBZHQHWiWOMl1KZ1fZQoaAZoCWgPQwigOIB+35xcQJSGlFKUaBVN6ANoFkdAdasbWEsasXV9lChoBmgJaA9DCBjshm0LDWRAlIaUUpRoFU3oA2gWR0B1saews5GSdX2UKGgGaAloD0MIUfpCyPnyZECUhpRSlGgVTegDaBZHQHWxrnoxHoZ1fZQoaAZoCWgPQwhpOjsZHBxVQJSGlFKUaBVN6ANoFkdAdcEZqmCROnV9lChoBmgJaA9DCNFZZhGKFGNAlIaUUpRoFU3oA2gWR0B1yZBPbfxddX2UKGgGaAloD0MIOxqH+t1wYECUhpRSlGgVTegDaBZHQHXjD0th/iJ1fZQoaAZoCWgPQwhi2jf3V85ZQJSGlFKUaBVN6ANoFkdAdep8Z1mrbXV9lChoBmgJaA9DCEPmyqDaw1xAlIaUUpRoFU3oA2gWR0B18BOVPepGdX2UKGgGaAloD0MIfentz0WzYUCUhpRSlGgVTegDaBZHQHX4/lyR0U51fZQoaAZoCWgPQwhG66hqApBlQJSGlFKUaBVN6ANoFkdAdf92AG0NSnV9lChoBmgJaA9DCAZ/v5gtJWJAlIaUUpRoFU3oA2gWR0B1/34BV+7UdX2UKGgGaAloD0MIFTduMT9vXUCUhpRSlGgVTegDaBZHQHYNuPV/c351fZQoaAZoCWgPQwjpK0gzFpVVQJSGlFKUaBVN6ANoFkdAdhaRLbpNbnV9lChoBmgJaA9DCC7GwDqO/2FAlIaUUpRoFU3oA2gWR0B2m8BaLXMAdX2UKGgGaAloD0MIsHWpEXr6Z0CUhpRSlGgVTegDaBZHQHakTzqbBoF1fZQoaAZoCWgPQwgCDMuf77diQJSGlFKUaBVN6ANoFkdAdqoC17Y023V9lChoBmgJaA9DCHQLXYlAxWRAlIaUUpRoFU3oA2gWR0B2sw6jnFHbdX2UKGgGaAloD0MITWVR2MXHY0CUhpRSlGgVTegDaBZHQHa5WsFMZgp1fZQoaAZoCWgPQwhXBtUGJytfQJSGlFKUaBVN6ANoFkdAdrljGDL8rXV9lChoBmgJaA9DCOtU+Z6Re19AlIaUUpRoFU3oA2gWR0B2x2yGBWgfdX2UKGgGaAloD0MIqU4Hsp4xUUCUhpRSlGgVTegDaBZHQHbOxRAKOT91fZQoaAZoCWgPQwgY7lwYaZ1gQJSGlFKUaBVN6ANoFkdAduaBBAv+O3V9lChoBmgJaA9DCFex+E1hql9AlIaUUpRoFU3oA2gWR0B27kbedkJ8dX2UKGgGaAloD0MI8PlhhPAtX0CUhpRSlGgVTegDaBZHQHb0Jxm03Ox1fZQoaAZoCWgPQwhXs874vpFfQJSGlFKUaBVN6ANoFkdAdv3S3b212XV9lChoBmgJaA9DCOtx32qdXF1AlIaUUpRoFU3oA2gWR0B3BOCiAUcodX2UKGgGaAloD0MIj/0sliKYY0CUhpRSlGgVTegDaBZHQHcE6bKA8Sx1fZQoaAZoCWgPQwiXjjnPWDdgQJSGlFKUaBVN6ANoFkdAdxTH7gsK9nV9lChoBmgJaA9DCCnqzD0kW1tAlIaUUpRoFU3oA2gWR0B3HBhc7hegdX2UKGgGaAloD0MIjSYXY2BqVUCUhpRSlGgVTegDaBZHQHeU4uwosqd1fZQoaAZoCWgPQwh5IojzcFZfQJSGlFKUaBVN6ANoFkdAd5xPy08eS3V9lChoBmgJaA9DCOnX1k//ulpAlIaUUpRoFU3oA2gWR0B3obI4lyBDdX2UKGgGaAloD0MI3eukvizrX0CUhpRSlGgVTegDaBZHQHeq3maH9FZ1fZQoaAZoCWgPQwh8KTxodjBhQJSGlFKUaBVN6ANoFkdAd7FOIInjQ3V9lChoBmgJaA9DCK6AQj19M2NAlIaUUpRoFU3oA2gWR0B3sVRCQcPwdX2UKGgGaAloD0MIWRe30QARX0CUhpRSlGgVTegDaBZHQHfAeFlCkXV1fZQoaAZoCWgPQwiLUGwFTbhfQJSGlFKUaBVN6ANoFkdAd8iGh24d63V9lChoBmgJaA9DCKZfIt46N2JAlIaUUpRoFU3oA2gWR0B34Zw++ueSdX2UKGgGaAloD0MINszQeKKMYECUhpRSlGgVTegDaBZHQHfph3FDOTt1fZQoaAZoCWgPQwihgy7h0KpbQJSGlFKUaBVN6ANoFkdAd+9uGbkOqnV9lChoBmgJaA9DCKkSZW+pemBAlIaUUpRoFU3oA2gWR0B3+Tu+h4+sdX2UKGgGaAloD0MIQgqeQq55ZUCUhpRSlGgVTegDaBZHQHgALpJPIn11fZQoaAZoCWgPQwjytWeWBBpRQJSGlFKUaBVN6ANoFkdAeAA2OhkAgnV9lChoBmgJaA9DCJdxUwPN2z1AlIaUUpRoFUuuaBZHQHgMhoduHet1fZQoaAZoCWgPQwjDZoALMnVgQJSGlFKUaBVN6ANoFkdAeA+tHQQcxXV9lChoBmgJaA9DCHGuYYbGsWBAlIaUUpRoFU3oA2gWR0B4FsKlYU35dX2UKGgGaAloD0MIr5Y7M8GmYECUhpRSlGgVTegDaBZHQHiQ++23KCB1fZQoaAZoCWgPQwhyb37DRB5iQJSGlFKUaBVN6ANoFkdAeJeTI/7iynV9lChoBmgJaA9DCLxa7swE4FpAlIaUUpRoFU3oA2gWR0B4nLC1qnFYdX2UKGgGaAloD0MIAOMZNPTWY0CUhpRSlGgVTegDaBZHQHilOIMz/Id1fZQoaAZoCWgPQwjf+xu0Vx1fQJSGlFKUaBVN6ANoFkdAeKwkBS1ma3V9lChoBmgJaA9DCKsjRzqDzWJAlIaUUpRoFU3oA2gWR0B4uamelKsddX2UKGgGaAloD0MIj/rrFRbVXECUhpRSlGgVTegDaBZHQHi8kGJN0vJ1fZQoaAZoCWgPQwilaybfbLNmQJSGlFKUaBVN6ANoFkdAeMORTS9dvHV9lChoBmgJaA9DCHKo34WtvWRAlIaUUpRoFU3oA2gWR0B42dp1zQu3dX2UKGgGaAloD0MIdAzIXu/uYkCUhpRSlGgVTegDaBZHQHjguvIOpbV1fZQoaAZoCWgPQwi1bRgFwWdgQJSGlFKUaBVN6ANoFkdAeOUkn1Fpf3V9lChoBmgJaA9DCMxG5/yU6GFAlIaUUpRoFU3oA2gWR0B469BAv+OwdX2UKGgGaAloD0MI2ERmLnDPTUCUhpRSlGgVS9BoFkdAePBLFXJYDHV9lChoBmgJaA9DCMvydRl+32RAlIaUUpRoFU3oA2gWR0B48QhJRO1wdX2UKGgGaAloD0MI5geu8gRCYkCUhpRSlGgVTegDaBZHQHj7K1b7j1h1fZQoaAZoCWgPQwhExM2pZN1dQJSGlFKUaBVN6ANoFkdAeP3RQJokA3V9lChoBmgJaA9DCHqp2JhX0GRAlIaUUpRoFU3oA2gWR0B5BG9Gqgh9dWUu"}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 310, "n_steps": 2048, "gamma": 0.999, "gae_lambda": 0.95, "ent_coef": 0.0, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 10, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWVAwMAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwNX2J1aWx0aW5fdHlwZZSTlIwKTGFtYmRhVHlwZZSFlFKUKGgCjAhDb2RlVHlwZZSFlFKUKEsBSwBLAEsBSwFLE0MEiABTAJROhZQpjAFflIWUjGkvaG9tZS9pbm5vbS1kdC9tYW1iYWZvcmdlL2VudnMvaGYtZHJsLWNsYXNzL2xpYi9weXRob24zLjkvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuAQwIAAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjGkvaG9tZS9pbm5vbS1kdC9tYW1iYWZvcmdlL2VudnMvaGYtZHJsLWNsYXNzL2xpYi9weXRob24zLjkvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUdU5OaACMEF9tYWtlX2VtcHR5X2NlbGyUk5QpUpSFlHSUUpSMHGNsb3VkcGlja2xlLmNsb3VkcGlja2xlX2Zhc3SUjBJfZnVuY3Rpb25fc2V0c3RhdGWUk5RoIH2UfZQoaBdoDowMX19xdWFsbmFtZV9flIwZY29uc3RhbnRfZm4uPGxvY2Fscz4uZnVuY5SMD19fYW5ub3RhdGlvbnNfX5R9lIwOX19rd2RlZmF1bHRzX1+UTowMX19kZWZhdWx0c19flE6MCl9fbW9kdWxlX1+UaBiMB19fZG9jX1+UTowLX19jbG9zdXJlX1+UaACMCl9tYWtlX2NlbGyUk5RHP7mZmZmZmZqFlFKUhZSMF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "system_info": {"OS": "Linux-5.15.0-27-generic-x86_64-with-glibc2.35 #28-Ubuntu SMP Thu Apr 14 04:55:28 UTC 2022", "Python": "3.9.12", "Stable-Baselines3": "1.5.0", "PyTorch": "1.11.0", "GPU Enabled": "True", "Numpy": "1.22.3", "Gym": "0.21.0"}}
|
ppo-LunarLander-v2.zip
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:82cbd49dd8d83c0350649997af77d06c028f83be0dbca8ba91a1c15caa146d53
|
3 |
+
size 143932
|
ppo-LunarLander-v2/data
CHANGED
@@ -4,19 +4,19 @@
|
|
4 |
":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
|
5 |
"__module__": "stable_baselines3.common.policies",
|
6 |
"__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param sde_net_arch: Network architecture for extracting features\n when using gSDE. If None, the latent features from the policy will be used.\n Pass an empty list to use the states as features.\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
|
7 |
-
"__init__": "<function ActorCriticPolicy.__init__ at
|
8 |
-
"_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at
|
9 |
-
"reset_noise": "<function ActorCriticPolicy.reset_noise at
|
10 |
-
"_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at
|
11 |
-
"_build": "<function ActorCriticPolicy._build at
|
12 |
-
"forward": "<function ActorCriticPolicy.forward at
|
13 |
-
"_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at
|
14 |
-
"_predict": "<function ActorCriticPolicy._predict at
|
15 |
-
"evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at
|
16 |
-
"get_distribution": "<function ActorCriticPolicy.get_distribution at
|
17 |
-
"predict_values": "<function ActorCriticPolicy.predict_values at
|
18 |
"__abstractmethods__": "frozenset()",
|
19 |
-
"_abc_impl": "<_abc._abc_data object at
|
20 |
},
|
21 |
"verbose": 1,
|
22 |
"policy_kwargs": {},
|
@@ -41,13 +41,13 @@
|
|
41 |
"dtype": "int64",
|
42 |
"_np_random": null
|
43 |
},
|
44 |
-
"n_envs":
|
45 |
-
"num_timesteps":
|
46 |
"_total_timesteps": 500000,
|
47 |
"_num_timesteps_at_start": 0,
|
48 |
"seed": null,
|
49 |
"action_noise": null,
|
50 |
-
"start_time":
|
51 |
"learning_rate": 0.0003,
|
52 |
"tensorboard_log": null,
|
53 |
"lr_schedule": {
|
@@ -56,26 +56,26 @@
|
|
56 |
},
|
57 |
"_last_obs": {
|
58 |
":type:": "<class 'numpy.ndarray'>",
|
59 |
-
":serialized:": "
|
60 |
},
|
61 |
"_last_episode_starts": {
|
62 |
":type:": "<class 'numpy.ndarray'>",
|
63 |
-
":serialized:": "
|
64 |
},
|
65 |
"_last_original_obs": null,
|
66 |
"_episode_num": 0,
|
67 |
"use_sde": false,
|
68 |
"sde_sample_freq": -1,
|
69 |
-
"_current_progress_remaining": -0.
|
70 |
"ep_info_buffer": {
|
71 |
":type:": "<class 'collections.deque'>",
|
72 |
-
":serialized:": "
|
73 |
},
|
74 |
"ep_success_buffer": {
|
75 |
":type:": "<class 'collections.deque'>",
|
76 |
":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
|
77 |
},
|
78 |
-
"_n_updates":
|
79 |
"n_steps": 2048,
|
80 |
"gamma": 0.999,
|
81 |
"gae_lambda": 0.95,
|
|
|
4 |
":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
|
5 |
"__module__": "stable_baselines3.common.policies",
|
6 |
"__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param sde_net_arch: Network architecture for extracting features\n when using gSDE. If None, the latent features from the policy will be used.\n Pass an empty list to use the states as features.\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
|
7 |
+
"__init__": "<function ActorCriticPolicy.__init__ at 0x7f2f489dedc0>",
|
8 |
+
"_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f2f489dee50>",
|
9 |
+
"reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f2f489deee0>",
|
10 |
+
"_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f2f489def70>",
|
11 |
+
"_build": "<function ActorCriticPolicy._build at 0x7f2f489e2040>",
|
12 |
+
"forward": "<function ActorCriticPolicy.forward at 0x7f2f489e20d0>",
|
13 |
+
"_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f2f489e2160>",
|
14 |
+
"_predict": "<function ActorCriticPolicy._predict at 0x7f2f489e21f0>",
|
15 |
+
"evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f2f489e2280>",
|
16 |
+
"get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f2f489e2310>",
|
17 |
+
"predict_values": "<function ActorCriticPolicy.predict_values at 0x7f2f489e23a0>",
|
18 |
"__abstractmethods__": "frozenset()",
|
19 |
+
"_abc_impl": "<_abc._abc_data object at 0x7f2f48ba9e40>"
|
20 |
},
|
21 |
"verbose": 1,
|
22 |
"policy_kwargs": {},
|
|
|
41 |
"dtype": "int64",
|
42 |
"_np_random": null
|
43 |
},
|
44 |
+
"n_envs": 8,
|
45 |
+
"num_timesteps": 507904,
|
46 |
"_total_timesteps": 500000,
|
47 |
"_num_timesteps_at_start": 0,
|
48 |
"seed": null,
|
49 |
"action_noise": null,
|
50 |
+
"start_time": 1652399066.091435,
|
51 |
"learning_rate": 0.0003,
|
52 |
"tensorboard_log": null,
|
53 |
"lr_schedule": {
|
|
|
56 |
},
|
57 |
"_last_obs": {
|
58 |
":type:": "<class 'numpy.ndarray'>",
|
59 |
+
":serialized:": "gAWVdQEAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAQAAAAAAAMY0L749tQ67ojbTO65IpjiQHj48t2ePuQAAgD8AAIA/WogBvvZgXDsvgrg8Y79Guy0vBL2jnzI8AACAPwAAgD8AziQ8uIaGucP3QrqBHIS1Qee3uQjgYjkAAIA/AACAPzPyMr3hqJC6sJJau8rMI7jzTqE6EVCTNwAAgD8AAIA/QH0EvlJQgbnERQ263FLVNtlODby2TiE5AACAPwAAgD+a+bm7e7qCuj4O8LpELgE1QeFhu1rICDoAAIA/AACAP+YEVL1IzYm6lq1hOm/4mrSXije7yAWAuQAAgD8AAIA/gEjBvYWz5bmS7S086vyFNmy6w7onf4Q1AACAPwAAgD+UjAVudW1weZSMBWR0eXBllJOUjAJmNJSJiIeUUpQoSwOMATyUTk5OSv////9K/////0sAdJRiSwhLCIaUjAFDlHSUUpQu"
|
60 |
},
|
61 |
"_last_episode_starts": {
|
62 |
":type:": "<class 'numpy.ndarray'>",
|
63 |
+
":serialized:": "gAWVewAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYIAAAAAAAAAAAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZSMAUOUdJRSlC4="
|
64 |
},
|
65 |
"_last_original_obs": null,
|
66 |
"_episode_num": 0,
|
67 |
"use_sde": false,
|
68 |
"sde_sample_freq": -1,
|
69 |
+
"_current_progress_remaining": -0.015808000000000044,
|
70 |
"ep_info_buffer": {
|
71 |
":type:": "<class 'collections.deque'>",
|
72 |
+
":serialized:": "gAWVeBAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIBMqmXOGnTkCUhpRSlIwBbJRN6AOMAXSUR0BzyRUfgaWHdX2UKGgGaAloD0MIw9Zs5SVjRkCUhpRSlGgVS85oFkdAc9SvDxb0OHV9lChoBmgJaA9DCHkfR3PkfWFAlIaUUpRoFU3oA2gWR0Bz1f3i704BdX2UKGgGaAloD0MINxsrMU+7Y0CUhpRSlGgVTegDaBZHQHPeitA9mpV1fZQoaAZoCWgPQwjnNuFemW9EQJSGlFKUaBVLxWgWR0Bz43kKeCkHdX2UKGgGaAloD0MIBRcrajCMXUCUhpRSlGgVTegDaBZHQHPx0qtozvZ1fZQoaAZoCWgPQwjGa17VWWE5QJSGlFKUaBVN6ANoFkdAc/enkkrwv3V9lChoBmgJaA9DCJfGL7yS5N+/lIaUUpRoFUvDaBZHQHQGACr92ox1fZQoaAZoCWgPQwjX+412XGBmQJSGlFKUaBVN6ANoFkdAdAeS8J2MbXV9lChoBmgJaA9DCEJcOXtn8WBAlIaUUpRoFU3oA2gWR0B0DIw22oegdX2UKGgGaAloD0MIEhJpG39MXECUhpRSlGgVTegDaBZHQHQMsTzundh1fZQoaAZoCWgPQwjwNJnxNhRhQJSGlFKUaBVN6ANoFkdAdBh+10DEFXV9lChoBmgJaA9DCFhWmpSC1GBAlIaUUpRoFU3oA2gWR0B0IHMyJsO5dX2UKGgGaAloD0MImbnA5TEAY0CUhpRSlGgVTegDaBZHQHQk55mh/RV1fZQoaAZoCWgPQwiE8dO4tytjQJSGlFKUaBVN6ANoFkdAdJY0g8r7O3V9lChoBmgJaA9DCGr5gas8OV5AlIaUUpRoFU3oA2gWR0B0qmasp5NXdX2UKGgGaAloD0MI/DbEeM1rVUCUhpRSlGgVTegDaBZHQHSsELlV94N1fZQoaAZoCWgPQwjid9MtO0ZiQJSGlFKUaBVN6ANoFkdAdLF6lchTwXV9lChoBmgJaA9DCBy1wvQ9lmVAlIaUUpRoFU3oA2gWR0B0saKtPpIMdX2UKGgGaAloD0MIE0n0MopOYkCUhpRSlGgVTegDaBZHQHS/14gRsdl1fZQoaAZoCWgPQwj2Jobk5HtgQJSGlFKUaBVN6ANoFkdAdMnLux8lX3V9lChoBmgJaA9DCDVG66hq6V5AlIaUUpRoFU3oA2gWR0B0zwsJ6Y3OdX2UKGgGaAloD0MIZVWEm4yqNkCUhpRSlGgVS7NoFkdAdNUtozvZy3V9lChoBmgJaA9DCEIFhxfEQGBAlIaUUpRoFU3oA2gWR0B03Apqh11XdX2UKGgGaAloD0MIforjwKvnTUCUhpRSlGgVS8loFkdAdOqlaKUFCHV9lChoBmgJaA9DCMNF7unqj2VAlIaUUpRoFU3oA2gWR0B08F4dIXj3dX2UKGgGaAloD0MIIO1/gLVYY0CUhpRSlGgVTegDaBZHQHTx9eUpuuR1fZQoaAZoCWgPQwj2B8pt+39kQJSGlFKUaBVN6ANoFkdAdPcTr3TNMXV9lChoBmgJaA9DCDOJesGnzl9AlIaUUpRoFU3oA2gWR0B09zlOoHcDdX2UKGgGaAloD0MIMjogCfu2NECUhpRSlGgVS91oFkdAdP6UzKs+3nV9lChoBmgJaA9DCMLB3sSQ0F5AlIaUUpRoFU3oA2gWR0B1BO+VTrE+dX2UKGgGaAloD0MIIJbNHJIiS0CUhpRSlGgVS9toFkdAdQT0fYBeX3V9lChoBmgJaA9DCLd546QwO15AlIaUUpRoFU3oA2gWR0B1EsGPgeijdX2UKGgGaAloD0MI2jo42BtMYECUhpRSlGgVTegDaBZHQHUZpZSvTw51fZQoaAZoCWgPQwg7jh8qjZpiQJSGlFKUaBVN6ANoFkdAdZT5XEIgNnV9lChoBmgJaA9DCENxx5t8y2NAlIaUUpRoFU3oA2gWR0B1nJYJVsDXdX2UKGgGaAloD0MIgXwJFZxfYECUhpRSlGgVTegDaBZHQHWiWOMl1KZ1fZQoaAZoCWgPQwigOIB+35xcQJSGlFKUaBVN6ANoFkdAdasbWEsasXV9lChoBmgJaA9DCBjshm0LDWRAlIaUUpRoFU3oA2gWR0B1saews5GSdX2UKGgGaAloD0MIUfpCyPnyZECUhpRSlGgVTegDaBZHQHWxrnoxHoZ1fZQoaAZoCWgPQwhpOjsZHBxVQJSGlFKUaBVN6ANoFkdAdcEZqmCROnV9lChoBmgJaA9DCNFZZhGKFGNAlIaUUpRoFU3oA2gWR0B1yZBPbfxddX2UKGgGaAloD0MIOxqH+t1wYECUhpRSlGgVTegDaBZHQHXjD0th/iJ1fZQoaAZoCWgPQwhi2jf3V85ZQJSGlFKUaBVN6ANoFkdAdep8Z1mrbXV9lChoBmgJaA9DCEPmyqDaw1xAlIaUUpRoFU3oA2gWR0B18BOVPepGdX2UKGgGaAloD0MIfentz0WzYUCUhpRSlGgVTegDaBZHQHX4/lyR0U51fZQoaAZoCWgPQwhG66hqApBlQJSGlFKUaBVN6ANoFkdAdf92AG0NSnV9lChoBmgJaA9DCAZ/v5gtJWJAlIaUUpRoFU3oA2gWR0B1/34BV+7UdX2UKGgGaAloD0MIFTduMT9vXUCUhpRSlGgVTegDaBZHQHYNuPV/c351fZQoaAZoCWgPQwjpK0gzFpVVQJSGlFKUaBVN6ANoFkdAdhaRLbpNbnV9lChoBmgJaA9DCC7GwDqO/2FAlIaUUpRoFU3oA2gWR0B2m8BaLXMAdX2UKGgGaAloD0MIsHWpEXr6Z0CUhpRSlGgVTegDaBZHQHakTzqbBoF1fZQoaAZoCWgPQwgCDMuf77diQJSGlFKUaBVN6ANoFkdAdqoC17Y023V9lChoBmgJaA9DCHQLXYlAxWRAlIaUUpRoFU3oA2gWR0B2sw6jnFHbdX2UKGgGaAloD0MITWVR2MXHY0CUhpRSlGgVTegDaBZHQHa5WsFMZgp1fZQoaAZoCWgPQwhXBtUGJytfQJSGlFKUaBVN6ANoFkdAdrljGDL8rXV9lChoBmgJaA9DCOtU+Z6Re19AlIaUUpRoFU3oA2gWR0B2x2yGBWgfdX2UKGgGaAloD0MIqU4Hsp4xUUCUhpRSlGgVTegDaBZHQHbOxRAKOT91fZQoaAZoCWgPQwgY7lwYaZ1gQJSGlFKUaBVN6ANoFkdAduaBBAv+O3V9lChoBmgJaA9DCFex+E1hql9AlIaUUpRoFU3oA2gWR0B27kbedkJ8dX2UKGgGaAloD0MI8PlhhPAtX0CUhpRSlGgVTegDaBZHQHb0Jxm03Ox1fZQoaAZoCWgPQwhXs874vpFfQJSGlFKUaBVN6ANoFkdAdv3S3b212XV9lChoBmgJaA9DCOtx32qdXF1AlIaUUpRoFU3oA2gWR0B3BOCiAUcodX2UKGgGaAloD0MIj/0sliKYY0CUhpRSlGgVTegDaBZHQHcE6bKA8Sx1fZQoaAZoCWgPQwiXjjnPWDdgQJSGlFKUaBVN6ANoFkdAdxTH7gsK9nV9lChoBmgJaA9DCCnqzD0kW1tAlIaUUpRoFU3oA2gWR0B3HBhc7hegdX2UKGgGaAloD0MIjSYXY2BqVUCUhpRSlGgVTegDaBZHQHeU4uwosqd1fZQoaAZoCWgPQwh5IojzcFZfQJSGlFKUaBVN6ANoFkdAd5xPy08eS3V9lChoBmgJaA9DCOnX1k//ulpAlIaUUpRoFU3oA2gWR0B3obI4lyBDdX2UKGgGaAloD0MI3eukvizrX0CUhpRSlGgVTegDaBZHQHeq3maH9FZ1fZQoaAZoCWgPQwh8KTxodjBhQJSGlFKUaBVN6ANoFkdAd7FOIInjQ3V9lChoBmgJaA9DCK6AQj19M2NAlIaUUpRoFU3oA2gWR0B3sVRCQcPwdX2UKGgGaAloD0MIWRe30QARX0CUhpRSlGgVTegDaBZHQHfAeFlCkXV1fZQoaAZoCWgPQwiLUGwFTbhfQJSGlFKUaBVN6ANoFkdAd8iGh24d63V9lChoBmgJaA9DCKZfIt46N2JAlIaUUpRoFU3oA2gWR0B34Zw++ueSdX2UKGgGaAloD0MINszQeKKMYECUhpRSlGgVTegDaBZHQHfph3FDOTt1fZQoaAZoCWgPQwihgy7h0KpbQJSGlFKUaBVN6ANoFkdAd+9uGbkOqnV9lChoBmgJaA9DCKkSZW+pemBAlIaUUpRoFU3oA2gWR0B3+Tu+h4+sdX2UKGgGaAloD0MIQgqeQq55ZUCUhpRSlGgVTegDaBZHQHgALpJPIn11fZQoaAZoCWgPQwjytWeWBBpRQJSGlFKUaBVN6ANoFkdAeAA2OhkAgnV9lChoBmgJaA9DCJdxUwPN2z1AlIaUUpRoFUuuaBZHQHgMhoduHet1fZQoaAZoCWgPQwjDZoALMnVgQJSGlFKUaBVN6ANoFkdAeA+tHQQcxXV9lChoBmgJaA9DCHGuYYbGsWBAlIaUUpRoFU3oA2gWR0B4FsKlYU35dX2UKGgGaAloD0MIr5Y7M8GmYECUhpRSlGgVTegDaBZHQHiQ++23KCB1fZQoaAZoCWgPQwhyb37DRB5iQJSGlFKUaBVN6ANoFkdAeJeTI/7iynV9lChoBmgJaA9DCLxa7swE4FpAlIaUUpRoFU3oA2gWR0B4nLC1qnFYdX2UKGgGaAloD0MIAOMZNPTWY0CUhpRSlGgVTegDaBZHQHilOIMz/Id1fZQoaAZoCWgPQwjf+xu0Vx1fQJSGlFKUaBVN6ANoFkdAeKwkBS1ma3V9lChoBmgJaA9DCKsjRzqDzWJAlIaUUpRoFU3oA2gWR0B4uamelKsddX2UKGgGaAloD0MIj/rrFRbVXECUhpRSlGgVTegDaBZHQHi8kGJN0vJ1fZQoaAZoCWgPQwilaybfbLNmQJSGlFKUaBVN6ANoFkdAeMORTS9dvHV9lChoBmgJaA9DCHKo34WtvWRAlIaUUpRoFU3oA2gWR0B42dp1zQu3dX2UKGgGaAloD0MIdAzIXu/uYkCUhpRSlGgVTegDaBZHQHjguvIOpbV1fZQoaAZoCWgPQwi1bRgFwWdgQJSGlFKUaBVN6ANoFkdAeOUkn1Fpf3V9lChoBmgJaA9DCMxG5/yU6GFAlIaUUpRoFU3oA2gWR0B469BAv+OwdX2UKGgGaAloD0MI2ERmLnDPTUCUhpRSlGgVS9BoFkdAePBLFXJYDHV9lChoBmgJaA9DCMvydRl+32RAlIaUUpRoFU3oA2gWR0B48QhJRO1wdX2UKGgGaAloD0MI5geu8gRCYkCUhpRSlGgVTegDaBZHQHj7K1b7j1h1fZQoaAZoCWgPQwhExM2pZN1dQJSGlFKUaBVN6ANoFkdAeP3RQJokA3V9lChoBmgJaA9DCHqp2JhX0GRAlIaUUpRoFU3oA2gWR0B5BG9Gqgh9dWUu"
|
73 |
},
|
74 |
"ep_success_buffer": {
|
75 |
":type:": "<class 'collections.deque'>",
|
76 |
":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
|
77 |
},
|
78 |
+
"_n_updates": 310,
|
79 |
"n_steps": 2048,
|
80 |
"gamma": 0.999,
|
81 |
"gae_lambda": 0.95,
|
ppo-LunarLander-v2/policy.optimizer.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 84893
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:854365468382db2ecc2b8603c8f3f4293fcd12f7553de915d0c8bb44c6aeebd6
|
3 |
size 84893
|
ppo-LunarLander-v2/policy.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 43201
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:90a9c8b790d69c679e2d19b4a457fb4446715ad3eee9a3e9eef63d12588b3a1d
|
3 |
size 43201
|
replay.mp4
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8a7b518877bb7cecd340a18e158143096ca9964e1b4408e2353bdd71da8e4f17
|
3 |
+
size 248168
|
results.json
CHANGED
@@ -1 +1 @@
|
|
1 |
-
{"mean_reward":
|
|
|
1 |
+
{"mean_reward": 263.16943458744606, "std_reward": 20.315705885789782, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2022-05-12T16:51:23.500710"}
|