CoderMan-O commited on
Commit
2edff25
1 Parent(s): 7bde56d

Upload PPO BipedalWalker-v3 trained agent

Browse files
BipedalWalker-v3.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:28c6e8ef172da4a89c65875d25b6b16cf29bda756462620f80057a000877800b
3
- size 173364
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ff3d13b79b05c7de9538570cf2cd35a230ba8953c97feb9a0f67a507bacc2441
3
+ size 173404
BipedalWalker-v3/data CHANGED
@@ -26,12 +26,12 @@
26
  "_num_timesteps_at_start": 0,
27
  "seed": null,
28
  "action_noise": null,
29
- "start_time": 1713927914852567191,
30
  "learning_rate": 0.0003,
31
  "tensorboard_log": null,
32
  "_last_obs": {
33
  ":type:": "<class 'numpy.ndarray'>",
34
- ":serialized:": "gAWVdQYAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYABgAAAAAAAIIU2z/JDXg9lDa2vHIx67yApUm/9rXWvpzTHb8AgBi3AACAP6qo7j0cU4G/yt1sP+v/fz8AAAAARA+bPhHSnD4VT6I+9DOsPujfuz6R69M+zXL5PgvRGz+W9VU/AACAP4TXzD3KWcg7MRc+vLz2YL3rUZE/AACos0hYbz8AAAAAAAAAAJkoT7/6/3+/YJmrvQMAgD8AAAAAYJmCPhAVhD5xtIg+wQmRPtM8nj5vfbI+IxnSPpY8Az8aNTQ/AACAP/Jqqj5kOHY92TGhvRxulr3m4JQ/9f9/P0gGGb8AAAAAAAAAAMZrUj/lVQy+RPvpvmVE7DwAAIA/SBusPqQPrj4gJ7Q+dCK/PnmH0D7fN+s+p28KP13yLD9Ie20/AACAP9mp7D3FE6O8wfwYvbsHczzQNE2/OpscP2jkar4BAIC/AAAAAGm0jD+4MiA/HMxQPwAAgL8AAAAAh+hvPgGicj7ZH3s+WjeFPgBXkT4F8aM+LfnAPlcU8T7ahCU/AACAP4Zuxj0q7p+9ajOAPc5uUrsyVY0/AAAAAASOfz8UDno/AACAP3WLPL9MtjU/QLtFvQEAgD8AAAAAO5N9Pjg6gD4Pt4Q+HM6MPpCemT7cR60+Z/fLPh/Q/j6y8i4/AACAP9kT3D1GM+u8xZxGvefxBzwLBUq/YJeTu5C4u741cIW8AACAP4/3jD+KdGc/1gZdPwAAgL8AAIA/z7VpPkRdbD7yonQ+SMaBPr6VjT68tJ8+4fy7PuDZ6j4iPiE/AACAP7cfRz/ltq+9nf7oPDZsXLxIyDi/TJJOP85cJr83PE2/AACAP8Clqj4CAIA/7E5hP8wsBz8AAIA/OhWKPqymiz7ciZA+a1mZPiBOpz7Vt7w+NyPePsrBCj+yiD4/AACAP+ELZj/Y8aa87Mp+u2Hcm7v2mU+/S8lWPi4+J79Ic8K+AACAP7Qjcj9EyH0+ohkDv90YgD8AAAAAqwCIPhCMiT5nXI4++wmXPtzIpD7737k+ecraPqKqCD/YqTs/AACAPzo0mD6Mw329lVjrPKaJJz32z0c/BgCAv+vVhj8AiQhAAACAP68CCL8pKIg+AFLgvvv/fz8AAIA/PlyQPvD/kT4CHJc+G1KgPjvprj4kTMU+djzoPqYQET8jMkc/AACAPwhM3j6rkQ88jaVPvcNnEbxME4s/rReDvuBChjz7/38/AAAAAPGXU78AAIC/YKNHvgAAgD8AAAAAeECQPtnjkT7v/pY+QzOgPpTHrj4vJsU+yA/oPr70ED/RC0c/AACAP/YEqD28uTs99rYNvVDRgbwED0+/y/egPrDIYz7//3+/AACAP3nmjz8AAAAA0nFhP/v/f78AAAAAMZlvPsRRcj7NzHo+TAuFPvAmkT7OuqM+XLnAPp7E8D7n9yQ/bthyPwQVDT5PZ/07qMrmvP1OFjwVKEq/wH8COtBcNr/uCYC/AACAPyIRkT8AMJ+30CZRP/kHgL8AAAAA7XJqPoccbT7oaHU+Sy+CPlAIjj73NaA+/5S8PuqX6z6cwCE/AACAPyrclj6xTpa8OVa5PS1bdL2pgUW/wYt6v9BkAr4BAIA/AACAP+bcgD99h8Y+RI3oPsCIj7wAAIA/2iiFPvyrhj6QYos+s+GTPgVXoT5G/bU+njfWPkPPBT+QvTc/AACAP93ykr4/1ns9cYDlvOGYxrsnz2g/CACAv1y/ND8BAIC/AAAAAJZIiz76/3+/iIvNPS2sqr4AAAAAzLLwPpJu8z6T8/s+q6cFP4vRET8+eyQ/4JtBP5nfcT8AAIA/AACAP+XZaT/HTwO8UFyQva0hDryhxFG/cGdEPrAYG7/3dAW+AACAP3YThT/0pS6+8C4nv5ExRL8AAAAAkBeJPiCmij5WgI8+tj+YPscapj4mXbs+JIvcPuPCCT+tKj0/AACAPx3z0j7/VC88ca6QvEGsmLz1zVW/AADAskYXfz/7/38/AAAAAA5Ho75SBIU+rCJLPgEAgL8AAAAAHL3zPrmB9j5GIv8+2lcHPw6pEz8ajyY/7A1EP7btdD8AAIA/AACAP5SMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGJLEEsYhpSMAUOUdJRSlC4="
35
  },
36
  "_last_episode_starts": {
37
  ":type:": "<class 'numpy.ndarray'>",
@@ -45,7 +45,7 @@
45
  "_stats_window_size": 100,
46
  "ep_info_buffer": {
47
  ":type:": "<class 'collections.deque'>",
48
- ":serialized:": "gAWVFgMAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHwFu75dnkDISMAWyUSzKMAXSUR0AvqePq9oN/dX2UKGgGR8BcYPyf+S8raAdLM2gIR0AvtJNCZ4OddX2UKGgGR8Ba4sWoFV1faAdLOWgIR0Av1GmUGFBZdX2UKGgGR8BZT8+mm+CcaAdLQGgIR0Av+8AaNuLrdX2UKGgGR8BavOT7l7tzaAdLR2gIR0AwEsNlRP43dX2UKGgGR8BZh46Kcd5qaAdLSmgIR0AwGw8GLUCrdX2UKGgGR8BaU0yxiXpoaAdLTGgIR0AwIwGnn+yadX2UKGgGR8Ba8xgqmTC+aAdLZGgIR0AwWexfOUt7dX2UKGgGR8BfsDdYW+GoaAdLcWgIR0AwdgCfYjB3dX2UKGgGR8BZjjYywfQsaAdLSmgIR0AwlJnQID5kdX2UKGgGR8BYxWDlHSWraAdLO2gIR0AwqK5kK/mDdX2UKGgGR8BaZtuHerMlaAdLUmgIR0AwxkK/mDDkdX2UKGgGR8BZ6iCaqjrSaAdLTmgIR0Aw0iXpnpSrdX2UKGgGR8BaO+h0yP+5aAdLVGgIR0Aw7wYcebNKdX2UKGgGR8Bcz876pHZsaAdLPGgIR0Aw8HBDXvphdX2UKGgGR8BedovalDWtaAdLgmgIR0AxIXzlLeyidX2UKGgGR8BafBHf/FR6aAdLL2gIR0AxQWCmMwUQdX2UKGgGR8BbH7jPv8ZUaAdLJGgIR0AxTcD8tPHldX2UKGgGR8Bah6hcqvvCaAdLMmgIR0AxVfqX4TK1dX2UKGgGR8BaMd6w+t8vaAdLXmgIR0AxmmygPEsKdX2UKGgGR8BaaHi704BFaAdLemgIR0Axrg4wRGtqdX2UKGgGR8BZgNTLns9kaAdLL2gIR0Axu2eg+QlsdX2UKGgGR8BaFo8Md92HaAdLPGgIR0Ax7aR6nivQdX2UKGgGR8BeRnXumaYvaAdLVmgIR0Ax9bKA8SwodX2UKGgGR8BbD+8oQWepaAdLLmgIR0AyFvNu+AVgdWUu"
49
  },
50
  "ep_success_buffer": {
51
  ":type:": "<class 'collections.deque'>",
@@ -85,7 +85,7 @@
85
  "n_envs": 16,
86
  "n_steps": 300,
87
  "gamma": 0.999,
88
- "gae_lambda": 0.99,
89
  "ent_coef": 0.01,
90
  "vf_coef": 0.5,
91
  "max_grad_norm": 0.5,
 
26
  "_num_timesteps_at_start": 0,
27
  "seed": null,
28
  "action_noise": null,
29
+ "start_time": 1713928043719850162,
30
  "learning_rate": 0.0003,
31
  "tensorboard_log": null,
32
  "_last_obs": {
33
  ":type:": "<class 'numpy.ndarray'>",
34
+ ":serialized:": "gAWVdQYAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYABgAAAAAAAHElyz3lBAU8fN4lvVGN6TyfGFa/4HcdO8AHPz0ns38/AACAPw5GkT8AjKS4IG5ZP7LAB74AAIA/oZliPmosZT6sMW0+JKd7Pg5HiT7q2Jo+ykS2Ps+04z7pahk/AACAP6/RoD6vtIi9Y1hyPl6MAL0UGyC/MFxovTyLx774AIA/AACAP/u2Vb8AAN22sIPnvpIVDD4AAAAAyUOKPsLViz6ZupA+II2ZPomGpz5297w+HW7ePpPwCj9pQj8/AACAPzXnmT4AQN+8xyrNvchyQD1tUQ2/CZf7PiKsIb8AAAAAAAAAAINncT99eAm/5FMmP///fz8AAAAAHx2LPpCxjD4YnpE+fX6aPt6NqD5/IL4+wMvfPvnKCz+Zzj8/AACAP/IxgD8xKLC8gBcTPpyErbxZgT2/SgKAP/7MD7/7AIC/AACAP7FDH78451S9Vnwov1XpIjoAAIA/xbigPgiMoj5bPKg+t32yPiu8wj6bqNs+VEcBP6CBIT8KJl4/AACAP517ZbwTvq88wNH6PYh/Or6huxE9AACAv9Z2CL/7/38/AAAAAFPUYr13EDi+SCVbvr3pp74AAIA/nry0PhHKtj7AL70+DbjIPl782j5gA/c+w2ARP3yeNT/p3ns/AACAP0lU8z2KMru89boXPcRpAr21vFW/AABgtAAQh7z//38/AAAAAKxTjz8kWlm+VMJaPwEAgD8AAIA/69FnPuFzaj5vqHI+lrmAPphwjD4Rap4+p3e6Pp/z6D6Cex8/AACAP++6wT1+Kxw8DXwpuwoQDT23aEu/ADQFuZzErr4Pyis/AACAP23QjD8AoJk2hqVqP3D3Hr4AAIA/D/lkPr6SZz6ArW8+ukl+Pgu3ij4AeJw+Yy24PjQX5j5t+R0/AACAP+oqHD8MJji9EzlyvR2hiTx1Nlo/rlB+P7L9Mj9jAIC/AAAAAOvnI7++jQk/GtItv/lyVL8AAIA/TGCNPlH7jj5Z/JM+swGdPp1Lqz4OOME+fG/jPvoQDj8CFEM/AACAP3NvTT5Q9wq9W55uPYu3Ib2N2oo/mp7Ivj6tVD83AYA/AACAP65KVr8AQEk3gJVyvk8GgD8AAIA/53V5PiZLfD7Gj4I+OIWKPnEglz4ReKo+JajIPqet+j77Gyw/AACAPyCltj9s1K27LhkWvkWZUjx8DUi/UL5aPhgvGr9g7TO8AACAP0IVkr7j+Ao+0MMqvvTCf78AAAAAkWCiPqQ4pD7396k+XlS0Pqe9xD7P690+N5wCP30rIz92DmA/AACAPxwn87tSUk69fdoVuZjEir0rScC+o591P5Z6AD+LsWW/AACAP7iuVz90Wws/KoUoP+f/fz8AAIA/HgbHPrxIyT4eVNA+IwfdPpwk8T7LAAg/YhYgP9b+Rz8AAIA/AACAP5VrSj/kFlo8kfoCPW9AGb2cfoU/qHflvhT4qz77/3+/AAAAAMHlNL/8/38/wO42v/2iP78AAAAAJvGLPv+HjT4IfJI+9mmbPsSOqT5GQr8+2CDhPgmgDD9lGUE/AACAP0G06z0WnPU7oiC9PMMDqrxjLpE/AACgMgpWcD8Unsc+AACAP4/aTb8iQ8E9gLzjvP3/f78AAAAA4xB5Pvzkez7oWoI+IU2KPj/jlj4KM6o+5FbIPiVI+j5J1is/AACAP8Kr1z1I4IG99XSWPXrii7sIOy+/WMZ4PgAmjLsAAIA/AAAAAO/hgj9q69M+2CVvP6uqqjAAAIA/w7x6PriVfT7YOoM+uDqLPnXmlz5tV6s+D6/JPhv2+z59/Sw/AACAP2cqhj7JRuq7aVgjPamXeDx5vFW/AAAAACCChj1545Q9AAAAAH6sjz8AAAAAdMyzPrM9kz4AAIA/14J8PvRgfz5/KIQ+3DaMPoz5mD65jaw+TRzLPme+/T7FNi4/AACAPwfbTD6OzXE87SgFPLbvML0a0JA/hZ0KP9YbIz+g61S/AACAP/uGQ7/7V4E+QG+hvgEAgL8AAAAAbeyCPg5phD5gC4k+/GWRPnOhnj7w7rI+vp7SPguQAz/XuTE/AACAP5SMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGJLEEsYhpSMAUOUdJRSlC4="
35
  },
36
  "_last_episode_starts": {
37
  ":type:": "<class 'numpy.ndarray'>",
 
45
  "_stats_window_size": 100,
46
  "ep_info_buffer": {
47
  ":type:": "<class 'collections.deque'>",
48
+ ":serialized:": "gAWVNAMAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHwFyGl+EytV+MAWyUSzuMAXSUR0BiCFdzGPxQdX2UKGgGR8BalN2xIJ7caAdLPmgIR0BiCPGhmGucdX2UKGgGR8BZ71KwpvxZaAdLQ2gIR0BiChSrHU+cdX2UKGgGR8BcylDOTq0MaAdLRGgIR0BiCjEk0JnhdX2UKGgGR8BaGywKSgXeaAdLRmgIR0BiCzRIBikPdX2UKGgGR8BZ83wsoUi7aAdLRmgIR0BiCvQ0GeMAdX2UKGgGR8BZLLOiWVu8aAdLSWgIR0BiC8MNMGordX2UKGgGR8BZ/yVjZtelaAdLUGgIR0BiDWNPxhDxdX2UKGgGR8BaiaRuCPIXaAdLUmgIR0BiDfTgEU0vdX2UKGgGR8BdgPvWpZOjaAdLU2gIR0BiDpVQyhzvdX2UKGgGR8BemiJ9AooeaAdLV2gIR0BiD3UH6dlNdX2UKGgGR8BeHZ22Xsw+aAdLXWgIR0BiEKCg9NeudX2UKGgGR8BavljI7vG7aAdLN2gIR0BiFN36hxo7dX2UKGgGR8BZ4V4TsY2saAdLcmgIR0BiFPLHMlkZdX2UKGgGR8BarsPnSv1UaAdLO2gIR0BiF0vIwM6SdX2UKGgGR8BaDJrULDyfaAdLQ2gIR0BiGCBK+SKWdX2UKGgGR8BZ3F8stkFwaAdLO2gIR0BiGkVQAMlUdX2UKGgGR8BaqkF4cFQmaAdLP2gIR0BiG3BtUGVzdX2UKGgGR8BaVhxo7FKkaAdLPGgIR0BiG8TviLl4dX2UKGgGR8BcrhrWRRuTaAdLOGgIR0BiINuBMBZIdX2UKGgGR8BZ9ENjLB9DaAdLO2gIR0BiKF/8VHnVdX2UKGgGR8BarGRFI/Z/aAdLlWgIR0BiLb5AQg9vdX2UKGgGR8BZl//rB0p3aAdLX2gIR0BiLnX05EMLdX2UKGgGR8Baa8pXp4bCaAdLSGgIR0BiMCR8twrEdX2UKGgGR8Bc6Eb961LKaAdLP2gIR0BiNUtf5ULldX2UKGgGR8Bc05hWo3rEaAdLgGgIR0BiNmZ/kNnXdWUu"
49
  },
50
  "ep_success_buffer": {
51
  ":type:": "<class 'collections.deque'>",
 
85
  "n_envs": 16,
86
  "n_steps": 300,
87
  "gamma": 0.999,
88
+ "gae_lambda": 0.98,
89
  "ent_coef": 0.01,
90
  "vf_coef": 0.5,
91
  "max_grad_norm": 0.5,
BipedalWalker-v3/policy.optimizer.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8efe1369d3054db90473e3fce641809bd8c1dcf7d26216af9e07bb59322bc6b1
3
  size 105121
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c7f055588d07259f507ca6ece79215824edc10b4ddb2c5a620aa3be49de78b62
3
  size 105121
BipedalWalker-v3/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:16683d835b746824c2d4764b46ce347dcdbbcb46596054da74793d22e129cfcd
3
  size 52143
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:014a9b98204934461272ea85a762b622b36c7d7e1458ebd8c2ae8f252f859f44
3
  size 52143
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: BipedalWalker-v3
17
  metrics:
18
  - type: mean_reward
19
- value: -92.20 +/- 0.18
20
  name: mean_reward
21
  verified: false
22
  ---
 
16
  type: BipedalWalker-v3
17
  metrics:
18
  - type: mean_reward
19
+ value: -102.81 +/- 5.11
20
  name: mean_reward
21
  verified: false
22
  ---
config.json CHANGED
@@ -1 +1 @@
1
- {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7fa01b21db40>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7fa01b21dbd0>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7fa01b21dc60>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7fa01b21dcf0>", "_build": "<function ActorCriticPolicy._build at 0x7fa01b21dd80>", "forward": "<function ActorCriticPolicy.forward at 0x7fa01b21de10>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x7fa01b21dea0>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7fa01b21df30>", "_predict": "<function ActorCriticPolicy._predict at 0x7fa01b21dfc0>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7fa01b21e050>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7fa01b21e0e0>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7fa01b21e170>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7fa01b3c2ec0>"}, "verbose": 1, "policy_kwargs": {}, "num_timesteps": 4800, "_total_timesteps": 2000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1713927914852567191, "learning_rate": 0.0003, "tensorboard_log": null, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQYAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYABgAAAAAAAIIU2z/JDXg9lDa2vHIx67yApUm/9rXWvpzTHb8AgBi3AACAP6qo7j0cU4G/yt1sP+v/fz8AAAAARA+bPhHSnD4VT6I+9DOsPujfuz6R69M+zXL5PgvRGz+W9VU/AACAP4TXzD3KWcg7MRc+vLz2YL3rUZE/AACos0hYbz8AAAAAAAAAAJkoT7/6/3+/YJmrvQMAgD8AAAAAYJmCPhAVhD5xtIg+wQmRPtM8nj5vfbI+IxnSPpY8Az8aNTQ/AACAP/Jqqj5kOHY92TGhvRxulr3m4JQ/9f9/P0gGGb8AAAAAAAAAAMZrUj/lVQy+RPvpvmVE7DwAAIA/SBusPqQPrj4gJ7Q+dCK/PnmH0D7fN+s+p28KP13yLD9Ie20/AACAP9mp7D3FE6O8wfwYvbsHczzQNE2/OpscP2jkar4BAIC/AAAAAGm0jD+4MiA/HMxQPwAAgL8AAAAAh+hvPgGicj7ZH3s+WjeFPgBXkT4F8aM+LfnAPlcU8T7ahCU/AACAP4Zuxj0q7p+9ajOAPc5uUrsyVY0/AAAAAASOfz8UDno/AACAP3WLPL9MtjU/QLtFvQEAgD8AAAAAO5N9Pjg6gD4Pt4Q+HM6MPpCemT7cR60+Z/fLPh/Q/j6y8i4/AACAP9kT3D1GM+u8xZxGvefxBzwLBUq/YJeTu5C4u741cIW8AACAP4/3jD+KdGc/1gZdPwAAgL8AAIA/z7VpPkRdbD7yonQ+SMaBPr6VjT68tJ8+4fy7PuDZ6j4iPiE/AACAP7cfRz/ltq+9nf7oPDZsXLxIyDi/TJJOP85cJr83PE2/AACAP8Clqj4CAIA/7E5hP8wsBz8AAIA/OhWKPqymiz7ciZA+a1mZPiBOpz7Vt7w+NyPePsrBCj+yiD4/AACAP+ELZj/Y8aa87Mp+u2Hcm7v2mU+/S8lWPi4+J79Ic8K+AACAP7Qjcj9EyH0+ohkDv90YgD8AAAAAqwCIPhCMiT5nXI4++wmXPtzIpD7737k+ecraPqKqCD/YqTs/AACAPzo0mD6Mw329lVjrPKaJJz32z0c/BgCAv+vVhj8AiQhAAACAP68CCL8pKIg+AFLgvvv/fz8AAIA/PlyQPvD/kT4CHJc+G1KgPjvprj4kTMU+djzoPqYQET8jMkc/AACAPwhM3j6rkQ88jaVPvcNnEbxME4s/rReDvuBChjz7/38/AAAAAPGXU78AAIC/YKNHvgAAgD8AAAAAeECQPtnjkT7v/pY+QzOgPpTHrj4vJsU+yA/oPr70ED/RC0c/AACAP/YEqD28uTs99rYNvVDRgbwED0+/y/egPrDIYz7//3+/AACAP3nmjz8AAAAA0nFhP/v/f78AAAAAMZlvPsRRcj7NzHo+TAuFPvAmkT7OuqM+XLnAPp7E8D7n9yQ/bthyPwQVDT5PZ/07qMrmvP1OFjwVKEq/wH8COtBcNr/uCYC/AACAPyIRkT8AMJ+30CZRP/kHgL8AAAAA7XJqPoccbT7oaHU+Sy+CPlAIjj73NaA+/5S8PuqX6z6cwCE/AACAPyrclj6xTpa8OVa5PS1bdL2pgUW/wYt6v9BkAr4BAIA/AACAP+bcgD99h8Y+RI3oPsCIj7wAAIA/2iiFPvyrhj6QYos+s+GTPgVXoT5G/bU+njfWPkPPBT+QvTc/AACAP93ykr4/1ns9cYDlvOGYxrsnz2g/CACAv1y/ND8BAIC/AAAAAJZIiz76/3+/iIvNPS2sqr4AAAAAzLLwPpJu8z6T8/s+q6cFP4vRET8+eyQ/4JtBP5nfcT8AAIA/AACAP+XZaT/HTwO8UFyQva0hDryhxFG/cGdEPrAYG7/3dAW+AACAP3YThT/0pS6+8C4nv5ExRL8AAAAAkBeJPiCmij5WgI8+tj+YPscapj4mXbs+JIvcPuPCCT+tKj0/AACAPx3z0j7/VC88ca6QvEGsmLz1zVW/AADAskYXfz/7/38/AAAAAA5Ho75SBIU+rCJLPgEAgL8AAAAAHL3zPrmB9j5GIv8+2lcHPw6pEz8ajyY/7A1EP7btdD8AAIA/AACAP5SMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGJLEEsYhpSMAUOUdJRSlC4="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -1.4, "_stats_window_size": 100, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVFgMAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHwFu75dnkDISMAWyUSzKMAXSUR0AvqePq9oN/dX2UKGgGR8BcYPyf+S8raAdLM2gIR0AvtJNCZ4OddX2UKGgGR8Ba4sWoFV1faAdLOWgIR0Av1GmUGFBZdX2UKGgGR8BZT8+mm+CcaAdLQGgIR0Av+8AaNuLrdX2UKGgGR8BavOT7l7tzaAdLR2gIR0AwEsNlRP43dX2UKGgGR8BZh46Kcd5qaAdLSmgIR0AwGw8GLUCrdX2UKGgGR8BaU0yxiXpoaAdLTGgIR0AwIwGnn+yadX2UKGgGR8Ba8xgqmTC+aAdLZGgIR0AwWexfOUt7dX2UKGgGR8BfsDdYW+GoaAdLcWgIR0AwdgCfYjB3dX2UKGgGR8BZjjYywfQsaAdLSmgIR0AwlJnQID5kdX2UKGgGR8BYxWDlHSWraAdLO2gIR0AwqK5kK/mDdX2UKGgGR8BaZtuHerMlaAdLUmgIR0AwxkK/mDDkdX2UKGgGR8BZ6iCaqjrSaAdLTmgIR0Aw0iXpnpSrdX2UKGgGR8BaO+h0yP+5aAdLVGgIR0Aw7wYcebNKdX2UKGgGR8Bcz876pHZsaAdLPGgIR0Aw8HBDXvphdX2UKGgGR8BedovalDWtaAdLgmgIR0AxIXzlLeyidX2UKGgGR8BafBHf/FR6aAdLL2gIR0AxQWCmMwUQdX2UKGgGR8BbH7jPv8ZUaAdLJGgIR0AxTcD8tPHldX2UKGgGR8Bah6hcqvvCaAdLMmgIR0AxVfqX4TK1dX2UKGgGR8BaMd6w+t8vaAdLXmgIR0AxmmygPEsKdX2UKGgGR8BaaHi704BFaAdLemgIR0Axrg4wRGtqdX2UKGgGR8BZgNTLns9kaAdLL2gIR0Axu2eg+QlsdX2UKGgGR8BaFo8Md92HaAdLPGgIR0Ax7aR6nivQdX2UKGgGR8BeRnXumaYvaAdLVmgIR0Ax9bKA8SwodX2UKGgGR8BbD+8oQWepaAdLLmgIR0AyFvNu+AVgdWUu"}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 4, "observation_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVTAQAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWGAAAAAAAAAABAQEBAQEBAQEBAQEBAQEBAQEBAQEBAQGUaAiMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLGIWUjAFDlHSUUpSMDWJvdW5kZWRfYWJvdmWUaBEolhgAAAAAAAAAAQEBAQEBAQEBAQEBAQEBAQEBAQEBAQEBlGgVSxiFlGgZdJRSlIwGX3NoYXBllEsYhZSMA2xvd5RoESiWYAAAAAAAAADbD0nAAACgwAAAoMAAAKDA2w9JwAAAoMDbD0nAAACgwAAAAIDbD0nAAACgwNsPScAAAKDAAAAAgAAAgL8AAIC/AACAvwAAgL8AAIC/AACAvwAAgL8AAIC/AACAvwAAgL+UaAtLGIWUaBl0lFKUjARoaWdolGgRKJZgAAAAAAAAANsPSUAAAKBAAACgQAAAoEDbD0lAAACgQNsPSUAAAKBAAACgQNsPSUAAAKBA2w9JQAAAoEAAAKBAAACAPwAAgD8AAIA/AACAPwAAgD8AAIA/AACAPwAAgD8AAIA/AACAP5RoC0sYhZRoGXSUUpSMCGxvd19yZXBylIz+Wy0zLjE0MTU5MjcgLTUuICAgICAgICAtNS4gICAgICAgIC01LiAgICAgICAgLTMuMTQxNTkyNyAtNS4KIC0zLjE0MTU5MjcgLTUuICAgICAgICAtMC4gICAgICAgIC0zLjE0MTU5MjcgLTUuICAgICAgICAtMy4xNDE1OTI3CiAtNS4gICAgICAgIC0wLiAgICAgICAgLTEuICAgICAgICAtMS4gICAgICAgIC0xLiAgICAgICAgLTEuCiAtMS4gICAgICAgIC0xLiAgICAgICAgLTEuICAgICAgICAtMS4gICAgICAgIC0xLiAgICAgICAgLTEuICAgICAgIF2UjAloaWdoX3JlcHKUjOZbMy4xNDE1OTI3IDUuICAgICAgICA1LiAgICAgICAgNS4gICAgICAgIDMuMTQxNTkyNyA1LiAgICAgICAgMy4xNDE1OTI3CiA1LiAgICAgICAgNS4gICAgICAgIDMuMTQxNTkyNyA1LiAgICAgICAgMy4xNDE1OTI3IDUuICAgICAgICA1LgogMS4gICAgICAgIDEuICAgICAgICAxLiAgICAgICAgMS4gICAgICAgIDEuICAgICAgICAxLiAgICAgICAgMS4KIDEuICAgICAgICAxLiAgICAgICAgMS4gICAgICAgXZSMCl9ucF9yYW5kb22UTnViLg==", "dtype": "float32", "bounded_below": "[ True True True True True True True True True True True True\n True True True True True True True True True True True True]", "bounded_above": "[ True True True True True True True True True True True True\n True True True True True True True True True True True True]", "_shape": [24], "low": "[-3.1415927 -5. -5. -5. -3.1415927 -5.\n -3.1415927 -5. -0. -3.1415927 -5. -3.1415927\n -5. -0. -1. -1. -1. -1.\n -1. -1. -1. -1. -1. -1. ]", "high": "[3.1415927 5. 5. 5. 3.1415927 5. 3.1415927\n 5. 5. 3.1415927 5. 3.1415927 5. 5.\n 1. 1. 1. 1. 1. 1. 1.\n 1. 1. 1. ]", "low_repr": "[-3.1415927 -5. -5. -5. -3.1415927 -5.\n -3.1415927 -5. -0. -3.1415927 -5. -3.1415927\n -5. -0. -1. -1. -1. -1.\n -1. -1. -1. -1. -1. -1. ]", "high_repr": "[3.1415927 5. 5. 5. 3.1415927 5. 3.1415927\n 5. 5. 3.1415927 5. 3.1415927 5. 5.\n 1. 1. 1. 1. 1. 1. 1.\n 1. 1. 1. ]", "_np_random": null}, "action_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVpwEAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWBAAAAAAAAAABAQEBlGgIjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSwSFlIwBQ5R0lFKUjA1ib3VuZGVkX2Fib3ZllGgRKJYEAAAAAAAAAAEBAQGUaBVLBIWUaBl0lFKUjAZfc2hhcGWUSwSFlIwDbG93lGgRKJYQAAAAAAAAAAAAgL8AAIC/AACAvwAAgL+UaAtLBIWUaBl0lFKUjARoaWdolGgRKJYQAAAAAAAAAAAAgD8AAIA/AACAPwAAgD+UaAtLBIWUaBl0lFKUjAhsb3dfcmVwcpSMBC0xLjCUjAloaWdoX3JlcHKUjAMxLjCUjApfbnBfcmFuZG9tlE51Yi4=", "dtype": "float32", "bounded_below": "[ True True True True]", "bounded_above": "[ True True True True]", "_shape": [4], "low": "[-1. -1. -1. -1.]", "high": "[1. 1. 1. 1.]", "low_repr": "-1.0", "high_repr": "1.0", "_np_random": null}, "n_envs": 16, "n_steps": 300, "gamma": 0.999, "gae_lambda": 0.99, "ent_coef": 0.01, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 4, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz/JmZmZmZmahZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz8zqSowVTJhhZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "system_info": {"OS": "Linux-6.1.58+-x86_64-with-glibc2.35 # 1 SMP PREEMPT_DYNAMIC Sat Nov 18 15:31:17 UTC 2023", "Python": "3.10.12", "Stable-Baselines3": "2.0.0a5", "PyTorch": "2.2.1+cu121", "GPU Enabled": "False", "Numpy": "1.25.2", "Cloudpickle": "2.2.1", "Gymnasium": "0.28.1", "OpenAI Gym": "0.25.2"}}
 
1
+ {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7fa01b21db40>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7fa01b21dbd0>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7fa01b21dc60>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7fa01b21dcf0>", "_build": "<function ActorCriticPolicy._build at 0x7fa01b21dd80>", "forward": "<function ActorCriticPolicy.forward at 0x7fa01b21de10>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x7fa01b21dea0>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7fa01b21df30>", "_predict": "<function ActorCriticPolicy._predict at 0x7fa01b21dfc0>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7fa01b21e050>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7fa01b21e0e0>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7fa01b21e170>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7fa01b3c2ec0>"}, "verbose": 1, "policy_kwargs": {}, "num_timesteps": 4800, "_total_timesteps": 2000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1713928043719850162, "learning_rate": 0.0003, "tensorboard_log": null, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQYAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYABgAAAAAAAHElyz3lBAU8fN4lvVGN6TyfGFa/4HcdO8AHPz0ns38/AACAPw5GkT8AjKS4IG5ZP7LAB74AAIA/oZliPmosZT6sMW0+JKd7Pg5HiT7q2Jo+ykS2Ps+04z7pahk/AACAP6/RoD6vtIi9Y1hyPl6MAL0UGyC/MFxovTyLx774AIA/AACAP/u2Vb8AAN22sIPnvpIVDD4AAAAAyUOKPsLViz6ZupA+II2ZPomGpz5297w+HW7ePpPwCj9pQj8/AACAPzXnmT4AQN+8xyrNvchyQD1tUQ2/CZf7PiKsIb8AAAAAAAAAAINncT99eAm/5FMmP///fz8AAAAAHx2LPpCxjD4YnpE+fX6aPt6NqD5/IL4+wMvfPvnKCz+Zzj8/AACAP/IxgD8xKLC8gBcTPpyErbxZgT2/SgKAP/7MD7/7AIC/AACAP7FDH78451S9Vnwov1XpIjoAAIA/xbigPgiMoj5bPKg+t32yPiu8wj6bqNs+VEcBP6CBIT8KJl4/AACAP517ZbwTvq88wNH6PYh/Or6huxE9AACAv9Z2CL/7/38/AAAAAFPUYr13EDi+SCVbvr3pp74AAIA/nry0PhHKtj7AL70+DbjIPl782j5gA/c+w2ARP3yeNT/p3ns/AACAP0lU8z2KMru89boXPcRpAr21vFW/AABgtAAQh7z//38/AAAAAKxTjz8kWlm+VMJaPwEAgD8AAIA/69FnPuFzaj5vqHI+lrmAPphwjD4Rap4+p3e6Pp/z6D6Cex8/AACAP++6wT1+Kxw8DXwpuwoQDT23aEu/ADQFuZzErr4Pyis/AACAP23QjD8AoJk2hqVqP3D3Hr4AAIA/D/lkPr6SZz6ArW8+ukl+Pgu3ij4AeJw+Yy24PjQX5j5t+R0/AACAP+oqHD8MJji9EzlyvR2hiTx1Nlo/rlB+P7L9Mj9jAIC/AAAAAOvnI7++jQk/GtItv/lyVL8AAIA/TGCNPlH7jj5Z/JM+swGdPp1Lqz4OOME+fG/jPvoQDj8CFEM/AACAP3NvTT5Q9wq9W55uPYu3Ib2N2oo/mp7Ivj6tVD83AYA/AACAP65KVr8AQEk3gJVyvk8GgD8AAIA/53V5PiZLfD7Gj4I+OIWKPnEglz4ReKo+JajIPqet+j77Gyw/AACAPyCltj9s1K27LhkWvkWZUjx8DUi/UL5aPhgvGr9g7TO8AACAP0IVkr7j+Ao+0MMqvvTCf78AAAAAkWCiPqQ4pD7396k+XlS0Pqe9xD7P690+N5wCP30rIz92DmA/AACAPxwn87tSUk69fdoVuZjEir0rScC+o591P5Z6AD+LsWW/AACAP7iuVz90Wws/KoUoP+f/fz8AAIA/HgbHPrxIyT4eVNA+IwfdPpwk8T7LAAg/YhYgP9b+Rz8AAIA/AACAP5VrSj/kFlo8kfoCPW9AGb2cfoU/qHflvhT4qz77/3+/AAAAAMHlNL/8/38/wO42v/2iP78AAAAAJvGLPv+HjT4IfJI+9mmbPsSOqT5GQr8+2CDhPgmgDD9lGUE/AACAP0G06z0WnPU7oiC9PMMDqrxjLpE/AACgMgpWcD8Unsc+AACAP4/aTb8iQ8E9gLzjvP3/f78AAAAA4xB5Pvzkez7oWoI+IU2KPj/jlj4KM6o+5FbIPiVI+j5J1is/AACAP8Kr1z1I4IG99XSWPXrii7sIOy+/WMZ4PgAmjLsAAIA/AAAAAO/hgj9q69M+2CVvP6uqqjAAAIA/w7x6PriVfT7YOoM+uDqLPnXmlz5tV6s+D6/JPhv2+z59/Sw/AACAP2cqhj7JRuq7aVgjPamXeDx5vFW/AAAAACCChj1545Q9AAAAAH6sjz8AAAAAdMyzPrM9kz4AAIA/14J8PvRgfz5/KIQ+3DaMPoz5mD65jaw+TRzLPme+/T7FNi4/AACAPwfbTD6OzXE87SgFPLbvML0a0JA/hZ0KP9YbIz+g61S/AACAP/uGQ7/7V4E+QG+hvgEAgL8AAAAAbeyCPg5phD5gC4k+/GWRPnOhnj7w7rI+vp7SPguQAz/XuTE/AACAP5SMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGJLEEsYhpSMAUOUdJRSlC4="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -1.4, "_stats_window_size": 100, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVNAMAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHwFyGl+EytV+MAWyUSzuMAXSUR0BiCFdzGPxQdX2UKGgGR8BalN2xIJ7caAdLPmgIR0BiCPGhmGucdX2UKGgGR8BZ71KwpvxZaAdLQ2gIR0BiChSrHU+cdX2UKGgGR8BcylDOTq0MaAdLRGgIR0BiCjEk0JnhdX2UKGgGR8BaGywKSgXeaAdLRmgIR0BiCzRIBikPdX2UKGgGR8BZ83wsoUi7aAdLRmgIR0BiCvQ0GeMAdX2UKGgGR8BZLLOiWVu8aAdLSWgIR0BiC8MNMGordX2UKGgGR8BZ/yVjZtelaAdLUGgIR0BiDWNPxhDxdX2UKGgGR8BaiaRuCPIXaAdLUmgIR0BiDfTgEU0vdX2UKGgGR8BdgPvWpZOjaAdLU2gIR0BiDpVQyhzvdX2UKGgGR8BemiJ9AooeaAdLV2gIR0BiD3UH6dlNdX2UKGgGR8BeHZ22Xsw+aAdLXWgIR0BiEKCg9NeudX2UKGgGR8BavljI7vG7aAdLN2gIR0BiFN36hxo7dX2UKGgGR8BZ4V4TsY2saAdLcmgIR0BiFPLHMlkZdX2UKGgGR8BarsPnSv1UaAdLO2gIR0BiF0vIwM6SdX2UKGgGR8BaDJrULDyfaAdLQ2gIR0BiGCBK+SKWdX2UKGgGR8BZ3F8stkFwaAdLO2gIR0BiGkVQAMlUdX2UKGgGR8BaqkF4cFQmaAdLP2gIR0BiG3BtUGVzdX2UKGgGR8BaVhxo7FKkaAdLPGgIR0BiG8TviLl4dX2UKGgGR8BcrhrWRRuTaAdLOGgIR0BiINuBMBZIdX2UKGgGR8BZ9ENjLB9DaAdLO2gIR0BiKF/8VHnVdX2UKGgGR8BarGRFI/Z/aAdLlWgIR0BiLb5AQg9vdX2UKGgGR8BZl//rB0p3aAdLX2gIR0BiLnX05EMLdX2UKGgGR8Baa8pXp4bCaAdLSGgIR0BiMCR8twrEdX2UKGgGR8Bc6Eb961LKaAdLP2gIR0BiNUtf5ULldX2UKGgGR8Bc05hWo3rEaAdLgGgIR0BiNmZ/kNnXdWUu"}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 4, "observation_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVTAQAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWGAAAAAAAAAABAQEBAQEBAQEBAQEBAQEBAQEBAQEBAQGUaAiMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLGIWUjAFDlHSUUpSMDWJvdW5kZWRfYWJvdmWUaBEolhgAAAAAAAAAAQEBAQEBAQEBAQEBAQEBAQEBAQEBAQEBlGgVSxiFlGgZdJRSlIwGX3NoYXBllEsYhZSMA2xvd5RoESiWYAAAAAAAAADbD0nAAACgwAAAoMAAAKDA2w9JwAAAoMDbD0nAAACgwAAAAIDbD0nAAACgwNsPScAAAKDAAAAAgAAAgL8AAIC/AACAvwAAgL8AAIC/AACAvwAAgL8AAIC/AACAvwAAgL+UaAtLGIWUaBl0lFKUjARoaWdolGgRKJZgAAAAAAAAANsPSUAAAKBAAACgQAAAoEDbD0lAAACgQNsPSUAAAKBAAACgQNsPSUAAAKBA2w9JQAAAoEAAAKBAAACAPwAAgD8AAIA/AACAPwAAgD8AAIA/AACAPwAAgD8AAIA/AACAP5RoC0sYhZRoGXSUUpSMCGxvd19yZXBylIz+Wy0zLjE0MTU5MjcgLTUuICAgICAgICAtNS4gICAgICAgIC01LiAgICAgICAgLTMuMTQxNTkyNyAtNS4KIC0zLjE0MTU5MjcgLTUuICAgICAgICAtMC4gICAgICAgIC0zLjE0MTU5MjcgLTUuICAgICAgICAtMy4xNDE1OTI3CiAtNS4gICAgICAgIC0wLiAgICAgICAgLTEuICAgICAgICAtMS4gICAgICAgIC0xLiAgICAgICAgLTEuCiAtMS4gICAgICAgIC0xLiAgICAgICAgLTEuICAgICAgICAtMS4gICAgICAgIC0xLiAgICAgICAgLTEuICAgICAgIF2UjAloaWdoX3JlcHKUjOZbMy4xNDE1OTI3IDUuICAgICAgICA1LiAgICAgICAgNS4gICAgICAgIDMuMTQxNTkyNyA1LiAgICAgICAgMy4xNDE1OTI3CiA1LiAgICAgICAgNS4gICAgICAgIDMuMTQxNTkyNyA1LiAgICAgICAgMy4xNDE1OTI3IDUuICAgICAgICA1LgogMS4gICAgICAgIDEuICAgICAgICAxLiAgICAgICAgMS4gICAgICAgIDEuICAgICAgICAxLiAgICAgICAgMS4KIDEuICAgICAgICAxLiAgICAgICAgMS4gICAgICAgXZSMCl9ucF9yYW5kb22UTnViLg==", "dtype": "float32", "bounded_below": "[ True True True True True True True True True True True True\n True True True True True True True True True True True True]", "bounded_above": "[ True True True True True True True True True True True True\n True True True True True True True True True True True True]", "_shape": [24], "low": "[-3.1415927 -5. -5. -5. -3.1415927 -5.\n -3.1415927 -5. -0. -3.1415927 -5. -3.1415927\n -5. -0. -1. -1. -1. -1.\n -1. -1. -1. -1. -1. -1. ]", "high": "[3.1415927 5. 5. 5. 3.1415927 5. 3.1415927\n 5. 5. 3.1415927 5. 3.1415927 5. 5.\n 1. 1. 1. 1. 1. 1. 1.\n 1. 1. 1. ]", "low_repr": "[-3.1415927 -5. -5. -5. -3.1415927 -5.\n -3.1415927 -5. -0. -3.1415927 -5. -3.1415927\n -5. -0. -1. -1. -1. -1.\n -1. -1. -1. -1. -1. -1. ]", "high_repr": "[3.1415927 5. 5. 5. 3.1415927 5. 3.1415927\n 5. 5. 3.1415927 5. 3.1415927 5. 5.\n 1. 1. 1. 1. 1. 1. 1.\n 1. 1. 1. ]", "_np_random": null}, "action_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVpwEAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWBAAAAAAAAAABAQEBlGgIjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSwSFlIwBQ5R0lFKUjA1ib3VuZGVkX2Fib3ZllGgRKJYEAAAAAAAAAAEBAQGUaBVLBIWUaBl0lFKUjAZfc2hhcGWUSwSFlIwDbG93lGgRKJYQAAAAAAAAAAAAgL8AAIC/AACAvwAAgL+UaAtLBIWUaBl0lFKUjARoaWdolGgRKJYQAAAAAAAAAAAAgD8AAIA/AACAPwAAgD+UaAtLBIWUaBl0lFKUjAhsb3dfcmVwcpSMBC0xLjCUjAloaWdoX3JlcHKUjAMxLjCUjApfbnBfcmFuZG9tlE51Yi4=", "dtype": "float32", "bounded_below": "[ True True True True]", "bounded_above": "[ True True True True]", "_shape": [4], "low": "[-1. -1. -1. -1.]", "high": "[1. 1. 1. 1.]", "low_repr": "-1.0", "high_repr": "1.0", "_np_random": null}, "n_envs": 16, "n_steps": 300, "gamma": 0.999, "gae_lambda": 0.98, "ent_coef": 0.01, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 4, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz/JmZmZmZmahZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz8zqSowVTJhhZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "system_info": {"OS": "Linux-6.1.58+-x86_64-with-glibc2.35 # 1 SMP PREEMPT_DYNAMIC Sat Nov 18 15:31:17 UTC 2023", "Python": "3.10.12", "Stable-Baselines3": "2.0.0a5", "PyTorch": "2.2.1+cu121", "GPU Enabled": "False", "Numpy": "1.25.2", "Cloudpickle": "2.2.1", "Gymnasium": "0.28.1", "OpenAI Gym": "0.25.2"}}
replay.mp4 CHANGED
Binary files a/replay.mp4 and b/replay.mp4 differ
 
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": -92.1980797922799, "std_reward": 0.17525968699805827, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2024-04-24T03:05:41.965914"}
 
1
+ {"mean_reward": -102.80616708775088, "std_reward": 5.105159288719299, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2024-04-24T03:07:31.450449"}