hannahh7 commited on
Commit
c466bec
1 Parent(s): 4265f56

Initial commit

Browse files
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: AntBulletEnv-v0
17
  metrics:
18
  - type: mean_reward
19
- value: 926.85 +/- 364.89
20
  name: mean_reward
21
  verified: false
22
  ---
 
16
  type: AntBulletEnv-v0
17
  metrics:
18
  - type: mean_reward
19
+ value: 1833.67 +/- 155.85
20
  name: mean_reward
21
  verified: false
22
  ---
a2c-AntBulletEnv-v0.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ceb5ab21fd5ec9e93ae140f9df4340367d60e232eb616623d34797031bf44c20
3
- size 128989
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dfeb9558194719af6ec8cd2eb4ea75d9c43a855d36e01aa03bc987151bf7b64c
3
+ size 129248
a2c-AntBulletEnv-v0/data CHANGED
@@ -4,20 +4,20 @@
4
  ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
5
  "__module__": "stable_baselines3.common.policies",
6
  "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
7
- "__init__": "<function ActorCriticPolicy.__init__ at 0x7f70bb76f880>",
8
- "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f70bb76f910>",
9
- "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f70bb76f9a0>",
10
- "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f70bb76fa30>",
11
- "_build": "<function ActorCriticPolicy._build at 0x7f70bb76fac0>",
12
- "forward": "<function ActorCriticPolicy.forward at 0x7f70bb76fb50>",
13
- "extract_features": "<function ActorCriticPolicy.extract_features at 0x7f70bb76fbe0>",
14
- "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f70bb76fc70>",
15
- "_predict": "<function ActorCriticPolicy._predict at 0x7f70bb76fd00>",
16
- "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f70bb76fd90>",
17
- "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f70bb76fe20>",
18
- "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f70bb76feb0>",
19
  "__abstractmethods__": "frozenset()",
20
- "_abc_impl": "<_abc._abc_data object at 0x7f70bb76b2c0>"
21
  },
22
  "verbose": 1,
23
  "policy_kwargs": {
@@ -37,7 +37,7 @@
37
  "_num_timesteps_at_start": 0,
38
  "seed": null,
39
  "action_noise": null,
40
- "start_time": 1686601019810748245,
41
  "learning_rate": 0.00096,
42
  "tensorboard_log": null,
43
  "lr_schedule": {
@@ -46,7 +46,7 @@
46
  },
47
  "_last_obs": {
48
  ":type:": "<class 'numpy.ndarray'>",
49
- ":serialized:": "gAWVNQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJbAAQAAAAAAAEOQMD2ALgDAwVSfwHFLRT+w90M/kUuSPixYIT5OjUK+cZTTvvFcfL/ZP4a+AMC0P2ZOhb35olE/lfN6PTYUUz8j4aY/LRCjvRadNrxywVk/Evwjvrp8pr/EonY+sqAaPs1ymb9Ml+o+vUQIP4YNTz8bVDI/CYfvvwy2mr9wG46/ufQ5QCocEL83GE8/N/9JvznCXD8Em4a+x2YIQO8yQT/THsO/7Cl0PZIkh70mV9O/ngqIP1t8j75zA6Y+YRdrP0+LBz8GWlO/DTeFv30ImT5Fi1U/cK4LwL1ECD9WQp6/y9OSP0cK/r9Fj8W/m0g0P1ypc74KzyO/s4PrPoUUqb8ZVpe/5WATQIXOMD5RmpY/JD8FP7rLZb9IoQA/fqCSv7PllT/Phou+bM0QvjislL2hOsG+GPzzP2XTBEC0vAfAzXKZv3CuC8C9RAg/hg1PP6lT4T+LJOy/Gf6Rv4AfAkA2Mv49qn1jP2OF+z9i+/q/w5bHv9kbTUBT1+y+Jci6P4Q6sD88Zps+DWbyPkVHE0BgDJU/N3/qvn9EOD9QFui6f9ZQv4hpnTyOHEI/zduQPM1ymb9Ml+o+vUQIP1ZCnr+UjAVudW1weZSMBWR0eXBllJOUjAJmNJSJiIeUUpQoSwOMATyUTk5OSv////9K/////0sAdJRiSwRLHIaUjAFDlHSUUpQu"
50
  },
51
  "_last_episode_starts": {
52
  ":type:": "<class 'numpy.ndarray'>",
@@ -54,7 +54,7 @@
54
  },
55
  "_last_original_obs": {
56
  ":type:": "<class 'numpy.ndarray'>",
57
- ":serialized:": "gAWVNQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJbAAQAAAAAAAAAAAAAZoT22AACAPwAAAAAAAAAAAAAAAAAAAAAAAACA+dKAPQAAAABxu+O/AAAAABF2VbwAAAAAaTX2PwAAAAB3tOO9AAAAACTL+T8AAAAA3AGRvQAAAAAjePq/AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAUZiAtgAAgD8AAAAAAAAAAAAAAAAAAAAAAAAAgAG+nT0AAAAAFS7vvwAAAACC35+9AAAAAGKY9D8AAAAAIW2wvQAAAACeKPE/AAAAADeioL0AAAAAm/H/vwAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAB/u4rYAAIA/AAAAAAAAAAAAAAAAAAAAAAAAAICvbN09AAAAAHch7b8AAAAARa0LvgAAAAAVLuY/AAAAAIVbJb0AAAAA2kHsPwAAAACWEXE8AAAAAFJ4278AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAABebSe1AACAPwAAAAAAAAAAAAAAAAAAAAAAAACA0xkCvQAAAABWo+6/AAAAAIUMTz0AAAAAwQL6PwAAAACPwce8AAAAABZD2T8AAAAAz5+mPQAAAACzad+/AAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJmNJSJiIeUUpQoSwOMATyUTk5OSv////9K/////0sAdJRiSwRLHIaUjAFDlHSUUpQu"
58
  },
59
  "_episode_num": 0,
60
  "use_sde": true,
@@ -63,7 +63,7 @@
63
  "_stats_window_size": 100,
64
  "ep_info_buffer": {
65
  ":type:": "<class 'collections.deque'>",
66
- ":serialized:": "gAWVQwwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQJqnDqhUR4CMAWyUTegDjAF0lEdAsJVBEtuk13V9lChoBkdAVs7zpX6qKmgHS4xoCEdAsJW384xUN3V9lChoBkdAmhOj0QK8c2gHTegDaAhHQLCXnvK2a2F1fZQoaAZHQJ02qZgG8mNoB03oA2gIR0CwmZKhtcfOdX2UKGgGR0CbKNnRb8m8aAdN6ANoCEdAsJ2M/+sHSnV9lChoBkdAm4JOyRjjJmgHTegDaAhHQLCd/zu4PPN1fZQoaAZHQJjqDazu4PRoB03oA2gIR0CwoJK8g6ltdX2UKGgGR0CeHvYhMajvaAdN6ANoCEdAsKOWcurZJ3V9lChoBkdAnkPzSThYNmgHTegDaAhHQLCnd5vcafl1fZQoaAZHQJnU+dBjWkJoB03oA2gIR0Cwp+6jFhoedX2UKGgGR0Cex0hxYJVsaAdN6ANoCEdAsKnJTER8MXV9lChoBkdAnNFwSi/O+2gHTegDaAhHQLCrurQw9JV1fZQoaAZHQJ4gqIDYAbRoB03oA2gIR0CwrxfMSsbOdX2UKGgGR0Cb9AAyVObiaAdN6ANoCEdAsK/KctoSMHV9lChoBkdAlz/9CmdiD2gHTegDaAhHQLCymAYYR/V1fZQoaAZHQJ1x/fvWpZRoB03oA2gIR0CwtbRiXpnpdX2UKGgGR0Cb7Rf5k9U0aAdN6ANoCEdAsLkrYChexHV9lChoBkdAmu9uU+s5n2gHTegDaAhHQLC5o1q33Ht1fZQoaAZHQJkvB9gF5fNoB03oA2gIR0Cwu5A1NxlydX2UKGgGR0CbanHAymALaAdN6ANoCEdAsL10pc5bQnV9lChoBkdAmq/BdIGyHGgHTegDaAhHQLDBU4p+c6N1fZQoaAZHQJV4Q9GI9DBoB03oA2gIR0CwwgBScbzcdX2UKGgGR0CYT5g2ZRbbaAdN6ANoCEdAsMTlvJiiI3V9lChoBkdAl03vI0ZWJmgHTegDaAhHQLDHfeumrKh1fZQoaAZHQJgJmCDmKZVoB03oA2gIR0CwyuFvuPV/dX2UKGgGR0CbnKwaisXBaAdN6ANoCEdAsMtZm9QGfXV9lChoBkdAl5CiwKSgXmgHTegDaAhHQLDNOZn+Q2d1fZQoaAZHQJmzkIOYplVoB03oA2gIR0CwzyOTzND/dX2UKGgGR0CZhAY8+zMSaAdN6ANoCEdAsNNNf2K2rnV9lChoBkdAmL01rRBu42gHTegDaAhHQLDUEeI2wV11fZQoaAZHQJJ8Kh7E5yVoB03oA2gIR0Cw1wdoexOddX2UKGgGR0CRUjXvYvnKaAdN6ANoCEdAsNkl+NLlFXV9lChoBkdAm/aBzaK1omgHTegDaAhHQLDcivUz9CN1fZQoaAZHQJxHusNlRP5oB03oA2gIR0Cw3QLgCOm0dX2UKGgGR0CVYycynDR/aAdN6ANoCEdAsN72+6Ae73V9lChoBkdAltZk0m+j/WgHTegDaAhHQLDg+dXko4N1fZQoaAZHQIk5QChew9toB03oA2gIR0Cw5eL+kxh2dX2UKGgGR0CS0dA6dUbUaAdN6ANoCEdAsOahgtvn83V9lChoBkdAm/Q/PkaMrGgHTegDaAhHQLDpJXV9Wp91fZQoaAZHQJhqAL6UJOZoB03oA2gIR0Cw6xA5zYEodX2UKGgGR0CV63YOlO45aAdN6ANoCEdAsO5yQ2dd3XV9lChoBkdAlwBFFH8TBmgHTegDaAhHQLDu9aN+9al1fZQoaAZHQJyw3NKRMexoB03oA2gIR0Cw8NyyhSLqdX2UKGgGR0CbTyLn9vS/aAdN6ANoCEdAsPMJn+Q2dnV9lChoBkdAmRgizXz19WgHTegDaAhHQLD4OJUHY6J1fZQoaAZHQJs7kGHHmzVoB03oA2gIR0Cw+PyZnctYdX2UKGgGR0CbQC7mdRR/aAdN6ANoCEdAsPr+54GD+XV9lChoBkdAnIqYyGi5/mgHTegDaAhHQLD8+SeRPoF1fZQoaAZHQJjxnxBmf5FoB03oA2gIR0CxAF9zwMH9dX2UKGgGR0Cc93WY4Qz2aAdN6ANoCEdAsQDVyq+8G3V9lChoBkdAnH6g7tAs1GgHTegDaAhHQLECuNUOuq51fZQoaAZHQJd9yWrwOONoB03oA2gIR0CxBU13Qla9dX2UKGgGR0CYGtp1zQu3aAdN6ANoCEdAsQpOIvalDXV9lChoBkdAmsFrH2h7FGgHTegDaAhHQLEKxGhmGud1fZQoaAZHQJTTdiPQv6FoB03oA2gIR0CxDJqYJE6UdX2UKGgGR0Cc3iGc4HX3aAdN6ANoCEdAsQ6EfMfRu3V9lChoBkdAnnxfwuuie2gHTegDaAhHQLER6bzshPl1fZQoaAZHQJozHfl6qsFoB03oA2gIR0CxEmDrZ8KHdX2UKGgGR0CYOuIUJv5yaAdN6ANoCEdAsRRcT6BRRHV9lChoBkdAmVETq8lHBmgHTegDaAhHQLEXMjVQQ+V1fZQoaAZHQJmlcpMHryFoB03oA2gIR0CxG+956dDqdX2UKGgGR0CRoOnzxwyZaAdN6ANoCEdAsRxszguRLnV9lChoBkdAnHJ3fdhy82gHTegDaAhHQLEeVAoXsPd1fZQoaAZHQJBzas8xKxtoB03oA2gIR0CxIEndweeWdX2UKGgGR0Cb7/F6AvtdaAdN6ANoCEdAsSOoNXo1UHV9lChoBkdAjZqd1dPcjGgHTegDaAhHQLEkHyv9tMx1fZQoaAZHQJcR24SYgJVoB03oA2gIR0CxJo/lIVdpdX2UKGgGR0CZhpLt/nW8aAdN6ANoCEdAsSmUw22oenV9lChoBkdAmsNmXb/OuGgHTegDaAhHQLEtzAbyYol1fZQoaAZHQJncgIF/x2BoB03oA2gIR0CxLkhpL26DdX2UKGgGR0CdyKg/keZHaAdN6ANoCEdAsTBBd+ocaXV9lChoBkdAmix+Mhouf2gHTegDaAhHQLEyMbAUL2J1fZQoaAZHQJHqAOH31z1oB03oA2gIR0CxNaQhB7eEdX2UKGgGR0CU0leVLSNPaAdN6ANoCEdAsTZMfHPu5XV9lChoBkdAmb/ayB06o2gHTegDaAhHQLE5Mn3L3bp1fZQoaAZHQJnsu4+bExZoB03oA2gIR0CxPHRqwhW6dX2UKGgGR0Cc1Pwzch1UaAdN6ANoCEdAsT/5zhgmZ3V9lChoBkdAmTUlQIldC2gHTegDaAhHQLFAdzF+/g11fZQoaAZHQJ1g5yT6i0xoB03oA2gIR0CxQmRZU1htdX2UKGgGR0Ca1EP7el9CaAdN6ANoCEdAsURV38n/k3V9lChoBkdAoGKdNN8E3mgHTegDaAhHQLFIFVwxWT51fZQoaAZHQJ09cSyt3fRoB03oA2gIR0CxSMBi1AqvdX2UKGgGR0CeAAEP1+RYaAdN6ANoCEdAsUvCeWfK6nV9lChoBkdAksiz8HfMwGgHTegDaAhHQLFOadHlOoJ1fZQoaAZHQJ2tbtsvZh9oB03oA2gIR0CxUcpRfnfVdX2UKGgGR0CYy4h4dIXkaAdN6ANoCEdAsVJBMfzSTnV9lChoBkdAnObF1nuiOGgHTegDaAhHQLFUJgCwKSh1fZQoaAZHQJwpiN83MpxoB03oA2gIR0CxVhKkl/pddX2UKGgGR0Cb5OzQNTcZaAdN6ANoCEdAsVo0b4rSVnV9lChoBkdAnbZRy8zyjGgHTegDaAhHQLFa65v99+h1fZQoaAZHQJab4X531SRoB03oA2gIR0CxXgK3NLUTdX2UKGgGR0CaPPoa1kUcaAdN6ANoCEdAsWA0/B3zMHV9lChoBkdAm0lrR8c+7mgHTegDaAhHQLFjppHI6sB1fZQoaAZHQJtWS4I8hcJoB03oA2gIR0CxZByPZIxydX2UKGgGR0CYf4M5wOvuaAdN6ANoCEdAsWX+T/yXlnV9lChoBkdAk2oWeYlY2mgHTegDaAhHQLFoBBRhttR1fZQoaAZHQJlJyT1TR6ZoB03oA2gIR0CxbNq1XvH+dX2UKGgGR0CalrymQ8wIaAdN6ANoCEdAsW2WXjU/fXV9lChoBkdAkpotj5Kvm2gHTegDaAhHQLFwGA3T/hl1fZQoaAZHQJNO9dUsFt9oB03oA2gIR0CxcgvAsTWYdWUu"
67
  },
68
  "ep_success_buffer": {
69
  ":type:": "<class 'collections.deque'>",
 
4
  ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
5
  "__module__": "stable_baselines3.common.policies",
6
  "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
7
+ "__init__": "<function ActorCriticPolicy.__init__ at 0x7fa2e2dd7370>",
8
+ "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7fa2e2dd7400>",
9
+ "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7fa2e2dd7490>",
10
+ "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7fa2e2dd7520>",
11
+ "_build": "<function ActorCriticPolicy._build at 0x7fa2e2dd75b0>",
12
+ "forward": "<function ActorCriticPolicy.forward at 0x7fa2e2dd7640>",
13
+ "extract_features": "<function ActorCriticPolicy.extract_features at 0x7fa2e2dd76d0>",
14
+ "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7fa2e2dd7760>",
15
+ "_predict": "<function ActorCriticPolicy._predict at 0x7fa2e2dd77f0>",
16
+ "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7fa2e2dd7880>",
17
+ "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7fa2e2dd7910>",
18
+ "predict_values": "<function ActorCriticPolicy.predict_values at 0x7fa2e2dd79a0>",
19
  "__abstractmethods__": "frozenset()",
20
+ "_abc_impl": "<_abc._abc_data object at 0x7fa2e2ddd8c0>"
21
  },
22
  "verbose": 1,
23
  "policy_kwargs": {
 
37
  "_num_timesteps_at_start": 0,
38
  "seed": null,
39
  "action_noise": null,
40
+ "start_time": 1686824918660744963,
41
  "learning_rate": 0.00096,
42
  "tensorboard_log": null,
43
  "lr_schedule": {
 
46
  },
47
  "_last_obs": {
48
  ":type:": "<class 'numpy.ndarray'>",
49
+ ":serialized:": "gAWVNQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJbAAQAAAAAAAHEKjL8MVTK/TAroPo7KsT1Gr7++wqUTPyDwmb5oht0+ZSQ9P9Zvkr0otxW/LyovPoLHGz+MD7G/9JQxP198OrvWg3c/yn0/v8UnAz6Rhhs+ZJdLv68hbT0hQRW/SzC8vjxJgT+6ltq/w0XlPsn/jb+K0WO/eh5BviHHDD+uY5A9QMAuvjn4xj5R9Qi/VOKuPlMe/D4y0Ys/2bYWv+br4z3WqfQ+N0IxPsWDMj9DEWm8PNSoPx+FqD4MMRu+A8baPZlgTr+h4QU+JkFDvQl+hL48SYE/NegVP8NF5T4Nw2Y/PMgUv7fflL5t+ws/DLXCP+F62D+tyzA9g02lvTa2iL7fHBw/Ojt3PulxSb8qSa4+KhKCP0FaMD/lWTI/GcLeu677oj8jmge/P4Q0PqIfu75sAUy/CLR2PVr0Wrr7prw7FHR9vzXoFT/DReU+DcNmP0Apdb+9d4s+NZPsPmnalz8zqoe/RDEZv33ifb4WsV4+2ZoyP4pIlL+vdRy/WJwBwFMzn7/vDnk9ARznPnVUbz8A3+K+pM4YPVXj0z6LLSvABnbhvuRGDr/JsT2+bxO6PjxJgT+6ltq/w0XlPsn/jb+UjAVudW1weZSMBWR0eXBllJOUjAJmNJSJiIeUUpQoSwOMATyUTk5OSv////9K/////0sAdJRiSwRLHIaUjAFDlHSUUpQu"
50
  },
51
  "_last_episode_starts": {
52
  ":type:": "<class 'numpy.ndarray'>",
 
54
  },
55
  "_last_original_obs": {
56
  ":type:": "<class 'numpy.ndarray'>",
57
+ ":serialized:": "gAWVNQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJbAAQAAAAAAAAAAAACTmFM2AACAPwAAAAAAAAAAAAAAAAAAAAAAAACA0Zh2OwAAAAA1W92/AAAAAEkHOT0AAAAAByXgPwAAAABwENw7AAAAALKfAEAAAAAAhe22vQAAAADqLum/AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAqYodtwAAgD8AAAAAAAAAAAAAAAAAAAAAAAAAgMipDj4AAAAA60LnvwAAAADqRL29AAAAAJ8f/T8AAAAAMvgOvgAAAADk8/k/AAAAAByzDz0AAAAAT+PfvwAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAABlztbYAAIA/AAAAAAAAAAAAAAAAAAAAAAAAAIAsoPs9AAAAAEO18r8AAAAA5RXDvQAAAABfbOw/AAAAAICkTT0AAAAAr2zcPwAAAAA5ZIs9AAAAALXU3L8AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAABkQ3c2AACAPwAAAAAAAAAAAAAAAAAAAAAAAACAaHn8vQAAAAAv5f2/AAAAAI7Q5z0AAAAAvd/ePwAAAADBj869AAAAALkF2z8AAAAA0XSMvAAAAADB5d+/AAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJmNJSJiIeUUpQoSwOMATyUTk5OSv////9K/////0sAdJRiSwRLHIaUjAFDlHSUUpQu"
58
  },
59
  "_episode_num": 0,
60
  "use_sde": true,
 
63
  "_stats_window_size": 100,
64
  "ep_info_buffer": {
65
  ":type:": "<class 'collections.deque'>",
66
+ ":serialized:": "gAWVRAwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQJKvSv0RODeMAWyUTegDjAF0lEdAq4zzaufVZ3V9lChoBkdAl+z2IKtxMmgHTegDaAhHQKuXOSg5BC51fZQoaAZHQJt/XCJoCdVoB03oA2gIR0CrmRYxDb8FdX2UKGgGR0CarJlijL0SaAdN6ANoCEdAq5k/dfsu4HV9lChoBkdAmunPttygf2gHTegDaAhHQKudqKrJbMZ1fZQoaAZHQJrEu89Oh01oB03oA2gIR0CrpZqlgtvodX2UKGgGR0CVp55vLowFaAdN6ANoCEdAq6bQ4MnZ03V9lChoBkdAmUlhoZhrnGgHTegDaAhHQKum6pDu0C11fZQoaAZHQJoV6BshxHZoB03oA2gIR0CrqlhTGYKIdX2UKGgGR0CXBbE2YOUdaAdN6ANoCEdAq7MzB68g6nV9lChoBkdAmfqkSElE7WgHTegDaAhHQKu1DlAeJYV1fZQoaAZHQJnBaS4e9zxoB03oA2gIR0CrtTgHu7YkdX2UKGgGR0CWoZ5qubI+aAdN6ANoCEdAq7q2RmseXHV9lChoBkdAhEi4wIt16mgHTegDaAhHQKvDMwqy4Wl1fZQoaAZHQIw8Pl0YCQtoB03oA2gIR0CrxHBHLA58dX2UKGgGR0CY5wi9qUNbaAdN6ANoCEdAq8SJAprk83V9lChoBkdAmIiGphnanWgHTegDaAhHQKvH4RkEs8R1fZQoaAZHQJNf77zkIX1oB03oA2gIR0Crz7xXnyNGdX2UKGgGR0CYm+rq+rU9aAdN6ANoCEdAq9FiFdszmHV9lChoBkdAmUkUEC/47GgHTegDaAhHQKvRhhvR7Z51fZQoaAZHQJJ3rzAeq71oB03oA2gIR0Cr1rMwtapxdX2UKGgGR0CU85osZpBYaAdN6ANoCEdAq+DO10DEFXV9lChoBkdAlBELNfPX1GgHTegDaAhHQKviOTq0MPV1fZQoaAZHQJHBoj5bhWJoB03oA2gIR0Cr4mK2SdOJdX2UKGgGR0CVJZhYvFm4aAdN6ANoCEdAq+eg482aUnV9lChoBkdAlfCQkxASnWgHTegDaAhHQKvyv38n/kx1fZQoaAZHQJ46ngLqlgtoB03oA2gIR0Cr9I7xEv0zdX2UKGgGR0CUQ3W43FUAaAdN6ANoCEdAq/Sznkkrw3V9lChoBkdAlQ2ES26TXGgHTegDaAhHQKv6CkpI+W51fZQoaAZHQJQIbqcEvCdoB03oA2gIR0CsAt/+jua4dX2UKGgGR0CX5SklNUOvaAdN6ANoCEdArAQ2AoXsPnV9lChoBkdAlJbamoBJZmgHTegDaAhHQKwEUF/QSjB1fZQoaAZHQJcj78IiTt9oB03oA2gIR0CsB8Aood+5dX2UKGgGR0Cd2Rr433pOaAdN6ANoCEdArBBYvcrRSnV9lChoBkdAmJNuRxLkCGgHTegDaAhHQKwSUgMc6vJ1fZQoaAZHQJcLyliz9jxoB03oA2gIR0CsEnd+w1R+dX2UKGgGR0CXnBvZyuIRaAdN6ANoCEdArBfpaC+UQnV9lChoBkdAmFL+JpFkQWgHTegDaAhHQKwh9bfP5YZ1fZQoaAZHQJHW6yMUAT9oB03oA2gIR0CsI0VwHZ9NdX2UKGgGR0CWcOSjxkNGaAdN6ANoCEdArCNhmdy1eHV9lChoBkdAlO1S1uzhP2gHTegDaAhHQKwnAC1Z1V51fZQoaAZHQJEoHzxwyZdoB03oA2gIR0CsL7VaW5YpdX2UKGgGR0CWG21rZamoaAdN6ANoCEdArDFFIVdonXV9lChoBkdAjjtCQLeANGgHTegDaAhHQKwxalgMMJB1fZQoaAZHQJXwFhG6PKdoB03oA2gIR0CsNzXAM2FWdX2UKGgGR0CaZmLHuJDWaAdN6ANoCEdArEGZ0CA+ZHV9lChoBkdAlHkrVvuPWGgHTegDaAhHQKxC2lruYyB1fZQoaAZHQJb2iPV/c35oB03oA2gIR0CsQvVkUbkwdX2UKGgGR0CZwYYmLLpzaAdN6ANoCEdArEZ3Dm8ujHV9lChoBkdAlcB9ic5Ke2gHTegDaAhHQKxOndLxqfx1fZQoaAZHQJm2/Uz9CNVoB03oA2gIR0CsT9smOU+tdX2UKGgGR0CWFnhnJ1aGaAdN6ANoCEdArE/1U83dbnV9lChoBkdAl1U/W+XZ5GgHTegDaAhHQKxUsavRqoJ1fZQoaAZHQJV6Eg2ZRbdoB03oA2gIR0CsYFJZ4fOldX2UKGgGR0CaJiRh+fAcaAdN6ANoCEdArGGnhsImgXV9lChoBkdAl0d+UhV2imgHTegDaAhHQKxhwzGgi/x1fZQoaAZHQJUxk274BWBoB03oA2gIR0CsZXPKU3XJdX2UKGgGR0CX6z2OQyRCaAdN6ANoCEdArG4aJCSid3V9lChoBkdAmehgRf4REmgHTegDaAhHQKxvbD/lyR11fZQoaAZHQJburLyMDOloB03oA2gIR0Csb4dgfEGadX2UKGgGR0CYrEc6NlyzaAdN6ANoCEdArHPw593KS3V9lChoBkdAm57xDw6QvGgHTegDaAhHQKx/3BMSK3x1fZQoaAZHQJniGIxgy/NoB03oA2gIR0CsgR3EIgNgdX2UKGgGR0CY2RUxVQyiaAdN6ANoCEdArIE6Qq7ROXV9lChoBkdAnHpIrSVnmWgHTegDaAhHQKyErm5lOGl1fZQoaAZHQJpyfV6NVBFoB03oA2gIR0CsjKFs54nndX2UKGgGR0Cb6sAS39aVaAdN6ANoCEdArI3WluWKM3V9lChoBkdAnDtwow22omgHTegDaAhHQKyN8Vzp5eJ1fZQoaAZHQJs+fAdn005oB03oA2gIR0CskWVbzK9xdX2UKGgGR0CbHnKfnOjZaAdN6ANoCEdArJ2g3o9s8HV9lChoBkdAndAEJv5xi2gHTegDaAhHQKye+cWCVbB1fZQoaAZHQJyIYmv4dp9oB03oA2gIR0CsnxIouwotdX2UKGgGR0CbxTWu5jH5aAdN6ANoCEdArKJ+aQV9GHV9lChoBkdAm7O+/cnE22gHTegDaAhHQKyqhh/Aj6h1fZQoaAZHQJP1cz67/XJoB03oA2gIR0Csq79s7+1jdX2UKGgGR0Cc52gPmPo3aAdN6ANoCEdArKvYHRkVe3V9lChoBkdAmp8ryhBZ6mgHTegDaAhHQKyvPvPTodN1fZQoaAZHQJyYua+evp1oB03oA2gIR0Csuc30wrUcdX2UKGgGR0Cb9/BJqZc+aAdN6ANoCEdArLu6UgSvknV9lChoBkdAmEdO0G/vfGgHTegDaAhHQKy74K/mDDl1fZQoaAZHQJt/qitaIN5oB03oA2gIR0CswAAU+LWJdX2UKGgGR0CZ+3O2iL2paAdN6ANoCEdArMfhPIn0CnV9lChoBkdAlXu5PZZjhGgHTegDaAhHQKzJGXwb2lF1fZQoaAZHQJoL/VpbliloB03oA2gIR0CsyTKs2eg+dX2UKGgGR0CRhlEC/47BaAdN6ANoCEdArMySlabF0nV9lChoBkdAmmxfhhpg1GgHTegDaAhHQKzWDHxz7uV1fZQoaAZHQJjUmlDWsiloB03oA2gIR0Cs1/qgIyCWdX2UKGgGR0CXwYLkCFK1aAdN6ANoCEdArNgm/nGKh3V9lChoBkdAk5MiXlbNbGgHTegDaAhHQKzdj9G7SRd1fZQoaAZHQJvrdYeT3ZhoB03oA2gIR0Cs5bczZYgadX2UKGgGR0CaitvCMxXXaAdN6ANoCEdArObuhbnoxHV9lChoBkdAm3U6hUR3/2gHTegDaAhHQKznDNs3yZt1fZQoaAZHQJc6oOoYNy5oB03oA2gIR0Cs6nRPGhmHdX2UKGgGR0CTqsG8EmpmaAdN6ANoCEdArPLOLrHEM3V9lChoBkdAhdqte+mFamgHTegDaAhHQKz0kW9lEql1fZQoaAZHQJKtl0GNaQpoB03oA2gIR0Cs9LraM72ddX2UKGgGR0CYcWmwJPZaaAdN6ANoCEdArPngTqSowXV9lChoBkdAmuDF7x/d7GgHTegDaAhHQK0DVqzqrzZ1fZQoaAZHQJn7rblA/s5oB03oA2gIR0CtBIiHZbpvdX2UKGgGR0CZ50miQDFIaAdN6ANoCEdArQSj8P4EfXVlLg=="
67
  },
68
  "ep_success_buffer": {
69
  ":type:": "<class 'collections.deque'>",
a2c-AntBulletEnv-v0/policy.optimizer.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:04b88312758138febc2d6e2f9bb1f30dca06bd28442849933e5b9c88f200ff18
3
- size 56062
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e1a4f103bc31cbda26fb90b5eb6f22ba89d17d98b8ed1d524dc0ffc767de0714
3
+ size 56190
a2c-AntBulletEnv-v0/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c4068ee0294a07995972dcea098447ef3a4cdbae31c4de8e698f2a4288173189
3
- size 56766
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ca9162805f7e0519c4851c738e77ed6df1bf9b23f5e8d272ea49dac79113ea25
3
+ size 56894
a2c-AntBulletEnv-v0/system_info.txt CHANGED
@@ -2,6 +2,6 @@
2
  - Python: 3.10.12
3
  - Stable-Baselines3: 1.8.0
4
  - PyTorch: 2.0.1+cu118
5
- - GPU Enabled: False
6
  - Numpy: 1.22.4
7
  - Gym: 0.21.0
 
2
  - Python: 3.10.12
3
  - Stable-Baselines3: 1.8.0
4
  - PyTorch: 2.0.1+cu118
5
+ - GPU Enabled: True
6
  - Numpy: 1.22.4
7
  - Gym: 0.21.0
config.json CHANGED
@@ -1 +1 @@
1
- {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7f70bb76f880>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f70bb76f910>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f70bb76f9a0>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f70bb76fa30>", "_build": "<function ActorCriticPolicy._build at 0x7f70bb76fac0>", "forward": "<function ActorCriticPolicy.forward at 0x7f70bb76fb50>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x7f70bb76fbe0>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f70bb76fc70>", "_predict": "<function ActorCriticPolicy._predict at 0x7f70bb76fd00>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f70bb76fd90>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f70bb76fe20>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f70bb76feb0>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7f70bb76b2c0>"}, "verbose": 1, "policy_kwargs": {":type:": "<class 'dict'>", ":serialized:": "gAWVowAAAAAAAAB9lCiMDGxvZ19zdGRfaW5pdJRK/v///4wKb3J0aG9faW5pdJSJjA9vcHRpbWl6ZXJfY2xhc3OUjBN0b3JjaC5vcHRpbS5ybXNwcm9wlIwHUk1TcHJvcJSTlIwQb3B0aW1pemVyX2t3YXJnc5R9lCiMBWFscGhhlEc/764UeuFHrowDZXBzlEc+5Pi1iONo8YwMd2VpZ2h0X2RlY2F5lEsAdXUu", "log_std_init": -2, "ortho_init": false, "optimizer_class": "<class 'torch.optim.rmsprop.RMSprop'>", "optimizer_kwargs": {"alpha": 0.99, "eps": 1e-05, "weight_decay": 0}}, "num_timesteps": 2000000, "_total_timesteps": 2000000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1686601019810748245, "learning_rate": 0.00096, "tensorboard_log": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuCQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz9PdRBNVR1phZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVNQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJbAAQAAAAAAAEOQMD2ALgDAwVSfwHFLRT+w90M/kUuSPixYIT5OjUK+cZTTvvFcfL/ZP4a+AMC0P2ZOhb35olE/lfN6PTYUUz8j4aY/LRCjvRadNrxywVk/Evwjvrp8pr/EonY+sqAaPs1ymb9Ml+o+vUQIP4YNTz8bVDI/CYfvvwy2mr9wG46/ufQ5QCocEL83GE8/N/9JvznCXD8Em4a+x2YIQO8yQT/THsO/7Cl0PZIkh70mV9O/ngqIP1t8j75zA6Y+YRdrP0+LBz8GWlO/DTeFv30ImT5Fi1U/cK4LwL1ECD9WQp6/y9OSP0cK/r9Fj8W/m0g0P1ypc74KzyO/s4PrPoUUqb8ZVpe/5WATQIXOMD5RmpY/JD8FP7rLZb9IoQA/fqCSv7PllT/Phou+bM0QvjislL2hOsG+GPzzP2XTBEC0vAfAzXKZv3CuC8C9RAg/hg1PP6lT4T+LJOy/Gf6Rv4AfAkA2Mv49qn1jP2OF+z9i+/q/w5bHv9kbTUBT1+y+Jci6P4Q6sD88Zps+DWbyPkVHE0BgDJU/N3/qvn9EOD9QFui6f9ZQv4hpnTyOHEI/zduQPM1ymb9Ml+o+vUQIP1ZCnr+UjAVudW1weZSMBWR0eXBllJOUjAJmNJSJiIeUUpQoSwOMATyUTk5OSv////9K/////0sAdJRiSwRLHIaUjAFDlHSUUpQu"}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYEAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSwSFlIwBQ5R0lFKULg=="}, "_last_original_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVNQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJbAAQAAAAAAAAAAAAAZoT22AACAPwAAAAAAAAAAAAAAAAAAAAAAAACA+dKAPQAAAABxu+O/AAAAABF2VbwAAAAAaTX2PwAAAAB3tOO9AAAAACTL+T8AAAAA3AGRvQAAAAAjePq/AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAUZiAtgAAgD8AAAAAAAAAAAAAAAAAAAAAAAAAgAG+nT0AAAAAFS7vvwAAAACC35+9AAAAAGKY9D8AAAAAIW2wvQAAAACeKPE/AAAAADeioL0AAAAAm/H/vwAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAB/u4rYAAIA/AAAAAAAAAAAAAAAAAAAAAAAAAICvbN09AAAAAHch7b8AAAAARa0LvgAAAAAVLuY/AAAAAIVbJb0AAAAA2kHsPwAAAACWEXE8AAAAAFJ4278AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAABebSe1AACAPwAAAAAAAAAAAAAAAAAAAAAAAACA0xkCvQAAAABWo+6/AAAAAIUMTz0AAAAAwQL6PwAAAACPwce8AAAAABZD2T8AAAAAz5+mPQAAAACzad+/AAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJmNJSJiIeUUpQoSwOMATyUTk5OSv////9K/////0sAdJRiSwRLHIaUjAFDlHSUUpQu"}, "_episode_num": 0, "use_sde": true, "sde_sample_freq": -1, "_current_progress_remaining": 0.0, "_stats_window_size": 100, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVQwwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQJqnDqhUR4CMAWyUTegDjAF0lEdAsJVBEtuk13V9lChoBkdAVs7zpX6qKmgHS4xoCEdAsJW384xUN3V9lChoBkdAmhOj0QK8c2gHTegDaAhHQLCXnvK2a2F1fZQoaAZHQJ02qZgG8mNoB03oA2gIR0CwmZKhtcfOdX2UKGgGR0CbKNnRb8m8aAdN6ANoCEdAsJ2M/+sHSnV9lChoBkdAm4JOyRjjJmgHTegDaAhHQLCd/zu4PPN1fZQoaAZHQJjqDazu4PRoB03oA2gIR0CwoJK8g6ltdX2UKGgGR0CeHvYhMajvaAdN6ANoCEdAsKOWcurZJ3V9lChoBkdAnkPzSThYNmgHTegDaAhHQLCnd5vcafl1fZQoaAZHQJnU+dBjWkJoB03oA2gIR0Cwp+6jFhoedX2UKGgGR0Cex0hxYJVsaAdN6ANoCEdAsKnJTER8MXV9lChoBkdAnNFwSi/O+2gHTegDaAhHQLCrurQw9JV1fZQoaAZHQJ4gqIDYAbRoB03oA2gIR0CwrxfMSsbOdX2UKGgGR0Cb9AAyVObiaAdN6ANoCEdAsK/KctoSMHV9lChoBkdAlz/9CmdiD2gHTegDaAhHQLCymAYYR/V1fZQoaAZHQJ1x/fvWpZRoB03oA2gIR0CwtbRiXpnpdX2UKGgGR0Cb7Rf5k9U0aAdN6ANoCEdAsLkrYChexHV9lChoBkdAmu9uU+s5n2gHTegDaAhHQLC5o1q33Ht1fZQoaAZHQJkvB9gF5fNoB03oA2gIR0Cwu5A1NxlydX2UKGgGR0CbanHAymALaAdN6ANoCEdAsL10pc5bQnV9lChoBkdAmq/BdIGyHGgHTegDaAhHQLDBU4p+c6N1fZQoaAZHQJV4Q9GI9DBoB03oA2gIR0CwwgBScbzcdX2UKGgGR0CYT5g2ZRbbaAdN6ANoCEdAsMTlvJiiI3V9lChoBkdAl03vI0ZWJmgHTegDaAhHQLDHfeumrKh1fZQoaAZHQJgJmCDmKZVoB03oA2gIR0CwyuFvuPV/dX2UKGgGR0CbnKwaisXBaAdN6ANoCEdAsMtZm9QGfXV9lChoBkdAl5CiwKSgXmgHTegDaAhHQLDNOZn+Q2d1fZQoaAZHQJmzkIOYplVoB03oA2gIR0CwzyOTzND/dX2UKGgGR0CZhAY8+zMSaAdN6ANoCEdAsNNNf2K2rnV9lChoBkdAmL01rRBu42gHTegDaAhHQLDUEeI2wV11fZQoaAZHQJJ8Kh7E5yVoB03oA2gIR0Cw1wdoexOddX2UKGgGR0CRUjXvYvnKaAdN6ANoCEdAsNkl+NLlFXV9lChoBkdAm/aBzaK1omgHTegDaAhHQLDcivUz9CN1fZQoaAZHQJxHusNlRP5oB03oA2gIR0Cw3QLgCOm0dX2UKGgGR0CVYycynDR/aAdN6ANoCEdAsN72+6Ae73V9lChoBkdAltZk0m+j/WgHTegDaAhHQLDg+dXko4N1fZQoaAZHQIk5QChew9toB03oA2gIR0Cw5eL+kxh2dX2UKGgGR0CS0dA6dUbUaAdN6ANoCEdAsOahgtvn83V9lChoBkdAm/Q/PkaMrGgHTegDaAhHQLDpJXV9Wp91fZQoaAZHQJhqAL6UJOZoB03oA2gIR0Cw6xA5zYEodX2UKGgGR0CV63YOlO45aAdN6ANoCEdAsO5yQ2dd3XV9lChoBkdAlwBFFH8TBmgHTegDaAhHQLDu9aN+9al1fZQoaAZHQJyw3NKRMexoB03oA2gIR0Cw8NyyhSLqdX2UKGgGR0CbTyLn9vS/aAdN6ANoCEdAsPMJn+Q2dnV9lChoBkdAmRgizXz19WgHTegDaAhHQLD4OJUHY6J1fZQoaAZHQJs7kGHHmzVoB03oA2gIR0Cw+PyZnctYdX2UKGgGR0CbQC7mdRR/aAdN6ANoCEdAsPr+54GD+XV9lChoBkdAnIqYyGi5/mgHTegDaAhHQLD8+SeRPoF1fZQoaAZHQJjxnxBmf5FoB03oA2gIR0CxAF9zwMH9dX2UKGgGR0Cc93WY4Qz2aAdN6ANoCEdAsQDVyq+8G3V9lChoBkdAnH6g7tAs1GgHTegDaAhHQLECuNUOuq51fZQoaAZHQJd9yWrwOONoB03oA2gIR0CxBU13Qla9dX2UKGgGR0CYGtp1zQu3aAdN6ANoCEdAsQpOIvalDXV9lChoBkdAmsFrH2h7FGgHTegDaAhHQLEKxGhmGud1fZQoaAZHQJTTdiPQv6FoB03oA2gIR0CxDJqYJE6UdX2UKGgGR0Cc3iGc4HX3aAdN6ANoCEdAsQ6EfMfRu3V9lChoBkdAnnxfwuuie2gHTegDaAhHQLER6bzshPl1fZQoaAZHQJozHfl6qsFoB03oA2gIR0CxEmDrZ8KHdX2UKGgGR0CYOuIUJv5yaAdN6ANoCEdAsRRcT6BRRHV9lChoBkdAmVETq8lHBmgHTegDaAhHQLEXMjVQQ+V1fZQoaAZHQJmlcpMHryFoB03oA2gIR0CxG+956dDqdX2UKGgGR0CRoOnzxwyZaAdN6ANoCEdAsRxszguRLnV9lChoBkdAnHJ3fdhy82gHTegDaAhHQLEeVAoXsPd1fZQoaAZHQJBzas8xKxtoB03oA2gIR0CxIEndweeWdX2UKGgGR0Cb7/F6AvtdaAdN6ANoCEdAsSOoNXo1UHV9lChoBkdAjZqd1dPcjGgHTegDaAhHQLEkHyv9tMx1fZQoaAZHQJcR24SYgJVoB03oA2gIR0CxJo/lIVdpdX2UKGgGR0CZhpLt/nW8aAdN6ANoCEdAsSmUw22oenV9lChoBkdAmsNmXb/OuGgHTegDaAhHQLEtzAbyYol1fZQoaAZHQJncgIF/x2BoB03oA2gIR0CxLkhpL26DdX2UKGgGR0CdyKg/keZHaAdN6ANoCEdAsTBBd+ocaXV9lChoBkdAmix+Mhouf2gHTegDaAhHQLEyMbAUL2J1fZQoaAZHQJHqAOH31z1oB03oA2gIR0CxNaQhB7eEdX2UKGgGR0CU0leVLSNPaAdN6ANoCEdAsTZMfHPu5XV9lChoBkdAmb/ayB06o2gHTegDaAhHQLE5Mn3L3bp1fZQoaAZHQJnsu4+bExZoB03oA2gIR0CxPHRqwhW6dX2UKGgGR0Cc1Pwzch1UaAdN6ANoCEdAsT/5zhgmZ3V9lChoBkdAmTUlQIldC2gHTegDaAhHQLFAdzF+/g11fZQoaAZHQJ1g5yT6i0xoB03oA2gIR0CxQmRZU1htdX2UKGgGR0Ca1EP7el9CaAdN6ANoCEdAsURV38n/k3V9lChoBkdAoGKdNN8E3mgHTegDaAhHQLFIFVwxWT51fZQoaAZHQJ09cSyt3fRoB03oA2gIR0CxSMBi1AqvdX2UKGgGR0CeAAEP1+RYaAdN6ANoCEdAsUvCeWfK6nV9lChoBkdAksiz8HfMwGgHTegDaAhHQLFOadHlOoJ1fZQoaAZHQJ2tbtsvZh9oB03oA2gIR0CxUcpRfnfVdX2UKGgGR0CYy4h4dIXkaAdN6ANoCEdAsVJBMfzSTnV9lChoBkdAnObF1nuiOGgHTegDaAhHQLFUJgCwKSh1fZQoaAZHQJwpiN83MpxoB03oA2gIR0CxVhKkl/pddX2UKGgGR0Cb5OzQNTcZaAdN6ANoCEdAsVo0b4rSVnV9lChoBkdAnbZRy8zyjGgHTegDaAhHQLFa65v99+h1fZQoaAZHQJab4X531SRoB03oA2gIR0CxXgK3NLUTdX2UKGgGR0CaPPoa1kUcaAdN6ANoCEdAsWA0/B3zMHV9lChoBkdAm0lrR8c+7mgHTegDaAhHQLFjppHI6sB1fZQoaAZHQJtWS4I8hcJoB03oA2gIR0CxZByPZIxydX2UKGgGR0CYf4M5wOvuaAdN6ANoCEdAsWX+T/yXlnV9lChoBkdAk2oWeYlY2mgHTegDaAhHQLFoBBRhttR1fZQoaAZHQJlJyT1TR6ZoB03oA2gIR0CxbNq1XvH+dX2UKGgGR0CalrymQ8wIaAdN6ANoCEdAsW2WXjU/fXV9lChoBkdAkpotj5Kvm2gHTegDaAhHQLFwGA3T/hl1fZQoaAZHQJNO9dUsFt9oB03oA2gIR0CxcgvAsTWYdWUu"}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 62500, "n_steps": 8, "gamma": 0.99, "gae_lambda": 0.9, "ent_coef": 0.0, "vf_coef": 0.4, "max_grad_norm": 0.5, "normalize_advantage": false, "observation_space": {":type:": "<class 'gym.spaces.box.Box'>", ":serialized:": "gAWVbQIAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLHIWUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWcAAAAAAAAAAAAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/lGgLSxyFlIwBQ5R0lFKUjARoaWdolGgTKJZwAAAAAAAAAAAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH+UaAtLHIWUaBZ0lFKUjA1ib3VuZGVkX2JlbG93lGgTKJYcAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUaAiMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLHIWUaBZ0lFKUjA1ib3VuZGVkX2Fib3ZllGgTKJYcAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUaCJLHIWUaBZ0lFKUjApfbnBfcmFuZG9tlE51Yi4=", "dtype": "float32", "_shape": [28], "low": "[-inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf\n -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf]", "high": "[inf inf inf inf inf inf inf inf inf inf inf inf inf inf inf inf inf inf\n inf inf inf inf inf inf inf inf inf inf]", "bounded_below": "[False False False False False False False False False False False False\n False False False False False False False False False False False False\n False False False False]", "bounded_above": "[False False False False False False False False False False False False\n False False False False False False False False False False False False\n False False False False]", "_np_random": null}, "action_space": {":type:": "<class 'gym.spaces.box.Box'>", ":serialized:": "gAWVpQEAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLCIWUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWIAAAAAAAAAAAAIC/AACAvwAAgL8AAIC/AACAvwAAgL8AAIC/AACAv5RoC0sIhZSMAUOUdJRSlIwEaGlnaJRoEyiWIAAAAAAAAAAAAIA/AACAPwAAgD8AAIA/AACAPwAAgD8AAIA/AACAP5RoC0sIhZRoFnSUUpSMDWJvdW5kZWRfYmVsb3eUaBMolggAAAAAAAAAAQEBAQEBAQGUaAiMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLCIWUaBZ0lFKUjA1ib3VuZGVkX2Fib3ZllGgTKJYIAAAAAAAAAAEBAQEBAQEBlGgiSwiFlGgWdJRSlIwKX25wX3JhbmRvbZROdWIu", "dtype": "float32", "_shape": [8], "low": "[-1. -1. -1. -1. -1. -1. -1. -1.]", "high": "[1. 1. 1. 1. 1. 1. 1. 1.]", "bounded_below": "[ True True True True True True True True]", "bounded_above": "[ True True True True True True True True]", "_np_random": null}, "n_envs": 4, "system_info": {"OS": "Linux-5.15.107+-x86_64-with-glibc2.31 # 1 SMP Sat Apr 29 09:15:28 UTC 2023", "Python": "3.10.12", "Stable-Baselines3": "1.8.0", "PyTorch": "2.0.1+cu118", "GPU Enabled": "False", "Numpy": "1.22.4", "Gym": "0.21.0"}}
 
1
+ {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7fa2e2dd7370>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7fa2e2dd7400>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7fa2e2dd7490>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7fa2e2dd7520>", "_build": "<function ActorCriticPolicy._build at 0x7fa2e2dd75b0>", "forward": "<function ActorCriticPolicy.forward at 0x7fa2e2dd7640>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x7fa2e2dd76d0>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7fa2e2dd7760>", "_predict": "<function ActorCriticPolicy._predict at 0x7fa2e2dd77f0>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7fa2e2dd7880>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7fa2e2dd7910>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7fa2e2dd79a0>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7fa2e2ddd8c0>"}, "verbose": 1, "policy_kwargs": {":type:": "<class 'dict'>", ":serialized:": "gAWVowAAAAAAAAB9lCiMDGxvZ19zdGRfaW5pdJRK/v///4wKb3J0aG9faW5pdJSJjA9vcHRpbWl6ZXJfY2xhc3OUjBN0b3JjaC5vcHRpbS5ybXNwcm9wlIwHUk1TcHJvcJSTlIwQb3B0aW1pemVyX2t3YXJnc5R9lCiMBWFscGhhlEc/764UeuFHrowDZXBzlEc+5Pi1iONo8YwMd2VpZ2h0X2RlY2F5lEsAdXUu", "log_std_init": -2, "ortho_init": false, "optimizer_class": "<class 'torch.optim.rmsprop.RMSprop'>", "optimizer_kwargs": {"alpha": 0.99, "eps": 1e-05, "weight_decay": 0}}, "num_timesteps": 2000000, "_total_timesteps": 2000000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1686824918660744963, "learning_rate": 0.00096, "tensorboard_log": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuCQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz9PdRBNVR1phZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVNQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJbAAQAAAAAAAHEKjL8MVTK/TAroPo7KsT1Gr7++wqUTPyDwmb5oht0+ZSQ9P9Zvkr0otxW/LyovPoLHGz+MD7G/9JQxP198OrvWg3c/yn0/v8UnAz6Rhhs+ZJdLv68hbT0hQRW/SzC8vjxJgT+6ltq/w0XlPsn/jb+K0WO/eh5BviHHDD+uY5A9QMAuvjn4xj5R9Qi/VOKuPlMe/D4y0Ys/2bYWv+br4z3WqfQ+N0IxPsWDMj9DEWm8PNSoPx+FqD4MMRu+A8baPZlgTr+h4QU+JkFDvQl+hL48SYE/NegVP8NF5T4Nw2Y/PMgUv7fflL5t+ws/DLXCP+F62D+tyzA9g02lvTa2iL7fHBw/Ojt3PulxSb8qSa4+KhKCP0FaMD/lWTI/GcLeu677oj8jmge/P4Q0PqIfu75sAUy/CLR2PVr0Wrr7prw7FHR9vzXoFT/DReU+DcNmP0Apdb+9d4s+NZPsPmnalz8zqoe/RDEZv33ifb4WsV4+2ZoyP4pIlL+vdRy/WJwBwFMzn7/vDnk9ARznPnVUbz8A3+K+pM4YPVXj0z6LLSvABnbhvuRGDr/JsT2+bxO6PjxJgT+6ltq/w0XlPsn/jb+UjAVudW1weZSMBWR0eXBllJOUjAJmNJSJiIeUUpQoSwOMATyUTk5OSv////9K/////0sAdJRiSwRLHIaUjAFDlHSUUpQu"}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYEAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSwSFlIwBQ5R0lFKULg=="}, "_last_original_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVNQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJbAAQAAAAAAAAAAAACTmFM2AACAPwAAAAAAAAAAAAAAAAAAAAAAAACA0Zh2OwAAAAA1W92/AAAAAEkHOT0AAAAAByXgPwAAAABwENw7AAAAALKfAEAAAAAAhe22vQAAAADqLum/AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAqYodtwAAgD8AAAAAAAAAAAAAAAAAAAAAAAAAgMipDj4AAAAA60LnvwAAAADqRL29AAAAAJ8f/T8AAAAAMvgOvgAAAADk8/k/AAAAAByzDz0AAAAAT+PfvwAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAABlztbYAAIA/AAAAAAAAAAAAAAAAAAAAAAAAAIAsoPs9AAAAAEO18r8AAAAA5RXDvQAAAABfbOw/AAAAAICkTT0AAAAAr2zcPwAAAAA5ZIs9AAAAALXU3L8AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAABkQ3c2AACAPwAAAAAAAAAAAAAAAAAAAAAAAACAaHn8vQAAAAAv5f2/AAAAAI7Q5z0AAAAAvd/ePwAAAADBj869AAAAALkF2z8AAAAA0XSMvAAAAADB5d+/AAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJmNJSJiIeUUpQoSwOMATyUTk5OSv////9K/////0sAdJRiSwRLHIaUjAFDlHSUUpQu"}, "_episode_num": 0, "use_sde": true, "sde_sample_freq": -1, "_current_progress_remaining": 0.0, "_stats_window_size": 100, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVRAwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQJKvSv0RODeMAWyUTegDjAF0lEdAq4zzaufVZ3V9lChoBkdAl+z2IKtxMmgHTegDaAhHQKuXOSg5BC51fZQoaAZHQJt/XCJoCdVoB03oA2gIR0CrmRYxDb8FdX2UKGgGR0CarJlijL0SaAdN6ANoCEdAq5k/dfsu4HV9lChoBkdAmunPttygf2gHTegDaAhHQKudqKrJbMZ1fZQoaAZHQJrEu89Oh01oB03oA2gIR0CrpZqlgtvodX2UKGgGR0CVp55vLowFaAdN6ANoCEdAq6bQ4MnZ03V9lChoBkdAmUlhoZhrnGgHTegDaAhHQKum6pDu0C11fZQoaAZHQJoV6BshxHZoB03oA2gIR0CrqlhTGYKIdX2UKGgGR0CXBbE2YOUdaAdN6ANoCEdAq7MzB68g6nV9lChoBkdAmfqkSElE7WgHTegDaAhHQKu1DlAeJYV1fZQoaAZHQJnBaS4e9zxoB03oA2gIR0CrtTgHu7YkdX2UKGgGR0CWoZ5qubI+aAdN6ANoCEdAq7q2RmseXHV9lChoBkdAhEi4wIt16mgHTegDaAhHQKvDMwqy4Wl1fZQoaAZHQIw8Pl0YCQtoB03oA2gIR0CrxHBHLA58dX2UKGgGR0CY5wi9qUNbaAdN6ANoCEdAq8SJAprk83V9lChoBkdAmIiGphnanWgHTegDaAhHQKvH4RkEs8R1fZQoaAZHQJNf77zkIX1oB03oA2gIR0Crz7xXnyNGdX2UKGgGR0CYm+rq+rU9aAdN6ANoCEdAq9FiFdszmHV9lChoBkdAmUkUEC/47GgHTegDaAhHQKvRhhvR7Z51fZQoaAZHQJJ3rzAeq71oB03oA2gIR0Cr1rMwtapxdX2UKGgGR0CU85osZpBYaAdN6ANoCEdAq+DO10DEFXV9lChoBkdAlBELNfPX1GgHTegDaAhHQKviOTq0MPV1fZQoaAZHQJHBoj5bhWJoB03oA2gIR0Cr4mK2SdOJdX2UKGgGR0CVJZhYvFm4aAdN6ANoCEdAq+eg482aUnV9lChoBkdAlfCQkxASnWgHTegDaAhHQKvyv38n/kx1fZQoaAZHQJ46ngLqlgtoB03oA2gIR0Cr9I7xEv0zdX2UKGgGR0CUQ3W43FUAaAdN6ANoCEdAq/Sznkkrw3V9lChoBkdAlQ2ES26TXGgHTegDaAhHQKv6CkpI+W51fZQoaAZHQJQIbqcEvCdoB03oA2gIR0CsAt/+jua4dX2UKGgGR0CX5SklNUOvaAdN6ANoCEdArAQ2AoXsPnV9lChoBkdAlJbamoBJZmgHTegDaAhHQKwEUF/QSjB1fZQoaAZHQJcj78IiTt9oB03oA2gIR0CsB8Aood+5dX2UKGgGR0Cd2Rr433pOaAdN6ANoCEdArBBYvcrRSnV9lChoBkdAmJNuRxLkCGgHTegDaAhHQKwSUgMc6vJ1fZQoaAZHQJcLyliz9jxoB03oA2gIR0CsEnd+w1R+dX2UKGgGR0CXnBvZyuIRaAdN6ANoCEdArBfpaC+UQnV9lChoBkdAmFL+JpFkQWgHTegDaAhHQKwh9bfP5YZ1fZQoaAZHQJHW6yMUAT9oB03oA2gIR0CsI0VwHZ9NdX2UKGgGR0CWcOSjxkNGaAdN6ANoCEdArCNhmdy1eHV9lChoBkdAlO1S1uzhP2gHTegDaAhHQKwnAC1Z1V51fZQoaAZHQJEoHzxwyZdoB03oA2gIR0CsL7VaW5YpdX2UKGgGR0CWG21rZamoaAdN6ANoCEdArDFFIVdonXV9lChoBkdAjjtCQLeANGgHTegDaAhHQKwxalgMMJB1fZQoaAZHQJXwFhG6PKdoB03oA2gIR0CsNzXAM2FWdX2UKGgGR0CaZmLHuJDWaAdN6ANoCEdArEGZ0CA+ZHV9lChoBkdAlHkrVvuPWGgHTegDaAhHQKxC2lruYyB1fZQoaAZHQJb2iPV/c35oB03oA2gIR0CsQvVkUbkwdX2UKGgGR0CZwYYmLLpzaAdN6ANoCEdArEZ3Dm8ujHV9lChoBkdAlcB9ic5Ke2gHTegDaAhHQKxOndLxqfx1fZQoaAZHQJm2/Uz9CNVoB03oA2gIR0CsT9smOU+tdX2UKGgGR0CWFnhnJ1aGaAdN6ANoCEdArE/1U83dbnV9lChoBkdAl1U/W+XZ5GgHTegDaAhHQKxUsavRqoJ1fZQoaAZHQJV6Eg2ZRbdoB03oA2gIR0CsYFJZ4fOldX2UKGgGR0CaJiRh+fAcaAdN6ANoCEdArGGnhsImgXV9lChoBkdAl0d+UhV2imgHTegDaAhHQKxhwzGgi/x1fZQoaAZHQJUxk274BWBoB03oA2gIR0CsZXPKU3XJdX2UKGgGR0CX6z2OQyRCaAdN6ANoCEdArG4aJCSid3V9lChoBkdAmehgRf4REmgHTegDaAhHQKxvbD/lyR11fZQoaAZHQJburLyMDOloB03oA2gIR0Csb4dgfEGadX2UKGgGR0CYrEc6NlyzaAdN6ANoCEdArHPw593KS3V9lChoBkdAm57xDw6QvGgHTegDaAhHQKx/3BMSK3x1fZQoaAZHQJniGIxgy/NoB03oA2gIR0CsgR3EIgNgdX2UKGgGR0CY2RUxVQyiaAdN6ANoCEdArIE6Qq7ROXV9lChoBkdAnHpIrSVnmWgHTegDaAhHQKyErm5lOGl1fZQoaAZHQJpyfV6NVBFoB03oA2gIR0CsjKFs54nndX2UKGgGR0Cb6sAS39aVaAdN6ANoCEdArI3WluWKM3V9lChoBkdAnDtwow22omgHTegDaAhHQKyN8Vzp5eJ1fZQoaAZHQJs+fAdn005oB03oA2gIR0CskWVbzK9xdX2UKGgGR0CbHnKfnOjZaAdN6ANoCEdArJ2g3o9s8HV9lChoBkdAndAEJv5xi2gHTegDaAhHQKye+cWCVbB1fZQoaAZHQJyIYmv4dp9oB03oA2gIR0CsnxIouwotdX2UKGgGR0CbxTWu5jH5aAdN6ANoCEdArKJ+aQV9GHV9lChoBkdAm7O+/cnE22gHTegDaAhHQKyqhh/Aj6h1fZQoaAZHQJP1cz67/XJoB03oA2gIR0Csq79s7+1jdX2UKGgGR0Cc52gPmPo3aAdN6ANoCEdArKvYHRkVe3V9lChoBkdAmp8ryhBZ6mgHTegDaAhHQKyvPvPTodN1fZQoaAZHQJyYua+evp1oB03oA2gIR0Csuc30wrUcdX2UKGgGR0Cb9/BJqZc+aAdN6ANoCEdArLu6UgSvknV9lChoBkdAmEdO0G/vfGgHTegDaAhHQKy74K/mDDl1fZQoaAZHQJt/qitaIN5oB03oA2gIR0CswAAU+LWJdX2UKGgGR0CZ+3O2iL2paAdN6ANoCEdArMfhPIn0CnV9lChoBkdAlXu5PZZjhGgHTegDaAhHQKzJGXwb2lF1fZQoaAZHQJoL/VpbliloB03oA2gIR0CsyTKs2eg+dX2UKGgGR0CRhlEC/47BaAdN6ANoCEdArMySlabF0nV9lChoBkdAmmxfhhpg1GgHTegDaAhHQKzWDHxz7uV1fZQoaAZHQJjUmlDWsiloB03oA2gIR0Cs1/qgIyCWdX2UKGgGR0CXwYLkCFK1aAdN6ANoCEdArNgm/nGKh3V9lChoBkdAk5MiXlbNbGgHTegDaAhHQKzdj9G7SRd1fZQoaAZHQJvrdYeT3ZhoB03oA2gIR0Cs5bczZYgadX2UKGgGR0CaitvCMxXXaAdN6ANoCEdArObuhbnoxHV9lChoBkdAm3U6hUR3/2gHTegDaAhHQKznDNs3yZt1fZQoaAZHQJc6oOoYNy5oB03oA2gIR0Cs6nRPGhmHdX2UKGgGR0CTqsG8EmpmaAdN6ANoCEdArPLOLrHEM3V9lChoBkdAhdqte+mFamgHTegDaAhHQKz0kW9lEql1fZQoaAZHQJKtl0GNaQpoB03oA2gIR0Cs9LraM72ddX2UKGgGR0CYcWmwJPZaaAdN6ANoCEdArPngTqSowXV9lChoBkdAmuDF7x/d7GgHTegDaAhHQK0DVqzqrzZ1fZQoaAZHQJn7rblA/s5oB03oA2gIR0CtBIiHZbpvdX2UKGgGR0CZ50miQDFIaAdN6ANoCEdArQSj8P4EfXVlLg=="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 62500, "n_steps": 8, "gamma": 0.99, "gae_lambda": 0.9, "ent_coef": 0.0, "vf_coef": 0.4, "max_grad_norm": 0.5, "normalize_advantage": false, "observation_space": {":type:": "<class 'gym.spaces.box.Box'>", ":serialized:": "gAWVbQIAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLHIWUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWcAAAAAAAAAAAAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/lGgLSxyFlIwBQ5R0lFKUjARoaWdolGgTKJZwAAAAAAAAAAAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH+UaAtLHIWUaBZ0lFKUjA1ib3VuZGVkX2JlbG93lGgTKJYcAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUaAiMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLHIWUaBZ0lFKUjA1ib3VuZGVkX2Fib3ZllGgTKJYcAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUaCJLHIWUaBZ0lFKUjApfbnBfcmFuZG9tlE51Yi4=", "dtype": "float32", "_shape": [28], "low": "[-inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf\n -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf]", "high": "[inf inf inf inf inf inf inf inf inf inf inf inf inf inf inf inf inf inf\n inf inf inf inf inf inf inf inf inf inf]", "bounded_below": "[False False False False False False False False False False False False\n False False False False False False False False False False False False\n False False False False]", "bounded_above": "[False False False False False False False False False False False False\n False False False False False False False False False False False False\n False False False False]", "_np_random": null}, "action_space": {":type:": "<class 'gym.spaces.box.Box'>", ":serialized:": "gAWVpQEAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLCIWUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWIAAAAAAAAAAAAIC/AACAvwAAgL8AAIC/AACAvwAAgL8AAIC/AACAv5RoC0sIhZSMAUOUdJRSlIwEaGlnaJRoEyiWIAAAAAAAAAAAAIA/AACAPwAAgD8AAIA/AACAPwAAgD8AAIA/AACAP5RoC0sIhZRoFnSUUpSMDWJvdW5kZWRfYmVsb3eUaBMolggAAAAAAAAAAQEBAQEBAQGUaAiMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLCIWUaBZ0lFKUjA1ib3VuZGVkX2Fib3ZllGgTKJYIAAAAAAAAAAEBAQEBAQEBlGgiSwiFlGgWdJRSlIwKX25wX3JhbmRvbZROdWIu", "dtype": "float32", "_shape": [8], "low": "[-1. -1. -1. -1. -1. -1. -1. -1.]", "high": "[1. 1. 1. 1. 1. 1. 1. 1.]", "bounded_below": "[ True True True True True True True True]", "bounded_above": "[ True True True True True True True True]", "_np_random": null}, "n_envs": 4, "system_info": {"OS": "Linux-5.15.107+-x86_64-with-glibc2.31 # 1 SMP Sat Apr 29 09:15:28 UTC 2023", "Python": "3.10.12", "Stable-Baselines3": "1.8.0", "PyTorch": "2.0.1+cu118", "GPU Enabled": "True", "Numpy": "1.22.4", "Gym": "0.21.0"}}
replay.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:75f286715f4e85dbc99215723f4417fd721c3699ee4946c11b1da3d5d01d5d93
3
- size 1052683
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0ada5efe84a8e48e9b0267b9b1eb921e7994b3b586ccbd84b93f0c6b8436eafb
3
+ size 1019980
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 926.8504204986945, "std_reward": 364.8925103442384, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2023-06-12T21:33:06.269552"}
 
1
+ {"mean_reward": 1833.6746178464266, "std_reward": 155.8542943692614, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2023-06-15T11:31:25.545435"}
vec_normalize.pkl CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1bdc90b4c67fbf6c6087e4ae94c061c6679afaeb28665cc07f298c4a02e736bc
3
  size 2176
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a4b8d25213605861eb58fc89dba17511639325d59b99672907732d7fcf5cc97d
3
  size 2176