Frorozcol commited on
Commit
03dc47e
1 Parent(s): 5275d89

Initial commit

Browse files
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: AntBulletEnv-v0
17
  metrics:
18
  - type: mean_reward
19
- value: 1372.08 +/- 130.56
20
  name: mean_reward
21
  verified: false
22
  ---
 
16
  type: AntBulletEnv-v0
17
  metrics:
18
  - type: mean_reward
19
+ value: 1921.02 +/- 58.46
20
  name: mean_reward
21
  verified: false
22
  ---
a2c-AntBulletEnv-v0.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1489194551af4ed996898a1f215ef26a0187f19a9719ab0350cc8eaa7b71bcc8
3
  size 129265
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ba2c9d786e668b1cefc26ee0b4f42efc5f354cf7dad61dc93b33bb06883ef044
3
  size 129265
a2c-AntBulletEnv-v0/data CHANGED
@@ -4,20 +4,20 @@
4
  ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
5
  "__module__": "stable_baselines3.common.policies",
6
  "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
7
- "__init__": "<function ActorCriticPolicy.__init__ at 0x7f3271fa5550>",
8
- "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f3271fa55e0>",
9
- "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f3271fa5670>",
10
- "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f3271fa5700>",
11
- "_build": "<function ActorCriticPolicy._build at 0x7f3271fa5790>",
12
- "forward": "<function ActorCriticPolicy.forward at 0x7f3271fa5820>",
13
- "extract_features": "<function ActorCriticPolicy.extract_features at 0x7f3271fa58b0>",
14
- "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f3271fa5940>",
15
- "_predict": "<function ActorCriticPolicy._predict at 0x7f3271fa59d0>",
16
- "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f3271fa5a60>",
17
- "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f3271fa5af0>",
18
- "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f3271fa5b80>",
19
  "__abstractmethods__": "frozenset()",
20
- "_abc_impl": "<_abc._abc_data object at 0x7f3271fa4cc0>"
21
  },
22
  "verbose": 1,
23
  "policy_kwargs": {
@@ -59,12 +59,12 @@
59
  "_np_random": null
60
  },
61
  "n_envs": 4,
62
- "num_timesteps": 2000000,
63
- "_total_timesteps": 2000000,
64
  "_num_timesteps_at_start": 0,
65
  "seed": null,
66
  "action_noise": null,
67
- "start_time": 1678359694265281562,
68
  "learning_rate": 0.00096,
69
  "tensorboard_log": null,
70
  "lr_schedule": {
@@ -73,7 +73,7 @@
73
  },
74
  "_last_obs": {
75
  ":type:": "<class 'numpy.ndarray'>",
76
- ":serialized:": "gAWVNQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJbAAQAAAAAAAN+5rL7Ur04+gS0QP4wl/72/woM+xNW0v54LFz8g0ds8oYOHPk3vFL/cxUY+0TaQvwgfIL/tZ/Y+P4uBvkFqSj4frNg+L8ygP0uBDD/Q48S+jMCFvll3XD+ISRW/MCigP+c1Lj8Qt6g+vX0MPwdojr/D5i0/B3oFPrk8DD+mNlE//8ccwPgpBMA6bUO+Xt5XvxUdXz8zkVu/21waPxrrLcA8mRS/u0A7vxkRJD7LB+c/taOtv901KT947DE/zE1aPC+BLr8+IS68WfAfP99zaEDnNS4/jThCwCY96b8HaI6/8OIiPrM8Z76j8dY+zDoBQGfwsz9c6Ni++Wn3PtrRkT8bCJ2/hV0mvw/5Ub9Z8Rw/BVjSvvJxJEADqJ+/i6nXPslfyz/5Uls7DvQcvmvQCcDl1lu/RMDCuH0DlL5yPvQ9Hhi8vxC3qD4mPem/IhpmP+y+z73YzsE+U0wWP/Z9hj02y8C/eVaLP5N4a70jjUK/q1QZPtoWXT8Ym/k+h7N0vp567z7Cicw9TcJCP7L7T7ts3Ke+/OXovtCsID8rBia//+9Zv4VQoDzj20O/+3kFP+c1Lj8Qt6g+vX0MPwdojr+UjAVudW1weZSMBWR0eXBllJOUjAJmNJSJiIeUUpQoSwOMATyUTk5OSv////9K/////0sAdJRiSwRLHIaUjAFDlHSUUpQu"
77
  },
78
  "_last_episode_starts": {
79
  ":type:": "<class 'numpy.ndarray'>",
@@ -81,7 +81,7 @@
81
  },
82
  "_last_original_obs": {
83
  ":type:": "<class 'numpy.ndarray'>",
84
- ":serialized:": "gAWVNQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJbAAQAAAAAAAAAAAABHBvY1AACAPwAAAAAAAAAAAAAAAAAAAAAAAACA3JoQvgAAAAB1j/O/AAAAAG9ZBD4AAAAAdaDfPwAAAAA5o/a9AAAAANI04j8AAAAAzEWdPQAAAAAlXva/AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAdC22NgAAgD8AAAAAAAAAAAAAAAAAAAAAAAAAgETFor0AAAAAAOUAwAAAAABsv+Q9AAAAAD7x8z8AAAAAbhvhPQAAAADvUOM/AAAAAIHFiz0AAAAAWYn/vwAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAH8NlrUAAIA/AAAAAAAAAAAAAAAAAAAAAAAAAIAHmnc8AAAAAIPR+78AAAAANF9AvQAAAABBhPQ/AAAAAO8Gc70AAAAAje/6PwAAAADC1Zq9AAAAAD/e5r8AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA8CXm1AACAPwAAAAAAAAAAAAAAAAAAAAAAAACA/RFKvQAAAABf6Pm/AAAAAP/LzrwAAAAAVWnwPwAAAADJXoo9AAAAAOoX+z8AAAAAonEAPgAAAAARiPC/AAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJmNJSJiIeUUpQoSwOMATyUTk5OSv////9K/////0sAdJRiSwRLHIaUjAFDlHSUUpQu"
85
  },
86
  "_episode_num": 0,
87
  "use_sde": true,
@@ -89,13 +89,13 @@
89
  "_current_progress_remaining": 0.0,
90
  "ep_info_buffer": {
91
  ":type:": "<class 'collections.deque'>",
92
- ":serialized:": "gAWVRAwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQHHTNm+TNdKMAWyUTegDjAF0lEdAqsqeX9itrHV9lChoBkdAhOpneizsyGgHTegDaAhHQKrLXsgMc6x1fZQoaAZHQJF9+/RE4NtoB03oA2gIR0CqzMJ3PiT/dX2UKGgGR0CUvlJx//edaAdN6ANoCEdAqtFhXhfjTHV9lChoBkdAgwI0iY9gW2gHTegDaAhHQKrY4DSw4bV1fZQoaAZHQIwwtix3V09oB03oA2gIR0Cq2VKf4AS4dX2UKGgGR0CYnr1YhdMTaAdN6ANoCEdAqtov5rP+oHV9lChoBkdAl3QMtGus92gHTegDaAhHQKrdalv60pp1fZQoaAZHQIadpW1c+q1oB03oA2gIR0Cq5ZZ8rqdIdX2UKGgGR0CRxR1SflIVaAdN6ANoCEdAquZEB8x9HHV9lChoBkdAggeiXY150WgHTegDaAhHQKrnjuP3i711fZQoaAZHQJUuXu7YkE9oB03oA2gIR0Cq7JVVYISldX2UKGgGR0CRNKWU8mrsaAdN6ANoCEdAqvSL3XZoPHV9lChoBkdAfyubC79Q42gHTegDaAhHQKr1BBJqZc91fZQoaAZHQJQnEAxSHdpoB03oA2gIR0Cq9d6h6By0dX2UKGgGR0CTS72Yv38GaAdN6ANoCEdAqvk9d9lVcXV9lChoBkdAkwwitV7x/mgHTegDaAhHQKsAylk6Lfl1fZQoaAZHQJGK7oePq9poB03oA2gIR0CrAUJGFzuGdX2UKGgGR0CVXEJJGvwFaAdN6ANoCEdAqwJlNBWxQnV9lChoBkdAlZBeY2Kl6GgHTegDaAhHQKsHRRLK3d91fZQoaAZHQJWXcQZn+Q5oB03oA2gIR0CrEB17pmmMdX2UKGgGR0CL9mtapxWDaAdN6ANoCEdAqxCN4cFQmHV9lChoBkdAkinUlZ5iVmgHTegDaAhHQKsRb+3H7xd1fZQoaAZHQJE9Pi97F85oB03oA2gIR0CrFLjZ+QU6dX2UKGgGR0CT2+cR15jZaAdN6ANoCEdAqxxU5hjOLXV9lChoBkdAkBfBCUornWgHTegDaAhHQKscxUPQOWl1fZQoaAZHQJJctzvJA+poB03oA2gIR0CrHaTvqkdndX2UKGgGR0CTdxojv/ipaAdN6ANoCEdAqyHtUXHim3V9lChoBkdAk7cFUdaMaWgHTegDaAhHQKsrqMn7YTV1fZQoaAZHQJNzYAeaKDVoB03oA2gIR0CrLCARTS9edX2UKGgGR0CDI0y0KJEZaAdN6ANoCEdAqy0Dn3cpLHV9lChoBkdAkdpR3mmtQ2gHTegDaAhHQKswTKe05U91fZQoaAZHQI9bbDbah6BoB03oA2gIR0CrN9Lns9jgdX2UKGgGR0CQkZKR+z+naAdN6ANoCEdAqzhCfpUxVXV9lChoBkdAkGfN8E3bVWgHTegDaAhHQKs5JJeVs1t1fZQoaAZHQJDXcIHC4z9oB03oA2gIR0CrPMdtMwlCdX2UKGgGR0CIZQJa7mMgaAdN6ANoCEdAq0dHkDIRy3V9lChoBkdAlL42GRFI/mgHTegDaAhHQKtHuGyon8d1fZQoaAZHQJGtQYDTz/ZoB03oA2gIR0CrSJqHwgDBdX2UKGgGR0CJdMV+I/JOaAdN6ANoCEdAq0vuoYNy53V9lChoBkdAkXeVr6+FlGgHTegDaAhHQKtTsvM8ox51fZQoaAZHQId3G0PYnOVoB03oA2gIR0CrVCl4keIVdX2UKGgGR0CHYNFMqSX/aAdN6ANoCEdAq1UNOKwY+HV9lChoBkdAkvLmvfTCtWgHTegDaAhHQKtYX1pTMq11fZQoaAZHQJAZSlVLi/BoB03oA2gIR0CrYwaxPfsNdX2UKGgGR0CRTs+S8rZraAdN6ANoCEdAq2N+KCQLeHV9lChoBkdAkoq1ivxH5WgHTegDaAhHQKtkYIv8IiV1fZQoaAZHQI/g6Rhc7hhoB03oA2gIR0CrZ7Jkwvg4dX2UKGgGR0CR8vbY9Pk8aAdN6ANoCEdAq29YvJzT4XV9lChoBkdAkyoqx9oexWgHTegDaAhHQKtvzEpiI+J1fZQoaAZHQJSlQWSEDhdoB03oA2gIR0CrcKjDTBqLdX2UKGgGR0CUZLRfnfVJaAdN6ANoCEdAq3PgKMNtqHV9lChoBkdAkmdxaPjn3mgHTegDaAhHQKt+Et+1Bt11fZQoaAZHQJOx3B0p3HJoB03oA2gIR0Crfr8u8K5TdX2UKGgGR0CHsI6WgOBlaAdN6ANoCEdAq3+9dVvMr3V9lChoBkdAlpjpwbVBlmgHTegDaAhHQKuDDmcvugJ1fZQoaAZHQJFvJ8Rcu8NoB03oA2gIR0CripxFqi48dX2UKGgGR0CUpR9Gqgh9aAdN6ANoCEdAq4sSeiBXjnV9lChoBkdAkdEUCq6vq2gHTegDaAhHQKuL+XvYvnN1fZQoaAZHQJVVTFhoduJoB03oA2gIR0Crjz1MmF8HdX2UKGgGR0CWdS0Z3s5XaAdN6ANoCEdAq5iOACnxa3V9lChoBkdAlz6CDqW1MWgHTegDaAhHQKuZQZBLPD51fZQoaAZHQJTysIKMNttoB03oA2gIR0Crmpg2ZRbbdX2UKGgGR0CYW5yD7IkraAdN6ANoCEdAq55wiA2AG3V9lChoBkdAkwvVSflIVmgHTegDaAhHQKul6F23azx1fZQoaAZHQJKHNV0cOsloB03oA2gIR0CrplmQr+YMdX2UKGgGR0CTBIcnVoYfaAdN6ANoCEdAq6c9PtUn5XV9lChoBkdAl/hRgZ0jkmgHTegDaAhHQKuqexgRbr11fZQoaAZHQJXsU+2VmjFoB03oA2gIR0CrsqeCsfaIdX2UKGgGR0CVRFcPvrnlaAdN6ANoCEdAq7NPbmEGq3V9lChoBkdAlM8Risny/mgHTegDaAhHQKu0qT0QK8d1fZQoaAZHQIwsR17pmmNoB03oA2gIR0CruYZL7GeddX2UKGgGR0B6JmwHJLdvaAdN6ANoCEdAq8ELTtsvZnV9lChoBkdAlJQNCmdiD2gHTegDaAhHQKvBfp7CzkZ1fZQoaAZHQIXHptgrpaBoB03oA2gIR0CrwlsoUi6hdX2UKGgGR0CUNe5KvmozaAdN6ANoCEdAq8WkZJkGzXV9lChoBkdAk6n7ONYKY2gHTegDaAhHQKvNSlqrR0F1fZQoaAZHQJXTCe18b71oB03oA2gIR0Crzgm7rcCYdX2UKGgGR0CYsLFY+0PZaAdN6ANoCEdAq89Jy6tknXV9lChoBkdAkfCITfzjFWgHTegDaAhHQKvUQy6cy311fZQoaAZHQJVkbkzXSShoB03oA2gIR0Cr3HrZSNwSdX2UKGgGR0CDBBv0h/y5aAdN6ANoCEdAq9zp+4LCvXV9lChoBkdAkz12/zreImgHTegDaAhHQKvdxCb+cYt1fZQoaAZHQJh/Ndt2s7xoB03oA2gIR0Cr4QxSxZ+ydX2UKGgGR0CNS2cH4XXRaAdN6ANoCEdAq+iqzPa+OHV9lChoBkdAhrcdAHE/B2gHTegDaAhHQKvpGzhxYJV1fZQoaAZHQJJJtPci4axoB03oA2gIR0Cr6gIIWxhVdX2UKGgGR0CWLYkwevIPaAdN6ANoCEdAq+6k4m1IAnV9lChoBkdAj7uoVdonKGgHTegDaAhHQKv38wxFiKB1fZQoaAZHQI0xoQxvegtoB03oA2gIR0Cr+GUSAYpEdX2UKGgGR0CSQVYjSofkaAdN6ANoCEdAq/lIphF3IXV9lChoBkdAkejBGhEjPmgHTegDaAhHQKv8hNbkfcN1fZQoaAZHQIBAUR15jYtoB03oA2gIR0CsBCYm9g4PdX2UKGgGR0CUPBgPVd5ZaAdN6ANoCEdArASXQ+lj3HV9lChoBkdAksHpL26ClWgHTegDaAhHQKwFdF9a2Wp1fZQoaAZHQJQANNTLns9oB03oA2gIR0CsCUPWQOnVdX2UKGgGR0CXQ6Wf9P1taAdN6ANoCEdArBMvNRm9QHV9lChoBkdAlljNTDO1OWgHTegDaAhHQKwTrcyFfzB1fZQoaAZHQJULj+rELploB03oA2gIR0CsFI9W6shgdX2UKGgGR0CVhS1gH/tIaAdN6ANoCEdArBfMXxe9jHVlLg=="
93
  },
94
  "ep_success_buffer": {
95
  ":type:": "<class 'collections.deque'>",
96
  ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
97
  },
98
- "_n_updates": 62500,
99
  "n_steps": 8,
100
  "gamma": 0.99,
101
  "gae_lambda": 0.9,
 
4
  ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
5
  "__module__": "stable_baselines3.common.policies",
6
  "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
7
+ "__init__": "<function ActorCriticPolicy.__init__ at 0x7f8a366e65e0>",
8
+ "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f8a366e6670>",
9
+ "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f8a366e6700>",
10
+ "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f8a366e6790>",
11
+ "_build": "<function ActorCriticPolicy._build at 0x7f8a366e6820>",
12
+ "forward": "<function ActorCriticPolicy.forward at 0x7f8a366e68b0>",
13
+ "extract_features": "<function ActorCriticPolicy.extract_features at 0x7f8a366e6940>",
14
+ "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f8a366e69d0>",
15
+ "_predict": "<function ActorCriticPolicy._predict at 0x7f8a366e6a60>",
16
+ "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f8a366e6af0>",
17
+ "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f8a366e6b80>",
18
+ "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f8a366e6c10>",
19
  "__abstractmethods__": "frozenset()",
20
+ "_abc_impl": "<_abc._abc_data object at 0x7f8a366e7a40>"
21
  },
22
  "verbose": 1,
23
  "policy_kwargs": {
 
59
  "_np_random": null
60
  },
61
  "n_envs": 4,
62
+ "num_timesteps": 1000000,
63
+ "_total_timesteps": 1000000,
64
  "_num_timesteps_at_start": 0,
65
  "seed": null,
66
  "action_noise": null,
67
+ "start_time": 1678394102036149900,
68
  "learning_rate": 0.00096,
69
  "tensorboard_log": null,
70
  "lr_schedule": {
 
73
  },
74
  "_last_obs": {
75
  ":type:": "<class 'numpy.ndarray'>",
76
+ ":serialized:": "gAWVNQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJbAAQAAAAAAAKJW0D5dNVA+WPQHPzydAkD8mSs+dpceP9icAr+ziYU+5gISPue7gT7sSWi/kR8BP901rT23f8I/gqTsvBSB0TxecQw/xq0PQBaPPL9FfzS/bZdpv2t6gL8pYB0/vaJ+PbvUmb+AFAo/yYamPlcsMT/mRY0+jhmhv0V8Ez8g0RNASmQKvoKxLT/9aRK/SZe4PgskcD9d29m+0s09vmQwID8RWVY/I1Pvv+tCuz2CcXy/lNGBP2E8DcCgX3i/K8FWP9bSQ748M7S+GJsIv9Uag8BUA1U/gBQKP8mGpj7v8ri/K6gaP3rYwT63Gd8+3iYPQG3/WT+hhL69zG8ePyWpB78RqHQ/XIV9v1vgRr/Jdzs/XOmJPzfJKD3nJse9jPe3P6cw7D+fEJ2/3/K8PZYE7z6noWa/RQQ2PRSGnj2dboC8u9SZv4AUCj/JhqY+VywxP7q7Xb/3/Ii/bR8kP3VfOz8Kl0nAbS0PPzVzH74csLm+7lZiP3v1bb/mJX6+B/ofvqOHWL9hHUPAJ98kP5utpL6/a8M9xlIDwMgfSD/VV6m7UEdnv0sfiTzBNnK/5diNvFQDVT+AFAo/yYamPu/yuL+UjAVudW1weZSMBWR0eXBllJOUjAJmNJSJiIeUUpQoSwOMATyUTk5OSv////9K/////0sAdJRiSwRLHIaUjAFDlHSUUpQu"
77
  },
78
  "_last_episode_starts": {
79
  ":type:": "<class 'numpy.ndarray'>",
 
81
  },
82
  "_last_original_obs": {
83
  ":type:": "<class 'numpy.ndarray'>",
84
+ ":serialized:": "gAWVNQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJbAAQAAAAAAAAAAAAAT6dK1AACAPwAAAAAAAAAAAAAAAAAAAAAAAACAw+z4PQAAAABYhdy/AAAAANeGtrwAAAAAIj/oPwAAAACD12E9AAAAAGVk4T8AAAAAalWSvAAAAACk2QDAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAApGNRtgAAgD8AAAAAAAAAAAAAAAAAAAAAAAAAgL14Ej4AAAAA33XlvwAAAABMZ/Y8AAAAAKrE/T8AAAAAy353vQAAAAAUx+o/AAAAAGhdCb0AAAAAe4vavwAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAG58BjYAAIA/AAAAAAAAAAAAAAAAAAAAAAAAAICYs7A9AAAAAHfy8r8AAAAA3L6xPQAAAADbW90/AAAAAOm6TzsAAAAAhzH6PwAAAAAliKG9AAAAAJOE678AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAABRUcC2AACAPwAAAAAAAAAAAAAAAAAAAAAAAACAU+MFvQAAAABdAuO/AAAAAHKf970AAAAA3xHjPwAAAAAq/ZC9AAAAAMBn+T8AAAAAMeq0PQAAAAA+fuG/AAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJmNJSJiIeUUpQoSwOMATyUTk5OSv////9K/////0sAdJRiSwRLHIaUjAFDlHSUUpQu"
85
  },
86
  "_episode_num": 0,
87
  "use_sde": true,
 
89
  "_current_progress_remaining": 0.0,
90
  "ep_info_buffer": {
91
  ":type:": "<class 'collections.deque'>",
92
+ ":serialized:": "gAWVRAwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQJ4+akdmxt6MAWyUTegDjAF0lEdAmZ545HVf/nV9lChoBkdAmyhJ1Ng0CWgHTegDaAhHQJmn05tFa0R1fZQoaAZHQJ8Z+cYqG1xoB03oA2gIR0CZrtJrLyMDdX2UKGgGR0CZple4Cp3paAdN6ANoCEdAma80AcT8HnV9lChoBkdAmQVoePq9oWgHTegDaAhHQJm4eZ1FH8V1fZQoaAZHQJpJ0EEC/49oB03oA2gIR0CZv/N6PbPAdX2UKGgGR0CYBrVKPGQ0aAdN6ANoCEdAmcbJVGTcI3V9lChoBkdAk/8iRjjJdWgHTegDaAhHQJnHIjmjj711fZQoaAZHQJmL0tapxWFoB03oA2gIR0CZ0l+LWI43dX2UKGgGR0Cd1PZbY9PlaAdN6ANoCEdAmd33LA57xHV9lChoBkdAmss1yR0U5GgHTegDaAhHQJnlicf/3nJ1fZQoaAZHQJui89/z8P5oB03oA2gIR0CZ5eoRqXWwdX2UKGgGR0Cb8OjVhCtzaAdN6ANoCEdAme83BxgiNnV9lChoBkdAnomnTI/7i2gHTegDaAhHQJn2sjMV1wJ1fZQoaAZHQJ07l35eqrBoB03oA2gIR0CZ/dPEbYK6dX2UKGgGR0CdfTC+10DEaAdN6ANoCEdAmf40FB6a9nV9lChoBkdAmnPBxPwd82gHTegDaAhHQJoHc0cfeUJ1fZQoaAZHQJwt5wYLsrxoB03oA2gIR0CaEi482aUidX2UKGgGR0CfAek0rK/3aAdN6ANoCEdAmhzGUB4lhXV9lChoBkdAmykNVinYQWgHTegDaAhHQJodIxpL26F1fZQoaAZHQJrFK11GLDRoB03oA2gIR0CaJl0/nnuBdX2UKGgGR0CaM0a6z3RHaAdN6ANoCEdAmi2tsvZh8nV9lChoBkdAmmEhRMvh62gHTegDaAhHQJo0nTd+G491fZQoaAZHQJk19CPZIxxoB03oA2gIR0CaNPiEg4ffdX2UKGgGR0CXy7frrxAjaAdN6ANoCEdAmj4abe/HpHV9lChoBkdAmgjQw482aWgHTegDaAhHQJpGM8IRh+h1fZQoaAZHQJTFEogFHJ9oB03oA2gIR0CaUI8Djin6dX2UKGgGR0CMyMnNPgvUaAdN6ANoCEdAmlEtbLU1AXV9lChoBkdAmV1RXS0BwWgHTegDaAhHQJpdUxoIv8J1fZQoaAZHQJX/it+1Bt1oB03oA2gIR0CaZLRfWtlqdX2UKGgGR0CZQg3ZPEbYaAdN6ANoCEdAmmuFdC3PRnV9lChoBkdAmErczVMEimgHTegDaAhHQJpr34nF5v91fZQoaAZHQJm5WS2Yv39oB03oA2gIR0CadRctGus+dX2UKGgGR0CYq/fyf+S9aAdN6ANoCEdAmnxRqGlANXV9lChoBkdAlVwQn+hoNGgHTegDaAhHQJqEWr4nF5x1fZQoaAZHQJr3krqdH2BoB03oA2gIR0CahN3oLXtjdX2UKGgGR0CagDVRUFSsaAdN6ANoCEdAmpLXxnWat3V9lChoBkdAmnrxp1zQu2gHTegDaAhHQJqbQhyKekJ1fZQoaAZHQJw8NJe3QUpoB03oA2gIR0CaoiBMzuWsdX2UKGgGR0Cb/kku6ErYaAdN6ANoCEdAmqKBhH9WIXV9lChoBkdAmdBX9R77bmgHTegDaAhHQJqr8UoKD011fZQoaAZHQJVQovugHu9oB03oA2gIR0Cas2mjTKDDdX2UKGgGR0CZZyIyCWeIaAdN6ANoCEdAmrpP5DZ13nV9lChoBkdAl1hr349HMGgHTegDaAhHQJq6qUC7sfJ1fZQoaAZHQJwoTmV7hNxoB03oA2gIR0CaxuNGmUGFdX2UKGgGR0CWDC3evZAZaAdN6ANoCEdAmtJUvPC2t3V9lChoBkdAmHfzkU9IPWgHTegDaAhHQJrZKgvlEJB1fZQoaAZHQJledsqJ/G5oB03oA2gIR0Ca2YEhJRO2dX2UKGgGR0Cbs/Iv8IiUaAdN6ANoCEdAmuKsS9M9KXV9lChoBkdAmR8J9d/rjmgHTegDaAhHQJrqEVO9FnZ1fZQoaAZHQJqUtm7J4jdoB03oA2gIR0Ca8RQA+6iCdX2UKGgGR0CIFBN0NjLCaAdN6ANoCEdAmvFwMc6vJXV9lChoBkdAlt4hBE8aGmgHTegDaAhHQJr7Mo8ZDRd1fZQoaAZHQJaTkRnOB19oB03oA2gIR0CbBiE3bVSXdX2UKGgGR0CW95Pz4DcNaAdN6ANoCEdAmxAD987ZF3V9lChoBkdAnKFKqfe1r2gHTegDaAhHQJsQWnwXqJN1fZQoaAZHQJ6tgWEbo8poB03oA2gIR0CbGaRU3n6mdX2UKGgGR0CdMd+SKWLQaAdN6ANoCEdAmyDyquKXOXV9lChoBkdAmO9DO1OTJWgHTegDaAhHQJsnyF6Avtd1fZQoaAZHQJxfxEQXhwVoB03oA2gIR0CbKCqcVgx8dX2UKGgGR0CcNZ5UtI07aAdN6ANoCEdAmzGFndweeXV9lChoBkdAl/FEm6XjVGgHTegDaAhHQJs58CyQgcN1fZQoaAZHQJMOtjPOY6ZoB03oA2gIR0CbRIhpxm03dX2UKGgGR0CSHl5O8CgcaAdN6ANoCEdAm0Uv0h/y5XV9lChoBkdAi27zcIqsl2gHTegDaAhHQJtQ/b5/LDB1fZQoaAZHQJKeXe2uxKRoB03oA2gIR0CbWFo8IRh+dX2UKGgGR0CaIir2xptaaAdN6ANoCEdAm19U5EMLGHV9lChoBkdAl2ZuDFqBVmgHTegDaAhHQJtfrqTr3TN1fZQoaAZHQJkS0uZkTYdoB03oA2gIR0CbaOHtF8XvdX2UKGgGR0CYKQlkYoAoaAdN6ANoCEdAm3BhjawljXV9lChoBkdAlLubaVUuMGgHTegDaAhHQJt4/ZFocrB1fZQoaAZHQJXKzMdLg4xoB03oA2gIR0CbeX1xsEaEdX2UKGgGR0CT6SUWVNYbaAdN6ANoCEdAm4lUjgQ6IXV9lChoBkdAls2TFdcB2mgHTegDaAhHQJuUfS6UaAF1fZQoaAZHQJkAgG+sYEZoB03oA2gIR0Cbnax0+1SgdX2UKGgGR0CaRS1TBInSaAdN6ANoCEdAm54GGZeAu3V9lChoBkdAmJ6QLJCBw2gHTegDaAhHQJunU2R7qpt1fZQoaAZHQJjemUzKs+5oB03oA2gIR0CbrrT0xubadX2UKGgGR0CW5fqCHymRaAdN6ANoCEdAm7d9LxqfvnV9lChoBkdAnH+4DLbHqGgHTegDaAhHQJu3/esPrfN1fZQoaAZHQJqXnYbsF+xoB03oA2gIR0Cbxn+IMz/IdX2UKGgGR0CVzuwKjSG8aAdN6ANoCEdAm834BmwqzHV9lChoBkdAmMeodlum8GgHTegDaAhHQJvU+W6bvw51fZQoaAZHQJlk1wJgLJFoB03oA2gIR0Cb1VqLjxTbdX2UKGgGR0CbW5EFGG21aAdN6ANoCEdAm96h6a9bo3V9lChoBkdAnHMqdUbT+mgHTegDaAhHQJvmEXfqHGl1fZQoaAZHQJxIhdPci4doB03oA2gIR0Cb7RrrPdEcdX2UKGgGR0CePKaqjrRjaAdN6ANoCEdAm+2L3oLXtnV9lChoBkdAnJiahxo7FWgHTegDaAhHQJv66S4e9zx1fZQoaAZHQJ3X9eruIARoB03oA2gIR0CcBP2v0RODdX2UKGgGR0CZRaPkJa7maAdN6ANoCEdAnAv5LM9r43V9lChoBkdAnAZfFNtZWGgHTegDaAhHQJwMUk/r0J51fZQoaAZHQJuhbvUjLSxoB03oA2gIR0CcFY4gA6uGdX2UKGgGR0Ca++PxhDw6aAdN6ANoCEdAnBzqwMYuTXV9lChoBkdAm+rPMfRu0mgHTegDaAhHQJwjxOsT37F1fZQoaAZHQJ8OSMir1dxoB03oA2gIR0CcJDBfa6BidX2UKGgGR0CRDzTpgTh6aAdN6ANoCEdAnC6MC5mRNnV9lChoBkdAlzpCjL0SRWgHTegDaAhHQJw6QFA3T/h1fZQoaAZHQJ0DX/DLr5ZoB03oA2gIR0CcQ0MVDa4+dX2UKGgGR0CUJjZbY9PlaAdN6ANoCEdAnEOc2R7qp3VlLg=="
93
  },
94
  "ep_success_buffer": {
95
  ":type:": "<class 'collections.deque'>",
96
  ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
97
  },
98
+ "_n_updates": 31250,
99
  "n_steps": 8,
100
  "gamma": 0.99,
101
  "gae_lambda": 0.9,
a2c-AntBulletEnv-v0/policy.optimizer.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:95c95da9815b592867edf6b7a5315449236b174289dfb31cd86c174e18a83970
3
  size 56190
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bbd017cf9b4eee4207c3f8d0c757e340c02946307319827a43b87d4fb0d68343
3
  size 56190
a2c-AntBulletEnv-v0/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9c0744a244441e3128c01bb82f3051f94052591d039eaf7bb248d46d7a5fd76b
3
  size 56958
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8748e9041cd7d6740e945e1908c09dcceafc5e728ee6cf1258ec4195a63a246f
3
  size 56958
config.json CHANGED
@@ -1 +1 @@
1
- {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7f3271fa5550>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f3271fa55e0>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f3271fa5670>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f3271fa5700>", "_build": "<function ActorCriticPolicy._build at 0x7f3271fa5790>", "forward": "<function ActorCriticPolicy.forward at 0x7f3271fa5820>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x7f3271fa58b0>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f3271fa5940>", "_predict": "<function ActorCriticPolicy._predict at 0x7f3271fa59d0>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f3271fa5a60>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f3271fa5af0>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f3271fa5b80>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7f3271fa4cc0>"}, "verbose": 1, "policy_kwargs": {":type:": "<class 'dict'>", ":serialized:": "gAWVowAAAAAAAAB9lCiMDGxvZ19zdGRfaW5pdJRK/v///4wKb3J0aG9faW5pdJSJjA9vcHRpbWl6ZXJfY2xhc3OUjBN0b3JjaC5vcHRpbS5ybXNwcm9wlIwHUk1TcHJvcJSTlIwQb3B0aW1pemVyX2t3YXJnc5R9lCiMBWFscGhhlEc/764UeuFHrowDZXBzlEc+5Pi1iONo8YwMd2VpZ2h0X2RlY2F5lEsAdXUu", "log_std_init": -2, "ortho_init": false, "optimizer_class": "<class 'torch.optim.rmsprop.RMSprop'>", "optimizer_kwargs": {"alpha": 0.99, "eps": 1e-05, "weight_decay": 0}}, "observation_space": {":type:": "<class 'gym.spaces.box.Box'>", ":serialized:": "gAWVZwIAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLHIWUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWcAAAAAAAAAAAAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/lGgKSxyFlIwBQ5R0lFKUjARoaWdolGgSKJZwAAAAAAAAAAAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH+UaApLHIWUaBV0lFKUjA1ib3VuZGVkX2JlbG93lGgSKJYcAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUaAeMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLHIWUaBV0lFKUjA1ib3VuZGVkX2Fib3ZllGgSKJYcAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUaCFLHIWUaBV0lFKUjApfbnBfcmFuZG9tlE51Yi4=", "dtype": "float32", "_shape": [28], "low": "[-inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf\n -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf]", "high": "[inf inf inf inf inf inf inf inf inf inf inf inf inf inf inf inf inf inf\n inf inf inf inf inf inf inf inf inf inf]", "bounded_below": "[False False False False False False False False False False False False\n False False False False False False False False False False False False\n False False False False]", "bounded_above": "[False False False False False False False False False False False False\n False False False False False False False False False False False False\n False False False False]", "_np_random": null}, "action_space": {":type:": "<class 'gym.spaces.box.Box'>", ":serialized:": "gAWVnwEAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLCIWUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWIAAAAAAAAAAAAIC/AACAvwAAgL8AAIC/AACAvwAAgL8AAIC/AACAv5RoCksIhZSMAUOUdJRSlIwEaGlnaJRoEiiWIAAAAAAAAAAAAIA/AACAPwAAgD8AAIA/AACAPwAAgD8AAIA/AACAP5RoCksIhZRoFXSUUpSMDWJvdW5kZWRfYmVsb3eUaBIolggAAAAAAAAAAQEBAQEBAQGUaAeMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLCIWUaBV0lFKUjA1ib3VuZGVkX2Fib3ZllGgSKJYIAAAAAAAAAAEBAQEBAQEBlGghSwiFlGgVdJRSlIwKX25wX3JhbmRvbZROdWIu", "dtype": "float32", "_shape": [8], "low": "[-1. -1. -1. -1. -1. -1. -1. -1.]", "high": "[1. 1. 1. 1. 1. 1. 1. 1.]", "bounded_below": "[ True True True True True True True True]", "bounded_above": "[ True True True True True True True True]", "_np_random": null}, "n_envs": 4, "num_timesteps": 2000000, "_total_timesteps": 2000000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1678359694265281562, "learning_rate": 0.00096, "tensorboard_log": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVwwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOS9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS4JDAgABlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOS9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoFmgNjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoF4wHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/T3UQTVUdaYWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="}, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVNQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJbAAQAAAAAAAN+5rL7Ur04+gS0QP4wl/72/woM+xNW0v54LFz8g0ds8oYOHPk3vFL/cxUY+0TaQvwgfIL/tZ/Y+P4uBvkFqSj4frNg+L8ygP0uBDD/Q48S+jMCFvll3XD+ISRW/MCigP+c1Lj8Qt6g+vX0MPwdojr/D5i0/B3oFPrk8DD+mNlE//8ccwPgpBMA6bUO+Xt5XvxUdXz8zkVu/21waPxrrLcA8mRS/u0A7vxkRJD7LB+c/taOtv901KT947DE/zE1aPC+BLr8+IS68WfAfP99zaEDnNS4/jThCwCY96b8HaI6/8OIiPrM8Z76j8dY+zDoBQGfwsz9c6Ni++Wn3PtrRkT8bCJ2/hV0mvw/5Ub9Z8Rw/BVjSvvJxJEADqJ+/i6nXPslfyz/5Uls7DvQcvmvQCcDl1lu/RMDCuH0DlL5yPvQ9Hhi8vxC3qD4mPem/IhpmP+y+z73YzsE+U0wWP/Z9hj02y8C/eVaLP5N4a70jjUK/q1QZPtoWXT8Ym/k+h7N0vp567z7Cicw9TcJCP7L7T7ts3Ke+/OXovtCsID8rBia//+9Zv4VQoDzj20O/+3kFP+c1Lj8Qt6g+vX0MPwdojr+UjAVudW1weZSMBWR0eXBllJOUjAJmNJSJiIeUUpQoSwOMATyUTk5OSv////9K/////0sAdJRiSwRLHIaUjAFDlHSUUpQu"}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYEAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSwSFlIwBQ5R0lFKULg=="}, "_last_original_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVNQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJbAAQAAAAAAAAAAAABHBvY1AACAPwAAAAAAAAAAAAAAAAAAAAAAAACA3JoQvgAAAAB1j/O/AAAAAG9ZBD4AAAAAdaDfPwAAAAA5o/a9AAAAANI04j8AAAAAzEWdPQAAAAAlXva/AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAdC22NgAAgD8AAAAAAAAAAAAAAAAAAAAAAAAAgETFor0AAAAAAOUAwAAAAABsv+Q9AAAAAD7x8z8AAAAAbhvhPQAAAADvUOM/AAAAAIHFiz0AAAAAWYn/vwAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAH8NlrUAAIA/AAAAAAAAAAAAAAAAAAAAAAAAAIAHmnc8AAAAAIPR+78AAAAANF9AvQAAAABBhPQ/AAAAAO8Gc70AAAAAje/6PwAAAADC1Zq9AAAAAD/e5r8AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA8CXm1AACAPwAAAAAAAAAAAAAAAAAAAAAAAACA/RFKvQAAAABf6Pm/AAAAAP/LzrwAAAAAVWnwPwAAAADJXoo9AAAAAOoX+z8AAAAAonEAPgAAAAARiPC/AAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJmNJSJiIeUUpQoSwOMATyUTk5OSv////9K/////0sAdJRiSwRLHIaUjAFDlHSUUpQu"}, "_episode_num": 0, "use_sde": true, "sde_sample_freq": -1, "_current_progress_remaining": 0.0, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVRAwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQHHTNm+TNdKMAWyUTegDjAF0lEdAqsqeX9itrHV9lChoBkdAhOpneizsyGgHTegDaAhHQKrLXsgMc6x1fZQoaAZHQJF9+/RE4NtoB03oA2gIR0CqzMJ3PiT/dX2UKGgGR0CUvlJx//edaAdN6ANoCEdAqtFhXhfjTHV9lChoBkdAgwI0iY9gW2gHTegDaAhHQKrY4DSw4bV1fZQoaAZHQIwwtix3V09oB03oA2gIR0Cq2VKf4AS4dX2UKGgGR0CYnr1YhdMTaAdN6ANoCEdAqtov5rP+oHV9lChoBkdAl3QMtGus92gHTegDaAhHQKrdalv60pp1fZQoaAZHQIadpW1c+q1oB03oA2gIR0Cq5ZZ8rqdIdX2UKGgGR0CRxR1SflIVaAdN6ANoCEdAquZEB8x9HHV9lChoBkdAggeiXY150WgHTegDaAhHQKrnjuP3i711fZQoaAZHQJUuXu7YkE9oB03oA2gIR0Cq7JVVYISldX2UKGgGR0CRNKWU8mrsaAdN6ANoCEdAqvSL3XZoPHV9lChoBkdAfyubC79Q42gHTegDaAhHQKr1BBJqZc91fZQoaAZHQJQnEAxSHdpoB03oA2gIR0Cq9d6h6By0dX2UKGgGR0CTS72Yv38GaAdN6ANoCEdAqvk9d9lVcXV9lChoBkdAkwwitV7x/mgHTegDaAhHQKsAylk6Lfl1fZQoaAZHQJGK7oePq9poB03oA2gIR0CrAUJGFzuGdX2UKGgGR0CVXEJJGvwFaAdN6ANoCEdAqwJlNBWxQnV9lChoBkdAlZBeY2Kl6GgHTegDaAhHQKsHRRLK3d91fZQoaAZHQJWXcQZn+Q5oB03oA2gIR0CrEB17pmmMdX2UKGgGR0CL9mtapxWDaAdN6ANoCEdAqxCN4cFQmHV9lChoBkdAkinUlZ5iVmgHTegDaAhHQKsRb+3H7xd1fZQoaAZHQJE9Pi97F85oB03oA2gIR0CrFLjZ+QU6dX2UKGgGR0CT2+cR15jZaAdN6ANoCEdAqxxU5hjOLXV9lChoBkdAkBfBCUornWgHTegDaAhHQKscxUPQOWl1fZQoaAZHQJJctzvJA+poB03oA2gIR0CrHaTvqkdndX2UKGgGR0CTdxojv/ipaAdN6ANoCEdAqyHtUXHim3V9lChoBkdAk7cFUdaMaWgHTegDaAhHQKsrqMn7YTV1fZQoaAZHQJNzYAeaKDVoB03oA2gIR0CrLCARTS9edX2UKGgGR0CDI0y0KJEZaAdN6ANoCEdAqy0Dn3cpLHV9lChoBkdAkdpR3mmtQ2gHTegDaAhHQKswTKe05U91fZQoaAZHQI9bbDbah6BoB03oA2gIR0CrN9Lns9jgdX2UKGgGR0CQkZKR+z+naAdN6ANoCEdAqzhCfpUxVXV9lChoBkdAkGfN8E3bVWgHTegDaAhHQKs5JJeVs1t1fZQoaAZHQJDXcIHC4z9oB03oA2gIR0CrPMdtMwlCdX2UKGgGR0CIZQJa7mMgaAdN6ANoCEdAq0dHkDIRy3V9lChoBkdAlL42GRFI/mgHTegDaAhHQKtHuGyon8d1fZQoaAZHQJGtQYDTz/ZoB03oA2gIR0CrSJqHwgDBdX2UKGgGR0CJdMV+I/JOaAdN6ANoCEdAq0vuoYNy53V9lChoBkdAkXeVr6+FlGgHTegDaAhHQKtTsvM8ox51fZQoaAZHQId3G0PYnOVoB03oA2gIR0CrVCl4keIVdX2UKGgGR0CHYNFMqSX/aAdN6ANoCEdAq1UNOKwY+HV9lChoBkdAkvLmvfTCtWgHTegDaAhHQKtYX1pTMq11fZQoaAZHQJAZSlVLi/BoB03oA2gIR0CrYwaxPfsNdX2UKGgGR0CRTs+S8rZraAdN6ANoCEdAq2N+KCQLeHV9lChoBkdAkoq1ivxH5WgHTegDaAhHQKtkYIv8IiV1fZQoaAZHQI/g6Rhc7hhoB03oA2gIR0CrZ7Jkwvg4dX2UKGgGR0CR8vbY9Pk8aAdN6ANoCEdAq29YvJzT4XV9lChoBkdAkyoqx9oexWgHTegDaAhHQKtvzEpiI+J1fZQoaAZHQJSlQWSEDhdoB03oA2gIR0CrcKjDTBqLdX2UKGgGR0CUZLRfnfVJaAdN6ANoCEdAq3PgKMNtqHV9lChoBkdAkmdxaPjn3mgHTegDaAhHQKt+Et+1Bt11fZQoaAZHQJOx3B0p3HJoB03oA2gIR0Crfr8u8K5TdX2UKGgGR0CHsI6WgOBlaAdN6ANoCEdAq3+9dVvMr3V9lChoBkdAlpjpwbVBlmgHTegDaAhHQKuDDmcvugJ1fZQoaAZHQJFvJ8Rcu8NoB03oA2gIR0CripxFqi48dX2UKGgGR0CUpR9Gqgh9aAdN6ANoCEdAq4sSeiBXjnV9lChoBkdAkdEUCq6vq2gHTegDaAhHQKuL+XvYvnN1fZQoaAZHQJVVTFhoduJoB03oA2gIR0Crjz1MmF8HdX2UKGgGR0CWdS0Z3s5XaAdN6ANoCEdAq5iOACnxa3V9lChoBkdAlz6CDqW1MWgHTegDaAhHQKuZQZBLPD51fZQoaAZHQJTysIKMNttoB03oA2gIR0Crmpg2ZRbbdX2UKGgGR0CYW5yD7IkraAdN6ANoCEdAq55wiA2AG3V9lChoBkdAkwvVSflIVmgHTegDaAhHQKul6F23azx1fZQoaAZHQJKHNV0cOsloB03oA2gIR0CrplmQr+YMdX2UKGgGR0CTBIcnVoYfaAdN6ANoCEdAq6c9PtUn5XV9lChoBkdAl/hRgZ0jkmgHTegDaAhHQKuqexgRbr11fZQoaAZHQJXsU+2VmjFoB03oA2gIR0CrsqeCsfaIdX2UKGgGR0CVRFcPvrnlaAdN6ANoCEdAq7NPbmEGq3V9lChoBkdAlM8Risny/mgHTegDaAhHQKu0qT0QK8d1fZQoaAZHQIwsR17pmmNoB03oA2gIR0CruYZL7GeddX2UKGgGR0B6JmwHJLdvaAdN6ANoCEdAq8ELTtsvZnV9lChoBkdAlJQNCmdiD2gHTegDaAhHQKvBfp7CzkZ1fZQoaAZHQIXHptgrpaBoB03oA2gIR0CrwlsoUi6hdX2UKGgGR0CUNe5KvmozaAdN6ANoCEdAq8WkZJkGzXV9lChoBkdAk6n7ONYKY2gHTegDaAhHQKvNSlqrR0F1fZQoaAZHQJXTCe18b71oB03oA2gIR0Crzgm7rcCYdX2UKGgGR0CYsLFY+0PZaAdN6ANoCEdAq89Jy6tknXV9lChoBkdAkfCITfzjFWgHTegDaAhHQKvUQy6cy311fZQoaAZHQJVkbkzXSShoB03oA2gIR0Cr3HrZSNwSdX2UKGgGR0CDBBv0h/y5aAdN6ANoCEdAq9zp+4LCvXV9lChoBkdAkz12/zreImgHTegDaAhHQKvdxCb+cYt1fZQoaAZHQJh/Ndt2s7xoB03oA2gIR0Cr4QxSxZ+ydX2UKGgGR0CNS2cH4XXRaAdN6ANoCEdAq+iqzPa+OHV9lChoBkdAhrcdAHE/B2gHTegDaAhHQKvpGzhxYJV1fZQoaAZHQJJJtPci4axoB03oA2gIR0Cr6gIIWxhVdX2UKGgGR0CWLYkwevIPaAdN6ANoCEdAq+6k4m1IAnV9lChoBkdAj7uoVdonKGgHTegDaAhHQKv38wxFiKB1fZQoaAZHQI0xoQxvegtoB03oA2gIR0Cr+GUSAYpEdX2UKGgGR0CSQVYjSofkaAdN6ANoCEdAq/lIphF3IXV9lChoBkdAkejBGhEjPmgHTegDaAhHQKv8hNbkfcN1fZQoaAZHQIBAUR15jYtoB03oA2gIR0CsBCYm9g4PdX2UKGgGR0CUPBgPVd5ZaAdN6ANoCEdArASXQ+lj3HV9lChoBkdAksHpL26ClWgHTegDaAhHQKwFdF9a2Wp1fZQoaAZHQJQANNTLns9oB03oA2gIR0CsCUPWQOnVdX2UKGgGR0CXQ6Wf9P1taAdN6ANoCEdArBMvNRm9QHV9lChoBkdAlljNTDO1OWgHTegDaAhHQKwTrcyFfzB1fZQoaAZHQJULj+rELploB03oA2gIR0CsFI9W6shgdX2UKGgGR0CVhS1gH/tIaAdN6ANoCEdArBfMXxe9jHVlLg=="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 62500, "n_steps": 8, "gamma": 0.99, "gae_lambda": 0.9, "ent_coef": 0.0, "vf_coef": 0.4, "max_grad_norm": 0.5, "normalize_advantage": false, "system_info": {"OS": "Linux-5.10.147+-x86_64-with-glibc2.31 # 1 SMP Sat Dec 10 16:00:40 UTC 2022", "Python": "3.9.16", "Stable-Baselines3": "1.7.0", "PyTorch": "1.13.1+cu116", "GPU Enabled": "True", "Numpy": "1.22.4", "Gym": "0.21.0"}}
 
1
+ {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7f8a366e65e0>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f8a366e6670>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f8a366e6700>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f8a366e6790>", "_build": "<function ActorCriticPolicy._build at 0x7f8a366e6820>", "forward": "<function ActorCriticPolicy.forward at 0x7f8a366e68b0>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x7f8a366e6940>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f8a366e69d0>", "_predict": "<function ActorCriticPolicy._predict at 0x7f8a366e6a60>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f8a366e6af0>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f8a366e6b80>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f8a366e6c10>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7f8a366e7a40>"}, "verbose": 1, "policy_kwargs": {":type:": "<class 'dict'>", ":serialized:": "gAWVowAAAAAAAAB9lCiMDGxvZ19zdGRfaW5pdJRK/v///4wKb3J0aG9faW5pdJSJjA9vcHRpbWl6ZXJfY2xhc3OUjBN0b3JjaC5vcHRpbS5ybXNwcm9wlIwHUk1TcHJvcJSTlIwQb3B0aW1pemVyX2t3YXJnc5R9lCiMBWFscGhhlEc/764UeuFHrowDZXBzlEc+5Pi1iONo8YwMd2VpZ2h0X2RlY2F5lEsAdXUu", "log_std_init": -2, "ortho_init": false, "optimizer_class": "<class 'torch.optim.rmsprop.RMSprop'>", "optimizer_kwargs": {"alpha": 0.99, "eps": 1e-05, "weight_decay": 0}}, "observation_space": {":type:": "<class 'gym.spaces.box.Box'>", ":serialized:": "gAWVZwIAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLHIWUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWcAAAAAAAAAAAAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/lGgKSxyFlIwBQ5R0lFKUjARoaWdolGgSKJZwAAAAAAAAAAAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH+UaApLHIWUaBV0lFKUjA1ib3VuZGVkX2JlbG93lGgSKJYcAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUaAeMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLHIWUaBV0lFKUjA1ib3VuZGVkX2Fib3ZllGgSKJYcAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUaCFLHIWUaBV0lFKUjApfbnBfcmFuZG9tlE51Yi4=", "dtype": "float32", "_shape": [28], "low": "[-inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf\n -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf]", "high": "[inf inf inf inf inf inf inf inf inf inf inf inf inf inf inf inf inf inf\n inf inf inf inf inf inf inf inf inf inf]", "bounded_below": "[False False False False False False False False False False False False\n False False False False False False False False False False False False\n False False False False]", "bounded_above": "[False False False False False False False False False False False False\n False False False False False False False False False False False False\n False False False False]", "_np_random": null}, "action_space": {":type:": "<class 'gym.spaces.box.Box'>", ":serialized:": "gAWVnwEAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLCIWUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWIAAAAAAAAAAAAIC/AACAvwAAgL8AAIC/AACAvwAAgL8AAIC/AACAv5RoCksIhZSMAUOUdJRSlIwEaGlnaJRoEiiWIAAAAAAAAAAAAIA/AACAPwAAgD8AAIA/AACAPwAAgD8AAIA/AACAP5RoCksIhZRoFXSUUpSMDWJvdW5kZWRfYmVsb3eUaBIolggAAAAAAAAAAQEBAQEBAQGUaAeMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLCIWUaBV0lFKUjA1ib3VuZGVkX2Fib3ZllGgSKJYIAAAAAAAAAAEBAQEBAQEBlGghSwiFlGgVdJRSlIwKX25wX3JhbmRvbZROdWIu", "dtype": "float32", "_shape": [8], "low": "[-1. -1. -1. -1. -1. -1. -1. -1.]", "high": "[1. 1. 1. 1. 1. 1. 1. 1.]", "bounded_below": "[ True True True True True True True True]", "bounded_above": "[ True True True True True True True True]", "_np_random": null}, "n_envs": 4, "num_timesteps": 1000000, "_total_timesteps": 1000000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1678394102036149900, "learning_rate": 0.00096, "tensorboard_log": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVwwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOS9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS4JDAgABlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOS9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoFmgNjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoF4wHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/T3UQTVUdaYWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="}, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVNQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJbAAQAAAAAAAKJW0D5dNVA+WPQHPzydAkD8mSs+dpceP9icAr+ziYU+5gISPue7gT7sSWi/kR8BP901rT23f8I/gqTsvBSB0TxecQw/xq0PQBaPPL9FfzS/bZdpv2t6gL8pYB0/vaJ+PbvUmb+AFAo/yYamPlcsMT/mRY0+jhmhv0V8Ez8g0RNASmQKvoKxLT/9aRK/SZe4PgskcD9d29m+0s09vmQwID8RWVY/I1Pvv+tCuz2CcXy/lNGBP2E8DcCgX3i/K8FWP9bSQ748M7S+GJsIv9Uag8BUA1U/gBQKP8mGpj7v8ri/K6gaP3rYwT63Gd8+3iYPQG3/WT+hhL69zG8ePyWpB78RqHQ/XIV9v1vgRr/Jdzs/XOmJPzfJKD3nJse9jPe3P6cw7D+fEJ2/3/K8PZYE7z6noWa/RQQ2PRSGnj2dboC8u9SZv4AUCj/JhqY+VywxP7q7Xb/3/Ii/bR8kP3VfOz8Kl0nAbS0PPzVzH74csLm+7lZiP3v1bb/mJX6+B/ofvqOHWL9hHUPAJ98kP5utpL6/a8M9xlIDwMgfSD/VV6m7UEdnv0sfiTzBNnK/5diNvFQDVT+AFAo/yYamPu/yuL+UjAVudW1weZSMBWR0eXBllJOUjAJmNJSJiIeUUpQoSwOMATyUTk5OSv////9K/////0sAdJRiSwRLHIaUjAFDlHSUUpQu"}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYEAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSwSFlIwBQ5R0lFKULg=="}, "_last_original_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVNQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJbAAQAAAAAAAAAAAAAT6dK1AACAPwAAAAAAAAAAAAAAAAAAAAAAAACAw+z4PQAAAABYhdy/AAAAANeGtrwAAAAAIj/oPwAAAACD12E9AAAAAGVk4T8AAAAAalWSvAAAAACk2QDAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAApGNRtgAAgD8AAAAAAAAAAAAAAAAAAAAAAAAAgL14Ej4AAAAA33XlvwAAAABMZ/Y8AAAAAKrE/T8AAAAAy353vQAAAAAUx+o/AAAAAGhdCb0AAAAAe4vavwAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAG58BjYAAIA/AAAAAAAAAAAAAAAAAAAAAAAAAICYs7A9AAAAAHfy8r8AAAAA3L6xPQAAAADbW90/AAAAAOm6TzsAAAAAhzH6PwAAAAAliKG9AAAAAJOE678AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAABRUcC2AACAPwAAAAAAAAAAAAAAAAAAAAAAAACAU+MFvQAAAABdAuO/AAAAAHKf970AAAAA3xHjPwAAAAAq/ZC9AAAAAMBn+T8AAAAAMeq0PQAAAAA+fuG/AAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJmNJSJiIeUUpQoSwOMATyUTk5OSv////9K/////0sAdJRiSwRLHIaUjAFDlHSUUpQu"}, "_episode_num": 0, "use_sde": true, "sde_sample_freq": -1, "_current_progress_remaining": 0.0, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVRAwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQJ4+akdmxt6MAWyUTegDjAF0lEdAmZ545HVf/nV9lChoBkdAmyhJ1Ng0CWgHTegDaAhHQJmn05tFa0R1fZQoaAZHQJ8Z+cYqG1xoB03oA2gIR0CZrtJrLyMDdX2UKGgGR0CZple4Cp3paAdN6ANoCEdAma80AcT8HnV9lChoBkdAmQVoePq9oWgHTegDaAhHQJm4eZ1FH8V1fZQoaAZHQJpJ0EEC/49oB03oA2gIR0CZv/N6PbPAdX2UKGgGR0CYBrVKPGQ0aAdN6ANoCEdAmcbJVGTcI3V9lChoBkdAk/8iRjjJdWgHTegDaAhHQJnHIjmjj711fZQoaAZHQJmL0tapxWFoB03oA2gIR0CZ0l+LWI43dX2UKGgGR0Cd1PZbY9PlaAdN6ANoCEdAmd33LA57xHV9lChoBkdAmss1yR0U5GgHTegDaAhHQJnlicf/3nJ1fZQoaAZHQJui89/z8P5oB03oA2gIR0CZ5eoRqXWwdX2UKGgGR0Cb8OjVhCtzaAdN6ANoCEdAme83BxgiNnV9lChoBkdAnomnTI/7i2gHTegDaAhHQJn2sjMV1wJ1fZQoaAZHQJ07l35eqrBoB03oA2gIR0CZ/dPEbYK6dX2UKGgGR0CdfTC+10DEaAdN6ANoCEdAmf40FB6a9nV9lChoBkdAmnPBxPwd82gHTegDaAhHQJoHc0cfeUJ1fZQoaAZHQJwt5wYLsrxoB03oA2gIR0CaEi482aUidX2UKGgGR0CfAek0rK/3aAdN6ANoCEdAmhzGUB4lhXV9lChoBkdAmykNVinYQWgHTegDaAhHQJodIxpL26F1fZQoaAZHQJrFK11GLDRoB03oA2gIR0CaJl0/nnuBdX2UKGgGR0CaM0a6z3RHaAdN6ANoCEdAmi2tsvZh8nV9lChoBkdAmmEhRMvh62gHTegDaAhHQJo0nTd+G491fZQoaAZHQJk19CPZIxxoB03oA2gIR0CaNPiEg4ffdX2UKGgGR0CXy7frrxAjaAdN6ANoCEdAmj4abe/HpHV9lChoBkdAmgjQw482aWgHTegDaAhHQJpGM8IRh+h1fZQoaAZHQJTFEogFHJ9oB03oA2gIR0CaUI8Djin6dX2UKGgGR0CMyMnNPgvUaAdN6ANoCEdAmlEtbLU1AXV9lChoBkdAmV1RXS0BwWgHTegDaAhHQJpdUxoIv8J1fZQoaAZHQJX/it+1Bt1oB03oA2gIR0CaZLRfWtlqdX2UKGgGR0CZQg3ZPEbYaAdN6ANoCEdAmmuFdC3PRnV9lChoBkdAmErczVMEimgHTegDaAhHQJpr34nF5v91fZQoaAZHQJm5WS2Yv39oB03oA2gIR0CadRctGus+dX2UKGgGR0CYq/fyf+S9aAdN6ANoCEdAmnxRqGlANXV9lChoBkdAlVwQn+hoNGgHTegDaAhHQJqEWr4nF5x1fZQoaAZHQJr3krqdH2BoB03oA2gIR0CahN3oLXtjdX2UKGgGR0CagDVRUFSsaAdN6ANoCEdAmpLXxnWat3V9lChoBkdAmnrxp1zQu2gHTegDaAhHQJqbQhyKekJ1fZQoaAZHQJw8NJe3QUpoB03oA2gIR0CaoiBMzuWsdX2UKGgGR0Cb/kku6ErYaAdN6ANoCEdAmqKBhH9WIXV9lChoBkdAmdBX9R77bmgHTegDaAhHQJqr8UoKD011fZQoaAZHQJVQovugHu9oB03oA2gIR0Cas2mjTKDDdX2UKGgGR0CZZyIyCWeIaAdN6ANoCEdAmrpP5DZ13nV9lChoBkdAl1hr349HMGgHTegDaAhHQJq6qUC7sfJ1fZQoaAZHQJwoTmV7hNxoB03oA2gIR0CaxuNGmUGFdX2UKGgGR0CWDC3evZAZaAdN6ANoCEdAmtJUvPC2t3V9lChoBkdAmHfzkU9IPWgHTegDaAhHQJrZKgvlEJB1fZQoaAZHQJledsqJ/G5oB03oA2gIR0Ca2YEhJRO2dX2UKGgGR0Cbs/Iv8IiUaAdN6ANoCEdAmuKsS9M9KXV9lChoBkdAmR8J9d/rjmgHTegDaAhHQJrqEVO9FnZ1fZQoaAZHQJqUtm7J4jdoB03oA2gIR0Ca8RQA+6iCdX2UKGgGR0CIFBN0NjLCaAdN6ANoCEdAmvFwMc6vJXV9lChoBkdAlt4hBE8aGmgHTegDaAhHQJr7Mo8ZDRd1fZQoaAZHQJaTkRnOB19oB03oA2gIR0CbBiE3bVSXdX2UKGgGR0CW95Pz4DcNaAdN6ANoCEdAmxAD987ZF3V9lChoBkdAnKFKqfe1r2gHTegDaAhHQJsQWnwXqJN1fZQoaAZHQJ6tgWEbo8poB03oA2gIR0CbGaRU3n6mdX2UKGgGR0CdMd+SKWLQaAdN6ANoCEdAmyDyquKXOXV9lChoBkdAmO9DO1OTJWgHTegDaAhHQJsnyF6Avtd1fZQoaAZHQJxfxEQXhwVoB03oA2gIR0CbKCqcVgx8dX2UKGgGR0CcNZ5UtI07aAdN6ANoCEdAmzGFndweeXV9lChoBkdAl/FEm6XjVGgHTegDaAhHQJs58CyQgcN1fZQoaAZHQJMOtjPOY6ZoB03oA2gIR0CbRIhpxm03dX2UKGgGR0CSHl5O8CgcaAdN6ANoCEdAm0Uv0h/y5XV9lChoBkdAi27zcIqsl2gHTegDaAhHQJtQ/b5/LDB1fZQoaAZHQJKeXe2uxKRoB03oA2gIR0CbWFo8IRh+dX2UKGgGR0CaIir2xptaaAdN6ANoCEdAm19U5EMLGHV9lChoBkdAl2ZuDFqBVmgHTegDaAhHQJtfrqTr3TN1fZQoaAZHQJkS0uZkTYdoB03oA2gIR0CbaOHtF8XvdX2UKGgGR0CYKQlkYoAoaAdN6ANoCEdAm3BhjawljXV9lChoBkdAlLubaVUuMGgHTegDaAhHQJt4/ZFocrB1fZQoaAZHQJXKzMdLg4xoB03oA2gIR0CbeX1xsEaEdX2UKGgGR0CT6SUWVNYbaAdN6ANoCEdAm4lUjgQ6IXV9lChoBkdAls2TFdcB2mgHTegDaAhHQJuUfS6UaAF1fZQoaAZHQJkAgG+sYEZoB03oA2gIR0Cbnax0+1SgdX2UKGgGR0CaRS1TBInSaAdN6ANoCEdAm54GGZeAu3V9lChoBkdAmJ6QLJCBw2gHTegDaAhHQJunU2R7qpt1fZQoaAZHQJjemUzKs+5oB03oA2gIR0CbrrT0xubadX2UKGgGR0CW5fqCHymRaAdN6ANoCEdAm7d9LxqfvnV9lChoBkdAnH+4DLbHqGgHTegDaAhHQJu3/esPrfN1fZQoaAZHQJqXnYbsF+xoB03oA2gIR0Cbxn+IMz/IdX2UKGgGR0CVzuwKjSG8aAdN6ANoCEdAm834BmwqzHV9lChoBkdAmMeodlum8GgHTegDaAhHQJvU+W6bvw51fZQoaAZHQJlk1wJgLJFoB03oA2gIR0Cb1VqLjxTbdX2UKGgGR0CbW5EFGG21aAdN6ANoCEdAm96h6a9bo3V9lChoBkdAnHMqdUbT+mgHTegDaAhHQJvmEXfqHGl1fZQoaAZHQJxIhdPci4doB03oA2gIR0Cb7RrrPdEcdX2UKGgGR0CePKaqjrRjaAdN6ANoCEdAm+2L3oLXtnV9lChoBkdAnJiahxo7FWgHTegDaAhHQJv66S4e9zx1fZQoaAZHQJ3X9eruIARoB03oA2gIR0CcBP2v0RODdX2UKGgGR0CZRaPkJa7maAdN6ANoCEdAnAv5LM9r43V9lChoBkdAnAZfFNtZWGgHTegDaAhHQJwMUk/r0J51fZQoaAZHQJuhbvUjLSxoB03oA2gIR0CcFY4gA6uGdX2UKGgGR0Ca++PxhDw6aAdN6ANoCEdAnBzqwMYuTXV9lChoBkdAm+rPMfRu0mgHTegDaAhHQJwjxOsT37F1fZQoaAZHQJ8OSMir1dxoB03oA2gIR0CcJDBfa6BidX2UKGgGR0CRDzTpgTh6aAdN6ANoCEdAnC6MC5mRNnV9lChoBkdAlzpCjL0SRWgHTegDaAhHQJw6QFA3T/h1fZQoaAZHQJ0DX/DLr5ZoB03oA2gIR0CcQ0MVDa4+dX2UKGgGR0CUJjZbY9PlaAdN6ANoCEdAnEOc2R7qp3VlLg=="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 31250, "n_steps": 8, "gamma": 0.99, "gae_lambda": 0.9, "ent_coef": 0.0, "vf_coef": 0.4, "max_grad_norm": 0.5, "normalize_advantage": false, "system_info": {"OS": "Linux-5.10.147+-x86_64-with-glibc2.31 # 1 SMP Sat Dec 10 16:00:40 UTC 2022", "Python": "3.9.16", "Stable-Baselines3": "1.7.0", "PyTorch": "1.13.1+cu116", "GPU Enabled": "True", "Numpy": "1.22.4", "Gym": "0.21.0"}}
replay.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fd6842ae12f8f893ed1789f6bbe9fdcf42c6b920cd7d184e4b1f333bcfae8bfc
3
- size 1007985
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3acbcbb596a86a110db590335ad65d6444069a75ec123ca15609e1abef7aefe5
3
+ size 1047779
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 1372.0752115952084, "std_reward": 130.56269936412838, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2023-03-09T12:01:05.393571"}
 
1
+ {"mean_reward": 1921.019142676075, "std_reward": 58.45747045939283, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2023-03-09T21:04:50.854958"}
vec_normalize.pkl CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f685035646e46623d96e31c798ee960b02969500ab5487d88b1f9868e3f86713
3
  size 2136
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:85bd97a847759bec332370599050fa592ed32bc080adba881016591b5b8ec9db
3
  size 2136