AntiSquid commited on
Commit
f2e32b9
1 Parent(s): 1d1b936

Initial commit

Browse files
README.md CHANGED
@@ -8,17 +8,16 @@ tags:
8
  model-index:
9
  - name: A2C
10
  results:
11
- - task:
 
 
 
 
12
  type: reinforcement-learning
13
  name: reinforcement-learning
14
  dataset:
15
  name: AntBulletEnv-v0
16
  type: AntBulletEnv-v0
17
- metrics:
18
- - type: mean_reward
19
- value: 978.60 +/- 103.55
20
- name: mean_reward
21
- verified: false
22
  ---
23
 
24
  # **A2C** Agent playing **AntBulletEnv-v0**
 
8
  model-index:
9
  - name: A2C
10
  results:
11
+ - metrics:
12
+ - type: mean_reward
13
+ value: 911.55 +/- 62.62
14
+ name: mean_reward
15
+ task:
16
  type: reinforcement-learning
17
  name: reinforcement-learning
18
  dataset:
19
  name: AntBulletEnv-v0
20
  type: AntBulletEnv-v0
 
 
 
 
 
21
  ---
22
 
23
  # **A2C** Agent playing **AntBulletEnv-v0**
a2c-AntBulletEnv-v0.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fdd379a130b322112570c01378e2083ba797094b413dd1546434c284caedd12a
3
- size 129255
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:16db8cbbd652988538246752fe292328ce0d18095ff2ba372b272dcaa097d621
3
+ size 128804
a2c-AntBulletEnv-v0/_stable_baselines3_version CHANGED
@@ -1 +1 @@
1
- 1.7.0
 
1
+ 1.5.0
a2c-AntBulletEnv-v0/data CHANGED
@@ -3,21 +3,20 @@
3
  ":type:": "<class 'abc.ABCMeta'>",
4
  ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
5
  "__module__": "stable_baselines3.common.policies",
6
- "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
7
- "__init__": "<function ActorCriticPolicy.__init__ at 0x7f28d61b7040>",
8
- "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f28d61b70d0>",
9
- "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f28d61b7160>",
10
- "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f28d61b71f0>",
11
- "_build": "<function ActorCriticPolicy._build at 0x7f28d61b7280>",
12
- "forward": "<function ActorCriticPolicy.forward at 0x7f28d61b7310>",
13
- "extract_features": "<function ActorCriticPolicy.extract_features at 0x7f28d61b73a0>",
14
- "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f28d61b7430>",
15
- "_predict": "<function ActorCriticPolicy._predict at 0x7f28d61b74c0>",
16
- "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f28d61b7550>",
17
- "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f28d61b75e0>",
18
- "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f28d61b7670>",
19
  "__abstractmethods__": "frozenset()",
20
- "_abc_impl": "<_abc_data object at 0x7f28d61aeb40>"
21
  },
22
  "verbose": 1,
23
  "policy_kwargs": {
@@ -64,24 +63,24 @@
64
  "_num_timesteps_at_start": 0,
65
  "seed": null,
66
  "action_noise": null,
67
- "start_time": 1676834158394097657,
68
  "learning_rate": 0.0001,
69
  "tensorboard_log": null,
70
  "lr_schedule": {
71
  ":type:": "<class 'function'>",
72
- ":serialized:": "gAWVwwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOC9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS4JDAgABlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOC9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoFmgNjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoF4wHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/Gjbi6xxDLYWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="
73
  },
74
  "_last_obs": {
75
  ":type:": "<class 'numpy.ndarray'>",
76
- ":serialized:": "gAWVNQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJbAAQAAAAAAAJnXyb8wtk4/H37TPCr+3b4fVyS+cTynPffwmr6yWEw/bxdcP/MGBbxiNZa/ADIZvSWyk7+4ZuO7jmgsP3N3Fz2oyMc/PRksPAfpwT6IOzs93dIOvxCTbzytlFO/6PAvvW7e/z7XHug+2LfDPsKz7z69m4y/Y1TLP+ap5L+pvTw/+xQIP1Wzhz/THaw9cBwDPpTNLz+6Yt484TIcv+Tlaz5vXwU/l4Yev7ZWFj+OOWu+oguMPxvXFL/tnSc/EK37vYrBV78P3Qs9fU1Vv7Q4rT1u3v8+1x7oPti3wz7Cs+8+B3Bzv+9XGT/f4WU+DSGpP/Tvvb9Zwgs+HLX9Pf7jMT75WC0/o4O1viQ2B78HnfO9T39sv591GMB1/iU/6HYavtUvXD+GPIS/GbMXP2Ozor4fkkO/9k94P3mvU79CEqS7bt7/PgYrDcDYt8M+9bMIwIZUmr9R/Lk/eZdYwB476L623l+/EMJ5P0Jesb7Snno/FHxFPwvwm75wOo2/6VikvpSbBr4Bb9K/FruNPkN69z28ydY/eRNjvugBCj4u1li/4DRBPvbQAL4WvlK/5gWCPm7e/z7XHug+2LfDPsKz7z6UjAVudW1weZSMBWR0eXBllJOUjAJmNJSJiIeUUpQoSwOMATyUTk5OSv////9K/////0sAdJRiSwRLHIaUjAFDlHSUUpQu"
77
  },
78
  "_last_episode_starts": {
79
  ":type:": "<class 'numpy.ndarray'>",
80
- ":serialized:": "gAWVdwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYEAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSwSFlIwBQ5R0lFKULg=="
81
  },
82
  "_last_original_obs": {
83
  ":type:": "<class 'numpy.ndarray'>",
84
- ":serialized:": "gAWVNQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJbAAQAAAAAAAAAAAADtjtM1AACAPwAAAAAAAAAAAAAAAAAAAAAAAACAMcW0vQAAAAA/Z/y/AAAAAGiSQb0AAAAAcZf3PwAAAAAGSBo9AAAAAP5H/j8AAAAAmKBiPAAAAAA3MvK/AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAG6k1tgAAgD8AAAAAAAAAAAAAAAAAAAAAAAAAgLRIQ70AAAAAEwT8vwAAAAD+Ueq9AAAAAFh1/T8AAAAAr8mPvAAAAADpzv8/AAAAALHNGD0AAAAAVWv1vwAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAADDYS7UAAIA/AAAAAAAAAAAAAAAAAAAAAAAAAIDqVxw9AAAAAHR8278AAAAAhkaTPAAAAAAFYwBAAAAAANVhnr0AAAAAzZntPwAAAAAcpYa9AAAAAHUa/b8AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAJi61AACAPwAAAAAAAAAAAAAAAAAAAAAAAACAJjNcvQAAAACQH/W/AAAAAESJTz0AAAAAwzTsPwAAAABwKtG9AAAAADTH8D8AAAAAfybiPAAAAACWVvu/AAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJmNJSJiIeUUpQoSwOMATyUTk5OSv////9K/////0sAdJRiSwRLHIaUjAFDlHSUUpQu"
85
  },
86
  "_episode_num": 0,
87
  "use_sde": true,
@@ -89,7 +88,7 @@
89
  "_current_progress_remaining": 0.0,
90
  "ep_info_buffer": {
91
  ":type:": "<class 'collections.deque'>",
92
- ":serialized:": "gAWVQwwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQI0o6zHCGeuMAWyUTegDjAF0lEdAq3Mo3eenRHV9lChoBkdAjYXxG2Cul2gHTegDaAhHQKt1gBdUsFt1fZQoaAZHQIq9CfOD8LtoB03oA2gIR0CrdzKTjebedX2UKGgGR0CN8NbnoxHoaAdN6ANoCEdAq3+HGlyimHV9lChoBkdAjRrpkwvg32gHTegDaAhHQKuBoc+7lJZ1fZQoaAZHQI7HIuIyj59oB03oA2gIR0CrhXFAE+xGdX2UKGgGR0CRmabiIcioaAdN6ANoCEdAq4gfJYDDCXV9lChoBkdAkBhoIOYplWgHTegDaAhHQKuPpJbMX8B1fZQoaAZHQI6zr+WGATZoB03oA2gIR0CrkPMqril0dX2UKGgGR0COqR9vS+g2aAdN6ANoCEdAq5M7Jr+HanV9lChoBkdAkbXgRwqAjWgHTegDaAhHQKuU73M6ikB1fZQoaAZHQJAtcHu7YkFoB03oA2gIR0CrnGnU+cH4dX2UKGgGR0CMBKnVoYelaAdN6ANoCEdAq557PfKp1nV9lChoBkdAjawOVopQUGgHTegDaAhHQKuiCvLX+VF1fZQoaAZHQIwygmG/N7loB03oA2gIR0CrpMEYwZfldX2UKGgGR0BiwglByCFsaAdL8GgIR0CrpuOLaVUudX2UKGgGR0CNY0upS75EaAdN6ANoCEdAq6zylHjIaXV9lChoBkdAiwNJFb3XZ2gHTegDaAhHQKuuUY8+zMR1fZQoaAZHQIg+xNCZ4OdoB03oA2gIR0CrsjxRuTA4dX2UKGgGR0CNPMb4Ju2raAdN6ANoCEdAq7ODI7vG63V9lChoBkdAj9FGWUr08WgHTegDaAhHQKu5ZvcafjF1fZQoaAZHQItLG85CF9NoB03oA2gIR0CrurD0th/idX2UKGgGR0CQz98iOeasaAdN6ANoCEdAq8CYdZJTVHV9lChoBkdAj2F6b4Ju22gHTegDaAhHQKvCxTqjaf11fZQoaAZHQI6xrDZUT+NoB03oA2gIR0Cryi5QYUFjdX2UKGgGR0CP2BXfZVXFaAdN6ANoCEdAq8ugBmwqzHV9lChoBkdAjZT5nUUfxWgHTegDaAhHQKvPj2NedCp1fZQoaAZHQIv5vrrxAjZoB03oA2gIR0Cr0OoEB8x9dX2UKGgGR0CKmp7Kq4pdaAdN6ANoCEdAq9b5RyfcvnV9lChoBkdAjXZmh/RVqGgHTegDaAhHQKvYV/jsD4h1fZQoaAZHQJE9sw22oehoB03oA2gIR0Cr3Tr2QGOddX2UKGgGR0CQHLZi/fwaaAdN6ANoCEdAq99CsS00FnV9lChoBkdAkSDkvPC2t2gHTegDaAhHQKvn3aews5J1fZQoaAZHQJF5ubsniNtoB03oA2gIR0Cr6S79Q40edX2UKGgGR0CP/xL6k691aAdN6ANoCEdAq+07/Ot4iXV9lChoBkdAjPCINNJvpGgHTegDaAhHQKvuinEVFhJ1fZQoaAZHQI1cEkdFOO9oB03oA2gIR0Cr9KYH5aePdX2UKGgGR0CG2w8q4H5aaAdN6ANoCEdAq/YDcCYCyXV9lChoBkdAkFtS0OVgQmgHTegDaAhHQKv58L/jsD51fZQoaAZHQI4jAwyqMm5oB03oA2gIR0Cr++7lq8DkdX2UKGgGR0CM9vGhEjPfaAdN6ANoCEdArAVgk7fYSXV9lChoBkdAkICb2lEZzmgHTegDaAhHQKwGzEa2nbZ1fZQoaAZHQIu9O7+T/yZoB03oA2gIR0CsCsiYb83udX2UKGgGR0CLfVG+9Jz1aAdN6ANoCEdArAwXGGVRk3V9lChoBkdAkOdUjC53DGgHTegDaAhHQKwSHuAqd6N1fZQoaAZHQJDV7CCSRr9oB03oA2gIR0CsE4DSofjkdX2UKGgGR0CNgjZkkKNRaAdN6ANoCEdArBdfhESdv3V9lChoBkdAjiXsFt8/lmgHTegDaAhHQKwYsgWac7R1fZQoaAZHQJByKnqFAVxoB03oA2gIR0CsIaa+N96UdX2UKGgGR0CP+NcynDR/aAdN6ANoCEdArCPq/0ulGnV9lChoBkdAkjxi0WuX/2gHTegDaAhHQKwoMcz67/Z1fZQoaAZHQI/dcQmNR3xoB03oA2gIR0CsKY5Rjz7NdX2UKGgGR0CRoBKdxyXEaAdN6ANoCEdArC+KbMHKOnV9lChoBkdAiGJjhky1u2gHTegDaAhHQKww2IJqqOt1fZQoaAZHQI6hst03fhxoB03oA2gIR0CsNMkPDpC8dX2UKGgGR0CQw+LM9r44aAdN6ANoCEdArDYR3X7LuHV9lChoBkdAkFoVcUuct2gHTegDaAhHQKw97HZK3/h1fZQoaAZHQJBzTVhCtzVoB03oA2gIR0CsQBK7ROUMdX2UKGgGR0CRD3tm+TNdaAdN6ANoCEdArEW1v4ubqnV9lChoBkdAjgQUbkwN9mgHTegDaAhHQKxHARTS9dx1fZQoaAZHQI7+zQ5WBBloB03oA2gIR0CsTMPrWy1NdX2UKGgGR0CNbBSSeRPoaAdN6ANoCEdArE4T3AVO9HV9lChoBkdAhHdKur6tT2gHTegDaAhHQKxSAChew9t1fZQoaAZHQIrZ5jpcHGFoB03oA2gIR0CsU025hBqsdX2UKGgGR0CPSxPY4ACGaAdN6ANoCEdArFmekUKzA3V9lChoBkdAjk9glfJFLGgHTegDaAhHQKxbtigCfYl1fZQoaAZHQImoirzXjENoB03oA2gIR0CsYgPYe1a4dX2UKGgGR0CRiPdkauOkaAdN6ANoCEdArGPqPKdQPHV9lChoBkdAkrUi9Zid8WgHTegDaAhHQKxppM36yjZ1fZQoaAZHQI7lMXLvCuVoB03oA2gIR0CsavFdTo+wdX2UKGgGR0CO/8ZG8VYZaAdN6ANoCEdArG7dyNn5BXV9lChoBkdAkMW45cTrV2gHTegDaAhHQKxwLG7z06J1fZQoaAZHQIvEIEpy6tloB03oA2gIR0CsdgBQFcIJdX2UKGgGR0CRKd2/SH/MaAdN6ANoCEdArHdVZzPrwHV9lChoBkdAkCB0KArhBWgHTegDaAhHQKx9QZ4wAVB1fZQoaAZHQJFEgo7V8TloB03oA2gIR0Csf2h+F10UdX2UKGgGR0CQ8LHzYmLMaAdN6ANoCEdArIbLlmvnsHV9lChoBkdAihP+AVfu1GgHTegDaAhHQKyIJNiYsup1fZQoaAZHQJFChtsN2DBoB03oA2gIR0CsjAhZIQOGdX2UKGgGR0CSZ0RxLkCFaAdN6ANoCEdArI1TBsQ/YHV9lChoBkdAktRan752yWgHTegDaAhHQKyTAZn+Q2d1fZQoaAZHQI8sBt3wCr9oB03oA2gIR0CslFSmQ8wIdX2UKGgGR0CJ7yZfD1oQaAdN6ANoCEdArJkJmTTvzHV9lChoBkdAkTQA8nuy/2gHTegDaAhHQKybBqFh5Pd1fZQoaAZHQInwdz6rNnpoB03oA2gIR0Cso5zB68g7dX2UKGgGR0CRAXUc4o7WaAdN6ANoCEdArKT025xzaXV9lChoBkdAkPBgk5ZKWmgHTegDaAhHQKyo3UXpGF11fZQoaAZHQJHRcMXrMTxoB03oA2gIR0CsqiPoV2zOdX2UKGgGR0CQduHDJlreaAdN6ANoCEdArK/3/HYHxHV9lChoBkdAkkvTOcDr7mgHTegDaAhHQKyxQn2qT8p1fZQoaAZHQJK48UrTYuloB03oA2gIR0CstUT0Yj0MdX2UKGgGR0CSG8zyBkI5aAdN6ANoCEdArLbmK4x1xXV9lChoBkdAkN6ZHVf/m2gHTegDaAhHQKzAULxZuAJ1fZQoaAZHQJJ+0LeANG5oB03oA2gIR0Cswg4B3iaRdX2UKGgGR0COexFI/Z/TaAdN6ANoCEdArMYf9tMwlHV9lChoBkdAjtjMI3R5T2gHTegDaAhHQKzHaOtGNJh1fZQoaAZHQIubd43WFvhoB03oA2gIR0CszR/F72L6dX2UKGgGR0CSHqW1c+qzaAdN6ANoCEdArM5zJQtSRHV9lChoBkdAj+UU+C9RJmgHTegDaAhHQKzSZVJ+UhV1fZQoaAZHQI621T3qRlpoB03oA2gIR0Cs07B7eEZjdWUu"
93
  },
94
  "ep_success_buffer": {
95
  ":type:": "<class 'collections.deque'>",
 
3
  ":type:": "<class 'abc.ABCMeta'>",
4
  ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
5
  "__module__": "stable_baselines3.common.policies",
6
+ "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param sde_net_arch: Network architecture for extracting features\n when using gSDE. If None, the latent features from the policy will be used.\n Pass an empty list to use the states as features.\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
7
+ "__init__": "<function ActorCriticPolicy.__init__ at 0x7ff45eabb430>",
8
+ "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7ff45eabb4c0>",
9
+ "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7ff45eabb550>",
10
+ "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7ff45eabb5e0>",
11
+ "_build": "<function ActorCriticPolicy._build at 0x7ff45eabb670>",
12
+ "forward": "<function ActorCriticPolicy.forward at 0x7ff45eabb700>",
13
+ "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7ff45eabb790>",
14
+ "_predict": "<function ActorCriticPolicy._predict at 0x7ff45eabb820>",
15
+ "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7ff45eabb8b0>",
16
+ "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7ff45eabb940>",
17
+ "predict_values": "<function ActorCriticPolicy.predict_values at 0x7ff45eabb9d0>",
 
18
  "__abstractmethods__": "frozenset()",
19
+ "_abc_impl": "<_abc._abc_data object at 0x7ff45eab8f00>"
20
  },
21
  "verbose": 1,
22
  "policy_kwargs": {
 
63
  "_num_timesteps_at_start": 0,
64
  "seed": null,
65
  "action_noise": null,
66
+ "start_time": 1676847178.788033,
67
  "learning_rate": 0.0001,
68
  "tensorboard_log": null,
69
  "lr_schedule": {
70
  ":type:": "<class 'function'>",
71
+ ":serialized:": "gAWV2wIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwNX2J1aWx0aW5fdHlwZZSTlIwKTGFtYmRhVHlwZZSFlFKUKGgCjAhDb2RlVHlwZZSFlFKUKEsBSwBLAEsBSwFLE0MEiABTAJROhZQpjAFflIWUjFUvaG9tZS9hdXRvd2luL2FuYWNvbmRhMy9saWIvcHl0aG9uMy45L3NpdGUtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5RLgEMCAAGUjAN2YWyUhZQpdJRSlH2UKIwLX19wYWNrYWdlX1+UjBhzdGFibGVfYmFzZWxpbmVzMy5jb21tb26UjAhfX25hbWVfX5SMHnN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi51dGlsc5SMCF9fZmlsZV9flIxVL2hvbWUvYXV0b3dpbi9hbmFjb25kYTMvbGliL3B5dGhvbjMuOS9zaXRlLXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGggfZR9lChoF2gOjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoGIwHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/Gjbi6xxDLYWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="
72
  },
73
  "_last_obs": {
74
  ":type:": "<class 'numpy.ndarray'>",
75
+ ":serialized:": "gAWVNQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJbAAQAAAAAAAPnV7z61cxG+VloXP8yhRkBWJmk/wDxwP4gZ8T5DX4c/2ypgv+5Rp78p1L2+HTD4Pz2thDzilOc+gcDtv4dKQT/ty4w+ioAnwMn6Qr89VLs/9r0wu579IMCROkC/595IP8TPAj8gXvI+XibmPrPmBD+7uyRAvL9ZvnfUFz8a1+q+6RuMvV9Jqj3ukLU9NnqGPg5Epr6vgt66VJYQwGgrCr25Bnq+GUdtunl87T+dtSo9brsdP6rahzugdPY/qtgyPTJQrT544oY7PSsJwAj1Ab1pf/q/FTMHwHVgDsAlj/a/WhHKvrNSV75T1Bc/P/F4PopI+z0qtb89FBg3P6ahjb7Y3F4/DWk9v0sulL4TcijAsDG1v0oWPz5htpu+CwKVO8m8IT+sfrO+gvFbP0LTNT/23I0+/GfkvqOXCL84AwY+aX/6vyBe8j5eJuY+s+YEPxKt6TzSymQ/4+nKPS0vJL5SeKi/0UKMvEBsdTwH42w/+lu0vtR63j3gOiG/uYuGvoHuHr3CCwfAb18ivjsaLkB1YmC/WKGEv/yCNL+MW14+YKFvv3igaDvj2sC+4lo3P8TPAj8VMwfAXibmPrPmBD+UjAVudW1weZSMBWR0eXBllJOUjAJmNJSJiIeUUpQoSwOMATyUTk5OSv////9K/////0sAdJRiSwRLHIaUjAFDlHSUUpQu"
76
  },
77
  "_last_episode_starts": {
78
  ":type:": "<class 'numpy.ndarray'>",
79
+ ":serialized:": "gAWVdwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYEAAAAAAAAAAABAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSwSFlIwBQ5R0lFKULg=="
80
  },
81
  "_last_original_obs": {
82
  ":type:": "<class 'numpy.ndarray'>",
83
+ ":serialized:": "gAWVNQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJbAAQAAAAAAAAAAAADXItC1AACAPwAAAAAAAAAAAAAAAAAAAAAAAACAn3GQPQAAAAAufOO/AAAAACa6wL0AAAAAWt7xPwAAAACWCEw8AAAAAJmc3T8AAAAAMqqrvQAAAAAb7++/AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAx+uRtgAAgD8AAAAAAAAAAAAAAAAAAAAAAAAAgOBaAT4AAAAAUoXbvwAAAADjthK8AAAAAOp5+z8AAAAAC2muvAAAAABKBwBAAAAAANpXFT0AAAAAJZDuvwAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAKo0K7YAAIA/AAAAAAAAAAAAAAAAAAAAAAAAAID6K0U8AAAAAIHp6L8AAAAA1PTrvQAAAACL+/s/AAAAAMWl3L0AAAAApdXaPwAAAABxEQe+AAAAAH+S4b8AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAABtg422AACAPwAAAAAAAAAAAAAAAAAAAAAAAACAun56vAAAAACgcNq/AAAAAC7oALoAAAAAyWvhPwAAAABZ8G29AAAAAHF57D8AAAAApyUIPgAAAAA1oPa/AAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJmNJSJiIeUUpQoSwOMATyUTk5OSv////9K/////0sAdJRiSwRLHIaUjAFDlHSUUpQu"
84
  },
85
  "_episode_num": 0,
86
  "use_sde": true,
 
88
  "_current_progress_remaining": 0.0,
89
  "ep_info_buffer": {
90
  ":type:": "<class 'collections.deque'>",
91
+ ":serialized:": "gAWVRAwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQJBZWEOAiFGMAWyUTegDjAF0lEdAm3dsabWmQHV9lChoBkdAijcfRE4NqmgHTegDaAhHQJt5BdQfp2V1fZQoaAZHQJBwnpfQa75oB03oA2gIR0CbetQ6IWP+dX2UKGgGR0CL2diyY5T7aAdN6ANoCEdAm3w5wGW2PXV9lChoBkdAiqaVxsEaEWgHTegDaAhHQJuF4kQf6oF1fZQoaAZHQItNWGh24d9oB03oA2gIR0Cbh1GxUvPDdX2UKGgGR0CLfJYXfqHHaAdN6ANoCEdAm4kdZV4oqnV9lChoBkdAiwjrJKaodmgHTegDaAhHQJuKe10DEFZ1fZQoaAZHQIqXkm2LHdZoB03oA2gIR0CblKkJ8fFKdX2UKGgGR0CKFFhrnDBNaAdN6ANoCEdAm5YYEGJN03V9lChoBkdAi4z22G7Bf2gHTegDaAhHQJuX+rZJ04l1fZQoaAZHQI+v9W0Z3s5oB03oA2gIR0CbmdGYa5wwdX2UKGgGR0CD3Cmv4dp7aAdNiQJoCEdAm6PsbFS88XV9lChoBkdAkbctmcvugGgHTegDaAhHQJukWXrt3Oh1fZQoaAZHQI48eajN6gNoB03oA2gIR0Cbpbn3cpLFdX2UKGgGR0CQB8SDAaegaAdN6ANoCEdAm6d/XsgMdHV9lChoBkdAj0YVKoQ4CWgHTegDaAhHQJuyP7TDwYt1fZQoaAZHQI6uTwBo24xoB03oA2gIR0CbsqnHeaa1dX2UKGgGR0CMLZG6PKdQaAdN6ANoCEdAm7Qh5s0pE3V9lChoBkdAjNmJNbkfcWgHTegDaAhHQJu14qSX+l11fZQoaAZHQIlaiT4cm0FoB03oA2gIR0CbwOwfhddFdX2UKGgGR0COhkacZtN0aAdN6ANoCEdAm8FiBkI5YHV9lChoBkdAjXBKMefZmWgHTegDaAhHQJvC37CSA6N1fZQoaAZHQIoVFfG+9J1oB03oA2gIR0CbxNIVdonKdX2UKGgGR0CMrZx2jfvXaAdN6ANoCEdAm9A7A57w8XV9lChoBkdAjv5FUyYXwmgHTegDaAhHQJvQpW8yvcJ1fZQoaAZHQIwPLronrptoB03oA2gIR0Cb0gTHKfWddX2UKGgGR0CNF7g/C66KaAdN6ANoCEdAm9PjZcs19HV9lChoBkdAj4D3668QI2gHTegDaAhHQJvgQauOjqR1fZQoaAZHQI3gWEqUeMhoB03oA2gIR0Cb4MOXVsk6dX2UKGgGR0CMoiraufVaaAdN6ANoCEdAm+JsrqdH2HV9lChoBkdAjPpQRGtp22gHTegDaAhHQJvkhttQ9A51fZQoaAZHQI90cqYqoZRoB03oA2gIR0Cb72jwQUYbdX2UKGgGR0COuu3974SIaAdN6ANoCEdAm+/edf9gnnV9lChoBkdAiz4Nga3qiWgHTegDaAhHQJvxRO32EkB1fZQoaAZHQI5+9P1tfoloB03oA2gIR0Cb8wFvAGjcdX2UKGgGR0CQWd1LJ0W/aAdN6ANoCEdAm/3V5WzWw3V9lChoBkdAkAybfDUExWgHTegDaAhHQJv+QU34sVd1fZQoaAZHQIwsV6E8JUpoB03oA2gIR0Cb/6yAhB7edX2UKGgGR0CK4locJdB0aAdN6ANoCEdAnAF7XUYsNHV9lChoBkdAjXkC2tuDSWgHTegDaAhHQJwMEzxgAp91fZQoaAZHQIoEkKw6hg5oB03oA2gIR0CcDHyOJcgRdX2UKGgGR0CNy+0ygwoLaAdN6ANoCEdAnA3fqLS/kHV9lChoBkdAjRwkgW8AaWgHTegDaAhHQJwPqGGmDUV1fZQoaAZHQI45AOlO45NoB03oA2gIR0CcGzmCROk+dX2UKGgGR0CJeaJkXk5qaAdN6ANoCEdAnBvvEwWWQnV9lChoBkdAi+4h6Skj5mgHTegDaAhHQJwd7iADq4Z1fZQoaAZHQIzwXYODrZ9oB03oA2gIR0CcH6k/KQq7dX2UKGgGR0CPcMJKraM8aAdN6ANoCEdAnCooVM23rnV9lChoBkdAjcOilSCOFWgHTegDaAhHQJwqj8Jlar51fZQoaAZHQI6954W1twdoB03oA2gIR0CcLBt2cJ+ldX2UKGgGR0CHHGVLzwtraAdN6ANoCEdAnC3yI55qunV9lChoBkdAjf5XOObRW2gHTegDaAhHQJw5DnzQNTd1fZQoaAZHQI1jUohIOH5oB03oA2gIR0CcOXj4pMHsdX2UKGgGR0CQFol0HQhPaAdN6ANoCEdAnDreAEt/WnV9lChoBkdAj0hL30wrUmgHTegDaAhHQJw8phBqsU91fZQoaAZHQI6kZn13+uNoB03oA2gIR0CcSUDFZPl/dX2UKGgGR0CMmDXtjTa1aAdN6ANoCEdAnEmrFwT/Q3V9lChoBkdAjgU7vgFX72gHTegDaAhHQJxLDJOnEVF1fZQoaAZHQI78zLfUF0RoB03oA2gIR0CcTOXko4MndX2UKGgGR0CLyo0fHPu5aAdN6ANoCEdAnFkIS13MZHV9lChoBkdAh/C/WDpTuWgHTegDaAhHQJxZgbzbvgF1fZQoaAZHQI7EU/r0J4VoB03oA2gIR0CcW0xKQJXydX2UKGgGR0CMOs99MK1HaAdN6ANoCEdAnF10CFK02XV9lChoBkdAkJTKNlyzX2gHTegDaAhHQJxpz1lGwzN1fZQoaAZHQI6v/GEPDpFoB03oA2gIR0Ccak5TZQHidX2UKGgGR0CLd97l7tzCaAdN6ANoCEdAnGvv0RODa3V9lChoBkdAjNugTZg5R2gHTegDaAhHQJxt+1x82Jl1fZQoaAZHQJCKrBqKxcFoB03oA2gIR0CceK2ZAprldX2UKGgGR0CP2QiX6ZYxaAdN6ANoCEdAnHkVhPTG53V9lChoBkdAjemPkaMrE2gHTegDaAhHQJx6el3yI551fZQoaAZHQI4sFUn5SFZoB03oA2gIR0CcfDYaYNRWdX2UKGgGR0CN76S9M9KVaAdN6ANoCEdAnIbAUpNKy3V9lChoBkdAj9dtkOI682gHTegDaAhHQJyHLBacI7h1fZQoaAZHQI0U8384xUNoB03oA2gIR0CciJI8yN4rdX2UKGgGR0CNJyKaXrt3aAdN6ANoCEdAnIpTwlSjxnV9lChoBkdAi58nvUjLS2gHTegDaAhHQJyVARbr1NB1fZQoaAZHQIjOjrs0HhVoB03oA2gIR0CclXLqlgtwdX2UKGgGR0CLzWkrPMSsaAdN6ANoCEdAnJb8zEaVEHV9lChoBkdAjvjG4I8hcWgHTegDaAhHQJyYxbr1M/R1fZQoaAZHQIx515t3wCtoB03oA2gIR0Cco4EXLvCudX2UKGgGR0CQClkqc3ERaAdN6ANoCEdAnKP3Wz4UOHV9lChoBkdAkCuwOnVG1GgHTegDaAhHQJylcAQxveh1fZQoaAZHQIwo7AnDziFoB03oA2gIR0Ccp2KuB+WodX2UKGgGR0CPX8kP+XJHaAdN6ANoCEdAnLJDIzWPLnV9lChoBkdAjXZYuK4x12gHTegDaAhHQJyysN9YwIt1fZQoaAZHQI+Oi1y/9HdoB03oA2gIR0CctBlgtvn9dX2UKGgGR0CNR9VwxWT5aAdN6ANoCEdAnLXeQQtjC3V9lChoBkdAi7CMQumJnGgHTegDaAhHQJzAeqXF98Z1fZQoaAZHQIzfnwZwXIloB03oA2gIR0CcwOaDPGADdX2UKGgGR0COTUFW4mTlaAdN6ANoCEdAnMJHxaxHG3V9lChoBkdAjjVZoGpuM2gHTegDaAhHQJzEENqgyuZ1fZQoaAZHQIY7y24NI9VoB03uAmgIR0CczNmuTzNEdX2UKGgGR0CO4KmrKeTWaAdN6ANoCEdAnM6W5paibnV9lChoBkdAjb6lN1yNoGgHTegDaAhHQJzPAxvegth1fZQoaAZHQI2mkLfDUExoB03oA2gIR0Cc0jSxJNCadX2UKGgGR0CNfii7CiyqaAdN6ANoCEdAnNs5NKyv93V9lChoBkdAiT7KA8Swn2gHTegDaAhHQJzdxqqOtGN1fZQoaAZHQI6Cec8TzupoB03oA2gIR0Cc3kHlfZ27dX2UKGgGR0CKi146fapQaAdN6ANoCEdAnOFpYxL0z3VlLg=="
92
  },
93
  "ep_success_buffer": {
94
  ":type:": "<class 'collections.deque'>",
a2c-AntBulletEnv-v0/policy.optimizer.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f134c58945bba2663d6f54d55b54f6dadde913e9d16225b81e13e101bd72cc41
3
- size 56190
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7728b85c5c1c518847966e83ec2beb24c9c45b435ec70e90982ce0caf8d0db3d
3
+ size 56062
a2c-AntBulletEnv-v0/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9772dfb65dbf981552eba15d9207c79b33a1eaad81abe3bae85890610168807e
3
- size 56958
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8c8fdaf15b90571d9f22dc5e120c6b98f9663609aaac1c3ab20e7d0cb65a27e3
3
+ size 56638
a2c-AntBulletEnv-v0/system_info.txt CHANGED
@@ -1,7 +1,7 @@
1
- - OS: Linux-5.10.147+-x86_64-with-glibc2.29 # 1 SMP Sat Dec 10 16:00:40 UTC 2022
2
- - Python: 3.8.10
3
- - Stable-Baselines3: 1.7.0
4
- - PyTorch: 1.13.1+cu116
5
- - GPU Enabled: True
6
- - Numpy: 1.21.6
7
- - Gym: 0.21.0
 
1
+ OS: Linux-5.19.0-32-generic-x86_64-with-glibc2.35 #33~22.04.1-Ubuntu SMP PREEMPT_DYNAMIC Mon Jan 30 17:03:34 UTC 2
2
+ Python: 3.9.12
3
+ Stable-Baselines3: 1.5.0
4
+ PyTorch: 1.13.1
5
+ GPU Enabled: False
6
+ Numpy: 1.21.5
7
+ Gym: 0.21.0
config.json CHANGED
@@ -1 +1 @@
1
- {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7f28d61b7040>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f28d61b70d0>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f28d61b7160>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f28d61b71f0>", "_build": "<function ActorCriticPolicy._build at 0x7f28d61b7280>", "forward": "<function ActorCriticPolicy.forward at 0x7f28d61b7310>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x7f28d61b73a0>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f28d61b7430>", "_predict": "<function ActorCriticPolicy._predict at 0x7f28d61b74c0>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f28d61b7550>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f28d61b75e0>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f28d61b7670>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc_data object at 0x7f28d61aeb40>"}, "verbose": 1, "policy_kwargs": {":type:": "<class 'dict'>", ":serialized:": "gAWVowAAAAAAAAB9lCiMDGxvZ19zdGRfaW5pdJRK/v///4wKb3J0aG9faW5pdJSJjA9vcHRpbWl6ZXJfY2xhc3OUjBN0b3JjaC5vcHRpbS5ybXNwcm9wlIwHUk1TcHJvcJSTlIwQb3B0aW1pemVyX2t3YXJnc5R9lCiMBWFscGhhlEc/764UeuFHrowDZXBzlEc+5Pi1iONo8YwMd2VpZ2h0X2RlY2F5lEsAdXUu", "log_std_init": -2, "ortho_init": false, "optimizer_class": "<class 'torch.optim.rmsprop.RMSprop'>", "optimizer_kwargs": {"alpha": 0.99, "eps": 1e-05, "weight_decay": 0}}, "observation_space": {":type:": "<class 'gym.spaces.box.Box'>", ":serialized:": "gAWVZwIAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLHIWUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWcAAAAAAAAAAAAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/lGgKSxyFlIwBQ5R0lFKUjARoaWdolGgSKJZwAAAAAAAAAAAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH+UaApLHIWUaBV0lFKUjA1ib3VuZGVkX2JlbG93lGgSKJYcAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUaAeMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLHIWUaBV0lFKUjA1ib3VuZGVkX2Fib3ZllGgSKJYcAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUaCFLHIWUaBV0lFKUjApfbnBfcmFuZG9tlE51Yi4=", "dtype": "float32", "_shape": [28], "low": "[-inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf\n -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf]", "high": "[inf inf inf inf inf inf inf inf inf inf inf inf inf inf inf inf inf inf\n inf inf inf inf inf inf inf inf inf inf]", "bounded_below": "[False False False False False False False False False False False False\n False False False False False False False False False False False False\n False False False False]", "bounded_above": "[False False False False False False False False False False False False\n False False False False False False False False False False False False\n False False False False]", "_np_random": null}, "action_space": {":type:": "<class 'gym.spaces.box.Box'>", ":serialized:": "gAWVnwEAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLCIWUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWIAAAAAAAAAAAAIC/AACAvwAAgL8AAIC/AACAvwAAgL8AAIC/AACAv5RoCksIhZSMAUOUdJRSlIwEaGlnaJRoEiiWIAAAAAAAAAAAAIA/AACAPwAAgD8AAIA/AACAPwAAgD8AAIA/AACAP5RoCksIhZRoFXSUUpSMDWJvdW5kZWRfYmVsb3eUaBIolggAAAAAAAAAAQEBAQEBAQGUaAeMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLCIWUaBV0lFKUjA1ib3VuZGVkX2Fib3ZllGgSKJYIAAAAAAAAAAEBAQEBAQEBlGghSwiFlGgVdJRSlIwKX25wX3JhbmRvbZROdWIu", "dtype": "float32", "_shape": [8], "low": "[-1. -1. -1. -1. -1. -1. -1. -1.]", "high": "[1. 1. 1. 1. 1. 1. 1. 1.]", "bounded_below": "[ True True True True True True True True]", "bounded_above": "[ True True True True True True True True]", "_np_random": null}, "n_envs": 4, "num_timesteps": 2000000, "_total_timesteps": 2000000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1676834158394097657, "learning_rate": 0.0001, "tensorboard_log": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVwwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOC9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS4JDAgABlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOC9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoFmgNjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoF4wHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/Gjbi6xxDLYWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="}, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVNQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJbAAQAAAAAAAJnXyb8wtk4/H37TPCr+3b4fVyS+cTynPffwmr6yWEw/bxdcP/MGBbxiNZa/ADIZvSWyk7+4ZuO7jmgsP3N3Fz2oyMc/PRksPAfpwT6IOzs93dIOvxCTbzytlFO/6PAvvW7e/z7XHug+2LfDPsKz7z69m4y/Y1TLP+ap5L+pvTw/+xQIP1Wzhz/THaw9cBwDPpTNLz+6Yt484TIcv+Tlaz5vXwU/l4Yev7ZWFj+OOWu+oguMPxvXFL/tnSc/EK37vYrBV78P3Qs9fU1Vv7Q4rT1u3v8+1x7oPti3wz7Cs+8+B3Bzv+9XGT/f4WU+DSGpP/Tvvb9Zwgs+HLX9Pf7jMT75WC0/o4O1viQ2B78HnfO9T39sv591GMB1/iU/6HYavtUvXD+GPIS/GbMXP2Ozor4fkkO/9k94P3mvU79CEqS7bt7/PgYrDcDYt8M+9bMIwIZUmr9R/Lk/eZdYwB476L623l+/EMJ5P0Jesb7Snno/FHxFPwvwm75wOo2/6VikvpSbBr4Bb9K/FruNPkN69z28ydY/eRNjvugBCj4u1li/4DRBPvbQAL4WvlK/5gWCPm7e/z7XHug+2LfDPsKz7z6UjAVudW1weZSMBWR0eXBllJOUjAJmNJSJiIeUUpQoSwOMATyUTk5OSv////9K/////0sAdJRiSwRLHIaUjAFDlHSUUpQu"}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYEAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSwSFlIwBQ5R0lFKULg=="}, "_last_original_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVNQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJbAAQAAAAAAAAAAAADtjtM1AACAPwAAAAAAAAAAAAAAAAAAAAAAAACAMcW0vQAAAAA/Z/y/AAAAAGiSQb0AAAAAcZf3PwAAAAAGSBo9AAAAAP5H/j8AAAAAmKBiPAAAAAA3MvK/AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAG6k1tgAAgD8AAAAAAAAAAAAAAAAAAAAAAAAAgLRIQ70AAAAAEwT8vwAAAAD+Ueq9AAAAAFh1/T8AAAAAr8mPvAAAAADpzv8/AAAAALHNGD0AAAAAVWv1vwAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAADDYS7UAAIA/AAAAAAAAAAAAAAAAAAAAAAAAAIDqVxw9AAAAAHR8278AAAAAhkaTPAAAAAAFYwBAAAAAANVhnr0AAAAAzZntPwAAAAAcpYa9AAAAAHUa/b8AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAJi61AACAPwAAAAAAAAAAAAAAAAAAAAAAAACAJjNcvQAAAACQH/W/AAAAAESJTz0AAAAAwzTsPwAAAABwKtG9AAAAADTH8D8AAAAAfybiPAAAAACWVvu/AAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJmNJSJiIeUUpQoSwOMATyUTk5OSv////9K/////0sAdJRiSwRLHIaUjAFDlHSUUpQu"}, "_episode_num": 0, "use_sde": true, "sde_sample_freq": -1, "_current_progress_remaining": 0.0, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVQwwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQI0o6zHCGeuMAWyUTegDjAF0lEdAq3Mo3eenRHV9lChoBkdAjYXxG2Cul2gHTegDaAhHQKt1gBdUsFt1fZQoaAZHQIq9CfOD8LtoB03oA2gIR0CrdzKTjebedX2UKGgGR0CN8NbnoxHoaAdN6ANoCEdAq3+HGlyimHV9lChoBkdAjRrpkwvg32gHTegDaAhHQKuBoc+7lJZ1fZQoaAZHQI7HIuIyj59oB03oA2gIR0CrhXFAE+xGdX2UKGgGR0CRmabiIcioaAdN6ANoCEdAq4gfJYDDCXV9lChoBkdAkBhoIOYplWgHTegDaAhHQKuPpJbMX8B1fZQoaAZHQI6zr+WGATZoB03oA2gIR0CrkPMqril0dX2UKGgGR0COqR9vS+g2aAdN6ANoCEdAq5M7Jr+HanV9lChoBkdAkbXgRwqAjWgHTegDaAhHQKuU73M6ikB1fZQoaAZHQJAtcHu7YkFoB03oA2gIR0CrnGnU+cH4dX2UKGgGR0CMBKnVoYelaAdN6ANoCEdAq557PfKp1nV9lChoBkdAjawOVopQUGgHTegDaAhHQKuiCvLX+VF1fZQoaAZHQIwygmG/N7loB03oA2gIR0CrpMEYwZfldX2UKGgGR0BiwglByCFsaAdL8GgIR0CrpuOLaVUudX2UKGgGR0CNY0upS75EaAdN6ANoCEdAq6zylHjIaXV9lChoBkdAiwNJFb3XZ2gHTegDaAhHQKuuUY8+zMR1fZQoaAZHQIg+xNCZ4OdoB03oA2gIR0CrsjxRuTA4dX2UKGgGR0CNPMb4Ju2raAdN6ANoCEdAq7ODI7vG63V9lChoBkdAj9FGWUr08WgHTegDaAhHQKu5ZvcafjF1fZQoaAZHQItLG85CF9NoB03oA2gIR0CrurD0th/idX2UKGgGR0CQz98iOeasaAdN6ANoCEdAq8CYdZJTVHV9lChoBkdAj2F6b4Ju22gHTegDaAhHQKvCxTqjaf11fZQoaAZHQI6xrDZUT+NoB03oA2gIR0Cryi5QYUFjdX2UKGgGR0CP2BXfZVXFaAdN6ANoCEdAq8ugBmwqzHV9lChoBkdAjZT5nUUfxWgHTegDaAhHQKvPj2NedCp1fZQoaAZHQIv5vrrxAjZoB03oA2gIR0Cr0OoEB8x9dX2UKGgGR0CKmp7Kq4pdaAdN6ANoCEdAq9b5RyfcvnV9lChoBkdAjXZmh/RVqGgHTegDaAhHQKvYV/jsD4h1fZQoaAZHQJE9sw22oehoB03oA2gIR0Cr3Tr2QGOddX2UKGgGR0CQHLZi/fwaaAdN6ANoCEdAq99CsS00FnV9lChoBkdAkSDkvPC2t2gHTegDaAhHQKvn3aews5J1fZQoaAZHQJF5ubsniNtoB03oA2gIR0Cr6S79Q40edX2UKGgGR0CP/xL6k691aAdN6ANoCEdAq+07/Ot4iXV9lChoBkdAjPCINNJvpGgHTegDaAhHQKvuinEVFhJ1fZQoaAZHQI1cEkdFOO9oB03oA2gIR0Cr9KYH5aePdX2UKGgGR0CG2w8q4H5aaAdN6ANoCEdAq/YDcCYCyXV9lChoBkdAkFtS0OVgQmgHTegDaAhHQKv58L/jsD51fZQoaAZHQI4jAwyqMm5oB03oA2gIR0Cr++7lq8DkdX2UKGgGR0CM9vGhEjPfaAdN6ANoCEdArAVgk7fYSXV9lChoBkdAkICb2lEZzmgHTegDaAhHQKwGzEa2nbZ1fZQoaAZHQIu9O7+T/yZoB03oA2gIR0CsCsiYb83udX2UKGgGR0CLfVG+9Jz1aAdN6ANoCEdArAwXGGVRk3V9lChoBkdAkOdUjC53DGgHTegDaAhHQKwSHuAqd6N1fZQoaAZHQJDV7CCSRr9oB03oA2gIR0CsE4DSofjkdX2UKGgGR0CNgjZkkKNRaAdN6ANoCEdArBdfhESdv3V9lChoBkdAjiXsFt8/lmgHTegDaAhHQKwYsgWac7R1fZQoaAZHQJByKnqFAVxoB03oA2gIR0CsIaa+N96UdX2UKGgGR0CP+NcynDR/aAdN6ANoCEdArCPq/0ulGnV9lChoBkdAkjxi0WuX/2gHTegDaAhHQKwoMcz67/Z1fZQoaAZHQI/dcQmNR3xoB03oA2gIR0CsKY5Rjz7NdX2UKGgGR0CRoBKdxyXEaAdN6ANoCEdArC+KbMHKOnV9lChoBkdAiGJjhky1u2gHTegDaAhHQKww2IJqqOt1fZQoaAZHQI6hst03fhxoB03oA2gIR0CsNMkPDpC8dX2UKGgGR0CQw+LM9r44aAdN6ANoCEdArDYR3X7LuHV9lChoBkdAkFoVcUuct2gHTegDaAhHQKw97HZK3/h1fZQoaAZHQJBzTVhCtzVoB03oA2gIR0CsQBK7ROUMdX2UKGgGR0CRD3tm+TNdaAdN6ANoCEdArEW1v4ubqnV9lChoBkdAjgQUbkwN9mgHTegDaAhHQKxHARTS9dx1fZQoaAZHQI7+zQ5WBBloB03oA2gIR0CsTMPrWy1NdX2UKGgGR0CNbBSSeRPoaAdN6ANoCEdArE4T3AVO9HV9lChoBkdAhHdKur6tT2gHTegDaAhHQKxSAChew9t1fZQoaAZHQIrZ5jpcHGFoB03oA2gIR0CsU025hBqsdX2UKGgGR0CPSxPY4ACGaAdN6ANoCEdArFmekUKzA3V9lChoBkdAjk9glfJFLGgHTegDaAhHQKxbtigCfYl1fZQoaAZHQImoirzXjENoB03oA2gIR0CsYgPYe1a4dX2UKGgGR0CRiPdkauOkaAdN6ANoCEdArGPqPKdQPHV9lChoBkdAkrUi9Zid8WgHTegDaAhHQKxppM36yjZ1fZQoaAZHQI7lMXLvCuVoB03oA2gIR0CsavFdTo+wdX2UKGgGR0CO/8ZG8VYZaAdN6ANoCEdArG7dyNn5BXV9lChoBkdAkMW45cTrV2gHTegDaAhHQKxwLG7z06J1fZQoaAZHQIvEIEpy6tloB03oA2gIR0CsdgBQFcIJdX2UKGgGR0CRKd2/SH/MaAdN6ANoCEdArHdVZzPrwHV9lChoBkdAkCB0KArhBWgHTegDaAhHQKx9QZ4wAVB1fZQoaAZHQJFEgo7V8TloB03oA2gIR0Csf2h+F10UdX2UKGgGR0CQ8LHzYmLMaAdN6ANoCEdArIbLlmvnsHV9lChoBkdAihP+AVfu1GgHTegDaAhHQKyIJNiYsup1fZQoaAZHQJFChtsN2DBoB03oA2gIR0CsjAhZIQOGdX2UKGgGR0CSZ0RxLkCFaAdN6ANoCEdArI1TBsQ/YHV9lChoBkdAktRan752yWgHTegDaAhHQKyTAZn+Q2d1fZQoaAZHQI8sBt3wCr9oB03oA2gIR0CslFSmQ8wIdX2UKGgGR0CJ7yZfD1oQaAdN6ANoCEdArJkJmTTvzHV9lChoBkdAkTQA8nuy/2gHTegDaAhHQKybBqFh5Pd1fZQoaAZHQInwdz6rNnpoB03oA2gIR0Cso5zB68g7dX2UKGgGR0CRAXUc4o7WaAdN6ANoCEdArKT025xzaXV9lChoBkdAkPBgk5ZKWmgHTegDaAhHQKyo3UXpGF11fZQoaAZHQJHRcMXrMTxoB03oA2gIR0CsqiPoV2zOdX2UKGgGR0CQduHDJlreaAdN6ANoCEdArK/3/HYHxHV9lChoBkdAkkvTOcDr7mgHTegDaAhHQKyxQn2qT8p1fZQoaAZHQJK48UrTYuloB03oA2gIR0CstUT0Yj0MdX2UKGgGR0CSG8zyBkI5aAdN6ANoCEdArLbmK4x1xXV9lChoBkdAkN6ZHVf/m2gHTegDaAhHQKzAULxZuAJ1fZQoaAZHQJJ+0LeANG5oB03oA2gIR0Cswg4B3iaRdX2UKGgGR0COexFI/Z/TaAdN6ANoCEdArMYf9tMwlHV9lChoBkdAjtjMI3R5T2gHTegDaAhHQKzHaOtGNJh1fZQoaAZHQIubd43WFvhoB03oA2gIR0CszR/F72L6dX2UKGgGR0CSHqW1c+qzaAdN6ANoCEdArM5zJQtSRHV9lChoBkdAj+UU+C9RJmgHTegDaAhHQKzSZVJ+UhV1fZQoaAZHQI621T3qRlpoB03oA2gIR0Cs07B7eEZjdWUu"}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 62500, "n_steps": 8, "gamma": 0.99, "gae_lambda": 0.9, "ent_coef": 0.0, "vf_coef": 0.4, "max_grad_norm": 0.5, "normalize_advantage": false, "system_info": {"OS": "Linux-5.10.147+-x86_64-with-glibc2.29 # 1 SMP Sat Dec 10 16:00:40 UTC 2022", "Python": "3.8.10", "Stable-Baselines3": "1.7.0", "PyTorch": "1.13.1+cu116", "GPU Enabled": "True", "Numpy": "1.21.6", "Gym": "0.21.0"}}
 
1
+ {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param sde_net_arch: Network architecture for extracting features\n when using gSDE. If None, the latent features from the policy will be used.\n Pass an empty list to use the states as features.\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7ff45eabb430>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7ff45eabb4c0>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7ff45eabb550>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7ff45eabb5e0>", "_build": "<function ActorCriticPolicy._build at 0x7ff45eabb670>", "forward": "<function ActorCriticPolicy.forward at 0x7ff45eabb700>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7ff45eabb790>", "_predict": "<function ActorCriticPolicy._predict at 0x7ff45eabb820>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7ff45eabb8b0>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7ff45eabb940>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7ff45eabb9d0>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7ff45eab8f00>"}, "verbose": 1, "policy_kwargs": {":type:": "<class 'dict'>", ":serialized:": "gAWVowAAAAAAAAB9lCiMDGxvZ19zdGRfaW5pdJRK/v///4wKb3J0aG9faW5pdJSJjA9vcHRpbWl6ZXJfY2xhc3OUjBN0b3JjaC5vcHRpbS5ybXNwcm9wlIwHUk1TcHJvcJSTlIwQb3B0aW1pemVyX2t3YXJnc5R9lCiMBWFscGhhlEc/764UeuFHrowDZXBzlEc+5Pi1iONo8YwMd2VpZ2h0X2RlY2F5lEsAdXUu", "log_std_init": -2, "ortho_init": false, "optimizer_class": "<class 'torch.optim.rmsprop.RMSprop'>", "optimizer_kwargs": {"alpha": 0.99, "eps": 1e-05, "weight_decay": 0}}, "observation_space": {":type:": "<class 'gym.spaces.box.Box'>", ":serialized:": "gAWVZwIAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLHIWUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWcAAAAAAAAAAAAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/lGgKSxyFlIwBQ5R0lFKUjARoaWdolGgSKJZwAAAAAAAAAAAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH+UaApLHIWUaBV0lFKUjA1ib3VuZGVkX2JlbG93lGgSKJYcAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUaAeMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLHIWUaBV0lFKUjA1ib3VuZGVkX2Fib3ZllGgSKJYcAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUaCFLHIWUaBV0lFKUjApfbnBfcmFuZG9tlE51Yi4=", "dtype": "float32", "_shape": [28], "low": "[-inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf\n -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf -inf]", "high": "[inf inf inf inf inf inf inf inf inf inf inf inf inf inf inf inf inf inf\n inf inf inf inf inf inf inf inf inf inf]", "bounded_below": "[False False False False False False False False False False False False\n False False False False False False False False False False False False\n False False False False]", "bounded_above": "[False False False False False False False False False False False False\n False False False False False False False False False False False False\n False False False False]", "_np_random": null}, "action_space": {":type:": "<class 'gym.spaces.box.Box'>", ":serialized:": "gAWVnwEAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLCIWUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWIAAAAAAAAAAAAIC/AACAvwAAgL8AAIC/AACAvwAAgL8AAIC/AACAv5RoCksIhZSMAUOUdJRSlIwEaGlnaJRoEiiWIAAAAAAAAAAAAIA/AACAPwAAgD8AAIA/AACAPwAAgD8AAIA/AACAP5RoCksIhZRoFXSUUpSMDWJvdW5kZWRfYmVsb3eUaBIolggAAAAAAAAAAQEBAQEBAQGUaAeMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLCIWUaBV0lFKUjA1ib3VuZGVkX2Fib3ZllGgSKJYIAAAAAAAAAAEBAQEBAQEBlGghSwiFlGgVdJRSlIwKX25wX3JhbmRvbZROdWIu", "dtype": "float32", "_shape": [8], "low": "[-1. -1. -1. -1. -1. -1. -1. -1.]", "high": "[1. 1. 1. 1. 1. 1. 1. 1.]", "bounded_below": "[ True True True True True True True True]", "bounded_above": "[ True True True True True True True True]", "_np_random": null}, "n_envs": 4, "num_timesteps": 2000000, "_total_timesteps": 2000000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1676847178.788033, "learning_rate": 0.0001, "tensorboard_log": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWV2wIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwNX2J1aWx0aW5fdHlwZZSTlIwKTGFtYmRhVHlwZZSFlFKUKGgCjAhDb2RlVHlwZZSFlFKUKEsBSwBLAEsBSwFLE0MEiABTAJROhZQpjAFflIWUjFUvaG9tZS9hdXRvd2luL2FuYWNvbmRhMy9saWIvcHl0aG9uMy45L3NpdGUtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5RLgEMCAAGUjAN2YWyUhZQpdJRSlH2UKIwLX19wYWNrYWdlX1+UjBhzdGFibGVfYmFzZWxpbmVzMy5jb21tb26UjAhfX25hbWVfX5SMHnN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi51dGlsc5SMCF9fZmlsZV9flIxVL2hvbWUvYXV0b3dpbi9hbmFjb25kYTMvbGliL3B5dGhvbjMuOS9zaXRlLXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGggfZR9lChoF2gOjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoGIwHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/Gjbi6xxDLYWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="}, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVNQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJbAAQAAAAAAAPnV7z61cxG+VloXP8yhRkBWJmk/wDxwP4gZ8T5DX4c/2ypgv+5Rp78p1L2+HTD4Pz2thDzilOc+gcDtv4dKQT/ty4w+ioAnwMn6Qr89VLs/9r0wu579IMCROkC/595IP8TPAj8gXvI+XibmPrPmBD+7uyRAvL9ZvnfUFz8a1+q+6RuMvV9Jqj3ukLU9NnqGPg5Epr6vgt66VJYQwGgrCr25Bnq+GUdtunl87T+dtSo9brsdP6rahzugdPY/qtgyPTJQrT544oY7PSsJwAj1Ab1pf/q/FTMHwHVgDsAlj/a/WhHKvrNSV75T1Bc/P/F4PopI+z0qtb89FBg3P6ahjb7Y3F4/DWk9v0sulL4TcijAsDG1v0oWPz5htpu+CwKVO8m8IT+sfrO+gvFbP0LTNT/23I0+/GfkvqOXCL84AwY+aX/6vyBe8j5eJuY+s+YEPxKt6TzSymQ/4+nKPS0vJL5SeKi/0UKMvEBsdTwH42w/+lu0vtR63j3gOiG/uYuGvoHuHr3CCwfAb18ivjsaLkB1YmC/WKGEv/yCNL+MW14+YKFvv3igaDvj2sC+4lo3P8TPAj8VMwfAXibmPrPmBD+UjAVudW1weZSMBWR0eXBllJOUjAJmNJSJiIeUUpQoSwOMATyUTk5OSv////9K/////0sAdJRiSwRLHIaUjAFDlHSUUpQu"}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYEAAAAAAAAAAABAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSwSFlIwBQ5R0lFKULg=="}, "_last_original_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVNQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJbAAQAAAAAAAAAAAADXItC1AACAPwAAAAAAAAAAAAAAAAAAAAAAAACAn3GQPQAAAAAufOO/AAAAACa6wL0AAAAAWt7xPwAAAACWCEw8AAAAAJmc3T8AAAAAMqqrvQAAAAAb7++/AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAx+uRtgAAgD8AAAAAAAAAAAAAAAAAAAAAAAAAgOBaAT4AAAAAUoXbvwAAAADjthK8AAAAAOp5+z8AAAAAC2muvAAAAABKBwBAAAAAANpXFT0AAAAAJZDuvwAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAKo0K7YAAIA/AAAAAAAAAAAAAAAAAAAAAAAAAID6K0U8AAAAAIHp6L8AAAAA1PTrvQAAAACL+/s/AAAAAMWl3L0AAAAApdXaPwAAAABxEQe+AAAAAH+S4b8AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAABtg422AACAPwAAAAAAAAAAAAAAAAAAAAAAAACAun56vAAAAACgcNq/AAAAAC7oALoAAAAAyWvhPwAAAABZ8G29AAAAAHF57D8AAAAApyUIPgAAAAA1oPa/AAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJmNJSJiIeUUpQoSwOMATyUTk5OSv////9K/////0sAdJRiSwRLHIaUjAFDlHSUUpQu"}, "_episode_num": 0, "use_sde": true, "sde_sample_freq": -1, "_current_progress_remaining": 0.0, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVRAwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQJBZWEOAiFGMAWyUTegDjAF0lEdAm3dsabWmQHV9lChoBkdAijcfRE4NqmgHTegDaAhHQJt5BdQfp2V1fZQoaAZHQJBwnpfQa75oB03oA2gIR0CbetQ6IWP+dX2UKGgGR0CL2diyY5T7aAdN6ANoCEdAm3w5wGW2PXV9lChoBkdAiqaVxsEaEWgHTegDaAhHQJuF4kQf6oF1fZQoaAZHQItNWGh24d9oB03oA2gIR0Cbh1GxUvPDdX2UKGgGR0CLfJYXfqHHaAdN6ANoCEdAm4kdZV4oqnV9lChoBkdAiwjrJKaodmgHTegDaAhHQJuKe10DEFZ1fZQoaAZHQIqXkm2LHdZoB03oA2gIR0CblKkJ8fFKdX2UKGgGR0CKFFhrnDBNaAdN6ANoCEdAm5YYEGJN03V9lChoBkdAi4z22G7Bf2gHTegDaAhHQJuX+rZJ04l1fZQoaAZHQI+v9W0Z3s5oB03oA2gIR0CbmdGYa5wwdX2UKGgGR0CD3Cmv4dp7aAdNiQJoCEdAm6PsbFS88XV9lChoBkdAkbctmcvugGgHTegDaAhHQJukWXrt3Oh1fZQoaAZHQI48eajN6gNoB03oA2gIR0Cbpbn3cpLFdX2UKGgGR0CQB8SDAaegaAdN6ANoCEdAm6d/XsgMdHV9lChoBkdAj0YVKoQ4CWgHTegDaAhHQJuyP7TDwYt1fZQoaAZHQI6uTwBo24xoB03oA2gIR0CbsqnHeaa1dX2UKGgGR0CMLZG6PKdQaAdN6ANoCEdAm7Qh5s0pE3V9lChoBkdAjNmJNbkfcWgHTegDaAhHQJu14qSX+l11fZQoaAZHQIlaiT4cm0FoB03oA2gIR0CbwOwfhddFdX2UKGgGR0COhkacZtN0aAdN6ANoCEdAm8FiBkI5YHV9lChoBkdAjXBKMefZmWgHTegDaAhHQJvC37CSA6N1fZQoaAZHQIoVFfG+9J1oB03oA2gIR0CbxNIVdonKdX2UKGgGR0CMrZx2jfvXaAdN6ANoCEdAm9A7A57w8XV9lChoBkdAjv5FUyYXwmgHTegDaAhHQJvQpW8yvcJ1fZQoaAZHQIwPLronrptoB03oA2gIR0Cb0gTHKfWddX2UKGgGR0CNF7g/C66KaAdN6ANoCEdAm9PjZcs19HV9lChoBkdAj4D3668QI2gHTegDaAhHQJvgQauOjqR1fZQoaAZHQI3gWEqUeMhoB03oA2gIR0Cb4MOXVsk6dX2UKGgGR0CMoiraufVaaAdN6ANoCEdAm+JsrqdH2HV9lChoBkdAjPpQRGtp22gHTegDaAhHQJvkhttQ9A51fZQoaAZHQI90cqYqoZRoB03oA2gIR0Cb72jwQUYbdX2UKGgGR0COuu3974SIaAdN6ANoCEdAm+/edf9gnnV9lChoBkdAiz4Nga3qiWgHTegDaAhHQJvxRO32EkB1fZQoaAZHQI5+9P1tfoloB03oA2gIR0Cb8wFvAGjcdX2UKGgGR0CQWd1LJ0W/aAdN6ANoCEdAm/3V5WzWw3V9lChoBkdAkAybfDUExWgHTegDaAhHQJv+QU34sVd1fZQoaAZHQIwsV6E8JUpoB03oA2gIR0Cb/6yAhB7edX2UKGgGR0CK4locJdB0aAdN6ANoCEdAnAF7XUYsNHV9lChoBkdAjXkC2tuDSWgHTegDaAhHQJwMEzxgAp91fZQoaAZHQIoEkKw6hg5oB03oA2gIR0CcDHyOJcgRdX2UKGgGR0CNy+0ygwoLaAdN6ANoCEdAnA3fqLS/kHV9lChoBkdAjRwkgW8AaWgHTegDaAhHQJwPqGGmDUV1fZQoaAZHQI45AOlO45NoB03oA2gIR0CcGzmCROk+dX2UKGgGR0CJeaJkXk5qaAdN6ANoCEdAnBvvEwWWQnV9lChoBkdAi+4h6Skj5mgHTegDaAhHQJwd7iADq4Z1fZQoaAZHQIzwXYODrZ9oB03oA2gIR0CcH6k/KQq7dX2UKGgGR0CPcMJKraM8aAdN6ANoCEdAnCooVM23rnV9lChoBkdAjcOilSCOFWgHTegDaAhHQJwqj8Jlar51fZQoaAZHQI6954W1twdoB03oA2gIR0CcLBt2cJ+ldX2UKGgGR0CHHGVLzwtraAdN6ANoCEdAnC3yI55qunV9lChoBkdAjf5XOObRW2gHTegDaAhHQJw5DnzQNTd1fZQoaAZHQI1jUohIOH5oB03oA2gIR0CcOXj4pMHsdX2UKGgGR0CQFol0HQhPaAdN6ANoCEdAnDreAEt/WnV9lChoBkdAj0hL30wrUmgHTegDaAhHQJw8phBqsU91fZQoaAZHQI6kZn13+uNoB03oA2gIR0CcSUDFZPl/dX2UKGgGR0CMmDXtjTa1aAdN6ANoCEdAnEmrFwT/Q3V9lChoBkdAjgU7vgFX72gHTegDaAhHQJxLDJOnEVF1fZQoaAZHQI78zLfUF0RoB03oA2gIR0CcTOXko4MndX2UKGgGR0CLyo0fHPu5aAdN6ANoCEdAnFkIS13MZHV9lChoBkdAh/C/WDpTuWgHTegDaAhHQJxZgbzbvgF1fZQoaAZHQI7EU/r0J4VoB03oA2gIR0CcW0xKQJXydX2UKGgGR0CMOs99MK1HaAdN6ANoCEdAnF10CFK02XV9lChoBkdAkJTKNlyzX2gHTegDaAhHQJxpz1lGwzN1fZQoaAZHQI6v/GEPDpFoB03oA2gIR0Ccak5TZQHidX2UKGgGR0CLd97l7tzCaAdN6ANoCEdAnGvv0RODa3V9lChoBkdAjNugTZg5R2gHTegDaAhHQJxt+1x82Jl1fZQoaAZHQJCKrBqKxcFoB03oA2gIR0CceK2ZAprldX2UKGgGR0CP2QiX6ZYxaAdN6ANoCEdAnHkVhPTG53V9lChoBkdAjemPkaMrE2gHTegDaAhHQJx6el3yI551fZQoaAZHQI4sFUn5SFZoB03oA2gIR0CcfDYaYNRWdX2UKGgGR0CN76S9M9KVaAdN6ANoCEdAnIbAUpNKy3V9lChoBkdAj9dtkOI682gHTegDaAhHQJyHLBacI7h1fZQoaAZHQI0U8384xUNoB03oA2gIR0CciJI8yN4rdX2UKGgGR0CNJyKaXrt3aAdN6ANoCEdAnIpTwlSjxnV9lChoBkdAi58nvUjLS2gHTegDaAhHQJyVARbr1NB1fZQoaAZHQIjOjrs0HhVoB03oA2gIR0CclXLqlgtwdX2UKGgGR0CLzWkrPMSsaAdN6ANoCEdAnJb8zEaVEHV9lChoBkdAjvjG4I8hcWgHTegDaAhHQJyYxbr1M/R1fZQoaAZHQIx515t3wCtoB03oA2gIR0Cco4EXLvCudX2UKGgGR0CQClkqc3ERaAdN6ANoCEdAnKP3Wz4UOHV9lChoBkdAkCuwOnVG1GgHTegDaAhHQJylcAQxveh1fZQoaAZHQIwo7AnDziFoB03oA2gIR0Ccp2KuB+WodX2UKGgGR0CPX8kP+XJHaAdN6ANoCEdAnLJDIzWPLnV9lChoBkdAjXZYuK4x12gHTegDaAhHQJyysN9YwIt1fZQoaAZHQI+Oi1y/9HdoB03oA2gIR0CctBlgtvn9dX2UKGgGR0CNR9VwxWT5aAdN6ANoCEdAnLXeQQtjC3V9lChoBkdAi7CMQumJnGgHTegDaAhHQJzAeqXF98Z1fZQoaAZHQIzfnwZwXIloB03oA2gIR0CcwOaDPGADdX2UKGgGR0COTUFW4mTlaAdN6ANoCEdAnMJHxaxHG3V9lChoBkdAjjVZoGpuM2gHTegDaAhHQJzEENqgyuZ1fZQoaAZHQIY7y24NI9VoB03uAmgIR0CczNmuTzNEdX2UKGgGR0CO4KmrKeTWaAdN6ANoCEdAnM6W5paibnV9lChoBkdAjb6lN1yNoGgHTegDaAhHQJzPAxvegth1fZQoaAZHQI2mkLfDUExoB03oA2gIR0Cc0jSxJNCadX2UKGgGR0CNfii7CiyqaAdN6ANoCEdAnNs5NKyv93V9lChoBkdAiT7KA8Swn2gHTegDaAhHQJzdxqqOtGN1fZQoaAZHQI6Cec8TzupoB03oA2gIR0Cc3kHlfZ27dX2UKGgGR0CKi146fapQaAdN6ANoCEdAnOFpYxL0z3VlLg=="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 62500, "n_steps": 8, "gamma": 0.99, "gae_lambda": 0.9, "ent_coef": 0.0, "vf_coef": 0.4, "max_grad_norm": 0.5, "normalize_advantage": false, "system_info": {"OS": "Linux-5.19.0-32-generic-x86_64-with-glibc2.35 #33~22.04.1-Ubuntu SMP PREEMPT_DYNAMIC Mon Jan 30 17:03:34 UTC 2", "Python": "3.9.12", "Stable-Baselines3": "1.5.0", "PyTorch": "1.13.1", "GPU Enabled": "False", "Numpy": "1.21.5", "Gym": "0.21.0"}}
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 978.60454724757, "std_reward": 103.5525640639164, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2023-02-19T20:21:26.833456"}
 
1
+ {"mean_reward": 911.5514172405004, "std_reward": 62.62223687512884, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2023-02-19T23:26:31.802350"}
vec_normalize.pkl CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0bce46a402c7a94ed285298a1616b986427cc0ed6c0068094cae504f656d9ce0
3
  size 2136
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d2c7b2d72079d9102bbc5a74a0e326d382d0b55b0d8469cda58eeb886b78fbea
3
  size 2136