ntinosmg committed on
Commit
8625493
1 Parent(s): f7d2750

Upload PPO LunarLander-v2 agent

Browse files
README.md CHANGED
@@ -8,16 +8,17 @@ tags:
8
  model-index:
9
  - name: PPO
10
  results:
11
- - metrics:
12
- - type: mean_reward
13
- value: 254.13 +/- 18.54
14
- name: mean_reward
15
- task:
16
  type: reinforcement-learning
17
  name: reinforcement-learning
18
  dataset:
19
  name: LunarLander-v2
20
  type: LunarLander-v2
 
 
 
 
 
21
  ---
22
 
23
  # **PPO** Agent playing **LunarLander-v2**
8
  model-index:
9
  - name: PPO
10
  results:
11
+ - task:
 
 
 
 
12
  type: reinforcement-learning
13
  name: reinforcement-learning
14
  dataset:
15
  name: LunarLander-v2
16
  type: LunarLander-v2
17
+ metrics:
18
+ - type: mean_reward
19
+ value: 249.90 +/- 12.94
20
+ name: mean_reward
21
+ verified: false
22
  ---
23
 
24
  # **PPO** Agent playing **LunarLander-v2**
config.json CHANGED
@@ -1 +1 @@
1
- {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param sde_net_arch: Network architecture for extracting features\n when using gSDE. If None, the latent features from the policy will be used.\n Pass an empty list to use the states as features.\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. 
In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7f9375a68950>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f9375a689e0>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f9375a68a70>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f9375a68b00>", "_build": "<function ActorCriticPolicy._build at 0x7f9375a68b90>", "forward": "<function ActorCriticPolicy.forward at 0x7f9375a68c20>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f9375a68cb0>", "_predict": "<function ActorCriticPolicy._predict at 0x7f9375a68d40>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f9375a68dd0>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f9375a68e60>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f9375a68ef0>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc_data object at 0x7f9375a38750>"}, "verbose": 1, "policy_kwargs": {}, "observation_space": {":type:": "<class 'gym.spaces.box.Box'>", ":serialized:": 
"gAWVngEAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBXNoYXBllEsIhZSMA2xvd5SMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYgAAAAAAAAAAAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/lGgKSwiFlIwBQ5R0lFKUjARoaWdolGgSKJYgAAAAAAAAAAAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/lGgKSwiFlGgVdJRSlIwNYm91bmRlZF9iZWxvd5RoEiiWCAAAAAAAAAAAAAAAAAAAAJRoB4wCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZRoFXSUUpSMDWJvdW5kZWRfYWJvdmWUaBIolggAAAAAAAAAAAAAAAAAAACUaCFLCIWUaBV0lFKUjApfbnBfcmFuZG9tlE51Yi4=", "dtype": "float32", "shape": [8], "low": "[-inf -inf -inf -inf -inf -inf -inf -inf]", "high": "[inf inf inf inf inf inf inf inf]", "bounded_below": "[False False False False False False False False]", "bounded_above": "[False False False False False False False False]", "_np_random": null}, "action_space": {":type:": "<class 'gym.spaces.discrete.Discrete'>", ":serialized:": "gAWVgQAAAAAAAACME2d5bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpRLBIwFc2hhcGWUKYwFZHR5cGWUjAVudW1weZRoB5OUjAJpOJSJiIeUUpQoSwOMATyUTk5OSv////9K/////0sAdJRijApfbnBfcmFuZG9tlE51Yi4=", "n": 4, "shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 16, "num_timesteps": 1015808, "_total_timesteps": 1000000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1658858481.9140642, "learning_rate": 0.0003, "tensorboard_log": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": 
"gAWVvwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwNX2J1aWx0aW5fdHlwZZSTlIwKTGFtYmRhVHlwZZSFlFKUKGgCjAhDb2RlVHlwZZSFlFKUKEsBSwBLAUsBSxNDBIgAUwCUToWUKYwBX5SFlIxIL3Vzci9sb2NhbC9saWIvcHl0aG9uMy43L2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5RLgEMCAAGUjAN2YWyUhZQpdJRSlH2UKIwLX19wYWNrYWdlX1+UjBhzdGFibGVfYmFzZWxpbmVzMy5jb21tb26UjAhfX25hbWVfX5SMHnN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi51dGlsc5SMCF9fZmlsZV9flIxIL3Vzci9sb2NhbC9saWIvcHl0aG9uMy43L2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaCB9lH2UKGgXaA6MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgYjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz8zqSowVTJhhZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAALPaED0e+rg/4hExPw23gD6/kLK87p7IuwAAAAAAAAAAc6zUva6Fl7ruT1Q8tVdZNpSxETpmIFI1AACAPwAAAABmesG79nRkuru10rn3aWA1ivW7ulVa9zgAAIA/AACAP03SNz4oWTo/rjVvvs6dfb6k5G29w9MNvQAAAAAAAAAAzSHYPQUO8LuK7Ai9s6H7PFy/OL2QZ849AAAAAAAAgD8a8KA9BDqcP21hJj5RZ6G+7FQHPuoytToAAAAAAAAAAKB9Gb5kF0U+neEAPjR2Nr7LevQ6iyUUPQAAAAAAAAAAM1kRvNIMwLsruYE7STmdPDfewbud2li8AACAPwAAgD/Nt3W9S53ZPWqUiT0B+CW+XI3/PDIP07wAAAAAAAAAADP0Yb14Ick89inVPZxiML7bpY08EoxyPQAAAAAAAAAAzQenvR9N77mGVHk8QZ6INC6rpbrAWPUyAAAAAAAAAADN18c8KbhYukrVKDiGVhMz1uFfuhvCRrcAAIA/AACAP2ZYqL0fvaC5hU3iOjW4DDazEbA6rwwEugAAgD8AAIA/WjjXPdvFAj80RwG+Qd1fvjAx9bvmiZ+5AAAAAAAAAADzk5Q9ObAXP0oPhL1D95u+CNWbPE5mLT0AAAAAAAAAAJoZVDsp2BG6KXDLu8wv8Tcrsq076ckRtwAAgD8AAIA/lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": 
"gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.015808000000000044, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVgRAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIzXUaaSkGYkCUhpRSlIwBbJRN6AOMAXSUR0CR43xZuAI6dX2UKGgGaAloD0MIC+9yEV9dZECUhpRSlGgVTegDaBZHQJHmNHvttyh1fZQoaAZoCWgPQwjiBKbTulNjQJSGlFKUaBVN6ANoFkdAkeiTeXRgJHV9lChoBmgJaA9DCNnr3R/vTSnAlIaUUpRoFU0lAWgWR0CR+xWOp84QdX2UKGgGaAloD0MIsi0DztKNZkCUhpRSlGgVTegDaBZHQJH8BMSK3ux1fZQoaAZoCWgPQwhuTiUDwAdjQJSGlFKUaBVN6ANoFkdAkgNBjSXt0HV9lChoBmgJaA9DCNRkxtvK7mRAlIaUUpRoFU3oA2gWR0CSD5A5Jbt7dX2UKGgGaAloD0MIyECeXT7CY0CUhpRSlGgVTegDaBZHQJIPvdGiHqN1fZQoaAZoCWgPQwhv10tTBLVfQJSGlFKUaBVN6ANoFkdAkhbFqzqrzXV9lChoBmgJaA9DCFqEYitoy2RAlIaUUpRoFU3oA2gWR0CSGYIT4+KTdX2UKGgGaAloD0MIem8MAcAab0CUhpRSlGgVTY0CaBZHQJIdAtL+PzZ1fZQoaAZoCWgPQwhOm3Eaoo1kQJSGlFKUaBVN6ANoFkdAkiJjMJQcgnV9lChoBmgJaA9DCBFuMqoMHmNAlIaUUpRoFU3oA2gWR0CSJ7OH31zydX2UKGgGaAloD0MI6fAQxs8nYkCUhpRSlGgVTegDaBZHQJIn+0kWykd1fZQoaAZoCWgPQwgsLLgf8DdeQJSGlFKUaBVN6ANoFkdAkitHVG0/nnV9lChoBmgJaA9DCLBUF/Ay3m5AlIaUUpRoFU15AWgWR0CSL+z67/XHdX2UKGgGaAloD0MI58b0hKVfZkCUhpRSlGgVTegDaBZHQJIwAgxJul51fZQoaAZoCWgPQwiSWb3D7StlQJSGlFKUaBVN6ANoFkdAkjBnAEdNnHV9lChoBmgJaA9DCLa8cr1tbGVAlIaUUpRoFU3oA2gWR0CSNOBZZB9kdX2UKGgGaAloD0MIyLWhYhzIbECUhpRSlGgVTboDaBZHQJI2M8Tzund1fZQoaAZoCWgPQwgvv9NkRtFgQJSGlFKUaBVN6ANoFkdAkjc00iyIHnV9lChoBmgJaA9DCIszhjnBBWZAlIaUUpRoFU3oA2gWR0CSN5f0VafSdX2UKGgGaAloD0MI/B2KAn2na0CUhpRSlGgVTW0CaBZHQJJNOZ1FH8V1fZQoaAZoCWgPQwhvERjrW+NwQJSGlFKUaBVNmANoFkdAkk10m6XjVHV9lChoBmgJaA9DCBJMNbOW2m5AlIaUUpRoFU31AWgWR0CSUNqCYkVvdX2UKGgGaAloD0MIZVHYRdHKb0CUhpRSlGgVTUMD
aBZHQJJSVQVKwpx1fZQoaAZoCWgPQwgNNQpJpiNxQJSGlFKUaBVNHwFoFkdAklcUx7AtWnV9lChoBmgJaA9DCLHCLR9J025AlIaUUpRoFU1jAWgWR0CSWcgVGkN4dX2UKGgGaAloD0MIJLa7B2j7YUCUhpRSlGgVTegDaBZHQJJb0S+QEIR1fZQoaAZoCWgPQwg+k/3ztLFjQJSGlFKUaBVN6ANoFkdAkmo+4kNWl3V9lChoBmgJaA9DCEXXhR+com1AlIaUUpRoFU1/AWgWR0CSapYnOSntdX2UKGgGaAloD0MIZ/M4DOafcECUhpRSlGgVTZcBaBZHQJJxl1uBMBZ1fZQoaAZoCWgPQwjyKJXwRKpwQJSGlFKUaBVNvANoFkdAknMl4s3AEnV9lChoBmgJaA9DCNO84xSdJmNAlIaUUpRoFU3oA2gWR0CSdWgHNX5ndX2UKGgGaAloD0MIMSQnE7fHW0CUhpRSlGgVTegDaBZHQJJ43WEsasJ1fZQoaAZoCWgPQwhqwCDpk/FwQJSGlFKUaBVN9AJoFkdAknre/tY0VXV9lChoBmgJaA9DCN16TQ8K+mVAlIaUUpRoFU3oA2gWR0CSfRGEwnIAdX2UKGgGaAloD0MI2Ne61Ai8YUCUhpRSlGgVTegDaBZHQJJ9JbNbC791fZQoaAZoCWgPQwhBYrt7gD5kQJSGlFKUaBVN6ANoFkdAkn146CDmKnV9lChoBmgJaA9DCEhwI2WLSmNAlIaUUpRoFU3oA2gWR0CSgwS2H+IedX2UKGgGaAloD0MI1VqYhfb2YkCUhpRSlGgVTegDaBZHQJKDcnkT6BR1fZQoaAZoCWgPQwj9TShEwHFkQJSGlFKUaBVN6ANoFkdAkpmyKekHlnV9lChoBmgJaA9DCJ29M9oqEGFAlIaUUpRoFU3oA2gWR0CSnhi6g/TtdX2UKGgGaAloD0MIgxPRr626akCUhpRSlGgVTUoDaBZHQJKgLsVtXPt1fZQoaAZoCWgPQwgF+dnI9fdwQJSGlFKUaBVNbQFoFkdAkqO0it7rs3V9lChoBmgJaA9DCFLzVfIxNXFAlIaUUpRoFU3VAWgWR0CSpt6OHWSVdX2UKGgGaAloD0MIteGwNPDPXECUhpRSlGgVTegDaBZHQJKnSFFlTWJ1fZQoaAZoCWgPQwipFhHFZIptQJSGlFKUaBVNyAFoFkdAkqhczl90BHV9lChoBmgJaA9DCOokW10OT3FAlIaUUpRoFU0iAWgWR0CSqgq1w5vMdX2UKGgGaAloD0MIeqaXGItbcECUhpRSlGgVTaoCaBZHQJKq2OuJUHZ1fZQoaAZoCWgPQwjRWtHmOItrQJSGlFKUaBVNeAFoFkdAkqrzkdV/+nV9lChoBmgJaA9DCDi/YaJBwm1AlIaUUpRoFU3tAmgWR0CSr+Mqz7djdX2UKGgGaAloD0MIdOygElf6Y0CUhpRSlGgVTegDaBZHQJKzqCDmKZV1fZQoaAZoCWgPQwjpmzQNCpZhQJSGlFKUaBVN6ANoFkdAkrPsyBTXKHV9lChoBmgJaA9DCCHp0yr6h29AlIaUUpRoFU2PAWgWR0CSuHDyvs7ddX2UKGgGaAloD0MI3L3cJ8c4YECUhpRSlGgVTegDaBZHQJK53W+XZ5B1fZQoaAZoCWgPQwhTWRR2kcRxQJSGlFKUaBVNAQJoFkdAkrtBc/t6X3V9lChoBmgJaA9DCG0ANiBCl25AlIaUUpRoFU1vAWgWR0CSvb+LWI43dX2UKGgGaAloD0MI598u+3V+b0CUhpRSlGgVTboDaBZHQJK+AY64lQd1fZQoaAZoCWgPQwjGwaVjzohsQJSGlFKUaBVNgwJoFkdAksAFhPTG53V9lChoBmgJaA9DCJ2dDI4Sa2BAlIaUUpRoFU3oA2gWR0CSxEBGQSzxdX2UKGgGaAloD0MIDag3o+YTZkCUhpRSlGgVTegDaBZHQJLLWQYDT0B1fZQoaAZoCWgPQwix
wi0fyXRxQJSGlFKUaBVNAQJoFkdAkstslHBk7XV9lChoBmgJaA9DCHODoQ6r7GxAlIaUUpRoFU3PAWgWR0CSzMPVNHpbdX2UKGgGaAloD0MIJh5QNmUIbkCUhpRSlGgVTYcBaBZHQJLNr24/eLx1fZQoaAZoCWgPQwhBRkCFI2ptQJSGlFKUaBVNawFoFkdAks77Zi/fwnV9lChoBmgJaA9DCIYgByXM6G5AlIaUUpRoFU38AmgWR0CSz0j9XLeRdX2UKGgGaAloD0MIeTpXlJJAbECUhpRSlGgVTdoBaBZHQJLnvJW/8EV1fZQoaAZoCWgPQwjHSPYIdcNxQJSGlFKUaBVNAQNoFkdAkufqjSG8EnV9lChoBmgJaA9DCO+NIQC4r29AlIaUUpRoFU2tAWgWR0CS6V90zTF3dX2UKGgGaAloD0MIyAiocIQwa0CUhpRSlGgVTWADaBZHQJLqDcDbJwN1fZQoaAZoCWgPQwgA4xk0dCpuQJSGlFKUaBVNcQNoFkdAkux9hRZU1nV9lChoBmgJaA9DCNo8DoP5JUhAlIaUUpRoFU0zAWgWR0CS75MHKOktdX2UKGgGaAloD0MI+rfLft2cZUCUhpRSlGgVTegDaBZHQJLv4oy9EkV1fZQoaAZoCWgPQwgBUMWNW9huQJSGlFKUaBVNKQJoFkdAkvG0BOpKjHV9lChoBmgJaA9DCMDnhxHCOmxAlIaUUpRoFU36AWgWR0CS819EkSmJdX2UKGgGaAloD0MIqP3WThS9bUCUhpRSlGgVTY0CaBZHQJL0Mk0Jng51fZQoaAZoCWgPQwj1aRX9IcluQJSGlFKUaBVNmAFoFkdAkvZkFGG21HV9lChoBmgJaA9DCNJT5BAxinBAlIaUUpRoFU3bAWgWR0CS98TN+so2dX2UKGgGaAloD0MIelORCuMvbkCUhpRSlGgVTeYBaBZHQJL5ZppN9IB1fZQoaAZoCWgPQwgNMzSeSPdxQJSGlFKUaBVNngFoFkdAkvwNqUNayXV9lChoBmgJaA9DCOkrSDMWZ2NAlIaUUpRoFU3oA2gWR0CS/DYq5LAYdX2UKGgGaAloD0MIisvxCkTJUECUhpRSlGgVTQcBaBZHQJL8p4/u9e11fZQoaAZoCWgPQwjLhcq/FrNyQJSGlFKUaBVNoAFoFkdAkv2o3WFvh3V9lChoBmgJaA9DCNfCLLTzBHFAlIaUUpRoFU1tAWgWR0CS/jWjXWe6dX2UKGgGaAloD0MITwRxHk6kOECUhpRSlGgVTR0BaBZHQJL/CACnxax1fZQoaAZoCWgPQwh+Vpkprc8awJSGlFKUaBVNBQFoFkdAkwN1j/dZaHV9lChoBmgJaA9DCCZUcHhBOHFAlIaUUpRoFU18AWgWR0CTBLgRsdkrdX2UKGgGaAloD0MI+8qD9FTkcECUhpRSlGgVTcACaBZHQJMFJTisGPh1fZQoaAZoCWgPQwi6vg8HCVlvQJSGlFKUaBVNSAJoFkdAkwVpzT4L1HV9lChoBmgJaA9DCIhJuJBHjXFAlIaUUpRoFU1/AmgWR0CTBdTdLxqgdX2UKGgGaAloD0MIsBu2LUqQckCUhpRSlGgVTa8BaBZHQJMHVmh/RVp1fZQoaAZoCWgPQwgmHeVgNnVtQJSGlFKUaBVNXAFoFkdAkwhKol2NenV9lChoBmgJaA9DCMuGNZVFyXBAlIaUUpRoFU0tAmgWR0CTCIR5kbxWdX2UKGgGaAloD0MIAJATJkwucUCUhpRSlGgVTVQBaBZHQJMJ9sbedkJ1fZQoaAZoCWgPQwjc8pGUdGNyQJSGlFKUaBVNTQNoFkdAkwor3Cbc5HV9lChoBmgJaA9DCOl/uRYt3GxAlIaUUpRoFU1ZAWgWR0CTC+osI3R5dX2UKGgGaAloD0MI2V92T56vb0CUhpRSlGgVTf8BaBZHQJML/iYLLIR1fZQoaAZoCWgPQwg89N2trJpuQJSGlFKUaBVN0AFoFkdAkxBM
WGh24nV9lChoBmgJaA9DCExSmWIOQ3BAlIaUUpRoFU3QAWgWR0CTEfk5IYm+dWUu"}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 248, "n_steps": 1024, "gamma": 0.999, "gae_lambda": 0.98, "ent_coef": 0.01, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 4, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWVvwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwNX2J1aWx0aW5fdHlwZZSTlIwKTGFtYmRhVHlwZZSFlFKUKGgCjAhDb2RlVHlwZZSFlFKUKEsBSwBLAUsBSxNDBIgAUwCUToWUKYwBX5SFlIxIL3Vzci9sb2NhbC9saWIvcHl0aG9uMy43L2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5RLgEMCAAGUjAN2YWyUhZQpdJRSlH2UKIwLX19wYWNrYWdlX1+UjBhzdGFibGVfYmFzZWxpbmVzMy5jb21tb26UjAhfX25hbWVfX5SMHnN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi51dGlsc5SMCF9fZmlsZV9flIxIL3Vzci9sb2NhbC9saWIvcHl0aG9uMy43L2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaCB9lH2UKGgXaA6MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgYjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz/JmZmZmZmahZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "system_info": {"OS": "Linux-5.4.188+-x86_64-with-Ubuntu-18.04-bionic #1 SMP Sun Apr 24 10:03:06 PDT 2022", "Python": "3.7.13", "Stable-Baselines3": "1.6.0", "PyTorch": "1.12.0+cu113", "GPU Enabled": "True", "Numpy": "1.21.6", "Gym": "0.17.3"}}
1
+ {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param sde_net_arch: Network architecture for extracting features\n when using gSDE. If None, the latent features from the policy will be used.\n Pass an empty list to use the states as features.\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. 
In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7f736e7cdf70>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f736e754040>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f736e7540d0>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f736e754160>", "_build": "<function ActorCriticPolicy._build at 0x7f736e7541f0>", "forward": "<function ActorCriticPolicy.forward at 0x7f736e754280>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f736e754310>", "_predict": "<function ActorCriticPolicy._predict at 0x7f736e7543a0>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f736e754430>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f736e7544c0>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f736e754550>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc_data object at 0x7f736e7d1120>"}, "verbose": 1, "policy_kwargs": {}, "observation_space": {":type:": "<class 'gym.spaces.box.Box'>", ":serialized:": 
"gAWVnwEAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLCIWUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWIAAAAAAAAAAAAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/5RoCksIhZSMAUOUdJRSlIwEaGlnaJRoEiiWIAAAAAAAAAAAAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAf5RoCksIhZRoFXSUUpSMDWJvdW5kZWRfYmVsb3eUaBIolggAAAAAAAAAAAAAAAAAAACUaAeMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLCIWUaBV0lFKUjA1ib3VuZGVkX2Fib3ZllGgSKJYIAAAAAAAAAAAAAAAAAAAAlGghSwiFlGgVdJRSlIwKX25wX3JhbmRvbZROdWIu", "dtype": "float32", "_shape": [8], "low": "[-inf -inf -inf -inf -inf -inf -inf -inf]", "high": "[inf inf inf inf inf inf inf inf]", "bounded_below": "[False False False False False False False False]", "bounded_above": "[False False False False False False False False]", "_np_random": null}, "action_space": {":type:": "<class 'gym.spaces.discrete.Discrete'>", ":serialized:": "gAWVggAAAAAAAACME2d5bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpRLBIwGX3NoYXBllCmMBWR0eXBllIwFbnVtcHmUaAeTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYowKX25wX3JhbmRvbZROdWIu", "n": 4, "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 16, "num_timesteps": 1015808, "_total_timesteps": 1000000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1670418421450258399, "learning_rate": 0.0003, "tensorboard_log": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": 
"gAWVwwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOC9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS4BDAgABlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOC9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoFmgNjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoF4wHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/M6kqMFUyYYWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="}, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAMDF7z17a5U/sxiOPmJIm74rdRg+w6IZPgAAAAAAAAAAAJGkPcO5Nrpm3fA6UQCLNcD6WDolpwu6AACAPwAAgD/NtBk9H4W1NmmfN7gHZMK2HInVul0s1TYAAIA/AACAP03Vxz3DzVK61EMCvK8VJ7VNcA27d1ijNAAAgD8AAIA/jaIrPpW0Xj5i1ES+Xot5viEJNr0O4as9AAAAAAAAAADNUgk8+QIzPvbIeL0CRoS+YroOPbrRj70AAAAAAAAAAGaH7jz2fCy6oitLOq/hKTWCoFI6GDFruQAAgD8AAIA/DTeKvfZ8L7ridQ667eePtAtxK7lH7ic5AACAPwAAgD+AmAE99oRaupYQOLt3/M03Z7Kxuh4m+zkAAIA/AACAPw3VAD5KLJA/ShGBPoFOp762S849IRerPQAAAAAAAAAAWu/PveHAh7o9Fh43hsEIMuCzQ7luiTi2AACAPwAAAAAzZ7E9uH7jOPaMxzWR2BQ2xMFfOkp3NLUAAIA/AAAAAI2fuz2Pxk+6Bt/pukA4FbZ+Cqw6++8EOgAAgD8AAIA/AF/7vOlZfD6QJXw9RBFovputSDuSuXY9AAAAAAAAAACmr5W9e6aBuj3yZ7v1UpE2XcWOOrZDhzoAAIA/AACAP014NL179ou66iphO5m6lzgIXiS6oi0FugAAgD8AAIA/lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": 
"gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.015808000000000044, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVfhAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIuf3yyQrpY0CUhpRSlIwBbJRN6AOMAXSUR0CQr5qI7/4qdX2UKGgGaAloD0MIY7g6AGLqY0CUhpRSlGgVTegDaBZHQJCwcBaLXMB1fZQoaAZoCWgPQwi0Hr5MFEJfQJSGlFKUaBVN6ANoFkdAkLQZnL7oCHV9lChoBmgJaA9DCO571F+vZ15AlIaUUpRoFU3oA2gWR0CQuqXbuc+adX2UKGgGaAloD0MIrd9MTJeiYECUhpRSlGgVTegDaBZHQJC942n889x1fZQoaAZoCWgPQwhnuWx0TlJmQJSGlFKUaBVN6ANoFkdAkL5d2ki2UnV9lChoBmgJaA9DCBJMNbOWEGtAlIaUUpRoFU2yA2gWR0CQwPPrv9cbdX2UKGgGaAloD0MIDjDzHfxoTECUhpRSlGgVS/xoFkdAkMOS/fwZwXV9lChoBmgJaA9DCDZbecn/IGNAlIaUUpRoFU3oA2gWR0CQxZpQk5ZKdX2UKGgGaAloD0MIW+uLhLZ8XkCUhpRSlGgVTegDaBZHQJDHKaZx7zF1fZQoaAZoCWgPQwgKEXAI1WpiQJSGlFKUaBVN6ANoFkdAkNCcPatcOnV9lChoBmgJaA9DCH/3jhoT1GRAlIaUUpRoFU3oA2gWR0CQ0e8Aq/dqdX2UKGgGaAloD0MIDJOpglHCXkCUhpRSlGgVTegDaBZHQJDYLEcbR4R1fZQoaAZoCWgPQwjbpQ2HJWJgQJSGlFKUaBVN6ANoFkdAkNoTakAPu3V9lChoBmgJaA9DCAGG5c+3UmVAlIaUUpRoFU3oA2gWR0CQ9eAFPi1idX2UKGgGaAloD0MIX5Z2aq6FZECUhpRSlGgVTegDaBZHQJD2iCjDbah1fZQoaAZoCWgPQwhAogkUscJkQJSGlFKUaBVN6ANoFkdAkQBEbT+efHV9lChoBmgJaA9DCCU+d4L9DWFAlIaUUpRoFU3oA2gWR0CRAJVZcLSedX2UKGgGaAloD0MIrp6T3rcEZkCUhpRSlGgVTegDaBZHQJEBbWbwz+F1fZQoaAZoCWgPQwg8wf7r3OVkQJSGlFKUaBVN6ANoFkdAkQtpEc81XXV9lChoBmgJaA9DCKaAtP8BcWZAlIaUUpRoFU3oA2gWR0CRDnaFEiMYdX2UKGgGaAloD0MI1VxuMFRAZkCUhpRSlGgVTegDaBZHQJEO7gQ6IWR1fZQoaAZoCWgPQwi7mdGPhhVnQJSGlFKUaBVN6ANoFkdAkRGIRAbADnV9lChoBmgJaA9DCPSHZp5cyU5AlIaUUpRoFU0tAWgWR0CRE6SkTHsDdX2UKGgGaAloD0MICr/Uz5s6YkCUhpRSlGgVTegDaBZHQJEUMY51eSl1fZQoaAZoCWgPQwgHswkwrE1kQJSGlFKUaBVN6ANo
FkdAkRXlLeyiVXV9lChoBmgJaA9DCCZV203w6WFAlIaUUpRoFU3oA2gWR0CRF2nLJSzgdX2UKGgGaAloD0MIqwfMQybMYECUhpRSlGgVTegDaBZHQJEf196Tnq51fZQoaAZoCWgPQwhSRfEq68xkQJSGlFKUaBVN6ANoFkdAkSEryH2ys3V9lChoBmgJaA9DCGCxhovc+2FAlIaUUpRoFU3oA2gWR0CRJ2Ssr/bTdX2UKGgGaAloD0MIizVc5J5EZECUhpRSlGgVTegDaBZHQJEpOLgn+hp1fZQoaAZoCWgPQwi+TurL0ixfQJSGlFKUaBVN6ANoFkdAkUQNmxt52XV9lChoBmgJaA9DCNWytb5IW11AlIaUUpRoFU3oA2gWR0CRRJ12aDwpdX2UKGgGaAloD0MIgEi/fZ0IZECUhpRSlGgVTegDaBZHQJFNkeU6gdx1fZQoaAZoCWgPQwhwQEtXsOFeQJSGlFKUaBVN6ANoFkdAkU3RmkFfRnV9lChoBmgJaA9DCK5JtyVy9WZAlIaUUpRoFU3oA2gWR0CRWMJng5zYdX2UKGgGaAloD0MIvXMoQ1WTY0CUhpRSlGgVTegDaBZHQJFcGqfe1rt1fZQoaAZoCWgPQwigGFkyx31jQJSGlFKUaBVN6ANoFkdAkVydbkfcOHV9lChoBmgJaA9DCPPn24Kl9F9AlIaUUpRoFU3oA2gWR0CRX2DF6zE8dX2UKGgGaAloD0MIfA4sR8hRXUCUhpRSlGgVTegDaBZHQJFhmQJXyRV1fZQoaAZoCWgPQwgeNSbE3GNmQJSGlFKUaBVN6ANoFkdAkWIvM8ox6HV9lChoBmgJaA9DCK3AkNWtgmFAlIaUUpRoFU3oA2gWR0CRZAt7rs0IdX2UKGgGaAloD0MIAFKbODkPYUCUhpRSlGgVTegDaBZHQJFlokOZssR1fZQoaAZoCWgPQwgoSddMvitlQJSGlFKUaBVN6ANoFkdAkW+JccENfHV9lChoBmgJaA9DCC13ZoJhDmJAlIaUUpRoFU3oA2gWR0CRcPvSMLncdX2UKGgGaAloD0MIVS+/02SsYkCUhpRSlGgVTegDaBZHQJF3/vv0AcV1fZQoaAZoCWgPQwj76xUW3N5fQJSGlFKUaBVN6ANoFkdAkXni0jTrmnV9lChoBmgJaA9DCACpTZzc4V1AlIaUUpRoFU3oA2gWR0CRlWqz7di2dX2UKGgGaAloD0MIjDBFuTQmZkCUhpRSlGgVTegDaBZHQJGWA4HX2/V1fZQoaAZoCWgPQwinrnyW5ytlQJSGlFKUaBVN6ANoFkdAkZ9668QI2XV9lChoBmgJaA9DCGB2Tx4WCVtAlIaUUpRoFU3oA2gWR0CRn74mkWRBdX2UKGgGaAloD0MIJbIPsqzpZECUhpRSlGgVTegDaBZHQJGqkjOcDr91fZQoaAZoCWgPQwiASSpTTK9jQJSGlFKUaBVN6ANoFkdAka4JZbILgHV9lChoBmgJaA9DCJjg1AeSaGRAlIaUUpRoFU3oA2gWR0CRrox4ptrLdX2UKGgGaAloD0MILSRgdPnQYUCUhpRSlGgVTegDaBZHQJGxSW3Sa3J1fZQoaAZoCWgPQwiGjh1U4iBeQJSGlFKUaBVN6ANoFkdAkbNKHsTnJXV9lChoBmgJaA9DCKWEYFW9ZmVAlIaUUpRoFU3oA2gWR0CRs9iZfD1odX2UKGgGaAloD0MIfewuUNLDZUCUhpRSlGgVTegDaBZHQJG1hun/DLt1fZQoaAZoCWgPQwjwTdNnh1pgQJSGlFKUaBVN6ANoFkdAkbbaHbh3q3V9lChoBmgJaA9DCLEYda29LUxAlIaUUpRoFUvhaBZHQJG3YzbeuV51fZQoaAZoCWgPQwiXj6Skh8JkQJSGlFKUaBVN6ANoFkdAkb6/+GXXy3V9lChoBmgJaA9DCNrlWx9WJ2NAlIaUUpRoFU3oA2gWR0CRv/3lCCz1dX2UKGgGaAloD0MIG9e/
6zMOY0CUhpRSlGgVTegDaBZHQJHF03FUADJ1fZQoaAZoCWgPQwimSL4SyLdjQJSGlFKUaBVN6ANoFkdAkceNVWCEpXV9lChoBmgJaA9DCNcYdELop15AlIaUUpRoFU3oA2gWR0CR4iNVinYQdX2UKGgGaAloD0MIkXwlkBL2ZECUhpRSlGgVTegDaBZHQJHisZMtbs51fZQoaAZoCWgPQwjN5nEYzOhfQJSGlFKUaBVN6ANoFkdAkesyXD3ueHV9lChoBmgJaA9DCJCg+DFmaWNAlIaUUpRoFU3oA2gWR0CR62w6QvHtdX2UKGgGaAloD0MIbVSnA9ncYkCUhpRSlGgVTegDaBZHQJH5H2wmmch1fZQoaAZoCWgPQwhpq5LIPiJdQJSGlFKUaBVN6ANoFkdAkfmoQe3hGnV9lChoBmgJaA9DCAJHAg02C1xAlIaUUpRoFU3oA2gWR0CR/DrTH80ldX2UKGgGaAloD0MI2UKQgxKoZECUhpRSlGgVTegDaBZHQJH+RbJOnEV1fZQoaAZoCWgPQwhPyTmxhw5kQJSGlFKUaBVN6ANoFkdAkf7Qtrbg0nV9lChoBmgJaA9DCOZ2L/fJPVxAlIaUUpRoFU3oA2gWR0CSAHLlFMIvdX2UKGgGaAloD0MIoMTnTjCMY0CUhpRSlGgVTegDaBZHQJIB0RwqAjJ1fZQoaAZoCWgPQwhqM05D1BllQJSGlFKUaBVN6ANoFkdAkgJipeeFtnV9lChoBmgJaA9DCIRnQpPE62FAlIaUUpRoFU3oA2gWR0CSCmiyY5T7dX2UKGgGaAloD0MIwO0JEltKZUCUhpRSlGgVTegDaBZHQJILn1L8Jld1fZQoaAZoCWgPQwg0SSwp999iQJSGlFKUaBVN6ANoFkdAkhGH+ERJ3HV9lChoBmgJaA9DCO9Z12i5GGBAlIaUUpRoFU3oA2gWR0CSE0N+so2GdX2UKGgGaAloD0MIzox+NJyvY0CUhpRSlGgVTegDaBZHQJIb1B/qgRN1fZQoaAZoCWgPQwis4/ih0q9jQJSGlFKUaBVN6ANoFkdAkhx4zrNW2nV9lChoBmgJaA9DCA1yF2GKV2NAlIaUUpRoFU3oA2gWR0CSN9kQPI4mdX2UKGgGaAloD0MI0zJS7ykfYkCUhpRSlGgVTegDaBZHQJI4FWsA/9p1fZQoaAZoCWgPQwhOfLWjOFpiQJSGlFKUaBVN6ANoFkdAkkWlpblijXV9lChoBmgJaA9DCAk4hCq1zGFAlIaUUpRoFU3oA2gWR0CSRhyBClabdX2UKGgGaAloD0MIr3d/vFeBSUCUhpRSlGgVS/1oFkdAkkcxKg7HQ3V9lChoBmgJaA9DCKVneokx+WNAlIaUUpRoFU3oA2gWR0CSSLADq4YrdX2UKGgGaAloD0MI04cuqG/XZ0CUhpRSlGgVTegDaBZHQJJKrYxtYSx1fZQoaAZoCWgPQwi/YDdsW7djQJSGlFKUaBVN6ANoFkdAkktMibDuSnV9lChoBmgJaA9DCIC5Fi1AOGJAlIaUUpRoFU3oA2gWR0CSTQVqesgddX2UKGgGaAloD0MIqb7zi5LiZUCUhpRSlGgVTegDaBZHQJJOZC/oJRh1fZQoaAZoCWgPQwjByMua2LllQJSGlFKUaBVN6ANoFkdAkk7tPpIMB3V9lChoBmgJaA9DCD1DOGbZBWVAlIaUUpRoFU3oA2gWR0CSVegccU/OdX2UKGgGaAloD0MIhnXj3ZFKYUCUhpRSlGgVTegDaBZHQJJXArrgOz91fZQoaAZoCWgPQwg5Y5gTtEZgQJSGlFKUaBVN6ANoFkdAkl0iw4bS7XV9lChoBmgJaA9DCCZRL/g032tAlIaUUpRoFU2mAWgWR0CSXsVZs9B9dX2UKGgGaAloD0MIPnWsUvrEY0CUhpRSlGgVTegDaBZHQJJe98XvYvp1fZQoaAZoCWgPQwjzdRn+UwplQJSGlFKUaBVN6ANoFkdAkmdWT1TR
6XV9lChoBmgJaA9DCAADQYCM32JAlIaUUpRoFU3oA2gWR0CSZ/WTot+TdWUu"}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 248, "n_steps": 1024, "gamma": 0.999, "gae_lambda": 0.98, "ent_coef": 0.01, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 4, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWVwwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOC9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS4BDAgABlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOC9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoFmgNjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoF4wHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/yZmZmZmZmoWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "system_info": {"OS": "Linux-5.10.133+-x86_64-with-glibc2.27 #1 SMP Fri Aug 26 08:44:51 UTC 2022", "Python": "3.8.15", "Stable-Baselines3": "1.6.2", "PyTorch": "1.12.1+cu113", "GPU Enabled": "True", "Numpy": "1.21.6", "Gym": "0.21.0"}}
ppo-LunarLander-v2.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:75ab15e1f1204e6dc264180626a90a29cbf8911eee9af0601db3aef194c3f8f5
3
- size 147144
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:63e20496f1d3e8917393169d1d9be7f1e82c5dc28b893dbe66e7e881e62f7a52
3
+ size 147150
ppo-LunarLander-v2/_stable_baselines3_version CHANGED
@@ -1 +1 @@
1
- 1.6.0
1
+ 1.6.2
ppo-LunarLander-v2/data CHANGED
@@ -4,27 +4,27 @@
4
  ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
5
  "__module__": "stable_baselines3.common.policies",
6
  "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param sde_net_arch: Network architecture for extracting features\n when using gSDE. If None, the latent features from the policy will be used.\n Pass an empty list to use the states as features.\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
7
- "__init__": "<function ActorCriticPolicy.__init__ at 0x7f9375a68950>",
8
- "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f9375a689e0>",
9
- "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f9375a68a70>",
10
- "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f9375a68b00>",
11
- "_build": "<function ActorCriticPolicy._build at 0x7f9375a68b90>",
12
- "forward": "<function ActorCriticPolicy.forward at 0x7f9375a68c20>",
13
- "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f9375a68cb0>",
14
- "_predict": "<function ActorCriticPolicy._predict at 0x7f9375a68d40>",
15
- "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f9375a68dd0>",
16
- "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f9375a68e60>",
17
- "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f9375a68ef0>",
18
  "__abstractmethods__": "frozenset()",
19
- "_abc_impl": "<_abc_data object at 0x7f9375a38750>"
20
  },
21
  "verbose": 1,
22
  "policy_kwargs": {},
23
  "observation_space": {
24
  ":type:": "<class 'gym.spaces.box.Box'>",
25
- ":serialized:": "gAWVngEAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBXNoYXBllEsIhZSMA2xvd5SMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYgAAAAAAAAAAAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/lGgKSwiFlIwBQ5R0lFKUjARoaWdolGgSKJYgAAAAAAAAAAAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/lGgKSwiFlGgVdJRSlIwNYm91bmRlZF9iZWxvd5RoEiiWCAAAAAAAAAAAAAAAAAAAAJRoB4wCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZRoFXSUUpSMDWJvdW5kZWRfYWJvdmWUaBIolggAAAAAAAAAAAAAAAAAAACUaCFLCIWUaBV0lFKUjApfbnBfcmFuZG9tlE51Yi4=",
26
  "dtype": "float32",
27
- "shape": [
28
  8
29
  ],
30
  "low": "[-inf -inf -inf -inf -inf -inf -inf -inf]",
@@ -35,9 +35,9 @@
35
  },
36
  "action_space": {
37
  ":type:": "<class 'gym.spaces.discrete.Discrete'>",
38
- ":serialized:": "gAWVgQAAAAAAAACME2d5bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpRLBIwFc2hhcGWUKYwFZHR5cGWUjAVudW1weZRoB5OUjAJpOJSJiIeUUpQoSwOMATyUTk5OSv////9K/////0sAdJRijApfbnBfcmFuZG9tlE51Yi4=",
39
  "n": 4,
40
- "shape": [],
41
  "dtype": "int64",
42
  "_np_random": null
43
  },
@@ -47,16 +47,16 @@
47
  "_num_timesteps_at_start": 0,
48
  "seed": null,
49
  "action_noise": null,
50
- "start_time": 1658858481.9140642,
51
  "learning_rate": 0.0003,
52
  "tensorboard_log": null,
53
  "lr_schedule": {
54
  ":type:": "<class 'function'>",
55
- ":serialized:": "gAWVvwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwNX2J1aWx0aW5fdHlwZZSTlIwKTGFtYmRhVHlwZZSFlFKUKGgCjAhDb2RlVHlwZZSFlFKUKEsBSwBLAUsBSxNDBIgAUwCUToWUKYwBX5SFlIxIL3Vzci9sb2NhbC9saWIvcHl0aG9uMy43L2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5RLgEMCAAGUjAN2YWyUhZQpdJRSlH2UKIwLX19wYWNrYWdlX1+UjBhzdGFibGVfYmFzZWxpbmVzMy5jb21tb26UjAhfX25hbWVfX5SMHnN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi51dGlsc5SMCF9fZmlsZV9flIxIL3Vzci9sb2NhbC9saWIvcHl0aG9uMy43L2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaCB9lH2UKGgXaA6MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgYjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz8zqSowVTJhhZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"
56
  },
57
  "_last_obs": {
58
  ":type:": "<class 'numpy.ndarray'>",
59
- ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAALPaED0e+rg/4hExPw23gD6/kLK87p7IuwAAAAAAAAAAc6zUva6Fl7ruT1Q8tVdZNpSxETpmIFI1AACAPwAAAABmesG79nRkuru10rn3aWA1ivW7ulVa9zgAAIA/AACAP03SNz4oWTo/rjVvvs6dfb6k5G29w9MNvQAAAAAAAAAAzSHYPQUO8LuK7Ai9s6H7PFy/OL2QZ849AAAAAAAAgD8a8KA9BDqcP21hJj5RZ6G+7FQHPuoytToAAAAAAAAAAKB9Gb5kF0U+neEAPjR2Nr7LevQ6iyUUPQAAAAAAAAAAM1kRvNIMwLsruYE7STmdPDfewbud2li8AACAPwAAgD/Nt3W9S53ZPWqUiT0B+CW+XI3/PDIP07wAAAAAAAAAADP0Yb14Ick89inVPZxiML7bpY08EoxyPQAAAAAAAAAAzQenvR9N77mGVHk8QZ6INC6rpbrAWPUyAAAAAAAAAADN18c8KbhYukrVKDiGVhMz1uFfuhvCRrcAAIA/AACAP2ZYqL0fvaC5hU3iOjW4DDazEbA6rwwEugAAgD8AAIA/WjjXPdvFAj80RwG+Qd1fvjAx9bvmiZ+5AAAAAAAAAADzk5Q9ObAXP0oPhL1D95u+CNWbPE5mLT0AAAAAAAAAAJoZVDsp2BG6KXDLu8wv8Tcrsq076ckRtwAAgD8AAIA/lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="
60
  },
61
  "_last_episode_starts": {
62
  ":type:": "<class 'numpy.ndarray'>",
@@ -69,7 +69,7 @@
69
  "_current_progress_remaining": -0.015808000000000044,
70
  "ep_info_buffer": {
71
  ":type:": "<class 'collections.deque'>",
72
- ":serialized:": "gAWVgRAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIzXUaaSkGYkCUhpRSlIwBbJRN6AOMAXSUR0CR43xZuAI6dX2UKGgGaAloD0MIC+9yEV9dZECUhpRSlGgVTegDaBZHQJHmNHvttyh1fZQoaAZoCWgPQwjiBKbTulNjQJSGlFKUaBVN6ANoFkdAkeiTeXRgJHV9lChoBmgJaA9DCNnr3R/vTSnAlIaUUpRoFU0lAWgWR0CR+xWOp84QdX2UKGgGaAloD0MIsi0DztKNZkCUhpRSlGgVTegDaBZHQJH8BMSK3ux1fZQoaAZoCWgPQwhuTiUDwAdjQJSGlFKUaBVN6ANoFkdAkgNBjSXt0HV9lChoBmgJaA9DCNRkxtvK7mRAlIaUUpRoFU3oA2gWR0CSD5A5Jbt7dX2UKGgGaAloD0MIyECeXT7CY0CUhpRSlGgVTegDaBZHQJIPvdGiHqN1fZQoaAZoCWgPQwhv10tTBLVfQJSGlFKUaBVN6ANoFkdAkhbFqzqrzXV9lChoBmgJaA9DCFqEYitoy2RAlIaUUpRoFU3oA2gWR0CSGYIT4+KTdX2UKGgGaAloD0MIem8MAcAab0CUhpRSlGgVTY0CaBZHQJIdAtL+PzZ1fZQoaAZoCWgPQwhOm3Eaoo1kQJSGlFKUaBVN6ANoFkdAkiJjMJQcgnV9lChoBmgJaA9DCBFuMqoMHmNAlIaUUpRoFU3oA2gWR0CSJ7OH31zydX2UKGgGaAloD0MI6fAQxs8nYkCUhpRSlGgVTegDaBZHQJIn+0kWykd1fZQoaAZoCWgPQwgsLLgf8DdeQJSGlFKUaBVN6ANoFkdAkitHVG0/nnV9lChoBmgJaA9DCLBUF/Ay3m5AlIaUUpRoFU15AWgWR0CSL+z67/XHdX2UKGgGaAloD0MI58b0hKVfZkCUhpRSlGgVTegDaBZHQJIwAgxJul51fZQoaAZoCWgPQwiSWb3D7StlQJSGlFKUaBVN6ANoFkdAkjBnAEdNnHV9lChoBmgJaA9DCLa8cr1tbGVAlIaUUpRoFU3oA2gWR0CSNOBZZB9kdX2UKGgGaAloD0MIyLWhYhzIbECUhpRSlGgVTboDaBZHQJI2M8Tzund1fZQoaAZoCWgPQwgvv9NkRtFgQJSGlFKUaBVN6ANoFkdAkjc00iyIHnV9lChoBmgJaA9DCIszhjnBBWZAlIaUUpRoFU3oA2gWR0CSN5f0VafSdX2UKGgGaAloD0MI/B2KAn2na0CUhpRSlGgVTW0CaBZHQJJNOZ1FH8V1fZQoaAZoCWgPQwhvERjrW+NwQJSGlFKUaBVNmANoFkdAkk10m6XjVHV9lChoBmgJaA9DCBJMNbOW2m5AlIaUUpRoFU31AWgWR0CSUNqCYkVvdX2UKGgGaAloD0MIZVHYRdHKb0CUhpRSlGgVTUMDaBZHQJJSVQVKwpx1fZQoaAZoCWgPQwgNNQpJpiNxQJSGlFKUaBVNHwFoFkdAklcUx7AtWnV9lChoBmgJaA9DCLHCLR9J025AlIaUUpRoFU1jAWgWR0CSWcgVGkN4dX2UKGgGaAloD0MIJLa7B2j7YUCUhpRSlGgVTegDaBZHQJJb0S+QEIR1fZQoaAZoCWgPQwg+k/3ztLFjQJSGlFKUaBVN6ANoFkdAkmo+4kNWl3V9lChoBmgJaA9DCEXXhR+com1AlIaUUpRoFU1/AWgWR0CSapYnOSntdX2UKGgGaAloD0MIZ/M4DOafcECUhpRSlGgVTZcBaBZHQJJxl1uBMBZ1fZQoaAZoCWgPQwjyKJXwRKpwQJSGlFKUaBVNvANoFkdAknMl4s3AE
nV9lChoBmgJaA9DCNO84xSdJmNAlIaUUpRoFU3oA2gWR0CSdWgHNX5ndX2UKGgGaAloD0MIMSQnE7fHW0CUhpRSlGgVTegDaBZHQJJ43WEsasJ1fZQoaAZoCWgPQwhqwCDpk/FwQJSGlFKUaBVN9AJoFkdAknre/tY0VXV9lChoBmgJaA9DCN16TQ8K+mVAlIaUUpRoFU3oA2gWR0CSfRGEwnIAdX2UKGgGaAloD0MI2Ne61Ai8YUCUhpRSlGgVTegDaBZHQJJ9JbNbC791fZQoaAZoCWgPQwhBYrt7gD5kQJSGlFKUaBVN6ANoFkdAkn146CDmKnV9lChoBmgJaA9DCEhwI2WLSmNAlIaUUpRoFU3oA2gWR0CSgwS2H+IedX2UKGgGaAloD0MI1VqYhfb2YkCUhpRSlGgVTegDaBZHQJKDcnkT6BR1fZQoaAZoCWgPQwj9TShEwHFkQJSGlFKUaBVN6ANoFkdAkpmyKekHlnV9lChoBmgJaA9DCJ29M9oqEGFAlIaUUpRoFU3oA2gWR0CSnhi6g/TtdX2UKGgGaAloD0MIgxPRr626akCUhpRSlGgVTUoDaBZHQJKgLsVtXPt1fZQoaAZoCWgPQwgF+dnI9fdwQJSGlFKUaBVNbQFoFkdAkqO0it7rs3V9lChoBmgJaA9DCFLzVfIxNXFAlIaUUpRoFU3VAWgWR0CSpt6OHWSVdX2UKGgGaAloD0MIteGwNPDPXECUhpRSlGgVTegDaBZHQJKnSFFlTWJ1fZQoaAZoCWgPQwipFhHFZIptQJSGlFKUaBVNyAFoFkdAkqhczl90BHV9lChoBmgJaA9DCOokW10OT3FAlIaUUpRoFU0iAWgWR0CSqgq1w5vMdX2UKGgGaAloD0MIeqaXGItbcECUhpRSlGgVTaoCaBZHQJKq2OuJUHZ1fZQoaAZoCWgPQwjRWtHmOItrQJSGlFKUaBVNeAFoFkdAkqrzkdV/+nV9lChoBmgJaA9DCDi/YaJBwm1AlIaUUpRoFU3tAmgWR0CSr+Mqz7djdX2UKGgGaAloD0MIdOygElf6Y0CUhpRSlGgVTegDaBZHQJKzqCDmKZV1fZQoaAZoCWgPQwjpmzQNCpZhQJSGlFKUaBVN6ANoFkdAkrPsyBTXKHV9lChoBmgJaA9DCCHp0yr6h29AlIaUUpRoFU2PAWgWR0CSuHDyvs7ddX2UKGgGaAloD0MI3L3cJ8c4YECUhpRSlGgVTegDaBZHQJK53W+XZ5B1fZQoaAZoCWgPQwhTWRR2kcRxQJSGlFKUaBVNAQJoFkdAkrtBc/t6X3V9lChoBmgJaA9DCG0ANiBCl25AlIaUUpRoFU1vAWgWR0CSvb+LWI43dX2UKGgGaAloD0MI598u+3V+b0CUhpRSlGgVTboDaBZHQJK+AY64lQd1fZQoaAZoCWgPQwjGwaVjzohsQJSGlFKUaBVNgwJoFkdAksAFhPTG53V9lChoBmgJaA9DCJ2dDI4Sa2BAlIaUUpRoFU3oA2gWR0CSxEBGQSzxdX2UKGgGaAloD0MIDag3o+YTZkCUhpRSlGgVTegDaBZHQJLLWQYDT0B1fZQoaAZoCWgPQwixwi0fyXRxQJSGlFKUaBVNAQJoFkdAkstslHBk7XV9lChoBmgJaA9DCHODoQ6r7GxAlIaUUpRoFU3PAWgWR0CSzMPVNHpbdX2UKGgGaAloD0MIJh5QNmUIbkCUhpRSlGgVTYcBaBZHQJLNr24/eLx1fZQoaAZoCWgPQwhBRkCFI2ptQJSGlFKUaBVNawFoFkdAks77Zi/fwnV9lChoBmgJaA9DCIYgByXM6G5AlIaUUpRoFU38AmgWR0CSz0j9XLeRdX2UKGgGaAloD0MIeTpXlJJAbECUhpRSlGgVTdoBaBZHQJLnvJW/8EV1fZQoaAZoCWgPQwjHSPYIdcNxQJSGlFKUaBVNAQNoFkdAkufqjSG8EnV9lChoBmgJaA9DCO+NIQC4r29AlIaUU
pRoFU2tAWgWR0CS6V90zTF3dX2UKGgGaAloD0MIyAiocIQwa0CUhpRSlGgVTWADaBZHQJLqDcDbJwN1fZQoaAZoCWgPQwgA4xk0dCpuQJSGlFKUaBVNcQNoFkdAkux9hRZU1nV9lChoBmgJaA9DCNo8DoP5JUhAlIaUUpRoFU0zAWgWR0CS75MHKOktdX2UKGgGaAloD0MI+rfLft2cZUCUhpRSlGgVTegDaBZHQJLv4oy9EkV1fZQoaAZoCWgPQwgBUMWNW9huQJSGlFKUaBVNKQJoFkdAkvG0BOpKjHV9lChoBmgJaA9DCMDnhxHCOmxAlIaUUpRoFU36AWgWR0CS819EkSmJdX2UKGgGaAloD0MIqP3WThS9bUCUhpRSlGgVTY0CaBZHQJL0Mk0Jng51fZQoaAZoCWgPQwj1aRX9IcluQJSGlFKUaBVNmAFoFkdAkvZkFGG21HV9lChoBmgJaA9DCNJT5BAxinBAlIaUUpRoFU3bAWgWR0CS98TN+so2dX2UKGgGaAloD0MIelORCuMvbkCUhpRSlGgVTeYBaBZHQJL5ZppN9IB1fZQoaAZoCWgPQwgNMzSeSPdxQJSGlFKUaBVNngFoFkdAkvwNqUNayXV9lChoBmgJaA9DCOkrSDMWZ2NAlIaUUpRoFU3oA2gWR0CS/DYq5LAYdX2UKGgGaAloD0MIisvxCkTJUECUhpRSlGgVTQcBaBZHQJL8p4/u9e11fZQoaAZoCWgPQwjLhcq/FrNyQJSGlFKUaBVNoAFoFkdAkv2o3WFvh3V9lChoBmgJaA9DCNfCLLTzBHFAlIaUUpRoFU1tAWgWR0CS/jWjXWe6dX2UKGgGaAloD0MITwRxHk6kOECUhpRSlGgVTR0BaBZHQJL/CACnxax1fZQoaAZoCWgPQwh+Vpkprc8awJSGlFKUaBVNBQFoFkdAkwN1j/dZaHV9lChoBmgJaA9DCCZUcHhBOHFAlIaUUpRoFU18AWgWR0CTBLgRsdkrdX2UKGgGaAloD0MI+8qD9FTkcECUhpRSlGgVTcACaBZHQJMFJTisGPh1fZQoaAZoCWgPQwi6vg8HCVlvQJSGlFKUaBVNSAJoFkdAkwVpzT4L1HV9lChoBmgJaA9DCIhJuJBHjXFAlIaUUpRoFU1/AmgWR0CTBdTdLxqgdX2UKGgGaAloD0MIsBu2LUqQckCUhpRSlGgVTa8BaBZHQJMHVmh/RVp1fZQoaAZoCWgPQwgmHeVgNnVtQJSGlFKUaBVNXAFoFkdAkwhKol2NenV9lChoBmgJaA9DCMuGNZVFyXBAlIaUUpRoFU0tAmgWR0CTCIR5kbxWdX2UKGgGaAloD0MIAJATJkwucUCUhpRSlGgVTVQBaBZHQJMJ9sbedkJ1fZQoaAZoCWgPQwjc8pGUdGNyQJSGlFKUaBVNTQNoFkdAkwor3Cbc5HV9lChoBmgJaA9DCOl/uRYt3GxAlIaUUpRoFU1ZAWgWR0CTC+osI3R5dX2UKGgGaAloD0MI2V92T56vb0CUhpRSlGgVTf8BaBZHQJML/iYLLIR1fZQoaAZoCWgPQwg89N2trJpuQJSGlFKUaBVN0AFoFkdAkxBMWGh24nV9lChoBmgJaA9DCExSmWIOQ3BAlIaUUpRoFU3QAWgWR0CTEfk5IYm+dWUu"
73
  },
74
  "ep_success_buffer": {
75
  ":type:": "<class 'collections.deque'>",
@@ -86,7 +86,7 @@
86
  "n_epochs": 4,
87
  "clip_range": {
88
  ":type:": "<class 'function'>",
89
- ":serialized:": "gAWVvwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwNX2J1aWx0aW5fdHlwZZSTlIwKTGFtYmRhVHlwZZSFlFKUKGgCjAhDb2RlVHlwZZSFlFKUKEsBSwBLAUsBSxNDBIgAUwCUToWUKYwBX5SFlIxIL3Vzci9sb2NhbC9saWIvcHl0aG9uMy43L2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5RLgEMCAAGUjAN2YWyUhZQpdJRSlH2UKIwLX19wYWNrYWdlX1+UjBhzdGFibGVfYmFzZWxpbmVzMy5jb21tb26UjAhfX25hbWVfX5SMHnN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi51dGlsc5SMCF9fZmlsZV9flIxIL3Vzci9sb2NhbC9saWIvcHl0aG9uMy43L2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaCB9lH2UKGgXaA6MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgYjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz/JmZmZmZmahZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"
90
  },
91
  "clip_range_vf": null,
92
  "normalize_advantage": true,
4
  ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
5
  "__module__": "stable_baselines3.common.policies",
6
  "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param sde_net_arch: Network architecture for extracting features\n when using gSDE. If None, the latent features from the policy will be used.\n Pass an empty list to use the states as features.\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
7
+ "__init__": "<function ActorCriticPolicy.__init__ at 0x7f736e7cdf70>",
8
+ "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f736e754040>",
9
+ "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f736e7540d0>",
10
+ "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f736e754160>",
11
+ "_build": "<function ActorCriticPolicy._build at 0x7f736e7541f0>",
12
+ "forward": "<function ActorCriticPolicy.forward at 0x7f736e754280>",
13
+ "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f736e754310>",
14
+ "_predict": "<function ActorCriticPolicy._predict at 0x7f736e7543a0>",
15
+ "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f736e754430>",
16
+ "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f736e7544c0>",
17
+ "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f736e754550>",
18
  "__abstractmethods__": "frozenset()",
19
+ "_abc_impl": "<_abc_data object at 0x7f736e7d1120>"
20
  },
21
  "verbose": 1,
22
  "policy_kwargs": {},
23
  "observation_space": {
24
  ":type:": "<class 'gym.spaces.box.Box'>",
25
+ ":serialized:": "gAWVnwEAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLCIWUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWIAAAAAAAAAAAAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/5RoCksIhZSMAUOUdJRSlIwEaGlnaJRoEiiWIAAAAAAAAAAAAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAf5RoCksIhZRoFXSUUpSMDWJvdW5kZWRfYmVsb3eUaBIolggAAAAAAAAAAAAAAAAAAACUaAeMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLCIWUaBV0lFKUjA1ib3VuZGVkX2Fib3ZllGgSKJYIAAAAAAAAAAAAAAAAAAAAlGghSwiFlGgVdJRSlIwKX25wX3JhbmRvbZROdWIu",
26
  "dtype": "float32",
27
+ "_shape": [
28
  8
29
  ],
30
  "low": "[-inf -inf -inf -inf -inf -inf -inf -inf]",
35
  },
36
  "action_space": {
37
  ":type:": "<class 'gym.spaces.discrete.Discrete'>",
38
+ ":serialized:": "gAWVggAAAAAAAACME2d5bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpRLBIwGX3NoYXBllCmMBWR0eXBllIwFbnVtcHmUaAeTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYowKX25wX3JhbmRvbZROdWIu",
39
  "n": 4,
40
+ "_shape": [],
41
  "dtype": "int64",
42
  "_np_random": null
43
  },
47
  "_num_timesteps_at_start": 0,
48
  "seed": null,
49
  "action_noise": null,
50
+ "start_time": 1670418421450258399,
51
  "learning_rate": 0.0003,
52
  "tensorboard_log": null,
53
  "lr_schedule": {
54
  ":type:": "<class 'function'>",
55
+ ":serialized:": "gAWVwwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOC9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS4BDAgABlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOC9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoFmgNjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoF4wHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/M6kqMFUyYYWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="
56
  },
57
  "_last_obs": {
58
  ":type:": "<class 'numpy.ndarray'>",
59
+ ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAMDF7z17a5U/sxiOPmJIm74rdRg+w6IZPgAAAAAAAAAAAJGkPcO5Nrpm3fA6UQCLNcD6WDolpwu6AACAPwAAgD/NtBk9H4W1NmmfN7gHZMK2HInVul0s1TYAAIA/AACAP03Vxz3DzVK61EMCvK8VJ7VNcA27d1ijNAAAgD8AAIA/jaIrPpW0Xj5i1ES+Xot5viEJNr0O4as9AAAAAAAAAADNUgk8+QIzPvbIeL0CRoS+YroOPbrRj70AAAAAAAAAAGaH7jz2fCy6oitLOq/hKTWCoFI6GDFruQAAgD8AAIA/DTeKvfZ8L7ridQ667eePtAtxK7lH7ic5AACAPwAAgD+AmAE99oRaupYQOLt3/M03Z7Kxuh4m+zkAAIA/AACAPw3VAD5KLJA/ShGBPoFOp762S849IRerPQAAAAAAAAAAWu/PveHAh7o9Fh43hsEIMuCzQ7luiTi2AACAPwAAAAAzZ7E9uH7jOPaMxzWR2BQ2xMFfOkp3NLUAAIA/AAAAAI2fuz2Pxk+6Bt/pukA4FbZ+Cqw6++8EOgAAgD8AAIA/AF/7vOlZfD6QJXw9RBFovputSDuSuXY9AAAAAAAAAACmr5W9e6aBuj3yZ7v1UpE2XcWOOrZDhzoAAIA/AACAP014NL179ou66iphO5m6lzgIXiS6oi0FugAAgD8AAIA/lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="
60
  },
61
  "_last_episode_starts": {
62
  ":type:": "<class 'numpy.ndarray'>",
69
  "_current_progress_remaining": -0.015808000000000044,
70
  "ep_info_buffer": {
71
  ":type:": "<class 'collections.deque'>",
72
+ ":serialized:": "gAWVfhAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIuf3yyQrpY0CUhpRSlIwBbJRN6AOMAXSUR0CQr5qI7/4qdX2UKGgGaAloD0MIY7g6AGLqY0CUhpRSlGgVTegDaBZHQJCwcBaLXMB1fZQoaAZoCWgPQwi0Hr5MFEJfQJSGlFKUaBVN6ANoFkdAkLQZnL7oCHV9lChoBmgJaA9DCO571F+vZ15AlIaUUpRoFU3oA2gWR0CQuqXbuc+adX2UKGgGaAloD0MIrd9MTJeiYECUhpRSlGgVTegDaBZHQJC942n889x1fZQoaAZoCWgPQwhnuWx0TlJmQJSGlFKUaBVN6ANoFkdAkL5d2ki2UnV9lChoBmgJaA9DCBJMNbOWEGtAlIaUUpRoFU2yA2gWR0CQwPPrv9cbdX2UKGgGaAloD0MIDjDzHfxoTECUhpRSlGgVS/xoFkdAkMOS/fwZwXV9lChoBmgJaA9DCDZbecn/IGNAlIaUUpRoFU3oA2gWR0CQxZpQk5ZKdX2UKGgGaAloD0MIW+uLhLZ8XkCUhpRSlGgVTegDaBZHQJDHKaZx7zF1fZQoaAZoCWgPQwgKEXAI1WpiQJSGlFKUaBVN6ANoFkdAkNCcPatcOnV9lChoBmgJaA9DCH/3jhoT1GRAlIaUUpRoFU3oA2gWR0CQ0e8Aq/dqdX2UKGgGaAloD0MIDJOpglHCXkCUhpRSlGgVTegDaBZHQJDYLEcbR4R1fZQoaAZoCWgPQwjbpQ2HJWJgQJSGlFKUaBVN6ANoFkdAkNoTakAPu3V9lChoBmgJaA9DCAGG5c+3UmVAlIaUUpRoFU3oA2gWR0CQ9eAFPi1idX2UKGgGaAloD0MIX5Z2aq6FZECUhpRSlGgVTegDaBZHQJD2iCjDbah1fZQoaAZoCWgPQwhAogkUscJkQJSGlFKUaBVN6ANoFkdAkQBEbT+efHV9lChoBmgJaA9DCCU+d4L9DWFAlIaUUpRoFU3oA2gWR0CRAJVZcLSedX2UKGgGaAloD0MIrp6T3rcEZkCUhpRSlGgVTegDaBZHQJEBbWbwz+F1fZQoaAZoCWgPQwg8wf7r3OVkQJSGlFKUaBVN6ANoFkdAkQtpEc81XXV9lChoBmgJaA9DCKaAtP8BcWZAlIaUUpRoFU3oA2gWR0CRDnaFEiMYdX2UKGgGaAloD0MI1VxuMFRAZkCUhpRSlGgVTegDaBZHQJEO7gQ6IWR1fZQoaAZoCWgPQwi7mdGPhhVnQJSGlFKUaBVN6ANoFkdAkRGIRAbADnV9lChoBmgJaA9DCPSHZp5cyU5AlIaUUpRoFU0tAWgWR0CRE6SkTHsDdX2UKGgGaAloD0MICr/Uz5s6YkCUhpRSlGgVTegDaBZHQJEUMY51eSl1fZQoaAZoCWgPQwgHswkwrE1kQJSGlFKUaBVN6ANoFkdAkRXlLeyiVXV9lChoBmgJaA9DCCZV203w6WFAlIaUUpRoFU3oA2gWR0CRF2nLJSzgdX2UKGgGaAloD0MIqwfMQybMYECUhpRSlGgVTegDaBZHQJEf196Tnq51fZQoaAZoCWgPQwhSRfEq68xkQJSGlFKUaBVN6ANoFkdAkSEryH2ys3V9lChoBmgJaA9DCGCxhovc+2FAlIaUUpRoFU3oA2gWR0CRJ2Ssr/bTdX2UKGgGaAloD0MIizVc5J5EZECUhpRSlGgVTegDaBZHQJEpOLgn+hp1fZQoaAZoCWgPQwi+TurL0ixfQJSGlFKUaBVN6ANoFkdAkUQNmxt52XV9lChoBmgJaA9DCNWytb5IW11AlIaUUpRoFU3oA2gWR0CRRJ12aDwpd
X2UKGgGaAloD0MIgEi/fZ0IZECUhpRSlGgVTegDaBZHQJFNkeU6gdx1fZQoaAZoCWgPQwhwQEtXsOFeQJSGlFKUaBVN6ANoFkdAkU3RmkFfRnV9lChoBmgJaA9DCK5JtyVy9WZAlIaUUpRoFU3oA2gWR0CRWMJng5zYdX2UKGgGaAloD0MIvXMoQ1WTY0CUhpRSlGgVTegDaBZHQJFcGqfe1rt1fZQoaAZoCWgPQwigGFkyx31jQJSGlFKUaBVN6ANoFkdAkVydbkfcOHV9lChoBmgJaA9DCPPn24Kl9F9AlIaUUpRoFU3oA2gWR0CRX2DF6zE8dX2UKGgGaAloD0MIfA4sR8hRXUCUhpRSlGgVTegDaBZHQJFhmQJXyRV1fZQoaAZoCWgPQwgeNSbE3GNmQJSGlFKUaBVN6ANoFkdAkWIvM8ox6HV9lChoBmgJaA9DCK3AkNWtgmFAlIaUUpRoFU3oA2gWR0CRZAt7rs0IdX2UKGgGaAloD0MIAFKbODkPYUCUhpRSlGgVTegDaBZHQJFlokOZssR1fZQoaAZoCWgPQwgoSddMvitlQJSGlFKUaBVN6ANoFkdAkW+JccENfHV9lChoBmgJaA9DCC13ZoJhDmJAlIaUUpRoFU3oA2gWR0CRcPvSMLncdX2UKGgGaAloD0MIVS+/02SsYkCUhpRSlGgVTegDaBZHQJF3/vv0AcV1fZQoaAZoCWgPQwj76xUW3N5fQJSGlFKUaBVN6ANoFkdAkXni0jTrmnV9lChoBmgJaA9DCACpTZzc4V1AlIaUUpRoFU3oA2gWR0CRlWqz7di2dX2UKGgGaAloD0MIjDBFuTQmZkCUhpRSlGgVTegDaBZHQJGWA4HX2/V1fZQoaAZoCWgPQwinrnyW5ytlQJSGlFKUaBVN6ANoFkdAkZ9668QI2XV9lChoBmgJaA9DCGB2Tx4WCVtAlIaUUpRoFU3oA2gWR0CRn74mkWRBdX2UKGgGaAloD0MIJbIPsqzpZECUhpRSlGgVTegDaBZHQJGqkjOcDr91fZQoaAZoCWgPQwiASSpTTK9jQJSGlFKUaBVN6ANoFkdAka4JZbILgHV9lChoBmgJaA9DCJjg1AeSaGRAlIaUUpRoFU3oA2gWR0CRrox4ptrLdX2UKGgGaAloD0MILSRgdPnQYUCUhpRSlGgVTegDaBZHQJGxSW3Sa3J1fZQoaAZoCWgPQwiGjh1U4iBeQJSGlFKUaBVN6ANoFkdAkbNKHsTnJXV9lChoBmgJaA9DCKWEYFW9ZmVAlIaUUpRoFU3oA2gWR0CRs9iZfD1odX2UKGgGaAloD0MIfewuUNLDZUCUhpRSlGgVTegDaBZHQJG1hun/DLt1fZQoaAZoCWgPQwjwTdNnh1pgQJSGlFKUaBVN6ANoFkdAkbbaHbh3q3V9lChoBmgJaA9DCLEYda29LUxAlIaUUpRoFUvhaBZHQJG3YzbeuV51fZQoaAZoCWgPQwiXj6Skh8JkQJSGlFKUaBVN6ANoFkdAkb6/+GXXy3V9lChoBmgJaA9DCNrlWx9WJ2NAlIaUUpRoFU3oA2gWR0CRv/3lCCz1dX2UKGgGaAloD0MIG9e/6zMOY0CUhpRSlGgVTegDaBZHQJHF03FUADJ1fZQoaAZoCWgPQwimSL4SyLdjQJSGlFKUaBVN6ANoFkdAkceNVWCEpXV9lChoBmgJaA9DCNcYdELop15AlIaUUpRoFU3oA2gWR0CR4iNVinYQdX2UKGgGaAloD0MIkXwlkBL2ZECUhpRSlGgVTegDaBZHQJHisZMtbs51fZQoaAZoCWgPQwjN5nEYzOhfQJSGlFKUaBVN6ANoFkdAkesyXD3ueHV9lChoBmgJaA9DCJCg+DFmaWNAlIaUUpRoFU3oA2gWR0CR62w6QvHtdX2UKGgGaAloD0MIbVSnA9ncYkCUhpRSlGgVTegDaBZHQJH5H2wmmch1fZQoaAZoCWgPQwhpq5LIPiJdQJSGlFKUa
BVN6ANoFkdAkfmoQe3hGnV9lChoBmgJaA9DCAJHAg02C1xAlIaUUpRoFU3oA2gWR0CR/DrTH80ldX2UKGgGaAloD0MI2UKQgxKoZECUhpRSlGgVTegDaBZHQJH+RbJOnEV1fZQoaAZoCWgPQwhPyTmxhw5kQJSGlFKUaBVN6ANoFkdAkf7Qtrbg0nV9lChoBmgJaA9DCOZ2L/fJPVxAlIaUUpRoFU3oA2gWR0CSAHLlFMIvdX2UKGgGaAloD0MIoMTnTjCMY0CUhpRSlGgVTegDaBZHQJIB0RwqAjJ1fZQoaAZoCWgPQwhqM05D1BllQJSGlFKUaBVN6ANoFkdAkgJipeeFtnV9lChoBmgJaA9DCIRnQpPE62FAlIaUUpRoFU3oA2gWR0CSCmiyY5T7dX2UKGgGaAloD0MIwO0JEltKZUCUhpRSlGgVTegDaBZHQJILn1L8Jld1fZQoaAZoCWgPQwg0SSwp999iQJSGlFKUaBVN6ANoFkdAkhGH+ERJ3HV9lChoBmgJaA9DCO9Z12i5GGBAlIaUUpRoFU3oA2gWR0CSE0N+so2GdX2UKGgGaAloD0MIzox+NJyvY0CUhpRSlGgVTegDaBZHQJIb1B/qgRN1fZQoaAZoCWgPQwis4/ih0q9jQJSGlFKUaBVN6ANoFkdAkhx4zrNW2nV9lChoBmgJaA9DCA1yF2GKV2NAlIaUUpRoFU3oA2gWR0CSN9kQPI4mdX2UKGgGaAloD0MI0zJS7ykfYkCUhpRSlGgVTegDaBZHQJI4FWsA/9p1fZQoaAZoCWgPQwhOfLWjOFpiQJSGlFKUaBVN6ANoFkdAkkWlpblijXV9lChoBmgJaA9DCAk4hCq1zGFAlIaUUpRoFU3oA2gWR0CSRhyBClabdX2UKGgGaAloD0MIr3d/vFeBSUCUhpRSlGgVS/1oFkdAkkcxKg7HQ3V9lChoBmgJaA9DCKVneokx+WNAlIaUUpRoFU3oA2gWR0CSSLADq4YrdX2UKGgGaAloD0MI04cuqG/XZ0CUhpRSlGgVTegDaBZHQJJKrYxtYSx1fZQoaAZoCWgPQwi/YDdsW7djQJSGlFKUaBVN6ANoFkdAkktMibDuSnV9lChoBmgJaA9DCIC5Fi1AOGJAlIaUUpRoFU3oA2gWR0CSTQVqesgddX2UKGgGaAloD0MIqb7zi5LiZUCUhpRSlGgVTegDaBZHQJJOZC/oJRh1fZQoaAZoCWgPQwjByMua2LllQJSGlFKUaBVN6ANoFkdAkk7tPpIMB3V9lChoBmgJaA9DCD1DOGbZBWVAlIaUUpRoFU3oA2gWR0CSVegccU/OdX2UKGgGaAloD0MIhnXj3ZFKYUCUhpRSlGgVTegDaBZHQJJXArrgOz91fZQoaAZoCWgPQwg5Y5gTtEZgQJSGlFKUaBVN6ANoFkdAkl0iw4bS7XV9lChoBmgJaA9DCCZRL/g032tAlIaUUpRoFU2mAWgWR0CSXsVZs9B9dX2UKGgGaAloD0MIPnWsUvrEY0CUhpRSlGgVTegDaBZHQJJe98XvYvp1fZQoaAZoCWgPQwjzdRn+UwplQJSGlFKUaBVN6ANoFkdAkmdWT1TR6XV9lChoBmgJaA9DCAADQYCM32JAlIaUUpRoFU3oA2gWR0CSZ/WTot+TdWUu"
73
  },
74
  "ep_success_buffer": {
75
  ":type:": "<class 'collections.deque'>",
86
  "n_epochs": 4,
87
  "clip_range": {
88
  ":type:": "<class 'function'>",
89
+ ":serialized:": "gAWVwwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOC9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS4BDAgABlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOC9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoFmgNjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoF4wHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/yZmZmZmZmoWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="
90
  },
91
  "clip_range_vf": null,
92
  "normalize_advantage": true,
ppo-LunarLander-v2/policy.optimizer.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4d92e24601e3f31f5d301a84b22da266e278b3bbf2393ed3bb2c8962fa121712
3
  size 87865
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:41b9b8278d1b9f1e3325173f8c479cca60312e9b58ebea517b00407b45ab93a2
3
  size 87865
ppo-LunarLander-v2/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9cb18bde5f418fa03f65ac89765127ef2d68330fa395ef11202d8ca62063922f
3
  size 43201
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2615305a72ff3561578b3d02f177c59d57e6a5b17fe28c60c8c9c50675359881
3
  size 43201
ppo-LunarLander-v2/system_info.txt CHANGED
@@ -1,7 +1,7 @@
1
- OS: Linux-5.4.188+-x86_64-with-Ubuntu-18.04-bionic #1 SMP Sun Apr 24 10:03:06 PDT 2022
2
- Python: 3.7.13
3
- Stable-Baselines3: 1.6.0
4
- PyTorch: 1.12.0+cu113
5
  GPU Enabled: True
6
  Numpy: 1.21.6
7
- Gym: 0.17.3
1
+ OS: Linux-5.10.133+-x86_64-with-glibc2.27 #1 SMP Fri Aug 26 08:44:51 UTC 2022
2
+ Python: 3.8.15
3
+ Stable-Baselines3: 1.6.2
4
+ PyTorch: 1.12.1+cu113
5
  GPU Enabled: True
6
  Numpy: 1.21.6
7
+ Gym: 0.21.0
replay.mp4 CHANGED
Binary files a/replay.mp4 and b/replay.mp4 differ
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 254.12968476857185, "std_reward": 18.544371676441052, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2022-07-26T18:41:23.437511"}
1
+ {"mean_reward": 249.9023040223091, "std_reward": 12.935156030646995, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2022-12-07T13:30:21.036493"}