745H1N committed on
Commit
c743750
1 Parent(s): 4927163

lunar lander v2 with ppo epochs (10) timesteps (500,000 -> 1,000,000)

Browse files
README.md CHANGED
@@ -10,7 +10,7 @@ model-index:
10
  results:
11
  - metrics:
12
  - type: mean_reward
13
- value: 230.34 +/- 17.55
14
  name: mean_reward
15
  task:
16
  type: reinforcement-learning
 
10
  results:
11
  - metrics:
12
  - type: mean_reward
13
+ value: 271.03 +/- 12.91
14
  name: mean_reward
15
  task:
16
  type: reinforcement-learning
config.json CHANGED
@@ -1 +1 @@
1
- {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param sde_net_arch: Network architecture for extracting features\n when using gSDE. If None, the latent features from the policy will be used.\n Pass an empty list to use the states as features.\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. 
In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7f7629c25ef0>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f7629c25f80>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f7629c2b050>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f7629c2b0e0>", "_build": "<function ActorCriticPolicy._build at 0x7f7629c2b170>", "forward": "<function ActorCriticPolicy.forward at 0x7f7629c2b200>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f7629c2b290>", "_predict": "<function ActorCriticPolicy._predict at 0x7f7629c2b320>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f7629c2b3b0>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f7629c2b440>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f7629c2b4d0>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc_data object at 0x7f7629c75a50>"}, "verbose": 1, "policy_kwargs": {}, "observation_space": {":type:": "<class 'gym.spaces.box.Box'>", ":serialized:": 
"gAWVnwEAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLCIWUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWIAAAAAAAAAAAAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/5RoCksIhZSMAUOUdJRSlIwEaGlnaJRoEiiWIAAAAAAAAAAAAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAf5RoCksIhZRoFXSUUpSMDWJvdW5kZWRfYmVsb3eUaBIolggAAAAAAAAAAAAAAAAAAACUaAeMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLCIWUaBV0lFKUjA1ib3VuZGVkX2Fib3ZllGgSKJYIAAAAAAAAAAAAAAAAAAAAlGghSwiFlGgVdJRSlIwKX25wX3JhbmRvbZROdWIu", "dtype": "float32", "_shape": [8], "low": "[-inf -inf -inf -inf -inf -inf -inf -inf]", "high": "[inf inf inf inf inf inf inf inf]", "bounded_below": "[False False False False False False False False]", "bounded_above": "[False False False False False False False False]", "_np_random": null}, "action_space": {":type:": "<class 'gym.spaces.discrete.Discrete'>", ":serialized:": "gAWVggAAAAAAAACME2d5bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpRLBIwGX3NoYXBllCmMBWR0eXBllIwFbnVtcHmUaAeTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYowKX25wX3JhbmRvbZROdWIu", "n": 4, "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 16, "num_timesteps": 507904, "_total_timesteps": 500000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1652084949.9720929, "learning_rate": 0.0003, "tensorboard_log": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": 
"gAWVvwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwNX2J1aWx0aW5fdHlwZZSTlIwKTGFtYmRhVHlwZZSFlFKUKGgCjAhDb2RlVHlwZZSFlFKUKEsBSwBLAUsBSxNDBIgAUwCUToWUKYwBX5SFlIxIL3Vzci9sb2NhbC9saWIvcHl0aG9uMy43L2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5RLgEMCAAGUjAN2YWyUhZQpdJRSlH2UKIwLX19wYWNrYWdlX1+UjBhzdGFibGVfYmFzZWxpbmVzMy5jb21tb26UjAhfX25hbWVfX5SMHnN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi51dGlsc5SMCF9fZmlsZV9flIxIL3Vzci9sb2NhbC9saWIvcHl0aG9uMy43L2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaCB9lH2UKGgXaA6MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgYjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz8zqSowVTJhhZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAGZWyzqPzgW6YbqiOrxrgLPGCpo6xrS+uQAAgD8AAIA/ANqVvFxPSTmuuO87m5K6tv79ATv6Urm1AACAPwAAgD/mAwu99qQ0uh38oDs179M3WyqROhr33bQAAIA/AACAP51mgj60+0G9zp3xul8KyTmYQ6m+gzQuOgAAgD8AAIA/mpUGvvaXEzsO7us79/8juo7y1rxmuRQ7AACAPwAAgD+NL5c9FEieugPId7tVoi04ivneOnHKADcAAIA/AACAP2ZdQT2uoai649A/O7m6GjhqZ5M6AJ3ZNQAAgD8AAIA/Zhe/PcqNHz94w3i95RlhvsZ/7zwzgg+7AAAAAAAAAABe8o2+b/+MPwqsxL2qvK2+UWSfvkEysj0AAAAAAAAAAE1ZDD0pSCy6BlbevP/UsjVyH+I6elEmtQAAgD8AAIA/LgyAvsqfIjxe/FK6cbMxONFPrb2yanY5AACAPwAAgD9aOqa9wzVRuljkervrrJg4X3Dxuon1wTkAAIA/AACAP8bbab40hvU9DCI0vfo44L15L8C8+c+SvQAAAAAAAAAAJmxHPrz4SD1KokO9/uVSvuln5jznvre8AAAAAAAAAAAm2Bi+hfmNu0DypTo/lDw3zw24PLZzwLkAAIA/AACAP81qDjz2bAa6q9Xvujf1LjcBwUm6E0SZtgAAgD8AAIA/lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": 
"gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.015808000000000044, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVfxAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIyY/4FWunVUCUhpRSlIwBbJRN6AOMAXSUR0CnVg+i8FpxdX2UKGgGaAloD0MIMrCO4wd8YUCUhpRSlGgVTegDaBZHQKdXXWEK3NN1fZQoaAZoCWgPQwitpBXfUOZeQJSGlFKUaBVN6ANoFkdAp1k2tOmBOHV9lChoBmgJaA9DCNEjRs8twlxAlIaUUpRoFU3oA2gWR0CnWgvgNwzddX2UKGgGaAloD0MIuhXCaix8X0CUhpRSlGgVTegDaBZHQKda8ZG8VYZ1fZQoaAZoCWgPQwgw2A3bFq5hQJSGlFKUaBVN6ANoFkdAp1tI0Kqn33V9lChoBmgJaA9DCDjAzHdwLWFAlIaUUpRoFU3oA2gWR0CnXIKjSG8FdX2UKGgGaAloD0MI/U/+7p18Y0CUhpRSlGgVTegDaBZHQKdhxTcZccF1fZQoaAZoCWgPQwiiYTHqWrszQJSGlFKUaBVL7WgWR0CnYzYc/+sHdX2UKGgGaAloD0MItaUO8noYZUCUhpRSlGgVTegDaBZHQKdnMU5dWyV1fZQoaAZoCWgPQwieRe9UwPdXQJSGlFKUaBVN6ANoFkdAp3AjgXMyJ3V9lChoBmgJaA9DCFhyFYvfiGJAlIaUUpRoFU3oA2gWR0CnmnP+4smOdX2UKGgGaAloD0MIowc+BiuwYkCUhpRSlGgVTegDaBZHQKedeHpr1ul1fZQoaAZoCWgPQwhoyk4/KKFiQJSGlFKUaBVN6ANoFkdAp563Xf642HV9lChoBmgJaA9DCByygXSx5GNAlIaUUpRoFU3oA2gWR0CnobrXlKbsdX2UKGgGaAloD0MICrq9pDF4XUCUhpRSlGgVTegDaBZHQKeh2qvNeMR1fZQoaAZoCWgPQwj3V4/7Vr1iQJSGlFKUaBVN6ANoFkdAp6I8o4MnZ3V9lChoBmgJaA9DCF7zqs5qfVdAlIaUUpRoFU3oA2gWR0Cnos64UeuFdX2UKGgGaAloD0MID3wMVhyHY0CUhpRSlGgVTegDaBZHQKekPIvrWy11fZQoaAZoCWgPQwh7FoTyPnVaQJSGlFKUaBVN6ANoFkdAp6YdVDKHPHV9lChoBmgJaA9DCB8tzhjmmF5AlIaUUpRoFU3oA2gWR0CnpvggX/HYdX2UKGgGaAloD0MI8UknEkzpTUCUhpRSlGgVTegDaBZHQKenzcTrVvx1fZQoaAZoCWgPQwhjm1Q01r75v5SGlFKUaBVL8WgWR0CnqDhgVoHtdX2UKGgGaAloD0MIPIcyVEUbYUCUhpRSlGgVTegDaBZHQKepYUMXrMV1fZQoaAZoCWgPQwh4l4v4TlZbQJSGlFKUaBVN6ANoFkdAp66vDFZPmHV9lChoBmgJaA9DCB77WSxFUFRAlIaUUpRoFU3oA2gW
R0CnsAVaOgg6dX2UKGgGaAloD0MIMxXikfhZYUCUhpRSlGgVTegDaBZHQKezjYjjaPF1fZQoaAZoCWgPQwi8df7tsp/2P5SGlFKUaBVNNAFoFkdAp7QztG/etXV9lChoBmgJaA9DCI3TEFX4ZzFAlIaUUpRoFU0EAWgWR0Cnugn7gsK9dX2UKGgGaAloD0MIrTB9ryEMW0CUhpRSlGgVTegDaBZHQKe7DrD63y91fZQoaAZoCWgPQwj8xteeWbIOQJSGlFKUaBVNJgFoFkdAp798jmjj73V9lChoBmgJaA9DCEpiSbl7GmJAlIaUUpRoFU3oA2gWR0Cn5Aepn6EbdX2UKGgGaAloD0MI2nQEcLMbXUCUhpRSlGgVTegDaBZHQKfmpu4PPLR1fZQoaAZoCWgPQwhoz2VqEvVbQJSGlFKUaBVN6ANoFkdAp+p5P/JeV3V9lChoBmgJaA9DCFKBk21gIWNAlIaUUpRoFU3oA2gWR0Cn6pSNOuaGdX2UKGgGaAloD0MIF35wPnUjXECUhpRSlGgVTegDaBZHQKfq8VEd/8V1fZQoaAZoCWgPQwi8W1mis8hcQJSGlFKUaBVN6ANoFkdAp+t9f3N9pnV9lChoBmgJaA9DCGADIsQV2mJAlIaUUpRoFU3oA2gWR0Cn7NJQ+EAYdX2UKGgGaAloD0MIH/MBgc54XUCUhpRSlGgVTegDaBZHQKfurzBAOax1fZQoaAZoCWgPQwglsDkHz/FcQJSGlFKUaBVN6ANoFkdAp++Zw6ySm3V9lChoBmgJaA9DCK4oJQSr/11AlIaUUpRoFU3oA2gWR0Cn8IHskY4ydX2UKGgGaAloD0MIB5W4jnEqXkCUhpRSlGgVTegDaBZHQKfw6QlruYx1fZQoaAZoCWgPQwizfF2G/xJEwJSGlFKUaBVNIwFoFkdAp/G1AE+xGHV9lChoBmgJaA9DCAVu3c1TBF5AlIaUUpRoFU3oA2gWR0Cn99+N96TodX2UKGgGaAloD0MIUOPe/Ia5YkCUhpRSlGgVTegDaBZHQKf+Uv2Xb/R1fZQoaAZoCWgPQwj12mysRAhiQJSGlFKUaBVN6ANoFkdAqAU32RJVbXV9lChoBmgJaA9DCDpAMEePElJAlIaUUpRoFU3oA2gWR0CoBlFfqoqDdX2UKGgGaAloD0MIraOqCaLSV0CUhpRSlGgVTegDaBZHQKgLAp8WsRx1fZQoaAZoCWgPQwihuyTOivteQJSGlFKUaBVN6ANoFkdAqA0/5k9U0nV9lChoBmgJaA9DCL0BZr4DSWRAlIaUUpRoFU3oA2gWR0CoNaz9KmKqdX2UKGgGaAloD0MIehhanZxcXUCUhpRSlGgVTegDaBZHQKg1xgeii7F1fZQoaAZoCWgPQwghQIaOnUdkQJSGlFKUaBVN6ANoFkdAqDYgKUmlZXV9lChoBmgJaA9DCIwtBDko+lhAlIaUUpRoFU3oA2gWR0CoNqgDifg8dX2UKGgGaAloD0MIw7zHmSZqWkCUhpRSlGgVTegDaBZHQKg4EPqcEvF1fZQoaAZoCWgPQwjG+ZtQiG5hQJSGlFKUaBVN6ANoFkdAqDnbNyHVPXV9lChoBmgJaA9DCO7rwDkjWl9AlIaUUpRoFU3oA2gWR0CoOq8B+4LDdX2UKGgGaAloD0MIHsTOFDqyX0CUhpRSlGgVTegDaBZHQKg7ll8w5/91fZQoaAZoCWgPQwiGjh1U4gxhQJSGlFKUaBVN6ANoFkdAqDwAVh1DB3V9lChoBmgJaA9DCNgqweJwImZAlIaUUpRoFU3oA2gWR0CoPLz8pCrtdX2UKGgGaAloD0MIhH8RNGZCTUCUhpRSlGgVTRoBaBZHQKg/EF8ohIR1fZQoaAZoCWgPQwhZMzLIXYJaQJSGlFKUaBVN6ANoFkdAqEIpRsMy8HV9lChoBmgJaA9DCCEgX0IFZylAlIaUUpRoFU0nAWgWR0CoRULRBu4xdX2UKGgGaAloD0MIc6Hy
r+XlX0CUhpRSlGgVTegDaBZHQKhH67aIval1fZQoaAZoCWgPQwj4/DBCeJldQJSGlFKUaBVN6ANoFkdAqE5ZrLyMDXV9lChoBmgJaA9DCMP1KFyPRVhAlIaUUpRoFU3oA2gWR0CoT2pLVWjodX2UKGgGaAloD0MIXwmkxK4+XkCUhpRSlGgVTegDaBZHQKhUIPIXCTF1fZQoaAZoCWgPQwgE4+DSMR1kQJSGlFKUaBVN6ANoFkdAqFZotSQ5m3V9lChoBmgJaA9DCHFYGvhRvWFAlIaUUpRoFU3oA2gWR0CogEHq3VkMdX2UKGgGaAloD0MIEywOZ36kYUCUhpRSlGgVTegDaBZHQKiAsdZJTVF1fZQoaAZoCWgPQwjkTX6LTqxZQJSGlFKUaBVN6ANoFkdAqIFOMqBmPHV9lChoBmgJaA9DCJvkR/yKzWFAlIaUUpRoFU3oA2gWR0CogtIB7u2JdX2UKGgGaAloD0MIWvPjLy3DWUCUhpRSlGgVTegDaBZHQKiE7TfixV11fZQoaAZoCWgPQwgXEcXkjd5gQJSGlFKUaBVN6ANoFkdAqIXnA9FF2HV9lChoBmgJaA9DCEZCW84lMWFAlIaUUpRoFU3oA2gWR0Coh3NMPBi1dX2UKGgGaAloD0MIkrBvJ5FUYECUhpRSlGgVTegDaBZHQKiIbeqrBCV1fZQoaAZoCWgPQwi4eHjPgbNaQJSGlFKUaBVN6ANoFkdAqItza/RE4XV9lChoBmgJaA9DCLVOXI5X01hAlIaUUpRoFU3oA2gWR0Coj2azE74jdX2UKGgGaAloD0MIqyUd5eDUYkCUhpRSlGgVTegDaBZHQKiTJLmITGp1fZQoaAZoCWgPQwgt7j8ynX1iQJSGlFKUaBVN6ANoFkdAqJYyV4X403V9lChoBmgJaA9DCFPpJ5zdB2BAlIaUUpRoFU3oA2gWR0ConWCsOoYOdX2UKGgGaAloD0MI6gjgZvEQWkCUhpRSlGgVTegDaBZHQKiehpGnXNF1fZQoaAZoCWgPQwio4PCCiINdQJSGlFKUaBVN6ANoFkdAqKNicAimmHV9lChoBmgJaA9DCL3/jxMm7lxAlIaUUpRoFU3oA2gWR0CopaUWVNYbdX2UKGgGaAloD0MIBvTCnQtDYECUhpRSlGgVTegDaBZHQKjOuPp6hQF1fZQoaAZoCWgPQwhMjdDP1J5gQJSGlFKUaBVN6ANoFkdAqM8ewu/UOXV9lChoBmgJaA9DCM1aCkj7jWFAlIaUUpRoFU3oA2gWR0Coz7L92ovSdX2UKGgGaAloD0MImL7XEJzYYkCUhpRSlGgVTegDaBZHQKjRJkmQbMp1fZQoaAZoCWgPQwivIqMDEnFkQJSGlFKUaBVN6ANoFkdAqNMp0Syt3nV9lChoBmgJaA9DCE9Xdyy2dGFAlIaUUpRoFU3oA2gWR0Co1CdAxBVudX2UKGgGaAloD0MIBRVVv9ILY0CUhpRSlGgVTegDaBZHQKjVtZ8rqdJ1fZQoaAZoCWgPQwhDjUKS2ZdiQJSGlFKUaBVN6ANoFkdAqNam/rSmZXV9lChoBmgJaA9DCDc10HzOxFhAlIaUUpRoFU3oA2gWR0Co2YJpN9H+dX2UKGgGaAloD0MIGNALdy6AT0CUhpRSlGgVTREBaBZHQKjaFm7rcCZ1fZQoaAZoCWgPQwg9uhEWFd9SQJSGlFKUaBVN6ANoFkdAqN0NTxXnyXV9lChoBmgJaA9DCAHBHD1+Bl5AlIaUUpRoFU3oA2gWR0Co4IGvwEyMdX2UKGgGaAloD0MI4LvNG6dPYECUhpRSlGgVTegDaBZHQKjjexB3Roh1fZQoaAZoCWgPQwjAPc+ftiRgQJSGlFKUaBVN6ANoFkdAqOqhMDfWMHV9lChoBmgJaA9DCOARFaobZWNAlIaUUpRoFU3oA2gWR0Co68+1SflIdX2UKGgGaAloD0MIxJeJIqS3Y0CUhpRSlGgVTegDaBZHQKjwuWwe
Nkx1fZQoaAZoCWgPQwjEB3b8FyRhQJSGlFKUaBVN6ANoFkdAqPMXGEPDpHVlLg=="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 310, "n_steps": 1024, "gamma": 0.999, "gae_lambda": 0.98, "ent_coef": 0.01, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 10, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWVvwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwNX2J1aWx0aW5fdHlwZZSTlIwKTGFtYmRhVHlwZZSFlFKUKGgCjAhDb2RlVHlwZZSFlFKUKEsBSwBLAUsBSxNDBIgAUwCUToWUKYwBX5SFlIxIL3Vzci9sb2NhbC9saWIvcHl0aG9uMy43L2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5RLgEMCAAGUjAN2YWyUhZQpdJRSlH2UKIwLX19wYWNrYWdlX1+UjBhzdGFibGVfYmFzZWxpbmVzMy5jb21tb26UjAhfX25hbWVfX5SMHnN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi51dGlsc5SMCF9fZmlsZV9flIxIL3Vzci9sb2NhbC9saWIvcHl0aG9uMy43L2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaCB9lH2UKGgXaA6MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgYjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz/JmZmZmZmahZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "system_info": {"OS": "Linux-5.4.188+-x86_64-with-Ubuntu-18.04-bionic #1 SMP Sun Apr 24 10:03:06 PDT 2022", "Python": "3.7.13", "Stable-Baselines3": "1.5.0", "PyTorch": "1.11.0+cu113", "GPU Enabled": "True", "Numpy": "1.21.6", "Gym": "0.21.0"}}
 
1
+ {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param sde_net_arch: Network architecture for extracting features\n when using gSDE. If None, the latent features from the policy will be used.\n Pass an empty list to use the states as features.\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. 
In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7fafecdddef0>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7fafecdddf80>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7fafecde3050>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7fafecde30e0>", "_build": "<function ActorCriticPolicy._build at 0x7fafecde3170>", "forward": "<function ActorCriticPolicy.forward at 0x7fafecde3200>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7fafecde3290>", "_predict": "<function ActorCriticPolicy._predict at 0x7fafecde3320>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7fafecde33b0>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7fafecde3440>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7fafecde34d0>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc_data object at 0x7fafece1edb0>"}, "verbose": 1, "policy_kwargs": {}, "observation_space": {":type:": "<class 'gym.spaces.box.Box'>", ":serialized:": 
"gAWVnwEAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLCIWUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWIAAAAAAAAAAAAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/5RoCksIhZSMAUOUdJRSlIwEaGlnaJRoEiiWIAAAAAAAAAAAAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAf5RoCksIhZRoFXSUUpSMDWJvdW5kZWRfYmVsb3eUaBIolggAAAAAAAAAAAAAAAAAAACUaAeMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLCIWUaBV0lFKUjA1ib3VuZGVkX2Fib3ZllGgSKJYIAAAAAAAAAAAAAAAAAAAAlGghSwiFlGgVdJRSlIwKX25wX3JhbmRvbZROdWIu", "dtype": "float32", "_shape": [8], "low": "[-inf -inf -inf -inf -inf -inf -inf -inf]", "high": "[inf inf inf inf inf inf inf inf]", "bounded_below": "[False False False False False False False False]", "bounded_above": "[False False False False False False False False]", "_np_random": null}, "action_space": {":type:": "<class 'gym.spaces.discrete.Discrete'>", ":serialized:": "gAWVggAAAAAAAACME2d5bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpRLBIwGX3NoYXBllCmMBWR0eXBllIwFbnVtcHmUaAeTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYowKX25wX3JhbmRvbZROdWIu", "n": 4, "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 16, "num_timesteps": 1015808, "_total_timesteps": 1000000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1652091708.80915, "learning_rate": 0.0003, "tensorboard_log": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": 
"gAWVvwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwNX2J1aWx0aW5fdHlwZZSTlIwKTGFtYmRhVHlwZZSFlFKUKGgCjAhDb2RlVHlwZZSFlFKUKEsBSwBLAUsBSxNDBIgAUwCUToWUKYwBX5SFlIxIL3Vzci9sb2NhbC9saWIvcHl0aG9uMy43L2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5RLgEMCAAGUjAN2YWyUhZQpdJRSlH2UKIwLX19wYWNrYWdlX1+UjBhzdGFibGVfYmFzZWxpbmVzMy5jb21tb26UjAhfX25hbWVfX5SMHnN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi51dGlsc5SMCF9fZmlsZV9flIxIL3Vzci9sb2NhbC9saWIvcHl0aG9uMy43L2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaCB9lH2UKGgXaA6MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgYjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz8zqSowVTJhhZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAGZR6bwDsYg/QbShvXa4EL8Obpq9E9q1PAAAAAAAAAAAZraWu2TOsD0yiJ+9v1xhvrsXvbsGARq8AAAAAAAAAADNLYG8BY/QPtBTjby38a++/BKKvQZcLb0AAAAAAAAAAGZCwzt7np669JJJM9Vrqy/1W9M5TgO9swAAgD8AAIA/ZmzhPGY1wD8PuxA+LWc6u4R/3zz+zI89AAAAAAAAAAATJHs+xHSHPgNR/74c9bO+M3iFPMmQOb4AAAAAAAAAADP39TuuIYy6oL+yu/1bUTiKf2+6M87fNwAAAAAAAAAAZo+ivKQ1e7sNEoA8+fSVPOAzwbw+DIA9AACAPwAAgD8trkc+EIKBPrBJy75kgaC+e6oePBv2tr0AAAAAAAAAAK3KMT4Plsw+srnCvme2yb4bkpA7fw8qvgAAAAAAAAAAZraMPKToebtDWUg7UuaUPO+QmbxNnH49AACAPwAAgD8A4Bu7j850uo7wg7sMKc81hmpRu3svQLUAAAAAAAAAAJq3DTxccUa8NYGQPMkeADt4E6G9hp6SvQAAgD8AAIA/M3R6PdYofj8zWYO8YFsTv9Nxmz0dFJa9AAAAAAAAAAAbg9W+0/d7Py6YIbyeWPq+h84Iv05C0T0AAAAAAAAAAGaEKr32CHa6n3SmtmbTNrFgfwc7ioPFNQAAgD8AAIA/lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": 
"gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.015808000000000044, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIBAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIK6T8pBp3ckCUhpRSlIwBbJRL44wBdJRHQJrAG6oVEeB1fZQoaAZoCWgPQwiiJCTSds1yQJSGlFKUaBVL7WgWR0CawIY1YQrddX2UKGgGaAloD0MI/+kGCvy8cECUhpRSlGgVS8poFkdAmsCdHYpUgnV9lChoBmgJaA9DCIoEU80s1m1AlIaUUpRoFUvLaBZHQJrAzp1RtP51fZQoaAZoCWgPQwgNVMa/T/xyQJSGlFKUaBVLxWgWR0CawYK1G9YfdX2UKGgGaAloD0MIINEEipjxcECUhpRSlGgVS9VoFkdAmsGB+az/qHV9lChoBmgJaA9DCL4UHjT7N3BAlIaUUpRoFUvpaBZHQJrBt7+kxh51fZQoaAZoCWgPQwjT+IVX0pJwQJSGlFKUaBVLxWgWR0CawgSXt0FKdX2UKGgGaAloD0MIS1gbYydPcUCUhpRSlGgVS/doFkdAmsI0nw5NoXV9lChoBmgJaA9DCGtKsg7H1nNAlIaUUpRoFUvlaBZHQJrCVsEaESN1fZQoaAZoCWgPQwh8DcFxWUJwQJSGlFKUaBVL1GgWR0Caw01IRRMwdX2UKGgGaAloD0MITaPJxRiPcUCUhpRSlGgVS/doFkdAmsOEpy6tknV9lChoBmgJaA9DCHcRpihXpXJAlIaUUpRoFUvhaBZHQJrD7KYAsCl1fZQoaAZoCWgPQwhB8s6hzDFyQJSGlFKUaBVL52gWR0CaxHbBGhEjdX2UKGgGaAloD0MI14aKcX4Kc0CUhpRSlGgVS85oFkdAmsSQSrYGuHV9lChoBmgJaA9DCOQSRx4Iu29AlIaUUpRoFUvQaBZHQJrGSzUqhDh1fZQoaAZoCWgPQwihhJm2f2pyQJSGlFKUaBVL0mgWR0CaxnSQo1DTdX2UKGgGaAloD0MI2J3uPDF3c0CUhpRSlGgVS/VoFkdAmsaZeVs1sXV9lChoBmgJaA9DCA7z5QXYkHNAlIaUUpRoFUv5aBZHQJrHKhHskY51fZQoaAZoCWgPQwi28/3UuGRyQJSGlFKUaBVL1GgWR0Cax6u0TlDGdX2UKGgGaAloD0MIpwUv+sq1cUCUhpRSlGgVS/FoFkdAmshJ3PiT+3V9lChoBmgJaA9DCPBRf71C1G1AlIaUUpRoFUvaaBZHQJrIW6bvw3J1fZQoaAZoCWgPQwiIEi15vONuQJSGlFKUaBVL4mgWR0CayMCxeLNwdX2UKGgGaAloD0MISG3i5P7TckCUhpRSlGgVS/FoFkdAmsjXUH6dlXV9lChoBmgJaA9DCNgpVg0CNnBAlIaUUpRoFUvKaBZHQJrJzLyMDOl1fZQoaAZoCWgPQwitodRexNluQJSGlFKUaBVL42gWR0CayhNGEwnIdX2UKGgGaAloD0MItd5v
tCMuc0CUhpRSlGgVS/poFkdAmsp9v0h/zHV9lChoBmgJaA9DCPesa7TcZ3BAlIaUUpRoFUvgaBZHQJrLBuyeI2x1fZQoaAZoCWgPQwgjL2tigZBzQJSGlFKUaBVL4WgWR0Cayyh4MWoFdX2UKGgGaAloD0MIVS5U/jWncUCUhpRSlGgVS+hoFkdAms03jdYW+HV9lChoBmgJaA9DCA2qDU5Eu29AlIaUUpRoFUvKaBZHQJrNxa/yoXN1fZQoaAZoCWgPQwi1NSIYx75xQJSGlFKUaBVL9WgWR0Cazf8EV32VdX2UKGgGaAloD0MIE3zT9BnlcUCUhpRSlGgVS+VoFkdAms4Vl05lv3V9lChoBmgJaA9DCO9Z12i56nJAlIaUUpRoFUv+aBZHQJrOI4vN/vx1fZQoaAZoCWgPQwhPBkfJK5xtQJSGlFKUaBVL2WgWR0CbEIrwvxpddX2UKGgGaAloD0MIHjUmxJwBckCUhpRSlGgVS+hoFkdAmxD7qt5lfHV9lChoBmgJaA9DCOIFEalpK3JAlIaUUpRoFUvgaBZHQJsROzu4PPN1fZQoaAZoCWgPQwjPLt/6sCNzQJSGlFKUaBVL72gWR0CbEdGdqcmTdX2UKGgGaAloD0MI+aI9Xgh2cUCUhpRSlGgVS+hoFkdAmxK6JEYwZnV9lChoBmgJaA9DCDFfXoB9znBAlIaUUpRoFUvnaBZHQJsS/xy4nWt1fZQoaAZoCWgPQwiSByKLNMpyQJSGlFKUaBVL0GgWR0CbE282Jiy6dX2UKGgGaAloD0MI+BisOBWgckCUhpRSlGgVS/xoFkdAmxQgcYIjW3V9lChoBmgJaA9DCLGIYYfxUHJAlIaUUpRoFUvraBZHQJsUKTINmUZ1fZQoaAZoCWgPQwiTGW8rvVFtQJSGlFKUaBVLzGgWR0CbFWUKArhBdX2UKGgGaAloD0MILVxWYbO7cUCUhpRSlGgVS8hoFkdAmxXJJ5E+gXV9lChoBmgJaA9DCEloy7lUk3JAlIaUUpRoFUvMaBZHQJsWH71qWTp1fZQoaAZoCWgPQwgKFLGIYb5wQJSGlFKUaBVL5GgWR0CbFwIa99MLdX2UKGgGaAloD0MI0JuKVBhJbkCUhpRSlGgVS91oFkdAmxeyv5gw5HV9lChoBmgJaA9DCI4+5gMCfnNAlIaUUpRoFUvXaBZHQJsX6KFZgXx1fZQoaAZoCWgPQwhXeQJhp6BxQJSGlFKUaBVNAwFoFkdAmxf5Hy3CsXV9lChoBmgJaA9DCEPFOH/TcXJAlIaUUpRoFUveaBZHQJsY+OR1X/51fZQoaAZoCWgPQwguOllq/ZhwQJSGlFKUaBVL8mgWR0CbGQo7FKkEdX2UKGgGaAloD0MIKLUX0TZEc0CUhpRSlGgVS81oFkdAmxoBu0kWynV9lChoBmgJaA9DCGb35GGhcG9AlIaUUpRoFUvjaBZHQJsaQlAu7H11fZQoaAZoCWgPQwhh/DTuTSxzQJSGlFKUaBVL9WgWR0CbGpC3gDRudX2UKGgGaAloD0MIKbLWUOrZcECUhpRSlGgVTQUDaBZHQJsaotCiRGN1fZQoaAZoCWgPQwiiYweVuO9uQJSGlFKUaBVL0mgWR0CbGtHuJDVpdX2UKGgGaAloD0MI/RGGAQukcUCUhpRSlGgVS8BoFkdAmxtuIdlunHV9lChoBmgJaA9DCCb8Uj/vwHFAlIaUUpRoFUv0aBZHQJsbyXqqwQl1fZQoaAZoCWgPQwhioGtfwFhyQJSGlFKUaBVL42gWR0CbHR3dbgTAdX2UKGgGaAloD0MIB5s6j4qWc0CUhpRSlGgVS/ZoFkdAmx1iF49ovnV9lChoBmgJaA9DCPJh9rIt4HBAlIaUUpRoFUvRaBZHQJsdcv9LpRp1fZQoaAZoCWgPQwg7Vik90/lvQJSGlFKUaBVL4WgWR0CbHshYvFm4dX2UKGgGaAloD0MIcZAQ5YteckCUhpRSlGgVS8JoFkdA
mx7XjENvwXV9lChoBmgJaA9DCLMLBtccdnNAlIaUUpRoFUvoaBZHQJse8daMaS91fZQoaAZoCWgPQwj2lQfpKQl0QJSGlFKUaBVL82gWR0CbHxEA5q/NdX2UKGgGaAloD0MIuB6F6xFqcECUhpRSlGgVS+RoFkdAmx/JX6qKg3V9lChoBmgJaA9DCHTOT3Ecj2RAlIaUUpRoFU3oA2gWR0CbIJOZ9d/sdX2UKGgGaAloD0MIDd5X5cLccECUhpRSlGgVS+FoFkdAmyCqaTfR/nV9lChoBmgJaA9DCK2JBb7i13JAlIaUUpRoFUvlaBZHQJshbIT4+KV1fZQoaAZoCWgPQwjXFwltOVpzQJSGlFKUaBVL5mgWR0CbIa+HJtBOdX2UKGgGaAloD0MIfJi9bPsScECUhpRSlGgVS/5oFkdAmyHWitaIN3V9lChoBmgJaA9DCJl+iXhr93FAlIaUUpRoFUvnaBZHQJsiU25xzaN1fZQoaAZoCWgPQwgrFyr/2lpyQJSGlFKUaBVL6GgWR0CbIriV0Lc9dX2UKGgGaAloD0MIA7LXu38Rc0CUhpRSlGgVS8VoFkdAmyM5OSGJvnV9lChoBmgJaA9DCC6NX3glzHJAlIaUUpRoFUvkaBZHQJsj586V+ql1fZQoaAZoCWgPQwjR60/is2lwQJSGlFKUaBVL2WgWR0CbI+PyCnP3dX2UKGgGaAloD0MId4apLTX3cECUhpRSlGgVS9doFkdAmyVDcM3IdXV9lChoBmgJaA9DCDhIiPKFBnJAlIaUUpRoFUvuaBZHQJsmIXenAIp1fZQoaAZoCWgPQwjaOGItfmdzQJSGlFKUaBVL7mgWR0CbJmfra/RFdX2UKGgGaAloD0MIIZIhx1Y9b0CUhpRSlGgVS9doFkdAmyZyU5dWyXV9lChoBmgJaA9DCH+8V62M5HFAlIaUUpRoFUv7aBZHQJsmsgjhUBJ1fZQoaAZoCWgPQwjqeqLrgjRwQJSGlFKUaBVL22gWR0CbJ4OxjawmdX2UKGgGaAloD0MIqi11kNe5cUCUhpRSlGgVS+doFkdAmyfNGus90XV9lChoBmgJaA9DCCtqMA1DtG9AlIaUUpRoFUvYaBZHQJsok/QjUut1fZQoaAZoCWgPQwiYMnBAS41vQJSGlFKUaBVL9mgWR0CbKSeqaPS2dX2UKGgGaAloD0MIy/W2mQq+cECUhpRSlGgVS/JoFkdAmylKGxlg+nV9lChoBmgJaA9DCGJqSx1ky3JAlIaUUpRoFUvZaBZHQJspruKGcnV1fZQoaAZoCWgPQwj60AX1LdByQJSGlFKUaBVL9GgWR0CbKg/qxC6ZdX2UKGgGaAloD0MIdO/hkmPXc0CUhpRSlGgVS9hoFkdAmyouY2Kl6HV9lChoBmgJaA9DCPxtT5AY6nBAlIaUUpRoFUvjaBZHQJsrKa4MF2V1fZQoaAZoCWgPQwjrAl5mGFBzQJSGlFKUaBVL5GgWR0CbKy2TPjXGdX2UKGgGaAloD0MI8NqlDQclc0CUhpRSlGgVS91oFkdAmyxEMCtA9nV9lChoBmgJaA9DCJfhP91AIW9AlIaUUpRoFUvEaBZHQJssh9jPOY91fZQoaAZoCWgPQwge3J21myZzQJSGlFKUaBVLzmgWR0CbLJBzFMqSdX2UKGgGaAloD0MIqUwxBwGJcECUhpRSlGgVS8ZoFkdAmyzOtGNJe3V9lChoBmgJaA9DCFA1ejVAGnJAlIaUUpRoFUvpaBZHQJstmPbO/tZ1fZQoaAZoCWgPQwhsPUM4ZvFxQJSGlFKUaBVLyGgWR0CbLewVCXyBdX2UKGgGaAloD0MIjZYDPZRlcUCUhpRSlGgVS/hoFkdAmy8V7IDHO3V9lChoBmgJaA9DCEw0SMFTznBAlIaUUpRoFUvMaBZHQJsvSvECNjt1ZS4="}, "ep_success_buffer": {":type:": "<class 
'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 620, "n_steps": 1024, "gamma": 0.999, "gae_lambda": 0.98, "ent_coef": 0.01, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 10, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWVvwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwNX2J1aWx0aW5fdHlwZZSTlIwKTGFtYmRhVHlwZZSFlFKUKGgCjAhDb2RlVHlwZZSFlFKUKEsBSwBLAUsBSxNDBIgAUwCUToWUKYwBX5SFlIxIL3Vzci9sb2NhbC9saWIvcHl0aG9uMy43L2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5RLgEMCAAGUjAN2YWyUhZQpdJRSlH2UKIwLX19wYWNrYWdlX1+UjBhzdGFibGVfYmFzZWxpbmVzMy5jb21tb26UjAhfX25hbWVfX5SMHnN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi51dGlsc5SMCF9fZmlsZV9flIxIL3Vzci9sb2NhbC9saWIvcHl0aG9uMy43L2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaCB9lH2UKGgXaA6MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgYjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz/JmZmZmZmahZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "system_info": {"OS": "Linux-5.4.188+-x86_64-with-Ubuntu-18.04-bionic #1 SMP Sun Apr 24 10:03:06 PDT 2022", "Python": "3.7.13", "Stable-Baselines3": "1.5.0", "PyTorch": "1.11.0+cu113", "GPU Enabled": "True", "Numpy": "1.21.6", "Gym": "0.21.0"}}
ppo-LunarLander-v2.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:15a50aa005a95c06274ba158d46be2978789aa6c00869b3d3afe7d79d600cedb
3
- size 144113
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a6b2af6a12a7aff24a4780113edf9029ad03d17db445c4062131a7808c0d3671
3
+ size 143985
ppo-LunarLander-v2/data CHANGED
@@ -4,19 +4,19 @@
4
  ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
5
  "__module__": "stable_baselines3.common.policies",
6
  "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param sde_net_arch: Network architecture for extracting features\n when using gSDE. If None, the latent features from the policy will be used.\n Pass an empty list to use the states as features.\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
7
- "__init__": "<function ActorCriticPolicy.__init__ at 0x7f7629c25ef0>",
8
- "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f7629c25f80>",
9
- "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f7629c2b050>",
10
- "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f7629c2b0e0>",
11
- "_build": "<function ActorCriticPolicy._build at 0x7f7629c2b170>",
12
- "forward": "<function ActorCriticPolicy.forward at 0x7f7629c2b200>",
13
- "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f7629c2b290>",
14
- "_predict": "<function ActorCriticPolicy._predict at 0x7f7629c2b320>",
15
- "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f7629c2b3b0>",
16
- "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f7629c2b440>",
17
- "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f7629c2b4d0>",
18
  "__abstractmethods__": "frozenset()",
19
- "_abc_impl": "<_abc_data object at 0x7f7629c75a50>"
20
  },
21
  "verbose": 1,
22
  "policy_kwargs": {},
@@ -42,12 +42,12 @@
42
  "_np_random": null
43
  },
44
  "n_envs": 16,
45
- "num_timesteps": 507904,
46
- "_total_timesteps": 500000,
47
  "_num_timesteps_at_start": 0,
48
  "seed": null,
49
  "action_noise": null,
50
- "start_time": 1652084949.9720929,
51
  "learning_rate": 0.0003,
52
  "tensorboard_log": null,
53
  "lr_schedule": {
@@ -56,7 +56,7 @@
56
  },
57
  "_last_obs": {
58
  ":type:": "<class 'numpy.ndarray'>",
59
- ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAGZWyzqPzgW6YbqiOrxrgLPGCpo6xrS+uQAAgD8AAIA/ANqVvFxPSTmuuO87m5K6tv79ATv6Urm1AACAPwAAgD/mAwu99qQ0uh38oDs179M3WyqROhr33bQAAIA/AACAP51mgj60+0G9zp3xul8KyTmYQ6m+gzQuOgAAgD8AAIA/mpUGvvaXEzsO7us79/8juo7y1rxmuRQ7AACAPwAAgD+NL5c9FEieugPId7tVoi04ivneOnHKADcAAIA/AACAP2ZdQT2uoai649A/O7m6GjhqZ5M6AJ3ZNQAAgD8AAIA/Zhe/PcqNHz94w3i95RlhvsZ/7zwzgg+7AAAAAAAAAABe8o2+b/+MPwqsxL2qvK2+UWSfvkEysj0AAAAAAAAAAE1ZDD0pSCy6BlbevP/UsjVyH+I6elEmtQAAgD8AAIA/LgyAvsqfIjxe/FK6cbMxONFPrb2yanY5AACAPwAAgD9aOqa9wzVRuljkervrrJg4X3Dxuon1wTkAAIA/AACAP8bbab40hvU9DCI0vfo44L15L8C8+c+SvQAAAAAAAAAAJmxHPrz4SD1KokO9/uVSvuln5jznvre8AAAAAAAAAAAm2Bi+hfmNu0DypTo/lDw3zw24PLZzwLkAAIA/AACAP81qDjz2bAa6q9Xvujf1LjcBwUm6E0SZtgAAgD8AAIA/lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="
60
  },
61
  "_last_episode_starts": {
62
  ":type:": "<class 'numpy.ndarray'>",
@@ -69,13 +69,13 @@
69
  "_current_progress_remaining": -0.015808000000000044,
70
  "ep_info_buffer": {
71
  ":type:": "<class 'collections.deque'>",
72
- ":serialized:": "gAWVfxAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIyY/4FWunVUCUhpRSlIwBbJRN6AOMAXSUR0CnVg+i8FpxdX2UKGgGaAloD0MIMrCO4wd8YUCUhpRSlGgVTegDaBZHQKdXXWEK3NN1fZQoaAZoCWgPQwitpBXfUOZeQJSGlFKUaBVN6ANoFkdAp1k2tOmBOHV9lChoBmgJaA9DCNEjRs8twlxAlIaUUpRoFU3oA2gWR0CnWgvgNwzddX2UKGgGaAloD0MIuhXCaix8X0CUhpRSlGgVTegDaBZHQKda8ZG8VYZ1fZQoaAZoCWgPQwgw2A3bFq5hQJSGlFKUaBVN6ANoFkdAp1tI0Kqn33V9lChoBmgJaA9DCDjAzHdwLWFAlIaUUpRoFU3oA2gWR0CnXIKjSG8FdX2UKGgGaAloD0MI/U/+7p18Y0CUhpRSlGgVTegDaBZHQKdhxTcZccF1fZQoaAZoCWgPQwiiYTHqWrszQJSGlFKUaBVL7WgWR0CnYzYc/+sHdX2UKGgGaAloD0MItaUO8noYZUCUhpRSlGgVTegDaBZHQKdnMU5dWyV1fZQoaAZoCWgPQwieRe9UwPdXQJSGlFKUaBVN6ANoFkdAp3AjgXMyJ3V9lChoBmgJaA9DCFhyFYvfiGJAlIaUUpRoFU3oA2gWR0CnmnP+4smOdX2UKGgGaAloD0MIowc+BiuwYkCUhpRSlGgVTegDaBZHQKedeHpr1ul1fZQoaAZoCWgPQwhoyk4/KKFiQJSGlFKUaBVN6ANoFkdAp563Xf642HV9lChoBmgJaA9DCByygXSx5GNAlIaUUpRoFU3oA2gWR0CnobrXlKbsdX2UKGgGaAloD0MICrq9pDF4XUCUhpRSlGgVTegDaBZHQKeh2qvNeMR1fZQoaAZoCWgPQwj3V4/7Vr1iQJSGlFKUaBVN6ANoFkdAp6I8o4MnZ3V9lChoBmgJaA9DCF7zqs5qfVdAlIaUUpRoFU3oA2gWR0Cnos64UeuFdX2UKGgGaAloD0MID3wMVhyHY0CUhpRSlGgVTegDaBZHQKekPIvrWy11fZQoaAZoCWgPQwh7FoTyPnVaQJSGlFKUaBVN6ANoFkdAp6YdVDKHPHV9lChoBmgJaA9DCB8tzhjmmF5AlIaUUpRoFU3oA2gWR0CnpvggX/HYdX2UKGgGaAloD0MI8UknEkzpTUCUhpRSlGgVTegDaBZHQKenzcTrVvx1fZQoaAZoCWgPQwhjm1Q01r75v5SGlFKUaBVL8WgWR0CnqDhgVoHtdX2UKGgGaAloD0MIPIcyVEUbYUCUhpRSlGgVTegDaBZHQKepYUMXrMV1fZQoaAZoCWgPQwh4l4v4TlZbQJSGlFKUaBVN6ANoFkdAp66vDFZPmHV9lChoBmgJaA9DCB77WSxFUFRAlIaUUpRoFU3oA2gWR0CnsAVaOgg6dX2UKGgGaAloD0MIMxXikfhZYUCUhpRSlGgVTegDaBZHQKezjYjjaPF1fZQoaAZoCWgPQwi8df7tsp/2P5SGlFKUaBVNNAFoFkdAp7QztG/etXV9lChoBmgJaA9DCI3TEFX4ZzFAlIaUUpRoFU0EAWgWR0Cnugn7gsK9dX2UKGgGaAloD0MIrTB9ryEMW0CUhpRSlGgVTegDaBZHQKe7DrD63y91fZQoaAZoCWgPQwj8xteeWbIOQJSGlFKUaBVNJgFoFkdAp798jmjj73V9lChoBmgJaA9DCEpiSbl7GmJAlIaUUpRoFU3oA2gWR0Cn5Aepn6EbdX2UKGgGaAloD0MI2nQEcLMbXUCUhpRSlGgVTegDaBZHQKfmpu4PPLR1f
ZQoaAZoCWgPQwhoz2VqEvVbQJSGlFKUaBVN6ANoFkdAp+p5P/JeV3V9lChoBmgJaA9DCFKBk21gIWNAlIaUUpRoFU3oA2gWR0Cn6pSNOuaGdX2UKGgGaAloD0MIF35wPnUjXECUhpRSlGgVTegDaBZHQKfq8VEd/8V1fZQoaAZoCWgPQwi8W1mis8hcQJSGlFKUaBVN6ANoFkdAp+t9f3N9pnV9lChoBmgJaA9DCGADIsQV2mJAlIaUUpRoFU3oA2gWR0Cn7NJQ+EAYdX2UKGgGaAloD0MIH/MBgc54XUCUhpRSlGgVTegDaBZHQKfurzBAOax1fZQoaAZoCWgPQwglsDkHz/FcQJSGlFKUaBVN6ANoFkdAp++Zw6ySm3V9lChoBmgJaA9DCK4oJQSr/11AlIaUUpRoFU3oA2gWR0Cn8IHskY4ydX2UKGgGaAloD0MIB5W4jnEqXkCUhpRSlGgVTegDaBZHQKfw6QlruYx1fZQoaAZoCWgPQwizfF2G/xJEwJSGlFKUaBVNIwFoFkdAp/G1AE+xGHV9lChoBmgJaA9DCAVu3c1TBF5AlIaUUpRoFU3oA2gWR0Cn99+N96TodX2UKGgGaAloD0MIUOPe/Ia5YkCUhpRSlGgVTegDaBZHQKf+Uv2Xb/R1fZQoaAZoCWgPQwj12mysRAhiQJSGlFKUaBVN6ANoFkdAqAU32RJVbXV9lChoBmgJaA9DCDpAMEePElJAlIaUUpRoFU3oA2gWR0CoBlFfqoqDdX2UKGgGaAloD0MIraOqCaLSV0CUhpRSlGgVTegDaBZHQKgLAp8WsRx1fZQoaAZoCWgPQwihuyTOivteQJSGlFKUaBVN6ANoFkdAqA0/5k9U0nV9lChoBmgJaA9DCL0BZr4DSWRAlIaUUpRoFU3oA2gWR0CoNaz9KmKqdX2UKGgGaAloD0MIehhanZxcXUCUhpRSlGgVTegDaBZHQKg1xgeii7F1fZQoaAZoCWgPQwghQIaOnUdkQJSGlFKUaBVN6ANoFkdAqDYgKUmlZXV9lChoBmgJaA9DCIwtBDko+lhAlIaUUpRoFU3oA2gWR0CoNqgDifg8dX2UKGgGaAloD0MIw7zHmSZqWkCUhpRSlGgVTegDaBZHQKg4EPqcEvF1fZQoaAZoCWgPQwjG+ZtQiG5hQJSGlFKUaBVN6ANoFkdAqDnbNyHVPXV9lChoBmgJaA9DCO7rwDkjWl9AlIaUUpRoFU3oA2gWR0CoOq8B+4LDdX2UKGgGaAloD0MIHsTOFDqyX0CUhpRSlGgVTegDaBZHQKg7ll8w5/91fZQoaAZoCWgPQwiGjh1U4gxhQJSGlFKUaBVN6ANoFkdAqDwAVh1DB3V9lChoBmgJaA9DCNgqweJwImZAlIaUUpRoFU3oA2gWR0CoPLz8pCrtdX2UKGgGaAloD0MIhH8RNGZCTUCUhpRSlGgVTRoBaBZHQKg/EF8ohIR1fZQoaAZoCWgPQwhZMzLIXYJaQJSGlFKUaBVN6ANoFkdAqEIpRsMy8HV9lChoBmgJaA9DCCEgX0IFZylAlIaUUpRoFU0nAWgWR0CoRULRBu4xdX2UKGgGaAloD0MIc6Hyr+XlX0CUhpRSlGgVTegDaBZHQKhH67aIval1fZQoaAZoCWgPQwj4/DBCeJldQJSGlFKUaBVN6ANoFkdAqE5ZrLyMDXV9lChoBmgJaA9DCMP1KFyPRVhAlIaUUpRoFU3oA2gWR0CoT2pLVWjodX2UKGgGaAloD0MIXwmkxK4+XkCUhpRSlGgVTegDaBZHQKhUIPIXCTF1fZQoaAZoCWgPQwgE4+DSMR1kQJSGlFKUaBVN6ANoFkdAqFZotSQ5m3V9lChoBmgJaA9DCHFYGvhRvWFAlIaUUpRoFU3oA2gWR0CogEHq3VkMdX2UKGgGaAloD0MIEywOZ36kYUCUhpRSlGgVTegDaBZHQKiAsdZJTVF1fZQoaAZoCWgPQwjkTX6LTqxZQJSGlFKUa
BVN6ANoFkdAqIFOMqBmPHV9lChoBmgJaA9DCJvkR/yKzWFAlIaUUpRoFU3oA2gWR0CogtIB7u2JdX2UKGgGaAloD0MIWvPjLy3DWUCUhpRSlGgVTegDaBZHQKiE7TfixV11fZQoaAZoCWgPQwgXEcXkjd5gQJSGlFKUaBVN6ANoFkdAqIXnA9FF2HV9lChoBmgJaA9DCEZCW84lMWFAlIaUUpRoFU3oA2gWR0Coh3NMPBi1dX2UKGgGaAloD0MIkrBvJ5FUYECUhpRSlGgVTegDaBZHQKiIbeqrBCV1fZQoaAZoCWgPQwi4eHjPgbNaQJSGlFKUaBVN6ANoFkdAqItza/RE4XV9lChoBmgJaA9DCLVOXI5X01hAlIaUUpRoFU3oA2gWR0Coj2azE74jdX2UKGgGaAloD0MIqyUd5eDUYkCUhpRSlGgVTegDaBZHQKiTJLmITGp1fZQoaAZoCWgPQwgt7j8ynX1iQJSGlFKUaBVN6ANoFkdAqJYyV4X403V9lChoBmgJaA9DCFPpJ5zdB2BAlIaUUpRoFU3oA2gWR0ConWCsOoYOdX2UKGgGaAloD0MI6gjgZvEQWkCUhpRSlGgVTegDaBZHQKiehpGnXNF1fZQoaAZoCWgPQwio4PCCiINdQJSGlFKUaBVN6ANoFkdAqKNicAimmHV9lChoBmgJaA9DCL3/jxMm7lxAlIaUUpRoFU3oA2gWR0CopaUWVNYbdX2UKGgGaAloD0MIBvTCnQtDYECUhpRSlGgVTegDaBZHQKjOuPp6hQF1fZQoaAZoCWgPQwhMjdDP1J5gQJSGlFKUaBVN6ANoFkdAqM8ewu/UOXV9lChoBmgJaA9DCM1aCkj7jWFAlIaUUpRoFU3oA2gWR0Coz7L92ovSdX2UKGgGaAloD0MImL7XEJzYYkCUhpRSlGgVTegDaBZHQKjRJkmQbMp1fZQoaAZoCWgPQwivIqMDEnFkQJSGlFKUaBVN6ANoFkdAqNMp0Syt3nV9lChoBmgJaA9DCE9Xdyy2dGFAlIaUUpRoFU3oA2gWR0Co1CdAxBVudX2UKGgGaAloD0MIBRVVv9ILY0CUhpRSlGgVTegDaBZHQKjVtZ8rqdJ1fZQoaAZoCWgPQwhDjUKS2ZdiQJSGlFKUaBVN6ANoFkdAqNam/rSmZXV9lChoBmgJaA9DCDc10HzOxFhAlIaUUpRoFU3oA2gWR0Co2YJpN9H+dX2UKGgGaAloD0MIGNALdy6AT0CUhpRSlGgVTREBaBZHQKjaFm7rcCZ1fZQoaAZoCWgPQwg9uhEWFd9SQJSGlFKUaBVN6ANoFkdAqN0NTxXnyXV9lChoBmgJaA9DCAHBHD1+Bl5AlIaUUpRoFU3oA2gWR0Co4IGvwEyMdX2UKGgGaAloD0MI4LvNG6dPYECUhpRSlGgVTegDaBZHQKjjexB3Roh1fZQoaAZoCWgPQwjAPc+ftiRgQJSGlFKUaBVN6ANoFkdAqOqhMDfWMHV9lChoBmgJaA9DCOARFaobZWNAlIaUUpRoFU3oA2gWR0Co68+1SflIdX2UKGgGaAloD0MIxJeJIqS3Y0CUhpRSlGgVTegDaBZHQKjwuWweNkx1fZQoaAZoCWgPQwjEB3b8FyRhQJSGlFKUaBVN6ANoFkdAqPMXGEPDpHVlLg=="
73
  },
74
  "ep_success_buffer": {
75
  ":type:": "<class 'collections.deque'>",
76
  ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
77
  },
78
- "_n_updates": 310,
79
  "n_steps": 1024,
80
  "gamma": 0.999,
81
  "gae_lambda": 0.98,
 
4
  ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
5
  "__module__": "stable_baselines3.common.policies",
6
  "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param sde_net_arch: Network architecture for extracting features\n when using gSDE. If None, the latent features from the policy will be used.\n Pass an empty list to use the states as features.\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
7
+ "__init__": "<function ActorCriticPolicy.__init__ at 0x7fafecdddef0>",
8
+ "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7fafecdddf80>",
9
+ "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7fafecde3050>",
10
+ "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7fafecde30e0>",
11
+ "_build": "<function ActorCriticPolicy._build at 0x7fafecde3170>",
12
+ "forward": "<function ActorCriticPolicy.forward at 0x7fafecde3200>",
13
+ "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7fafecde3290>",
14
+ "_predict": "<function ActorCriticPolicy._predict at 0x7fafecde3320>",
15
+ "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7fafecde33b0>",
16
+ "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7fafecde3440>",
17
+ "predict_values": "<function ActorCriticPolicy.predict_values at 0x7fafecde34d0>",
18
  "__abstractmethods__": "frozenset()",
19
+ "_abc_impl": "<_abc_data object at 0x7fafece1edb0>"
20
  },
21
  "verbose": 1,
22
  "policy_kwargs": {},
 
42
  "_np_random": null
43
  },
44
  "n_envs": 16,
45
+ "num_timesteps": 1015808,
46
+ "_total_timesteps": 1000000,
47
  "_num_timesteps_at_start": 0,
48
  "seed": null,
49
  "action_noise": null,
50
+ "start_time": 1652091708.80915,
51
  "learning_rate": 0.0003,
52
  "tensorboard_log": null,
53
  "lr_schedule": {
 
56
  },
57
  "_last_obs": {
58
  ":type:": "<class 'numpy.ndarray'>",
59
+ ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAGZR6bwDsYg/QbShvXa4EL8Obpq9E9q1PAAAAAAAAAAAZraWu2TOsD0yiJ+9v1xhvrsXvbsGARq8AAAAAAAAAADNLYG8BY/QPtBTjby38a++/BKKvQZcLb0AAAAAAAAAAGZCwzt7np669JJJM9Vrqy/1W9M5TgO9swAAgD8AAIA/ZmzhPGY1wD8PuxA+LWc6u4R/3zz+zI89AAAAAAAAAAATJHs+xHSHPgNR/74c9bO+M3iFPMmQOb4AAAAAAAAAADP39TuuIYy6oL+yu/1bUTiKf2+6M87fNwAAAAAAAAAAZo+ivKQ1e7sNEoA8+fSVPOAzwbw+DIA9AACAPwAAgD8trkc+EIKBPrBJy75kgaC+e6oePBv2tr0AAAAAAAAAAK3KMT4Plsw+srnCvme2yb4bkpA7fw8qvgAAAAAAAAAAZraMPKToebtDWUg7UuaUPO+QmbxNnH49AACAPwAAgD8A4Bu7j850uo7wg7sMKc81hmpRu3svQLUAAAAAAAAAAJq3DTxccUa8NYGQPMkeADt4E6G9hp6SvQAAgD8AAIA/M3R6PdYofj8zWYO8YFsTv9Nxmz0dFJa9AAAAAAAAAAAbg9W+0/d7Py6YIbyeWPq+h84Iv05C0T0AAAAAAAAAAGaEKr32CHa6n3SmtmbTNrFgfwc7ioPFNQAAgD8AAIA/lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="
60
  },
61
  "_last_episode_starts": {
62
  ":type:": "<class 'numpy.ndarray'>",
 
69
  "_current_progress_remaining": -0.015808000000000044,
70
  "ep_info_buffer": {
71
  ":type:": "<class 'collections.deque'>",
72
+ ":serialized:": "gAWVIBAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIK6T8pBp3ckCUhpRSlIwBbJRL44wBdJRHQJrAG6oVEeB1fZQoaAZoCWgPQwiiJCTSds1yQJSGlFKUaBVL7WgWR0CawIY1YQrddX2UKGgGaAloD0MI/+kGCvy8cECUhpRSlGgVS8poFkdAmsCdHYpUgnV9lChoBmgJaA9DCIoEU80s1m1AlIaUUpRoFUvLaBZHQJrAzp1RtP51fZQoaAZoCWgPQwgNVMa/T/xyQJSGlFKUaBVLxWgWR0CawYK1G9YfdX2UKGgGaAloD0MIINEEipjxcECUhpRSlGgVS9VoFkdAmsGB+az/qHV9lChoBmgJaA9DCL4UHjT7N3BAlIaUUpRoFUvpaBZHQJrBt7+kxh51fZQoaAZoCWgPQwjT+IVX0pJwQJSGlFKUaBVLxWgWR0CawgSXt0FKdX2UKGgGaAloD0MIS1gbYydPcUCUhpRSlGgVS/doFkdAmsI0nw5NoXV9lChoBmgJaA9DCGtKsg7H1nNAlIaUUpRoFUvlaBZHQJrCVsEaESN1fZQoaAZoCWgPQwh8DcFxWUJwQJSGlFKUaBVL1GgWR0Caw01IRRMwdX2UKGgGaAloD0MITaPJxRiPcUCUhpRSlGgVS/doFkdAmsOEpy6tknV9lChoBmgJaA9DCHcRpihXpXJAlIaUUpRoFUvhaBZHQJrD7KYAsCl1fZQoaAZoCWgPQwhB8s6hzDFyQJSGlFKUaBVL52gWR0CaxHbBGhEjdX2UKGgGaAloD0MI14aKcX4Kc0CUhpRSlGgVS85oFkdAmsSQSrYGuHV9lChoBmgJaA9DCOQSRx4Iu29AlIaUUpRoFUvQaBZHQJrGSzUqhDh1fZQoaAZoCWgPQwihhJm2f2pyQJSGlFKUaBVL0mgWR0CaxnSQo1DTdX2UKGgGaAloD0MI2J3uPDF3c0CUhpRSlGgVS/VoFkdAmsaZeVs1sXV9lChoBmgJaA9DCA7z5QXYkHNAlIaUUpRoFUv5aBZHQJrHKhHskY51fZQoaAZoCWgPQwi28/3UuGRyQJSGlFKUaBVL1GgWR0Cax6u0TlDGdX2UKGgGaAloD0MIpwUv+sq1cUCUhpRSlGgVS/FoFkdAmshJ3PiT+3V9lChoBmgJaA9DCPBRf71C1G1AlIaUUpRoFUvaaBZHQJrIW6bvw3J1fZQoaAZoCWgPQwiIEi15vONuQJSGlFKUaBVL4mgWR0CayMCxeLNwdX2UKGgGaAloD0MISG3i5P7TckCUhpRSlGgVS/FoFkdAmsjXUH6dlXV9lChoBmgJaA9DCNgpVg0CNnBAlIaUUpRoFUvKaBZHQJrJzLyMDOl1fZQoaAZoCWgPQwitodRexNluQJSGlFKUaBVL42gWR0CayhNGEwnIdX2UKGgGaAloD0MItd5vtCMuc0CUhpRSlGgVS/poFkdAmsp9v0h/zHV9lChoBmgJaA9DCPesa7TcZ3BAlIaUUpRoFUvgaBZHQJrLBuyeI2x1fZQoaAZoCWgPQwgjL2tigZBzQJSGlFKUaBVL4WgWR0Cayyh4MWoFdX2UKGgGaAloD0MIVS5U/jWncUCUhpRSlGgVS+hoFkdAms03jdYW+HV9lChoBmgJaA9DCA2qDU5Eu29AlIaUUpRoFUvKaBZHQJrNxa/yoXN1fZQoaAZoCWgPQwi1NSIYx75xQJSGlFKUaBVL9WgWR0Cazf8EV32VdX2UKGgGaAloD0MIE3zT9BnlcUCUhpRSlGgVS+VoFkdAms4Vl05lv3V9lChoBmgJaA9DCO9Z12i56nJAlIaUUpRoFUv+aBZHQ
JrOI4vN/vx1fZQoaAZoCWgPQwhPBkfJK5xtQJSGlFKUaBVL2WgWR0CbEIrwvxpddX2UKGgGaAloD0MIHjUmxJwBckCUhpRSlGgVS+hoFkdAmxD7qt5lfHV9lChoBmgJaA9DCOIFEalpK3JAlIaUUpRoFUvgaBZHQJsROzu4PPN1fZQoaAZoCWgPQwjPLt/6sCNzQJSGlFKUaBVL72gWR0CbEdGdqcmTdX2UKGgGaAloD0MI+aI9Xgh2cUCUhpRSlGgVS+hoFkdAmxK6JEYwZnV9lChoBmgJaA9DCDFfXoB9znBAlIaUUpRoFUvnaBZHQJsS/xy4nWt1fZQoaAZoCWgPQwiSByKLNMpyQJSGlFKUaBVL0GgWR0CbE282Jiy6dX2UKGgGaAloD0MI+BisOBWgckCUhpRSlGgVS/xoFkdAmxQgcYIjW3V9lChoBmgJaA9DCLGIYYfxUHJAlIaUUpRoFUvraBZHQJsUKTINmUZ1fZQoaAZoCWgPQwiTGW8rvVFtQJSGlFKUaBVLzGgWR0CbFWUKArhBdX2UKGgGaAloD0MILVxWYbO7cUCUhpRSlGgVS8hoFkdAmxXJJ5E+gXV9lChoBmgJaA9DCEloy7lUk3JAlIaUUpRoFUvMaBZHQJsWH71qWTp1fZQoaAZoCWgPQwgKFLGIYb5wQJSGlFKUaBVL5GgWR0CbFwIa99MLdX2UKGgGaAloD0MI0JuKVBhJbkCUhpRSlGgVS91oFkdAmxeyv5gw5HV9lChoBmgJaA9DCI4+5gMCfnNAlIaUUpRoFUvXaBZHQJsX6KFZgXx1fZQoaAZoCWgPQwhXeQJhp6BxQJSGlFKUaBVNAwFoFkdAmxf5Hy3CsXV9lChoBmgJaA9DCEPFOH/TcXJAlIaUUpRoFUveaBZHQJsY+OR1X/51fZQoaAZoCWgPQwguOllq/ZhwQJSGlFKUaBVL8mgWR0CbGQo7FKkEdX2UKGgGaAloD0MIKLUX0TZEc0CUhpRSlGgVS81oFkdAmxoBu0kWynV9lChoBmgJaA9DCGb35GGhcG9AlIaUUpRoFUvjaBZHQJsaQlAu7H11fZQoaAZoCWgPQwhh/DTuTSxzQJSGlFKUaBVL9WgWR0CbGpC3gDRudX2UKGgGaAloD0MIKbLWUOrZcECUhpRSlGgVTQUDaBZHQJsaotCiRGN1fZQoaAZoCWgPQwiiYweVuO9uQJSGlFKUaBVL0mgWR0CbGtHuJDVpdX2UKGgGaAloD0MI/RGGAQukcUCUhpRSlGgVS8BoFkdAmxtuIdlunHV9lChoBmgJaA9DCCb8Uj/vwHFAlIaUUpRoFUv0aBZHQJsbyXqqwQl1fZQoaAZoCWgPQwhioGtfwFhyQJSGlFKUaBVL42gWR0CbHR3dbgTAdX2UKGgGaAloD0MIB5s6j4qWc0CUhpRSlGgVS/ZoFkdAmx1iF49ovnV9lChoBmgJaA9DCPJh9rIt4HBAlIaUUpRoFUvRaBZHQJsdcv9LpRp1fZQoaAZoCWgPQwg7Vik90/lvQJSGlFKUaBVL4WgWR0CbHshYvFm4dX2UKGgGaAloD0MIcZAQ5YteckCUhpRSlGgVS8JoFkdAmx7XjENvwXV9lChoBmgJaA9DCLMLBtccdnNAlIaUUpRoFUvoaBZHQJse8daMaS91fZQoaAZoCWgPQwj2lQfpKQl0QJSGlFKUaBVL82gWR0CbHxEA5q/NdX2UKGgGaAloD0MIuB6F6xFqcECUhpRSlGgVS+RoFkdAmx/JX6qKg3V9lChoBmgJaA9DCHTOT3Ecj2RAlIaUUpRoFU3oA2gWR0CbIJOZ9d/sdX2UKGgGaAloD0MIDd5X5cLccECUhpRSlGgVS+FoFkdAmyCqaTfR/nV9lChoBmgJaA9DCK2JBb7i13JAlIaUUpRoFUvlaBZHQJshbIT4+KV1fZQoaAZoCWgPQwjXFwltOVpzQJSGlFKUaBVL5mgWR0CbIa+HJtBOdX2UKGgGaAloD
0MIfJi9bPsScECUhpRSlGgVS/5oFkdAmyHWitaIN3V9lChoBmgJaA9DCJl+iXhr93FAlIaUUpRoFUvnaBZHQJsiU25xzaN1fZQoaAZoCWgPQwgrFyr/2lpyQJSGlFKUaBVL6GgWR0CbIriV0Lc9dX2UKGgGaAloD0MIA7LXu38Rc0CUhpRSlGgVS8VoFkdAmyM5OSGJvnV9lChoBmgJaA9DCC6NX3glzHJAlIaUUpRoFUvkaBZHQJsj586V+ql1fZQoaAZoCWgPQwjR60/is2lwQJSGlFKUaBVL2WgWR0CbI+PyCnP3dX2UKGgGaAloD0MId4apLTX3cECUhpRSlGgVS9doFkdAmyVDcM3IdXV9lChoBmgJaA9DCDhIiPKFBnJAlIaUUpRoFUvuaBZHQJsmIXenAIp1fZQoaAZoCWgPQwjaOGItfmdzQJSGlFKUaBVL7mgWR0CbJmfra/RFdX2UKGgGaAloD0MIIZIhx1Y9b0CUhpRSlGgVS9doFkdAmyZyU5dWyXV9lChoBmgJaA9DCH+8V62M5HFAlIaUUpRoFUv7aBZHQJsmsgjhUBJ1fZQoaAZoCWgPQwjqeqLrgjRwQJSGlFKUaBVL22gWR0CbJ4OxjawmdX2UKGgGaAloD0MIqi11kNe5cUCUhpRSlGgVS+doFkdAmyfNGus90XV9lChoBmgJaA9DCCtqMA1DtG9AlIaUUpRoFUvYaBZHQJsok/QjUut1fZQoaAZoCWgPQwiYMnBAS41vQJSGlFKUaBVL9mgWR0CbKSeqaPS2dX2UKGgGaAloD0MIy/W2mQq+cECUhpRSlGgVS/JoFkdAmylKGxlg+nV9lChoBmgJaA9DCGJqSx1ky3JAlIaUUpRoFUvZaBZHQJspruKGcnV1fZQoaAZoCWgPQwj60AX1LdByQJSGlFKUaBVL9GgWR0CbKg/qxC6ZdX2UKGgGaAloD0MIdO/hkmPXc0CUhpRSlGgVS9hoFkdAmyouY2Kl6HV9lChoBmgJaA9DCPxtT5AY6nBAlIaUUpRoFUvjaBZHQJsrKa4MF2V1fZQoaAZoCWgPQwjrAl5mGFBzQJSGlFKUaBVL5GgWR0CbKy2TPjXGdX2UKGgGaAloD0MI8NqlDQclc0CUhpRSlGgVS91oFkdAmyxEMCtA9nV9lChoBmgJaA9DCJfhP91AIW9AlIaUUpRoFUvEaBZHQJssh9jPOY91fZQoaAZoCWgPQwge3J21myZzQJSGlFKUaBVLzmgWR0CbLJBzFMqSdX2UKGgGaAloD0MIqUwxBwGJcECUhpRSlGgVS8ZoFkdAmyzOtGNJe3V9lChoBmgJaA9DCFA1ejVAGnJAlIaUUpRoFUvpaBZHQJstmPbO/tZ1fZQoaAZoCWgPQwhsPUM4ZvFxQJSGlFKUaBVLyGgWR0CbLewVCXyBdX2UKGgGaAloD0MIjZYDPZRlcUCUhpRSlGgVS/hoFkdAmy8V7IDHO3V9lChoBmgJaA9DCEw0SMFTznBAlIaUUpRoFUvMaBZHQJsvSvECNjt1ZS4="
73
  },
74
  "ep_success_buffer": {
75
  ":type:": "<class 'collections.deque'>",
76
  ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
77
  },
78
+ "_n_updates": 620,
79
  "n_steps": 1024,
80
  "gamma": 0.999,
81
  "gae_lambda": 0.98,
ppo-LunarLander-v2/policy.optimizer.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4c1a0ee456242548af650f4c380481f490d274f5e0e9a3bb080372668dd44a68
3
  size 84893
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:227e71d3af59b00017d0e0c3aa8b456d8a10b34ce3589c5c919904700023b8d8
3
  size 84893
ppo-LunarLander-v2/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:594bb7bd11046227d87d84415431b27965acff15f2ea737aeda545cdfb609b3a
3
  size 43201
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9a76deb6c59e187526ad25d474ff2073f7448b29e4d3ca642d9741f51b69d921
3
  size 43201
replay.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6c140b385d947094fa783dca2304ab77f318e85b06fadcccf70315fafb113685
3
- size 257238
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3625658eb71700c5e6b40d07af82deae2bbf1c4863fa36d9073c82d214604467
3
+ size 214752
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 230.33608992699777, "std_reward": 17.546111034331567, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2022-05-09T08:49:02.391081"}
 
1
+ {"mean_reward": 271.03430059217396, "std_reward": 12.912696775193375, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2022-05-09T10:53:10.731245"}