kws commited on
Commit
5f13406
1 Parent(s): b426f2b

600k steps trained. mean_reward= 209.20 +/- 39.6

Browse files
'LunarLander-ppo-500k.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2360b031a78869c408f6ec185c96d2d06a68d0d7b1e3bb4d810c9923f932797d
3
- size 144203
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:59d892c004f445cca00f89c95b90be667e35324c809881ca829d6ec72a67d70f
3
+ size 144222
'LunarLander-ppo-500k/data CHANGED
@@ -4,50 +4,50 @@
4
  ":serialized:": "gASVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
5
  "__module__": "stable_baselines3.common.policies",
6
  "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param sde_net_arch: Network architecture for extracting features\n when using gSDE. If None, the latent features from the policy will be used.\n Pass an empty list to use the states as features.\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
7
- "__init__": "<function ActorCriticPolicy.__init__ at 0x7f83faae7680>",
8
- "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f83faae7710>",
9
- "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f83faae77a0>",
10
- "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f83faae7830>",
11
- "_build": "<function ActorCriticPolicy._build at 0x7f83faae78c0>",
12
- "forward": "<function ActorCriticPolicy.forward at 0x7f83faae7950>",
13
- "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f83faae79e0>",
14
- "_predict": "<function ActorCriticPolicy._predict at 0x7f83faae7a70>",
15
- "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f83faae7b00>",
16
- "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f83faae7b90>",
17
- "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f83faae7c20>",
18
  "__abstractmethods__": "frozenset()",
19
- "_abc_impl": "<_abc_data object at 0x7f83fab39420>"
20
  },
21
  "verbose": 1,
22
  "policy_kwargs": {},
23
  "observation_space": {
24
  ":type:": "<class 'gym.spaces.box.Box'>",
25
- ":serialized:": "gASVwgEAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBXNoYXBllEsIhZSMA2xvd5SMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMDF9yZWNvbnN0cnVjdJSTlGgGjAduZGFycmF5lJOUSwCFlEMBYpSHlFKUKEsBSwiFlGgKiUMgAACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP+UdJRijARoaWdolGgSaBRLAIWUaBaHlFKUKEsBSwiFlGgKiUMgAACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH+UdJRijA1ib3VuZGVkX2JlbG93lGgSaBRLAIWUaBaHlFKUKEsBSwiFlGgHjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiiUMIAAAAAAAAAACUdJRijA1ib3VuZGVkX2Fib3ZllGgSaBRLAIWUaBaHlFKUKEsBSwiFlGgqiUMIAAAAAAAAAACUdJRijApfbnBfcmFuZG9tlE51Yi4=",
26
  "dtype": "float32",
27
- "shape": [
28
- 8
29
- ],
30
  "low": "[-inf -inf -inf -inf -inf -inf -inf -inf]",
31
  "high": "[inf inf inf inf inf inf inf inf]",
32
  "bounded_below": "[False False False False False False False False]",
33
  "bounded_above": "[False False False False False False False False]",
34
- "_np_random": null
 
 
 
35
  },
36
  "action_space": {
37
  ":type:": "<class 'gym.spaces.discrete.Discrete'>",
38
- ":serialized:": "gASVgQAAAAAAAACME2d5bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpRLBIwFc2hhcGWUKYwFZHR5cGWUjAVudW1weZRoB5OUjAJpOJSJiIeUUpQoSwOMATyUTk5OSv////9K/////0sAdJRijApfbnBfcmFuZG9tlE51Yi4=",
39
  "n": 4,
40
- "shape": [],
41
  "dtype": "int64",
42
- "_np_random": null
 
43
  },
44
  "n_envs": 16,
45
- "num_timesteps": 131072,
46
- "_total_timesteps": 100000,
47
  "_num_timesteps_at_start": 0,
48
  "seed": null,
49
  "action_noise": null,
50
- "start_time": 1657003619.1741638,
51
  "learning_rate": 0.0003,
52
  "tensorboard_log": null,
53
  "lr_schedule": {
@@ -56,7 +56,7 @@
56
  },
57
  "_last_obs": {
58
  ":type:": "<class 'numpy.ndarray'>",
59
- ":serialized:": "gASVjQIAAAAAAACMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMDF9yZWNvbnN0cnVjdJSTlIwFbnVtcHmUjAduZGFycmF5lJOUSwCFlEMBYpSHlFKUKEsBSxBLCIaUaAOMBWR0eXBllJOUjAJmNJSJiIeUUpQoSwOMATyUTk5OSv////9K/////0sAdJRiiUIAAgAAAJCSuw16tj/kBo+9LcMsPXHNUrz2U1m9AAAAAAAAAACAOo29yJGGP6RjA76Bn+i+zFugvQhaib0AAAAAAAAAADOIK717Vq26UnsAunV03bTTSIY65z8TOQAAgD8AAIA/zsgQP6+l+r0p/Zo9hf7BuoFR3b0Yo+E8AAAAAAAAgD+Adxe+RFIIP1TBGj3v4Iy+vCKtvHJ4zzwAAAAAAAAAAFqlOz5kHJE/Nv33Pt1P676RLDM+kTClPQAAAAAAAAAAw6ngvoJ/pz5O1+w9yQ+ivrm10bwRtom8AAAAAAAAAAAo7Ac/zQoNP1oonD0To4m+KEjRPUpjDrwAAAAAAAAAANDgCj/7M0c/rvs5Ptrps771fi4+EQsWugAAAAAAAAAAU4YwvocObj9K1Lm98DK6vuI95L1oML66AAAAAAAAAAA6x0Y/ze14vqBZ2DOqwQ4x9YPKvWZiKLQAAIA/AACAP+bCUb7WUVI/av4Lvrtpu7776ua97IAiPQAAAAAAAAAAgLUtvVsNcT+f1hE94GTjvrz5Ib0m0Pg8AAAAAAAAAAAmU30+KATZvCpC/jqq1yi5eEZBvtL8DLoAAIA/AACAP7PB6L1JkBc9EeKxPbWrSb5IT/W8hXRnPQAAAAAAAAAARU2Dvjs1irxWDRi7djo2uQMq/D1/IDU6AACAPwAAgD+UdJRiLg=="
60
  },
61
  "_last_episode_starts": {
62
  ":type:": "<class 'numpy.ndarray'>",
@@ -66,16 +66,16 @@
66
  "_episode_num": 0,
67
  "use_sde": false,
68
  "sde_sample_freq": -1,
69
- "_current_progress_remaining": -0.3107200000000001,
70
  "ep_info_buffer": {
71
  ":type:": "<class 'collections.deque'>",
72
- ":serialized:": "gASVeBAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIU3jQ7LqMcECUhpRSlIwBbJRNXwGMAXSUR0CaWeTPSlWPdX2UKGgGaAloD0MIaRoUzYPfa0CUhpRSlGgVTTABaBZHQJpaFuuRs/J1fZQoaAZoCWgPQwiMTSuFQHRaQJSGlFKUaBVN6ANoFkdAmlrufNA1N3V9lChoBmgJaA9DCBQGZRqNgHBAlIaUUpRoFU24AWgWR0CaXh5FPSDzdX2UKGgGaAloD0MIpg7yejDAbkCUhpRSlGgVTS4DaBZHQJpgyznied11fZQoaAZoCWgPQwjs20lE+AtYQJSGlFKUaBVN6ANoFkdAmmFCJO32EnV9lChoBmgJaA9DCKIIqdvZGHBAlIaUUpRoFU0FAWgWR0CaYiXbM5fddX2UKGgGaAloD0MIrDdqhSkqcMCUhpRSlGgVTZQCaBZHQJpi6r/82rJ1fZQoaAZoCWgPQwiDE9GvrZ+yP5SGlFKUaBVL22gWR0CaY9pXZGrkdX2UKGgGaAloD0MIkunQ6fkMbkCUhpRSlGgVTRcBaBZHQJpkEr4Fia11fZQoaAZoCWgPQwhiu3uAri1zQJSGlFKUaBVNhAFoFkdAmmQ7Ms6JZXV9lChoBmgJaA9DCETEzalknFNAlIaUUpRoFU3oA2gWR0CaZFK7qY7adX2UKGgGaAloD0MICI82jljLF8CUhpRSlGgVTb4CaBZHQJq/4f5k9U11fZQoaAZoCWgPQwhf8GlOHjRwQJSGlFKUaBVNKAFoFkdAmsBRzV+ZxHV9lChoBmgJaA9DCH0lkBK7/m9AlIaUUpRoFU1WAWgWR0CawhtVrAP/dX2UKGgGaAloD0MIBK3AkBX+cUCUhpRSlGgVTR4BaBZHQJrDJBrvb491fZQoaAZoCWgPQwjsGFdcnKJlwJSGlFKUaBVNlgFoFkdAmsUD6WPcSHV9lChoBmgJaA9DCG3kuimlH3BAlIaUUpRoFU0RAWgWR0CaxR9VFQVLdX2UKGgGaAloD0MI+3lTkQpKcECUhpRSlGgVTTUBaBZHQJrGE4DLbHp1fZQoaAZoCWgPQwgyyF2EqexwQJSGlFKUaBVNDwFoFkdAmsZ3dXT3I3V9lChoBmgJaA9DCCMWMeywkW9AlIaUUpRoFU27A2gWR0Cax19K28ZldX2UKGgGaAloD0MI0Eaum1IxcECUhpRSlGgVTTwBaBZHQJrHaIRAbAF1fZQoaAZoCWgPQwg7NZcbjIFhQJSGlFKUaBVN6ANoFkdAmsiIdU83dnV9lChoBmgJaA9DCICbxYsFMm9AlIaUUpRoFU1vAWgWR0Cayq3ljmSydX2UKGgGaAloD0MIxm8KKxV4cUCUhpRSlGgVTTcBaBZHQJrKx9qk/KR1fZQoaAZoCWgPQwgpQup29sFeQJSGlFKUaBVN6ANoFkdAmsvzT4L1EnV9lChoBmgJaA9DCG3F/rL7v2xAlIaUUpRoFU1ZAWgWR0CazFflp48mdX2UKGgGaAloD0MIOdTvwhavcUCUhpRSlGgVTbgBaBZHQJrNZMxoIv91fZQoaAZoCWgPQwjSbYlccBdwQJSGlFKUaBVNKgFoFkdAms2P+CK77XV9lChoBmgJaA9DCEVighq+PT5AlIaUUpRoFU0KAWgWR0CazjTxoZhsdX2UKGgGaAloD0MIn47HDFSYb0CUhpRSlGgVTSQBaBZHQJrQKg2606Z1fZQoaAZoCWgPQwhLAtTUct9wQJSGlFKUaBVL/mgWR0Ca0XauOjqOdX2UKGgGaAloD0MIVisTfqlBbkCUhpRSlGgVTSIBaBZHQJrRlGFzuF91fZQoaAZoCWgPQwjO/dXjfvtxQJSGlFKUaBVNTgFoFkdAmtIvtIClrXV9lChoBmgJaA9DCC52+6wynW1AlIaUUpRoFU3cAWgWR0Ca0vMRYigTdX2UKGgGaAloD0MIXvI/+bt35j+UhpRSlGgVS7JoFkdAmtPPepGWlnV9lChoBmgJaA9DCAlvD0JAu29AlIaUUpRoFU0KAWgWR0Ca1B1KoQ4CdX2UKGgGaAloD0MIVpv/Vx39ZUCUhpRSlGgVTa8BaBZHQJrURxkupS91fZQoaAZoCWgPQwirsYS1sXBwQJSGlFKUaBVNCgFoFkdAmtW3UH6dlXV9lChoBmgJaA9DCLMmFviKmjtAlIaUUpRoFUv1aBZHQJrW0kIHC411fZQoaAZoCWgPQwgEq+rld3BqQJSGlFKUaBVNPAFoFkdAmtcC6Ymb9nV9lChoBmgJaA9DCC6thsS9mG1AlIaUUpRoFU0oAWgWR0Ca19yUs4DLdX2UKGgGaAloD0MISpaTUHocbkCUhpRSlGgVTRUBaBZHQJrZw+aBqbl1fZQoaAZoCWgPQwjsoX2s4A1xQJSGlFKUaBVNGQFoFkdAmtsbe67NCHV9lChoBmgJaA9DCBIWFXF6h3FAlIaUUpRoFUvxaBZHQJrbJhqj8DV1fZQoaAZoCWgPQwgYeO49XFFwQJSGlFKUaBVNAgFoFkdAmt0kZm7J4nV9lChoBmgJaA9DCJ90IsFUszzAlIaUUpRoFUu8aBZHQJrdlrP+n651fZQoaAZoCWgPQwh5XFSLiDJuQJSGlFKUaBVNKwFoFkdAmt5TwQUYbnV9lChoBmgJaA9DCLjkuFO6OmdAlIaUUpRoFU2QAmgWR0Ca3mNlAeJYdX2UKGgGaAloD0MICvMeZ5p3bECUhpRSlGgVTR0BaBZHQJrf5CPZIxx1fZQoaAZoCWgPQwh9PPTdrUVyQJSGlFKUaBVNYQJoFkdAmuBEwnH/+HV9lChoBmgJaA9DCFBUNqypTW5AlIaUUpRoFU0IAWgWR0Ca4HZb6guidX2UKGgGaAloD0MIXynLEIf1cECUhpRSlGgVS/doFkdAmuDBzvJA+3V9lChoBmgJaA9DCBXl0viFIlxAlIaUUpRoFU3oA2gWR0Ca4MrWAf+1dX2UKGgGaAloD0MISrTk8TQ5YECUhpRSlGgVTegDaBZHQJrhCRfWtlt1fZQoaAZoCWgPQwhRZoNMMgRwQJSGlFKUaBVNygFoFkdAmuHaCL/CInV9lChoBmgJaA9DCE7tDFNb3G5AlIaUUpRoFUvyaBZHQJriGQmu1Wt1fZQoaAZoCWgPQwiMaaZ7HfVuQJSGlFKUaBVNDAFoFkdAmuQBzmwJPnV9lChoBmgJaA9DCNmz5zJ1vXFAlIaUUpRoFU0pAWgWR0Ca5O3iJfpmdX2UKGgGaAloD0MISu6wicyWb0CUhpRSlGgVTUECaBZHQJrk+i48U211fZQoaAZoCWgPQwhWEANdO1RwQJSGlFKUaBVN/QFoFkdAmuVD5GjKxXV9lChoBmgJaA9DCCR/MPCcu3BAlIaUUpRoFU0LAWgWR0Ca6GlQMx46dX2UKGgGaAloD0MIG53zUxwJbUCUhpRSlGgVTQ0BaBZHQJro8djoZAJ1fZQoaAZoCWgPQwj4xhAAXC9xQJSGlFKUaBVNCAFoFkdAmuj8MRYigXV9lChoBmgJaA9DCFTgZBs4EXFAlIaUUpRoFU1QAWgWR0Ca6WfGuLaVdX2UKGgGaAloD0MI+aBns2oHcECUhpRSlGgVTY0BaBZHQJrqWu2Zy+91fZQoaAZoCWgPQwjTLxFv3alyQJSGlFKUaBVNPwFoFkdAmus7Zi/fwnV9lChoBmgJaA9DCD8buW5KOm9AlIaUUpRoFU0mAWgWR0Ca7ArjYI0JdX2UKGgGaAloD0MIw9fXutT2bkCUhpRSlGgVTVkBaBZHQJrtjDZUT+N1fZQoaAZoCWgPQwiNDHIXYTBkQJSGlFKUaBVN5wFoFkdAmu3rronrp3V9lChoBmgJaA9DCK8FvTeGG1rAlIaUUpRoFU3XAWgWR0Ca7g9zfaYedX2UKGgGaAloD0MIipRm8ziPb0CUhpRSlGgVTSABaBZHQJruGPp6hQF1fZQoaAZoCWgPQwh+qgoNRFxwQJSGlFKUaBVNHwFoFkdAmu7tJvo/zXV9lChoBmgJaA9DCCrJOhzdlXBAlIaUUpRoFU0uAWgWR0Ca72omXw9adX2UKGgGaAloD0MIcVrwoq+4bUCUhpRSlGgVTdUBaBZHQJrwf7zkIX11fZQoaAZoCWgPQwg5C3va4a9wQJSGlFKUaBVNCgFoFkdAmvFrnLaEjHV9lChoBmgJaA9DCKInZVJDfW5AlIaUUpRoFU0FAWgWR0Ca8bM4LkS3dX2UKGgGaAloD0MIKEcBouB8bkCUhpRSlGgVTRABaBZHQJrydMajveB1fZQoaAZoCWgPQwjHTKJecMlwQJSGlFKUaBVNCQFoFkdAmvP7Llmvn3V9lChoBmgJaA9DCGdGPxpO/mtAlIaUUpRoFU3LAWgWR0Ca9O95yEL6dX2UKGgGaAloD0MImyFVFK88cUCUhpRSlGgVTQIBaBZHQJr2HMNc4YJ1fZQoaAZoCWgPQwh/h6JAH1VxQJSGlFKUaBVNnAFoFkdAmvb6/VRUFXV9lChoBmgJaA9DCKgZUkXxbXBAlIaUUpRoFU1LAWgWR0Ca+Z5dnkDIdX2UKGgGaAloD0MI0LNZ9TkQb0CUhpRSlGgVTS8BaBZHQJr6XMqz7dl1fZQoaAZoCWgPQwjYgXNG1JRwQJSGlFKUaBVNQQFoFkdAmvprSVnmJXV9lChoBmgJaA9DCDUNiuaBW29AlIaUUpRoFUv9aBZHQJr7KWyC4Bp1fZQoaAZoCWgPQwjK4ZNOJIxsQJSGlFKUaBVNEgFoFkdAmvuhAbADaHV9lChoBmgJaA9DCFFoWfePnGxAlIaUUpRoFU2HAWgWR0Ca/A80k4WDdX2UKGgGaAloD0MI5wEs8uuVaUCUhpRSlGgVTSkCaBZHQJr9+GmDUVl1fZQoaAZoCWgPQwhtWb4uQ7ZsQJSGlFKUaBVNIAFoFkdAmv/id4FA3XV9lChoBmgJaA9DCFvOpbhqDXBAlIaUUpRoFU00AWgWR0CbAeWhysCDdX2UKGgGaAloD0MIcSGP4EY6bkCUhpRSlGgVTYgBaBZHQJsC4ypJf6Z1fZQoaAZoCWgPQwjRsYNK3DJiQJSGlFKUaBVN6ANoFkdAmwPS4Bmwq3V9lChoBmgJaA9DCNXt7CuPtm5AlIaUUpRoFU0QAWgWR0CbA/VObiIddX2UKGgGaAloD0MIhAzk2WV5bkCUhpRSlGgVTSABaBZHQJsFK99MK1J1fZQoaAZoCWgPQwgzwAXZMjZtQJSGlFKUaBVNDQFoFkdAmwU2Nm16V3V9lChoBmgJaA9DCPWdX5SgOnBAlIaUUpRoFU10AWgWR0CbBUcnE2pAdX2UKGgGaAloD0MIMUCiCRT5bkCUhpRSlGgVTaICaBZHQJsGSg7HQyB1fZQoaAZoCWgPQwhsBU1LLFJvQJSGlFKUaBVNFwFoFkdAmwZULDye7XV9lChoBmgJaA9DCJs3TgpzkW5AlIaUUpRoFU0/AWgWR0CbBxo2n88+dWUu"
73
  },
74
  "ep_success_buffer": {
75
  ":type:": "<class 'collections.deque'>",
76
  ":serialized:": "gASVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
77
  },
78
- "_n_updates": 200,
79
  "n_steps": 2048,
80
  "gamma": 0.99,
81
  "gae_lambda": 0.95,
 
4
  ":serialized:": "gASVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
5
  "__module__": "stable_baselines3.common.policies",
6
  "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param sde_net_arch: Network architecture for extracting features\n when using gSDE. If None, the latent features from the policy will be used.\n Pass an empty list to use the states as features.\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
7
+ "__init__": "<function ActorCriticPolicy.__init__ at 0x7f4cb2065a70>",
8
+ "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f4cb2065b00>",
9
+ "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f4cb2065b90>",
10
+ "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f4cb2065c20>",
11
+ "_build": "<function ActorCriticPolicy._build at 0x7f4cb2065cb0>",
12
+ "forward": "<function ActorCriticPolicy.forward at 0x7f4cb2065d40>",
13
+ "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f4cb2065dd0>",
14
+ "_predict": "<function ActorCriticPolicy._predict at 0x7f4cb2065e60>",
15
+ "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f4cb2065ef0>",
16
+ "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f4cb2065f80>",
17
+ "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f4cb206b050>",
18
  "__abstractmethods__": "frozenset()",
19
+ "_abc_impl": "<_abc_data object at 0x7f4cb20b39c0>"
20
  },
21
  "verbose": 1,
22
  "policy_kwargs": {},
23
  "observation_space": {
24
  ":type:": "<class 'gym.spaces.box.Box'>",
25
+ ":serialized:": "gASVwwEAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMA2xvd5SMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMDF9yZWNvbnN0cnVjdJSTlGgGjAduZGFycmF5lJOUSwCFlEMBYpSHlFKUKEsBSwiFlGgKiUMgAACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP+UdJRijARoaWdolGgQaBJLAIWUaBSHlFKUKEsBSwiFlGgKiUMgAACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH+UdJRijA1ib3VuZGVkX2JlbG93lGgQaBJLAIWUaBSHlFKUKEsBSwiFlGgHjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiiUMIAAAAAAAAAACUdJRijA1ib3VuZGVkX2Fib3ZllGgQaBJLAIWUaBSHlFKUKEsBSwiFlGgoiUMIAAAAAAAAAACUdJRijApfbnBfcmFuZG9tlE6MBl9zaGFwZZRLCIWUdWIu",
26
  "dtype": "float32",
 
 
 
27
  "low": "[-inf -inf -inf -inf -inf -inf -inf -inf]",
28
  "high": "[inf inf inf inf inf inf inf inf]",
29
  "bounded_below": "[False False False False False False False False]",
30
  "bounded_above": "[False False False False False False False False]",
31
+ "_np_random": null,
32
+ "_shape": [
33
+ 8
34
+ ]
35
  },
36
  "action_space": {
37
  ":type:": "<class 'gym.spaces.discrete.Discrete'>",
38
+ ":serialized:": "gASViAAAAAAAAACME2d5bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpRLBIwFZHR5cGWUjAVudW1weZSMBWR0eXBllJOUjAJpOJSJiIeUUpQoSwOMATyUTk5OSv////9K/////0sAdJRijApfbnBfcmFuZG9tlE6MBl9zaGFwZZQpdWIu",
39
  "n": 4,
 
40
  "dtype": "int64",
41
+ "_np_random": null,
42
+ "_shape": []
43
  },
44
  "n_envs": 16,
45
+ "num_timesteps": 524288,
46
+ "_total_timesteps": 500000,
47
  "_num_timesteps_at_start": 0,
48
  "seed": null,
49
  "action_noise": null,
50
+ "start_time": 1657002407.1366575,
51
  "learning_rate": 0.0003,
52
  "tensorboard_log": null,
53
  "lr_schedule": {
 
56
  },
57
  "_last_obs": {
58
  ":type:": "<class 'numpy.ndarray'>",
59
+ ":serialized:": "gASVjQIAAAAAAACMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMDF9yZWNvbnN0cnVjdJSTlIwFbnVtcHmUjAduZGFycmF5lJOUSwCFlEMBYpSHlFKUKEsBSxBLCIaUaAOMBWR0eXBllJOUjAJmNJSJiIeUUpQoSwOMATyUTk5OSv////9K/////0sAdJRiiUIAAgAARoQgvlyLNbrLFAa3s+2CMae6sLp6exk2AACAPwAAgD+m3X2+HPKlPgP1j7swJGO+ovymOo49CTsAAAAAAAAAAIBzXj5PVwi84JUlu28A1TjDlH29YVBGOgAAgD8AAIA/ZpKqPPYceroUVBS2r0+UsEZPvjpICjk1AACAPwAAgD8A/A68e+KEuvZPbzm8sLI0boPMOj06iLgAAIA/AACAP1osIb6ukos7UoMqPN9cELrHqy+9J2ACOwAAgD8AAIA/DQmmPmEP3bxgFsq3/m8cNtIqEr4PMAU3AACAPwAAgD8z0jq+2+HNvLLoAr68Eam8J+80PurTgj0AAIA/AACAP+YUeD6xmJI/eN4UP05YBr//PFw+po3mPQAAAAAAAAAANniFPlSYkD8d3vM+KkzWvg+hHj4ppAM+AAAAAAAAAAAaVHa9wyVtukHcNDtQAbE2dE0oO/PRTLoAAIA/AACAP/1wjj7uVd68CO0zu6MlrDkF/EO+kJVhOgAAgD8AAIA/1i+Avj26KrmauhS8RVVhPL0+sLt2xxW8AACAPwAAgD998pe+SDyZvEMzp7q/r+u4nbADPkEAxTkAAIA/AACAP03SSL3DgWK6odMhOXcIgDTE5ck6xws3uAAAgD8AAIA/AOCBu4UbsbmqpDU8XRr9uBQv7jtgDPe3AACAPwAAgD+UdJRiLg=="
60
  },
61
  "_last_episode_starts": {
62
  ":type:": "<class 'numpy.ndarray'>",
 
66
  "_episode_num": 0,
67
  "use_sde": false,
68
  "sde_sample_freq": -1,
69
+ "_current_progress_remaining": -0.04857599999999995,
70
  "ep_info_buffer": {
71
  ":type:": "<class 'collections.deque'>",
72
+ ":serialized:": "gASVfBAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMI6e3PRcM8YECUhpRSlIwBbJRN6AOMAXSUR0CN7i8V58jSdX2UKGgGaAloD0MIXyhgOxjIYkCUhpRSlGgVTegDaBZHQI3uTRjSXt11fZQoaAZoCWgPQwhbttYXCaFGwJSGlFKUaBVL22gWR0CN9+lSCOFQdX2UKGgGaAloD0MI14UfnE/1VkCUhpRSlGgVTegDaBZHQI3/kyeqaPV1fZQoaAZoCWgPQwiO5zOg3mFeQJSGlFKUaBVN6ANoFkdAjgEslsxfwHV9lChoBmgJaA9DCC457pQOO15AlIaUUpRoFU3oA2gWR0COEJvw3HaOdX2UKGgGaAloD0MIR1Z+GYzrVkCUhpRSlGgVTegDaBZHQI4VM9yLhrF1fZQoaAZoCWgPQwiIRncQu4xhQJSGlFKUaBVN6ANoFkdAjilUJOWSlnV9lChoBmgJaA9DCAzJycStN11AlIaUUpRoFU3oA2gWR0COKrun/DLsdX2UKGgGaAloD0MI9Ik8SboXW0CUhpRSlGgVTegDaBZHQI44jeO4oZ11fZQoaAZoCWgPQwgktOVciiBfQJSGlFKUaBVN6ANoFkdAjj7eGfwqiHV9lChoBmgJaA9DCAwepn1z0GFAlIaUUpRoFU3oA2gWR0COQgsdT5wgdX2UKGgGaAloD0MI0sYRa/G+XkCUhpRSlGgVTegDaBZHQI5F0AxSHdp1fZQoaAZoCWgPQwjWqfI9I5diQJSGlFKUaBVN6ANoFkdAjkXy6DoQnXV9lChoBmgJaA9DCFDgnXz6lWBAlIaUUpRoFU3oA2gWR0COSSk2P1cudX2UKGgGaAloD0MIYYxIFFpeZECUhpRSlGgVTegDaBZHQI5jmwNb1RN1fZQoaAZoCWgPQwipSltc41pTQJSGlFKUaBVN6ANoFkdAjmP74SHuZ3V9lChoBmgJaA9DCDnQQ20bWl1AlIaUUpRoFU3oA2gWR0COZBbAUL2IdX2UKGgGaAloD0MIaXBbW/h+a0CUhpRSlGgVTTkBaBZHQI5kZ6rvLHN1fZQoaAZoCWgPQwhbsb/snitdQJSGlFKUaBVN6ANoFkdAjmyHYg7o0XV9lChoBmgJaA9DCNzVq8jo5lBAlIaUUpRoFU3oA2gWR0COcsyMUAT7dX2UKGgGaAloD0MIFto5zQItX0CUhpRSlGgVTegDaBZHQI50G5z5oGp1fZQoaAZoCWgPQwghlPdxNCJVQJSGlFKUaBVN6ANoFkdAjoE6VD8cdnV9lChoBmgJaA9DCBL7BFAMEmBAlIaUUpRoFU3oA2gWR0COhThm5DqodX2UKGgGaAloD0MIXB/WG7UrYECUhpRSlGgVTegDaBZHQI6WcIzFdcB1fZQoaAZoCWgPQwgjZ2FPu3ZhQJSGlFKUaBVN6ANoFkdAjpe6TwDvE3V9lChoBmgJaA9DCKfMzTeicUFAlIaUUpRoFUvxaBZHQI6gGEdvKlp1fZQoaAZoCWgPQwjpYz4g0ANhQJSGlFKUaBVN6ANoFkdAjqSc8cMmW3V9lChoBmgJaA9DCH/eVKTC1V5AlIaUUpRoFU3oA2gWR0CPXmyAxzq9dX2UKGgGaAloD0MIFCS2u4cUYUCUhpRSlGgVTegDaBZHQI9lhfQa73B1fZQoaAZoCWgPQwio5JzYQ7BdQJSGlFKUaBVN6ANoFkdAj2Wpy6tknXV9lChoBmgJaA9DCBJPdjOjIVtAlIaUUpRoFU3oA2gWR0CPaRqoIfKZdX2UKGgGaAloD0MIO8JpwQugZUCUhpRSlGgVTSoDaBZHQI9uIA4n4PB1fZQoaAZoCWgPQwhdwqG3+EZxQJSGlFKUaBVN1ANoFkdAj4BpGnXNDHV9lChoBmgJaA9DCP0QGywcHmFAlIaUUpRoFU3oA2gWR0CPgkcf/3nIdX2UKGgGaAloD0MIhJohVRR2XUCUhpRSlGgVTegDaBZHQI+DAIdELIB1fZQoaAZoCWgPQwglICbhQkVeQJSGlFKUaBVN6ANoFkdAj4sl90A93nV9lChoBmgJaA9DCAkaM4n6DGNAlIaUUpRoFU3oA2gWR0CPkZ60IC2ddX2UKGgGaAloD0MIkNyadFvtXECUhpRSlGgVTegDaBZHQI+S8w35vcd1fZQoaAZoCWgPQwhiEi7kkb5nQJSGlFKUaBVNRQJoFkdAj5Vh1LamGnV9lChoBmgJaA9DCL6jxoSYmyXAlIaUUpRoFUvkaBZHQI+YkXSBshx1fZQoaAZoCWgPQwjVB5J3Dr03QJSGlFKUaBVL72gWR0CPmjhlUZNxdX2UKGgGaAloD0MIxhaCHJTMXkCUhpRSlGgVTegDaBZHQI+erfgrH2h1fZQoaAZoCWgPQwiKc9TRcRNdQJSGlFKUaBVN6ANoFkdAj7MkwnH/+HV9lChoBmgJaA9DCPiImBLJNmNAlIaUUpRoFU3oA2gWR0CPtG7K7qY7dX2UKGgGaAloD0MIU1vqIK9sa0CUhpRSlGgVTUADaBZHQI+7e+sYEW91fZQoaAZoCWgPQwhyT1d3rJ9oQJSGlFKUaBVN2wFoFkdAj7u3V9Wp63V9lChoBmgJaA9DCCtqMA3DIl9AlIaUUpRoFU3oA2gWR0CPvLRceKbbdX2UKGgGaAloD0MI/wbt1ccfY0CUhpRSlGgVTegDaBZHQI/G9q+Jxed1fZQoaAZoCWgPQwggXWxaKfRbQJSGlFKUaBVN6ANoFkdAj84Y2jwhGHV9lChoBmgJaA9DCPOPvknTmEJAlIaUUpRoFU3oA2gWR0CP0geHSF4+dX2UKGgGaAloD0MI7Nrebkk0WkCUhpRSlGgVTegDaBZHQI/Xo150KZ51fZQoaAZoCWgPQwi2MXbCSydfQJSGlFKUaBVN6ANoFkdAj+1t7a7EpHV9lChoBmgJaA9DCDBLOzWXJ2JAlIaUUpRoFU3oA2gWR0CQAuoAn2IwdX2UKGgGaAloD0MIHqm+84uaYkCUhpRSlGgVTegDaBZHQJAD1AC4jKR1fZQoaAZoCWgPQwhMx5xn7LlYQJSGlFKUaBVN6ANoFkdAkAWvDDTBqXV9lChoBmgJaA9DCIwv2uMFBGFAlIaUUpRoFU3oA2gWR0CQCByFfzBidX2UKGgGaAloD0MI+3lTkQpxYkCUhpRSlGgVTewCaBZHQJAIt5IH1OF1fZQoaAZoCWgPQwgqUmFsIRpaQJSGlFKUaBVN6ANoFkdAkAlMunMt9XV9lChoBmgJaA9DCNYCe0ykbl5AlIaUUpRoFU3oA2gWR0CQDCASFoL5dX2UKGgGaAloD0MI8pTVdD0icUCUhpRSlGgVTXoDaBZHQJAWaEGqxTt1fZQoaAZoCWgPQwi1xTU+k1taQJSGlFKUaBVN6ANoFkdAkBjUxqO94HV9lChoBmgJaA9DCEWfjzLixGFAlIaUUpRoFU3oA2gWR0CQHPaUiY9gdX2UKGgGaAloD0MIrMq+KwJvYUCUhpRSlGgVTegDaBZHQJAdGZPVNHp1fZQoaAZoCWgPQwhZh6OrdGBiQJSGlFKUaBVN6ANoFkdAkIGYR7JGOXV9lChoBmgJaA9DCFqfckwWR1JAlIaUUpRoFU3oA2gWR0CQhYmjCYTkdX2UKGgGaAloD0MIK4TVWMLAWUCUhpRSlGgVTegDaBZHQJCHmVRk3CN1fZQoaAZoCWgPQwi3RC44A6FhQJSGlFKUaBVN6ANoFkdAkIpv3ai9I3V9lChoBmgJaA9DCIeowp/hC2JAlIaUUpRoFU3oA2gWR0CQlA8KG+K1dX2UKGgGaAloD0MIVAJiEq5cbECUhpRSlGgVTQ4DaBZHQJCVkP3BYV91fZQoaAZoCWgPQwj11VWBWjVeQJSGlFKUaBVN6ANoFkdAkJ37LMcIaHV9lChoBmgJaA9DCLyTT49tOWBAlIaUUpRoFU3oA2gWR0CQnrGmUGFBdX2UKGgGaAloD0MIwha7fVYrYUCUhpRSlGgVTegDaBZHQJCgG2LHdXV1fZQoaAZoCWgPQwgVN24xv35gQJSGlFKUaBVN6ANoFkdAkKJ0RzzVc3V9lChoBmgJaA9DCNP2r6w0NVlAlIaUUpRoFU3oA2gWR0CQouRUm2LHdX2UKGgGaAloD0MICmZMwZp7YUCUhpRSlGgVTegDaBZHQJClQbdadMF1fZQoaAZoCWgPQwgJ/OHnP6dvQJSGlFKUaBVNjgNoFkdAkKrv73wkPnV9lChoBmgJaA9DCM+EJoklu1xAlIaUUpRoFU3oA2gWR0CQrhsyBTXKdX2UKGgGaAloD0MIo+iBj0GEakCUhpRSlGgVTbgDaBZHQJCxBk5IYm91fZQoaAZoCWgPQwgst7QakoJhQJSGlFKUaBVN6ANoFkdAkLOUw35vcnV9lChoBmgJaA9DCBL3WPpQc2RAlIaUUpRoFU3oA2gWR0CQuX1qWToudX2UKGgGaAloD0MIX5Z2aq7Mb0CUhpRSlGgVTRQCaBZHQJC9Dc9GI9F1fZQoaAZoCWgPQwiOeR1xSHlhQJSGlFKUaBVN6ANoFkdAkL1CB9TgmHV9lChoBmgJaA9DCGtgqwSL029AlIaUUpRoFU1RAWgWR0CQviYVqN6xdX2UKGgGaAloD0MIZt0/FqItY0CUhpRSlGgVTegDaBZHQJC+598Z1mt1fZQoaAZoCWgPQwire2Rz1UJfQJSGlFKUaBVN6ANoFkdAkMEjot+TeXV9lChoBmgJaA9DCHe8yW9RX21AlIaUUpRoFU0NA2gWR0CQxzfP5YYBdX2UKGgGaAloD0MIDFwea8ZVYUCUhpRSlGgVTegDaBZHQJDJGt+1Bt11fZQoaAZoCWgPQwh2+kFdpKViQJSGlFKUaBVN6ANoFkdAkMpyJsO5KHV9lChoBmgJaA9DCIBjz55LLW9AlIaUUpRoFU1PAmgWR0CQz1tY0VJudX2UKGgGaAloD0MIdlCJ6xiPYECUhpRSlGgVTegDaBZHQJDR/WI42jx1fZQoaAZoCWgPQwgpdjQO9dlWQJSGlFKUaBVN6ANoFkdAkNaqZ6Uqx3V9lChoBmgJaA9DCMOgTKPJCllAlIaUUpRoFU3oA2gWR0CQ1yr8R+SbdX2UKGgGaAloD0MIGmt/Z3swYUCUhpRSlGgVTegDaBZHQJDZ39zfaYh1fZQoaAZoCWgPQwind/F+3MlsQJSGlFKUaBVNLQJoFkdAkNphGx2SuHV9lChoBmgJaA9DCG5MT1jis0RAlIaUUpRoFUupaBZHQJDgR+w1R+B1fZQoaAZoCWgPQwgFiljEMNVjQJSGlFKUaBVN6ANoFkdAkOO29+PRzHV9lChoBmgJaA9DCM/AyMuab15AlIaUUpRoFU3oA2gWR0CQ6eqoZQ54dX2UKGgGaAloD0MILLgf8EBbZUCUhpRSlGgVTegDaBZHQJDv8F1SwW51fZQoaAZoCWgPQwisGoS53TlrQJSGlFKUaBVNjQNoFkdAkPBN/SYw7HVlLg=="
73
  },
74
  "ep_success_buffer": {
75
  ":type:": "<class 'collections.deque'>",
76
  ":serialized:": "gASVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
77
  },
78
+ "_n_updates": 160,
79
  "n_steps": 2048,
80
  "gamma": 0.99,
81
  "gae_lambda": 0.95,
'LunarLander-ppo-500k/policy.optimizer.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4be36e6768c02f1df8e2a541d220ef2e6681cf898da1bd3f043ea4e783f9f62e
3
  size 84893
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:567823a31dfbe8b99c41deb9ec8c7a142c917b82d46be9ed845c9ea0ff096e68
3
  size 84893
'LunarLander-ppo-500k/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0040481a4769fa861ae40dc903a3cff442deb0862d419e8a55c3502b1e894146
3
  size 43201
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3ea3abbc61e65a909498f10d80568772fb1a1a4cde03890f8d3be177bc07ea93
3
  size 43201
'LunarLander-ppo-500k/system_info.txt CHANGED
@@ -4,4 +4,4 @@ Stable-Baselines3: 1.5.0
4
  PyTorch: 1.11.0+cu113
5
  GPU Enabled: True
6
  Numpy: 1.21.6
7
- Gym: 0.17.3
 
4
  PyTorch: 1.11.0+cu113
5
  GPU Enabled: True
6
  Numpy: 1.21.6
7
+ Gym: 0.21.0
README.md ADDED
@@ -0,0 +1,36 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ library_name: stable-baselines3
3
+ tags:
4
+ - LunarLander-v2
5
+ - deep-reinforcement-learning
6
+ - reinforcement-learning
7
+ - stable-baselines3
8
+ model-index:
9
+ - name: PPO
10
+ results:
11
+ - metrics:
12
+ - type: mean_reward
13
+ value: 177.16 +/- 93.23
14
+ name: mean_reward
15
+ task:
16
+ type: reinforcement-learning
17
+ name: reinforcement-learning
18
+ dataset:
19
+ name: LunarLander-v2
20
+ type: LunarLander-v2
21
+ ---
22
+
23
+ # **PPO** Agent playing **LunarLander-v2**
24
+ This is a trained model of a **PPO** agent playing **LunarLander-v2**
25
+ using the [stable-baselines3 library](https://github.com/DLR-RM/stable-baselines3).
26
+
27
+ ## Usage (with Stable-baselines3)
28
+ TODO: Add your code
29
+
30
+
31
+ ```python
32
+ from stable_baselines3 import ...
33
+ from huggingface_sb3 import load_from_hub
34
+
35
+ ...
36
+ ```
config.json CHANGED
@@ -1 +1 @@
1
- {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gASVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param sde_net_arch: Network architecture for extracting features\n when using gSDE. If None, the latent features from the policy will be used.\n Pass an empty list to use the states as features.\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7f83faae7680>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f83faae7710>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f83faae77a0>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f83faae7830>", "_build": "<function ActorCriticPolicy._build at 0x7f83faae78c0>", "forward": "<function ActorCriticPolicy.forward at 0x7f83faae7950>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f83faae79e0>", "_predict": "<function ActorCriticPolicy._predict at 0x7f83faae7a70>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f83faae7b00>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f83faae7b90>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f83faae7c20>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc_data object at 0x7f83fab39420>"}, "verbose": 1, "policy_kwargs": {}, "observation_space": {":type:": "<class 'gym.spaces.box.Box'>", ":serialized:": "gASVwgEAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBXNoYXBllEsIhZSMA2xvd5SMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMDF9yZWNvbnN0cnVjdJSTlGgGjAduZGFycmF5lJOUSwCFlEMBYpSHlFKUKEsBSwiFlGgKiUMgAACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP+UdJRijARoaWdolGgSaBRLAIWUaBaHlFKUKEsBSwiFlGgKiUMgAACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH+UdJRijA1ib3VuZGVkX2JlbG93lGgSaBRLAIWUaBaHlFKUKEsBSwiFlGgHjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiiUMIAAAAAAAAAACUdJRijA1ib3VuZGVkX2Fib3ZllGgSaBRLAIWUaBaHlFKUKEsBSwiFlGgqiUMIAAAAAAAAAACUdJRijApfbnBfcmFuZG9tlE51Yi4=", "dtype": "float32", "shape": [8], "low": "[-inf -inf -inf -inf -inf -inf -inf -inf]", "high": "[inf inf inf inf inf inf inf inf]", "bounded_below": "[False False False False False False False False]", "bounded_above": "[False False False False False False False False]", "_np_random": null}, "action_space": {":type:": "<class 'gym.spaces.discrete.Discrete'>", ":serialized:": "gASVgQAAAAAAAACME2d5bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpRLBIwFc2hhcGWUKYwFZHR5cGWUjAVudW1weZRoB5OUjAJpOJSJiIeUUpQoSwOMATyUTk5OSv////9K/////0sAdJRijApfbnBfcmFuZG9tlE51Yi4=", "n": 4, "shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 16, "num_timesteps": 131072, "_total_timesteps": 100000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1657003619.1741638, "learning_rate": 0.0003, "tensorboard_log": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gASVvwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwNX2J1aWx0aW5fdHlwZZSTlIwKTGFtYmRhVHlwZZSFlFKUKGgCjAhDb2RlVHlwZZSFlFKUKEsBSwBLAUsBSxNDBIgAUwCUToWUKYwBX5SFlIxIL3Vzci9sb2NhbC9saWIvcHl0aG9uMy43L2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5RLgEMCAAGUjAN2YWyUhZQpdJRSlH2UKIwLX19wYWNrYWdlX1+UjBhzdGFibGVfYmFzZWxpbmVzMy5jb21tb26UjAhfX25hbWVfX5SMHnN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi51dGlsc5SMCF9fZmlsZV9flIxIL3Vzci9sb2NhbC9saWIvcHl0aG9uMy43L2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaCB9lH2UKGgXaA6MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgYjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz8zqSowVTJhhZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gASVjQIAAAAAAACMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMDF9yZWNvbnN0cnVjdJSTlIwFbnVtcHmUjAduZGFycmF5lJOUSwCFlEMBYpSHlFKUKEsBSxBLCIaUaAOMBWR0eXBllJOUjAJmNJSJiIeUUpQoSwOMATyUTk5OSv////9K/////0sAdJRiiUIAAgAAAJCSuw16tj/kBo+9LcMsPXHNUrz2U1m9AAAAAAAAAACAOo29yJGGP6RjA76Bn+i+zFugvQhaib0AAAAAAAAAADOIK717Vq26UnsAunV03bTTSIY65z8TOQAAgD8AAIA/zsgQP6+l+r0p/Zo9hf7BuoFR3b0Yo+E8AAAAAAAAgD+Adxe+RFIIP1TBGj3v4Iy+vCKtvHJ4zzwAAAAAAAAAAFqlOz5kHJE/Nv33Pt1P676RLDM+kTClPQAAAAAAAAAAw6ngvoJ/pz5O1+w9yQ+ivrm10bwRtom8AAAAAAAAAAAo7Ac/zQoNP1oonD0To4m+KEjRPUpjDrwAAAAAAAAAANDgCj/7M0c/rvs5Ptrps771fi4+EQsWugAAAAAAAAAAU4YwvocObj9K1Lm98DK6vuI95L1oML66AAAAAAAAAAA6x0Y/ze14vqBZ2DOqwQ4x9YPKvWZiKLQAAIA/AACAP+bCUb7WUVI/av4Lvrtpu7776ua97IAiPQAAAAAAAAAAgLUtvVsNcT+f1hE94GTjvrz5Ib0m0Pg8AAAAAAAAAAAmU30+KATZvCpC/jqq1yi5eEZBvtL8DLoAAIA/AACAP7PB6L1JkBc9EeKxPbWrSb5IT/W8hXRnPQAAAAAAAAAARU2Dvjs1irxWDRi7djo2uQMq/D1/IDU6AACAPwAAgD+UdJRiLg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gASVmAAAAAAAAACMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMDF9yZWNvbnN0cnVjdJSTlIwFbnVtcHmUjAduZGFycmF5lJOUSwCFlEMBYpSHlFKUKEsBSxCFlGgDjAVkdHlwZZSTlIwCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYolDEAAAAAAAAAAAAAAAAAAAAACUdJRiLg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.3107200000000001, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gASVeBAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIU3jQ7LqMcECUhpRSlIwBbJRNXwGMAXSUR0CaWeTPSlWPdX2UKGgGaAloD0MIaRoUzYPfa0CUhpRSlGgVTTABaBZHQJpaFuuRs/J1fZQoaAZoCWgPQwiMTSuFQHRaQJSGlFKUaBVN6ANoFkdAmlrufNA1N3V9lChoBmgJaA9DCBQGZRqNgHBAlIaUUpRoFU24AWgWR0CaXh5FPSDzdX2UKGgGaAloD0MIpg7yejDAbkCUhpRSlGgVTS4DaBZHQJpgyznied11fZQoaAZoCWgPQwjs20lE+AtYQJSGlFKUaBVN6ANoFkdAmmFCJO32EnV9lChoBmgJaA9DCKIIqdvZGHBAlIaUUpRoFU0FAWgWR0CaYiXbM5fddX2UKGgGaAloD0MIrDdqhSkqcMCUhpRSlGgVTZQCaBZHQJpi6r/82rJ1fZQoaAZoCWgPQwiDE9GvrZ+yP5SGlFKUaBVL22gWR0CaY9pXZGrkdX2UKGgGaAloD0MIkunQ6fkMbkCUhpRSlGgVTRcBaBZHQJpkEr4Fia11fZQoaAZoCWgPQwhiu3uAri1zQJSGlFKUaBVNhAFoFkdAmmQ7Ms6JZXV9lChoBmgJaA9DCETEzalknFNAlIaUUpRoFU3oA2gWR0CaZFK7qY7adX2UKGgGaAloD0MICI82jljLF8CUhpRSlGgVTb4CaBZHQJq/4f5k9U11fZQoaAZoCWgPQwhf8GlOHjRwQJSGlFKUaBVNKAFoFkdAmsBRzV+ZxHV9lChoBmgJaA9DCH0lkBK7/m9AlIaUUpRoFU1WAWgWR0CawhtVrAP/dX2UKGgGaAloD0MIBK3AkBX+cUCUhpRSlGgVTR4BaBZHQJrDJBrvb491fZQoaAZoCWgPQwjsGFdcnKJlwJSGlFKUaBVNlgFoFkdAmsUD6WPcSHV9lChoBmgJaA9DCG3kuimlH3BAlIaUUpRoFU0RAWgWR0CaxR9VFQVLdX2UKGgGaAloD0MI+3lTkQpKcECUhpRSlGgVTTUBaBZHQJrGE4DLbHp1fZQoaAZoCWgPQwgyyF2EqexwQJSGlFKUaBVNDwFoFkdAmsZ3dXT3I3V9lChoBmgJaA9DCCMWMeywkW9AlIaUUpRoFU27A2gWR0Cax19K28ZldX2UKGgGaAloD0MI0Eaum1IxcECUhpRSlGgVTTwBaBZHQJrHaIRAbAF1fZQoaAZoCWgPQwg7NZcbjIFhQJSGlFKUaBVN6ANoFkdAmsiIdU83dnV9lChoBmgJaA9DCICbxYsFMm9AlIaUUpRoFU1vAWgWR0Cayq3ljmSydX2UKGgGaAloD0MIxm8KKxV4cUCUhpRSlGgVTTcBaBZHQJrKx9qk/KR1fZQoaAZoCWgPQwgpQup29sFeQJSGlFKUaBVN6ANoFkdAmsvzT4L1EnV9lChoBmgJaA9DCG3F/rL7v2xAlIaUUpRoFU1ZAWgWR0CazFflp48mdX2UKGgGaAloD0MIOdTvwhavcUCUhpRSlGgVTbgBaBZHQJrNZMxoIv91fZQoaAZoCWgPQwjSbYlccBdwQJSGlFKUaBVNKgFoFkdAms2P+CK77XV9lChoBmgJaA9DCEVighq+PT5AlIaUUpRoFU0KAWgWR0CazjTxoZhsdX2UKGgGaAloD0MIn47HDFSYb0CUhpRSlGgVTSQBaBZHQJrQKg2606Z1fZQoaAZoCWgPQwhLAtTUct9wQJSGlFKUaBVL/mgWR0Ca0XauOjqOdX2UKGgGaAloD0MIVisTfqlBbkCUhpRSlGgVTSIBaBZHQJrRlGFzuF91fZQoaAZoCWgPQwjO/dXjfvtxQJSGlFKUaBVNTgFoFkdAmtIvtIClrXV9lChoBmgJaA9DCC52+6wynW1AlIaUUpRoFU3cAWgWR0Ca0vMRYigTdX2UKGgGaAloD0MIXvI/+bt35j+UhpRSlGgVS7JoFkdAmtPPepGWlnV9lChoBmgJaA9DCAlvD0JAu29AlIaUUpRoFU0KAWgWR0Ca1B1KoQ4CdX2UKGgGaAloD0MIVpv/Vx39ZUCUhpRSlGgVTa8BaBZHQJrURxkupS91fZQoaAZoCWgPQwirsYS1sXBwQJSGlFKUaBVNCgFoFkdAmtW3UH6dlXV9lChoBmgJaA9DCLMmFviKmjtAlIaUUpRoFUv1aBZHQJrW0kIHC411fZQoaAZoCWgPQwgEq+rld3BqQJSGlFKUaBVNPAFoFkdAmtcC6Ymb9nV9lChoBmgJaA9DCC6thsS9mG1AlIaUUpRoFU0oAWgWR0Ca19yUs4DLdX2UKGgGaAloD0MISpaTUHocbkCUhpRSlGgVTRUBaBZHQJrZw+aBqbl1fZQoaAZoCWgPQwjsoX2s4A1xQJSGlFKUaBVNGQFoFkdAmtsbe67NCHV9lChoBmgJaA9DCBIWFXF6h3FAlIaUUpRoFUvxaBZHQJrbJhqj8DV1fZQoaAZoCWgPQwgYeO49XFFwQJSGlFKUaBVNAgFoFkdAmt0kZm7J4nV9lChoBmgJaA9DCJ90IsFUszzAlIaUUpRoFUu8aBZHQJrdlrP+n651fZQoaAZoCWgPQwh5XFSLiDJuQJSGlFKUaBVNKwFoFkdAmt5TwQUYbnV9lChoBmgJaA9DCLjkuFO6OmdAlIaUUpRoFU2QAmgWR0Ca3mNlAeJYdX2UKGgGaAloD0MICvMeZ5p3bECUhpRSlGgVTR0BaBZHQJrf5CPZIxx1fZQoaAZoCWgPQwh9PPTdrUVyQJSGlFKUaBVNYQJoFkdAmuBEwnH/+HV9lChoBmgJaA9DCFBUNqypTW5AlIaUUpRoFU0IAWgWR0Ca4HZb6guidX2UKGgGaAloD0MIXynLEIf1cECUhpRSlGgVS/doFkdAmuDBzvJA+3V9lChoBmgJaA9DCBXl0viFIlxAlIaUUpRoFU3oA2gWR0Ca4MrWAf+1dX2UKGgGaAloD0MISrTk8TQ5YECUhpRSlGgVTegDaBZHQJrhCRfWtlt1fZQoaAZoCWgPQwhRZoNMMgRwQJSGlFKUaBVNygFoFkdAmuHaCL/CInV9lChoBmgJaA9DCE7tDFNb3G5AlIaUUpRoFUvyaBZHQJriGQmu1Wt1fZQoaAZoCWgPQwiMaaZ7HfVuQJSGlFKUaBVNDAFoFkdAmuQBzmwJPnV9lChoBmgJaA9DCNmz5zJ1vXFAlIaUUpRoFU0pAWgWR0Ca5O3iJfpmdX2UKGgGaAloD0MISu6wicyWb0CUhpRSlGgVTUECaBZHQJrk+i48U211fZQoaAZoCWgPQwhWEANdO1RwQJSGlFKUaBVN/QFoFkdAmuVD5GjKxXV9lChoBmgJaA9DCCR/MPCcu3BAlIaUUpRoFU0LAWgWR0Ca6GlQMx46dX2UKGgGaAloD0MIG53zUxwJbUCUhpRSlGgVTQ0BaBZHQJro8djoZAJ1fZQoaAZoCWgPQwj4xhAAXC9xQJSGlFKUaBVNCAFoFkdAmuj8MRYigXV9lChoBmgJaA9DCFTgZBs4EXFAlIaUUpRoFU1QAWgWR0Ca6WfGuLaVdX2UKGgGaAloD0MI+aBns2oHcECUhpRSlGgVTY0BaBZHQJrqWu2Zy+91fZQoaAZoCWgPQwjTLxFv3alyQJSGlFKUaBVNPwFoFkdAmus7Zi/fwnV9lChoBmgJaA9DCD8buW5KOm9AlIaUUpRoFU0mAWgWR0Ca7ArjYI0JdX2UKGgGaAloD0MIw9fXutT2bkCUhpRSlGgVTVkBaBZHQJrtjDZUT+N1fZQoaAZoCWgPQwiNDHIXYTBkQJSGlFKUaBVN5wFoFkdAmu3rronrp3V9lChoBmgJaA9DCK8FvTeGG1rAlIaUUpRoFU3XAWgWR0Ca7g9zfaYedX2UKGgGaAloD0MIipRm8ziPb0CUhpRSlGgVTSABaBZHQJruGPp6hQF1fZQoaAZoCWgPQwh+qgoNRFxwQJSGlFKUaBVNHwFoFkdAmu7tJvo/zXV9lChoBmgJaA9DCCrJOhzdlXBAlIaUUpRoFU0uAWgWR0Ca72omXw9adX2UKGgGaAloD0MIcVrwoq+4bUCUhpRSlGgVTdUBaBZHQJrwf7zkIX11fZQoaAZoCWgPQwg5C3va4a9wQJSGlFKUaBVNCgFoFkdAmvFrnLaEjHV9lChoBmgJaA9DCKInZVJDfW5AlIaUUpRoFU0FAWgWR0Ca8bM4LkS3dX2UKGgGaAloD0MIKEcBouB8bkCUhpRSlGgVTRABaBZHQJrydMajveB1fZQoaAZoCWgPQwjHTKJecMlwQJSGlFKUaBVNCQFoFkdAmvP7Llmvn3V9lChoBmgJaA9DCGdGPxpO/mtAlIaUUpRoFU3LAWgWR0Ca9O95yEL6dX2UKGgGaAloD0MImyFVFK88cUCUhpRSlGgVTQIBaBZHQJr2HMNc4YJ1fZQoaAZoCWgPQwh/h6JAH1VxQJSGlFKUaBVNnAFoFkdAmvb6/VRUFXV9lChoBmgJaA9DCKgZUkXxbXBAlIaUUpRoFU1LAWgWR0Ca+Z5dnkDIdX2UKGgGaAloD0MI0LNZ9TkQb0CUhpRSlGgVTS8BaBZHQJr6XMqz7dl1fZQoaAZoCWgPQwjYgXNG1JRwQJSGlFKUaBVNQQFoFkdAmvprSVnmJXV9lChoBmgJaA9DCDUNiuaBW29AlIaUUpRoFUv9aBZHQJr7KWyC4Bp1fZQoaAZoCWgPQwjK4ZNOJIxsQJSGlFKUaBVNEgFoFkdAmvuhAbADaHV9lChoBmgJaA9DCFFoWfePnGxAlIaUUpRoFU2HAWgWR0Ca/A80k4WDdX2UKGgGaAloD0MI5wEs8uuVaUCUhpRSlGgVTSkCaBZHQJr9+GmDUVl1fZQoaAZoCWgPQwhtWb4uQ7ZsQJSGlFKUaBVNIAFoFkdAmv/id4FA3XV9lChoBmgJaA9DCFvOpbhqDXBAlIaUUpRoFU00AWgWR0CbAeWhysCDdX2UKGgGaAloD0MIcSGP4EY6bkCUhpRSlGgVTYgBaBZHQJsC4ypJf6Z1fZQoaAZoCWgPQwjRsYNK3DJiQJSGlFKUaBVN6ANoFkdAmwPS4Bmwq3V9lChoBmgJaA9DCNXt7CuPtm5AlIaUUpRoFU0QAWgWR0CbA/VObiIddX2UKGgGaAloD0MIhAzk2WV5bkCUhpRSlGgVTSABaBZHQJsFK99MK1J1fZQoaAZoCWgPQwgzwAXZMjZtQJSGlFKUaBVNDQFoFkdAmwU2Nm16V3V9lChoBmgJaA9DCPWdX5SgOnBAlIaUUpRoFU10AWgWR0CbBUcnE2pAdX2UKGgGaAloD0MIMUCiCRT5bkCUhpRSlGgVTaICaBZHQJsGSg7HQyB1fZQoaAZoCWgPQwhsBU1LLFJvQJSGlFKUaBVNFwFoFkdAmwZULDye7XV9lChoBmgJaA9DCJs3TgpzkW5AlIaUUpRoFU0/AWgWR0CbBxo2n88+dWUu"}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gASVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 200, "n_steps": 2048, "gamma": 0.99, "gae_lambda": 0.95, "ent_coef": 0.0, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 10, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gASVvwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwNX2J1aWx0aW5fdHlwZZSTlIwKTGFtYmRhVHlwZZSFlFKUKGgCjAhDb2RlVHlwZZSFlFKUKEsBSwBLAUsBSxNDBIgAUwCUToWUKYwBX5SFlIxIL3Vzci9sb2NhbC9saWIvcHl0aG9uMy43L2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5RLgEMCAAGUjAN2YWyUhZQpdJRSlH2UKIwLX19wYWNrYWdlX1+UjBhzdGFibGVfYmFzZWxpbmVzMy5jb21tb26UjAhfX25hbWVfX5SMHnN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi51dGlsc5SMCF9fZmlsZV9flIxIL3Vzci9sb2NhbC9saWIvcHl0aG9uMy43L2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaCB9lH2UKGgXaA6MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgYjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz/JmZmZmZmahZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "system_info": {"OS": "Linux-5.4.188+-x86_64-with-Ubuntu-18.04-bionic #1 SMP Sun Apr 24 10:03:06 PDT 2022", "Python": "3.7.13", "Stable-Baselines3": "1.5.0", "PyTorch": "1.11.0+cu113", "GPU Enabled": "True", "Numpy": "1.21.6", "Gym": "0.17.3"}}
 
1
+ {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gASVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param sde_net_arch: Network architecture for extracting features\n when using gSDE. If None, the latent features from the policy will be used.\n Pass an empty list to use the states as features.\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7f4cb2065a70>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f4cb2065b00>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f4cb2065b90>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f4cb2065c20>", "_build": "<function ActorCriticPolicy._build at 0x7f4cb2065cb0>", "forward": "<function ActorCriticPolicy.forward at 0x7f4cb2065d40>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f4cb2065dd0>", "_predict": "<function ActorCriticPolicy._predict at 0x7f4cb2065e60>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f4cb2065ef0>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f4cb2065f80>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f4cb206b050>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc_data object at 0x7f4cb20b39c0>"}, "verbose": 1, "policy_kwargs": {}, "observation_space": {":type:": "<class 'gym.spaces.box.Box'>", ":serialized:": "gASVwwEAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMA2xvd5SMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMDF9yZWNvbnN0cnVjdJSTlGgGjAduZGFycmF5lJOUSwCFlEMBYpSHlFKUKEsBSwiFlGgKiUMgAACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP+UdJRijARoaWdolGgQaBJLAIWUaBSHlFKUKEsBSwiFlGgKiUMgAACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH+UdJRijA1ib3VuZGVkX2JlbG93lGgQaBJLAIWUaBSHlFKUKEsBSwiFlGgHjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiiUMIAAAAAAAAAACUdJRijA1ib3VuZGVkX2Fib3ZllGgQaBJLAIWUaBSHlFKUKEsBSwiFlGgoiUMIAAAAAAAAAACUdJRijApfbnBfcmFuZG9tlE6MBl9zaGFwZZRLCIWUdWIu", "dtype": "float32", "low": "[-inf -inf -inf -inf -inf -inf -inf -inf]", "high": "[inf inf inf inf inf inf inf inf]", "bounded_below": "[False False False False False False False False]", "bounded_above": "[False False False False False False False False]", "_np_random": null, "_shape": [8]}, "action_space": {":type:": "<class 'gym.spaces.discrete.Discrete'>", ":serialized:": "gASViAAAAAAAAACME2d5bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpRLBIwFZHR5cGWUjAVudW1weZSMBWR0eXBllJOUjAJpOJSJiIeUUpQoSwOMATyUTk5OSv////9K/////0sAdJRijApfbnBfcmFuZG9tlE6MBl9zaGFwZZQpdWIu", "n": 4, "dtype": "int64", "_np_random": null, "_shape": []}, "n_envs": 16, "num_timesteps": 524288, "_total_timesteps": 500000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1657002407.1366575, "learning_rate": 0.0003, "tensorboard_log": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gASVvwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwNX2J1aWx0aW5fdHlwZZSTlIwKTGFtYmRhVHlwZZSFlFKUKGgCjAhDb2RlVHlwZZSFlFKUKEsBSwBLAUsBSxNDBIgAUwCUToWUKYwBX5SFlIxIL3Vzci9sb2NhbC9saWIvcHl0aG9uMy43L2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5RLgEMCAAGUjAN2YWyUhZQpdJRSlH2UKIwLX19wYWNrYWdlX1+UjBhzdGFibGVfYmFzZWxpbmVzMy5jb21tb26UjAhfX25hbWVfX5SMHnN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi51dGlsc5SMCF9fZmlsZV9flIxIL3Vzci9sb2NhbC9saWIvcHl0aG9uMy43L2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaCB9lH2UKGgXaA6MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgYjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz8zqSowVTJhhZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gASVjQIAAAAAAACMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMDF9yZWNvbnN0cnVjdJSTlIwFbnVtcHmUjAduZGFycmF5lJOUSwCFlEMBYpSHlFKUKEsBSxBLCIaUaAOMBWR0eXBllJOUjAJmNJSJiIeUUpQoSwOMATyUTk5OSv////9K/////0sAdJRiiUIAAgAARoQgvlyLNbrLFAa3s+2CMae6sLp6exk2AACAPwAAgD+m3X2+HPKlPgP1j7swJGO+ovymOo49CTsAAAAAAAAAAIBzXj5PVwi84JUlu28A1TjDlH29YVBGOgAAgD8AAIA/ZpKqPPYceroUVBS2r0+UsEZPvjpICjk1AACAPwAAgD8A/A68e+KEuvZPbzm8sLI0boPMOj06iLgAAIA/AACAP1osIb6ukos7UoMqPN9cELrHqy+9J2ACOwAAgD8AAIA/DQmmPmEP3bxgFsq3/m8cNtIqEr4PMAU3AACAPwAAgD8z0jq+2+HNvLLoAr68Eam8J+80PurTgj0AAIA/AACAP+YUeD6xmJI/eN4UP05YBr//PFw+po3mPQAAAAAAAAAANniFPlSYkD8d3vM+KkzWvg+hHj4ppAM+AAAAAAAAAAAaVHa9wyVtukHcNDtQAbE2dE0oO/PRTLoAAIA/AACAP/1wjj7uVd68CO0zu6MlrDkF/EO+kJVhOgAAgD8AAIA/1i+Avj26KrmauhS8RVVhPL0+sLt2xxW8AACAPwAAgD998pe+SDyZvEMzp7q/r+u4nbADPkEAxTkAAIA/AACAP03SSL3DgWK6odMhOXcIgDTE5ck6xws3uAAAgD8AAIA/AOCBu4UbsbmqpDU8XRr9uBQv7jtgDPe3AACAPwAAgD+UdJRiLg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gASVmAAAAAAAAACMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMDF9yZWNvbnN0cnVjdJSTlIwFbnVtcHmUjAduZGFycmF5lJOUSwCFlEMBYpSHlFKUKEsBSxCFlGgDjAVkdHlwZZSTlIwCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYolDEAAAAAAAAAAAAAAAAAAAAACUdJRiLg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.04857599999999995, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gASVfBAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMI6e3PRcM8YECUhpRSlIwBbJRN6AOMAXSUR0CN7i8V58jSdX2UKGgGaAloD0MIXyhgOxjIYkCUhpRSlGgVTegDaBZHQI3uTRjSXt11fZQoaAZoCWgPQwhbttYXCaFGwJSGlFKUaBVL22gWR0CN9+lSCOFQdX2UKGgGaAloD0MI14UfnE/1VkCUhpRSlGgVTegDaBZHQI3/kyeqaPV1fZQoaAZoCWgPQwiO5zOg3mFeQJSGlFKUaBVN6ANoFkdAjgEslsxfwHV9lChoBmgJaA9DCC457pQOO15AlIaUUpRoFU3oA2gWR0COEJvw3HaOdX2UKGgGaAloD0MIR1Z+GYzrVkCUhpRSlGgVTegDaBZHQI4VM9yLhrF1fZQoaAZoCWgPQwiIRncQu4xhQJSGlFKUaBVN6ANoFkdAjilUJOWSlnV9lChoBmgJaA9DCAzJycStN11AlIaUUpRoFU3oA2gWR0COKrun/DLsdX2UKGgGaAloD0MI9Ik8SboXW0CUhpRSlGgVTegDaBZHQI44jeO4oZ11fZQoaAZoCWgPQwgktOVciiBfQJSGlFKUaBVN6ANoFkdAjj7eGfwqiHV9lChoBmgJaA9DCAwepn1z0GFAlIaUUpRoFU3oA2gWR0COQgsdT5wgdX2UKGgGaAloD0MI0sYRa/G+XkCUhpRSlGgVTegDaBZHQI5F0AxSHdp1fZQoaAZoCWgPQwjWqfI9I5diQJSGlFKUaBVN6ANoFkdAjkXy6DoQnXV9lChoBmgJaA9DCFDgnXz6lWBAlIaUUpRoFU3oA2gWR0COSSk2P1cudX2UKGgGaAloD0MIYYxIFFpeZECUhpRSlGgVTegDaBZHQI5jmwNb1RN1fZQoaAZoCWgPQwipSltc41pTQJSGlFKUaBVN6ANoFkdAjmP74SHuZ3V9lChoBmgJaA9DCDnQQ20bWl1AlIaUUpRoFU3oA2gWR0COZBbAUL2IdX2UKGgGaAloD0MIaXBbW/h+a0CUhpRSlGgVTTkBaBZHQI5kZ6rvLHN1fZQoaAZoCWgPQwhbsb/snitdQJSGlFKUaBVN6ANoFkdAjmyHYg7o0XV9lChoBmgJaA9DCNzVq8jo5lBAlIaUUpRoFU3oA2gWR0COcsyMUAT7dX2UKGgGaAloD0MIFto5zQItX0CUhpRSlGgVTegDaBZHQI50G5z5oGp1fZQoaAZoCWgPQwghlPdxNCJVQJSGlFKUaBVN6ANoFkdAjoE6VD8cdnV9lChoBmgJaA9DCBL7BFAMEmBAlIaUUpRoFU3oA2gWR0COhThm5DqodX2UKGgGaAloD0MIXB/WG7UrYECUhpRSlGgVTegDaBZHQI6WcIzFdcB1fZQoaAZoCWgPQwgjZ2FPu3ZhQJSGlFKUaBVN6ANoFkdAjpe6TwDvE3V9lChoBmgJaA9DCKfMzTeicUFAlIaUUpRoFUvxaBZHQI6gGEdvKlp1fZQoaAZoCWgPQwjpYz4g0ANhQJSGlFKUaBVN6ANoFkdAjqSc8cMmW3V9lChoBmgJaA9DCH/eVKTC1V5AlIaUUpRoFU3oA2gWR0CPXmyAxzq9dX2UKGgGaAloD0MIFCS2u4cUYUCUhpRSlGgVTegDaBZHQI9lhfQa73B1fZQoaAZoCWgPQwio5JzYQ7BdQJSGlFKUaBVN6ANoFkdAj2Wpy6tknXV9lChoBmgJaA9DCBJPdjOjIVtAlIaUUpRoFU3oA2gWR0CPaRqoIfKZdX2UKGgGaAloD0MIO8JpwQugZUCUhpRSlGgVTSoDaBZHQI9uIA4n4PB1fZQoaAZoCWgPQwhdwqG3+EZxQJSGlFKUaBVN1ANoFkdAj4BpGnXNDHV9lChoBmgJaA9DCP0QGywcHmFAlIaUUpRoFU3oA2gWR0CPgkcf/3nIdX2UKGgGaAloD0MIhJohVRR2XUCUhpRSlGgVTegDaBZHQI+DAIdELIB1fZQoaAZoCWgPQwglICbhQkVeQJSGlFKUaBVN6ANoFkdAj4sl90A93nV9lChoBmgJaA9DCAkaM4n6DGNAlIaUUpRoFU3oA2gWR0CPkZ60IC2ddX2UKGgGaAloD0MIkNyadFvtXECUhpRSlGgVTegDaBZHQI+S8w35vcd1fZQoaAZoCWgPQwhiEi7kkb5nQJSGlFKUaBVNRQJoFkdAj5Vh1LamGnV9lChoBmgJaA9DCL6jxoSYmyXAlIaUUpRoFUvkaBZHQI+YkXSBshx1fZQoaAZoCWgPQwjVB5J3Dr03QJSGlFKUaBVL72gWR0CPmjhlUZNxdX2UKGgGaAloD0MIxhaCHJTMXkCUhpRSlGgVTegDaBZHQI+erfgrH2h1fZQoaAZoCWgPQwiKc9TRcRNdQJSGlFKUaBVN6ANoFkdAj7MkwnH/+HV9lChoBmgJaA9DCPiImBLJNmNAlIaUUpRoFU3oA2gWR0CPtG7K7qY7dX2UKGgGaAloD0MIU1vqIK9sa0CUhpRSlGgVTUADaBZHQI+7e+sYEW91fZQoaAZoCWgPQwhyT1d3rJ9oQJSGlFKUaBVN2wFoFkdAj7u3V9Wp63V9lChoBmgJaA9DCCtqMA3DIl9AlIaUUpRoFU3oA2gWR0CPvLRceKbbdX2UKGgGaAloD0MI/wbt1ccfY0CUhpRSlGgVTegDaBZHQI/G9q+Jxed1fZQoaAZoCWgPQwggXWxaKfRbQJSGlFKUaBVN6ANoFkdAj84Y2jwhGHV9lChoBmgJaA9DCPOPvknTmEJAlIaUUpRoFU3oA2gWR0CP0geHSF4+dX2UKGgGaAloD0MI7Nrebkk0WkCUhpRSlGgVTegDaBZHQI/Xo150KZ51fZQoaAZoCWgPQwi2MXbCSydfQJSGlFKUaBVN6ANoFkdAj+1t7a7EpHV9lChoBmgJaA9DCDBLOzWXJ2JAlIaUUpRoFU3oA2gWR0CQAuoAn2IwdX2UKGgGaAloD0MIHqm+84uaYkCUhpRSlGgVTegDaBZHQJAD1AC4jKR1fZQoaAZoCWgPQwhMx5xn7LlYQJSGlFKUaBVN6ANoFkdAkAWvDDTBqXV9lChoBmgJaA9DCIwv2uMFBGFAlIaUUpRoFU3oA2gWR0CQCByFfzBidX2UKGgGaAloD0MI+3lTkQpxYkCUhpRSlGgVTewCaBZHQJAIt5IH1OF1fZQoaAZoCWgPQwgqUmFsIRpaQJSGlFKUaBVN6ANoFkdAkAlMunMt9XV9lChoBmgJaA9DCNYCe0ykbl5AlIaUUpRoFU3oA2gWR0CQDCASFoL5dX2UKGgGaAloD0MI8pTVdD0icUCUhpRSlGgVTXoDaBZHQJAWaEGqxTt1fZQoaAZoCWgPQwi1xTU+k1taQJSGlFKUaBVN6ANoFkdAkBjUxqO94HV9lChoBmgJaA9DCEWfjzLixGFAlIaUUpRoFU3oA2gWR0CQHPaUiY9gdX2UKGgGaAloD0MIrMq+KwJvYUCUhpRSlGgVTegDaBZHQJAdGZPVNHp1fZQoaAZoCWgPQwhZh6OrdGBiQJSGlFKUaBVN6ANoFkdAkIGYR7JGOXV9lChoBmgJaA9DCFqfckwWR1JAlIaUUpRoFU3oA2gWR0CQhYmjCYTkdX2UKGgGaAloD0MIK4TVWMLAWUCUhpRSlGgVTegDaBZHQJCHmVRk3CN1fZQoaAZoCWgPQwi3RC44A6FhQJSGlFKUaBVN6ANoFkdAkIpv3ai9I3V9lChoBmgJaA9DCIeowp/hC2JAlIaUUpRoFU3oA2gWR0CQlA8KG+K1dX2UKGgGaAloD0MIVAJiEq5cbECUhpRSlGgVTQ4DaBZHQJCVkP3BYV91fZQoaAZoCWgPQwj11VWBWjVeQJSGlFKUaBVN6ANoFkdAkJ37LMcIaHV9lChoBmgJaA9DCLyTT49tOWBAlIaUUpRoFU3oA2gWR0CQnrGmUGFBdX2UKGgGaAloD0MIwha7fVYrYUCUhpRSlGgVTegDaBZHQJCgG2LHdXV1fZQoaAZoCWgPQwgVN24xv35gQJSGlFKUaBVN6ANoFkdAkKJ0RzzVc3V9lChoBmgJaA9DCNP2r6w0NVlAlIaUUpRoFU3oA2gWR0CQouRUm2LHdX2UKGgGaAloD0MICmZMwZp7YUCUhpRSlGgVTegDaBZHQJClQbdadMF1fZQoaAZoCWgPQwgJ/OHnP6dvQJSGlFKUaBVNjgNoFkdAkKrv73wkPnV9lChoBmgJaA9DCM+EJoklu1xAlIaUUpRoFU3oA2gWR0CQrhsyBTXKdX2UKGgGaAloD0MIo+iBj0GEakCUhpRSlGgVTbgDaBZHQJCxBk5IYm91fZQoaAZoCWgPQwgst7QakoJhQJSGlFKUaBVN6ANoFkdAkLOUw35vcnV9lChoBmgJaA9DCBL3WPpQc2RAlIaUUpRoFU3oA2gWR0CQuX1qWToudX2UKGgGaAloD0MIX5Z2aq7Mb0CUhpRSlGgVTRQCaBZHQJC9Dc9GI9F1fZQoaAZoCWgPQwiOeR1xSHlhQJSGlFKUaBVN6ANoFkdAkL1CB9TgmHV9lChoBmgJaA9DCGtgqwSL029AlIaUUpRoFU1RAWgWR0CQviYVqN6xdX2UKGgGaAloD0MIZt0/FqItY0CUhpRSlGgVTegDaBZHQJC+598Z1mt1fZQoaAZoCWgPQwire2Rz1UJfQJSGlFKUaBVN6ANoFkdAkMEjot+TeXV9lChoBmgJaA9DCHe8yW9RX21AlIaUUpRoFU0NA2gWR0CQxzfP5YYBdX2UKGgGaAloD0MIDFwea8ZVYUCUhpRSlGgVTegDaBZHQJDJGt+1Bt11fZQoaAZoCWgPQwh2+kFdpKViQJSGlFKUaBVN6ANoFkdAkMpyJsO5KHV9lChoBmgJaA9DCIBjz55LLW9AlIaUUpRoFU1PAmgWR0CQz1tY0VJudX2UKGgGaAloD0MIdlCJ6xiPYECUhpRSlGgVTegDaBZHQJDR/WI42jx1fZQoaAZoCWgPQwgpdjQO9dlWQJSGlFKUaBVN6ANoFkdAkNaqZ6Uqx3V9lChoBmgJaA9DCMOgTKPJCllAlIaUUpRoFU3oA2gWR0CQ1yr8R+SbdX2UKGgGaAloD0MIGmt/Z3swYUCUhpRSlGgVTegDaBZHQJDZ39zfaYh1fZQoaAZoCWgPQwind/F+3MlsQJSGlFKUaBVNLQJoFkdAkNphGx2SuHV9lChoBmgJaA9DCG5MT1jis0RAlIaUUpRoFUupaBZHQJDgR+w1R+B1fZQoaAZoCWgPQwgFiljEMNVjQJSGlFKUaBVN6ANoFkdAkOO29+PRzHV9lChoBmgJaA9DCM/AyMuab15AlIaUUpRoFU3oA2gWR0CQ6eqoZQ54dX2UKGgGaAloD0MILLgf8EBbZUCUhpRSlGgVTegDaBZHQJDv8F1SwW51fZQoaAZoCWgPQwisGoS53TlrQJSGlFKUaBVNjQNoFkdAkPBN/SYw7HVlLg=="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gASVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 160, "n_steps": 2048, "gamma": 0.99, "gae_lambda": 0.95, "ent_coef": 0.0, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 10, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gASVvwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwNX2J1aWx0aW5fdHlwZZSTlIwKTGFtYmRhVHlwZZSFlFKUKGgCjAhDb2RlVHlwZZSFlFKUKEsBSwBLAUsBSxNDBIgAUwCUToWUKYwBX5SFlIxIL3Vzci9sb2NhbC9saWIvcHl0aG9uMy43L2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5RLgEMCAAGUjAN2YWyUhZQpdJRSlH2UKIwLX19wYWNrYWdlX1+UjBhzdGFibGVfYmFzZWxpbmVzMy5jb21tb26UjAhfX25hbWVfX5SMHnN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi51dGlsc5SMCF9fZmlsZV9flIxIL3Vzci9sb2NhbC9saWIvcHl0aG9uMy43L2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaCB9lH2UKGgXaA6MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgYjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz/JmZmZmZmahZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "system_info": {"OS": "Linux-5.4.188+-x86_64-with-Ubuntu-18.04-bionic #1 SMP Sun Apr 24 10:03:06 PDT 2022", "Python": "3.7.13", "Stable-Baselines3": "1.5.0", "PyTorch": "1.11.0+cu113", "GPU Enabled": "True", "Numpy": "1.21.6", "Gym": "0.21.0"}}
replay.mp4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3d6d4f1396b65317858d5dab9d98c94fe14a2e76d4e81f1b85145b634d366402
3
+ size 251903
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 243.05235571912232, "std_reward": 31.891818431414098, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2022-07-05T06:56:00.705444"}
 
1
+ {"mean_reward": 177.1553372533766, "std_reward": 93.22658712619601, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2022-07-05T07:22:10.439877"}