bguan commited on
Commit
ee17131
1 Parent(s): 5498d2e

bguan's lunar lander model #3 using PPO trained for 1M timesteps

Browse files
README.md CHANGED
@@ -10,7 +10,7 @@ model-index:
10
  results:
11
  - metrics:
12
  - type: mean_reward
13
- value: 218.48 +/- 23.54
14
  name: mean_reward
15
  task:
16
  type: reinforcement-learning
 
10
  results:
11
  - metrics:
12
  - type: mean_reward
13
+ value: 224.76 +/- 21.41
14
  name: mean_reward
15
  task:
16
  type: reinforcement-learning
bguan_ppo_lunarlander3.zip ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:af035aa09ec8ff55701233d45866426ddce2893049c2ea57fcf30f26309d3131
3
+ size 144114
bguan_ppo_lunarlander3/_stable_baselines3_version ADDED
@@ -0,0 +1 @@
 
 
1
+ 1.5.0
bguan_ppo_lunarlander3/data ADDED
@@ -0,0 +1,94 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "policy_class": {
3
+ ":type:": "<class 'abc.ABCMeta'>",
4
+ ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
5
+ "__module__": "stable_baselines3.common.policies",
6
+ "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param sde_net_arch: Network architecture for extracting features\n when using gSDE. If None, the latent features from the policy will be used.\n Pass an empty list to use the states as features.\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
7
+ "__init__": "<function ActorCriticPolicy.__init__ at 0x7f2104204f80>",
8
+ "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f210420b050>",
9
+ "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f210420b0e0>",
10
+ "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f210420b170>",
11
+ "_build": "<function ActorCriticPolicy._build at 0x7f210420b200>",
12
+ "forward": "<function ActorCriticPolicy.forward at 0x7f210420b290>",
13
+ "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f210420b320>",
14
+ "_predict": "<function ActorCriticPolicy._predict at 0x7f210420b3b0>",
15
+ "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f210420b440>",
16
+ "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f210420b4d0>",
17
+ "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f210420b560>",
18
+ "__abstractmethods__": "frozenset()",
19
+ "_abc_impl": "<_abc_data object at 0x7f2104261180>"
20
+ },
21
+ "verbose": 0,
22
+ "policy_kwargs": {},
23
+ "observation_space": {
24
+ ":type:": "<class 'gym.spaces.box.Box'>",
25
+ ":serialized:": "gAWVnwEAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLCIWUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWIAAAAAAAAAAAAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/5RoCksIhZSMAUOUdJRSlIwEaGlnaJRoEiiWIAAAAAAAAAAAAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAf5RoCksIhZRoFXSUUpSMDWJvdW5kZWRfYmVsb3eUaBIolggAAAAAAAAAAAAAAAAAAACUaAeMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLCIWUaBV0lFKUjA1ib3VuZGVkX2Fib3ZllGgSKJYIAAAAAAAAAAAAAAAAAAAAlGghSwiFlGgVdJRSlIwKX25wX3JhbmRvbZROdWIu",
26
+ "dtype": "float32",
27
+ "_shape": [
28
+ 8
29
+ ],
30
+ "low": "[-inf -inf -inf -inf -inf -inf -inf -inf]",
31
+ "high": "[inf inf inf inf inf inf inf inf]",
32
+ "bounded_below": "[False False False False False False False False]",
33
+ "bounded_above": "[False False False False False False False False]",
34
+ "_np_random": null
35
+ },
36
+ "action_space": {
37
+ ":type:": "<class 'gym.spaces.discrete.Discrete'>",
38
+ ":serialized:": "gAWVggAAAAAAAACME2d5bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpRLBIwGX3NoYXBllCmMBWR0eXBllIwFbnVtcHmUaAeTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYowKX25wX3JhbmRvbZROdWIu",
39
+ "n": 4,
40
+ "_shape": [],
41
+ "dtype": "int64",
42
+ "_np_random": null
43
+ },
44
+ "n_envs": 16,
45
+ "num_timesteps": 1015808,
46
+ "_total_timesteps": 1000000,
47
+ "_num_timesteps_at_start": 0,
48
+ "seed": null,
49
+ "action_noise": null,
50
+ "start_time": 1652076178.4782536,
51
+ "learning_rate": 0.0001,
52
+ "tensorboard_log": null,
53
+ "lr_schedule": {
54
+ ":type:": "<class 'function'>",
55
+ ":serialized:": "gAWVvwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwNX2J1aWx0aW5fdHlwZZSTlIwKTGFtYmRhVHlwZZSFlFKUKGgCjAhDb2RlVHlwZZSFlFKUKEsBSwBLAUsBSxNDBIgAUwCUToWUKYwBX5SFlIxIL3Vzci9sb2NhbC9saWIvcHl0aG9uMy43L2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5RLgEMCAAGUjAN2YWyUhZQpdJRSlH2UKIwLX19wYWNrYWdlX1+UjBhzdGFibGVfYmFzZWxpbmVzMy5jb21tb26UjAhfX25hbWVfX5SMHnN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi51dGlsc5SMCF9fZmlsZV9flIxIL3Vzci9sb2NhbC9saWIvcHl0aG9uMy43L2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaCB9lH2UKGgXaA6MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgYjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz8aNuLrHEMthZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"
56
+ },
57
+ "_last_obs": {
58
+ ":type:": "<class 'numpy.ndarray'>",
59
+ ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAGaTsL0phDu64rL3Od9O9LXxeHE7urgOuQAAgD8AAIA/M9MuvCn4A7oxmqC6dS2ZtbSRsDlsvbo5AACAPwAAgD9DUpA+PMGLPxkjFb67kpG+OU1IPbsUV74AAAAAAAAAAM0fkTxSAN25ViYXuLc7+7Lh4Ei7A+s1NwAAgD8AAIA/5rb9PbiWwjrqtj69ZbaNu54HjTw9n3u8AACAPwAAgD+akTI7uF6gOP5wAzsSyGu2iuOBu/QwG7oAAIA/AACAPw1Z4L3hVpG6R9KkuxxvDzk0Wjg7a94wOgAAgD8AAIA/2pDCvaGzDj/YC/k8ci6FvnMFnrvopLO9AAAAAAAAAABT9Au+/DCRP6EEwr1C53a+HZYNvsZwh7wAAAAAAAAAAKbFnr3h2tO47lKrutofbjVKUsq7+N/KOQAAgD8AAIA/APlQvVLQyrku9Nc6sQHUNTn5cDnqd/u5AACAPwAAgD/Ni0i+NhkfP3fyoL0t3Ga+XojlvW2uar0AAAAAAAAAAJpT6zzhmKO6G08jOfETGjRyNSm6rNw7uAAAgD8AAIA/M3zLPHten7qdk8k5TAsNNaUirTprdua4AACAPwAAgD8AYzm915pTu9mAIjzirYA85Hp8PD1RXr0AAIA/AACAP2bZ1Ly4Foq51livOxcIpzf9YpA7d5OxugAAgD8AAIA/lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="
60
+ },
61
+ "_last_episode_starts": {
62
+ ":type:": "<class 'numpy.ndarray'>",
63
+ ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="
64
+ },
65
+ "_last_original_obs": null,
66
+ "_episode_num": 0,
67
+ "use_sde": false,
68
+ "sde_sample_freq": -1,
69
+ "_current_progress_remaining": -0.015808000000000044,
70
+ "ep_info_buffer": {
71
+ ":type:": "<class 'collections.deque'>",
72
+ ":serialized:": "gAWVfxAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMI8kOlETNbMECUhpRSlIwBbJRL54wBdJRHQKi2QOH31z11fZQoaAZoCWgPQwilSSno9v1jQJSGlFKUaBVN6ANoFkdAqL0JBPbfxnV9lChoBmgJaA9DCPTdrSxRympAlIaUUpRoFU2zA2gWR0Covv4mTkhidX2UKGgGaAloD0MIs0P8w5boX0CUhpRSlGgVTegDaBZHQKi/ySf16E91fZQoaAZoCWgPQwj3d7ZHb8RhQJSGlFKUaBVN6ANoFkdAqMDHyoXKsHV9lChoBmgJaA9DCGB2Tx4WDmJAlIaUUpRoFU3oA2gWR0CoxX+JgsshdX2UKGgGaAloD0MIXkccsoF5YkCUhpRSlGgVTegDaBZHQKjHvAt4A0d1fZQoaAZoCWgPQwioGOdvQsFZQJSGlFKUaBVN6ANoFkdAqMuKuIRAbHV9lChoBmgJaA9DCI83+S26iWNAlIaUUpRoFU3oA2gWR0CozGcsMAmzdX2UKGgGaAloD0MIknpP5bQ/IECUhpRSlGgVTR8BaBZHQKjMyaFVT751fZQoaAZoCWgPQwhCsoAJ3B5ZQJSGlFKUaBVN6ANoFkdAqM2LM/yGz3V9lChoBmgJaA9DCPvOL0rQIVhAlIaUUpRoFU3oA2gWR0CozkaNuLrHdX2UKGgGaAloD0MIXb9gN+x8YkCUhpRSlGgVTegDaBZHQKjPoQXAM2F1fZQoaAZoCWgPQwg2kC42rf1YQJSGlFKUaBVN6ANoFkdAqNBmfwqiGnV9lChoBmgJaA9DCM1Zn3JMaEBAlIaUUpRoFU0nAWgWR0Co0Qb6pHZsdX2UKGgGaAloD0MIns4VpQTwYECUhpRSlGgVTegDaBZHQKjTGejmCAd1fZQoaAZoCWgPQwjIKM+8HLFiQJSGlFKUaBVN6ANoFkdAqNNoUahpQHV9lChoBmgJaA9DCNVamIV2x1pAlIaUUpRoFU3oA2gWR0Co8yQ3gk1NdX2UKGgGaAloD0MIecn/5O8dYkCUhpRSlGgVTegDaBZHQKj6qhQm/nJ1fZQoaAZoCWgPQwi/1TpxuX9sQJSGlFKUaBVNzwFoFkdAqP7dZ3cHnnV9lChoBmgJaA9DCOViDKzjdlhAlIaUUpRoFU3oA2gWR0CpAYxqfvnbdX2UKGgGaAloD0MIysNCrWkQWUCUhpRSlGgVTegDaBZHQKkDUsZHd451fZQoaAZoCWgPQwhvDWyV4O1jQJSGlFKUaBVN6ANoFkdAqQQDvG6wuHV9lChoBmgJaA9DCDuJCP+iFmNAlIaUUpRoFU3oA2gWR0CpCwzw2ETQdX2UKGgGaAloD0MIGcbdIFo/X0CUhpRSlGgVTegDaBZHQKkO1jXnQpp1fZQoaAZoCWgPQwhtPNhit/1eQJSGlFKUaBVN6ANoFkdAqQ+4Nb1RL3V9lChoBmgJaA9DCHriOVtAPGBAlIaUUpRoFU3oA2gWR0CpEBsb3oLYdX2UKGgGaAloD0MIGjbK+s21X0CUhpRSlGgVTegDaBZHQKkQ4D/VAiV1fZQoaAZoCWgPQwjvWddoOfBcQJSGlFKUaBVN6ANoFkdAqRGcxASnL3V9lChoBmgJaA9DCP/r3LQZRWVAlIaUUpRoFU3oA2gWR0CpEwcPWhAXdX2UKGgGaAloD0MIlBPtKiR2YkCUhpRSlGgVTegDaBZHQKkUX9AHE/B1fZQoaAZoCWgPQwjFA8qm3ANjQJSGlFKUaBVN6ANoFkdAqRZ02itaIXV9lChoBmgJaA9DCOmY84z9DmRAlIaUUpRoFU3oA2gWR0CpFsM/yGzsdX2UKGgGaAloD0MIu9Bcp5FYYECUhpRSlGgVTegDaBZHQKk2ii0v4/N1fZQoaAZoCWgPQwhEMA4unTVkQJSGlFKUaBVN6ANoFkdAqT7KJVKf4HV9lChoBmgJaA9DCKPIWkOpCWRAlIaUUpRoFU3oA2gWR0CpQxUPH1e0dX2UKGgGaAloD0MIG0ZB8Pj/Y0CUhpRSlGgVTegDaBZHQKlFx9aUzKt1fZQoaAZoCWgPQwjFcHUARMFhQJSGlFKUaBVN6ANoFkdAqUep3os7MnV9lChoBmgJaA9DCLCtn/6z5F9AlIaUUpRoFU3oA2gWR0CpSGga3qiXdX2UKGgGaAloD0MIdo2WAz0RYECUhpRSlGgVTegDaBZHQKlQWih37k51fZQoaAZoCWgPQwhtyD8ziERhQJSGlFKUaBVN6ANoFkdAqVSXx2B8QnV9lChoBmgJaA9DCEijAifbRl9AlIaUUpRoFU3oA2gWR0CpVY8ry1/ldX2UKGgGaAloD0MIAyMva2IpYUCUhpRSlGgVTegDaBZHQKlV/BkZrHl1fZQoaAZoCWgPQwgfn5CdNwNhQJSGlFKUaBVN6ANoFkdAqVbWoJiRXHV9lChoBmgJaA9DCC4AjdKl+mBAlIaUUpRoFU3oA2gWR0CpV6RLsa86dX2UKGgGaAloD0MIbt44KczgYUCUhpRSlGgVTegDaBZHQKlZGoBJZnt1fZQoaAZoCWgPQwhJEoQrIKRnQJSGlFKUaBVN6ANoFkdAqVqeMXJo03V9lChoBmgJaA9DCIP4wI7/W2NAlIaUUpRoFU3oA2gWR0CpXN1UdaMadX2UKGgGaAloD0MIWeArunVpYkCUhpRSlGgVTegDaBZHQKldLADaGpN1fZQoaAZoCWgPQwj0MR8Q6OhkQJSGlFKUaBVN6ANoFkdAqWCMA5q/NHV9lChoBmgJaA9DCLr0L0nlamJAlIaUUpRoFU3oA2gWR0CphD6JqIrOdX2UKGgGaAloD0MIfh6jPPN2XECUhpRSlGgVTegDaBZHQKmIR0dzXBh1fZQoaAZoCWgPQwjAkqtY/PBWQJSGlFKUaBVN6ANoFkdAqYsKmwaBJHV9lChoBmgJaA9DCN21hHzQsmFAlIaUUpRoFU3oA2gWR0CpjOv4ubqhdX2UKGgGaAloD0MIEalpF9P9YECUhpRSlGgVTegDaBZHQKmNp+VC5Vh1fZQoaAZoCWgPQwhnSBXFq8pjQJSGlFKUaBVN6ANoFkdAqZWJdGAkLXV9lChoBmgJaA9DCHctIR/0qkVAlIaUUpRoFUvoaBZHQKmXgNH6Mzd1fZQoaAZoCWgPQwjkDwaeezNfQJSGlFKUaBVN6ANoFkdAqZmxgeA/cHV9lChoBmgJaA9DCGqjOh3IvlxAlIaUUpRoFU3oA2gWR0Cpmp+yquKXdX2UKGgGaAloD0MIhel7DcG5YECUhpRSlGgVTegDaBZHQKmbCIUrTYx1fZQoaAZoCWgPQwgRV87eGVNhQJSGlFKUaBVN6ANoFkdAqZvOeMAFPnV9lChoBmgJaA9DCBztuOF3bmNAlIaUUpRoFU3oA2gWR0CpnITUI9kjdX2UKGgGaAloD0MIGjVfJR8IWkCUhpRSlGgVTegDaBZHQKmd6H58BuJ1fZQoaAZoCWgPQwgGZK93f1BcQJSGlFKUaBVN6ANoFkdAqZ9Sj1wo9nV9lChoBmgJaA9DCNuGURA8Q2NAlIaUUpRoFU3oA2gWR0CpoXyThYNidX2UKGgGaAloD0MIh6QWSia8YkCUhpRSlGgVTegDaBZHQKmh0ZYxL011fZQoaAZoCWgPQwhGDDuMSdtfQJSGlFKUaBVN6ANoFkdAqaWT2QGOdXV9lChoBmgJaA9DCEVkWMUbFTBAlIaUUpRoFU0cAWgWR0CpxwOivgWKdX2UKGgGaAloD0MIFLAdjFgOYECUhpRSlGgVTegDaBZHQKnJ4nFYMfB1fZQoaAZoCWgPQwiKdhVSfvxiQJSGlFKUaBVN6ANoFkdAqc435DZ13nV9lChoBmgJaA9DCMPwETGlmmNAlIaUUpRoFU3oA2gWR0Cp0OGmce8xdX2UKGgGaAloD0MIGLX7VQBfZ0CUhpRSlGgVTegDaBZHQKnSkbExZdR1fZQoaAZoCWgPQwgwKT4+oQBgQJSGlFKUaBVN6ANoFkdAqdrVZFG5MHV9lChoBmgJaA9DCDHO34RCemJAlIaUUpRoFU3oA2gWR0Cp3JV8Ti84dX2UKGgGaAloD0MIpS2u8RkxYUCUhpRSlGgVTegDaBZHQKneklQ/HHZ1fZQoaAZoCWgPQwgOMsnIWUJkQJSGlFKUaBVN6ANoFkdAqd9rUwztTnV9lChoBmgJaA9DCNj0oKAU6mJAlIaUUpRoFU3oA2gWR0Cp38E0BOpLdX2UKGgGaAloD0MIclDCTNvOZUCUhpRSlGgVTegDaBZHQKngdEgntv51fZQoaAZoCWgPQwjuztptF9VkQJSGlFKUaBVN6ANoFkdAqeEsedTYNHV9lChoBmgJaA9DCE4LXvQVBmRAlIaUUpRoFU3oA2gWR0Cp4oh6By0bdX2UKGgGaAloD0MI0LhwICSiZUCUhpRSlGgVTegDaBZHQKnmMd+Xqqx1fZQoaAZoCWgPQwibdjHNdFJlQJSGlFKUaBVN6ANoFkdAqeaFUsFt9HV9lChoBmgJaA9DCOaw+47hSTFAlIaUUpRoFU0dAWgWR0Cp6WrRrrPddX2UKGgGaAloD0MICRnIs0vbYUCUhpRSlGgVTegDaBZHQKnpwlP8AJd1fZQoaAZoCWgPQwjAIypUt2BlQJSGlFKUaBVN6ANoFkdAqgpO1D0Dl3V9lChoBmgJaA9DCBVUVP1KL2JAlIaUUpRoFU3oA2gWR0CqDMHpjc2zdX2UKGgGaAloD0MIp7OTwVGMXUCUhpRSlGgVTegDaBZHQKoQjj4Hoox1fZQoaAZoCWgPQwhr8SkAxmVcQJSGlFKUaBVN6ANoFkdAqhMPQdCE6HV9lChoBmgJaA9DCOVC5V/LAWNAlIaUUpRoFU3oA2gWR0CqFMyH/LkkdX2UKGgGaAloD0MI0jk/xfGVYkCUhpRSlGgVTegDaBZHQKodV5ckdFR1fZQoaAZoCWgPQwh2bATi9XdlQJSGlFKUaBVN6ANoFkdAqh8qbc45tHV9lChoBmgJaA9DCFfQtMTKR11AlIaUUpRoFU3oA2gWR0CqIUyXUpd9dX2UKGgGaAloD0MI6BVPPVJTYUCUhpRSlGgVTegDaBZHQKoijGSZBs11fZQoaAZoCWgPQwgVViqoqPBdQJSGlFKUaBVN6ANoFkdAqiNNt65Xl3V9lChoBmgJaA9DCDvGFRdHyGNAlIaUUpRoFU3oA2gWR0CqJAJGnXNDdX2UKGgGaAloD0MIhxdEpKYMX0CUhpRSlGgVTegDaBZHQKolYapgkTp1fZQoaAZoCWgPQwgurBvvDk1iQJSGlFKUaBVN6ANoFkdAqij+/pMYdnV9lChoBmgJaA9DCJg0Ruuoq2JAlIaUUpRoFU3oA2gWR0CqKVBib2DhdX2UKGgGaAloD0MI1xNdF/4OY0CUhpRSlGgVTegDaBZHQKosWs4DLbJ1fZQoaAZoCWgPQwhDklm9w1FiQJSGlFKUaBVN6ANoFkdAqiyumR/3FnVlLg=="
73
+ },
74
+ "ep_success_buffer": {
75
+ ":type:": "<class 'collections.deque'>",
76
+ ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
77
+ },
78
+ "_n_updates": 496,
79
+ "n_steps": 1024,
80
+ "gamma": 0.999,
81
+ "gae_lambda": 0.98,
82
+ "ent_coef": 0.01,
83
+ "vf_coef": 0.5,
84
+ "max_grad_norm": 0.5,
85
+ "batch_size": 64,
86
+ "n_epochs": 8,
87
+ "clip_range": {
88
+ ":type:": "<class 'function'>",
89
+ ":serialized:": "gAWVvwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwNX2J1aWx0aW5fdHlwZZSTlIwKTGFtYmRhVHlwZZSFlFKUKGgCjAhDb2RlVHlwZZSFlFKUKEsBSwBLAUsBSxNDBIgAUwCUToWUKYwBX5SFlIxIL3Vzci9sb2NhbC9saWIvcHl0aG9uMy43L2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5RLgEMCAAGUjAN2YWyUhZQpdJRSlH2UKIwLX19wYWNrYWdlX1+UjBhzdGFibGVfYmFzZWxpbmVzMy5jb21tb26UjAhfX25hbWVfX5SMHnN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi51dGlsc5SMCF9fZmlsZV9flIxIL3Vzci9sb2NhbC9saWIvcHl0aG9uMy43L2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaCB9lH2UKGgXaA6MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgYjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz/JmZmZmZmahZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"
90
+ },
91
+ "clip_range_vf": null,
92
+ "normalize_advantage": true,
93
+ "target_kl": null
94
+ }
bguan_ppo_lunarlander3/policy.optimizer.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:04fbd786ec7bc091e546a5596e680d325e045710a0cb0392066a4e32191dcc83
3
+ size 84893
bguan_ppo_lunarlander3/policy.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fccae5586b9506f6362d2faa640c545e81301e42cd3d50dba863189121dae996
3
+ size 43201
bguan_ppo_lunarlander3/pytorch_variables.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d030ad8db708280fcae77d87e973102039acd23a11bdecc3db8eb6c0ac940ee1
3
+ size 431
bguan_ppo_lunarlander3/system_info.txt ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ OS: Linux-5.4.188+-x86_64-with-Ubuntu-18.04-bionic #1 SMP Sun Apr 24 10:03:06 PDT 2022
2
+ Python: 3.7.13
3
+ Stable-Baselines3: 1.5.0
4
+ PyTorch: 1.11.0+cu113
5
+ GPU Enabled: True
6
+ Numpy: 1.21.6
7
+ Gym: 0.21.0
config.json CHANGED
@@ -1 +1 @@
1
- {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param sde_net_arch: Network architecture for extracting features\n when using gSDE. If None, the latent features from the policy will be used.\n Pass an empty list to use the states as features.\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7fe3b71a5dd0>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7fe3b71a5e60>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7fe3b71a5ef0>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7fe3b71a5f80>", "_build": "<function ActorCriticPolicy._build at 0x7fe3b7129050>", "forward": "<function ActorCriticPolicy.forward at 0x7fe3b71290e0>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7fe3b7129170>", "_predict": "<function ActorCriticPolicy._predict at 0x7fe3b7129200>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7fe3b7129290>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7fe3b7129320>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7fe3b71293b0>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc_data object at 0x7fe3b7174a20>"}, "verbose": 0, "policy_kwargs": {}, "observation_space": {":type:": "<class 'gym.spaces.box.Box'>", ":serialized:": "gAWVnwEAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLCIWUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWIAAAAAAAAAAAAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/5RoCksIhZSMAUOUdJRSlIwEaGlnaJRoEiiWIAAAAAAAAAAAAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAf5RoCksIhZRoFXSUUpSMDWJvdW5kZWRfYmVsb3eUaBIolggAAAAAAAAAAAAAAAAAAACUaAeMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLCIWUaBV0lFKUjA1ib3VuZGVkX2Fib3ZllGgSKJYIAAAAAAAAAAAAAAAAAAAAlGghSwiFlGgVdJRSlIwKX25wX3JhbmRvbZROdWIu", "dtype": "float32", "_shape": [8], "low": "[-inf -inf -inf -inf -inf -inf -inf -inf]", "high": "[inf inf inf inf inf inf inf inf]", "bounded_below": "[False False False False False False False False]", "bounded_above": "[False False False False False False False False]", "_np_random": null}, "action_space": {":type:": "<class 'gym.spaces.discrete.Discrete'>", ":serialized:": "gAWVggAAAAAAAACME2d5bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpRLBIwGX3NoYXBllCmMBWR0eXBllIwFbnVtcHmUaAeTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYowKX25wX3JhbmRvbZROdWIu", "n": 4, "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 16, "num_timesteps": 507904, "_total_timesteps": 500000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1652055111.0983326, "learning_rate": 0.0003, "tensorboard_log": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVvwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwNX2J1aWx0aW5fdHlwZZSTlIwKTGFtYmRhVHlwZZSFlFKUKGgCjAhDb2RlVHlwZZSFlFKUKEsBSwBLAUsBSxNDBIgAUwCUToWUKYwBX5SFlIxIL3Vzci9sb2NhbC9saWIvcHl0aG9uMy43L2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5RLgEMCAAGUjAN2YWyUhZQpdJRSlH2UKIwLX19wYWNrYWdlX1+UjBhzdGFibGVfYmFzZWxpbmVzMy5jb21tb26UjAhfX25hbWVfX5SMHnN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi51dGlsc5SMCF9fZmlsZV9flIxIL3Vzci9sb2NhbC9saWIvcHl0aG9uMy43L2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaCB9lH2UKGgXaA6MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgYjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz8zqSowVTJhhZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAICsVL1cZzu63RVfvBvIZ7zUptw7vO9GPQAAgD8AAIA/Jpi9PUgHobodC8W68S+vtXL83DhVK+M5AACAPwAAgD8zL+29nf5gPlEJIr0VGTy+NlT9u6p+dz0AAAAAAAAAAA1+uj36XR8/uCp8PTW2or7H13w9LQjUPQAAAAAAAAAA+qYmvq63mTkiOJu6smnMNmogC7y6wrU5AACAPwAAgD/zT7w9txwfP1o0WL3H9aC+CqfeO28/R70AAAAAAAAAAADpJr2PEjq69ZZYujdgTrUA9Q877mCAOQAAgD8AAIA/gAmdPUg7l7rtyDW6vCcwtYEG4TrVSFI5AACAPwAAgD8WeZ8+F/NaP9YYqz7m0c++ssqcPvNdLT4AAAAAAAAAAOa+OT7kRoE//t8dPhLWxr7d0M0+gZ8IPQAAAAAAAAAAZhEfvQkUQD9q7Rq9KnV2vq7oszxDLaO9AAAAAAAAAABm2Bm87LGbuWY1uDtpwDk41GDyuuFAiLoAAIA/AACAP1r/fr5FNmA/9iP0vebozr5VvV6+6NUGPgAAAAAAAAAAzeoBvSk8ULq6uQe6MFoGtlIBFbv13hs5AACAPwAAgD8Aji89n620u+CYFzw1XnA8e5QdvYpYTT0AAIA/AACAP2aF4Lz2vHa6Ct5OOy61YTh+iDy7MoP4uQAAgD8AAIA/lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.015808000000000044, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVbxAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIpZ4FobwlSkCUhpRSlIwBbJRL7owBdJRHQHoYF2aDwph1fZQoaAZoCWgPQwiwWMNF7vFcQJSGlFKUaBVN6ANoFkdAehwYeT3Zf3V9lChoBmgJaA9DCJZ7gVmhNDFAlIaUUpRoFU0BAWgWR0B6MUHjZL7GdX2UKGgGaAloD0MIDOpb5vTbYECUhpRSlGgVTegDaBZHQHo/PdEb5uZ1fZQoaAZoCWgPQwjYKOs3E8JdQJSGlFKUaBVN6ANoFkdAekRmdy1eB3V9lChoBmgJaA9DCO9VKxN+jWBAlIaUUpRoFU3oA2gWR0B6RgpI+W4WdX2UKGgGaAloD0MIcM6I0l4RYUCUhpRSlGgVTegDaBZHQHplQ+t8uz11fZQoaAZoCWgPQwh4KuCe5xJhQJSGlFKUaBVN6ANoFkdAemrlJYkmhXV9lChoBmgJaA9DCIm2Y+ouB2FAlIaUUpRoFU3oA2gWR0B6dHPrv9cbdX2UKGgGaAloD0MIoOHNGrwHPkCUhpRSlGgVTQgBaBZHQHqBhf4REnd1fZQoaAZoCWgPQwizzvi+uNgxQJSGlFKUaBVL4mgWR0B6nNJUYKpldX2UKGgGaAloD0MIWksBaf8lZECUhpRSlGgVTegDaBZHQHqhf5P/JeV1fZQoaAZoCWgPQwje/8cJE8NiQJSGlFKUaBVN6ANoFkdAeqmDBMzuW3V9lChoBmgJaA9DCJ92+Guyr15AlIaUUpRoFU3oA2gWR0B6r5+vyLAIdX2UKGgGaAloD0MIW5caoZ/ZJcCUhpRSlGgVTQUBaBZHQHq1ULMLWqd1fZQoaAZoCWgPQwh1P6cgP4NfQJSGlFKUaBVN6ANoFkdAerwMqBmPHXV9lChoBmgJaA9DCN5YUBgU+GNAlIaUUpRoFU3oA2gWR0B60pTvRZ2ZdX2UKGgGaAloD0MIM8SxLm7lQ0CUhpRSlGgVS9loFkdAetOy6cy31HV9lChoBmgJaA9DCAmocASphFpAlIaUUpRoFU3oA2gWR0B69TOPeYUndX2UKGgGaAloD0MICHJQwkw+Y0CUhpRSlGgVTegDaBZHQHtEWFajesR1fZQoaAZoCWgPQwhTBg5o6SFmQJSGlFKUaBVN6ANoFkdAe0ihRZU1h3V9lChoBmgJaA9DCPXVVYHaKGFAlIaUUpRoFU3oA2gWR0B7TR3Ux20RdX2UKGgGaAloD0MItf6WAPwzEsCUhpRSlGgVTQUBaBZHQHtZi3Td+G51fZQoaAZoCWgPQwiyhLUxdtVbQJSGlFKUaBVN6ANoFkdAe2LavicXnHV9lChoBmgJaA9DCKpE2VvKxF5AlIaUUpRoFU3oA2gWR0B7cPIS13MZdX2UKGgGaAloD0MI8nnFU48bYkCUhpRSlGgVTegDaBZHQHt3uAd4mkZ1fZQoaAZoCWgPQwir0asBSopjQJSGlFKUaBVN6ANoFkdAe5yMxGlQ/HV9lChoBmgJaA9DCIjYYOEk2mJAlIaUUpRoFU3oA2gWR0B7s/lJYkmhdX2UKGgGaAloD0MITUwXYvUnKkCUhpRSlGgVS8JoFkdAe8zjopx3mnV9lChoBmgJaA9DCJSilXuB3mJAlIaUUpRoFU3oA2gWR0B7zyZH/cWTdX2UKGgGaAloD0MILV4sDJEDYkCUhpRSlGgVTegDaBZHQHvboiC8OCp1fZQoaAZoCWgPQwh0CvKzkeJiQJSGlFKUaBVN6ANoFkdAe+FT5ftx/HV9lChoBmgJaA9DCAcLJ2n+E2BAlIaUUpRoFU3oA2gWR0B75qQ2dd3TdX2UKGgGaAloD0MI6StIMxZVLMCUhpRSlGgVS+BoFkdAe+qBoVVPvnV9lChoBmgJaA9DCNUl4xhJ+2FAlIaUUpRoFU3oA2gWR0B77Nhqj8DTdX2UKGgGaAloD0MIB7R0Bdu4OkCUhpRSlGgVS+ZoFkdAe/4i35N47nV9lChoBmgJaA9DCHkCYadYYV9AlIaUUpRoFU3oA2gWR0B7/7FZPl+3dX2UKGgGaAloD0MIUWnEzD45QUCUhpRSlGgVS9poFkdAfAusgMc6vXV9lChoBmgJaA9DCOwYV1wcG0tAlIaUUpRoFUvRaBZHQHwSb3PAwf11fZQoaAZoCWgPQwgNG2X9ZvtaQJSGlFKUaBVN6ANoFkdAfB1f+CK77XV9lChoBmgJaA9DCGfttgvNyFxAlIaUUpRoFU3oA2gWR0B8IfyGzru6dX2UKGgGaAloD0MIgVoMHiYDY0CUhpRSlGgVTegDaBZHQHwluirT6SF1fZQoaAZoCWgPQwgz3eukvlBZQJSGlFKUaBVN6ANoFkdAfHOr92ovSXV9lChoBmgJaA9DCNLI5xVPY2VAlIaUUpRoFU3oA2gWR0B8f60Sh8IBdX2UKGgGaAloD0MIC5xsA/e9YECUhpRSlGgVTegDaBZHQHyIuYtxuKp1fZQoaAZoCWgPQwjzBMJOsbZBQJSGlFKUaBVL8mgWR0B8jqrksBhhdX2UKGgGaAloD0MITDj0Fg+ZY0CUhpRSlGgVTegDaBZHQHyW+SGJvYR1fZQoaAZoCWgPQwgnS633G4hjQJSGlFKUaBVN6ANoFkdAfJ3HcUM5O3V9lChoBmgJaA9DCJlGk4sxCCVAlIaUUpRoFUvTaBZHQHy5X++/QBx1fZQoaAZoCWgPQwjE6/oFu61DQJSGlFKUaBVL82gWR0B8/jN9ph4MdX2UKGgGaAloD0MIDR07qMTFYUCUhpRSlGgVTegDaBZHQH0ANGmUGFB1fZQoaAZoCWgPQwidnKG4425jQJSGlFKUaBVN6ANoFkdAfQ2lwtJ4B3V9lChoBmgJaA9DCG1zY3pCI2NAlIaUUpRoFU3oA2gWR0B9GkxWT5fudX2UKGgGaAloD0MI9bwbCwo2YkCUhpRSlGgVTegDaBZHQH0huBxxT851fZQoaAZoCWgPQwie6pCb4V5QQJSGlFKUaBVLxGgWR0B9MonAqNIcdX2UKGgGaAloD0MIpcACmDIMRUCUhpRSlGgVS9doFkdAfTWItDlYEHV9lChoBmgJaA9DCMcqpWd6l0VAlIaUUpRoFUuhaBZHQH02B2r4nF51fZQoaAZoCWgPQwjDnnb4a55eQJSGlFKUaBVN6ANoFkdAfTik56t1ZHV9lChoBmgJaA9DCAMn28AdR2JAlIaUUpRoFU3oA2gWR0B9OnACW/rTdX2UKGgGaAloD0MIhIHn3kOvYkCUhpRSlGgVTegDaBZHQH1HH05EMLF1fZQoaAZoCWgPQwhNSkG3l3pDQJSGlFKUaBVL/WgWR0B9UrMbFS88dX2UKGgGaAloD0MISzlf7L1HXUCUhpRSlGgVTegDaBZHQH1YGm+Cbtt1fZQoaAZoCWgPQwjus8pMaalgQJSGlFKUaBVN6ANoFkdAfVyw++ueSXV9lChoBmgJaA9DCH/5ZMXwQ2FAlIaUUpRoFU3oA2gWR0B9YEjPfKp2dX2UKGgGaAloD0MIy2jk84peYUCUhpRSlGgVTegDaBZHQH1kAnc+JP91fZQoaAZoCWgPQwg3qWis/QU8QJSGlFKUaBVL2mgWR0B9ZLr/sE7odX2UKGgGaAloD0MIeSCySJO0ZECUhpRSlGgVTegDaBZHQH25jCpFTeh1fZQoaAZoCWgPQwjAJmvUw3hiQJSGlFKUaBVN6ANoFkdAfcZZOSGJvnV9lChoBmgJaA9DCKn7AKQ2ol1AlIaUUpRoFU3oA2gWR0B9zXkZJkGzdX2UKGgGaAloD0MIBK4rZgTwZECUhpRSlGgVTegDaBZHQH3T4YrJ8v51fZQoaAZoCWgPQwgYITzaOMxLQJSGlFKUaBVLw2gWR0B97tUEPlMidX2UKGgGaAloD0MIsacd/hr9YUCUhpRSlGgVTegDaBZHQH5M52ECeVd1fZQoaAZoCWgPQwiDvvT255NiQJSGlFKUaBVN6ANoFkdAfl9JBPbfxnV9lChoBmgJaA9DCMRdvYoMymNAlIaUUpRoFU3oA2gWR0B+Yo5/9YOldX2UKGgGaAloD0MIblLRWHsYYUCUhpRSlGgVTegDaBZHQH5jFVo6CDp1fZQoaAZoCWgPQwjjpgaazzxcQJSGlFKUaBVN6ANoFkdAfmeyDqW1MXV9lChoBmgJaA9DCB3nNuFeaVlAlIaUUpRoFU3oA2gWR0B+dlwVCXyBdX2UKGgGaAloD0MILqnaboIDXUCUhpRSlGgVTegDaBZHQH6Dx8UmD151fZQoaAZoCWgPQwgy/+ibtKBjQJSGlFKUaBVN6ANoFkdAfolSOinHenV9lChoBmgJaA9DCLL1DOGYPV9AlIaUUpRoFU3oA2gWR0B+jcfzSThYdX2UKGgGaAloD0MI8RDGT+NWXkCUhpRSlGgVTegDaBZHQH6Rbo0Q9Rt1fZQoaAZoCWgPQwj9Fp0stXhhQJSGlFKUaBVN6ANoFkdAfpUFtsN2DHV9lChoBmgJaA9DCLPttDUi311AlIaUUpRoFU3oA2gWR0B+lbvAoG6gdX2UKGgGaAloD0MISKRt/AniZECUhpRSlGgVTegDaBZHQH7o3eaa1Cx1fZQoaAZoCWgPQwgnEeFfBPNmQJSGlFKUaBVN6ANoFkdAfv1Ltu1nd3V9lChoBmgJaA9DCC3OGOYEjmVAlIaUUpRoFU3oA2gWR0B/A4tRNyo5dX2UKGgGaAloD0MIfnA+dSxcYUCUhpRSlGgVTegDaBZHQH8ezDn/1g91fZQoaAZoCWgPQwgcs+xJYGMyQJSGlFKUaBVL8mgWR0B/XeWIGhVVdX2UKGgGaAloD0MI3UPC9/6SZkCUhpRSlGgVTegDaBZHQH+AT2OAAhl1fZQoaAZoCWgPQwg+srlqnhFWQJSGlFKUaBVN6ANoFkdAf5NnMMZxaXV9lChoBmgJaA9DCFvtYS8U+WVAlIaUUpRoFU3oA2gWR0B/ls3aSLZSdX2UKGgGaAloD0MI3LjF/FzzY0CUhpRSlGgVTegDaBZHQH+XU/r0J4V1fZQoaAZoCWgPQwjCTNu/sh5eQJSGlFKUaBVN6ANoFkdAf5v2phnanXV9lChoBmgJaA9DCKp/EMmQKWFAlIaUUpRoFU3oA2gWR0B/qs0ALiMpdX2UKGgGaAloD0MIEynN5vG7Z0CUhpRSlGgVTegDaBZHQH+488DB/I91fZQoaAZoCWgPQwhlNsgkI1NiQJSGlFKUaBVN6ANoFkdAf78iUxEfDHV9lChoBmgJaA9DCKZ9c391n2BAlIaUUpRoFU3oA2gWR0B/xD2OAAhjdX2UKGgGaAloD0MID+1jBb8kX0CUhpRSlGgVTegDaBZHQH/IdM495hV1fZQoaAZoCWgPQwiflEkNbVtmQJSGlFKUaBVN6ANoFkdAf8zC6pYLcHV9lChoBmgJaA9DCH8XtmYr71pAlIaUUpRoFU3oA2gWR0B/zaqABkqddWUu"}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 124, "n_steps": 1024, "gamma": 0.999, "gae_lambda": 0.98, "ent_coef": 0.01, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 4, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWVvwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwNX2J1aWx0aW5fdHlwZZSTlIwKTGFtYmRhVHlwZZSFlFKUKGgCjAhDb2RlVHlwZZSFlFKUKEsBSwBLAUsBSxNDBIgAUwCUToWUKYwBX5SFlIxIL3Vzci9sb2NhbC9saWIvcHl0aG9uMy43L2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5RLgEMCAAGUjAN2YWyUhZQpdJRSlH2UKIwLX19wYWNrYWdlX1+UjBhzdGFibGVfYmFzZWxpbmVzMy5jb21tb26UjAhfX25hbWVfX5SMHnN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi51dGlsc5SMCF9fZmlsZV9flIxIL3Vzci9sb2NhbC9saWIvcHl0aG9uMy43L2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaCB9lH2UKGgXaA6MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgYjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz/JmZmZmZmahZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "system_info": {"OS": "Linux-5.4.188+-x86_64-with-Ubuntu-18.04-bionic #1 SMP Sun Apr 24 10:03:06 PDT 2022", "Python": "3.7.13", "Stable-Baselines3": "1.5.0", "PyTorch": "1.11.0+cu113", "GPU Enabled": "True", "Numpy": "1.21.6", "Gym": "0.21.0"}}
 
1
+ {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param sde_net_arch: Network architecture for extracting features\n when using gSDE. If None, the latent features from the policy will be used.\n Pass an empty list to use the states as features.\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7f2104204f80>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f210420b050>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f210420b0e0>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f210420b170>", "_build": "<function ActorCriticPolicy._build at 0x7f210420b200>", "forward": "<function ActorCriticPolicy.forward at 0x7f210420b290>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f210420b320>", "_predict": "<function ActorCriticPolicy._predict at 0x7f210420b3b0>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f210420b440>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f210420b4d0>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f210420b560>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc_data object at 0x7f2104261180>"}, "verbose": 0, "policy_kwargs": {}, "observation_space": {":type:": "<class 'gym.spaces.box.Box'>", ":serialized:": "gAWVnwEAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLCIWUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWIAAAAAAAAAAAAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/5RoCksIhZSMAUOUdJRSlIwEaGlnaJRoEiiWIAAAAAAAAAAAAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAf5RoCksIhZRoFXSUUpSMDWJvdW5kZWRfYmVsb3eUaBIolggAAAAAAAAAAAAAAAAAAACUaAeMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLCIWUaBV0lFKUjA1ib3VuZGVkX2Fib3ZllGgSKJYIAAAAAAAAAAAAAAAAAAAAlGghSwiFlGgVdJRSlIwKX25wX3JhbmRvbZROdWIu", "dtype": "float32", "_shape": [8], "low": "[-inf -inf -inf -inf -inf -inf -inf -inf]", "high": "[inf inf inf inf inf inf inf inf]", "bounded_below": "[False False False False False False False False]", "bounded_above": "[False False False False False False False False]", "_np_random": null}, "action_space": {":type:": "<class 'gym.spaces.discrete.Discrete'>", ":serialized:": "gAWVggAAAAAAAACME2d5bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpRLBIwGX3NoYXBllCmMBWR0eXBllIwFbnVtcHmUaAeTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYowKX25wX3JhbmRvbZROdWIu", "n": 4, "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 16, "num_timesteps": 1015808, "_total_timesteps": 1000000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1652076178.4782536, "learning_rate": 0.0001, "tensorboard_log": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVvwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwNX2J1aWx0aW5fdHlwZZSTlIwKTGFtYmRhVHlwZZSFlFKUKGgCjAhDb2RlVHlwZZSFlFKUKEsBSwBLAUsBSxNDBIgAUwCUToWUKYwBX5SFlIxIL3Vzci9sb2NhbC9saWIvcHl0aG9uMy43L2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5RLgEMCAAGUjAN2YWyUhZQpdJRSlH2UKIwLX19wYWNrYWdlX1+UjBhzdGFibGVfYmFzZWxpbmVzMy5jb21tb26UjAhfX25hbWVfX5SMHnN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi51dGlsc5SMCF9fZmlsZV9flIxIL3Vzci9sb2NhbC9saWIvcHl0aG9uMy43L2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaCB9lH2UKGgXaA6MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgYjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz8aNuLrHEMthZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAGaTsL0phDu64rL3Od9O9LXxeHE7urgOuQAAgD8AAIA/M9MuvCn4A7oxmqC6dS2ZtbSRsDlsvbo5AACAPwAAgD9DUpA+PMGLPxkjFb67kpG+OU1IPbsUV74AAAAAAAAAAM0fkTxSAN25ViYXuLc7+7Lh4Ei7A+s1NwAAgD8AAIA/5rb9PbiWwjrqtj69ZbaNu54HjTw9n3u8AACAPwAAgD+akTI7uF6gOP5wAzsSyGu2iuOBu/QwG7oAAIA/AACAPw1Z4L3hVpG6R9KkuxxvDzk0Wjg7a94wOgAAgD8AAIA/2pDCvaGzDj/YC/k8ci6FvnMFnrvopLO9AAAAAAAAAABT9Au+/DCRP6EEwr1C53a+HZYNvsZwh7wAAAAAAAAAAKbFnr3h2tO47lKrutofbjVKUsq7+N/KOQAAgD8AAIA/APlQvVLQyrku9Nc6sQHUNTn5cDnqd/u5AACAPwAAgD/Ni0i+NhkfP3fyoL0t3Ga+XojlvW2uar0AAAAAAAAAAJpT6zzhmKO6G08jOfETGjRyNSm6rNw7uAAAgD8AAIA/M3zLPHten7qdk8k5TAsNNaUirTprdua4AACAPwAAgD8AYzm915pTu9mAIjzirYA85Hp8PD1RXr0AAIA/AACAP2bZ1Ly4Foq51livOxcIpzf9YpA7d5OxugAAgD8AAIA/lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.015808000000000044, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVfxAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMI8kOlETNbMECUhpRSlIwBbJRL54wBdJRHQKi2QOH31z11fZQoaAZoCWgPQwilSSno9v1jQJSGlFKUaBVN6ANoFkdAqL0JBPbfxnV9lChoBmgJaA9DCPTdrSxRympAlIaUUpRoFU2zA2gWR0Covv4mTkhidX2UKGgGaAloD0MIs0P8w5boX0CUhpRSlGgVTegDaBZHQKi/ySf16E91fZQoaAZoCWgPQwj3d7ZHb8RhQJSGlFKUaBVN6ANoFkdAqMDHyoXKsHV9lChoBmgJaA9DCGB2Tx4WDmJAlIaUUpRoFU3oA2gWR0CoxX+JgsshdX2UKGgGaAloD0MIXkccsoF5YkCUhpRSlGgVTegDaBZHQKjHvAt4A0d1fZQoaAZoCWgPQwioGOdvQsFZQJSGlFKUaBVN6ANoFkdAqMuKuIRAbHV9lChoBmgJaA9DCI83+S26iWNAlIaUUpRoFU3oA2gWR0CozGcsMAmzdX2UKGgGaAloD0MIknpP5bQ/IECUhpRSlGgVTR8BaBZHQKjMyaFVT751fZQoaAZoCWgPQwhCsoAJ3B5ZQJSGlFKUaBVN6ANoFkdAqM2LM/yGz3V9lChoBmgJaA9DCPvOL0rQIVhAlIaUUpRoFU3oA2gWR0CozkaNuLrHdX2UKGgGaAloD0MIXb9gN+x8YkCUhpRSlGgVTegDaBZHQKjPoQXAM2F1fZQoaAZoCWgPQwg2kC42rf1YQJSGlFKUaBVN6ANoFkdAqNBmfwqiGnV9lChoBmgJaA9DCM1Zn3JMaEBAlIaUUpRoFU0nAWgWR0Co0Qb6pHZsdX2UKGgGaAloD0MIns4VpQTwYECUhpRSlGgVTegDaBZHQKjTGejmCAd1fZQoaAZoCWgPQwjIKM+8HLFiQJSGlFKUaBVN6ANoFkdAqNNoUahpQHV9lChoBmgJaA9DCNVamIV2x1pAlIaUUpRoFU3oA2gWR0Co8yQ3gk1NdX2UKGgGaAloD0MIecn/5O8dYkCUhpRSlGgVTegDaBZHQKj6qhQm/nJ1fZQoaAZoCWgPQwi/1TpxuX9sQJSGlFKUaBVNzwFoFkdAqP7dZ3cHnnV9lChoBmgJaA9DCOViDKzjdlhAlIaUUpRoFU3oA2gWR0CpAYxqfvnbdX2UKGgGaAloD0MIysNCrWkQWUCUhpRSlGgVTegDaBZHQKkDUsZHd451fZQoaAZoCWgPQwhvDWyV4O1jQJSGlFKUaBVN6ANoFkdAqQQDvG6wuHV9lChoBmgJaA9DCDuJCP+iFmNAlIaUUpRoFU3oA2gWR0CpCwzw2ETQdX2UKGgGaAloD0MIGcbdIFo/X0CUhpRSlGgVTegDaBZHQKkO1jXnQpp1fZQoaAZoCWgPQwhtPNhit/1eQJSGlFKUaBVN6ANoFkdAqQ+4Nb1RL3V9lChoBmgJaA9DCHriOVtAPGBAlIaUUpRoFU3oA2gWR0CpEBsb3oLYdX2UKGgGaAloD0MIGjbK+s21X0CUhpRSlGgVTegDaBZHQKkQ4D/VAiV1fZQoaAZoCWgPQwjvWddoOfBcQJSGlFKUaBVN6ANoFkdAqRGcxASnL3V9lChoBmgJaA9DCP/r3LQZRWVAlIaUUpRoFU3oA2gWR0CpEwcPWhAXdX2UKGgGaAloD0MIlBPtKiR2YkCUhpRSlGgVTegDaBZHQKkUX9AHE/B1fZQoaAZoCWgPQwjFA8qm3ANjQJSGlFKUaBVN6ANoFkdAqRZ02itaIXV9lChoBmgJaA9DCOmY84z9DmRAlIaUUpRoFU3oA2gWR0CpFsM/yGzsdX2UKGgGaAloD0MIu9Bcp5FYYECUhpRSlGgVTegDaBZHQKk2ii0v4/N1fZQoaAZoCWgPQwhEMA4unTVkQJSGlFKUaBVN6ANoFkdAqT7KJVKf4HV9lChoBmgJaA9DCKPIWkOpCWRAlIaUUpRoFU3oA2gWR0CpQxUPH1e0dX2UKGgGaAloD0MIG0ZB8Pj/Y0CUhpRSlGgVTegDaBZHQKlFx9aUzKt1fZQoaAZoCWgPQwjFcHUARMFhQJSGlFKUaBVN6ANoFkdAqUep3os7MnV9lChoBmgJaA9DCLCtn/6z5F9AlIaUUpRoFU3oA2gWR0CpSGga3qiXdX2UKGgGaAloD0MIdo2WAz0RYECUhpRSlGgVTegDaBZHQKlQWih37k51fZQoaAZoCWgPQwhtyD8ziERhQJSGlFKUaBVN6ANoFkdAqVSXx2B8QnV9lChoBmgJaA9DCEijAifbRl9AlIaUUpRoFU3oA2gWR0CpVY8ry1/ldX2UKGgGaAloD0MIAyMva2IpYUCUhpRSlGgVTegDaBZHQKlV/BkZrHl1fZQoaAZoCWgPQwgfn5CdNwNhQJSGlFKUaBVN6ANoFkdAqVbWoJiRXHV9lChoBmgJaA9DCC4AjdKl+mBAlIaUUpRoFU3oA2gWR0CpV6RLsa86dX2UKGgGaAloD0MIbt44KczgYUCUhpRSlGgVTegDaBZHQKlZGoBJZnt1fZQoaAZoCWgPQwhJEoQrIKRnQJSGlFKUaBVN6ANoFkdAqVqeMXJo03V9lChoBmgJaA9DCIP4wI7/W2NAlIaUUpRoFU3oA2gWR0CpXN1UdaMadX2UKGgGaAloD0MIWeArunVpYkCUhpRSlGgVTegDaBZHQKldLADaGpN1fZQoaAZoCWgPQwj0MR8Q6OhkQJSGlFKUaBVN6ANoFkdAqWCMA5q/NHV9lChoBmgJaA9DCLr0L0nlamJAlIaUUpRoFU3oA2gWR0CphD6JqIrOdX2UKGgGaAloD0MIfh6jPPN2XECUhpRSlGgVTegDaBZHQKmIR0dzXBh1fZQoaAZoCWgPQwjAkqtY/PBWQJSGlFKUaBVN6ANoFkdAqYsKmwaBJHV9lChoBmgJaA9DCN21hHzQsmFAlIaUUpRoFU3oA2gWR0CpjOv4ubqhdX2UKGgGaAloD0MIEalpF9P9YECUhpRSlGgVTegDaBZHQKmNp+VC5Vh1fZQoaAZoCWgPQwhnSBXFq8pjQJSGlFKUaBVN6ANoFkdAqZWJdGAkLXV9lChoBmgJaA9DCHctIR/0qkVAlIaUUpRoFUvoaBZHQKmXgNH6Mzd1fZQoaAZoCWgPQwjkDwaeezNfQJSGlFKUaBVN6ANoFkdAqZmxgeA/cHV9lChoBmgJaA9DCGqjOh3IvlxAlIaUUpRoFU3oA2gWR0Cpmp+yquKXdX2UKGgGaAloD0MIhel7DcG5YECUhpRSlGgVTegDaBZHQKmbCIUrTYx1fZQoaAZoCWgPQwgRV87eGVNhQJSGlFKUaBVN6ANoFkdAqZvOeMAFPnV9lChoBmgJaA9DCBztuOF3bmNAlIaUUpRoFU3oA2gWR0CpnITUI9kjdX2UKGgGaAloD0MIGjVfJR8IWkCUhpRSlGgVTegDaBZHQKmd6H58BuJ1fZQoaAZoCWgPQwgGZK93f1BcQJSGlFKUaBVN6ANoFkdAqZ9Sj1wo9nV9lChoBmgJaA9DCNuGURA8Q2NAlIaUUpRoFU3oA2gWR0CpoXyThYNidX2UKGgGaAloD0MIh6QWSia8YkCUhpRSlGgVTegDaBZHQKmh0ZYxL011fZQoaAZoCWgPQwhGDDuMSdtfQJSGlFKUaBVN6ANoFkdAqaWT2QGOdXV9lChoBmgJaA9DCEVkWMUbFTBAlIaUUpRoFU0cAWgWR0CpxwOivgWKdX2UKGgGaAloD0MIFLAdjFgOYECUhpRSlGgVTegDaBZHQKnJ4nFYMfB1fZQoaAZoCWgPQwiKdhVSfvxiQJSGlFKUaBVN6ANoFkdAqc435DZ13nV9lChoBmgJaA9DCMPwETGlmmNAlIaUUpRoFU3oA2gWR0Cp0OGmce8xdX2UKGgGaAloD0MIGLX7VQBfZ0CUhpRSlGgVTegDaBZHQKnSkbExZdR1fZQoaAZoCWgPQwgwKT4+oQBgQJSGlFKUaBVN6ANoFkdAqdrVZFG5MHV9lChoBmgJaA9DCDHO34RCemJAlIaUUpRoFU3oA2gWR0Cp3JV8Ti84dX2UKGgGaAloD0MIpS2u8RkxYUCUhpRSlGgVTegDaBZHQKneklQ/HHZ1fZQoaAZoCWgPQwgOMsnIWUJkQJSGlFKUaBVN6ANoFkdAqd9rUwztTnV9lChoBmgJaA9DCNj0oKAU6mJAlIaUUpRoFU3oA2gWR0Cp38E0BOpLdX2UKGgGaAloD0MIclDCTNvOZUCUhpRSlGgVTegDaBZHQKngdEgntv51fZQoaAZoCWgPQwjuztptF9VkQJSGlFKUaBVN6ANoFkdAqeEsedTYNHV9lChoBmgJaA9DCE4LXvQVBmRAlIaUUpRoFU3oA2gWR0Cp4oh6By0bdX2UKGgGaAloD0MI0LhwICSiZUCUhpRSlGgVTegDaBZHQKnmMd+Xqqx1fZQoaAZoCWgPQwibdjHNdFJlQJSGlFKUaBVN6ANoFkdAqeaFUsFt9HV9lChoBmgJaA9DCOaw+47hSTFAlIaUUpRoFU0dAWgWR0Cp6WrRrrPddX2UKGgGaAloD0MICRnIs0vbYUCUhpRSlGgVTegDaBZHQKnpwlP8AJd1fZQoaAZoCWgPQwjAIypUt2BlQJSGlFKUaBVN6ANoFkdAqgpO1D0Dl3V9lChoBmgJaA9DCBVUVP1KL2JAlIaUUpRoFU3oA2gWR0CqDMHpjc2zdX2UKGgGaAloD0MIp7OTwVGMXUCUhpRSlGgVTegDaBZHQKoQjj4Hoox1fZQoaAZoCWgPQwhr8SkAxmVcQJSGlFKUaBVN6ANoFkdAqhMPQdCE6HV9lChoBmgJaA9DCOVC5V/LAWNAlIaUUpRoFU3oA2gWR0CqFMyH/LkkdX2UKGgGaAloD0MI0jk/xfGVYkCUhpRSlGgVTegDaBZHQKodV5ckdFR1fZQoaAZoCWgPQwh2bATi9XdlQJSGlFKUaBVN6ANoFkdAqh8qbc45tHV9lChoBmgJaA9DCFfQtMTKR11AlIaUUpRoFU3oA2gWR0CqIUyXUpd9dX2UKGgGaAloD0MI6BVPPVJTYUCUhpRSlGgVTegDaBZHQKoijGSZBs11fZQoaAZoCWgPQwgVViqoqPBdQJSGlFKUaBVN6ANoFkdAqiNNt65Xl3V9lChoBmgJaA9DCDvGFRdHyGNAlIaUUpRoFU3oA2gWR0CqJAJGnXNDdX2UKGgGaAloD0MIhxdEpKYMX0CUhpRSlGgVTegDaBZHQKolYapgkTp1fZQoaAZoCWgPQwgurBvvDk1iQJSGlFKUaBVN6ANoFkdAqij+/pMYdnV9lChoBmgJaA9DCJg0Ruuoq2JAlIaUUpRoFU3oA2gWR0CqKVBib2DhdX2UKGgGaAloD0MI1xNdF/4OY0CUhpRSlGgVTegDaBZHQKosWs4DLbJ1fZQoaAZoCWgPQwhDklm9w1FiQJSGlFKUaBVN6ANoFkdAqiyumR/3FnVlLg=="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 496, "n_steps": 1024, "gamma": 0.999, "gae_lambda": 0.98, "ent_coef": 0.01, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 8, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWVvwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwNX2J1aWx0aW5fdHlwZZSTlIwKTGFtYmRhVHlwZZSFlFKUKGgCjAhDb2RlVHlwZZSFlFKUKEsBSwBLAUsBSxNDBIgAUwCUToWUKYwBX5SFlIxIL3Vzci9sb2NhbC9saWIvcHl0aG9uMy43L2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5RLgEMCAAGUjAN2YWyUhZQpdJRSlH2UKIwLX19wYWNrYWdlX1+UjBhzdGFibGVfYmFzZWxpbmVzMy5jb21tb26UjAhfX25hbWVfX5SMHnN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi51dGlsc5SMCF9fZmlsZV9flIxIL3Vzci9sb2NhbC9saWIvcHl0aG9uMy43L2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaCB9lH2UKGgXaA6MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgYjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz/JmZmZmZmahZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "system_info": {"OS": "Linux-5.4.188+-x86_64-with-Ubuntu-18.04-bionic #1 SMP Sun Apr 24 10:03:06 PDT 2022", "Python": "3.7.13", "Stable-Baselines3": "1.5.0", "PyTorch": "1.11.0+cu113", "GPU Enabled": "True", "Numpy": "1.21.6", "Gym": "0.21.0"}}
replay.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:68942288e97858cb0952f52623c858c27353067cdf4eb2282c56f3af81a2238a
3
- size 234632
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:70a5ac37ab52d967a1f80f4f0995c1de46a802e721bd0d957185e04ced9dd168
3
+ size 245417
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 218.47820877534906, "std_reward": 23.54250514950306, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2022-05-09T00:25:15.736811"}
 
1
+ {"mean_reward": 224.75846835024868, "std_reward": 21.411892070032263, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2022-05-09T06:40:11.790025"}