aayushmnit commited on
Commit
e3f0b19
1 Parent(s): e685607

Upload PPO LunarLander-v2 trained agent 1e6

Browse files
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: LunarLander-v2
17
  metrics:
18
  - type: mean_reward
19
- value: 263.40 +/- 12.54
20
  name: mean_reward
21
  verified: false
22
  ---
 
16
  type: LunarLander-v2
17
  metrics:
18
  - type: mean_reward
19
+ value: 227.16 +/- 83.82
20
  name: mean_reward
21
  verified: false
22
  ---
config.json CHANGED
@@ -1 +1 @@
1
- {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param sde_net_arch: Network architecture for extracting features\n when using gSDE. If None, the latent features from the policy will be used.\n Pass an empty list to use the states as features.\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7f58ae03e790>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f58ae03e820>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f58ae03e8b0>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f58ae03e940>", "_build": "<function ActorCriticPolicy._build at 0x7f58ae03e9d0>", "forward": "<function ActorCriticPolicy.forward at 0x7f58ae03ea60>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f58ae03eaf0>", "_predict": "<function ActorCriticPolicy._predict at 0x7f58ae03eb80>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f58ae03ec10>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f58ae03eca0>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f58ae03ed30>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc_data object at 0x7f58ae033fc0>"}, "verbose": 1, "policy_kwargs": {}, "observation_space": {":type:": "<class 'gym.spaces.box.Box'>", ":serialized:": "gAWVnwEAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLCIWUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWIAAAAAAAAAAAAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/5RoCksIhZSMAUOUdJRSlIwEaGlnaJRoEiiWIAAAAAAAAAAAAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAf5RoCksIhZRoFXSUUpSMDWJvdW5kZWRfYmVsb3eUaBIolggAAAAAAAAAAAAAAAAAAACUaAeMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLCIWUaBV0lFKUjA1ib3VuZGVkX2Fib3ZllGgSKJYIAAAAAAAAAAAAAAAAAAAAlGghSwiFlGgVdJRSlIwKX25wX3JhbmRvbZROdWIu", "dtype": "float32", "_shape": [8], "low": "[-inf -inf -inf -inf -inf -inf -inf -inf]", "high": "[inf inf inf inf inf inf inf inf]", "bounded_below": "[False False False False False False False False]", "bounded_above": "[False False False False False False False False]", "_np_random": null}, "action_space": {":type:": "<class 'gym.spaces.discrete.Discrete'>", ":serialized:": "gAWVggAAAAAAAACME2d5bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpRLBIwGX3NoYXBllCmMBWR0eXBllIwFbnVtcHmUaAeTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYowKX25wX3JhbmRvbZROdWIu", "n": 4, "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 16, "num_timesteps": 1015808, "_total_timesteps": 1000000.0, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1670893292436745039, "learning_rate": 0.0003, "tensorboard_log": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVwwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOC9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS4BDAgABlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOC9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoFmgNjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoF4wHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/M6kqMFUyYYWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="}, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAICmSr3h4JG6nFG/O2PaIDdVFGC6IK0WNgAAgD8AAIA/mtA8vSkYWbovYiu7YE6Rtucg3jeQzUk6AACAPwAAgD9zN4w9e0qMumIxWDkEh/I1So8kOVPye7gAAIA/AAAAAACnWj32KHq8qc+GO5sEtjxI6ts9hFSRvQAAgD8AAIA/ALVCPcPBDbr6gTy79b2ltk8ywLoCZhY2AACAPwAAAADNeMy89nxTumKdjTmtpWw0yTU5u5HWprgAAIA/AACAP3OKVz7qCOA+iWQCvtZskL6zvi482GR0PQAAAAAAAAAAmpUWPOGsg7olxqizjD6xL1BFb7rW678zAACAPwAAgD+qanS+mWBFP7byIT5pLbi+eeV0vft96DwAAAAAAAAAABo/i72Ptnq62MRgu0B7tLZYZBs6bmGDOgAAgD8AAIA/GuRKPiZljT5txIa+5P1LviAar7wn6Le8AAAAAAAAAAAzCzA8aUA6PhCQsL3mayC+TmxPPCdMtb0AAAAAAAAAADNbVztIB6q6dcrnOtEiZzXXTJ24/c4EugAAgD8AAIA/AKnRvR+kRD+aqQM9/ROyvl0Xd70xGL09AAAAAAAAAADm2bI99qhyuqaGO7yZP4s8t19nO05+db0AAIA/AAAAAGbawTtcIwq6FbtbumbScrTkuo+7Jh+COQAAgD8AAIA/lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.015808000000000044, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVfRAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIRSxi2OGKYkCUhpRSlIwBbJRN6AOMAXSUR0CWkMg8bJfZdX2UKGgGaAloD0MItyizQabZZECUhpRSlGgVTegDaBZHQJaSk8kleGB1fZQoaAZoCWgPQwjQRq6bUhpoQJSGlFKUaBVN6ANoFkdAlpUc9fTkQ3V9lChoBmgJaA9DCBCtFW2O32FAlIaUUpRoFU3oA2gWR0CWmwmIj4YadX2UKGgGaAloD0MIyZOkayY8Y0CUhpRSlGgVTegDaBZHQJafrzPKMeh1fZQoaAZoCWgPQwitpuuJrnVjQJSGlFKUaBVN6ANoFkdAlqADL0SRKnV9lChoBmgJaA9DCD+nID8bcGRAlIaUUpRoFU3oA2gWR0CWpZWQfZEldX2UKGgGaAloD0MIzEV8J+aAYkCUhpRSlGgVTegDaBZHQJanXM0P6Kt1fZQoaAZoCWgPQwifWRKgptFlQJSGlFKUaBVN6ANoFkdAlqo0DZDiO3V9lChoBmgJaA9DCGQipdk8i2VAlIaUUpRoFU3oA2gWR0CWxnog3cYZdX2UKGgGaAloD0MIlZ1+UJd2Y0CUhpRSlGgVTegDaBZHQJbJL20zCUJ1fZQoaAZoCWgPQwgST3YzI01mQJSGlFKUaBVN6ANoFkdAlsqkZiuuBHV9lChoBmgJaA9DCD/h7NYy+2NAlIaUUpRoFU3oA2gWR0CWz4P9DQZ5dX2UKGgGaAloD0MIoffGEIBGYECUhpRSlGgVTegDaBZHQJbSGCHymQ91fZQoaAZoCWgPQwhd3bHYpo9iQJSGlFKUaBVN6ANoFkdAltQR99c8knV9lChoBmgJaA9DCAPS/gfYaWxAlIaUUpRoFU2fA2gWR0CW2IcvM8oydX2UKGgGaAloD0MIdChDVUwxY0CUhpRSlGgVTegDaBZHQJbY53PiT+x1fZQoaAZoCWgPQwjxftx++XxPQJSGlFKUaBVL0WgWR0CW2k9NN8E3dX2UKGgGaAloD0MIZd8Vwf+iY0CUhpRSlGgVTegDaBZHQJbaXFMqSYB1fZQoaAZoCWgPQwgBNbVsLfpiQJSGlFKUaBVN6ANoFkdAlt55dB0IT3V9lChoBmgJaA9DCDmZuFWQzWNAlIaUUpRoFU3oA2gWR0CW5Chxo7FLdX2UKGgGaAloD0MIbt44Kcy0ZECUhpRSlGgVTegDaBZHQJbo4c7yQPt1fZQoaAZoCWgPQwjOABdkS1llQJSGlFKUaBVN6ANoFkdAluk+QQtjC3V9lChoBmgJaA9DCPVk/tE302VAlIaUUpRoFU3oA2gWR0CW7tgZTAFgdX2UKGgGaAloD0MIZ3+g3DZgYkCUhpRSlGgVTegDaBZHQJbwl6IFeOZ1fZQoaAZoCWgPQwimKJfGr/plQJSGlFKUaBVN6ANoFkdAlvNSV4X403V9lChoBmgJaA9DCAspP6n2W0dAlIaUUpRoFUvaaBZHQJb1HTSb6P91fZQoaAZoCWgPQwihuyTOCoFkQJSGlFKUaBVN6ANoFkdAlw6UhePaMHV9lChoBmgJaA9DCPZFQltOvmRAlIaUUpRoFU3oA2gWR0CXEQMtsenydX2UKGgGaAloD0MIL4oe+JiVZECUhpRSlGgVTegDaBZHQJcSc0bcXWR1fZQoaAZoCWgPQwhH5/wUxzFkQJSGlFKUaBVN6ANoFkdAlxnHpbD/EXV9lChoBmgJaA9DCClZTkJpOGJAlIaUUpRoFU3oA2gWR0CXG8Ot4iX6dX2UKGgGaAloD0MIcodNZOaLYUCUhpRSlGgVTegDaBZHQJcgZu/Dcdp1fZQoaAZoCWgPQwj0iTxJuoRkQJSGlFKUaBVN6ANoFkdAlyDCQDFId3V9lChoBmgJaA9DCEw2HmwxG2JAlIaUUpRoFU3oA2gWR0CXIjiR4hUzdX2UKGgGaAloD0MIXmiu08h7YkCUhpRSlGgVTegDaBZHQJciRradtl91fZQoaAZoCWgPQwjJWG3+3+9jQJSGlFKUaBVN6ANoFkdAlyajziCJ43V9lChoBmgJaA9DCBN9PsqIPWhAlIaUUpRoFU3oA2gWR0CXLHf779AHdX2UKGgGaAloD0MI8nnFUw9NZECUhpRSlGgVTegDaBZHQJcxGUcGTs91fZQoaAZoCWgPQwjh7xezpatlQJSGlFKUaBVN6ANoFkdAlzdCyt3fRHV9lChoBmgJaA9DCHWPbK6aK2NAlIaUUpRoFU3oA2gWR0CXOP6C17Y1dX2UKGgGaAloD0MIAI49ey5UZECUhpRSlGgVTegDaBZHQJc7wRSP2f11fZQoaAZoCWgPQwixNsZO+K9gQJSGlFKUaBVN6ANoFkdAlz1XZ00WM3V9lChoBmgJaA9DCG73cp8c52NAlIaUUpRoFU3oA2gWR0CXVhlQ/HHWdX2UKGgGaAloD0MIt7QaEveMX0CUhpRSlGgVTegDaBZHQJdYL8+A3DN1fZQoaAZoCWgPQwjtvI3NzmZwQJSGlFKUaBVNlAFoFkdAl1jhS1mapnV9lChoBmgJaA9DCC/gZYaN12BAlIaUUpRoFU3oA2gWR0CXWWCbMHKPdX2UKGgGaAloD0MIYHXkSOfrYECUhpRSlGgVTegDaBZHQJdfKAFxGUh1fZQoaAZoCWgPQwi1UDI5tfdeQJSGlFKUaBVN6ANoFkdAl2DmCyyD7XV9lChoBmgJaA9DCBGQL6GCwWRAlIaUUpRoFU3oA2gWR0CXZOnWattAdX2UKGgGaAloD0MIXmOXqN70ZkCUhpRSlGgVTegDaBZHQJdlRaNdZ7p1fZQoaAZoCWgPQwhkOnR6XkNgQJSGlFKUaBVN6ANoFkdAl2aU2tMfzXV9lChoBmgJaA9DCAGHUKVmYmVAlIaUUpRoFU3oA2gWR0CXZqFNtZV5dX2UKGgGaAloD0MIKZKvBNKOY0CUhpRSlGgVTegDaBZHQJdquzZ6D5F1fZQoaAZoCWgPQwgm4NdIkoZlQJSGlFKUaBVN6ANoFkdAl3BV85S3s3V9lChoBmgJaA9DCB0ibk4lXWNAlIaUUpRoFU3oA2gWR0CXestL+PzWdX2UKGgGaAloD0MIrDb/rzqZZUCUhpRSlGgVTegDaBZHQJd8h/ViF0x1fZQoaAZoCWgPQwiFCg4vCO9mQJSGlFKUaBVN6ANoFkdAl38/6oESunV9lChoBmgJaA9DCMgMVMa/uGNAlIaUUpRoFU3oA2gWR0CXgPHOKO1fdX2UKGgGaAloD0MIFeKReHnDZ0CUhpRSlGgVTegDaBZHQJeafLB9Cu51fZQoaAZoCWgPQwiC4zJuag1lQJSGlFKUaBVN6ANoFkdAl5zYn4O+ZnV9lChoBmgJaA9DCNWxSumZTVxAlIaUUpRoFU3oA2gWR0CXnYuq3mV8dX2UKGgGaAloD0MIU5eMY6STZkCUhpRSlGgVTegDaBZHQJeeEs9SuQp1fZQoaAZoCWgPQwicpWQ5iVJwQJSGlFKUaBVN2wJoFkdAl59VmBe5WnV9lChoBmgJaA9DCOs2qP0WPXFAlIaUUpRoFU0hA2gWR0CXoStjkMkQdX2UKGgGaAloD0MIaww6IfSKZUCUhpRSlGgVTegDaBZHQJej6xMWXTp1fZQoaAZoCWgPQwg7+8qDdJJmQJSGlFKUaBVN6ANoFkdAl6WW4qgAZXV9lChoBmgJaA9DCHk+A+rNnkVAlIaUUpRoFUvOaBZHQJemYornTy91fZQoaAZoCWgPQwh2/BcIgotlQJSGlFKUaBVN6ANoFkdAl6ltb9qDb3V9lChoBmgJaA9DCGpQNA9g/2BAlIaUUpRoFU3oA2gWR0CXqu/CIk7fdX2UKGgGaAloD0MIUigLX19BZECUhpRSlGgVTegDaBZHQJeu6gBcRlJ1fZQoaAZoCWgPQwil3ehjPppIQJSGlFKUaBVLx2gWR0CXr0V7Qb++dX2UKGgGaAloD0MIQMObNXi9bkCUhpRSlGgVTTYBaBZHQJezaq6vq1R1fZQoaAZoCWgPQwgC85Apn/ZxQJSGlFKUaBVN4wNoFkdAl7PRYaHbh3V9lChoBmgJaA9DCD+nID8bdGdAlIaUUpRoFU3oA2gWR0CXvWCOmzjWdX2UKGgGaAloD0MIBhGpaRfaZUCUhpRSlGgVTegDaBZHQJe/Al+mWMV1fZQoaAZoCWgPQwjnOSLfJaFnQJSGlFKUaBVN6ANoFkdAl8GqagElmnV9lChoBmgJaA9DCOhLb38unGdAlIaUUpRoFU3oA2gWR0CXw1abWmP6dX2UKGgGaAloD0MIGjOJesG0YECUhpRSlGgVTegDaBZHQJfc55Pdl/Z1fZQoaAZoCWgPQwiQL6GCw9hmQJSGlFKUaBVN6ANoFkdAl99DgQ6IWXV9lChoBmgJaA9DCKNbr+lBm3BAlIaUUpRoFU23A2gWR0CX35Io3JgcdX2UKGgGaAloD0MI2Nglqje7Y0CUhpRSlGgVTegDaBZHQJfgievpyIZ1fZQoaAZoCWgPQwh2UfTAh5RxQJSGlFKUaBVNBQJoFkdAl+EWEkB0ZHV9lChoBmgJaA9DCEHYKVbN3nJAlIaUUpRoFU3zAmgWR0CX4VaoddVvdX2UKGgGaAloD0MIz02bcZryZ0CUhpRSlGgVTegDaBZHQJfjrqrzXjF1fZQoaAZoCWgPQwgbKzHPSj9nQJSGlFKUaBVN6ANoFkdAl+bIyO7xu3V9lChoBmgJaA9DCEPFOH/T53BAlIaUUpRoFU1SA2gWR0CX7BoSL61tdX2UKGgGaAloD0MI5nYv98k0Z0CUhpRSlGgVTegDaBZHQJfu+SpzcRF1fZQoaAZoCWgPQwg4FakwtvZyQJSGlFKUaBVNtQNoFkdAl/D4rFwT/XV9lChoBmgJaA9DCPX0EfgDaXJAlIaUUpRoFU2NAWgWR0CX8uvuw5eadX2UKGgGaAloD0MI3dCUnX6CcECUhpRSlGgVTWwBaBZHQJfzcUN8VpN1fZQoaAZoCWgPQwjYR6eufB5kQJSGlFKUaBVN6ANoFkdAl/jkt/WlM3V9lChoBmgJaA9DCDgVqTC2OXBAlIaUUpRoFU1TAmgWR0CX/iH4GlhxdX2UKGgGaAloD0MIn+bkRSZIY0CUhpRSlGgVTegDaBZHQJgFX7Lt/nZ1fZQoaAZoCWgPQwidLouJTYNjQJSGlFKUaBVN6ANoFkdAmAdluaWonHV9lChoBmgJaA9DCEJaY9CJk3FAlIaUUpRoFU1IA2gWR0CYCiK1XvH+dX2UKGgGaAloD0MIBDi9i3fyY0CUhpRSlGgVTegDaBZHQJgKkf2bobJ1fZQoaAZoCWgPQwiNmUS9YGllQJSGlFKUaBVN6ANoFkdAmAxsPFvQ4XV9lChoBmgJaA9DCLWK/tDMo3BAlIaUUpRoFU3yAmgWR0CYDUZ1V5rydX2UKGgGaAloD0MIqAGDpM8TbkCUhpRSlGgVTSQBaBZHQJgPZBlcyFh1ZS4="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 248, "n_steps": 1024, "gamma": 0.999, "gae_lambda": 0.98, "ent_coef": 0.01, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 4, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWVwwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOC9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS4BDAgABlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOC9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoFmgNjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoF4wHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/yZmZmZmZmoWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "system_info": {"OS": "Linux-5.10.133+-x86_64-with-glibc2.27 #1 SMP Fri Aug 26 08:44:51 UTC 2022", "Python": "3.8.16", "Stable-Baselines3": "1.6.2", "PyTorch": "1.13.0+cu116", "GPU Enabled": "True", "Numpy": "1.21.6", "Gym": "0.21.0"}}
 
1
+ {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gASVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7f06fb60f3b0>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f06fb60f440>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f06fb60f4d0>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f06fb60f560>", "_build": "<function ActorCriticPolicy._build at 0x7f06fb60f5f0>", "forward": "<function ActorCriticPolicy.forward at 0x7f06fb60f680>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x7f06fb60f710>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f06fb60f7a0>", "_predict": "<function ActorCriticPolicy._predict at 0x7f06fb60f830>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f06fb60f8c0>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f06fb60f950>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f06fb60f9e0>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc_data object at 0x7f06fb64ecf0>"}, "verbose": 1, "policy_kwargs": {}, "num_timesteps": 1000448, "_total_timesteps": 1000000.0, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1683783101143513005, "learning_rate": 0.0003, "tensorboard_log": null, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gASVqgAAAAAAAACMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMDF9yZWNvbnN0cnVjdJSTlIwFbnVtcHmUjAduZGFycmF5lJOUSwCFlEMBYpSHlFKUKEsBSwFLCIaUaAOMBWR0eXBllJOUjAJmNJSJiIeUUpQoSwOMATyUTk5OSv////9K/////0sAdJRiiUMg5oUNPc+pHj8CG5q9IqCgvgzsqryB/6i9AAAAAAAAAACUdJRiLg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gASViQAAAAAAAACMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMDF9yZWNvbnN0cnVjdJSTlIwFbnVtcHmUjAduZGFycmF5lJOUSwCFlEMBYpSHlFKUKEsBSwGFlGgDjAVkdHlwZZSTlIwCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYolDAQCUdJRiLg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.00044800000000000395, "_stats_window_size": 100, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gASVPQwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQHCtthuwX6+MAWyUTXMBjAF0lEdAmFhnJLdvbXV9lChoBkdAb58ZflZHNGgHTV4BaAhHQJhaATRIBil1fZQoaAZHQG3kd07r9l5oB01GAWgIR0CYXLQQcxTLdX2UKGgGR0BxBlutOmBOaAdNbQFoCEdAmF5euA7Pp3V9lChoBkdAcK20/4ZdfWgHTVUBaAhHQJhf+u0TlDF1fZQoaAZHQHB65fx+a0BoB00nAWgIR0CYYpPlMh5gdX2UKGgGR0BwJjr7fpEAaAdNZgFoCEdAmGQ380k4WHV9lChoBkdAbHvWK/EfkmgHTbQBaAhHQJhmPBKtga51fZQoaAZHQG9oW7nPmgdoB03OAWgIR0CYaZK8+RozdX2UKGgGR0BwnjBO58SgaAdNPgFoCEdAmGsCiItUXHV9lChoBkdAcRj1sLv1DmgHTXIBaAhHQJht7EdeY2N1fZQoaAZHQB0cz67/XGxoB00KAWgIR0CYbyFFUhmodX2UKGgGR0Bwxr6ZYxL1aAdNCgFoCEdAmHByyyD7InV9lChoBkdARH748EFGG2gHTQ4BaAhHQJhxq7SRbKR1fZQoaAZHQHDcH8sMAm1oB00ZAWgIR0CYdCjIq9XcdX2UKGgGR0BwZJoduHeraAdNKQFoCEdAmHWECaJAMXV9lChoBkfAHMgvDgqEvmgHTQsBaAhHQJh2w1TBInV1fZQoaAZHQEw+Uu+RHPNoB0vyaAhHQJh33bfxc3V1fZQoaAZHQHD2XUpd8iRoB00qAWgIR0CYepqh11W9dX2UKGgGR0BvO6Jhvze5aAdNagFoCEdAmHw6BEroXHV9lChoBkdAcgKCemNzbWgHTWQBaAhHQJh90gHNX5p1fZQoaAZHQHDSgrH2h7FoB01EAWgIR0CYgHYqoZQ6dX2UKGgGR0Bv/BWtEG7jaAdNTAFoCEdAmIH6hg3Lm3V9lChoBkdAcJpNFjNILGgHTScBaAhHQJiDVlAeJYV1fZQoaAZHQHCaZBX0XgtoB01TAWgIR0CYhiJWvKU3dX2UKGgGR0BwzS1F6RhdaAdNIQFoCEdAmIdviPyTZHV9lChoBkdAa9IkDZDiO2gHTUEBaAhHQJiI4t/WlM11fZQoaAZHQG6bhbW3BpJoB007AWgIR0CYi35le4TcdX2UKGgGR0BsyVzMibDuaAdNOgFoCEdAmIzqnWJ79nV9lChoBkdAcR932mHgxmgHTVQCaAhHQJiPm/Zdv891fZQoaAZHQHFbgyAQQMBoB01JAWgIR0CYkk8/lhgFdX2UKGgGR0BtJsc81XNkaAdNXAFoCEdAmJPmpMpPRHV9lChoBkdAP0lbmlqJuWgHS/xoCEdAmJUSxu89OnV9lChoBkdAZX4ecQRPGmgHTegDaAhHQJia4Qrc0tR1fZQoaAZHQDXXefqX4TNoB00LAWgIR0CYnUqtozvadX2UKGgGR0BvXEcsDnvEaAdNMQFoCEdAmJ6qX0Gu93V9lChoBkdAcUABEa2nbmgHTTABaAhHQJigB33YcvN1fZQoaAZHQGsVhu4wyqNoB01GAWgIR0CYoq8fms/6dX2UKGgGR0BsaLR2KVIJaAdNbwFoCEdAmKRYUSIxg3V9lChoBkdAbHIwHJLdvmgHTUoBaAhHQJil3WAf+0h1fZQoaAZHQG8xVJL/S6VoB00wAWgIR0CYqIM/yGzsdX2UKGgGR0BiQvJ1aGHpaAdN6ANoCEdAmK0c/Y8MeHV9lChoBkdAbpVY5ksjFGgHTUkBaAhHQJiv49zOopB1fZQoaAZHQHGPfM8ox59oB002AWgIR0CYsYndO6/ZdX2UKGgGR0BwzIxKxs2vaAdNcQFoCEdAmLM6LS/j83V9lChoBkdAcI7ikO7QLWgHTVoBaAhHQJi2AUbkwN91fZQoaAZHQDj9+iJwbVBoB0v/aAhHQJi3JqDbrTp1fZQoaAZHQG/IONo8IRhoB01FAWgIR0CYuJxGlQ/HdX2UKGgGR0Buk99H+ZPVaAdNPwFoCEdAmLtKyKNyYHV9lChoBkdAbR/v3rUsnWgHTZoBaAhHQJi9J3r2QGR1fZQoaAZHQGUN1s+FDfFoB03oA2gIR0CYwvOEug6EdX2UKGgGR0BttuYUnG83aAdNSQFoCEdAmMRv3rUsnXV9lChoBkdAYXjTjNpudmgHTegDaAhHQJjKMGs3hn91fZQoaAZHQD8CjmCAc1hoB0vyaAhHQJjMei0v4/N1fZQoaAZHQExR13+uNgloB0vlaAhHQJjNh95Qgs91fZQoaAZHQG7JYHoouwpoB02PAWgIR0CYz1c1O0swdX2UKGgGR0Bwqc+RoysTaAdNbAFoCEdAmNI6U3XI2nV9lChoBkdAQwPgccU/OmgHTQQBaAhHQJjTaCFsYVJ1fZQoaAZHQG2HcVgx8D1oB00rAWgIR0CY1MfAsTWYdX2UKGgGR0BB0R5C4SYgaAdNEwFoCEdAmNYGnbZezHV9lChoBkdAcDKb8m8dxWgHTSIBaAhHQJjYjf3vhIh1fZQoaAZHQGPKYfOlfqpoB03oA2gIR0CY3kEt/WlNdX2UKGgGR0BxnWvC/GlzaAdN2QNoCEdAmOP+1v2oN3V9lChoBkdAbjoEX+ERJ2gHTUkBaAhHQJjle9Jz1bt1fZQoaAZHQG2aCpvP1L9oB009AWgIR0CY5vWmP5pKdX2UKGgGR0Bwwq0jTrmhaAdNYAFoCEdAmOnL7j1f3XV9lChoBkdAcBaiUgSvkmgHTU4BaAhHQJjrbz+WGAV1fZQoaAZHQG/jEoWpIc1oB01CAWgIR0CY7PxNZeRgdX2UKGgGR0Bx+IibDuSfaAdNVQFoCEdAmO+/JV81GnV9lChoBkdAcIpGPPszEmgHTUIBaAhHQJjxN37k4m11fZQoaAZHQG6PiR4hUzdoB00kAWgIR0CY8oaWHDaXdX2UKGgGR0Bu0gbXHzYmaAdNKgFoCEdAmPPbxNIsiHV9lChoBkdAPu89SuQp4WgHS+poCEdAmPY3bypaR3V9lChoBkdAbc/AymALA2gHTT4BaAhHQJj3pehPCVN1fZQoaAZHv/njs2NvOyFoB0vraAhHQJj4s4cWCVd1fZQoaAZHQGHys67ulXRoB03oA2gIR0CY/nDziCJ5dX2UKGgGR0Bxo2SjgydnaAdNKQFoCEdAmP/TP8hs7HV9lChoBkdAcJQEAo5PuWgHTTUBaAhHQJkCcOe8PFx1fZQoaAZHQG6ASn1nM+xoB003AWgIR0CZA9UrCm/GdX2UKGgGR0Bw/iW0JF9baAdNiQFoCEdAmQWXz+WGAXV9lChoBkdAbUihCdBjWmgHTUoBaAhHQJkIVokAxSJ1fZQoaAZHQHBCdTLns9loB02TAWgIR0CZCiYhdMTOdX2UKGgGR0Bhnk6eXiR5aAdN6ANoCEdAmQ/kmlZX+3V9lChoBkdAbtyGiYb832gHTTABaAhHQJkRSHck+ot1fZQoaAZHQDxnXHzYmLNoB00IAWgIR0CZE7U0vXbudX2UKGgGR0BwCRaxHG0eaAdNkgJoCEdAmRarIxQBP3V9lChoBkdAb9HTmW+oL2gHTVEBaAhHQJkZry8SPEN1fZQoaAZHQHGUQIldC3RoB03bAWgIR0CZG8VWCEpRdX2UKGgGR0BxkX9bX6InaAdNNAFoCEdAmR0giRnvlXV9lChoBkdAcITYbbUPQWgHTT8BaAhHQJkfyZpi7TV1fZQoaAZHQHCIzrRjSXtoB006AWgIR0CZITT/yXlbdX2UKGgGR0BirsI5YHPeaAdN6ANoCEdAmSc8U21lXnV9lChoBkdAbhdLU1AJLWgHTUcBaAhHQJko0USIxg11fZQoaAZHQHF8ycwxnFpoB01+A2gIR0CZLhNcGC7LdX2UKGgGR0Bw7fgm7aqTaAdNXwFoCEdAmTDbl/6O53V9lChoBkdAb7AeCCjDbmgHTSIBaAhHQJkyMMgEEDB1fZQoaAZHQHBb0LQXyiFoB00vAWgIR0CZM48ujASGdX2UKGgGR0BuVfLaEi+taAdNRgFoCEdAmTUJ6IFeOXV9lChoBkdAbY7J4B3iaWgHTSgCaAhHQJk4zTfBN211fZQoaAZHQGvpawMYuTRoB01YAWgIR0CZOllxOtW/dWUu"}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gASVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 3908, "observation_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gASVlAIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBVudW1weS5jb3JlLm11bHRpYXJyYXmUjAxfcmVjb25zdHJ1Y3SUk5RoBowHbmRhcnJheZSTlEsAhZRDAWKUh5RSlChLAUsIhZRoB4wCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYolDCAEBAQEBAQEBlHSUYowNYm91bmRlZF9hYm92ZZRoEGgSSwCFlGgUh5RSlChLAUsIhZRoGolDCAEBAQEBAQEBlHSUYowGX3NoYXBllEsIhZSMA2xvd5RoEGgSSwCFlGgUh5RSlChLAUsIhZRoColDIAAAtMIAALTCAACgwAAAoMDbD0nAAACgwAAAAIAAAACAlHSUYowEaGlnaJRoEGgSSwCFlGgUh5RSlChLAUsIhZRoColDIAAAtEIAALRCAACgQAAAoEDbD0lAAACgQAAAgD8AAIA/lHSUYowIbG93X3JlcHKUjFtbLTkwLiAgICAgICAgLTkwLiAgICAgICAgIC01LiAgICAgICAgIC01LiAgICAgICAgIC0zLjE0MTU5MjcgIC01LgogIC0wLiAgICAgICAgIC0wLiAgICAgICBdlIwJaGlnaF9yZXBylIxTWzkwLiAgICAgICAgOTAuICAgICAgICAgNS4gICAgICAgICA1LiAgICAgICAgIDMuMTQxNTkyNyAgNS4KICAxLiAgICAgICAgIDEuICAgICAgIF2UjApfbnBfcmFuZG9tlE51Yi4=", "dtype": "float32", "bounded_below": "[ True True True True True True True True]", "bounded_above": "[ True True True True True True True True]", "_shape": [8], "low": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "low_repr": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high_repr": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "_np_random": null}, "action_space": {":type:": "<class 'gymnasium.spaces.discrete.Discrete'>", ":serialized:": "gASV1QAAAAAAAACMGWd5bW5hc2l1bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIBAAAAAAAAACUhpRSlIwFc3RhcnSUaAhoDkMIAAAAAAAAAACUhpRSlIwGX3NoYXBllCloCmgOjApfbnBfcmFuZG9tlE51Yi4=", "n": "4", "start": "0", "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 1, "n_steps": 1024, "gamma": 0.999, "gae_lambda": 0.98, "ent_coef": 0.01, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 4, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gASV7wIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsBSwFLE0MEiABTAJROhZQpjAFflIWUjF8vaG9tZS9hYXl1c2gvbWluaWNvbmRhMy9lbnZzL3B5MzcvbGliL3B5dGhvbjMuNy9zaXRlLXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS4RDAgABlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMXy9ob21lL2FheXVzaC9taW5pY29uZGEzL2VudnMvcHkzNy9saWIvcHl0aG9uMy43L3NpdGUtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz/JmZmZmZmahZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gASV7wIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsBSwFLE0MEiABTAJROhZQpjAFflIWUjF8vaG9tZS9hYXl1c2gvbWluaWNvbmRhMy9lbnZzL3B5MzcvbGliL3B5dGhvbjMuNy9zaXRlLXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS4RDAgABlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMXy9ob21lL2FheXVzaC9taW5pY29uZGEzL2VudnMvcHkzNy9saWIvcHl0aG9uMy43L3NpdGUtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz8zqSowVTJhhZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "system_info": {"OS": "Linux-5.10.16.3-microsoft-standard-WSL2-x86_64-with-debian-bookworm-sid # 1 SMP Fri Apr 2 22:23:49 UTC 2021", "Python": "3.7.16", "Stable-Baselines3": "2.0.0a5", "PyTorch": "1.13.1+cu117", "GPU Enabled": "True", "Numpy": "1.21.6", "Cloudpickle": "2.2.1", "Gymnasium": "0.28.1", "OpenAI Gym": "0.21.0"}}
ppo-Lunarlander-v2.zip ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f1bcec83f2210730726edd22378004fef22e1ca51a472cc5e5a26b736b0dcf86
3
+ size 146335
ppo-Lunarlander-v2/_stable_baselines3_version ADDED
@@ -0,0 +1 @@
 
 
1
+ 2.0.0a5
ppo-Lunarlander-v2/data ADDED
@@ -0,0 +1,99 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "policy_class": {
3
+ ":type:": "<class 'abc.ABCMeta'>",
4
+ ":serialized:": "gASVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
5
+ "__module__": "stable_baselines3.common.policies",
6
+ "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
7
+ "__init__": "<function ActorCriticPolicy.__init__ at 0x7f06fb60f3b0>",
8
+ "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f06fb60f440>",
9
+ "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f06fb60f4d0>",
10
+ "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f06fb60f560>",
11
+ "_build": "<function ActorCriticPolicy._build at 0x7f06fb60f5f0>",
12
+ "forward": "<function ActorCriticPolicy.forward at 0x7f06fb60f680>",
13
+ "extract_features": "<function ActorCriticPolicy.extract_features at 0x7f06fb60f710>",
14
+ "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f06fb60f7a0>",
15
+ "_predict": "<function ActorCriticPolicy._predict at 0x7f06fb60f830>",
16
+ "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f06fb60f8c0>",
17
+ "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f06fb60f950>",
18
+ "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f06fb60f9e0>",
19
+ "__abstractmethods__": "frozenset()",
20
+ "_abc_impl": "<_abc_data object at 0x7f06fb64ecf0>"
21
+ },
22
+ "verbose": 1,
23
+ "policy_kwargs": {},
24
+ "num_timesteps": 1000448,
25
+ "_total_timesteps": 1000000.0,
26
+ "_num_timesteps_at_start": 0,
27
+ "seed": null,
28
+ "action_noise": null,
29
+ "start_time": 1683783101143513005,
30
+ "learning_rate": 0.0003,
31
+ "tensorboard_log": null,
32
+ "_last_obs": {
33
+ ":type:": "<class 'numpy.ndarray'>",
34
+ ":serialized:": "gASVqgAAAAAAAACMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMDF9yZWNvbnN0cnVjdJSTlIwFbnVtcHmUjAduZGFycmF5lJOUSwCFlEMBYpSHlFKUKEsBSwFLCIaUaAOMBWR0eXBllJOUjAJmNJSJiIeUUpQoSwOMATyUTk5OSv////9K/////0sAdJRiiUMg5oUNPc+pHj8CG5q9IqCgvgzsqryB/6i9AAAAAAAAAACUdJRiLg=="
35
+ },
36
+ "_last_episode_starts": {
37
+ ":type:": "<class 'numpy.ndarray'>",
38
+ ":serialized:": "gASViQAAAAAAAACMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMDF9yZWNvbnN0cnVjdJSTlIwFbnVtcHmUjAduZGFycmF5lJOUSwCFlEMBYpSHlFKUKEsBSwGFlGgDjAVkdHlwZZSTlIwCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYolDAQCUdJRiLg=="
39
+ },
40
+ "_last_original_obs": null,
41
+ "_episode_num": 0,
42
+ "use_sde": false,
43
+ "sde_sample_freq": -1,
44
+ "_current_progress_remaining": -0.00044800000000000395,
45
+ "_stats_window_size": 100,
46
+ "ep_info_buffer": {
47
+ ":type:": "<class 'collections.deque'>",
48
+ ":serialized:": "gASVPQwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQHCtthuwX6+MAWyUTXMBjAF0lEdAmFhnJLdvbXV9lChoBkdAb58ZflZHNGgHTV4BaAhHQJhaATRIBil1fZQoaAZHQG3kd07r9l5oB01GAWgIR0CYXLQQcxTLdX2UKGgGR0BxBlutOmBOaAdNbQFoCEdAmF5euA7Pp3V9lChoBkdAcK20/4ZdfWgHTVUBaAhHQJhf+u0TlDF1fZQoaAZHQHB65fx+a0BoB00nAWgIR0CYYpPlMh5gdX2UKGgGR0BwJjr7fpEAaAdNZgFoCEdAmGQ380k4WHV9lChoBkdAbHvWK/EfkmgHTbQBaAhHQJhmPBKtga51fZQoaAZHQG9oW7nPmgdoB03OAWgIR0CYaZK8+RozdX2UKGgGR0BwnjBO58SgaAdNPgFoCEdAmGsCiItUXHV9lChoBkdAcRj1sLv1DmgHTXIBaAhHQJht7EdeY2N1fZQoaAZHQB0cz67/XGxoB00KAWgIR0CYbyFFUhmodX2UKGgGR0Bwxr6ZYxL1aAdNCgFoCEdAmHByyyD7InV9lChoBkdARH748EFGG2gHTQ4BaAhHQJhxq7SRbKR1fZQoaAZHQHDcH8sMAm1oB00ZAWgIR0CYdCjIq9XcdX2UKGgGR0BwZJoduHeraAdNKQFoCEdAmHWECaJAMXV9lChoBkfAHMgvDgqEvmgHTQsBaAhHQJh2w1TBInV1fZQoaAZHQEw+Uu+RHPNoB0vyaAhHQJh33bfxc3V1fZQoaAZHQHD2XUpd8iRoB00qAWgIR0CYepqh11W9dX2UKGgGR0BvO6Jhvze5aAdNagFoCEdAmHw6BEroXHV9lChoBkdAcgKCemNzbWgHTWQBaAhHQJh90gHNX5p1fZQoaAZHQHDSgrH2h7FoB01EAWgIR0CYgHYqoZQ6dX2UKGgGR0Bv/BWtEG7jaAdNTAFoCEdAmIH6hg3Lm3V9lChoBkdAcJpNFjNILGgHTScBaAhHQJiDVlAeJYV1fZQoaAZHQHCaZBX0XgtoB01TAWgIR0CYhiJWvKU3dX2UKGgGR0BwzS1F6RhdaAdNIQFoCEdAmIdviPyTZHV9lChoBkdAa9IkDZDiO2gHTUEBaAhHQJiI4t/WlM11fZQoaAZHQG6bhbW3BpJoB007AWgIR0CYi35le4TcdX2UKGgGR0BsyVzMibDuaAdNOgFoCEdAmIzqnWJ79nV9lChoBkdAcR932mHgxmgHTVQCaAhHQJiPm/Zdv891fZQoaAZHQHFbgyAQQMBoB01JAWgIR0CYkk8/lhgFdX2UKGgGR0BtJsc81XNkaAdNXAFoCEdAmJPmpMpPRHV9lChoBkdAP0lbmlqJuWgHS/xoCEdAmJUSxu89OnV9lChoBkdAZX4ecQRPGmgHTegDaAhHQJia4Qrc0tR1fZQoaAZHQDXXefqX4TNoB00LAWgIR0CYnUqtozvadX2UKGgGR0BvXEcsDnvEaAdNMQFoCEdAmJ6qX0Gu93V9lChoBkdAcUABEa2nbmgHTTABaAhHQJigB33YcvN1fZQoaAZHQGsVhu4wyqNoB01GAWgIR0CYoq8fms/6dX2UKGgGR0BsaLR2KVIJaAdNbwFoCEdAmKRYUSIxg3V9lChoBkdAbHIwHJLdvmgHTUoBaAhHQJil3WAf+0h1fZQoaAZHQG8xVJL/S6VoB00wAWgIR0CYqIM/yGzsdX2UKGgGR0BiQvJ1aGHpaAdN6ANoCEdAmK0c/Y8MeHV9lChoBkdAbpVY5ksjFGgHTUkBaAhHQJiv49zOopB1fZQoaAZHQHGPfM8ox59oB002AWgIR0CYsYndO6/ZdX2UKGgGR0BwzIxKxs2vaAdNcQFoCEdAmLM6LS/j83V9lChoBkdAcI7ikO7QLWgHTVoBaAhHQJi2AUbkwN91fZQoaAZHQDj9+iJwbVBoB0v/aAhHQJi3JqDbrTp1fZQoaAZHQG/IONo8IRhoB01FAWgIR0CYuJxGlQ/HdX2UKGgGR0Buk99H+ZPVaAdNPwFoCEdAmLtKyKNyYHV9lChoBkdAbR/v3rUsnWgHTZoBaAhHQJi9J3r2QGR1fZQoaAZHQGUN1s+FDfFoB03oA2gIR0CYwvOEug6EdX2UKGgGR0BttuYUnG83aAdNSQFoCEdAmMRv3rUsnXV9lChoBkdAYXjTjNpudmgHTegDaAhHQJjKMGs3hn91fZQoaAZHQD8CjmCAc1hoB0vyaAhHQJjMei0v4/N1fZQoaAZHQExR13+uNgloB0vlaAhHQJjNh95Qgs91fZQoaAZHQG7JYHoouwpoB02PAWgIR0CYz1c1O0swdX2UKGgGR0Bwqc+RoysTaAdNbAFoCEdAmNI6U3XI2nV9lChoBkdAQwPgccU/OmgHTQQBaAhHQJjTaCFsYVJ1fZQoaAZHQG2HcVgx8D1oB00rAWgIR0CY1MfAsTWYdX2UKGgGR0BB0R5C4SYgaAdNEwFoCEdAmNYGnbZezHV9lChoBkdAcDKb8m8dxWgHTSIBaAhHQJjYjf3vhIh1fZQoaAZHQGPKYfOlfqpoB03oA2gIR0CY3kEt/WlNdX2UKGgGR0BxnWvC/GlzaAdN2QNoCEdAmOP+1v2oN3V9lChoBkdAbjoEX+ERJ2gHTUkBaAhHQJjle9Jz1bt1fZQoaAZHQG2aCpvP1L9oB009AWgIR0CY5vWmP5pKdX2UKGgGR0Bwwq0jTrmhaAdNYAFoCEdAmOnL7j1f3XV9lChoBkdAcBaiUgSvkmgHTU4BaAhHQJjrbz+WGAV1fZQoaAZHQG/jEoWpIc1oB01CAWgIR0CY7PxNZeRgdX2UKGgGR0Bx+IibDuSfaAdNVQFoCEdAmO+/JV81GnV9lChoBkdAcIpGPPszEmgHTUIBaAhHQJjxN37k4m11fZQoaAZHQG6PiR4hUzdoB00kAWgIR0CY8oaWHDaXdX2UKGgGR0Bu0gbXHzYmaAdNKgFoCEdAmPPbxNIsiHV9lChoBkdAPu89SuQp4WgHS+poCEdAmPY3bypaR3V9lChoBkdAbc/AymALA2gHTT4BaAhHQJj3pehPCVN1fZQoaAZHv/njs2NvOyFoB0vraAhHQJj4s4cWCVd1fZQoaAZHQGHys67ulXRoB03oA2gIR0CY/nDziCJ5dX2UKGgGR0Bxo2SjgydnaAdNKQFoCEdAmP/TP8hs7HV9lChoBkdAcJQEAo5PuWgHTTUBaAhHQJkCcOe8PFx1fZQoaAZHQG6ASn1nM+xoB003AWgIR0CZA9UrCm/GdX2UKGgGR0Bw/iW0JF9baAdNiQFoCEdAmQWXz+WGAXV9lChoBkdAbUihCdBjWmgHTUoBaAhHQJkIVokAxSJ1fZQoaAZHQHBCdTLns9loB02TAWgIR0CZCiYhdMTOdX2UKGgGR0Bhnk6eXiR5aAdN6ANoCEdAmQ/kmlZX+3V9lChoBkdAbtyGiYb832gHTTABaAhHQJkRSHck+ot1fZQoaAZHQDxnXHzYmLNoB00IAWgIR0CZE7U0vXbudX2UKGgGR0BwCRaxHG0eaAdNkgJoCEdAmRarIxQBP3V9lChoBkdAb9HTmW+oL2gHTVEBaAhHQJkZry8SPEN1fZQoaAZHQHGUQIldC3RoB03bAWgIR0CZG8VWCEpRdX2UKGgGR0BxkX9bX6InaAdNNAFoCEdAmR0giRnvlXV9lChoBkdAcITYbbUPQWgHTT8BaAhHQJkfyZpi7TV1fZQoaAZHQHCIzrRjSXtoB006AWgIR0CZITT/yXlbdX2UKGgGR0BirsI5YHPeaAdN6ANoCEdAmSc8U21lXnV9lChoBkdAbhdLU1AJLWgHTUcBaAhHQJko0USIxg11fZQoaAZHQHF8ycwxnFpoB01+A2gIR0CZLhNcGC7LdX2UKGgGR0Bw7fgm7aqTaAdNXwFoCEdAmTDbl/6O53V9lChoBkdAb7AeCCjDbmgHTSIBaAhHQJkyMMgEEDB1fZQoaAZHQHBb0LQXyiFoB00vAWgIR0CZM48ujASGdX2UKGgGR0BuVfLaEi+taAdNRgFoCEdAmTUJ6IFeOXV9lChoBkdAbY7J4B3iaWgHTSgCaAhHQJk4zTfBN211fZQoaAZHQGvpawMYuTRoB01YAWgIR0CZOllxOtW/dWUu"
49
+ },
50
+ "ep_success_buffer": {
51
+ ":type:": "<class 'collections.deque'>",
52
+ ":serialized:": "gASVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
53
+ },
54
+ "_n_updates": 3908,
55
+ "observation_space": {
56
+ ":type:": "<class 'gymnasium.spaces.box.Box'>",
57
+ ":serialized:": "gASVlAIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBVudW1weS5jb3JlLm11bHRpYXJyYXmUjAxfcmVjb25zdHJ1Y3SUk5RoBowHbmRhcnJheZSTlEsAhZRDAWKUh5RSlChLAUsIhZRoB4wCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYolDCAEBAQEBAQEBlHSUYowNYm91bmRlZF9hYm92ZZRoEGgSSwCFlGgUh5RSlChLAUsIhZRoGolDCAEBAQEBAQEBlHSUYowGX3NoYXBllEsIhZSMA2xvd5RoEGgSSwCFlGgUh5RSlChLAUsIhZRoColDIAAAtMIAALTCAACgwAAAoMDbD0nAAACgwAAAAIAAAACAlHSUYowEaGlnaJRoEGgSSwCFlGgUh5RSlChLAUsIhZRoColDIAAAtEIAALRCAACgQAAAoEDbD0lAAACgQAAAgD8AAIA/lHSUYowIbG93X3JlcHKUjFtbLTkwLiAgICAgICAgLTkwLiAgICAgICAgIC01LiAgICAgICAgIC01LiAgICAgICAgIC0zLjE0MTU5MjcgIC01LgogIC0wLiAgICAgICAgIC0wLiAgICAgICBdlIwJaGlnaF9yZXBylIxTWzkwLiAgICAgICAgOTAuICAgICAgICAgNS4gICAgICAgICA1LiAgICAgICAgIDMuMTQxNTkyNyAgNS4KICAxLiAgICAgICAgIDEuICAgICAgIF2UjApfbnBfcmFuZG9tlE51Yi4=",
58
+ "dtype": "float32",
59
+ "bounded_below": "[ True True True True True True True True]",
60
+ "bounded_above": "[ True True True True True True True True]",
61
+ "_shape": [
62
+ 8
63
+ ],
64
+ "low": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]",
65
+ "high": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]",
66
+ "low_repr": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]",
67
+ "high_repr": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]",
68
+ "_np_random": null
69
+ },
70
+ "action_space": {
71
+ ":type:": "<class 'gymnasium.spaces.discrete.Discrete'>",
72
+ ":serialized:": "gASV1QAAAAAAAACMGWd5bW5hc2l1bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIBAAAAAAAAACUhpRSlIwFc3RhcnSUaAhoDkMIAAAAAAAAAACUhpRSlIwGX3NoYXBllCloCmgOjApfbnBfcmFuZG9tlE51Yi4=",
73
+ "n": "4",
74
+ "start": "0",
75
+ "_shape": [],
76
+ "dtype": "int64",
77
+ "_np_random": null
78
+ },
79
+ "n_envs": 1,
80
+ "n_steps": 1024,
81
+ "gamma": 0.999,
82
+ "gae_lambda": 0.98,
83
+ "ent_coef": 0.01,
84
+ "vf_coef": 0.5,
85
+ "max_grad_norm": 0.5,
86
+ "batch_size": 64,
87
+ "n_epochs": 4,
88
+ "clip_range": {
89
+ ":type:": "<class 'function'>",
90
+ ":serialized:": "gASV7wIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsBSwFLE0MEiABTAJROhZQpjAFflIWUjF8vaG9tZS9hYXl1c2gvbWluaWNvbmRhMy9lbnZzL3B5MzcvbGliL3B5dGhvbjMuNy9zaXRlLXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS4RDAgABlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMXy9ob21lL2FheXVzaC9taW5pY29uZGEzL2VudnMvcHkzNy9saWIvcHl0aG9uMy43L3NpdGUtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz/JmZmZmZmahZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"
91
+ },
92
+ "clip_range_vf": null,
93
+ "normalize_advantage": true,
94
+ "target_kl": null,
95
+ "lr_schedule": {
96
+ ":type:": "<class 'function'>",
97
+ ":serialized:": "gASV7wIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsBSwFLE0MEiABTAJROhZQpjAFflIWUjF8vaG9tZS9hYXl1c2gvbWluaWNvbmRhMy9lbnZzL3B5MzcvbGliL3B5dGhvbjMuNy9zaXRlLXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS4RDAgABlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMXy9ob21lL2FheXVzaC9taW5pY29uZGEzL2VudnMvcHkzNy9saWIvcHl0aG9uMy43L3NpdGUtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz8zqSowVTJhhZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"
98
+ }
99
+ }
ppo-Lunarlander-v2/policy.optimizer.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:23f03ad250dde15545fa80dc8620ef5a94c930c56de1a14f55039ac4abc71f73
3
+ size 87929
ppo-Lunarlander-v2/policy.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:81a24d8378f26828a166955cb03fcf386fcd1f0dcf0767a149336e4c6047077b
3
+ size 43329
ppo-Lunarlander-v2/pytorch_variables.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d030ad8db708280fcae77d87e973102039acd23a11bdecc3db8eb6c0ac940ee1
3
+ size 431
ppo-Lunarlander-v2/system_info.txt ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ - OS: Linux-5.10.16.3-microsoft-standard-WSL2-x86_64-with-debian-bookworm-sid # 1 SMP Fri Apr 2 22:23:49 UTC 2021
2
+ - Python: 3.7.16
3
+ - Stable-Baselines3: 2.0.0a5
4
+ - PyTorch: 1.13.1+cu117
5
+ - GPU Enabled: True
6
+ - Numpy: 1.21.6
7
+ - Cloudpickle: 2.2.1
8
+ - Gymnasium: 0.28.1
9
+ - OpenAI Gym: 0.21.0
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 263.4026389837111, "std_reward": 12.539074516974933, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2022-12-13T01:24:01.734416"}
 
1
+ {"mean_reward": 227.16474877851095, "std_reward": 83.81876941049664, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2023-05-10T23:01:11.486767"}