Upload PPO LunarLander-v2 trained agent
Browse files- README.md +1 -1
- config.json +1 -1
- ppo-LunarLander-v2.zip +2 -2
- ppo-LunarLander-v2/data +22 -22
- ppo-LunarLander-v2/policy.optimizer.pth +1 -1
- ppo-LunarLander-v2/policy.pth +1 -1
- replay.mp4 +0 -0
- results.json +1 -1
README.md
CHANGED
@@ -16,7 +16,7 @@ model-index:
|
|
16 |
type: LunarLander-v2
|
17 |
metrics:
|
18 |
- type: mean_reward
|
19 |
-
value:
|
20 |
name: mean_reward
|
21 |
verified: false
|
22 |
---
|
|
|
16 |
type: LunarLander-v2
|
17 |
metrics:
|
18 |
- type: mean_reward
|
19 |
+
value: 281.00 +/- 19.72
|
20 |
name: mean_reward
|
21 |
verified: false
|
22 |
---
|
config.json
CHANGED
@@ -1 +1 @@
|
|
1 |
-
{"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7fddaa2e90d0>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7fddaa2e9160>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7fddaa2e91f0>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7fddaa2e9280>", "_build": "<function ActorCriticPolicy._build at 0x7fddaa2e9310>", "forward": "<function ActorCriticPolicy.forward at 0x7fddaa2e93a0>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x7fddaa2e9430>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7fddaa2e94c0>", "_predict": "<function ActorCriticPolicy._predict at 0x7fddaa2e9550>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7fddaa2e95e0>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7fddaa2e9670>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7fddaa2e9700>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7fddaa2e3a80>"}, "verbose": 1, "policy_kwargs": {}, "num_timesteps": 1003520, "_total_timesteps": 1000000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1682426688940370667, "learning_rate": 0.0003, "tensorboard_log": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVwwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOS9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS4JDAgABlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOS9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoFmgNjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoF4wHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/M6kqMFUyYYWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="}, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAICKH76+Uic/nQSfPdJZpr4RT7q9LviVPQAAAAAAAAAAsyEJvXLOZj4/MiY+j3x8vmdrET1WVJ87AAAAAAAAAAAA15s8GJ2FPnWW7z1do5S+N4e0PW6WhT0AAAAAAAAAAE1ac72p/za8dGM9PXDojjwfT5q94mtrPQAAgD8AAIA/zeCsvVRUKj6CZ6A9tGaBvljyCj0JlUo8AAAAAAAAAACaZZO99ahkP22/l73vbMC+5l5KvQm/q7wAAAAAAAAAAOaKvr2kyGs6zyIhPPLDILPpqty7evUHswAAgD8AAAAAza0LPdQmn7yannC9GWcovOa8Ujyaqp49AACAPwAAgD8Nadc9q+UUPx/2sTw32J++aMuPPeND8LwAAAAAAAAAAGZIv738DI8/WtaDvnr1w77P+xS+4JSvvQAAAAAAAAAA5opLPcqhiD55bIa93EmMvnaK6Dx2bNa8AAAAAAAAAADNLEA99g1hP4WK6j3ewMy+a5suPQbET70AAAAAAAAAAABk+jvhCo+6mAM/OiecHbn6yze7otZMuQAAgD8AAIA/wEPdvYrZYT/9uKG9MMq8vkh/yr2JBS88AAAAAAAAAACz4bK9oWecvGMbzj2z7iO9dC4OvsAdAr4AAAAAAACAP7ZjlT67SCI/zoVUPEDOo77krlc+jdTQvAAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.0035199999999999676, "_stats_window_size": 100, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVaRAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIb/JbdDLRbECUhpRSlIwBbJRNHwGMAXSUR0C1tCr8zhxYdX2UKGgGaAloD0MI5usy/KdVcECUhpRSlGgVTQYBaBZHQLW0Ne3QUpN1fZQoaAZoCWgPQwiJ1LSLqdxxQJSGlFKUaBVN4gFoFkdAtbSGckMTe3V9lChoBmgJaA9DCNvDXihgmHFAlIaUUpRoFU0iAWgWR0C1tJxlMAWBdX2UKGgGaAloD0MIyNEcWbnocECUhpRSlGgVTTIBaBZHQLW075Jsfq51fZQoaAZoCWgPQwiRm+EGvNdyQJSGlFKUaBVNDQFoFkdAtbT28cuJ13V9lChoBmgJaA9DCOmBj8GKAnBAlIaUUpRoFU0GAWgWR0C1tQaBAfMfdX2UKGgGaAloD0MI93XgnFF3cECUhpRSlGgVS/1oFkdAtbUWaOPvKHV9lChoBmgJaA9DCMNJmj9m+nFAlIaUUpRoFUvtaBZHQLW1LCr92ox1fZQoaAZoCWgPQwjAety32nVwQJSGlFKUaBVNCQFoFkdAtbY6ZfD1oXV9lChoBmgJaA9DCBx9zAdEcnJAlIaUUpRoFU0pAWgWR0C1tk8r/bTMdX2UKGgGaAloD0MIoyJOJ1ldcUCUhpRSlGgVTRQBaBZHQLW2VedCmdl1fZQoaAZoCWgPQwgWinQ/p8BxQJSGlFKUaBVNEAFoFkdAtbZpALRa5nV9lChoBmgJaA9DCJf/kH77+HBAlIaUUpRoFU0PAWgWR0C1ttF6mfoSdX2UKGgGaAloD0MII0kQrgDIcECUhpRSlGgVS/poFkdAtbbb3PAwf3V9lChoBmgJaA9DCMvydRl+Jm5AlIaUUpRoFU0MAWgWR0C1tvaUiY9gdX2UKGgGaAloD0MI74y2KomocECUhpRSlGgVTSABaBZHQLW3DO0svqV1fZQoaAZoCWgPQwjvWGyTisFdQJSGlFKUaBVN6ANoFkdAtbcdKCg9NnV9lChoBmgJaA9DCL9jeOzngXBAlIaUUpRoFU0EAWgWR0C1t18slLOBdX2UKGgGaAloD0MI1pC4x1LxcECUhpRSlGgVTRMBaBZHQLW3n1dgOSZ1fZQoaAZoCWgPQwjyI37Fmp9uQJSGlFKUaBVNAwFoFkdAtbfw5ggHNXV9lChoBmgJaA9DCPIIbqRsZXFAlIaUUpRoFUv7aBZHQLW38URWcSZ1fZQoaAZoCWgPQwghVn+E4UhyQJSGlFKUaBVL+2gWR0C1uAPt6X0HdX2UKGgGaAloD0MIqRd8mtM/ckCUhpRSlGgVS/NoFkdAtbgPCMxXXHV9lChoBmgJaA9DCNP1RNeFZXFAlIaUUpRoFU0jAWgWR0C1uC+32EkCdX2UKGgGaAloD0MIL4UHzW69cECUhpRSlGgVS+NoFkdAtbhF3aBZp3V9lChoBmgJaA9DCJW5+Ub01XFAlIaUUpRoFU0DAWgWR0C1udLZ8KG+dX2UKGgGaAloD0MIRdREnw+CbkCUhpRSlGgVTR0BaBZHQLW6DKvV3EB1fZQoaAZoCWgPQwgfoWZIVfVyQJSGlFKUaBVNHAFoFkdAtbosvnKW9nV9lChoBmgJaA9DCH0kJT0Ma3NAlIaUUpRoFUv3aBZHQLW6QfF72L51fZQoaAZoCWgPQwiLFqBttSNvQJSGlFKUaBVNEwFoFkdAtbqAXenAI3V9lChoBmgJaA9DCGgIxyx74m1AlIaUUpRoFU0TAWgWR0C1uqUhaC+UdX2UKGgGaAloD0MIb38uGrIbcUCUhpRSlGgVTRABaBZHQLW6txVyWAx1fZQoaAZoCWgPQwhsmKHxRLlwQJSGlFKUaBVNDgFoFkdAtbrDLns9jnV9lChoBmgJaA9DCOknnN0aRXBAlIaUUpRoFU0GAWgWR0C1ux6aTfSAdX2UKGgGaAloD0MI5dU5BuSbcECUhpRSlGgVTSwBaBZHQLW7MJrcj7h1fZQoaAZoCWgPQwgZjBGJAuNxQJSGlFKUaBVNHAFoFkdAtbt92KVIJHV9lChoBmgJaA9DCCidSDDVUXJAlIaUUpRoFU0fAWgWR0C1u4RbW3BpdX2UKGgGaAloD0MIVryReaTfcUCUhpRSlGgVTQEBaBZHQLW7kw6ySmt1fZQoaAZoCWgPQwgOaVTg5BBxQJSGlFKUaBVNHwFoFkdAtbuTRYzSC3V9lChoBmgJaA9DCELRPIDFf3FAlIaUUpRoFU0fAWgWR0C1u7P7WNFSdX2UKGgGaAloD0MIk45yMJvvckCUhpRSlGgVTTkBaBZHQLW8ixj8UEh1fZQoaAZoCWgPQwg8FXDPs/9yQJSGlFKUaBVNEAFoFkdAtbzsAKfFrHV9lChoBmgJaA9DCIl8l1IXUHFAlIaUUpRoFUv9aBZHQLW87eVcD8t1fZQoaAZoCWgPQwiQZiyaThFxQJSGlFKUaBVNNgFoFkdAtb0JBkZrHnV9lChoBmgJaA9DCISgo1WtF21AlIaUUpRoFU0XAWgWR0C1vQ4aHbh4dX2UKGgGaAloD0MIfh6jPHM6b0CUhpRSlGgVS/9oFkdAtb0bMW43FXV9lChoBmgJaA9DCLOyfcibxXBAlIaUUpRoFU0LAWgWR0C1vUVclgMMdX2UKGgGaAloD0MIWB050llXcUCUhpRSlGgVTQUBaBZHQLW9Tsenyd51fZQoaAZoCWgPQwiifEELycFwQJSGlFKUaBVNEwFoFkdAtb1bXpW3jXV9lChoBmgJaA9DCAr2X+em8FRAlIaUUpRoFUu6aBZHQLW9feZof0V1fZQoaAZoCWgPQwicTx2rFE9xQJSGlFKUaBVNFgFoFkdAtb21SflIVnV9lChoBmgJaA9DCEYjn1d8s3FAlIaUUpRoFU0MAWgWR0C1vbcjzI3jdX2UKGgGaAloD0MIttlYifnrcUCUhpRSlGgVS/doFkdAtb3rJFLFoHV9lChoBmgJaA9DCCXs20lEdG9AlIaUUpRoFU0XAWgWR0C1vg9dzGPxdX2UKGgGaAloD0MImu/gJ47wbkCUhpRSlGgVTR0BaBZHQLW+9ScslLR1fZQoaAZoCWgPQwgEx2XclBJxQJSGlFKUaBVNFAFoFkdAtb8HWmP5pXV9lChoBmgJaA9DCL+2fvpPn3JAlIaUUpRoFUvuaBZHQLW/M4VARkF1fZQoaAZoCWgPQwhwmGiQQqxwQJSGlFKUaBVNLQFoFkdAtb9CS8rZrnV9lChoBmgJaA9DCJ8FobxPMXNAlIaUUpRoFU0BAWgWR0C1v1Lv1DjSdX2UKGgGaAloD0MIXhJnRdTGcECUhpRSlGgVTRMBaBZHQLW/hlSCOFR1fZQoaAZoCWgPQwgxCKwc2jpuQJSGlFKUaBVL92gWR0C1v5YgA6uGdX2UKGgGaAloD0MIteBFX0H9b0CUhpRSlGgVS/poFkdAtb+xB8hLXnV9lChoBmgJaA9DCLStZp3xlHJAlIaUUpRoFU0SAWgWR0C1v8iEUTL4dX2UKGgGaAloD0MIMewwJr1xckCUhpRSlGgVTTYBaBZHQLW/zScbzbx1fZQoaAZoCWgPQwg/U69bhKVyQJSGlFKUaBVL8GgWR0C1wALZamoBdX2UKGgGaAloD0MIXcR3YlYmckCUhpRSlGgVS/5oFkdAtcAbEehf0HV9lChoBmgJaA9DCBJMNbPWRnBAlIaUUpRoFU0wAWgWR0C1wDHhwVCYdX2UKGgGaAloD0MI0jb+RGXeb0CUhpRSlGgVTREBaBZHQLXAcRV6u4h1fZQoaAZoCWgPQwhz275HfeJuQJSGlFKUaBVL7WgWR0C1wIvgJkXldX2UKGgGaAloD0MIBOeMKO1WckCUhpRSlGgVS+RoFkdAtcGAVrRBvHV9lChoBmgJaA9DCGMJa2MsvXFAlIaUUpRoFU0tAWgWR0C1wY//7zkIdX2UKGgGaAloD0MI7blMTUJyckCUhpRSlGgVTdsBaBZHQLXBodvsJIF1fZQoaAZoCWgPQwhm+E83ULJvQJSGlFKUaBVNCAFoFkdAtcGu0eEIxHV9lChoBmgJaA9DCMbf9gSJ/XBAlIaUUpRoFU0vAWgWR0C1wbBk/bCadX2UKGgGaAloD0MIYviImNKXcUCUhpRSlGgVTQQBaBZHQLXBxMHryDt1fZQoaAZoCWgPQwjGNNO9TrlwQJSGlFKUaBVL8GgWR0C1wddoBaLXdX2UKGgGaAloD0MIJo+n5YfucUCUhpRSlGgVTQYBaBZHQLXCCfIS13N1fZQoaAZoCWgPQwjLEMe6OA9yQJSGlFKUaBVNDwFoFkdAtcJKgM+eOHV9lChoBmgJaA9DCFMFo5I6OG9AlIaUUpRoFU0gAWgWR0C1wk2KEWZadX2UKGgGaAloD0MIxanWwqx5cUCUhpRSlGgVTQUBaBZHQLXCbtF8XvZ1fZQoaAZoCWgPQwg0LbEyGmRxQJSGlFKUaBVNJwFoFkdAtcJzKFIuoXV9lChoBmgJaA9DCJSJWwWxLHFAlIaUUpRoFUv9aBZHQLXCeKAavRt1fZQoaAZoCWgPQwjCvTJv1R9yQJSGlFKUaBVL+GgWR0C1woRcqvvCdX2UKGgGaAloD0MIn8ppT4nNcECUhpRSlGgVTRwBaBZHQLXDuOUMXrN1fZQoaAZoCWgPQwjJrx9iw5RwQJSGlFKUaBVNBQFoFkdAtcPZwkxASnV9lChoBmgJaA9DCNXsgVZgqXFAlIaUUpRoFUv+aBZHQLXD3XAdn011fZQoaAZoCWgPQwjsFRbcj8RvQJSGlFKUaBVNLwFoFkdAtcP1xKg7HXV9lChoBmgJaA9DCHy3eeOk2m1AlIaUUpRoFU0RAWgWR0C1xBUjLSuydX2UKGgGaAloD0MIsW8nESFEckCUhpRSlGgVTRABaBZHQLXEI8sMAm11fZQoaAZoCWgPQwgmxccnJDZwQJSGlFKUaBVNKgFoFkdAtcRQgDA8CHV9lChoBmgJaA9DCL0aoDTUEnJAlIaUUpRoFU0bAWgWR0C1xGoukDZEdX2UKGgGaAloD0MIWHA/4EFgcUCUhpRSlGgVTTQBaBZHQLXEfigkC3h1fZQoaAZoCWgPQwhkH2RZcGFyQJSGlFKUaBVNIwFoFkdAtcStfhMrVnV9lChoBmgJaA9DCAq8k0+P401AlIaUUpRoFUvqaBZHQLXEu6BiCrd1fZQoaAZoCWgPQwhWC+wxkbBuQJSGlFKUaBVNEAFoFkdAtcTUNMGorHV9lChoBmgJaA9DCM5uLZMhF3FAlIaUUpRoFU0dAWgWR0C1xOae9SMtdX2UKGgGaAloD0MICvKzkWvvbECUhpRSlGgVTQsBaBZHQLXE/G/vfCR1fZQoaAZoCWgPQwiuSbclMv9yQJSGlFKUaBVNBgFoFkdAtcURaKUFCHV9lChoBmgJaA9DCOAO1ClP9HBAlIaUUpRoFU0oAWgWR0C1xUvl2eQNdWUu"}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 810, "observation_space": {":type:": "<class 'gym.spaces.box.Box'>", ":serialized:": "gAWVnwEAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLCIWUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWIAAAAAAAAAAAAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/5RoCksIhZSMAUOUdJRSlIwEaGlnaJRoEiiWIAAAAAAAAAAAAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAf5RoCksIhZRoFXSUUpSMDWJvdW5kZWRfYmVsb3eUaBIolggAAAAAAAAAAAAAAAAAAACUaAeMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLCIWUaBV0lFKUjA1ib3VuZGVkX2Fib3ZllGgSKJYIAAAAAAAAAAAAAAAAAAAAlGghSwiFlGgVdJRSlIwKX25wX3JhbmRvbZROdWIu", "dtype": "float32", "_shape": [8], "low": "[-inf -inf -inf -inf -inf -inf -inf -inf]", "high": "[inf inf inf inf inf inf inf inf]", "bounded_below": "[False False False False False False False False]", "bounded_above": "[False False False False False False False False]", "_np_random": null}, "action_space": {":type:": "<class 'gym.spaces.discrete.Discrete'>", ":serialized:": "gAWVLwsAAAAAAACME2d5bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpRLBIwGX3NoYXBllCmMBWR0eXBllIwFbnVtcHmUaAeTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYowKX25wX3JhbmRvbZSMFG51bXB5LnJhbmRvbS5fcGlja2xllIwSX19yYW5kb21zdGF0ZV9jdG9ylJOUjAdNVDE5OTM3lIWUUpR9lCiMDWJpdF9nZW5lcmF0b3KUaBOMBXN0YXRllH2UKIwDa2V5lIwSbnVtcHkuY29yZS5udW1lcmljlIwLX2Zyb21idWZmZXKUk5QolsAJAAAAAAAAUpc4G/2dDSP1bMWDtLFdoAPdMmk17fcq86Bi9sIS10GKggvsSWxg41zeKhn8qU4ZmDrbok5JCaAaaCpLBJ1+Sq6tptQJVx3wA3yicv5JG3z1u5We6zLYhB71aks/x9fCP9dRlS/fVrDEqsy08jSun2aDzFJGTWlrRvk62Ctmx8bFALjNiCXwfW+k7roPmuPQ1zuIwRGwnvzdg0D8/+qRCqc7WEhuWEFSsnKlls45UogSSxL3URQf/zyeO3wrwcQLNM1U3IsLKzBOTLzfYmUc5Hv6jXbg8sbyMAwtOb8aIfP7r1papTz11DAC76UuaPYpKcWoXLTlpztfFVQ9MZrt9EPiOdDncMTYOdS5iqZJVbXzqM5+2vZU8SkOjCYCjLkU/ntYpJxuPxQOKchZWTBA8buF5f8pwCbbvcsk0GF6ArBin+fZjUZ4NBK/gfJ1VwA65wAHhUdfPTYCyvrZVb8no2W6MzsfrTq2G1LaxCrTG1JVmWyY8VV3GTlN3PHyBiMv4uN67l7uKzN7imFj0h7kIAeYX3C8C4YPVED4li2ud6W10xAO/gNusjQVffU7PhyQ5Z2m7od6Su39xcUa2eEmjOpT92qlHwF7sTZU17mJpgFGqIr4WLcyGEh42i44LKgPH36vfZLsGIDg6MpqTuhNnGrt7tM4iw1lgQrwdSXqSjxepDQHfodtb3f/rkJteKuNI3nlb0Y63kdDyqZVEOsoFH0LQA2fW7ptG2tFK0meAuWUeikKF9UHYRPoIyJLumnUXCaabpVlo4LPYGFSduL9GIZKLxDzQIFXly8JQGk+nGCQJxedip4z7mfn2Ak9gXeIyHlE5ZV6kMAA0NSLraFlBIwhsFpKxKsBEgsCZpi355uuhj/eGvTo/UNaQGEHuFyAWwnUXe+Q6IA8Wd+18TBJ9hJAcvKDJF2+lr/jvqLHcbEkdI3RKKuKPuhveQ/muUwRUPttkF6n7NoJ/gbegdM8nvYxKrEHaqZgaLm7ahOm1rRDgF2lN9WsIjzBZS+xcmPDi9JcFmkoRQ/FR93z1qC9AD9igHOQnSkRPrsuPI37sRquBtk0WNJIe2ez8h3eu4/aX3rzyJKYaemD626mtSa9sTU0HKQvyBHMR6wKhfNTLAanLq/IOytFHXPo4vTiHO/0PpQBLCQWV3Zk8vqpVHWyiaI14ahseXns78W0+WdHI0V9cn9QbYbeE8WteMXLDmy39cdc3L0sVP6JRGqSzS4QvT7oL7dXK52aHpNtyXKxDR3cyiV7K18W4o75P358pDFhw9hcOvI/BhdYyzJ0OH28EIRhhk6gUHO2ohfFJtmdAStf4DBnd0skJWoY8CEp6GAylRJXx0yKxXAfbu0+ZW5hkCAhDycYTQU2ASVhZOV3d2JIaf89CJaqCHcAYwJN/V4kUD606ICVee2hN9TeZioZ3/l3ptQFkCNANauMP5Nii9ykjAI/1wkHKOEpstgNJwnK1GIRCU4cyZdlX/cP9cqyhGOOIsMM4Zgemp4SRIcYbyY3ok/0xTySFKkmv37bRImUBGVgGlOWOxlclJ0D4RtXQwxN762xG6bediTFS6xm9NfW68pyZOi7pN1E6m+pAO0D9r5UOVyEgZZlLzYXywut0uklnxjaq9Vn+PVxz3L71ooBHsqV1nH0G+N/AmSshKPPLxJs+VqH4pdmZh8cwP5ovfSHbNbDjOqChMnA23/I5vq0tO9xaqrfYxlfs172syspz4EcI1SgttrfM1Vp/WK/1IWunitWxQJfpdJjZZKp50DEZ0HMvmOv7DTl2dBhz9SIfaPwKms6DBTL/vEdANI1GV1jGHBmqTS2SWh8I77Khv5YPND2IpBLVu/pkD54JxJDTgh7/Qd/STJbd4U9ioZlDUXNy/ZuOq9TSJNBnu4gfBJxc35UGCAsoRh2wyQkgsj2MmqhUuxUXt4jYI5mGNcht3aDiCLZs1LAK/wvW/5d3qeZL0MWv97VZpv4Icp+6y9Y+buadTM+o9hklrtoIQyNpZzbZBAtVdRvQrCzj8pu9d38lp64XcP7hTm3jxhs4ugf8WD9h5OBzScxjHg6JBGv0IRSjq4qCjIV6zgJ3WxLoa4slQwPHLB30bczi1UMAPZjK+29vbWLItHdC+HRQK7XgPIOqFgh7V4ls2JRX60EAeQZ+MIh2OyeMoEzxiS0UDur7oiIENw2Qmm0fVrcsZfeo7mTOH9sklr5vKzlcCDuXIhkcfhnyRy0KOeoOJx6LUUlCre/UJg1dYoECdWYBLYJCQ39Oi3VIy1p9CQ54pr5Xigg3Ju7q393jb62tpyxzBpzywTvqdt+YlVkKjKO9huJd5ta+egB6909ZXXhrVKSPfCi8wuC1OEVihfsPO+uUlGOlt6oUg4gsaftSGPYidKpUFBtkNRr6FwGS5aGaiWEzQn3k1hAxmMAknvBzw4haH+Z2Lf3iBJoaZyUat+Lv0ldEjQUFLLYlU3mgGwhfvQKJTLKTVZj4INlTpeg7QpUnOPUmrTR9xiLRtMMTpCdDQbuKpUr3LyY87EvTjwJdjYnKa/iXLOHv2zilVZ9/zS0Ee0TRhPMx28DSmXhXplt/hbM1Y6VdKnm2q/gd7lOD7Tg6V7Eldt1Qz8wyxhLidwflGN9f0hr1fbYqW6htA9D/9xyVEfrBqd622aee308LzuLLMqdePNWX6jWv+tAWLuWdM7DOshHiMWbBgLrJpNERCnyNKXluzMGie+eFSdOQpnSMnJFEf1jZ/DHlR+CcXEY+yGyvuBUDpJoVyqEGb1D1502ptp28YKdr218w5UcQHRTVD/M3pguJFfgb0NNlT4tMR3fzZOZ9wapSrpAecz3oSvSPFkAqRm5NisMKeVyUlSZmL1bzk0rFqDLiw6H7oeOLii9wLNgS7WcgQ42K1tfD/PTukbOKF4387GZm9+7wjthX68Vee6VObfnkx5RieyL5eu5w29ZbxnSVrgxHL+S/VQb9vfu02UtHfWh4AwWP8/5c0/ryLsQuXag/kIttmzRFZlrc3JDkdz50F0s8/KOwo4XM8i6Wcjj3IT+sQxIPen56vlbH5iTq/+vOn2Kw3kOB3IkCc39gSRo3BPSqQDJow2XnIvHWsyG/Ejr9xe8iTjSnN4yZ2jEscyRXahDG+Q/wwPl4DyHMEVfzVqFbMMcPKNJwNxrvo7ocO0z8DxYae4XHDeahZrRPJjXSi5TcL1/aeHw8g8IoVZfH5zjUJ6YQOn4sB1qJRGXBItDpFe+RHLOaieQdxx/Sd+aBZ+zcRk4fI5KcrkEV68Ai35Nd9G+tmQzUEs/cVEyfIBobQ2naF2l3MU7VgWKclvl6njDioSCpiHwlGgJjAJ1NJSJiIeUUpQoSwNoDU5OTkr/////Sv////9LAHSUYk1wAoWUjAFDlHSUUpSMA3Bvc5RNMAF1jAloYXNfZ2F1c3OUSwCMBWdhdXNzlEcAAAAAAAAAAHVidWIu", "n": 4, "_shape": [], "dtype": "int64", "_np_random": "RandomState(MT19937)"}, "n_envs": 16, "n_steps": 256, "gamma": 0.999, "gae_lambda": 0.98, "ent_coef": 0.01, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 3, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWVwwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOS9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS4JDAgABlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOS9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoFmgNjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoF4wHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/yZmZmZmZmoWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "system_info": {"OS": "Linux-5.10.147+-x86_64-with-glibc2.31 # 1 SMP Sat Dec 10 16:00:40 UTC 2022", "Python": "3.9.16", "Stable-Baselines3": "1.8.0", "PyTorch": "2.0.0+cu118", "GPU Enabled": "True", "Numpy": "1.22.4", "Gym": "0.21.0"}}
|
|
|
1 |
+
{"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7f923dbe63a0>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f923dbe6430>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f923dbe64c0>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f923dbe6550>", "_build": "<function ActorCriticPolicy._build at 0x7f923dbe65e0>", "forward": "<function ActorCriticPolicy.forward at 0x7f923dbe6670>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x7f923dbe6700>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f923dbe6790>", "_predict": "<function ActorCriticPolicy._predict at 0x7f923dbe6820>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f923dbe68b0>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f923dbe6940>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f923dbe69d0>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7f923dbe5d40>"}, "verbose": 1, "policy_kwargs": {}, "num_timesteps": 200704, "_total_timesteps": 200000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1682438668734311416, "learning_rate": 0.0003, "tensorboard_log": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVwwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOS9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS4JDAgABlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOS9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoFmgNjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoF4wHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/M6kqMFUyYYWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="}, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAID3Kj0f+eK7EtnKPS5tej3pSze9imUNvAAAgD8AAIA/8759vju5Sz/gW4q9tae+vp1D174DfUA9AAAAAAAAAACaQbg+HlepPttIir5rHRi/Igm6PpxnJb4AAAAAAAAAAM3N9bzhkKu669FsO/rWhjxKUuW7nQNrPQAAgD8AAIA/ACZOvEy7BD5BHoU9m46jvt7Twjyiji+9AAAAAAAAAADTldQ+lXv8PpewQL4ZuCK/bIPCPkJuQ74AAAAAAAAAAGaw3j3j3p4/xnoRPzpOJb85CPk9yNJ/PgAAAAAAAAAAGqrDvUV4mD/Zgx2/1IEsv+hEmb2o7oG+AAAAAAAAAACzy+m9xYOcPz5u6r6pu/C+5qpTvucpoL4AAAAAAAAAAGb0DT2fde+76oEIvuQM6r3e0cI82IKCPgAAgD8AAIA/O5GHvmtCYj/uVnK+zqXFvtmk+L5T3+68AAAAAAAAAADaP0U+/iDsPU4S776BAEy+OUTyvJ5Trr0AAAAAAAAAAIC5eT7xa3E+H5+EvnYMEr/lUaI+mb4mvgAAAAAAAAAAzRXgvCkEdrrY5Xs7CoxLPD6+1btH2jQ9AACAPwAAgD/NS/K8LoaSvOPlRL3Mmx+9BKEJPg0X/z0AAIA/AACAP7rJaz5G6tg+jn3QvZr/6L4kozw+q0vevQAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.0035199999999999676, "_stats_window_size": 100, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVKBAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIjzNN2P7kb0CUhpRSlIwBbJRL0owBdJRHQJ1Ak2wV0tB1fZQoaAZoCWgPQwgPDCB86BRyQJSGlFKUaBVL62gWR0CdQbEDhcZ+dX2UKGgGaAloD0MIcH1Yb1QscECUhpRSlGgVS8hoFkdAnUJ5YLb5/XV9lChoBmgJaA9DCA7ABkQIbmhAlIaUUpRoFU3oA2gWR0CdQrB8hLXddX2UKGgGaAloD0MIgNQmTu79c0CUhpRSlGgVS+poFkdAnUNUfs/puHV9lChoBmgJaA9DCAKDpE9ruXFAlIaUUpRoFU0QAWgWR0CdRAvvBrN4dX2UKGgGaAloD0MIg6RPq2gHcUCUhpRSlGgVS/loFkdAnURte+mFanV9lChoBmgJaA9DCHbexmbHn29AlIaUUpRoFUvlaBZHQJ1E5lcyFf11fZQoaAZoCWgPQwj1aRX94TBzQJSGlFKUaBVL42gWR0CdRVZIg/1QdX2UKGgGaAloD0MI09ufi4bkaECUhpRSlGgVTegDaBZHQJ1FfgLqlgt1fZQoaAZoCWgPQwgdVyO70kIbQJSGlFKUaBVLg2gWR0CdRe2+fywwdX2UKGgGaAloD0MIC2DKwAEFPECUhpRSlGgVS1hoFkdAnUYqpxWDH3V9lChoBmgJaA9DCK96wDzkH3BAlIaUUpRoFUu9aBZHQJ1HNoZhrnF1fZQoaAZoCWgPQwidZRahmD1wQJSGlFKUaBVLy2gWR0CdR3A7PppwdX2UKGgGaAloD0MI7l7uk6PdcUCUhpRSlGgVS8JoFkdAnUeXJLdvbXV9lChoBmgJaA9DCAaCABk6+HJAlIaUUpRoFUvlaBZHQJ1IS7kGRmt1fZQoaAZoCWgPQwgpdjQOtXNyQJSGlFKUaBVLzmgWR0CdUWIp6QeWdX2UKGgGaAloD0MIIOup1de/cECUhpRSlGgVS8NoFkdAnVIDJZGKAXV9lChoBmgJaA9DCLznwHKEC3JAlIaUUpRoFU0HAWgWR0CdUh1UEPlNdX2UKGgGaAloD0MIMQkX8kjbcUCUhpRSlGgVS9loFkdAnVL+7L+xW3V9lChoBmgJaA9DCAspP6n2wnFAlIaUUpRoFUvbaBZHQJ1TibtqpLp1fZQoaAZoCWgPQwgUs14MJcFxQJSGlFKUaBVLx2gWR0CdU4o4+8oQdX2UKGgGaAloD0MI1GLwMK3DcUCUhpRSlGgVS9NoFkdAnVOx+rlvInV9lChoBmgJaA9DCIaPiCkRrXBAlIaUUpRoFU0bAWgWR0CdVF3+MqBmdX2UKGgGaAloD0MIXaW762wWckCUhpRSlGgVS9ZoFkdAnVUjN6gM+nV9lChoBmgJaA9DCLd/ZaUJEHNAlIaUUpRoFUvZaBZHQJ1VyyPdVNp1fZQoaAZoCWgPQwiJKCZvABxxQJSGlFKUaBVL/WgWR0CdVf/HYHxCdX2UKGgGaAloD0MIMnIW9jQ+bkCUhpRSlGgVS/hoFkdAnVYIN/e+EnV9lChoBmgJaA9DCKRRgZNtgnBAlIaUUpRoFUu5aBZHQJ1XALSeAd51fZQoaAZoCWgPQwizCMVW0OpoQJSGlFKUaBVN6ANoFkdAnVdpEQXhwXV9lChoBmgJaA9DCLtjsU2q1HJAlIaUUpRoFUu+aBZHQJ1Xmb7TDwZ1fZQoaAZoCWgPQwjQK556pLdzQJSGlFKUaBVL72gWR0CdXSnlnyuqdX2UKGgGaAloD0MIRfZBlsVmc0CUhpRSlGgVS85oFkdAnV2XYDklu3V9lChoBmgJaA9DCNTyA1e5pnBAlIaUUpRoFUvhaBZHQJ1dqI68xsV1fZQoaAZoCWgPQwhLIZBL3GhxQJSGlFKUaBVL2mgWR0CdXgzP8hs7dX2UKGgGaAloD0MIdO/hkqNzc0CUhpRSlGgVS/5oFkdAnV7o7JW/8HV9lChoBmgJaA9DCPc+VYWGdnBAlIaUUpRoFUvkaBZHQJ1e9uFYdQx1fZQoaAZoCWgPQwiOy7ipgZFvQJSGlFKUaBVLuWgWR0CdXxy0rsjWdX2UKGgGaAloD0MIyJi7llCzcECUhpRSlGgVS91oFkdAnV99UbT+enV9lChoBmgJaA9DCKkwthBkEHNAlIaUUpRoFUvGaBZHQJ1fq/BWPtF1fZQoaAZoCWgPQwiXVG03QclvQJSGlFKUaBVL8mgWR0CdYOxoZhrndX2UKGgGaAloD0MIAtNp3UbacECUhpRSlGgVS95oFkdAnWFjYVZcLXV9lChoBmgJaA9DCJ+Sc2IPT3JAlIaUUpRoFUviaBZHQJ1h6piqhlF1fZQoaAZoCWgPQwjKNQUyO9ZvQJSGlFKUaBVL4mgWR0CdYhgHu7YkdX2UKGgGaAloD0MI7SsP0tMLcUCUhpRSlGgVS89oFkdAnWcnV9Wp63V9lChoBmgJaA9DCCIXnMEfBXBAlIaUUpRoFUvIaBZHQJ1nYGB4D9x1fZQoaAZoCWgPQwg49BYP731MQJSGlFKUaBVLomgWR0CdZ6fq5byIdX2UKGgGaAloD0MI7DNnfYrcckCUhpRSlGgVS9JoFkdAnWe4f8uSOnV9lChoBmgJaA9DCPpjWptGum9AlIaUUpRoFUvOaBZHQJ1oCNn5BTp1fZQoaAZoCWgPQwhw6ZjzDH1kQJSGlFKUaBVN6ANoFkdAnWioagmJFnV9lChoBmgJaA9DCHAIVWp2wnFAlIaUUpRoFUvaaBZHQJ1pPIsAeaN1fZQoaAZoCWgPQwgXRQ98DIFuQJSGlFKUaBVLzmgWR0CdaWzlcQiBdX2UKGgGaAloD0MIHv0v1yKZckCUhpRSlGgVS+ZoFkdAnWmsAJb+tXV9lChoBmgJaA9DCHycacJ2WXNAlIaUUpRoFUv3aBZHQJ1qjmOlwcZ1fZQoaAZoCWgPQwhETl/P11FtQJSGlFKUaBVL0GgWR0CdaxYNAkcCdX2UKGgGaAloD0MITaHzGrs9c0CUhpRSlGgVS+FoFkdAnWshwEQoTnV9lChoBmgJaA9DCHpQUIoWdHBAlIaUUpRoFUvSaBZHQJ1rvxH5Jsh1fZQoaAZoCWgPQwh9CRUcHn1wQJSGlFKUaBVL7WgWR0CdbE/YraufdX2UKGgGaAloD0MIYsCSq9ihc0CUhpRSlGgVS+xoFkdAnW1aZH/cWXV9lChoBmgJaA9DCAH76NTV4HJAlIaUUpRoFUvdaBZHQJ1tbt4RmK91fZQoaAZoCWgPQwhjDoKOlp5xQJSGlFKUaBVL0mgWR0CdbXx1xKg7dX2UKGgGaAloD0MIpwTEJBwJckCUhpRSlGgVS+FoFkdAnW2Zk078vXV9lChoBmgJaA9DCLmKxW+KgHBAlIaUUpRoFUvLaBZHQJ1yCfUWl/J1fZQoaAZoCWgPQwiQgxJmGqhyQJSGlFKUaBVL/mgWR0CdcjG/N7jUdX2UKGgGaAloD0MIbZG0G72zckCUhpRSlGgVS9xoFkdAnXMKz7di2HV9lChoBmgJaA9DCFrwoq+gHXJAlIaUUpRoFUvQaBZHQJ1zMJE6T4d1fZQoaAZoCWgPQwhTzhd7L6hmQJSGlFKUaBVN6ANoFkdAnXNsLfDUE3V9lChoBmgJaA9DCEGchxOYXXBAlIaUUpRoFUu7aBZHQJ10GZc9nsd1fZQoaAZoCWgPQwjVIw1ua2BuQJSGlFKUaBVNAAFoFkdAnXQe9i+cpnV9lChoBmgJaA9DCDttjQhGJm9AlIaUUpRoFUvAaBZHQJ10QAiml691fZQoaAZoCWgPQwg+7IUCNn5wQJSGlFKUaBVL52gWR0CddKCPZIxydX2UKGgGaAloD0MIVft0POaTaECUhpRSlGgVTegDaBZHQJ11FnnMdLh1fZQoaAZoCWgPQwiGAraDUUVyQJSGlFKUaBVL3WgWR0CddXdPLxI8dX2UKGgGaAloD0MIxQH0+/6SckCUhpRSlGgVS8toFkdAnXWGALApKHV9lChoBmgJaA9DCChDVUylp3FAlIaUUpRoFUvDaBZHQJ12NJDmbLF1fZQoaAZoCWgPQwi7uI0GsNJxQJSGlFKUaBVL0mgWR0CddqHhCMP0dX2UKGgGaAloD0MIx0rMs9K1cECUhpRSlGgVS99oFkdAnXa3WnTAnHV9lChoBmgJaA9DCB7dCIuK5W9AlIaUUpRoFUvraBZHQJ13COhkAgh1fZQoaAZoCWgPQwhBRkCFo6RxQJSGlFKUaBVL32gWR0CddyGjsUqQdX2UKGgGaAloD0MIwVPIlXrbcECUhpRSlGgVS+ZoFkdAnXdq99MK1HV9lChoBmgJaA9DCESJljyemXJAlIaUUpRoFUvSaBZHQJ18raK1og51fZQoaAZoCWgPQwhlGeJYFwdwQJSGlFKUaBVL42gWR0CdfQhCMPz4dX2UKGgGaAloD0MIsKpefmefcUCUhpRSlGgVS9hoFkdAnX0hGUfPonV9lChoBmgJaA9DCLOWAtI+dHNAlIaUUpRoFUvRaBZHQJ19vaSLZSN1fZQoaAZoCWgPQwjPZWoSPH5yQJSGlFKUaBVL32gWR0CdfiTHKfWddX2UKGgGaAloD0MILV4sDFFAckCUhpRSlGgVS9xoFkdAnX5AxSHdoHV9lChoBmgJaA9DCLaBO1AntW9AlIaUUpRoFUvqaBZHQJ1/EcxTKkl1fZQoaAZoCWgPQwhuMxXikW1zQJSGlFKUaBVL62gWR0Cdf6R3/xUedX2UKGgGaAloD0MI1owMcheWckCUhpRSlGgVS9xoFkdAnX/VPJq7AnV9lChoBmgJaA9DCLiTiPCv0HFAlIaUUpRoFUvzaBZHQJ2Aa5UcXFd1fZQoaAZoCWgPQwhlGeJYl5NwQJSGlFKUaBVL0mgWR0CdgJDB/I8ydX2UKGgGaAloD0MIDFpIwGhXcECUhpRSlGgVS8toFkdAnYF8kleF+XV9lChoBmgJaA9DCEKZRpOLu0ZAlIaUUpRoFUuwaBZHQJ2BzK3d9Dx1fZQoaAZoCWgPQwgIBhA+1LxyQJSGlFKUaBVL5WgWR0CdgdkNnXd1dX2UKGgGaAloD0MIKGVSQ9uDckCUhpRSlGgVS9doFkdAnYIBmXgLqnV9lChoBmgJaA9DCCR/MPCcJ3JAlIaUUpRoFUv7aBZHQJ2CXjIaLn91fZQoaAZoCWgPQwgLfhtivIZyQJSGlFKUaBVLw2gWR0CdgrsCT2WZdX2UKGgGaAloD0MIJO6x9GFQcUCUhpRSlGgVS9poFkdAnYOPUnXumnV9lChoBmgJaA9DCIXpew3BN3JAlIaUUpRoFU0AAWgWR0Cdg7M7EHdHdX2UKGgGaAloD0MIEAaeew+ObkCUhpRSlGgVS8toFkdAnYPNuk1uSHVlLg=="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 1668, "observation_space": {":type:": "<class 'gym.spaces.box.Box'>", ":serialized:": "gAWVnwEAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLCIWUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWIAAAAAAAAAAAAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/5RoCksIhZSMAUOUdJRSlIwEaGlnaJRoEiiWIAAAAAAAAAAAAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAf5RoCksIhZRoFXSUUpSMDWJvdW5kZWRfYmVsb3eUaBIolggAAAAAAAAAAAAAAAAAAACUaAeMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLCIWUaBV0lFKUjA1ib3VuZGVkX2Fib3ZllGgSKJYIAAAAAAAAAAAAAAAAAAAAlGghSwiFlGgVdJRSlIwKX25wX3JhbmRvbZROdWIu", "dtype": "float32", "_shape": [8], "low": "[-inf -inf -inf -inf -inf -inf -inf -inf]", "high": "[inf inf inf inf inf inf inf inf]", "bounded_below": "[False False False False False False False False]", "bounded_above": "[False False False False False False False False]", "_np_random": null}, "action_space": {":type:": "<class 'gym.spaces.discrete.Discrete'>", ":serialized:": "gAWVggAAAAAAAACME2d5bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpRLBIwGX3NoYXBllCmMBWR0eXBllIwFbnVtcHmUaAeTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYowKX25wX3JhbmRvbZROdWIu", "n": 4, "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 16, "n_steps": 256, "gamma": 0.999, "gae_lambda": 0.98, "ent_coef": 0.01, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 4, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWVwwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOS9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS4JDAgABlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOS9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoFmgNjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoF4wHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/yZmZmZmZmoWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "system_info": {"OS": "Linux-5.10.147+-x86_64-with-glibc2.31 # 1 SMP Sat Dec 10 16:00:40 UTC 2022", "Python": "3.9.16", "Stable-Baselines3": "1.8.0", "PyTorch": "2.0.0+cu118", "GPU Enabled": "True", "Numpy": "1.22.4", "Gym": "0.21.0"}}
|
ppo-LunarLander-v2.zip
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:29faab3ac77022cee54daf8cc0523ebb860d77c3e3ce9caf56006f6a61133164
|
3 |
+
size 147278
|
ppo-LunarLander-v2/data
CHANGED
@@ -4,29 +4,29 @@
|
|
4 |
":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
|
5 |
"__module__": "stable_baselines3.common.policies",
|
6 |
"__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
|
7 |
-
"__init__": "<function ActorCriticPolicy.__init__ at
|
8 |
-
"_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at
|
9 |
-
"reset_noise": "<function ActorCriticPolicy.reset_noise at
|
10 |
-
"_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at
|
11 |
-
"_build": "<function ActorCriticPolicy._build at
|
12 |
-
"forward": "<function ActorCriticPolicy.forward at
|
13 |
-
"extract_features": "<function ActorCriticPolicy.extract_features at
|
14 |
-
"_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at
|
15 |
-
"_predict": "<function ActorCriticPolicy._predict at
|
16 |
-
"evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at
|
17 |
-
"get_distribution": "<function ActorCriticPolicy.get_distribution at
|
18 |
-
"predict_values": "<function ActorCriticPolicy.predict_values at
|
19 |
"__abstractmethods__": "frozenset()",
|
20 |
-
"_abc_impl": "<_abc._abc_data object at
|
21 |
},
|
22 |
"verbose": 1,
|
23 |
"policy_kwargs": {},
|
24 |
-
"num_timesteps":
|
25 |
-
"_total_timesteps":
|
26 |
"_num_timesteps_at_start": 0,
|
27 |
"seed": null,
|
28 |
"action_noise": null,
|
29 |
-
"start_time":
|
30 |
"learning_rate": 0.0003,
|
31 |
"tensorboard_log": null,
|
32 |
"lr_schedule": {
|
@@ -35,7 +35,7 @@
|
|
35 |
},
|
36 |
"_last_obs": {
|
37 |
":type:": "<class 'numpy.ndarray'>",
|
38 |
-
":serialized:": "
|
39 |
},
|
40 |
"_last_episode_starts": {
|
41 |
":type:": "<class 'numpy.ndarray'>",
|
@@ -49,13 +49,13 @@
|
|
49 |
"_stats_window_size": 100,
|
50 |
"ep_info_buffer": {
|
51 |
":type:": "<class 'collections.deque'>",
|
52 |
-
":serialized:": "
|
53 |
},
|
54 |
"ep_success_buffer": {
|
55 |
":type:": "<class 'collections.deque'>",
|
56 |
":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
|
57 |
},
|
58 |
-
"_n_updates":
|
59 |
"observation_space": {
|
60 |
":type:": "<class 'gym.spaces.box.Box'>",
|
61 |
":serialized:": "gAWVnwEAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLCIWUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWIAAAAAAAAAAAAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/5RoCksIhZSMAUOUdJRSlIwEaGlnaJRoEiiWIAAAAAAAAAAAAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAf5RoCksIhZRoFXSUUpSMDWJvdW5kZWRfYmVsb3eUaBIolggAAAAAAAAAAAAAAAAAAACUaAeMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLCIWUaBV0lFKUjA1ib3VuZGVkX2Fib3ZllGgSKJYIAAAAAAAAAAAAAAAAAAAAlGghSwiFlGgVdJRSlIwKX25wX3JhbmRvbZROdWIu",
|
@@ -71,11 +71,11 @@
|
|
71 |
},
|
72 |
"action_space": {
|
73 |
":type:": "<class 'gym.spaces.discrete.Discrete'>",
|
74 |
-
":serialized:": "
|
75 |
"n": 4,
|
76 |
"_shape": [],
|
77 |
"dtype": "int64",
|
78 |
-
"_np_random":
|
79 |
},
|
80 |
"n_envs": 16,
|
81 |
"n_steps": 256,
|
@@ -85,7 +85,7 @@
|
|
85 |
"vf_coef": 0.5,
|
86 |
"max_grad_norm": 0.5,
|
87 |
"batch_size": 64,
|
88 |
-
"n_epochs":
|
89 |
"clip_range": {
|
90 |
":type:": "<class 'function'>",
|
91 |
":serialized:": "gAWVwwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOS9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS4JDAgABlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOS9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoFmgNjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoF4wHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/yZmZmZmZmoWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="
|
|
|
4 |
":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
|
5 |
"__module__": "stable_baselines3.common.policies",
|
6 |
"__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
|
7 |
+
"__init__": "<function ActorCriticPolicy.__init__ at 0x7f923dbe63a0>",
|
8 |
+
"_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f923dbe6430>",
|
9 |
+
"reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f923dbe64c0>",
|
10 |
+
"_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f923dbe6550>",
|
11 |
+
"_build": "<function ActorCriticPolicy._build at 0x7f923dbe65e0>",
|
12 |
+
"forward": "<function ActorCriticPolicy.forward at 0x7f923dbe6670>",
|
13 |
+
"extract_features": "<function ActorCriticPolicy.extract_features at 0x7f923dbe6700>",
|
14 |
+
"_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f923dbe6790>",
|
15 |
+
"_predict": "<function ActorCriticPolicy._predict at 0x7f923dbe6820>",
|
16 |
+
"evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f923dbe68b0>",
|
17 |
+
"get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f923dbe6940>",
|
18 |
+
"predict_values": "<function ActorCriticPolicy.predict_values at 0x7f923dbe69d0>",
|
19 |
"__abstractmethods__": "frozenset()",
|
20 |
+
"_abc_impl": "<_abc._abc_data object at 0x7f923dbe5d40>"
|
21 |
},
|
22 |
"verbose": 1,
|
23 |
"policy_kwargs": {},
|
24 |
+
"num_timesteps": 200704,
|
25 |
+
"_total_timesteps": 200000,
|
26 |
"_num_timesteps_at_start": 0,
|
27 |
"seed": null,
|
28 |
"action_noise": null,
|
29 |
+
"start_time": 1682438668734311416,
|
30 |
"learning_rate": 0.0003,
|
31 |
"tensorboard_log": null,
|
32 |
"lr_schedule": {
|
|
|
35 |
},
|
36 |
"_last_obs": {
|
37 |
":type:": "<class 'numpy.ndarray'>",
|
38 |
+
":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAID3Kj0f+eK7EtnKPS5tej3pSze9imUNvAAAgD8AAIA/8759vju5Sz/gW4q9tae+vp1D174DfUA9AAAAAAAAAACaQbg+HlepPttIir5rHRi/Igm6PpxnJb4AAAAAAAAAAM3N9bzhkKu669FsO/rWhjxKUuW7nQNrPQAAgD8AAIA/ACZOvEy7BD5BHoU9m46jvt7Twjyiji+9AAAAAAAAAADTldQ+lXv8PpewQL4ZuCK/bIPCPkJuQ74AAAAAAAAAAGaw3j3j3p4/xnoRPzpOJb85CPk9yNJ/PgAAAAAAAAAAGqrDvUV4mD/Zgx2/1IEsv+hEmb2o7oG+AAAAAAAAAACzy+m9xYOcPz5u6r6pu/C+5qpTvucpoL4AAAAAAAAAAGb0DT2fde+76oEIvuQM6r3e0cI82IKCPgAAgD8AAIA/O5GHvmtCYj/uVnK+zqXFvtmk+L5T3+68AAAAAAAAAADaP0U+/iDsPU4S776BAEy+OUTyvJ5Trr0AAAAAAAAAAIC5eT7xa3E+H5+EvnYMEr/lUaI+mb4mvgAAAAAAAAAAzRXgvCkEdrrY5Xs7CoxLPD6+1btH2jQ9AACAPwAAgD/NS/K8LoaSvOPlRL3Mmx+9BKEJPg0X/z0AAIA/AACAP7rJaz5G6tg+jn3QvZr/6L4kozw+q0vevQAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="
|
39 |
},
|
40 |
"_last_episode_starts": {
|
41 |
":type:": "<class 'numpy.ndarray'>",
|
|
|
49 |
"_stats_window_size": 100,
|
50 |
"ep_info_buffer": {
|
51 |
":type:": "<class 'collections.deque'>",
|
52 |
+
":serialized:": "gAWVKBAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIjzNN2P7kb0CUhpRSlIwBbJRL0owBdJRHQJ1Ak2wV0tB1fZQoaAZoCWgPQwgPDCB86BRyQJSGlFKUaBVL62gWR0CdQbEDhcZ+dX2UKGgGaAloD0MIcH1Yb1QscECUhpRSlGgVS8hoFkdAnUJ5YLb5/XV9lChoBmgJaA9DCA7ABkQIbmhAlIaUUpRoFU3oA2gWR0CdQrB8hLXddX2UKGgGaAloD0MIgNQmTu79c0CUhpRSlGgVS+poFkdAnUNUfs/puHV9lChoBmgJaA9DCAKDpE9ruXFAlIaUUpRoFU0QAWgWR0CdRAvvBrN4dX2UKGgGaAloD0MIg6RPq2gHcUCUhpRSlGgVS/loFkdAnURte+mFanV9lChoBmgJaA9DCHbexmbHn29AlIaUUpRoFUvlaBZHQJ1E5lcyFf11fZQoaAZoCWgPQwj1aRX94TBzQJSGlFKUaBVL42gWR0CdRVZIg/1QdX2UKGgGaAloD0MI09ufi4bkaECUhpRSlGgVTegDaBZHQJ1FfgLqlgt1fZQoaAZoCWgPQwgdVyO70kIbQJSGlFKUaBVLg2gWR0CdRe2+fywwdX2UKGgGaAloD0MIC2DKwAEFPECUhpRSlGgVS1hoFkdAnUYqpxWDH3V9lChoBmgJaA9DCK96wDzkH3BAlIaUUpRoFUu9aBZHQJ1HNoZhrnF1fZQoaAZoCWgPQwidZRahmD1wQJSGlFKUaBVLy2gWR0CdR3A7PppwdX2UKGgGaAloD0MI7l7uk6PdcUCUhpRSlGgVS8JoFkdAnUeXJLdvbXV9lChoBmgJaA9DCAaCABk6+HJAlIaUUpRoFUvlaBZHQJ1IS7kGRmt1fZQoaAZoCWgPQwgpdjQOtXNyQJSGlFKUaBVLzmgWR0CdUWIp6QeWdX2UKGgGaAloD0MIIOup1de/cECUhpRSlGgVS8NoFkdAnVIDJZGKAXV9lChoBmgJaA9DCLznwHKEC3JAlIaUUpRoFU0HAWgWR0CdUh1UEPlNdX2UKGgGaAloD0MIMQkX8kjbcUCUhpRSlGgVS9loFkdAnVL+7L+xW3V9lChoBmgJaA9DCAspP6n2wnFAlIaUUpRoFUvbaBZHQJ1TibtqpLp1fZQoaAZoCWgPQwgUs14MJcFxQJSGlFKUaBVLx2gWR0CdU4o4+8oQdX2UKGgGaAloD0MI1GLwMK3DcUCUhpRSlGgVS9NoFkdAnVOx+rlvInV9lChoBmgJaA9DCIaPiCkRrXBAlIaUUpRoFU0bAWgWR0CdVF3+MqBmdX2UKGgGaAloD0MIXaW762wWckCUhpRSlGgVS9ZoFkdAnVUjN6gM+nV9lChoBmgJaA9DCLd/ZaUJEHNAlIaUUpRoFUvZaBZHQJ1VyyPdVNp1fZQoaAZoCWgPQwiJKCZvABxxQJSGlFKUaBVL/WgWR0CdVf/HYHxCdX2UKGgGaAloD0MIMnIW9jQ+bkCUhpRSlGgVS/hoFkdAnVYIN/e+EnV9lChoBmgJaA9DCKRRgZNtgnBAlIaUUpRoFUu5aBZHQJ1XALSeAd51fZQoaAZoCWgPQwizCMVW0OpoQJSGlFKUaBVN6ANoFkdAnVdpEQXhwXV9lChoBmgJaA9DCLtjsU2q1HJAlIaUUpRoFUu+aBZHQJ1Xmb7TDwZ1fZQoaAZoCWgPQwjQK556pLdzQJSGlFKUaBVL72gWR0CdXSnlnyuqdX2UKGgGaAloD0MIRfZBlsVmc0CUhpRSlGgVS85oFkdAnV2XYDklu3V9lChoBmgJaA9DCNTyA1e5pnBAlIaUUpRoFUvhaBZHQJ1dqI68xsV1fZQoaAZoCWgPQwhLIZBL3GhxQJSGlFKUaBVL2mgWR0CdXgzP8hs7dX2UKGgGaAloD0MIdO/hkqNzc0CUhpRSlGgVS/5oFkdAnV7o7JW/8HV9lChoBmgJaA9DCPc+VYWGdnBAlIaUUpRoFUvkaBZHQJ1e9uFYdQx1fZQoaAZoCWgPQwiOy7ipgZFvQJSGlFKUaBVLuWgWR0CdXxy0rsjWdX2UKGgGaAloD0MIyJi7llCzcECUhpRSlGgVS91oFkdAnV99UbT+enV9lChoBmgJaA9DCKkwthBkEHNAlIaUUpRoFUvGaBZHQJ1fq/BWPtF1fZQoaAZoCWgPQwiXVG03QclvQJSGlFKUaBVL8mgWR0CdYOxoZhrndX2UKGgGaAloD0MIAtNp3UbacECUhpRSlGgVS95oFkdAnWFjYVZcLXV9lChoBmgJaA9DCJ+Sc2IPT3JAlIaUUpRoFUviaBZHQJ1h6piqhlF1fZQoaAZoCWgPQwjKNQUyO9ZvQJSGlFKUaBVL4mgWR0CdYhgHu7YkdX2UKGgGaAloD0MI7SsP0tMLcUCUhpRSlGgVS89oFkdAnWcnV9Wp63V9lChoBmgJaA9DCCIXnMEfBXBAlIaUUpRoFUvIaBZHQJ1nYGB4D9x1fZQoaAZoCWgPQwg49BYP731MQJSGlFKUaBVLomgWR0CdZ6fq5byIdX2UKGgGaAloD0MI7DNnfYrcckCUhpRSlGgVS9JoFkdAnWe4f8uSOnV9lChoBmgJaA9DCPpjWptGum9AlIaUUpRoFUvOaBZHQJ1oCNn5BTp1fZQoaAZoCWgPQwhw6ZjzDH1kQJSGlFKUaBVN6ANoFkdAnWioagmJFnV9lChoBmgJaA9DCHAIVWp2wnFAlIaUUpRoFUvaaBZHQJ1pPIsAeaN1fZQoaAZoCWgPQwgXRQ98DIFuQJSGlFKUaBVLzmgWR0CdaWzlcQiBdX2UKGgGaAloD0MIHv0v1yKZckCUhpRSlGgVS+ZoFkdAnWmsAJb+tXV9lChoBmgJaA9DCHycacJ2WXNAlIaUUpRoFUv3aBZHQJ1qjmOlwcZ1fZQoaAZoCWgPQwhETl/P11FtQJSGlFKUaBVL0GgWR0CdaxYNAkcCdX2UKGgGaAloD0MITaHzGrs9c0CUhpRSlGgVS+FoFkdAnWshwEQoTnV9lChoBmgJaA9DCHpQUIoWdHBAlIaUUpRoFUvSaBZHQJ1rvxH5Jsh1fZQoaAZoCWgPQwh9CRUcHn1wQJSGlFKUaBVL7WgWR0CdbE/YraufdX2UKGgGaAloD0MIYsCSq9ihc0CUhpRSlGgVS+xoFkdAnW1aZH/cWXV9lChoBmgJaA9DCAH76NTV4HJAlIaUUpRoFUvdaBZHQJ1tbt4RmK91fZQoaAZoCWgPQwhjDoKOlp5xQJSGlFKUaBVL0mgWR0CdbXx1xKg7dX2UKGgGaAloD0MIpwTEJBwJckCUhpRSlGgVS+FoFkdAnW2Zk078vXV9lChoBmgJaA9DCLmKxW+KgHBAlIaUUpRoFUvLaBZHQJ1yCfUWl/J1fZQoaAZoCWgPQwiQgxJmGqhyQJSGlFKUaBVL/mgWR0CdcjG/N7jUdX2UKGgGaAloD0MIbZG0G72zckCUhpRSlGgVS9xoFkdAnXMKz7di2HV9lChoBmgJaA9DCFrwoq+gHXJAlIaUUpRoFUvQaBZHQJ1zMJE6T4d1fZQoaAZoCWgPQwhTzhd7L6hmQJSGlFKUaBVN6ANoFkdAnXNsLfDUE3V9lChoBmgJaA9DCEGchxOYXXBAlIaUUpRoFUu7aBZHQJ10GZc9nsd1fZQoaAZoCWgPQwjVIw1ua2BuQJSGlFKUaBVNAAFoFkdAnXQe9i+cpnV9lChoBmgJaA9DCDttjQhGJm9AlIaUUpRoFUvAaBZHQJ10QAiml691fZQoaAZoCWgPQwg+7IUCNn5wQJSGlFKUaBVL52gWR0CddKCPZIxydX2UKGgGaAloD0MIVft0POaTaECUhpRSlGgVTegDaBZHQJ11FnnMdLh1fZQoaAZoCWgPQwiGAraDUUVyQJSGlFKUaBVL3WgWR0CddXdPLxI8dX2UKGgGaAloD0MIxQH0+/6SckCUhpRSlGgVS8toFkdAnXWGALApKHV9lChoBmgJaA9DCChDVUylp3FAlIaUUpRoFUvDaBZHQJ12NJDmbLF1fZQoaAZoCWgPQwi7uI0GsNJxQJSGlFKUaBVL0mgWR0CddqHhCMP0dX2UKGgGaAloD0MIx0rMs9K1cECUhpRSlGgVS99oFkdAnXa3WnTAnHV9lChoBmgJaA9DCB7dCIuK5W9AlIaUUpRoFUvraBZHQJ13COhkAgh1fZQoaAZoCWgPQwhBRkCFo6RxQJSGlFKUaBVL32gWR0CddyGjsUqQdX2UKGgGaAloD0MIwVPIlXrbcECUhpRSlGgVS+ZoFkdAnXdq99MK1HV9lChoBmgJaA9DCESJljyemXJAlIaUUpRoFUvSaBZHQJ18raK1og51fZQoaAZoCWgPQwhlGeJYFwdwQJSGlFKUaBVL42gWR0CdfQhCMPz4dX2UKGgGaAloD0MIsKpefmefcUCUhpRSlGgVS9hoFkdAnX0hGUfPonV9lChoBmgJaA9DCLOWAtI+dHNAlIaUUpRoFUvRaBZHQJ19vaSLZSN1fZQoaAZoCWgPQwjPZWoSPH5yQJSGlFKUaBVL32gWR0CdfiTHKfWddX2UKGgGaAloD0MILV4sDFFAckCUhpRSlGgVS9xoFkdAnX5AxSHdoHV9lChoBmgJaA9DCLaBO1AntW9AlIaUUpRoFUvqaBZHQJ1/EcxTKkl1fZQoaAZoCWgPQwhuMxXikW1zQJSGlFKUaBVL62gWR0Cdf6R3/xUedX2UKGgGaAloD0MI1owMcheWckCUhpRSlGgVS9xoFkdAnX/VPJq7AnV9lChoBmgJaA9DCLiTiPCv0HFAlIaUUpRoFUvzaBZHQJ2Aa5UcXFd1fZQoaAZoCWgPQwhlGeJYl5NwQJSGlFKUaBVL0mgWR0CdgJDB/I8ydX2UKGgGaAloD0MIDFpIwGhXcECUhpRSlGgVS8toFkdAnYF8kleF+XV9lChoBmgJaA9DCEKZRpOLu0ZAlIaUUpRoFUuwaBZHQJ2BzK3d9Dx1fZQoaAZoCWgPQwgIBhA+1LxyQJSGlFKUaBVL5WgWR0CdgdkNnXd1dX2UKGgGaAloD0MIKGVSQ9uDckCUhpRSlGgVS9doFkdAnYIBmXgLqnV9lChoBmgJaA9DCCR/MPCcJ3JAlIaUUpRoFUv7aBZHQJ2CXjIaLn91fZQoaAZoCWgPQwgLfhtivIZyQJSGlFKUaBVLw2gWR0CdgrsCT2WZdX2UKGgGaAloD0MIJO6x9GFQcUCUhpRSlGgVS9poFkdAnYOPUnXumnV9lChoBmgJaA9DCIXpew3BN3JAlIaUUpRoFU0AAWgWR0Cdg7M7EHdHdX2UKGgGaAloD0MIEAaeew+ObkCUhpRSlGgVS8toFkdAnYPNuk1uSHVlLg=="
|
53 |
},
|
54 |
"ep_success_buffer": {
|
55 |
":type:": "<class 'collections.deque'>",
|
56 |
":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
|
57 |
},
|
58 |
+
"_n_updates": 1668,
|
59 |
"observation_space": {
|
60 |
":type:": "<class 'gym.spaces.box.Box'>",
|
61 |
":serialized:": "gAWVnwEAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLCIWUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWIAAAAAAAAAAAAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/AACA/5RoCksIhZSMAUOUdJRSlIwEaGlnaJRoEiiWIAAAAAAAAAAAAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/AACAf5RoCksIhZRoFXSUUpSMDWJvdW5kZWRfYmVsb3eUaBIolggAAAAAAAAAAAAAAAAAAACUaAeMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLCIWUaBV0lFKUjA1ib3VuZGVkX2Fib3ZllGgSKJYIAAAAAAAAAAAAAAAAAAAAlGghSwiFlGgVdJRSlIwKX25wX3JhbmRvbZROdWIu",
|
|
|
71 |
},
|
72 |
"action_space": {
|
73 |
":type:": "<class 'gym.spaces.discrete.Discrete'>",
|
74 |
+
":serialized:": "gAWVggAAAAAAAACME2d5bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpRLBIwGX3NoYXBllCmMBWR0eXBllIwFbnVtcHmUaAeTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYowKX25wX3JhbmRvbZROdWIu",
|
75 |
"n": 4,
|
76 |
"_shape": [],
|
77 |
"dtype": "int64",
|
78 |
+
"_np_random": null
|
79 |
},
|
80 |
"n_envs": 16,
|
81 |
"n_steps": 256,
|
|
|
85 |
"vf_coef": 0.5,
|
86 |
"max_grad_norm": 0.5,
|
87 |
"batch_size": 64,
|
88 |
+
"n_epochs": 4,
|
89 |
"clip_range": {
|
90 |
":type:": "<class 'function'>",
|
91 |
":serialized:": "gAWVwwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOS9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS4JDAgABlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOS9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoFmgNjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoF4wHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/yZmZmZmZmoWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="
|
ppo-LunarLander-v2/policy.optimizer.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 87929
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f5bbf8700da345a78d20b11491bbfd4ad3a36d382fb5c365175c8ab0a157f672
|
3 |
size 87929
|
ppo-LunarLander-v2/policy.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 43329
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fdd8b76feaf5349038e7b48aa227b021fc6b79978f9c23703397748b73237a84
|
3 |
size 43329
|
replay.mp4
CHANGED
Binary files a/replay.mp4 and b/replay.mp4 differ
|
|
results.json
CHANGED
@@ -1 +1 @@
|
|
1 |
-
{"mean_reward":
|
|
|
1 |
+
{"mean_reward": 281.00240688519204, "std_reward": 19.71639613809219, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2023-04-25T16:08:11.363700"}
|