trained model 2e+06 steps
Browse files- LunarLander-v2-ppo.zip +2 -2
- LunarLander-v2-ppo/data +20 -20
- LunarLander-v2-ppo/policy.optimizer.pth +1 -1
- LunarLander-v2-ppo/policy.pth +1 -1
- README.md +1 -1
- config.json +1 -1
- replay.mp4 +2 -2
- results.json +1 -1
LunarLander-v2-ppo.zip
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cca2cf27ca426703249e58e251037af36e799aa52704e64bdffb4dc6a69f4890
|
3 |
+
size 144143
|
LunarLander-v2-ppo/data
CHANGED
@@ -4,19 +4,19 @@
|
|
4 |
":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
|
5 |
"__module__": "stable_baselines3.common.policies",
|
6 |
"__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param sde_net_arch: Network architecture for extracting features\n when using gSDE. If None, the latent features from the policy will be used.\n Pass an empty list to use the states as features.\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
|
7 |
-
"__init__": "<function ActorCriticPolicy.__init__ at
|
8 |
-
"_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at
|
9 |
-
"reset_noise": "<function ActorCriticPolicy.reset_noise at
|
10 |
-
"_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at
|
11 |
-
"_build": "<function ActorCriticPolicy._build at
|
12 |
-
"forward": "<function ActorCriticPolicy.forward at
|
13 |
-
"_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at
|
14 |
-
"_predict": "<function ActorCriticPolicy._predict at
|
15 |
-
"evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at
|
16 |
-
"get_distribution": "<function ActorCriticPolicy.get_distribution at
|
17 |
-
"predict_values": "<function ActorCriticPolicy.predict_values at
|
18 |
"__abstractmethods__": "frozenset()",
|
19 |
-
"_abc_impl": "<_abc_data object at
|
20 |
},
|
21 |
"verbose": 1,
|
22 |
"policy_kwargs": {},
|
@@ -47,19 +47,19 @@
|
|
47 |
"_num_timesteps_at_start": 0,
|
48 |
"seed": null,
|
49 |
"action_noise": null,
|
50 |
-
"start_time":
|
51 |
"learning_rate": {
|
52 |
":type:": "<class 'function'>",
|
53 |
-
":serialized:": "
|
54 |
},
|
55 |
-
"tensorboard_log": "runs/
|
56 |
"lr_schedule": {
|
57 |
":type:": "<class 'function'>",
|
58 |
-
":serialized:": "
|
59 |
},
|
60 |
"_last_obs": {
|
61 |
":type:": "<class 'numpy.ndarray'>",
|
62 |
-
":serialized:": "
|
63 |
},
|
64 |
"_last_episode_starts": {
|
65 |
":type:": "<class 'numpy.ndarray'>",
|
@@ -72,7 +72,7 @@
|
|
72 |
"_current_progress_remaining": -0.007616000000000067,
|
73 |
"ep_info_buffer": {
|
74 |
":type:": "<class 'collections.deque'>",
|
75 |
-
":serialized:": "
|
76 |
},
|
77 |
"ep_success_buffer": {
|
78 |
":type:": "<class 'collections.deque'>",
|
@@ -82,14 +82,14 @@
|
|
82 |
"n_steps": 1024,
|
83 |
"gamma": 0.99,
|
84 |
"gae_lambda": 0.95,
|
85 |
-
"ent_coef": 0.
|
86 |
"vf_coef": 0.5,
|
87 |
"max_grad_norm": 0.5,
|
88 |
"batch_size": 64,
|
89 |
"n_epochs": 10,
|
90 |
"clip_range": {
|
91 |
":type:": "<class 'function'>",
|
92 |
-
":serialized:": "
|
93 |
},
|
94 |
"clip_range_vf": null,
|
95 |
"target_kl": null
|
|
|
4 |
":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
|
5 |
"__module__": "stable_baselines3.common.policies",
|
6 |
"__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param sde_net_arch: Network architecture for extracting features\n when using gSDE. If None, the latent features from the policy will be used.\n Pass an empty list to use the states as features.\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
|
7 |
+
"__init__": "<function ActorCriticPolicy.__init__ at 0x7f2ecf22b710>",
|
8 |
+
"_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f2ecf22b7a0>",
|
9 |
+
"reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f2ecf22b830>",
|
10 |
+
"_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f2ecf22b8c0>",
|
11 |
+
"_build": "<function ActorCriticPolicy._build at 0x7f2ecf22b950>",
|
12 |
+
"forward": "<function ActorCriticPolicy.forward at 0x7f2ecf22b9e0>",
|
13 |
+
"_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f2ecf22ba70>",
|
14 |
+
"_predict": "<function ActorCriticPolicy._predict at 0x7f2ecf22bb00>",
|
15 |
+
"evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f2ecf22bb90>",
|
16 |
+
"get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f2ecf22bc20>",
|
17 |
+
"predict_values": "<function ActorCriticPolicy.predict_values at 0x7f2ecf22bcb0>",
|
18 |
"__abstractmethods__": "frozenset()",
|
19 |
+
"_abc_impl": "<_abc_data object at 0x7f2ecf26cbd0>"
|
20 |
},
|
21 |
"verbose": 1,
|
22 |
"policy_kwargs": {},
|
|
|
47 |
"_num_timesteps_at_start": 0,
|
48 |
"seed": null,
|
49 |
"action_noise": null,
|
50 |
+
"start_time": 1652472552.9625235,
|
51 |
"learning_rate": {
|
52 |
":type:": "<class 'function'>",
|
53 |
+
":serialized:": "gAWVTQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwNX2J1aWx0aW5fdHlwZZSTlIwKTGFtYmRhVHlwZZSFlFKUKGgCjAhDb2RlVHlwZZSFlFKUKEsBSwBLAUsDSxNDHGQBiAAbAGQBGABkAXwAGAAUAGQBFwCIARQAUwCUTksBhpQpjANwY3SUhZSMHzxpcHl0aG9uLWlucHV0LTI3LTM4MzMzNDUyMWQ3NT6UjAg8bGFtYmRhPpRLAkMAlIwGZmFjdG9ylIwBeJSGlCl0lFKUfZQojAtfX3BhY2thZ2VfX5ROjAhfX25hbWVfX5SMCF9fbWFpbl9flHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUaBopUpSGlHSUUpSMHGNsb3VkcGlja2xlLmNsb3VkcGlja2xlX2Zhc3SUjBJfZnVuY3Rpb25fc2V0c3RhdGWUk5RoH32UfZQoaBdoDowMX19xdWFsbmFtZV9flIwkbGluZWFyX2RlY2F5X3NjaGVkLjxsb2NhbHM+LjxsYW1iZGE+lIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoGIwHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEsKhZRSlGgvRz9QYk3S8an8hZRSlIaUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"
|
54 |
},
|
55 |
+
"tensorboard_log": "runs/gf22ryeo",
|
56 |
"lr_schedule": {
|
57 |
":type:": "<class 'function'>",
|
58 |
+
":serialized:": "gAWVTQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwNX2J1aWx0aW5fdHlwZZSTlIwKTGFtYmRhVHlwZZSFlFKUKGgCjAhDb2RlVHlwZZSFlFKUKEsBSwBLAUsDSxNDHGQBiAAbAGQBGABkAXwAGAAUAGQBFwCIARQAUwCUTksBhpQpjANwY3SUhZSMHzxpcHl0aG9uLWlucHV0LTI3LTM4MzMzNDUyMWQ3NT6UjAg8bGFtYmRhPpRLAkMAlIwGZmFjdG9ylIwBeJSGlCl0lFKUfZQojAtfX3BhY2thZ2VfX5ROjAhfX25hbWVfX5SMCF9fbWFpbl9flHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUaBopUpSGlHSUUpSMHGNsb3VkcGlja2xlLmNsb3VkcGlja2xlX2Zhc3SUjBJfZnVuY3Rpb25fc2V0c3RhdGWUk5RoH32UfZQoaBdoDowMX19xdWFsbmFtZV9flIwkbGluZWFyX2RlY2F5X3NjaGVkLjxsb2NhbHM+LjxsYW1iZGE+lIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoGIwHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEsKhZRSlGgvRz9QYk3S8an8hZRSlIaUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"
|
59 |
},
|
60 |
"_last_obs": {
|
61 |
":type:": "<class 'numpy.ndarray'>",
|
62 |
+
":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAAD0uzwI7XQ/7h2SPTPkZb+Qck49dpHQPAAAAAAAAAAAGj0rPeGok7qDqUi9kDB2MMKhhrrSVp+zAACAPwAAgD+zHRS+uOjNPFYDrz6nfl++tTJmPqti1z0AAAAAAAAAABrvIj5SP4O7qHxAuRN4UTYmk7m8WlZeOAAAgD8AAIA/GrALPYXsx7vhmgu8oQqOOyF2TT2vM4a8AACAPwAAgD8Nx5s9re3SPtYLqzx/ZiK/tTrNPQ/EKb0AAAAAAAAAAIa6Cb41KTs/t+JLvndXb79GmDS+EnlWvQAAAAAAAAAA2owYvqNXYD3ntYw+fdJhvjM5T73Igzk+AAAAAAAAAAC6vAC+3ymFP1ZAjb6nIXG/gZsJvlNV6r0AAAAAAAAAADN/Tr32wDC6TrUKPAaH/LLOF3m7KP9+sgAAgD8AAIA/JleIPY/OfbooAto3ZvDQMjJ2cbkLq/62AACAPwAAgD+AVsS9FESEupJngD6pyai4UcNduxmhn7cAAIA/AAAAAM2ee7zDsQu6rwG2ty9UpbICS+a7Q/HZNgAAgD8AAIA/qhB6vl4BKj8Wcwq+xSIovxiynb5TkLM8AAAAAAAAAACavPQ9hTCpPrU2471GuhW/Lv7APdqUnb0AAAAAAAAAAM3MUzyCz6Y/KHLmPSysC7/vFoI8Su/nOgAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="
|
63 |
},
|
64 |
"_last_episode_starts": {
|
65 |
":type:": "<class 'numpy.ndarray'>",
|
|
|
72 |
"_current_progress_remaining": -0.007616000000000067,
|
73 |
"ep_info_buffer": {
|
74 |
":type:": "<class 'collections.deque'>",
|
75 |
+
":serialized:": "gAWVHxAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIAwtgykCRcUCUhpRSlIwBbJRLpYwBdJRHQKF1zsiSq2l1fZQoaAZoCWgPQwiscwzIHpdwQJSGlFKUaBVLqWgWR0ChdgMZHd43dX2UKGgGaAloD0MInDQNiiZecECUhpRSlGgVS6VoFkdAoXYXoRqXW3V9lChoBmgJaA9DCGdkkLuI2m9AlIaUUpRoFUueaBZHQKF2OKYRdyF1fZQoaAZoCWgPQwh3K0t0FsdyQJSGlFKUaBVLwGgWR0Chdk0rsjVydX2UKGgGaAloD0MI9phIaba4cUCUhpRSlGgVS7loFkdAoXZ1+CsfaHV9lChoBmgJaA9DCLNAu0NK3HFAlIaUUpRoFUu7aBZHQKF2kpx3mmt1fZQoaAZoCWgPQwhSf73CAohwQJSGlFKUaBVLo2gWR0ChdpDtG/etdX2UKGgGaAloD0MI2ILeG4P6c0CUhpRSlGgVS+1oFkdAoXa9OARTTHV9lChoBmgJaA9DCM3n3O36/25AlIaUUpRoFUuUaBZHQKF286HTI/91fZQoaAZoCWgPQwjOp45ViptyQJSGlFKUaBVLq2gWR0ChdzO9eyAydX2UKGgGaAloD0MIJCao4ZtDckCUhpRSlGgVS89oFkdAoXdJ2OhkAnV9lChoBmgJaA9DCDGVfsKZYnNAlIaUUpRoFUuyaBZHQKF3+EU0vXd1fZQoaAZoCWgPQwhD5zV2CX9wQJSGlFKUaBVLn2gWR0CheAhuXNTtdX2UKGgGaAloD0MI/Yf021ejcECUhpRSlGgVS6BoFkdAoXgNlPJq7HV9lChoBmgJaA9DCAO2gxH78nFAlIaUUpRoFUuNaBZHQKF4F4Uvf0p1fZQoaAZoCWgPQwgzjLtBtIlxQJSGlFKUaBVLmWgWR0CheGihWYF8dX2UKGgGaAloD0MIt7QaEjc3c0CUhpRSlGgVS7doFkdAoXifVbzK93V9lChoBmgJaA9DCHNmu0IfWXFAlIaUUpRoFUuXaBZHQKGJ3uIhyKh1fZQoaAZoCWgPQwgtlbcjnLNyQJSGlFKUaBVLwGgWR0ChigFIVdondX2UKGgGaAloD0MIB5eOOc9MbkCUhpRSlGgVS7hoFkdAoYoOu9vjwXV9lChoBmgJaA9DCOC8OPEVCnRAlIaUUpRoFUu4aBZHQKGKK3y7PIJ1fZQoaAZoCWgPQwiAEMmQ409xQJSGlFKUaBVLkmgWR0ChikwjUutfdX2UKGgGaAloD0MIRwTj4JK3cECUhpRSlGgVS6RoFkdAoYpK3uuzQnV9lChoBmgJaA9DCE8kmGomgHNAlIaUUpRoFUvKaBZHQKGKafwqiGp1fZQoaAZoCWgPQwg/4ezWMmFxQJSGlFKUaBVLrmgWR0ChisWWpqASdX2UKGgGaAloD0MIUn5S7RMpckCUhpRSlGgVS9RoFkdAoYwjobGWEHV9lChoBmgJaA9DCJYlOsss0HJAlIaUUpRoFUvSaBZHQKGMQMjNY8x1fZQoaAZoCWgPQwiPpnoyP+NyQJSGlFKUaBVL3GgWR0ChjFnbItDldX2UKGgGaAloD0MI9wMeGEDlc0CUhpRSlGgVS9toFkdAoYxdGI9C/3V9lChoBmgJaA9DCPz/OGHCOHNAlIaUUpRoFUu8aBZHQKGMeOLiuMd1fZQoaAZoCWgPQwgpIVhVr91vQJSGlFKUaBVLmmgWR0ChjHZOSGJvdX2UKGgGaAloD0MITyMtlfefc0CUhpRSlGgVS9NoFkdAoYyXp6hQFnV9lChoBmgJaA9DCNKOG36323BAlIaUUpRoFUuhaBZHQKGM8npjc211fZQoaAZoCWgPQwhPBkfJK2JyQJSGlFKUaBVLyWgWR0ChjPnwgDA8dX2UKGgGaAloD0MIKo4Dr5ZTcUCUhpRSlGgVS6xoFkdAoYz8/lhgE3V9lChoBmgJaA9DCAZM4NZdbm9AlIaUUpRoFUuQaBZHQKGNEGVRk3F1fZQoaAZoCWgPQwgbDeAtEB9yQJSGlFKUaBVLvWgWR0ChjRiQ1aW5dX2UKGgGaAloD0MIf6MdNzy1cUCUhpRSlGgVS7poFkdAoY0sfs/puHV9lChoBmgJaA9DCCC1iZO7GnNAlIaUUpRoFUvTaBZHQKGNPD7ZWaN1fZQoaAZoCWgPQwjdJtwrc8pvQJSGlFKUaBVLi2gWR0ChjnKRuCPIdX2UKGgGaAloD0MIf6FHjF5KcECUhpRSlGgVS4poFkdAoY6I7JW/8HV9lChoBmgJaA9DCGwldJdEXHJAlIaUUpRoFUu0aBZHQKGPJk5IYm91fZQoaAZoCWgPQwh1HaopiU9xQJSGlFKUaBVLr2gWR0ChjzHvMKTjdX2UKGgGaAloD0MIjukJS7wcckCUhpRSlGgVS8poFkdAoY9TB9Cu2nV9lChoBmgJaA9DCDTW/s62+nFAlIaUUpRoFUvDaBZHQKGPUNBnjAB1fZQoaAZoCWgPQwjQtpp1hjdyQJSGlFKUaBVLiGgWR0Chj2+ZG8VYdX2UKGgGaAloD0MI3H9kOrRsckCUhpRSlGgVS6FoFkdAoY+LiKiwjnV9lChoBmgJaA9DCEJClC+oZHNAlIaUUpRoFUu9aBZHQKGPknXumaZ1fZQoaAZoCWgPQwivXkVGBy5xQJSGlFKUaBVLl2gWR0Chj5mMXJo1dX2UKGgGaAloD0MIWTFcHQAjckCUhpRSlGgVS7FoFkdAoY/IIKMNt3V9lChoBmgJaA9DCHAi+rV1UXJAlIaUUpRoFUu3aBZHQKGP2SYgJTl1fZQoaAZoCWgPQwhU/N8RlWRxQJSGlFKUaBVLsWgWR0Chj+1hTfixdX2UKGgGaAloD0MIl/+Qfvt6C8CUhpRSlGgVS2poFkdAoZFh8lXzUnV9lChoBmgJaA9DCK98lufBmXFAlIaUUpRoFUuraBZHQKGRfDgqEvl1fZQoaAZoCWgPQwi7mGa611VwQJSGlFKUaBVLiGgWR0ChkYl6iTMadX2UKGgGaAloD0MIhnZOs4B3c0CUhpRSlGgVS8toFkdAoZH78R+SbHV9lChoBmgJaA9DCMGO/wIBGHJAlIaUUpRoFUupaBZHQKGSGOXE61d1fZQoaAZoCWgPQwiu78NBgvZxQJSGlFKUaBVLqWgWR0ChkmRBmf5DdX2UKGgGaAloD0MIAvG6fgH9cUCUhpRSlGgVS6ZoFkdAoZKFnoPkJnV9lChoBmgJaA9DCL2NzY7U13FAlIaUUpRoFUugaBZHQKGSnssQNCt1fZQoaAZoCWgPQwjBG9KoQOFwQJSGlFKUaBVLomgWR0ChkrqbKA8TdX2UKGgGaAloD0MId2SsNn/AckCUhpRSlGgVS8VoFkdAoZMG1ndwenV9lChoBmgJaA9DCDGXVG035XNAlIaUUpRoFUvhaBZHQKGTTtjTa0x1fZQoaAZoCWgPQwjFAl/RrSZyQJSGlFKUaBVLvmgWR0Chk1dGiHqNdX2UKGgGaAloD0MIIH9pUV9ackCUhpRSlGgVS+toFkdAoZN4bsF+u3V9lChoBmgJaA9DCESoUrOHw2JAlIaUUpRoFU3oA2gWR0ChlB/D+BH1dX2UKGgGaAloD0MIIO7qVeSMcECUhpRSlGgVS6BoFkdAoZRWelKsdXV9lChoBmgJaA9DCDnThO0nenBAlIaUUpRoFUuaaBZHQKGUo6Ae7tl1fZQoaAZoCWgPQwguAI3SJYlxQJSGlFKUaBVLmGgWR0ChlLWSU1Q7dX2UKGgGaAloD0MI1q2ek95kcUCUhpRSlGgVS7loFkdAoZS/WOIZZXV9lChoBmgJaA9DCJfGL7ySBHJAlIaUUpRoFUvKaBZHQKGU5DUExIt1fZQoaAZoCWgPQwibBG9Io7FvQJSGlFKUaBVLkWgWR0ChlPYIjW07dX2UKGgGaAloD0MInP2BcpsAdECUhpRSlGgVS6BoFkdAoZUPmgam43V9lChoBmgJaA9DCEdxjjo6AWVAlIaUUpRoFU3oA2gWR0ChlT8oH9m6dX2UKGgGaAloD0MITwMGSZ+5b0CUhpRSlGgVS6NoFkdAoZVIrBj4H3V9lChoBmgJaA9DCHGt9rAXs3JAlIaUUpRoFUuiaBZHQKGVVe/Ho5h1fZQoaAZoCWgPQwjBOLh0jJJyQJSGlFKUaBVLsmgWR0ChlcAYYR/WdX2UKGgGaAloD0MIQDGyZE6MckCUhpRSlGgVS5poFkdAoZXAI+nqFHV9lChoBmgJaA9DCEwXYvWHbXBAlIaUUpRoFUujaBZHQKGVxt0FKTV1fZQoaAZoCWgPQwiw/s9hPjB0QJSGlFKUaBVLxGgWR0Chlizch1TzdX2UKGgGaAloD0MInInpQizfc0CUhpRSlGgVS6hoFkdAoZZokE9t/HV9lChoBmgJaA9DCCI17WKaiHNAlIaUUpRoFUvCaBZHQKGW8JbdJrd1fZQoaAZoCWgPQwjAJmvUg9ByQJSGlFKUaBVLr2gWR0ChlwY95hScdX2UKGgGaAloD0MIEHf1KnLbcUCUhpRSlGgVS4hoFkdAoZcAlnh86XV9lChoBmgJaA9DCAA8okL1s3NAlIaUUpRoFUuZaBZHQKGXCzAN5MV1fZQoaAZoCWgPQwh7+DJRRClzQJSGlFKUaBVLwWgWR0Chly8Empl0dX2UKGgGaAloD0MInIu/7Umlc0CUhpRSlGgVS7RoFkdAoZc6sU7CBXV9lChoBmgJaA9DCJpeYizT93BAlIaUUpRoFUu6aBZHQKGXW1k1/Dt1fZQoaAZoCWgPQwgra5visUpzQJSGlFKUaBVLnmgWR0Chl10x/NJOdX2UKGgGaAloD0MIkSv1LIgnckCUhpRSlGgVS81oFkdAoZdr5j6N2nV9lChoBmgJaA9DCFPMQdBR2XJAlIaUUpRoFUu/aBZHQKGXrCF9KEp1fZQoaAZoCWgPQwhGCI82zoxwQJSGlFKUaBVLnGgWR0Chl7bXpW3jdX2UKGgGaAloD0MIK2haYmXucECUhpRSlGgVS7doFkdAoZgEjJMg2nV9lChoBmgJaA9DCG04LA38hnRAlIaUUpRoFUumaBZHQKGYOJNTLnt1fZQoaAZoCWgPQwhTBaOSejRwQJSGlFKUaBVLoGgWR0ChmGKRU3n7dX2UKGgGaAloD0MIQtKnVTQ2ckCUhpRSlGgVS9ZoFkdAoZhpwyZa3nV9lChoBmgJaA9DCJQvaCHBeHFAlIaUUpRoFUuHaBZHQKGYkHWSU1R1fZQoaAZoCWgPQwgXRnpRu9JxQJSGlFKUaBVLkWgWR0ChmMYO2AoYdX2UKGgGaAloD0MImGw82CKacECUhpRSlGgVS51oFkdAoZj1kDp1R3VlLg=="
|
76 |
},
|
77 |
"ep_success_buffer": {
|
78 |
":type:": "<class 'collections.deque'>",
|
|
|
82 |
"n_steps": 1024,
|
83 |
"gamma": 0.99,
|
84 |
"gae_lambda": 0.95,
|
85 |
+
"ent_coef": 0.0,
|
86 |
"vf_coef": 0.5,
|
87 |
"max_grad_norm": 0.5,
|
88 |
"batch_size": 64,
|
89 |
"n_epochs": 10,
|
90 |
"clip_range": {
|
91 |
":type:": "<class 'function'>",
|
92 |
+
":serialized:": "gAWVTQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwNX2J1aWx0aW5fdHlwZZSTlIwKTGFtYmRhVHlwZZSFlFKUKGgCjAhDb2RlVHlwZZSFlFKUKEsBSwBLAUsDSxNDHGQBiAAbAGQBGABkAXwAGAAUAGQBFwCIARQAUwCUTksBhpQpjANwY3SUhZSMHzxpcHl0aG9uLWlucHV0LTI3LTM4MzMzNDUyMWQ3NT6UjAg8bGFtYmRhPpRLAkMAlIwGZmFjdG9ylIwBeJSGlCl0lFKUfZQojAtfX3BhY2thZ2VfX5ROjAhfX25hbWVfX5SMCF9fbWFpbl9flHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUaBopUpSGlHSUUpSMHGNsb3VkcGlja2xlLmNsb3VkcGlja2xlX2Zhc3SUjBJfZnVuY3Rpb25fc2V0c3RhdGWUk5RoH32UfZQoaBdoDowMX19xdWFsbmFtZV9flIwkbGluZWFyX2RlY2F5X3NjaGVkLjxsb2NhbHM+LjxsYW1iZGE+lIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoGIwHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEsKhZRSlGgvRz/JmZmZmZmahZRSlIaUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"
|
93 |
},
|
94 |
"clip_range_vf": null,
|
95 |
"target_kl": null
|
LunarLander-v2-ppo/policy.optimizer.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 84637
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0231f82e28d580f8d2357fa4232cbf593c4cd463ea47cbccb4a2c7fcd76e6837
|
3 |
size 84637
|
LunarLander-v2-ppo/policy.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 43073
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3f40f091e67b09e9b12bbd11a7bb6ee9c04684eaf0859172f6ed9a81e4dfa211
|
3 |
size 43073
|
README.md
CHANGED
@@ -10,7 +10,7 @@ model-index:
|
|
10 |
results:
|
11 |
- metrics:
|
12 |
- type: mean_reward
|
13 |
-
value:
|
14 |
name: mean_reward
|
15 |
task:
|
16 |
type: reinforcement-learning
|
|
|
10 |
results:
|
11 |
- metrics:
|
12 |
- type: mean_reward
|
13 |
+
value: 274.96 +/- 15.47
|
14 |
name: mean_reward
|
15 |
task:
|
16 |
type: reinforcement-learning
|
config.json
CHANGED
@@ -1 +1 @@
|
|
1 |
-
{"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param sde_net_arch: Network architecture for extracting features\n when using gSDE. If None, the latent features from the policy will be used.\n Pass an empty list to use the states as features.\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7fd21fd5b4d0>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7fd21fd5b560>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7fd21fd5b5f0>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7fd21fd5b680>", "_build": "<function ActorCriticPolicy._build at 0x7fd21fd5b710>", "forward": "<function ActorCriticPolicy.forward at 0x7fd21fd5b7a0>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7fd21fd5b830>", "_predict": "<function ActorCriticPolicy._predict at 0x7fd21fd5b8c0>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7fd21fd5b950>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7fd21fd5b9e0>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7fd21fd5ba70>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc_data object at 0x7fd21fd34060>"}, "verbose": 1, "policy_kwargs": {}, "observation_space": {":type:": "<class 'gym.spaces.box.Box'>", ":serialized:": "gAWVngEAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBXNoYXBllEsIhZSMA2xvd5SMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYgAAAAAAAAAAAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/lGgKSwiFlIwBQ5R0lFKUjARoaWdolGgSKJYgAAAAAAAAAAAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/lGgKSwiFlGgVdJRSlIwNYm91bmRlZF9iZWxvd5RoEiiWCAAAAAAAAAAAAAAAAAAAAJRoB4wCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZRoFXSUUpSMDWJvdW5kZWRfYWJvdmWUaBIolggAAAAAAAAAAAAAAAAAAACUaCFLCIWUaBV0lFKUjApfbnBfcmFuZG9tlE51Yi4=", "dtype": "float32", "shape": [8], "low": "[-inf -inf -inf -inf -inf -inf -inf -inf]", "high": "[inf inf inf inf inf inf inf inf]", "bounded_below": "[False False False False False False False False]", "bounded_above": "[False False False False False False False False]", "_np_random": null}, "action_space": {":type:": "<class 'gym.spaces.discrete.Discrete'>", ":serialized:": "gAWVgQAAAAAAAACME2d5bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpRLBIwFc2hhcGWUKYwFZHR5cGWUjAVudW1weZRoB5OUjAJpOJSJiIeUUpQoSwOMATyUTk5OSv////9K/////0sAdJRijApfbnBfcmFuZG9tlE51Yi4=", "n": 4, "shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 16, "num_timesteps": 2015232, "_total_timesteps": 2000000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1652284910.763263, "learning_rate": {":type:": "<class 'function'>", ":serialized:": "gAWVTAIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwNX2J1aWx0aW5fdHlwZZSTlIwKTGFtYmRhVHlwZZSFlFKUKGgCjAhDb2RlVHlwZZSFlFKUKEsBSwBLAUsDSxNDHGQBiAAbAGQBGABkAXwAGAAUAGQBFwCIARQAUwCUTksBhpQpjANwY3SUhZSMHjxpcHl0aG9uLWlucHV0LTctMzgzMzM0NTIxZDc1PpSMCDxsYW1iZGE+lEsCQwCUjAZmYWN0b3KUjAF4lIaUKXSUUpR9lCiMC19fcGFja2FnZV9flE6MCF9fbmFtZV9flIwIX19tYWluX1+UdU5OaACMEF9tYWtlX2VtcHR5X2NlbGyUk5QpUpRoGilSlIaUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoF2gOjAxfX3F1YWxuYW1lX1+UjCRsaW5lYXJfZGVjYXlfc2NoZWQuPGxvY2Fscz4uPGxhbWJkYT6UjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgYjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOUSwqFlFKUaC9HP1BiTdLxqfyFlFKUhpSMF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="}, "tensorboard_log": "runs/27c28ti0", "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVTAIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwNX2J1aWx0aW5fdHlwZZSTlIwKTGFtYmRhVHlwZZSFlFKUKGgCjAhDb2RlVHlwZZSFlFKUKEsBSwBLAUsDSxNDHGQBiAAbAGQBGABkAXwAGAAUAGQBFwCIARQAUwCUTksBhpQpjANwY3SUhZSMHjxpcHl0aG9uLWlucHV0LTctMzgzMzM0NTIxZDc1PpSMCDxsYW1iZGE+lEsCQwCUjAZmYWN0b3KUjAF4lIaUKXSUUpR9lCiMC19fcGFja2FnZV9flE6MCF9fbmFtZV9flIwIX19tYWluX1+UdU5OaACMEF9tYWtlX2VtcHR5X2NlbGyUk5QpUpRoGilSlIaUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoF2gOjAxfX3F1YWxuYW1lX1+UjCRsaW5lYXJfZGVjYXlfc2NoZWQuPGxvY2Fscz4uPGxhbWJkYT6UjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgYjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOUSwqFlFKUaC9HP1BiTdLxqfyFlFKUhpSMF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="}, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAGjki76f8Ik/YFb1vsUIT7/+xKe+WrUVvgAAAAAAAAAAADGxPN30sD9fljc/7kjlvhKvmLwY/Ki9AAAAAAAAAACmLqk9LeU4P8phJzzmVXG/5cXxPdsIdL0AAAAAAAAAABoaX72PrkO6ZOyzupoBODNzB6y73ZfQOQAAgD8AAIA/ZnKDvLihvz88Ucq9Ha+MPZtYC7yXDiu9AAAAAAAAAADNz6I8u4i2P9zThz5ME4Q8creDuy2Lhj0AAAAAAAAAAGYwpT374pU95js8vrzexb5VX1a9NwO8vQAAAAAAAAAA5j5SPSl8CTmSDJ6zZJlYLma0aLvQzsQzAACAPwAAgD8AQJ46UfyvPxrsjjxXBp6+6Peyuor6f7sAAAAAAAAAABrdZD0UHJ26Xk64t5ow6bJI74s6gnjTNgAAgD8AAIA/GhqmPbi/uD3Nb7a3AnO5vl1/Nj1+Lf88AAAAAAAAAACa50c9vRUwPNFlwb05jl6+zi6MvUmZEr0AAAAAAAAAAO2tDD4Ldas/lvcjP8nQ0b7dxzI+pWP0PgAAAAAAAAAAzaLlvK5pobpWxPO3Gh7YsoYR8bkWSQw3AACAPwAAgD+ttho+xGl+P3xDsT4c4i6/H56YPmq9fj4AAAAAAAAAALqPGj7+IZs+YhemvhPYKL/OoDW91sizvQAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.007616000000000067, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVHRAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIrwYoDTU4cUCUhpRSlIwBbJRLsYwBdJRHQKIYpgx8D0V1fZQoaAZoCWgPQwiIodXJGSJwQJSGlFKUaBVLlWgWR0CiGKEJa7mMdX2UKGgGaAloD0MIPXyZKIK+cECUhpRSlGgVS4poFkdAohi591EE1XV9lChoBmgJaA9DCP9YiA4BYnJAlIaUUpRoFUu8aBZHQKIY2mTkhid1fZQoaAZoCWgPQwiI2jaMwnRyQJSGlFKUaBVL1GgWR0CiLIExh2GJdX2UKGgGaAloD0MIwVQza2lLcECUhpRSlGgVS51oFkdAoiyCjJuEVXV9lChoBmgJaA9DCKwCtRg8o3BAlIaUUpRoFUubaBZHQKIshZ7HAAR1fZQoaAZoCWgPQwg9gbBTbFRzQJSGlFKUaBVLrmgWR0CiLJhkqc3EdX2UKGgGaAloD0MIxvzc0NQNckCUhpRSlGgVS7hoFkdAoi19jurp7nV9lChoBmgJaA9DCCmYMQWrxnJAlIaUUpRoFUugaBZHQKItoPYnOSp1fZQoaAZoCWgPQwjwplt2CC1zQJSGlFKUaBVLvGgWR0CiLagntv4udX2UKGgGaAloD0MIQnbexiZKckCUhpRSlGgVS6BoFkdAoi3LxiG34XV9lChoBmgJaA9DCIbLKmyGhnNAlIaUUpRoFUu9aBZHQKIt7lZowmF1fZQoaAZoCWgPQwgotoKmZUxzQJSGlFKUaBVLpmgWR0CiLfXumaYvdX2UKGgGaAloD0MIOPbsuUwDcECUhpRSlGgVS5doFkdAoi4JRCQcP3V9lChoBmgJaA9DCKJ+F7YmnnBAlIaUUpRoFUuraBZHQKIuGWN3np11fZQoaAZoCWgPQwheglMfyAdwQJSGlFKUaBVLpWgWR0CiLh7JfYz0dX2UKGgGaAloD0MIMZdUbbc6cECUhpRSlGgVS49oFkdAoi5MiKR+0HV9lChoBmgJaA9DCMbhzK8mFXJAlIaUUpRoFUu/aBZHQKIude7cwg11fZQoaAZoCWgPQwiDaoMT0UJyQJSGlFKUaBVLr2gWR0CiLoBg3LmqdX2UKGgGaAloD0MIbvqzH6mcckCUhpRSlGgVS9RoFkdAoi6Xxx1gY3V9lChoBmgJaA9DCGprRDAOsnFAlIaUUpRoFUuvaBZHQKIutGyX2M91fZQoaAZoCWgPQwi3ek56X8NzQJSGlFKUaBVLvmgWR0CiLtw8OkLydX2UKGgGaAloD0MIBJFFmng7SkCUhpRSlGgVS1NoFkdAoi8UdPtUoHV9lChoBmgJaA9DCFK2SNpNQnJAlIaUUpRoFUvZaBZHQKIvZK6nR9h1fZQoaAZoCWgPQwjfUznt6SxwQJSGlFKUaBVLjWgWR0CiL6tSZSeidX2UKGgGaAloD0MIlsyxvKudcUCUhpRSlGgVS4NoFkdAoi/fWe6I33V9lChoBmgJaA9DCLGJzFwgoXFAlIaUUpRoFUuUaBZHQKIv8sXizcB1fZQoaAZoCWgPQwh4nKIjedZxQJSGlFKUaBVLsGgWR0CiL/2+wkgPdX2UKGgGaAloD0MIlkIglzhOdECUhpRSlGgVS7JoFkdAojAMp5NXYHV9lChoBmgJaA9DCFn4+lpX5XJAlIaUUpRoFUvCaBZHQKIwHBw++uh1fZQoaAZoCWgPQwi0VrQ5jjlzQJSGlFKUaBVLnmgWR0CiMDdfb9IgdX2UKGgGaAloD0MIuAGfH4aEcECUhpRSlGgVS4toFkdAojBZi9ZieHV9lChoBmgJaA9DCBqiCn8GJHJAlIaUUpRoFUu7aBZHQKIwbJL/S6V1fZQoaAZoCWgPQwj4ja8984xwQJSGlFKUaBVLmGgWR0CiMJ6By0a7dX2UKGgGaAloD0MI6fLmcK2Fc0CUhpRSlGgVS6hoFkdAojC5zeXRgXV9lChoBmgJaA9DCEcCDTY1dnFAlIaUUpRoFUu9aBZHQKIwxj0+TvB1fZQoaAZoCWgPQwiYE7TJYVdyQJSGlFKUaBVLmmgWR0CiMOhAWznidX2UKGgGaAloD0MIvk1/9uNVckCUhpRSlGgVS7FoFkdAojEITCcf/3V9lChoBmgJaA9DCCMsKuJ06XBAlIaUUpRoFUulaBZHQKIxPyqdYnx1fZQoaAZoCWgPQwhwe4LE9qFwQJSGlFKUaBVLj2gWR0CiMTlHz6JqdX2UKGgGaAloD0MIqOMxA1WJcUCUhpRSlGgVS45oFkdAojGm/Ho5gnV9lChoBmgJaA9DCCno9pJGY3FAlIaUUpRoFUuXaBZHQKIx477sOXp1fZQoaAZoCWgPQwi8dJMYBHxwQJSGlFKUaBVLmGgWR0CiMfSIpH7QdX2UKGgGaAloD0MIgPRNmoalc0CUhpRSlGgVS7JoFkdAojH0nkT6BXV9lChoBmgJaA9DCE2CN6RRvnFAlIaUUpRoFUu7aBZHQKIyeNjLB9F1fZQoaAZoCWgPQwhioGtfgLpxQJSGlFKUaBVLpWgWR0CiMoUeU6gedX2UKGgGaAloD0MIL/1LUtlHcUCUhpRSlGgVS7BoFkdAojKViWmgrnV9lChoBmgJaA9DCOmedY3W93BAlIaUUpRoFUuVaBZHQKIyposZpBZ1fZQoaAZoCWgPQwiKk/sdirFxQJSGlFKUaBVLo2gWR0CiMrgWrOqvdX2UKGgGaAloD0MIYhVvZB4Wc0CUhpRSlGgVS+RoFkdAojLaSvC/GnV9lChoBmgJaA9DCIS53cu9dXJAlIaUUpRoFUumaBZHQKIy5/8VHnV1fZQoaAZoCWgPQwiC4seYu1F0QJSGlFKUaBVL1GgWR0CiMuXTEzfrdX2UKGgGaAloD0MI2QkvwekdcUCUhpRSlGgVS5toFkdAojMCEBbOeXV9lChoBmgJaA9DCPnAjv+C+XJAlIaUUpRoFUudaBZHQKIzMf8Muvl1fZQoaAZoCWgPQwgA4q5eBedyQJSGlFKUaBVLvGgWR0CiM0NwR5C4dX2UKGgGaAloD0MIEy15PG22cUCUhpRSlGgVS69oFkdAojN0G3WnTHV9lChoBmgJaA9DCEuTUtAt4nFAlIaUUpRoFUutaBZHQKI0FV6NVBF1fZQoaAZoCWgPQwg34sluJmxwQJSGlFKUaBVLp2gWR0CiNBMuFpPAdX2UKGgGaAloD0MIV12HasowckCUhpRSlGgVS7FoFkdAojQ3zg/C7HV9lChoBmgJaA9DCDKR0mzeynNAlIaUUpRoFUvRaBZHQKI0XzK9wm51fZQoaAZoCWgPQwjryfyjr29yQJSGlFKUaBVLfmgWR0CiNHzW5H3DdX2UKGgGaAloD0MIYcJoVnYucECUhpRSlGgVS5toFkdAojSVZRsMzHV9lChoBmgJaA9DCNcS8kHPknNAlIaUUpRoFUujaBZHQKI0oCZF5Od1fZQoaAZoCWgPQwjXS1ME+NRwQJSGlFKUaBVLn2gWR0CiNLY5cTrWdX2UKGgGaAloD0MIyJQPQRVCcUCUhpRSlGgVS51oFkdAojS/wy6+WXV9lChoBmgJaA9DCPHwngPL2W9AlIaUUpRoFUuaaBZHQKI05nSOR1Z1fZQoaAZoCWgPQwjEd2LWiytzQJSGlFKUaBVLzGgWR0CiNRYWcjJNdX2UKGgGaAloD0MI6RA4Emg5cUCUhpRSlGgVS7doFkdAojVGevpyInV9lChoBmgJaA9DCO+SOCviknBAlIaUUpRoFUuxaBZHQKI1rBa9sad1fZQoaAZoCWgPQwi9GTVf5d1wQJSGlFKUaBVLqGgWR0CiNcB1cMVldX2UKGgGaAloD0MIkh/xK5YVc0CUhpRSlGgVS9loFkdAojXoQz1scnV9lChoBmgJaA9DCNCZtKk6e3JAlIaUUpRoFUuRaBZHQKI2DCjUNKB1fZQoaAZoCWgPQwje5/hosWBzQJSGlFKUaBVL1WgWR0CiNhXNcGC7dX2UKGgGaAloD0MIT3Yzo1+tcUCUhpRSlGgVS7NoFkdAojZ329L6DXV9lChoBmgJaA9DCAIQd/Wq5nBAlIaUUpRoFUupaBZHQKI2d8a4tpV1fZQoaAZoCWgPQwh5eM+B5WVzQJSGlFKUaBVLrGgWR0CiNqITXarWdX2UKGgGaAloD0MI4Ep2bASrcECUhpRSlGgVS6FoFkdAojazKNhmXnV9lChoBmgJaA9DCF35LM+DanJAlIaUUpRoFUuSaBZHQKI20oiLVFx1fZQoaAZoCWgPQwjx8nSuaNhxQJSGlFKUaBVLvWgWR0CiNvFXq7iAdX2UKGgGaAloD0MImkS94NO6b0CUhpRSlGgVS6loFkdAojbw9ovi+HV9lChoBmgJaA9DCKj/rPlxJXBAlIaUUpRoFUuJaBZHQKI3Cvjfek51fZQoaAZoCWgPQwhTILOzKCNyQJSGlFKUaBVLuWgWR0CiNxZHd43WdX2UKGgGaAloD0MItVAyOXXTcUCUhpRSlGgVS8toFkdAojc4s7MgU3V9lChoBmgJaA9DCPa0w19TH3JAlIaUUpRoFUt4aBZHQKI3PF4LThJ1fZQoaAZoCWgPQwgDfSJPEuhxQJSGlFKUaBVLrmgWR0CiN1CTdLxqdX2UKGgGaAloD0MI3xYs1UXyckCUhpRSlGgVS6poFkdAojfB2IO6NHV9lChoBmgJaA9DCIy/7QkSV3JAlIaUUpRoFUuQaBZHQKI3z/MGHHp1fZQoaAZoCWgPQwh7iEZ3UHVyQJSGlFKUaBVLgGgWR0CiOACdz4lAdX2UKGgGaAloD0MIfqfJjLdyUECUhpRSlGgVS3doFkdAojge+AVfu3V9lChoBmgJaA9DCIKtEixOGXFAlIaUUpRoFUu2aBZHQKI4IYPXkHV1fZQoaAZoCWgPQwhDkIMSZqpxQJSGlFKUaBVLo2gWR0CiOHLl3hXKdX2UKGgGaAloD0MIhzJUxRRxckCUhpRSlGgVS89oFkdAojiXgYP5HnV9lChoBmgJaA9DCMTMPo/RWm5AlIaUUpRoFUufaBZHQKI45HSWqtJ1fZQoaAZoCWgPQwgXK2owjeBzQJSGlFKUaBVLyGgWR0CiORmx2SuAdX2UKGgGaAloD0MI/82LE9+6c0CUhpRSlGgVS7poFkdAojk+hRIjGHV9lChoBmgJaA9DCDZ39L9crHJAlIaUUpRoFUumaBZHQKI5UXLvCuV1fZQoaAZoCWgPQwh2cRsNoPpzQJSGlFKUaBVL0mgWR0CiOWntF8XvdX2UKGgGaAloD0MI5X6HokBVc0CUhpRSlGgVS75oFkdAojln9xZMc3V9lChoBmgJaA9DCLn+XZ85D3NAlIaUUpRoFUu0aBZHQKI5fSofjjt1ZS4="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 1230, "n_steps": 1024, "gamma": 0.99, "gae_lambda": 0.95, "ent_coef": 0.01, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 10, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWVTAIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwNX2J1aWx0aW5fdHlwZZSTlIwKTGFtYmRhVHlwZZSFlFKUKGgCjAhDb2RlVHlwZZSFlFKUKEsBSwBLAUsDSxNDHGQBiAAbAGQBGABkAXwAGAAUAGQBFwCIARQAUwCUTksBhpQpjANwY3SUhZSMHjxpcHl0aG9uLWlucHV0LTctMzgzMzM0NTIxZDc1PpSMCDxsYW1iZGE+lEsCQwCUjAZmYWN0b3KUjAF4lIaUKXSUUpR9lCiMC19fcGFja2FnZV9flE6MCF9fbmFtZV9flIwIX19tYWluX1+UdU5OaACMEF9tYWtlX2VtcHR5X2NlbGyUk5QpUpRoGilSlIaUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoF2gOjAxfX3F1YWxuYW1lX1+UjCRsaW5lYXJfZGVjYXlfc2NoZWQuPGxvY2Fscz4uPGxhbWJkYT6UjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgYjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOUSwqFlFKUaC9HP8mZmZmZmZqFlFKUhpSMF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="}, "clip_range_vf": null, "target_kl": null, "system_info": {"OS": "Linux-5.4.188+-x86_64-with-Ubuntu-18.04-bionic #1 SMP Sun Apr 24 10:03:06 PDT 2022", "Python": "3.7.13", "Stable-Baselines3": "1.4.0", "PyTorch": "1.11.0+cu113", "GPU Enabled": "False", "Numpy": "1.21.6", "Gym": "0.17.3"}}
|
|
|
1 |
+
{"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param sde_net_arch: Network architecture for extracting features\n when using gSDE. If None, the latent features from the policy will be used.\n Pass an empty list to use the states as features.\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7f2ecf22b710>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f2ecf22b7a0>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f2ecf22b830>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f2ecf22b8c0>", "_build": "<function ActorCriticPolicy._build at 0x7f2ecf22b950>", "forward": "<function ActorCriticPolicy.forward at 0x7f2ecf22b9e0>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f2ecf22ba70>", "_predict": "<function ActorCriticPolicy._predict at 0x7f2ecf22bb00>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f2ecf22bb90>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f2ecf22bc20>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f2ecf22bcb0>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc_data object at 0x7f2ecf26cbd0>"}, "verbose": 1, "policy_kwargs": {}, "observation_space": {":type:": "<class 'gym.spaces.box.Box'>", ":serialized:": "gAWVngEAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBXNoYXBllEsIhZSMA2xvd5SMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYgAAAAAAAAAAAAgP8AAID/AACA/wAAgP8AAID/AACA/wAAgP8AAID/lGgKSwiFlIwBQ5R0lFKUjARoaWdolGgSKJYgAAAAAAAAAAAAgH8AAIB/AACAfwAAgH8AAIB/AACAfwAAgH8AAIB/lGgKSwiFlGgVdJRSlIwNYm91bmRlZF9iZWxvd5RoEiiWCAAAAAAAAAAAAAAAAAAAAJRoB4wCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZRoFXSUUpSMDWJvdW5kZWRfYWJvdmWUaBIolggAAAAAAAAAAAAAAAAAAACUaCFLCIWUaBV0lFKUjApfbnBfcmFuZG9tlE51Yi4=", "dtype": "float32", "shape": [8], "low": "[-inf -inf -inf -inf -inf -inf -inf -inf]", "high": "[inf inf inf inf inf inf inf inf]", "bounded_below": "[False False False False False False False False]", "bounded_above": "[False False False False False False False False]", "_np_random": null}, "action_space": {":type:": "<class 'gym.spaces.discrete.Discrete'>", ":serialized:": "gAWVgQAAAAAAAACME2d5bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpRLBIwFc2hhcGWUKYwFZHR5cGWUjAVudW1weZRoB5OUjAJpOJSJiIeUUpQoSwOMATyUTk5OSv////9K/////0sAdJRijApfbnBfcmFuZG9tlE51Yi4=", "n": 4, "shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 16, "num_timesteps": 2015232, "_total_timesteps": 2000000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1652472552.9625235, "learning_rate": {":type:": "<class 'function'>", ":serialized:": "gAWVTQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwNX2J1aWx0aW5fdHlwZZSTlIwKTGFtYmRhVHlwZZSFlFKUKGgCjAhDb2RlVHlwZZSFlFKUKEsBSwBLAUsDSxNDHGQBiAAbAGQBGABkAXwAGAAUAGQBFwCIARQAUwCUTksBhpQpjANwY3SUhZSMHzxpcHl0aG9uLWlucHV0LTI3LTM4MzMzNDUyMWQ3NT6UjAg8bGFtYmRhPpRLAkMAlIwGZmFjdG9ylIwBeJSGlCl0lFKUfZQojAtfX3BhY2thZ2VfX5ROjAhfX25hbWVfX5SMCF9fbWFpbl9flHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUaBopUpSGlHSUUpSMHGNsb3VkcGlja2xlLmNsb3VkcGlja2xlX2Zhc3SUjBJfZnVuY3Rpb25fc2V0c3RhdGWUk5RoH32UfZQoaBdoDowMX19xdWFsbmFtZV9flIwkbGluZWFyX2RlY2F5X3NjaGVkLjxsb2NhbHM+LjxsYW1iZGE+lIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoGIwHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEsKhZRSlGgvRz9QYk3S8an8hZRSlIaUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "tensorboard_log": "runs/gf22ryeo", "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVTQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwNX2J1aWx0aW5fdHlwZZSTlIwKTGFtYmRhVHlwZZSFlFKUKGgCjAhDb2RlVHlwZZSFlFKUKEsBSwBLAUsDSxNDHGQBiAAbAGQBGABkAXwAGAAUAGQBFwCIARQAUwCUTksBhpQpjANwY3SUhZSMHzxpcHl0aG9uLWlucHV0LTI3LTM4MzMzNDUyMWQ3NT6UjAg8bGFtYmRhPpRLAkMAlIwGZmFjdG9ylIwBeJSGlCl0lFKUfZQojAtfX3BhY2thZ2VfX5ROjAhfX25hbWVfX5SMCF9fbWFpbl9flHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUaBopUpSGlHSUUpSMHGNsb3VkcGlja2xlLmNsb3VkcGlja2xlX2Zhc3SUjBJfZnVuY3Rpb25fc2V0c3RhdGWUk5RoH32UfZQoaBdoDowMX19xdWFsbmFtZV9flIwkbGluZWFyX2RlY2F5X3NjaGVkLjxsb2NhbHM+LjxsYW1iZGE+lIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoGIwHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEsKhZRSlGgvRz9QYk3S8an8hZRSlIaUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAAD0uzwI7XQ/7h2SPTPkZb+Qck49dpHQPAAAAAAAAAAAGj0rPeGok7qDqUi9kDB2MMKhhrrSVp+zAACAPwAAgD+zHRS+uOjNPFYDrz6nfl++tTJmPqti1z0AAAAAAAAAABrvIj5SP4O7qHxAuRN4UTYmk7m8WlZeOAAAgD8AAIA/GrALPYXsx7vhmgu8oQqOOyF2TT2vM4a8AACAPwAAgD8Nx5s9re3SPtYLqzx/ZiK/tTrNPQ/EKb0AAAAAAAAAAIa6Cb41KTs/t+JLvndXb79GmDS+EnlWvQAAAAAAAAAA2owYvqNXYD3ntYw+fdJhvjM5T73Igzk+AAAAAAAAAAC6vAC+3ymFP1ZAjb6nIXG/gZsJvlNV6r0AAAAAAAAAADN/Tr32wDC6TrUKPAaH/LLOF3m7KP9+sgAAgD8AAIA/JleIPY/OfbooAto3ZvDQMjJ2cbkLq/62AACAPwAAgD+AVsS9FESEupJngD6pyai4UcNduxmhn7cAAIA/AAAAAM2ee7zDsQu6rwG2ty9UpbICS+a7Q/HZNgAAgD8AAIA/qhB6vl4BKj8Wcwq+xSIovxiynb5TkLM8AAAAAAAAAACavPQ9hTCpPrU2471GuhW/Lv7APdqUnb0AAAAAAAAAAM3MUzyCz6Y/KHLmPSysC7/vFoI8Su/nOgAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.007616000000000067, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVHxAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIAwtgykCRcUCUhpRSlIwBbJRLpYwBdJRHQKF1zsiSq2l1fZQoaAZoCWgPQwiscwzIHpdwQJSGlFKUaBVLqWgWR0ChdgMZHd43dX2UKGgGaAloD0MInDQNiiZecECUhpRSlGgVS6VoFkdAoXYXoRqXW3V9lChoBmgJaA9DCGdkkLuI2m9AlIaUUpRoFUueaBZHQKF2OKYRdyF1fZQoaAZoCWgPQwh3K0t0FsdyQJSGlFKUaBVLwGgWR0Chdk0rsjVydX2UKGgGaAloD0MI9phIaba4cUCUhpRSlGgVS7loFkdAoXZ1+CsfaHV9lChoBmgJaA9DCLNAu0NK3HFAlIaUUpRoFUu7aBZHQKF2kpx3mmt1fZQoaAZoCWgPQwhSf73CAohwQJSGlFKUaBVLo2gWR0ChdpDtG/etdX2UKGgGaAloD0MI2ILeG4P6c0CUhpRSlGgVS+1oFkdAoXa9OARTTHV9lChoBmgJaA9DCM3n3O36/25AlIaUUpRoFUuUaBZHQKF286HTI/91fZQoaAZoCWgPQwjOp45ViptyQJSGlFKUaBVLq2gWR0ChdzO9eyAydX2UKGgGaAloD0MIJCao4ZtDckCUhpRSlGgVS89oFkdAoXdJ2OhkAnV9lChoBmgJaA9DCDGVfsKZYnNAlIaUUpRoFUuyaBZHQKF3+EU0vXd1fZQoaAZoCWgPQwhD5zV2CX9wQJSGlFKUaBVLn2gWR0CheAhuXNTtdX2UKGgGaAloD0MI/Yf021ejcECUhpRSlGgVS6BoFkdAoXgNlPJq7HV9lChoBmgJaA9DCAO2gxH78nFAlIaUUpRoFUuNaBZHQKF4F4Uvf0p1fZQoaAZoCWgPQwgzjLtBtIlxQJSGlFKUaBVLmWgWR0CheGihWYF8dX2UKGgGaAloD0MIt7QaEjc3c0CUhpRSlGgVS7doFkdAoXifVbzK93V9lChoBmgJaA9DCHNmu0IfWXFAlIaUUpRoFUuXaBZHQKGJ3uIhyKh1fZQoaAZoCWgPQwgtlbcjnLNyQJSGlFKUaBVLwGgWR0ChigFIVdondX2UKGgGaAloD0MIB5eOOc9MbkCUhpRSlGgVS7hoFkdAoYoOu9vjwXV9lChoBmgJaA9DCOC8OPEVCnRAlIaUUpRoFUu4aBZHQKGKK3y7PIJ1fZQoaAZoCWgPQwiAEMmQ409xQJSGlFKUaBVLkmgWR0ChikwjUutfdX2UKGgGaAloD0MIRwTj4JK3cECUhpRSlGgVS6RoFkdAoYpK3uuzQnV9lChoBmgJaA9DCE8kmGomgHNAlIaUUpRoFUvKaBZHQKGKafwqiGp1fZQoaAZoCWgPQwg/4ezWMmFxQJSGlFKUaBVLrmgWR0ChisWWpqASdX2UKGgGaAloD0MIUn5S7RMpckCUhpRSlGgVS9RoFkdAoYwjobGWEHV9lChoBmgJaA9DCJYlOsss0HJAlIaUUpRoFUvSaBZHQKGMQMjNY8x1fZQoaAZoCWgPQwiPpnoyP+NyQJSGlFKUaBVL3GgWR0ChjFnbItDldX2UKGgGaAloD0MI9wMeGEDlc0CUhpRSlGgVS9toFkdAoYxdGI9C/3V9lChoBmgJaA9DCPz/OGHCOHNAlIaUUpRoFUu8aBZHQKGMeOLiuMd1fZQoaAZoCWgPQwgpIVhVr91vQJSGlFKUaBVLmmgWR0ChjHZOSGJvdX2UKGgGaAloD0MITyMtlfefc0CUhpRSlGgVS9NoFkdAoYyXp6hQFnV9lChoBmgJaA9DCNKOG36323BAlIaUUpRoFUuhaBZHQKGM8npjc211fZQoaAZoCWgPQwhPBkfJK2JyQJSGlFKUaBVLyWgWR0ChjPnwgDA8dX2UKGgGaAloD0MIKo4Dr5ZTcUCUhpRSlGgVS6xoFkdAoYz8/lhgE3V9lChoBmgJaA9DCAZM4NZdbm9AlIaUUpRoFUuQaBZHQKGNEGVRk3F1fZQoaAZoCWgPQwgbDeAtEB9yQJSGlFKUaBVLvWgWR0ChjRiQ1aW5dX2UKGgGaAloD0MIf6MdNzy1cUCUhpRSlGgVS7poFkdAoY0sfs/puHV9lChoBmgJaA9DCCC1iZO7GnNAlIaUUpRoFUvTaBZHQKGNPD7ZWaN1fZQoaAZoCWgPQwjdJtwrc8pvQJSGlFKUaBVLi2gWR0ChjnKRuCPIdX2UKGgGaAloD0MIf6FHjF5KcECUhpRSlGgVS4poFkdAoY6I7JW/8HV9lChoBmgJaA9DCGwldJdEXHJAlIaUUpRoFUu0aBZHQKGPJk5IYm91fZQoaAZoCWgPQwh1HaopiU9xQJSGlFKUaBVLr2gWR0ChjzHvMKTjdX2UKGgGaAloD0MIjukJS7wcckCUhpRSlGgVS8poFkdAoY9TB9Cu2nV9lChoBmgJaA9DCDTW/s62+nFAlIaUUpRoFUvDaBZHQKGPUNBnjAB1fZQoaAZoCWgPQwjQtpp1hjdyQJSGlFKUaBVLiGgWR0Chj2+ZG8VYdX2UKGgGaAloD0MI3H9kOrRsckCUhpRSlGgVS6FoFkdAoY+LiKiwjnV9lChoBmgJaA9DCEJClC+oZHNAlIaUUpRoFUu9aBZHQKGPknXumaZ1fZQoaAZoCWgPQwivXkVGBy5xQJSGlFKUaBVLl2gWR0Chj5mMXJo1dX2UKGgGaAloD0MIWTFcHQAjckCUhpRSlGgVS7FoFkdAoY/IIKMNt3V9lChoBmgJaA9DCHAi+rV1UXJAlIaUUpRoFUu3aBZHQKGP2SYgJTl1fZQoaAZoCWgPQwhU/N8RlWRxQJSGlFKUaBVLsWgWR0Chj+1hTfixdX2UKGgGaAloD0MIl/+Qfvt6C8CUhpRSlGgVS2poFkdAoZFh8lXzUnV9lChoBmgJaA9DCK98lufBmXFAlIaUUpRoFUuraBZHQKGRfDgqEvl1fZQoaAZoCWgPQwi7mGa611VwQJSGlFKUaBVLiGgWR0ChkYl6iTMadX2UKGgGaAloD0MIhnZOs4B3c0CUhpRSlGgVS8toFkdAoZH78R+SbHV9lChoBmgJaA9DCMGO/wIBGHJAlIaUUpRoFUupaBZHQKGSGOXE61d1fZQoaAZoCWgPQwiu78NBgvZxQJSGlFKUaBVLqWgWR0ChkmRBmf5DdX2UKGgGaAloD0MIAvG6fgH9cUCUhpRSlGgVS6ZoFkdAoZKFnoPkJnV9lChoBmgJaA9DCL2NzY7U13FAlIaUUpRoFUugaBZHQKGSnssQNCt1fZQoaAZoCWgPQwjBG9KoQOFwQJSGlFKUaBVLomgWR0ChkrqbKA8TdX2UKGgGaAloD0MId2SsNn/AckCUhpRSlGgVS8VoFkdAoZMG1ndwenV9lChoBmgJaA9DCDGXVG035XNAlIaUUpRoFUvhaBZHQKGTTtjTa0x1fZQoaAZoCWgPQwjFAl/RrSZyQJSGlFKUaBVLvmgWR0Chk1dGiHqNdX2UKGgGaAloD0MIIH9pUV9ackCUhpRSlGgVS+toFkdAoZN4bsF+u3V9lChoBmgJaA9DCESoUrOHw2JAlIaUUpRoFU3oA2gWR0ChlB/D+BH1dX2UKGgGaAloD0MIIO7qVeSMcECUhpRSlGgVS6BoFkdAoZRWelKsdXV9lChoBmgJaA9DCDnThO0nenBAlIaUUpRoFUuaaBZHQKGUo6Ae7tl1fZQoaAZoCWgPQwguAI3SJYlxQJSGlFKUaBVLmGgWR0ChlLWSU1Q7dX2UKGgGaAloD0MI1q2ek95kcUCUhpRSlGgVS7loFkdAoZS/WOIZZXV9lChoBmgJaA9DCJfGL7ySBHJAlIaUUpRoFUvKaBZHQKGU5DUExIt1fZQoaAZoCWgPQwibBG9Io7FvQJSGlFKUaBVLkWgWR0ChlPYIjW07dX2UKGgGaAloD0MInP2BcpsAdECUhpRSlGgVS6BoFkdAoZUPmgam43V9lChoBmgJaA9DCEdxjjo6AWVAlIaUUpRoFU3oA2gWR0ChlT8oH9m6dX2UKGgGaAloD0MITwMGSZ+5b0CUhpRSlGgVS6NoFkdAoZVIrBj4H3V9lChoBmgJaA9DCHGt9rAXs3JAlIaUUpRoFUuiaBZHQKGVVe/Ho5h1fZQoaAZoCWgPQwjBOLh0jJJyQJSGlFKUaBVLsmgWR0ChlcAYYR/WdX2UKGgGaAloD0MIQDGyZE6MckCUhpRSlGgVS5poFkdAoZXAI+nqFHV9lChoBmgJaA9DCEwXYvWHbXBAlIaUUpRoFUujaBZHQKGVxt0FKTV1fZQoaAZoCWgPQwiw/s9hPjB0QJSGlFKUaBVLxGgWR0Chlizch1TzdX2UKGgGaAloD0MInInpQizfc0CUhpRSlGgVS6hoFkdAoZZokE9t/HV9lChoBmgJaA9DCCI17WKaiHNAlIaUUpRoFUvCaBZHQKGW8JbdJrd1fZQoaAZoCWgPQwjAJmvUg9ByQJSGlFKUaBVLr2gWR0ChlwY95hScdX2UKGgGaAloD0MIEHf1KnLbcUCUhpRSlGgVS4hoFkdAoZcAlnh86XV9lChoBmgJaA9DCAA8okL1s3NAlIaUUpRoFUuZaBZHQKGXCzAN5MV1fZQoaAZoCWgPQwh7+DJRRClzQJSGlFKUaBVLwWgWR0Chly8Empl0dX2UKGgGaAloD0MInIu/7Umlc0CUhpRSlGgVS7RoFkdAoZc6sU7CBXV9lChoBmgJaA9DCJpeYizT93BAlIaUUpRoFUu6aBZHQKGXW1k1/Dt1fZQoaAZoCWgPQwgra5visUpzQJSGlFKUaBVLnmgWR0Chl10x/NJOdX2UKGgGaAloD0MIkSv1LIgnckCUhpRSlGgVS81oFkdAoZdr5j6N2nV9lChoBmgJaA9DCFPMQdBR2XJAlIaUUpRoFUu/aBZHQKGXrCF9KEp1fZQoaAZoCWgPQwhGCI82zoxwQJSGlFKUaBVLnGgWR0Chl7bXpW3jdX2UKGgGaAloD0MIK2haYmXucECUhpRSlGgVS7doFkdAoZgEjJMg2nV9lChoBmgJaA9DCG04LA38hnRAlIaUUpRoFUumaBZHQKGYOJNTLnt1fZQoaAZoCWgPQwhTBaOSejRwQJSGlFKUaBVLoGgWR0ChmGKRU3n7dX2UKGgGaAloD0MIQtKnVTQ2ckCUhpRSlGgVS9ZoFkdAoZhpwyZa3nV9lChoBmgJaA9DCJQvaCHBeHFAlIaUUpRoFUuHaBZHQKGYkHWSU1R1fZQoaAZoCWgPQwgXRnpRu9JxQJSGlFKUaBVLkWgWR0ChmMYO2AoYdX2UKGgGaAloD0MImGw82CKacECUhpRSlGgVS51oFkdAoZj1kDp1R3VlLg=="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 1230, "n_steps": 1024, "gamma": 0.99, "gae_lambda": 0.95, "ent_coef": 0.0, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 10, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWVTQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwNX2J1aWx0aW5fdHlwZZSTlIwKTGFtYmRhVHlwZZSFlFKUKGgCjAhDb2RlVHlwZZSFlFKUKEsBSwBLAUsDSxNDHGQBiAAbAGQBGABkAXwAGAAUAGQBFwCIARQAUwCUTksBhpQpjANwY3SUhZSMHzxpcHl0aG9uLWlucHV0LTI3LTM4MzMzNDUyMWQ3NT6UjAg8bGFtYmRhPpRLAkMAlIwGZmFjdG9ylIwBeJSGlCl0lFKUfZQojAtfX3BhY2thZ2VfX5ROjAhfX25hbWVfX5SMCF9fbWFpbl9flHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUaBopUpSGlHSUUpSMHGNsb3VkcGlja2xlLmNsb3VkcGlja2xlX2Zhc3SUjBJfZnVuY3Rpb25fc2V0c3RhdGWUk5RoH32UfZQoaBdoDowMX19xdWFsbmFtZV9flIwkbGluZWFyX2RlY2F5X3NjaGVkLjxsb2NhbHM+LjxsYW1iZGE+lIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoGIwHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEsKhZRSlGgvRz/JmZmZmZmahZRSlIaUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "clip_range_vf": null, "target_kl": null, "system_info": {"OS": "Linux-5.4.188+-x86_64-with-Ubuntu-18.04-bionic #1 SMP Sun Apr 24 10:03:06 PDT 2022", "Python": "3.7.13", "Stable-Baselines3": "1.4.0", "PyTorch": "1.11.0+cu113", "GPU Enabled": "False", "Numpy": "1.21.6", "Gym": "0.17.3"}}
|
replay.mp4
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:59454b2cee1b147653b6b233ee2f69d7dece2a6533ec9885aad9321e550a94af
|
3 |
+
size 200437
|
results.json
CHANGED
@@ -1 +1 @@
|
|
1 |
-
{"mean_reward":
|
|
|
1 |
+
{"mean_reward": 274.958423, "std_reward": 15.466405560474827, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2022-05-13T20:47:02.517261"}
|