The key is a while loop on the mean_reward variable when evaluating your agent🥰📚
Browse files- README.md +1 -1
- config.json +1 -1
- ppo-LunarLander-v2.zip +2 -2
- ppo-LunarLander-v2/data +20 -20
- ppo-LunarLander-v2/policy.optimizer.pth +1 -1
- ppo-LunarLander-v2/policy.pth +1 -1
- replay.mp4 +0 -0
- results.json +1 -1
README.md
CHANGED
@@ -16,7 +16,7 @@ model-index:
|
|
16 |
type: LunarLander-v2
|
17 |
metrics:
|
18 |
- type: mean_reward
|
19 |
-
value:
|
20 |
name: mean_reward
|
21 |
verified: false
|
22 |
---
|
|
|
16 |
type: LunarLander-v2
|
17 |
metrics:
|
18 |
- type: mean_reward
|
19 |
+
value: 268.89 +/- 30.99
|
20 |
name: mean_reward
|
21 |
verified: false
|
22 |
---
|
config.json
CHANGED
@@ -1 +1 @@
|
|
1 |
-
{"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7fef12b74160>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7fef12b741f0>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7fef12b74280>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7fef12b74310>", "_build": "<function ActorCriticPolicy._build at 0x7fef12b743a0>", "forward": "<function ActorCriticPolicy.forward at 0x7fef12b74430>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x7fef12b744c0>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7fef12b74550>", "_predict": "<function ActorCriticPolicy._predict at 0x7fef12b745e0>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7fef12b74670>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7fef12b74700>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7fef12b74790>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7fef12b67300>"}, "verbose": 1, "policy_kwargs": {}, "num_timesteps": 1245184, "_total_timesteps": 1234567, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1686522094150615504, "learning_rate": 0.0003, "tensorboard_log": null, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAOZXQj2pcSK8FHNIvMnDXTweFI+9Rs85PQAAgD8AAIA/jXKnPY+bNbyD+O671HrCPBBVnb2+3p09AACAPwAAgD+1sKm+9F6cP95iu766m+q+H8zOvo15Eb0AAAAAAAAAAICkSD21ZbU/yj55PnKXdb5U7ks9gNc6PQAAAAAAAAAAzXEdPQpASbtOQHg7X6t/PIqMgry4RF09AACAPwAAgD+mWic+CO6XP9ipxj5Z9O++/BGMPi8Yrz0AAAAAAAAAAECKvT1BNfA9CCNHvv9pXr4Sn6c8dw2kvAAAAAAAAAAAaqCZvmeh7T69aco+EElovhSwML4tF20+AAAAAAAAAADN+Dg886o1P+KbPbzOkKy+ThGLO2Iwjb0AAAAAAAAAANqLiD24Zpe5DyWTO3dIHzVBA1C7puexugAAgD8AAAAAc+slPjQyXj92TzU+1WXjvstSVz5qKGG8AAAAAAAAAAAAaPA8pGlQu6+MiL2KS4s8uPF8PPDIb70AAIA/AACAPzMRG7wp/9U+PaC0PdcYor7Mksw70xH5PQAAAAAAAAAAlhhuvrItRj8sGjY+d6fJvmz0u77o6VA+AAAAAAAAAAAzj1U9hSMnPo6aI77vHHu+4xY4vXOuID0AAAAAAAAAAApWij4B+5Q/EpybPjSgEL+oLbI+Tc/KPAAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.008599776277836702, "_stats_window_size": 100, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVCgwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQHIuPSlWOp+MAWyUTQQBjAF0lEdAlXByLAHminV9lChoBkdAbuxgMMI/q2gHTQ4BaAhHQJVwoI/qxC91fZQoaAZHQHK9Lb+Lm6poB00NAWgIR0CVcM+d9UjtdX2UKGgGR0BzVIaCL/CJaAdL52gIR0CVcNVS4vvjdX2UKGgGR0Bwc5kauOjqaAdL9GgIR0CVceVclgMMdX2UKGgGR0BxKkr08NhFaAdNDwFoCEdAlXJAxJul43V9lChoBkdAbeyjoIOYpmgHS+xoCEdAlXJifpUxVXV9lChoBkdAcoyfvnbItGgHTSABaAhHQJVy4YGdI5J1fZQoaAZHQHLh20u14PhoB0v3aAhHQJVzxuFYdQx1fZQoaAZHQHHqDURWcSZoB0vkaAhHQJV1WCL/CIl1fZQoaAZHQHEyznNgSe1oB0vraAhHQJV1iGO+7Dl1fZQoaAZHQEBCahpQDV9oB0u9aAhHQJV1rHDJlrd1fZQoaAZHQHJE3PE87p5oB0vvaAhHQJV14LhJiAl1fZQoaAZHQGK+aJAMUh5oB03oA2gIR0CVdrccENe/dX2UKGgGR0BtGWA5Jbt7aAdL6WgIR0CVdui9Zid8dX2UKGgGR0BwnDyLAHmjaAdL7WgIR0CVd1XAuZkTdX2UKGgGR0BxVvd0q6OHaAdL9WgIR0CVd2IDYAbRdX2UKGgGR0BwtQsRQJokaAdNEAFoCEdAlXfD0163RXV9lChoBkdAcGhNb1RLsmgHTRgBaAhHQJV4mDmKZUl1fZQoaAZHQHHimE0zj3poB00gAWgIR0CVePES/TLGdX2UKGgGR0BzmkpjMFEBaAdL8mgIR0CVeT2OQyRCdX2UKGgGR0BxTc9SuQp4aAdL+WgIR0CVeU8+zMRpdX2UKGgGR0Bwav+6y0KJaAdNCgFoCEdAlXlnkxREW3V9lChoBkdAc2BJRwZOz2gHS+9oCEdAlXme9Jz1b3V9lChoBkdAcEVo4dZJTWgHS+loCEdAlXoxqwhW53V9lChoBkdALe0+C9RJmWgHS9FoCEdAlXs3mV7hN3V9lChoBkdAcX8lar3j/GgHS/xoCEdAlXw9du5z53V9lChoBkdAcH5QlruYyGgHS+xoCEdAlXxDrZ8KHHV9lChoBkdAb2nVd5Y5k2gHS/JoCEdAlX1mA08/2XV9lChoBkdAcC2oZAIIGGgHTSMBaAhHQJV9jeIl+mZ1fZQoaAZHQHF//sVtXPtoB00BAWgIR0CVfaNjbzshdX2UKGgGR0ByG/mNipeeaAdL7WgIR0CVfb+jdpIudX2UKGgGR0ByFQGMXJo1aAdL4WgIR0CVfdVW0Z3tdX2UKGgGR0BwoW4kNWluaAdNAwFoCEdAlX5CPQv6CXV9lChoBkdAcoeT987ZF2gHS99oCEdAlX6UJng5znV9lChoBkdAcwVm7rcCYGgHS/loCEdAlX+FXq7iAHV9lChoBkdAcvhvUSZjQWgHS/VoCEdAlX/TxXnyNHV9lChoBkdAcPbhb4agmWgHTQEBaAhHQJWAFSNwR5F1fZQoaAZHQHNuDURWcSZoB0vzaAhHQJWUNJvo/zJ1fZQoaAZHQHEbymqHXVdoB00RAWgIR0CVlF+xGDtgdX2UKGgGR0Byi/kkrwvyaAdNNwFoCEdAlZWdxZMcqHV9lChoBkdAcGDz5oGpuWgHS+1oCEdAlZdTtb9qDnV9lChoBkdAcM0II4VARmgHS/JoCEdAlZedWp6yB3V9lChoBkdAcPVhJiAlOWgHTSMBaAhHQJWYTkS26TZ1fZQoaAZHQHD0++ZgG8poB0vkaAhHQJWYtcMVk+Z1fZQoaAZHQHC3fZh8YyhoB0vjaAhHQJWY6HgxagV1fZQoaAZHQHGiH2VVxS5oB0vgaAhHQJWZE/keZG91fZQoaAZHQHDtD9jwx35oB00IAWgIR0CVmiEiMYMwdX2UKGgGR0Bx7k6RyOrAaAdL9mgIR0CVmjIuXeFddX2UKGgGR0BunvOQhfShaAdNBQFoCEdAlZsIvWYnfHV9lChoBkdAb8Y/3WWhRWgHTTYBaAhHQJWbQywfQrt1fZQoaAZHQG/nMyJsO5JoB0v1aAhHQJWbhj4Hoox1fZQoaAZHQG2hWgFotcxoB00GAWgIR0CVnImJWNm2dX2UKGgGR0BxCALE1l5GaAdNFAFoCEdAlZypYPoV23V9lChoBkdAcaQWFN+LFWgHS/doCEdAlZznkLhJiHV9lChoBkdAcsW8uzyBkWgHTRoBaAhHQJWd61SflIV1fZQoaAZHQHBa9rTH80loB0v9aAhHQJWd6RZEDyR1fZQoaAZHQG2O33Hq/udoB0v9aAhHQJWe8JJGvwF1fZQoaAZHQHJZGtITXatoB0vqaAhHQJWe/kNnXd11fZQoaAZHQHGL8xKxs2xoB0vnaAhHQJWfdoRIz311fZQoaAZHQHJo9gSeyzJoB00dAWgIR0CVn/pGFzuGdX2UKGgGR0BxeU9s7+1jaAdL/2gIR0CVoAgzP8htdX2UKGgGR0Bwp6wTufEoaAdL7WgIR0CVoKrOZ9eAdX2UKGgGR0BzKGoLofSyaAdNAgFoCEdAlaFMawUxmHV9lChoBkdAciylfqoqC2gHS/FoCEdAlaGovBacJHV9lChoBkdAb3J3Cbc452gHS+toCEdAlaIH6/IsAnV9lChoBkdAcZfP6KtPpWgHS/xoCEdAlaI2uX/o7nV9lChoBkdANxIRVZLZjGgHS6BoCEdAlaOHCCSRsHV9lChoBkdAbZzZIQOFxmgHS/loCEdAlaOF81Gb1HV9lChoBkdAcIupKBd2PmgHS/toCEdAlaO05IYm9nV9lChoBkdAcJ2N83Mpw2gHS+doCEdAlaSQk9lmOHV9lChoBkdAcsCVO9FnZmgHTRUBaAhHQJWkxe9i+cp1fZQoaAZHQG3jiZWq95BoB0v+aAhHQJWlMWO6unx1fZQoaAZHQHLvAgLZzxRoB03CAWgIR0CVpXOObRWtdX2UKGgGR0BxJiRxLkCFaAdL+GgIR0CVpfrlvIfbdX2UKGgGR0ByuiWSlnAZaAdL8WgIR0CVpssBQvYfdX2UKGgGR0Bw5Kh4+r2haAdNEQFoCEdAlae+10DEFXV9lChoBkdAcMeRZlnRLWgHS/doCEdAlahejVQQ+XV9lChoBkdAcQwjUutfX2gHS+1oCEdAlahwi7kGRnV9lChoBkdAcaJtEG7jDWgHTQcBaAhHQJWpvWz4UN91fZQoaAZHQHC1YjB2wFFoB0vhaAhHQJWqMgDA8CB1fZQoaAZHQHE72sV+I/JoB0vhaAhHQJWqMJRfnfV1fZQoaAZHQHMXCM98qnZoB01PAWgIR0CVqotGNJe3dX2UKGgGR0BzGMm/nGKiaAdNJAFoCEdAlarn9zfaYnV9lChoBkdAb5j29tdiUmgHS/toCEdAlas2R7qptXV9lChoBkdAcm1Kb8WKuWgHTQwBaAhHQJWs0Of/WDp1fZQoaAZHQHBmXtWuHN5oB00WAWgIR0CVrObdJrckdX2UKGgGR0BwEVZwGW2PaAdNBAFoCEdAla1TtG/etXV9lChoBkdAchKSX+l0o2gHS/toCEdAla2ozBRAKXV9lChoBkdAcJQ+Q2dd3WgHTTwBaAhHQJWuu36Q/5d1fZQoaAZHQHG440ALiMpoB00CAWgIR0CVrs2+wkgPdX2UKGgGR0BygSs5n13/aAdL+2gIR0CVsDRoh6jWdX2UKGgGR0Byba+QEIPcaAdNCgFoCEdAlbCWoNutOnV9lChoBkdAcTh6sQumJmgHTTIBaAhHQJWxNKxs2vV1fZQoaAZHQHFzk+9rXUZoB0vraAhHQJWxncL0Bfd1fZQoaAZHQHDxlMM7U5NoB00BAWgIR0CVsfNXYDkmdX2UKGgGR0BxZbKfWcz7aAdNAwFoCEdAlbIASWZ7X3V9lChoBkdAcGKgam4y5GgHTRABaAhHQJWx/1h9b5d1fZQoaAZHQHHMc50bLlpoB0v/aAhHQJWyggfU4Jh1fZQoaAZHQHKXl0HQhOhoB00DAWgIR0CVsuQHzH0cdWUu"}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 304, "observation_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVcAIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWCAAAAAAAAAABAQEBAQEBAZRoB4wCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoECiWCAAAAAAAAAABAQEBAQEBAZRoFEsIhZRoGHSUUpSMBl9zaGFwZZRLCIWUjANsb3eUaBAoliAAAAAAAAAAAAC0wgAAtMIAAKDAAACgwNsPScAAAKDAAAAAgAAAAICUaApLCIWUaBh0lFKUjARoaWdolGgQKJYgAAAAAAAAAAAAtEIAALRCAACgQAAAoEDbD0lAAACgQAAAgD8AAIA/lGgKSwiFlGgYdJRSlIwIbG93X3JlcHKUjFtbLTkwLiAgICAgICAgLTkwLiAgICAgICAgIC01LiAgICAgICAgIC01LiAgICAgICAgIC0zLjE0MTU5MjcgIC01LgogIC0wLiAgICAgICAgIC0wLiAgICAgICBdlIwJaGlnaF9yZXBylIxTWzkwLiAgICAgICAgOTAuICAgICAgICAgNS4gICAgICAgICA1LiAgICAgICAgIDMuMTQxNTkyNyAgNS4KICAxLiAgICAgICAgIDEuICAgICAgIF2UjApfbnBfcmFuZG9tlE51Yi4=", "dtype": "float32", "bounded_below": "[ True True True True True True True True]", "bounded_above": "[ True True True True True True True True]", "_shape": [8], "low": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "low_repr": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high_repr": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "_np_random": null}, "action_space": {":type:": "<class 'gymnasium.spaces.discrete.Discrete'>", ":serialized:": "gAWV1QAAAAAAAACMGWd5bW5hc2l1bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIBAAAAAAAAACUhpRSlIwFc3RhcnSUaAhoDkMIAAAAAAAAAACUhpRSlIwGX3NoYXBllCloCmgOjApfbnBfcmFuZG9tlE51Yi4=", "n": "4", "start": "0", "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 16, "n_steps": 1024, "gamma": 0.999, "gae_lambda": 0.98, "ent_coef": 0.01, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 4, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz/JmZmZmZmahZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz8zqSowVTJhhZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "system_info": {"OS": "Linux-5.15.107+-x86_64-with-glibc2.31 # 1 SMP Sat Apr 29 09:15:28 UTC 2023", "Python": "3.10.12", "Stable-Baselines3": "2.0.0a5", "PyTorch": "2.0.1+cu118", "GPU Enabled": "True", "Numpy": "1.22.4", "Cloudpickle": "2.2.1", "Gymnasium": "0.28.1", "OpenAI Gym": "0.25.2"}}
|
|
|
1 |
+
{"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7fcb7d180e50>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7fcb7d180ee0>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7fcb7d180f70>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7fcb7d181000>", "_build": "<function ActorCriticPolicy._build at 0x7fcb7d181090>", "forward": "<function ActorCriticPolicy.forward at 0x7fcb7d181120>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x7fcb7d1811b0>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7fcb7d181240>", "_predict": "<function ActorCriticPolicy._predict at 0x7fcb7d1812d0>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7fcb7d181360>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7fcb7d1813f0>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7fcb7d181480>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7fcb7d1761c0>"}, "verbose": 1, "policy_kwargs": {}, "num_timesteps": 1572864, "_total_timesteps": 1570000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1686582390307425891, "learning_rate": 0.0003, "tensorboard_log": null, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAL0hdr7TPOY+bTXtPmeMvr5NfZ6+1l6QPgAAAAAAAAAA5h3GvW2d2z4FbhI+7uGavhFnH7ze3yE9AAAAAAAAAACzqSa98FSSP/rI2b345AC/FwvZvZ7EhroAAAAAAAAAAI0zHr4NWoE/sA4mvW0b5L52mWK+WpUEPgAAAAAAAAAA82KxvYUzork586O6900Vt6ia57huw8A5AAAAAAAAgD/NebW9w7F3uojD1rqGicG1adW1ulpO+zkAAAAAAACAP/MR/b0hgJI/Oswavy7hIr+yJ9y97eGYvgAAAAAAAAAAAIEJPbAWZz/WBcw96z63vlgvjTxv0Di7AAAAAAAAAACzrC+9BOm0P7tDWb5hqmK+9wVxvY0OIL4AAAAAAAAAAO1HCT4mVZ0/Znh8PkVVCr8TydA97hrNPQAAAAAAAAAAzVG3vNIWxbtat9m70ESUPCeqIr2tWno9AACAPwAAgD+m1cG9NF+JPdEbsb1/wki+j9aNvc05+jwAAAAAAAAAALPY2T1qeRs+MgqMvgzzJL4MLSu9geScvQAAAAAAAAAAszh1va6vlLre6gu3j3wwsuVDMzuS0iA2AAAAAAAAgD/6ZWU+eS9LPyHJJD42QNW+eCxgPmbsproAAAAAAAAAADOLtb32sBy61M28PE9FmzQdBoA7RDOWMwAAAAAAAIA/lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.0018242038216560452, "_stats_window_size": 100, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVEgwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQHI/qvmozeqMAWyUS+eMAXSUR0CXxOR64UeudX2UKGgGR0BxXE5xR2r5aAdNDwFoCEdAl8TknogV5HV9lChoBkdAcW7VjqfOEGgHS/JoCEdAl8WDRhMJyHV9lChoBkdAcO3Qd0aIe2gHTRMBaAhHQJfF25nUUfx1fZQoaAZHQHGpnUhFEzBoB0v8aAhHQJfGEN/e+Eh1fZQoaAZHQHAdyB9Tgl5oB0v0aAhHQJfG6cCo0hx1fZQoaAZHQHGG5Mg2ZRdoB00IAWgIR0CXxwY6nzg/dX2UKGgGR0BzipZvDP4VaAdL92gIR0CXx26xxDLKdX2UKGgGR0BxTd0MgEEDaAdL8WgIR0CXx+PpIMBqdX2UKGgGR0BuqmK64Ds/aAdNKAFoCEdAl8hRtDUmUnV9lChoBkdAcA+KyfL9uWgHTQ0BaAhHQJfIxawD/2l1fZQoaAZHQHG5gNkOI69oB0v6aAhHQJfI5kH2RJV1fZQoaAZHQHAa8U/OdG1oB0vsaAhHQJfK5mapgkV1fZQoaAZHQHDU6By0a61oB0v4aAhHQJfLXAM2FWZ1fZQoaAZHQHB0brTpgThoB00TAWgIR0CXy1v7WNFSdX2UKGgGR0Bxc6CuloDgaAdL9GgIR0CXy2bjcVQAdX2UKGgGR0BKNlUADJU6aAdLymgIR0CXy3dYGMXKdX2UKGgGR0BzMOltTDO1aAdL/mgIR0CXzDD2JzkqdX2UKGgGR0Bxt3Ye1a4daAdNFwFoCEdAl8w/b48EFHV9lChoBkdAbWGWP91loWgHS/VoCEdAl8xOn62v0XV9lChoBkdAYxBtygf2b2gHTegDaAhHQJfMVU+9rXV1fZQoaAZHQHDgGO+7Dl5oB0v3aAhHQJfNYLv1DjR1fZQoaAZHQFQFzzVc2R9oB0vcaAhHQJfNiYIBzWB1fZQoaAZHQHGzdT1kDp1oB00DAWgIR0CXzZMINVindX2UKGgGR0BwRFK7I1cdaAdL6mgIR0CXzje05U97dX2UKGgGR0BwouC6H0sfaAdNFgFoCEdAl85y31BdEHV9lChoBkdAcvj1RtP56GgHTQ8BaAhHQJfPi4UeuFJ1fZQoaAZHQHCA9d/rjYJoB00UAWgIR0CXz88GLUCrdX2UKGgGR0ByUn9wWFewaAdL+2gIR0CX0Z6lLvkSdX2UKGgGR0BvegxN7BwdaAdNBAFoCEdAl9ITo2XLNnV9lChoBkdAcNxjMmnfmGgHTR4BaAhHQJfSSzhP0qZ1fZQoaAZHQHDxiFGoaUBoB00UAWgIR0CX0m+QU5+6dX2UKGgGR0BzN921UlzEaAdL9WgIR0CX0paL4vexdX2UKGgGR0Bwqh9iMHbAaAdL92gIR0CX0pakhzNmdX2UKGgGR0By3O1TisGQaAdL82gIR0CX0pu6mO2idX2UKGgGR0BNz9mg8KXwaAdLtmgIR0CX0xP6sQumdX2UKGgGR0Bxp7a/RE4OaAdNMgFoCEdAl9Mxc/t6X3V9lChoBkdAbmuF3Y+SsGgHTR0BaAhHQJfTjXBguyx1fZQoaAZHQHM8FfZ26kJoB0vraAhHQJfToiD/VAl1fZQoaAZHQG2vU/wAlv9oB0vzaAhHQJfTyG47Rv51fZQoaAZHQHKLAP3BYV9oB00CAWgIR0CX0/KaXrt3dX2UKGgGR0BzRCMAFPi2aAdL7WgIR0CX1Gw8W9DhdX2UKGgGR0Bx+LyZrpJPaAdNDQFoCEdAl+pa5sj3VXV9lChoBkdAcNX+36Q/5mgHTQoBaAhHQJfqrKT0QK91fZQoaAZHQG3RKQJXyRVoB0v2aAhHQJfsZl5GBnV1fZQoaAZHQDQl/y5I6KdoB0vIaAhHQJfskadc0Lt1fZQoaAZHQG0IIE0SAYpoB0vjaAhHQJfsuu2Zy+91fZQoaAZHQG7AHFglWwNoB0viaAhHQJfsudEsrd51fZQoaAZHQG2WtMoMKCxoB0v7aAhHQJftRTMqz7d1fZQoaAZHQHF6oAsCkoFoB00JAWgIR0CX7dMn7YTTdX2UKGgGR0Bu0aRISUTtaAdNGgFoCEdAl+4IkZ75VXV9lChoBkdAcKInlnyup2gHS/1oCEdAl+46Vt4zJ3V9lChoBkdAccWlANXo1WgHTSoBaAhHQJfuRGwzLwF1fZQoaAZHQHJYpooNNJxoB0v5aAhHQJfugfNiYsx1fZQoaAZHQHH+vCEYfnxoB0vlaAhHQJfvAoCuEEl1fZQoaAZHQHD1xWcSXdFoB00OAWgIR0CX7yzuWrwOdX2UKGgGR0BxGKR6nivQaAdNIAFoCEdAl+9ogmqo63V9lChoBkdAcwdxxT850mgHTR0BaAhHQJfvpPBSDRN1fZQoaAZHQHCjmQ0XP7hoB0vhaAhHQJfwjgP3BYV1fZQoaAZHQG2O1uivgWJoB0v4aAhHQJfxR17pmmN1fZQoaAZHQHAGm7voePtoB0vuaAhHQJfyLb0voNd1fZQoaAZHQE2QcvugHu9oB0vCaAhHQJfygtSQ5m11fZQoaAZHQHB+gSzw+dNoB0v8aAhHQJfy3DCP6sR1fZQoaAZHQG5PiJ40Mw1oB00HAWgIR0CX8wUmD15CdX2UKGgGR0BxZBE8aGYbaAdNBAFoCEdAl/MV3hXKbXV9lChoBkdAcpRhgE2YOWgHTQkBaAhHQJf14sbvPTp1fZQoaAZHQG4Ropx3mmtoB0vzaAhHQJf2LQmeDnN1fZQoaAZHQHK//VNHpbFoB008AWgIR0CX9mWuHN5ddX2UKGgGR0BxXX3Zf2K3aAdNMgFoCEdAl/Z3/DLr5nV9lChoBkdAcKckI5YHPmgHTRYBaAhHQJf2lyzXz191fZQoaAZHQHCJGszVMEloB00iAWgIR0CX90WWQfZFdX2UKGgGR0BwLysLfDUFaAdNAwFoCEdAl/gGoNutOnV9lChoBkdAcSYkgwGnoGgHS/ZoCEdAl/iGF8G9pXV9lChoBkdAcd0IFNcnmmgHTaIBaAhHQJf5Aiml67d1fZQoaAZHQG/g7YkE9uBoB0vuaAhHQJf5nhESdvt1fZQoaAZHQHMhU0rK/21oB0vzaAhHQJf6G2KEWZZ1fZQoaAZHQHEyEnTiKixoB00aAWgIR0CX+oT8pCrtdX2UKGgGR0BzPbj3mFJyaAdNHQFoCEdAl/uG4d6syXV9lChoBkdAcratCzC1qmgHTTcBaAhHQJf8cDdP+GZ1fZQoaAZHQEaOLNOdoWZoB0vkaAhHQJf9OcBltj11fZQoaAZHQHClnpKSPlxoB0vjaAhHQJf9QyckMTh1fZQoaAZHQHPX3Ilt0mtoB0v3aAhHQJf+ApKBd2R1fZQoaAZHQHETRpL26CloB00SAWgIR0CX/jf9gnc+dX2UKGgGR0BwmclhPTG6aAdNJAFoCEdAl/79+9allHV9lChoBkdAbuROqvNeMWgHTV0CaAhHQJf/IWl/H5t1fZQoaAZHQHH1CUgSvkloB00QAWgIR0CX/2msNlRQdX2UKGgGR0Bw1XAN5MURaAdL+GgIR0CX/29uP3i8dX2UKGgGR0Bt0gFgUlAvaAdL72gIR0CYAA9XtBv8dX2UKGgGR0BveY2CNCJGaAdL82gIR0CYAL1RLsa9dX2UKGgGR0ByjXBfrrxBaAdNUQFoCEdAmAJ1b/wRXnV9lChoBkdAcox0b961LWgHTSwBaAhHQJgDFL7Gecx1fZQoaAZHQHB0V0YCQtBoB0v0aAhHQJgEqjQAuI11fZQoaAZHQHAKzGLk0aZoB00OAWgIR0CYBawB5ooNdX2UKGgGR0Bwy9RAKOT8aAdL/mgIR0CYBjkvsZ5zdX2UKGgGR0Bv1HQnhKlIaAdNdwFoCEdAmAZMIAwPAnV9lChoBkdAcgLbx3FDOWgHTTsBaAhHQJgGXkMkQf91fZQoaAZHQHBZ/WhAWzpoB00TAWgIR0CYBq5U96kZdX2UKGgGR0Bw6c6o2n89aAdNCwFoCEdAmAd0yckMTnV9lChoBkdAcXO/b0voNmgHS+poCEdAmAezpcHGCXV9lChoBkdAcFTEBsANomgHTQ8BaAhHQJgHu7TUiIN1ZS4="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 384, "observation_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVcAIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWCAAAAAAAAAABAQEBAQEBAZRoB4wCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoECiWCAAAAAAAAAABAQEBAQEBAZRoFEsIhZRoGHSUUpSMBl9zaGFwZZRLCIWUjANsb3eUaBAoliAAAAAAAAAAAAC0wgAAtMIAAKDAAACgwNsPScAAAKDAAAAAgAAAAICUaApLCIWUaBh0lFKUjARoaWdolGgQKJYgAAAAAAAAAAAAtEIAALRCAACgQAAAoEDbD0lAAACgQAAAgD8AAIA/lGgKSwiFlGgYdJRSlIwIbG93X3JlcHKUjFtbLTkwLiAgICAgICAgLTkwLiAgICAgICAgIC01LiAgICAgICAgIC01LiAgICAgICAgIC0zLjE0MTU5MjcgIC01LgogIC0wLiAgICAgICAgIC0wLiAgICAgICBdlIwJaGlnaF9yZXBylIxTWzkwLiAgICAgICAgOTAuICAgICAgICAgNS4gICAgICAgICA1LiAgICAgICAgIDMuMTQxNTkyNyAgNS4KICAxLiAgICAgICAgIDEuICAgICAgIF2UjApfbnBfcmFuZG9tlE51Yi4=", "dtype": "float32", "bounded_below": "[ True True True True True True True True]", "bounded_above": "[ True True True True True True True True]", "_shape": [8], "low": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "low_repr": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high_repr": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "_np_random": null}, "action_space": {":type:": "<class 'gymnasium.spaces.discrete.Discrete'>", ":serialized:": "gAWV1QAAAAAAAACMGWd5bW5hc2l1bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIBAAAAAAAAACUhpRSlIwFc3RhcnSUaAhoDkMIAAAAAAAAAACUhpRSlIwGX3NoYXBllCloCmgOjApfbnBfcmFuZG9tlE51Yi4=", "n": "4", "start": "0", "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 16, "n_steps": 1024, "gamma": 0.999, "gae_lambda": 0.98, "ent_coef": 0.01, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 4, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz/JmZmZmZmahZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz8zqSowVTJhhZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "system_info": {"OS": "Linux-5.15.107+-x86_64-with-glibc2.31 # 1 SMP Sat Apr 29 09:15:28 UTC 2023", "Python": "3.10.12", "Stable-Baselines3": "2.0.0a5", "PyTorch": "2.0.1+cu118", "GPU Enabled": "True", "Numpy": "1.22.4", "Cloudpickle": "2.2.1", "Gymnasium": "0.28.1", "OpenAI Gym": "0.25.2"}}
|
ppo-LunarLander-v2.zip
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ffd960d8545d0496b90ad7037b468fddf21d77c1a4ac9b61aab489ae9289e0d2
|
3 |
+
size 146692
|
ppo-LunarLander-v2/data
CHANGED
@@ -4,34 +4,34 @@
|
|
4 |
":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
|
5 |
"__module__": "stable_baselines3.common.policies",
|
6 |
"__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
|
7 |
-
"__init__": "<function ActorCriticPolicy.__init__ at
|
8 |
-
"_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at
|
9 |
-
"reset_noise": "<function ActorCriticPolicy.reset_noise at
|
10 |
-
"_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at
|
11 |
-
"_build": "<function ActorCriticPolicy._build at
|
12 |
-
"forward": "<function ActorCriticPolicy.forward at
|
13 |
-
"extract_features": "<function ActorCriticPolicy.extract_features at
|
14 |
-
"_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at
|
15 |
-
"_predict": "<function ActorCriticPolicy._predict at
|
16 |
-
"evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at
|
17 |
-
"get_distribution": "<function ActorCriticPolicy.get_distribution at
|
18 |
-
"predict_values": "<function ActorCriticPolicy.predict_values at
|
19 |
"__abstractmethods__": "frozenset()",
|
20 |
-
"_abc_impl": "<_abc._abc_data object at
|
21 |
},
|
22 |
"verbose": 1,
|
23 |
"policy_kwargs": {},
|
24 |
-
"num_timesteps":
|
25 |
-
"_total_timesteps":
|
26 |
"_num_timesteps_at_start": 0,
|
27 |
"seed": null,
|
28 |
"action_noise": null,
|
29 |
-
"start_time":
|
30 |
"learning_rate": 0.0003,
|
31 |
"tensorboard_log": null,
|
32 |
"_last_obs": {
|
33 |
":type:": "<class 'numpy.ndarray'>",
|
34 |
-
":serialized:": "
|
35 |
},
|
36 |
"_last_episode_starts": {
|
37 |
":type:": "<class 'numpy.ndarray'>",
|
@@ -41,17 +41,17 @@
|
|
41 |
"_episode_num": 0,
|
42 |
"use_sde": false,
|
43 |
"sde_sample_freq": -1,
|
44 |
-
"_current_progress_remaining": -0.
|
45 |
"_stats_window_size": 100,
|
46 |
"ep_info_buffer": {
|
47 |
":type:": "<class 'collections.deque'>",
|
48 |
-
":serialized:": "
|
49 |
},
|
50 |
"ep_success_buffer": {
|
51 |
":type:": "<class 'collections.deque'>",
|
52 |
":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
|
53 |
},
|
54 |
-
"_n_updates":
|
55 |
"observation_space": {
|
56 |
":type:": "<class 'gymnasium.spaces.box.Box'>",
|
57 |
":serialized:": "gAWVcAIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWCAAAAAAAAAABAQEBAQEBAZRoB4wCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoECiWCAAAAAAAAAABAQEBAQEBAZRoFEsIhZRoGHSUUpSMBl9zaGFwZZRLCIWUjANsb3eUaBAoliAAAAAAAAAAAAC0wgAAtMIAAKDAAACgwNsPScAAAKDAAAAAgAAAAICUaApLCIWUaBh0lFKUjARoaWdolGgQKJYgAAAAAAAAAAAAtEIAALRCAACgQAAAoEDbD0lAAACgQAAAgD8AAIA/lGgKSwiFlGgYdJRSlIwIbG93X3JlcHKUjFtbLTkwLiAgICAgICAgLTkwLiAgICAgICAgIC01LiAgICAgICAgIC01LiAgICAgICAgIC0zLjE0MTU5MjcgIC01LgogIC0wLiAgICAgICAgIC0wLiAgICAgICBdlIwJaGlnaF9yZXBylIxTWzkwLiAgICAgICAgOTAuICAgICAgICAgNS4gICAgICAgICA1LiAgICAgICAgIDMuMTQxNTkyNyAgNS4KICAxLiAgICAgICAgIDEuICAgICAgIF2UjApfbnBfcmFuZG9tlE51Yi4=",
|
|
|
4 |
":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
|
5 |
"__module__": "stable_baselines3.common.policies",
|
6 |
"__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
|
7 |
+
"__init__": "<function ActorCriticPolicy.__init__ at 0x7fcb7d180e50>",
|
8 |
+
"_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7fcb7d180ee0>",
|
9 |
+
"reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7fcb7d180f70>",
|
10 |
+
"_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7fcb7d181000>",
|
11 |
+
"_build": "<function ActorCriticPolicy._build at 0x7fcb7d181090>",
|
12 |
+
"forward": "<function ActorCriticPolicy.forward at 0x7fcb7d181120>",
|
13 |
+
"extract_features": "<function ActorCriticPolicy.extract_features at 0x7fcb7d1811b0>",
|
14 |
+
"_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7fcb7d181240>",
|
15 |
+
"_predict": "<function ActorCriticPolicy._predict at 0x7fcb7d1812d0>",
|
16 |
+
"evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7fcb7d181360>",
|
17 |
+
"get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7fcb7d1813f0>",
|
18 |
+
"predict_values": "<function ActorCriticPolicy.predict_values at 0x7fcb7d181480>",
|
19 |
"__abstractmethods__": "frozenset()",
|
20 |
+
"_abc_impl": "<_abc._abc_data object at 0x7fcb7d1761c0>"
|
21 |
},
|
22 |
"verbose": 1,
|
23 |
"policy_kwargs": {},
|
24 |
+
"num_timesteps": 1572864,
|
25 |
+
"_total_timesteps": 1570000,
|
26 |
"_num_timesteps_at_start": 0,
|
27 |
"seed": null,
|
28 |
"action_noise": null,
|
29 |
+
"start_time": 1686582390307425891,
|
30 |
"learning_rate": 0.0003,
|
31 |
"tensorboard_log": null,
|
32 |
"_last_obs": {
|
33 |
":type:": "<class 'numpy.ndarray'>",
|
34 |
+
":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAAL0hdr7TPOY+bTXtPmeMvr5NfZ6+1l6QPgAAAAAAAAAA5h3GvW2d2z4FbhI+7uGavhFnH7ze3yE9AAAAAAAAAACzqSa98FSSP/rI2b345AC/FwvZvZ7EhroAAAAAAAAAAI0zHr4NWoE/sA4mvW0b5L52mWK+WpUEPgAAAAAAAAAA82KxvYUzork586O6900Vt6ia57huw8A5AAAAAAAAgD/NebW9w7F3uojD1rqGicG1adW1ulpO+zkAAAAAAACAP/MR/b0hgJI/Oswavy7hIr+yJ9y97eGYvgAAAAAAAAAAAIEJPbAWZz/WBcw96z63vlgvjTxv0Di7AAAAAAAAAACzrC+9BOm0P7tDWb5hqmK+9wVxvY0OIL4AAAAAAAAAAO1HCT4mVZ0/Znh8PkVVCr8TydA97hrNPQAAAAAAAAAAzVG3vNIWxbtat9m70ESUPCeqIr2tWno9AACAPwAAgD+m1cG9NF+JPdEbsb1/wki+j9aNvc05+jwAAAAAAAAAALPY2T1qeRs+MgqMvgzzJL4MLSu9geScvQAAAAAAAAAAszh1va6vlLre6gu3j3wwsuVDMzuS0iA2AAAAAAAAgD/6ZWU+eS9LPyHJJD42QNW+eCxgPmbsproAAAAAAAAAADOLtb32sBy61M28PE9FmzQdBoA7RDOWMwAAAAAAAIA/lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="
|
35 |
},
|
36 |
"_last_episode_starts": {
|
37 |
":type:": "<class 'numpy.ndarray'>",
|
|
|
41 |
"_episode_num": 0,
|
42 |
"use_sde": false,
|
43 |
"sde_sample_freq": -1,
|
44 |
+
"_current_progress_remaining": -0.0018242038216560452,
|
45 |
"_stats_window_size": 100,
|
46 |
"ep_info_buffer": {
|
47 |
":type:": "<class 'collections.deque'>",
|
48 |
+
":serialized:": "gAWVEgwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQHI/qvmozeqMAWyUS+eMAXSUR0CXxOR64UeudX2UKGgGR0BxXE5xR2r5aAdNDwFoCEdAl8TknogV5HV9lChoBkdAcW7VjqfOEGgHS/JoCEdAl8WDRhMJyHV9lChoBkdAcO3Qd0aIe2gHTRMBaAhHQJfF25nUUfx1fZQoaAZHQHGpnUhFEzBoB0v8aAhHQJfGEN/e+Eh1fZQoaAZHQHAdyB9Tgl5oB0v0aAhHQJfG6cCo0hx1fZQoaAZHQHGG5Mg2ZRdoB00IAWgIR0CXxwY6nzg/dX2UKGgGR0BzipZvDP4VaAdL92gIR0CXx26xxDLKdX2UKGgGR0BxTd0MgEEDaAdL8WgIR0CXx+PpIMBqdX2UKGgGR0BuqmK64Ds/aAdNKAFoCEdAl8hRtDUmUnV9lChoBkdAcA+KyfL9uWgHTQ0BaAhHQJfIxawD/2l1fZQoaAZHQHG5gNkOI69oB0v6aAhHQJfI5kH2RJV1fZQoaAZHQHAa8U/OdG1oB0vsaAhHQJfK5mapgkV1fZQoaAZHQHDU6By0a61oB0v4aAhHQJfLXAM2FWZ1fZQoaAZHQHB0brTpgThoB00TAWgIR0CXy1v7WNFSdX2UKGgGR0Bxc6CuloDgaAdL9GgIR0CXy2bjcVQAdX2UKGgGR0BKNlUADJU6aAdLymgIR0CXy3dYGMXKdX2UKGgGR0BzMOltTDO1aAdL/mgIR0CXzDD2JzkqdX2UKGgGR0Bxt3Ye1a4daAdNFwFoCEdAl8w/b48EFHV9lChoBkdAbWGWP91loWgHS/VoCEdAl8xOn62v0XV9lChoBkdAYxBtygf2b2gHTegDaAhHQJfMVU+9rXV1fZQoaAZHQHDgGO+7Dl5oB0v3aAhHQJfNYLv1DjR1fZQoaAZHQFQFzzVc2R9oB0vcaAhHQJfNiYIBzWB1fZQoaAZHQHGzdT1kDp1oB00DAWgIR0CXzZMINVindX2UKGgGR0BwRFK7I1cdaAdL6mgIR0CXzje05U97dX2UKGgGR0BwouC6H0sfaAdNFgFoCEdAl85y31BdEHV9lChoBkdAcvj1RtP56GgHTQ8BaAhHQJfPi4UeuFJ1fZQoaAZHQHCA9d/rjYJoB00UAWgIR0CXz88GLUCrdX2UKGgGR0ByUn9wWFewaAdL+2gIR0CX0Z6lLvkSdX2UKGgGR0BvegxN7BwdaAdNBAFoCEdAl9ITo2XLNnV9lChoBkdAcNxjMmnfmGgHTR4BaAhHQJfSSzhP0qZ1fZQoaAZHQHDxiFGoaUBoB00UAWgIR0CX0m+QU5+6dX2UKGgGR0BzN921UlzEaAdL9WgIR0CX0paL4vexdX2UKGgGR0Bwqh9iMHbAaAdL92gIR0CX0pakhzNmdX2UKGgGR0By3O1TisGQaAdL82gIR0CX0pu6mO2idX2UKGgGR0BNz9mg8KXwaAdLtmgIR0CX0xP6sQumdX2UKGgGR0Bxp7a/RE4OaAdNMgFoCEdAl9Mxc/t6X3V9lChoBkdAbmuF3Y+SsGgHTR0BaAhHQJfTjXBguyx1fZQoaAZHQHM8FfZ26kJoB0vraAhHQJfToiD/VAl1fZQoaAZHQG2vU/wAlv9oB0vzaAhHQJfTyG47Rv51fZQoaAZHQHKLAP3BYV9oB00CAWgIR0CX0/KaXrt3dX2UKGgGR0BzRCMAFPi2aAdL7WgIR0CX1Gw8W9DhdX2UKGgGR0Bx+LyZrpJPaAdNDQFoCEdAl+pa5sj3VXV9lChoBkdAcNX+36Q/5mgHTQoBaAhHQJfqrKT0QK91fZQoaAZHQG3RKQJXyRVoB0v2aAhHQJfsZl5GBnV1fZQoaAZHQDQl/y5I6KdoB0vIaAhHQJfskadc0Lt1fZQoaAZHQG0IIE0SAYpoB0vjaAhHQJfsuu2Zy+91fZQoaAZHQG7AHFglWwNoB0viaAhHQJfsudEsrd51fZQoaAZHQG2WtMoMKCxoB0v7aAhHQJftRTMqz7d1fZQoaAZHQHF6oAsCkoFoB00JAWgIR0CX7dMn7YTTdX2UKGgGR0Bu0aRISUTtaAdNGgFoCEdAl+4IkZ75VXV9lChoBkdAcKInlnyup2gHS/1oCEdAl+46Vt4zJ3V9lChoBkdAccWlANXo1WgHTSoBaAhHQJfuRGwzLwF1fZQoaAZHQHJYpooNNJxoB0v5aAhHQJfugfNiYsx1fZQoaAZHQHH+vCEYfnxoB0vlaAhHQJfvAoCuEEl1fZQoaAZHQHD1xWcSXdFoB00OAWgIR0CX7yzuWrwOdX2UKGgGR0BxGKR6nivQaAdNIAFoCEdAl+9ogmqo63V9lChoBkdAcwdxxT850mgHTR0BaAhHQJfvpPBSDRN1fZQoaAZHQHCjmQ0XP7hoB0vhaAhHQJfwjgP3BYV1fZQoaAZHQG2O1uivgWJoB0v4aAhHQJfxR17pmmN1fZQoaAZHQHAGm7voePtoB0vuaAhHQJfyLb0voNd1fZQoaAZHQE2QcvugHu9oB0vCaAhHQJfygtSQ5m11fZQoaAZHQHB+gSzw+dNoB0v8aAhHQJfy3DCP6sR1fZQoaAZHQG5PiJ40Mw1oB00HAWgIR0CX8wUmD15CdX2UKGgGR0BxZBE8aGYbaAdNBAFoCEdAl/MV3hXKbXV9lChoBkdAcpRhgE2YOWgHTQkBaAhHQJf14sbvPTp1fZQoaAZHQG4Ropx3mmtoB0vzaAhHQJf2LQmeDnN1fZQoaAZHQHK//VNHpbFoB008AWgIR0CX9mWuHN5ddX2UKGgGR0BxXX3Zf2K3aAdNMgFoCEdAl/Z3/DLr5nV9lChoBkdAcKckI5YHPmgHTRYBaAhHQJf2lyzXz191fZQoaAZHQHCJGszVMEloB00iAWgIR0CX90WWQfZFdX2UKGgGR0BwLysLfDUFaAdNAwFoCEdAl/gGoNutOnV9lChoBkdAcSYkgwGnoGgHS/ZoCEdAl/iGF8G9pXV9lChoBkdAcd0IFNcnmmgHTaIBaAhHQJf5Aiml67d1fZQoaAZHQG/g7YkE9uBoB0vuaAhHQJf5nhESdvt1fZQoaAZHQHMhU0rK/21oB0vzaAhHQJf6G2KEWZZ1fZQoaAZHQHEyEnTiKixoB00aAWgIR0CX+oT8pCrtdX2UKGgGR0BzPbj3mFJyaAdNHQFoCEdAl/uG4d6syXV9lChoBkdAcratCzC1qmgHTTcBaAhHQJf8cDdP+GZ1fZQoaAZHQEaOLNOdoWZoB0vkaAhHQJf9OcBltj11fZQoaAZHQHClnpKSPlxoB0vjaAhHQJf9QyckMTh1fZQoaAZHQHPX3Ilt0mtoB0v3aAhHQJf+ApKBd2R1fZQoaAZHQHETRpL26CloB00SAWgIR0CX/jf9gnc+dX2UKGgGR0BwmclhPTG6aAdNJAFoCEdAl/79+9allHV9lChoBkdAbuROqvNeMWgHTV0CaAhHQJf/IWl/H5t1fZQoaAZHQHH1CUgSvkloB00QAWgIR0CX/2msNlRQdX2UKGgGR0Bw1XAN5MURaAdL+GgIR0CX/29uP3i8dX2UKGgGR0Bt0gFgUlAvaAdL72gIR0CYAA9XtBv8dX2UKGgGR0BveY2CNCJGaAdL82gIR0CYAL1RLsa9dX2UKGgGR0ByjXBfrrxBaAdNUQFoCEdAmAJ1b/wRXnV9lChoBkdAcox0b961LWgHTSwBaAhHQJgDFL7Gecx1fZQoaAZHQHB0V0YCQtBoB0v0aAhHQJgEqjQAuI11fZQoaAZHQHAKzGLk0aZoB00OAWgIR0CYBawB5ooNdX2UKGgGR0Bwy9RAKOT8aAdL/mgIR0CYBjkvsZ5zdX2UKGgGR0Bv1HQnhKlIaAdNdwFoCEdAmAZMIAwPAnV9lChoBkdAcgLbx3FDOWgHTTsBaAhHQJgGXkMkQf91fZQoaAZHQHBZ/WhAWzpoB00TAWgIR0CYBq5U96kZdX2UKGgGR0Bw6c6o2n89aAdNCwFoCEdAmAd0yckMTnV9lChoBkdAcXO/b0voNmgHS+poCEdAmAezpcHGCXV9lChoBkdAcFTEBsANomgHTQ8BaAhHQJgHu7TUiIN1ZS4="
|
49 |
},
|
50 |
"ep_success_buffer": {
|
51 |
":type:": "<class 'collections.deque'>",
|
52 |
":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
|
53 |
},
|
54 |
+
"_n_updates": 384,
|
55 |
"observation_space": {
|
56 |
":type:": "<class 'gymnasium.spaces.box.Box'>",
|
57 |
":serialized:": "gAWVcAIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWCAAAAAAAAAABAQEBAQEBAZRoB4wCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoECiWCAAAAAAAAAABAQEBAQEBAZRoFEsIhZRoGHSUUpSMBl9zaGFwZZRLCIWUjANsb3eUaBAoliAAAAAAAAAAAAC0wgAAtMIAAKDAAACgwNsPScAAAKDAAAAAgAAAAICUaApLCIWUaBh0lFKUjARoaWdolGgQKJYgAAAAAAAAAAAAtEIAALRCAACgQAAAoEDbD0lAAACgQAAAgD8AAIA/lGgKSwiFlGgYdJRSlIwIbG93X3JlcHKUjFtbLTkwLiAgICAgICAgLTkwLiAgICAgICAgIC01LiAgICAgICAgIC01LiAgICAgICAgIC0zLjE0MTU5MjcgIC01LgogIC0wLiAgICAgICAgIC0wLiAgICAgICBdlIwJaGlnaF9yZXBylIxTWzkwLiAgICAgICAgOTAuICAgICAgICAgNS4gICAgICAgICA1LiAgICAgICAgIDMuMTQxNTkyNyAgNS4KICAxLiAgICAgICAgIDEuICAgICAgIF2UjApfbnBfcmFuZG9tlE51Yi4=",
|
ppo-LunarLander-v2/policy.optimizer.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 87929
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:87a44009d3ad50ce5bf4c3c45e18f25b5501700a7e7e7438734e67f7209e2e96
|
3 |
size 87929
|
ppo-LunarLander-v2/policy.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 43329
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:acf22106b514fa601dcde5587c5fcd912a184033b5cea39cf6e618aefe85d46a
|
3 |
size 43329
|
replay.mp4
CHANGED
Binary files a/replay.mp4 and b/replay.mp4 differ
|
|
results.json
CHANGED
@@ -1 +1 @@
|
|
1 |
-
{"mean_reward":
|
|
|
1 |
+
{"mean_reward": 268.89390700135795, "std_reward": 30.990567156284154, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2023-06-12T15:33:56.323331"}
|