ThomasSimonini HF staff commited on
Commit
bc9efd0
1 Parent(s): 83f2ee1

Initial commit

Browse files
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: PandaReachDense-v3
17
  metrics:
18
  - type: mean_reward
19
- value: -0.37 +/- 0.25
20
  name: mean_reward
21
  verified: false
22
  ---
 
16
  type: PandaReachDense-v3
17
  metrics:
18
  - type: mean_reward
19
+ value: -0.26 +/- 0.13
20
  name: mean_reward
21
  verified: false
22
  ---
a2c-PandaReachDense-v3.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:93baaec741a59670f36ed835418cabbafcb932b2c9143f0de2696567a4adf90b
3
- size 106713
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:86c9d87e13f4b4597b3f13c0ba70b17b5de1f61d4308e239c5da602ae9dcdfe3
3
+ size 106666
a2c-PandaReachDense-v3/data CHANGED
@@ -4,9 +4,9 @@
4
  ":serialized:": "gAWVRQAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMG011bHRpSW5wdXRBY3RvckNyaXRpY1BvbGljeZSTlC4=",
5
  "__module__": "stable_baselines3.common.policies",
6
  "__doc__": "\n MultiInputActorClass policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space (Tuple)\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Uses the CombinedExtractor\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
7
- "__init__": "<function MultiInputActorCriticPolicy.__init__ at 0x7ff82903b5b0>",
8
  "__abstractmethods__": "frozenset()",
9
- "_abc_impl": "<_abc._abc_data object at 0x7ff829040e40>"
10
  },
11
  "verbose": 1,
12
  "policy_kwargs": {
@@ -19,46 +19,46 @@
19
  "weight_decay": 0
20
  }
21
  },
22
- "num_timesteps": 87648,
23
  "_total_timesteps": 1000000,
24
  "_num_timesteps_at_start": 0,
25
  "seed": null,
26
  "action_noise": null,
27
- "start_time": 1683723069964750852,
28
  "learning_rate": 0.0007,
29
  "tensorboard_log": null,
30
  "_last_obs": {
31
  ":type:": "<class 'collections.OrderedDict'>",
32
- ":serialized:": "gAWVuwEAAAAAAACMC2NvbGxlY3Rpb25zlIwLT3JkZXJlZERpY3SUk5QpUpQojA1hY2hpZXZlZF9nb2FslIwSbnVtcHkuY29yZS5udW1lcmljlIwLX2Zyb21idWZmZXKUk5QoljAAAAAAAAAAzrRfusItLT8SETM/SSOovunWZj+yiqM+FG+OvpfbBz1iXs8+FG+OvpfbBz1iXs8+lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksESwOGlIwBQ5R0lFKUjAxkZXNpcmVkX2dvYWyUaAcoljAAAAAAAAAAoLzRPzqn1j+T8m4/o4iTP0GFlz87kXc/PihRP9MvWr/5+pm/n+50Pb0dpj/wLI6/lGgOSwRLA4aUaBJ0lFKUjAtvYnNlcnZhdGlvbpRoByiWYAAAAAAAAADOtF+6wi0tPxIRMz+zZfI+u32MP8NtID9JI6i+6dZmP7KKoz7o/cA/BZsBvI6PI78Ub46+l9sHPWJezz6oj1c9VKzDOb9EiT0Ub46+l9sHPWJezz6oj1c9VKzDOb9EiT2UaA5LBEsGhpRoEnSUUpR1Lg==",
33
- "achieved_goal": "[[-8.5337169e-04 6.7647946e-01 6.9947922e-01]\n [-3.2839420e-01 9.0171677e-01 3.1941754e-01]\n [-2.7819121e-01 3.3168402e-02 4.0501696e-01]\n [-2.7819121e-01 3.3168402e-02 4.0501696e-01]]",
34
- "desired_goal": "[[ 1.6385689 1.6769783 0.9333889 ]\n [ 1.1526073 1.1837541 0.9670598 ]\n [ 0.8170203 -0.85229224 -1.2029716 ]\n [ 0.05979788 1.2977825 -1.1107464 ]]",
35
- "observation": "[[-8.5337169e-04 6.7647946e-01 6.9947922e-01 4.7343215e-01\n 1.0975870e+00 6.2667483e-01]\n [-3.2839420e-01 9.0171677e-01 3.1941754e-01 1.5077486e+00\n -7.9104947e-03 -6.3890922e-01]\n [-2.7819121e-01 3.3168402e-02 4.0501696e-01 5.2627236e-02\n 3.7321693e-04 6.7025654e-02]\n [-2.7819121e-01 3.3168402e-02 4.0501696e-01 5.2627236e-02\n 3.7321693e-04 6.7025654e-02]]"
36
  },
37
  "_last_episode_starts": {
38
  ":type:": "<class 'numpy.ndarray'>",
39
- ":serialized:": "gAWVdwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYEAAAAAAAAAAAAAQGUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSwSFlIwBQ5R0lFKULg=="
40
  },
41
  "_last_original_obs": {
42
  ":type:": "<class 'collections.OrderedDict'>",
43
- ":serialized:": "gAWVuwEAAAAAAACMC2NvbGxlY3Rpb25zlIwLT3JkZXJlZERpY3SUk5QpUpQojA1hY2hpZXZlZF9nb2FslIwSbnVtcHkuY29yZS5udW1lcmljlIwLX2Zyb21idWZmZXKUk5QoljAAAAAAAAAA6nIdPRlsGqxDI0o+6nIdPRlsGqxDI0o+6nIdPRlsGqxDI0o+6nIdPRlsGqxDI0o+lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksESwOGlIwBQ5R0lFKUjAxkZXNpcmVkX2dvYWyUaAcoljAAAAAAAAAAqFS2vbK+rz3s32A+v7h6vLV2Qr1hT7o9v3iCvbrzDL7XI4k9smzivXp1h72Jbq49lGgOSwRLA4aUaBJ0lFKUjAtvYnNlcnZhdGlvbpRoByiWYAAAAAAAAADqch09GWwarEMjSj4AAAAAAAAAgAAAAADqch09GWwarEMjSj4AAAAAAAAAgAAAAADqch09GWwarEMjSj4AAAAAAAAAgAAAAADqch09GWwarEMjSj4AAAAAAAAAgAAAAACUaA5LBEsGhpRoEnSUUpR1Lg==",
44
  "achieved_goal": "[[ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]]",
45
- "desired_goal": "[[-0.08902866 0.08581294 0.2196042 ]\n [-0.01530284 -0.04747649 0.09097172]\n [-0.06370687 -0.1376485 0.06696289]\n [-0.11055888 -0.06614204 0.08517177]]",
46
  "observation": "[[ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]]"
47
  },
48
  "_episode_num": 0,
49
  "use_sde": false,
50
  "sde_sample_freq": -1,
51
- "_current_progress_remaining": 0.9123600000000001,
52
  "_stats_window_size": 100,
53
  "ep_info_buffer": {
54
  ":type:": "<class 'collections.deque'>",
55
- ":serialized:": "gAWV4AsAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHv+cPYFqzqr2MAWyUSwiMAXSUR0B0CYcT8HfNdX2UKGgGR7+emzjWCmMwaAdLAWgIR0B0CcUpNKywdX2UKGgGR7/ydI9TxXnyaAdLDGgIR0B0BXNPgvUSdX2UKGgGR7/plNtZV4oraAdLCGgIR0B0CExIre67dX2UKGgGR7+f4h2W6bvxaAdLAWgIR0B0CHXsgMc7dX2UKGgGR7/lmvnr6ciGaAdLCGgIR0B0DaUdJaq0dX2UKGgGR7/VUW2w3YL9aAdLBGgIR0B0CSbayrxRdX2UKGgGR7/TZB9kSVW0aAdLBGgIR0B0Dlf8dgfEdX2UKGgGR7/r9f9gnc+JaAdLC2gIR0B0C8WEbo8qdX2UKGgGR7+7gR9PUKAsaAdLAmgIR0B0CX0SRKYidX2UKGgGR7/pXokiUxEfaAdLCGgIR0B0BuxoqTbGdX2UKGgGR7+Y+B6KLsKLaAdLAWgIR0B0CakuYhMbdX2UKGgGR7+9ie/Yao/BaAdLAmgIR0B0Cgt/WlMzdX2UKGgGR7/LF2FFlTWHaAdLA2gIR0B0B3n1WbPQdX2UKGgGR7/ijpC8e0XxaAdLB2gIR0B0D47KaG5+dX2UKGgGR7/TwIdELH+7aAdLA2gIR0B0Coz9CNS7dX2UKGgGR7/rsGxD9fkWaAdLCWgIR0B0DV9Wp6yCdX2UKGgGR7/DtrKvFFUiaAdLAmgIR0B0CvBdld1MdX2UKGgGR7/dy1eBxxT9aAdLBmgIR0B0DmAEt/WldX2UKGgGR7/iR8UmD15CaAdLB2gIR0B0DCNvOyE+dX2UKGgGR7+j8YQ8OkLyaAdLAWgIR0B0DEsZpBX0dX2UKGgGR7/OjW07bL2YaAdLA2gIR0B0DuVD8cdYdX2UKGgGR7/zf2Cdz4lAaAdLDmgIR0B0CebSZ0CBdX2UKGgGR7/IsNlRP421aAdLA2gIR0B0DOaYu01JdX2UKGgGR7/N7YTTOPeYaAdLA2gIR0B0CoOz6ab4dX2UKGgGR7/gLHuJDVpcaAdLB2gIR0B0EEFyJbdKdX2UKGgGR7/A5imVJL/TaAdLAmgIR0B0EI85jpcHdX2UKGgGR7/dR3/xUedTaAdLBmgIR0B0C4+V1Oj7dX2UKGgGR8AB/9itq59WaAdLFmgIR0B0E4+pwS8KdX2UKGgGR7+xmbsniNsFaAdLAmgIR0B0C/sHB1s+dX2UKGgGR7/mlJQLux8laAdLCmgIR0B0Drn5i3G5dX2UKGgGR7/ApMHryDqXaAdLAmgIR0B0DwdwNsnBdX2UKGgGR7/lFwLmZE2HaAdLCGgIR0B0FPZlFtsOdX2UKGgGR7/tMfigkC3gaAdLCmgIR0B0EmOWBz3idX2UKGgGR7/klpPAO8TSaAdLCGgIR0B0DWHUMG5ddX2UKGgGR7/m6VUuL740aAdLB2gIR0B0EFGYrrgPdX2UKGgGR7/L5RCQcPvsaAdLA2gIR0B0FX91loUSdX2UKGgGR7/dsHSncclxaAdLBWgIR0B0Di3pfQa8dX2UKGgGR7/V8G9pRGc4aAdLBGgIR0B0FjtrsSkCdX2UKGgGR7/j5TQ3PzFuaAdLCGgIR0B0E+SEDhcadX2UKGgGR7/Mit7rs0HhaAdLA2gIR0B0DuQZGax5dX2UKGgGR7/iVuBMBZIQaAdLB2gIR0B0EaC9RJmNdX2UKGgGR7/S9t/FzdULaAdLA2gIR0B0D1mapgkUdX2UKGgGR7/WGDtgKF7EaAdLA2gIR0B0Eiw0O3DvdX2UKGgGR7/any/bj94vaAdLBmgIR0B0FOaQV9F4dX2UKGgGR7/lJx3mmtQsaAdLCGgIR0B0F6K508vFdX2UKGgGR7/U3xWkrPMTaAdLBGgIR0B0EAkzGgjAdX2UKGgGR7/YCJXQtz0ZaAdLBGgIR0B0FZV94NZvdX2UKGgGR7/jUf5k9U0faAdLBmgIR0B0EyZ7XxvvdX2UKGgGR7/PhsqJ/G2kaAdLA2gIR0B0EJOgxrSFdX2UKGgGR7/cjS5RTCLuaAdLBGgIR0B0GFVp9JBgdX2UKGgGR7/JoouwosqbaAdLA2gIR0B0GN3+uNgjdX2UKGgGR7/j/CAMDwH8aAdLBmgIR0B0EaNXHR1HdX2UKGgGR7/r0yYXwb2laAdLB2gIR0B0FGFbmlqKdX2UKGgGR7+80fozN2TxaAdLAmgIR0B0EfND+irUdX2UKGgGR7/izG5tm+TNaAdLBmgIR0B0Gfos7MgVdX2UKGgGR7/CQyRB/qgRaAdLAmgIR0B0GlQoCuEFdX2UKGgGR7/aGgBcRlH0aAdLBmgIR0B0FX3XZoPDdX2UKGgGR7/mGY8dPtUoaAdLB2gIR0B0E0aAFxGUdX2UKGgGR7/YVNHpbD/EaAdLBGgIR0B0FjRCx/utdX2UKGgGR7+8pjMFEAo5aAdLAmgIR0B0E6UmlZX/dX2UKGgGR7/jDO1OTJQtaAdLCGgIR0B0G9IatLcsdX2UKGgGR7/Ly8SPEKmbaAdLA2gIR0B0Fs8TzunddX2UKGgGR7/Vu5jH4oJBaAdLBGgIR0B0FGWHDaXbdX2UKGgGR7/T/kNnXd0raAdLBWgIR0B0HKiUPhAGdX2UKGgGR8AFXxQSBbwCaAdLG2gIR0B0Gl/jKgZkdX2UKGgGR7/L0Yj0L+glaAdLA2gIR0B0HSY+jdpJdX2UKGgGR7/j8Cgbp/wzaAdLB2gIR0B0FY8fV7QcdX2UKGgGR7/vwoTfzjFRaAdLCmgIR0B0GH73wkPddX2UKGgGR7+5hF3IMjNZaAdLAmgIR0B0Fez4UN8WdX2UKGgGR7/upV0cOskqaAdLCWgIR0B0HAAmzBykdX2UKGgGR7/gZsbedkJ8aAdLBmgIR0B0GZMEidJ8dX2UKGgGR7/lcrRSgoPTaAdLB2gIR0B0FyOsDGLldX2UKGgGR7/wbA+IMz/IaAdLC2gIR0B0Hxs1sLv1dX2UKGgGR7/LvnbItDlYaAdLA2gIR0B0HIhJRO1wdX2UKGgGR7/Hqlgtvn8saAdLA2gIR0B0F6yJKraNdX2UKGgGR7+2hpQDV6NVaAdLAmgIR0B0HNjoZAIIdX2UKGgGR7/qWPDHfdhzaAdLCGgIR0B0GvBqKxcFdX2UKGgGR7/lWJrLyMDPaAdLCGgIR0B0IG4UeuFIdX2UKGgGR7+i1kUbkwN9aAdLAWgIR0B0IJadMCcPdX2UKGgGR7/qXSa3I+4caAdLCWgIR0B0HmhRIjGDdX2UKGgGR7/nPUrkKeCkaAdLCmgIR0B0GWtEG7jDdX2UKGgGR7+i2phnanJlaAdLAWgIR0B0GZTNt65YdX2UKGgGR7/iBTGYKIBSaAdLB2gIR0B0IeapgkTpdX2UKGgGR7/xeT3Zf2K3aAdLDGgIR0B0HRCCz1K5dX2UKGgGR7/hs+eOGTLXaAdLB2gIR0B0H69WZJCjdX2UKGgGR7/OAo5PuXu3aAdLA2gIR0B0IC4Wk8A8dX2UKGgGR7/o5uQ6p5u7aAdLCmgIR0B0G18Sf16FdX2UKGgGR7/lrFwT/Q0GaAdLCGgIR0B0I0nUlRgrdX2UKGgGR7/iyRbKRuCPaAdLCGgIR0B0HpqDbrTqdX2UKGgGR7/i8HfMwDeTaAdLBWgIR0B0HFMDfWMCdX2UKGgGR7/QGRV6u4gBaAdLA2gIR0B0HN76YVqOdX2UKGgGR7/jZmh/RVp9aAdLB2gIR0B0JKHaews5dX2UKGgGR7/j1lPJq7AdaAdLB2gIR0B0H8mPYFq0dX2UKGgGR7/gdWyTpxFRaAdLBmgIR0B0HeCxu89PdX2UKGgGR7/gE2pAD7qIaAdLBmgIR0B0JaMn7YTTdX2UKGgGR7+8MhHLA57xaAdLAmgIR0B0Hjw4KhL5dX2UKGgGR7+8TQE6kqMFaAdLAmgIR0B0Jf8cdYGMdX2UKGgGR7/mHYYixFAnaAdLCWgIR0B0IXOVxCIDdX2UKGgGR7/QcVgx8D0UaAdLA2gIR0B0Hvifg75mdWUu"
56
  },
57
  "ep_success_buffer": {
58
  ":type:": "<class 'collections.deque'>",
59
  ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
60
  },
61
- "_n_updates": 4382,
62
  "n_steps": 5,
63
  "gamma": 0.99,
64
  "gae_lambda": 1.0,
 
4
  ":serialized:": "gAWVRQAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMG011bHRpSW5wdXRBY3RvckNyaXRpY1BvbGljeZSTlC4=",
5
  "__module__": "stable_baselines3.common.policies",
6
  "__doc__": "\n MultiInputActorClass policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space (Tuple)\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Uses the CombinedExtractor\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
7
+ "__init__": "<function MultiInputActorCriticPolicy.__init__ at 0x7fde7562f1c0>",
8
  "__abstractmethods__": "frozenset()",
9
+ "_abc_impl": "<_abc._abc_data object at 0x7fde7562a740>"
10
  },
11
  "verbose": 1,
12
  "policy_kwargs": {
 
19
  "weight_decay": 0
20
  }
21
  },
22
+ "num_timesteps": 79492,
23
  "_total_timesteps": 1000000,
24
  "_num_timesteps_at_start": 0,
25
  "seed": null,
26
  "action_noise": null,
27
+ "start_time": 1683724910010419395,
28
  "learning_rate": 0.0007,
29
  "tensorboard_log": null,
30
  "_last_obs": {
31
  ":type:": "<class 'collections.OrderedDict'>",
32
+ ":serialized:": "gAWVuwEAAAAAAACMC2NvbGxlY3Rpb25zlIwLT3JkZXJlZERpY3SUk5QpUpQojA1hY2hpZXZlZF9nb2FslIwSbnVtcHkuY29yZS5udW1lcmljlIwLX2Zyb21idWZmZXKUk5QoljAAAAAAAAAA3jMRvyLeET+Ntzq/eRSVvijvVD6wDPs+45hKvytJqT6v0RM//m0CPrcPdL0CKRg/lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksESwOGlIwBQ5R0lFKUjAxkZXNpcmVkX2dvYWyUaAcoljAAAAAAAAAAKGaRvgzzhD+xd9u/p6KovlCIjz9plqQ/jyO7v+bQZT/Ngys/u0fXP3Tyzr9Mgr0/lGgOSwRLA4aUaBJ0lFKUjAtvYnNlcnZhdGlvbpRoByiWYAAAAAAAAADeMxG/It4RP423Or9htCy/x+6Yuhour795FJW+KO9UPrAM+z5oXcq+AmbiP8fBMz/jmEq/K0mpPq/REz+R54y/LTIivio/kz/+bQI+tw90vQIpGD//iqs/UWzYv7OwQj+UaA5LBEsGhpRoEnSUUpR1Lg==",
33
+ "achieved_goal": "[[-0.5671977 0.5697957 -0.72936326]\n [-0.29117182 0.20794356 0.49033117]\n [-0.79139537 0.33063635 0.57741827]\n [ 0.12737271 -0.0595853 0.5943757 ]]",
34
+ "desired_goal": "[[-0.28398252 1.0386672 -1.7145902 ]\n [-0.32936594 1.1213474 1.2858402 ]\n [-1.4620227 0.8977188 0.6699799 ]\n [ 1.6818765 -1.6167741 1.4805388 ]]",
35
+ "observation": "[[-5.6719768e-01 5.6979573e-01 -7.2936326e-01 -6.7462736e-01\n -1.1667841e-03 -1.3685944e+00]\n [-2.9117182e-01 2.0794356e-01 4.9033117e-01 -3.9524388e-01\n 1.7687380e+00 7.0217556e-01]\n [-7.9139537e-01 3.3063635e-01 5.7741827e-01 -1.1008168e+00\n -1.5839453e-01 1.1503651e+00]\n [ 1.2737271e-01 -5.9585299e-02 5.9437573e-01 1.3401793e+00\n -1.6908056e+00 7.6050872e-01]]"
36
  },
37
  "_last_episode_starts": {
38
  ":type:": "<class 'numpy.ndarray'>",
39
+ ":serialized:": "gAWVdwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYEAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSwSFlIwBQ5R0lFKULg=="
40
  },
41
  "_last_original_obs": {
42
  ":type:": "<class 'collections.OrderedDict'>",
43
+ ":serialized:": "gAWVuwEAAAAAAACMC2NvbGxlY3Rpb25zlIwLT3JkZXJlZERpY3SUk5QpUpQojA1hY2hpZXZlZF9nb2FslIwSbnVtcHkuY29yZS5udW1lcmljlIwLX2Zyb21idWZmZXKUk5QoljAAAAAAAAAA6nIdPRlsGqxDI0o+6nIdPRlsGqxDI0o+6nIdPRlsGqxDI0o+6nIdPRlsGqxDI0o+lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksESwOGlIwBQ5R0lFKUjAxkZXNpcmVkX2dvYWyUaAcoljAAAAAAAAAAYbrhPYhAkr0gHw8+fMdRPSFiBT4JDDM+Lp3qO7HjoL3EKhM+VMEJvvoQFLyRrGI9lGgOSwRLA4aUaBJ0lFKUjAtvYnNlcnZhdGlvbpRoByiWYAAAAAAAAADqch09GWwarEMjSj4AAAAAAAAAgAAAAADqch09GWwarEMjSj4AAAAAAAAAgAAAAADqch09GWwarEMjSj4AAAAAAAAAgAAAAADqch09GWwarEMjSj4AAAAAAAAAgAAAAACUaA5LBEsGhpRoEnSUUpR1Lg==",
44
  "achieved_goal": "[[ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]]",
45
+ "desired_goal": "[[ 0.11021877 -0.07141215 0.13976717]\n [ 0.05121563 0.13025714 0.1748506 ]\n [ 0.00715985 -0.07855929 0.14371783]\n [-0.13452655 -0.00903725 0.05534035]]",
46
  "observation": "[[ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]]"
47
  },
48
  "_episode_num": 0,
49
  "use_sde": false,
50
  "sde_sample_freq": -1,
51
+ "_current_progress_remaining": 0.92052,
52
  "_stats_window_size": 100,
53
  "ep_info_buffer": {
54
  ":type:": "<class 'collections.deque'>",
55
+ ":serialized:": "gAWV4AsAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHv9awSrYGt6qMAWyUSwSMAXSUR0Byb34xk/bCdX2UKGgGR7/Vvegte2NOaAdLBWgIR0ByZKdrftQbdX2UKGgGR7/haC17Y02taAdLBmgIR0ByasNx2jfvdX2UKGgGR7/Ar7O3UhFFaAdLAmgIR0ByZUHv+fh/dX2UKGgGR7/O8yvcJtzkaAdLA2gIR0BydaJAMUh3dX2UKGgGR7/TcIZ62OQyaAdLBGgIR0BycJl6JIlMdX2UKGgGR7/R5aNdZ7ojaAdLA2gIR0ByZdn27FsIdX2UKGgGR7/MwA2hqTKUaAdLA2gIR0BydiPjn3cpdX2UKGgGR7/SPNFBppN9aAdLA2gIR0BycRBqsU7CdX2UKGgGR7/fBFuvUz9CaAdLBWgIR0Bya7RtxdY5dX2UKGgGR7+8uf29L6DXaAdLAmgIR0ByZi6RQrMDdX2UKGgGR7/P7MPjGT9saAdLA2gIR0BydrM9r434dX2UKGgGR7/Kj7ALy+YdaAdLA2gIR0BycaF+NLlFdX2UKGgGR7/NV5KODJ2daAdLA2gIR0BybETfzjFRdX2UKGgGR7/XlchTwUg0aAdLBWgIR0ByZwvkBCD3dX2UKGgGR7/PCgK4QSSNaAdLBGgIR0Byd2xQizLPdX2UKGgGR7/HqubI91U3aAdLA2gIR0BybNWsA/9pdX2UKGgGR7+nskY4yXUpaAdLAWgIR0Byd5opQUHqdX2UKGgGR7/a9q1w5vLpaAdLBGgIR0BycmEJ0GNadX2UKGgGR7/M92X9itq6aAdLA2gIR0BybU4uK4x2dX2UKGgGR7/S6DGtITXbaAdLBGgIR0BycxRl6JIldX2UKGgGR7+5uDSPU8V6aAdLAmgIR0BybbezlcQidX2UKGgGR7/gOwgTyrggaAdLBmgIR0ByeJyo4uK5dX2UKGgGR7+80tRNyo4uaAdLAmgIR0Byc2OxSpBHdX2UKGgGR7/kQljVhCtzaAdLCGgIR0ByaH4j8k2QdX2UKGgGR7/ShWHUMG5daAdLBGgIR0ByblwkxASndX2UKGgGR7/Adf9gnc+JaAdLAmgIR0ByaNbY9Pk8dX2UKGgGR7/ZAxBVuJk5aAdLBGgIR0ByeV6v7m+1dX2UKGgGR7/Vsf7rLQokaAdLBGgIR0BydCXUpd8idX2UKGgGR7/BYmLLpzLfaAdLAmgIR0BybstoSL62dX2UKGgGR7/SsniNsFdLaAdLBGgIR0ByaZaX8fmtdX2UKGgGR7/V3juKGcnWaAdLA2gIR0ByeeFGoaUBdX2UKGgGR7/KNQ0oBq9HaAdLA2gIR0BydKlANXo1dX2UKGgGR7/g1XmvGIbgaAdLBWgIR0Byb7VRUFSsdX2UKGgGR7/UiGWUr08OaAdLA2gIR0ByeoHgP3BYdX2UKGgGR7/W+B6KLsKLaAdLBWgIR0ByapDJEH+qdX2UKGgGR7/RZPl+3H7xaAdLA2gIR0ByexWYF7ladX2UKGgGR7/WuWa+evpyaAdLBGgIR0BycH5/LDAKdX2UKGgGR7+mFN+LFXJYaAdLAWgIR0Bye0BxPwd9dX2UKGgGR7/YgB91EE1VaAdLBGgIR0Bya0eYD1XedX2UKGgGR7/lgHVwxWT5aAdLCWgIR0Bydldu5z5odX2UKGgGR7/LGBnSOR1YaAdLBGgIR0BycSDqW1MNdX2UKGgGR7+8GZ/kNnXeaAdLAmgIR0Bya53X7LuAdX2UKGgGR7/Viay8jAzpaAdLBGgIR0Bye/3yqdYodX2UKGgGR7/DRUm2LHdXaAdLAmgIR0BydsTBZZB+dX2UKGgGR7/O7nPmgam5aAdLA2gIR0BycbVsk6cRdX2UKGgGR7/LIQvpQk5ZaAdLA2gIR0BybDC+De0pdX2UKGgGR7/Pos7MgU1yaAdLA2gIR0ByfHuPV/c4dX2UKGgGR7/Jq7iADq4ZaAdLA2gIR0Byd0WhysCDdX2UKGgGR7/R1/2Cdz4laAdLA2gIR0ByfRYYBNmEdX2UKGgGR7/iTJhfBvaUaAdLBGgIR0Bycn5qM3qBdX2UKGgGR7/aUTcqOLiuaAdLBGgIR0BybPpOerdWdX2UKGgGR7/aidJ8OTaCaAdLBGgIR0ByeA0YTCcgdX2UKGgGR7+MjZ+QU5+6aAdLAWgIR0BybSm3vx6OdX2UKGgGR7+h9gF5fMOgaAdLAWgIR0ByeDjT8YQ8dX2UKGgGR7/AVt4zJp35aAdLAmgIR0Byct3r2QGOdX2UKGgGR7/Wiay8jAzpaAdLBGgIR0ByfegOBlMAdX2UKGgGR7/DJIUahpQDaAdLAmgIR0Byc1Tgl4TsdX2UKGgGR7/OL0Bfa6BiaAdLA2gIR0ByeN+kP+XJdX2UKGgGR7+cry1/lQuVaAdLAWgIR0Byc4ZXMhX9dX2UKGgGR7/AUnG8274BaAdLAmgIR0ByfkokRjBmdX2UKGgGR7+je9Ba9sabaAdLAWgIR0ByfnOZ9d/sdX2UKGgGR7/B0se4kNWmaAdLAmgIR0Byc+H1vl2edX2UKGgGR7/GFMZgogFHaAdLA2gIR0ByeX1pTMq0dX2UKGgGR7/HCMPz4DcNaAdLA2gIR0ByfyktVaOhdX2UKGgGR7+99/jKgZjyaAdLAmgIR0ByefDIikftdX2UKGgGR7/K8YAKfFrEaAdLA2gIR0BydJTfixVydX2UKGgGR7/n5D7ZWaMKaAdLCWgIR0BybxF/hESedX2UKGgGR7+79deIEbHZaAdLAmgIR0Byellf7aZhdX2UKGgGR7/IroW56MR6aAdLA2gIR0Byf82m51/2dX2UKGgGR7/RLGaQV9F4aAdLA2gIR0BydUXBP9DQdX2UKGgGR7/Ke7tiQT24aAdLA2gIR0Byb8aNuLrHdX2UKGgGR7++v4dp7CzkaAdLAmgIR0ByevEfkmx/dX2UKGgGR7+7AO8TSLIgaAdLAmgIR0Bydbmig00ndX2UKGgGR7/Pt/FzdUKiaAdLA2gIR0BycFeiSJTEdX2UKGgGR7/XSLZSNwR5aAdLBGgIR0BygKPOpsGgdX2UKGgGR7/PkQwsXizcaAdLA2gIR0Bye3Ot4iX6dX2UKGgGR7/UqQzUI9kjaAdLA2gIR0BydkAU+LWJdX2UKGgGR7/AiYb83uNQaAdLAmgIR0BycLnyNGVidX2UKGgGR7+2NuLrHEMtaAdLAmgIR0BygRkK/mDEdX2UKGgGR7/SH2ys0YTCaAdLA2gIR0ByfAi8nNPhdX2UKGgGR7+8kjX4CZF5aAdLAmgIR0BycSUNayKOdX2UKGgGR7/JiYLLIPsiaAdLA2gIR0BydtbGFSKndX2UKGgGR7+1VtGd7OVxaAdLAmgIR0ByfF6NVBD5dX2UKGgGR7/axzq8lHBlaAdLBGgIR0ByceIfr8iwdX2UKGgGR7/S+jua4MF2aAdLBGgIR0ByfSaEzwc6dX2UKGgGR7/TuRs/IKc/aAdLBWgIR0Byd9DkU9IPdX2UKGgGR7/PyLhrFfiQaAdLA2gIR0BycnOE/SpjdX2UKGgGR7+6+PBBRhttaAdLAmgIR0ByfYKIBRyfdX2UKGgGR7/pGY0EX+ERaAdLCmgIR0BygwPOIInjdX2UKGgGR7+3ND+irT6SaAdLAmgIR0ByffV+Zw4sdX2UKGgGR7/Oo60Y0l7daAdLA2gIR0BycxIOH310dX2UKGgGR7/gJmmLtNSJaAdLBWgIR0ByeM1+AmRedX2UKGgGR7+dVmz0HyEtaAdLAWgIR0Byc05XEIgOdX2UKGgGR7/H0fYBeXzEaAdLA2gIR0Byg5me18b8dX2UKGgGR7/E1stTUAktaAdLAmgIR0ByfmCrcTJydX2UKGgGR792vbGm1pj+aAdLAWgIR0Byg8GKQ7tBdX2UKGgGR7/MGQCCBf8eaAdLA2gIR0ByeWK0lZ5idX2UKGgGR7/LFWn0kGA1aAdLA2gIR0ByfusHSncddX2UKGgGR7/ZrVOKwY+CaAdLBGgIR0BydAYEW69TdWUu"
56
  },
57
  "ep_success_buffer": {
58
  ":type:": "<class 'collections.deque'>",
59
  ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
60
  },
61
+ "_n_updates": 3974,
62
  "n_steps": 5,
63
  "gamma": 0.99,
64
  "gae_lambda": 1.0,
a2c-PandaReachDense-v3/policy.optimizer.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5bff22dc8560a3051ac937347ad4c68467ef2481b154c0c1d2d6263a52d87599
3
  size 44606
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:39da30bbd88e78d49dfa759e68be225473ca70f46e55802b382e41ae2e3e5208
3
  size 44606
a2c-PandaReachDense-v3/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6a96059ed7645178b420d71a4b1910889b5a691ba685bd22a2c7ae7df8ec0a62
3
  size 45886
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8ec06d546c0bad94df6cc88ebafae85c01cef022931be6272812b3cf986a4422
3
  size 45886
config.json CHANGED
@@ -1 +1 @@
1
- {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVRQAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMG011bHRpSW5wdXRBY3RvckNyaXRpY1BvbGljeZSTlC4=", "__module__": "stable_baselines3.common.policies", "__doc__": "\n MultiInputActorClass policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space (Tuple)\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Uses the CombinedExtractor\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function MultiInputActorCriticPolicy.__init__ at 0x7ff82903b5b0>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7ff829040e40>"}, "verbose": 1, "policy_kwargs": {":type:": "<class 'dict'>", ":serialized:": "gAWVgQAAAAAAAAB9lCiMD29wdGltaXplcl9jbGFzc5SME3RvcmNoLm9wdGltLnJtc3Byb3CUjAdSTVNwcm9wlJOUjBBvcHRpbWl6ZXJfa3dhcmdzlH2UKIwFYWxwaGGURz/vrhR64UeujANlcHOURz7k+LWI42jxjAx3ZWlnaHRfZGVjYXmUSwB1dS4=", "optimizer_class": "<class 'torch.optim.rmsprop.RMSprop'>", "optimizer_kwargs": {"alpha": 0.99, "eps": 1e-05, "weight_decay": 0}}, "num_timesteps": 87648, "_total_timesteps": 1000000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1683723069964750852, "learning_rate": 0.0007, "tensorboard_log": null, "_last_obs": {":type:": "<class 'collections.OrderedDict'>", ":serialized:": "gAWVuwEAAAAAAACMC2NvbGxlY3Rpb25zlIwLT3JkZXJlZERpY3SUk5QpUpQojA1hY2hpZXZlZF9nb2FslIwSbnVtcHkuY29yZS5udW1lcmljlIwLX2Zyb21idWZmZXKUk5QoljAAAAAAAAAAzrRfusItLT8SETM/SSOovunWZj+yiqM+FG+OvpfbBz1iXs8+FG+OvpfbBz1iXs8+lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksESwOGlIwBQ5R0lFKUjAxkZXNpcmVkX2dvYWyUaAcoljAAAAAAAAAAoLzRPzqn1j+T8m4/o4iTP0GFlz87kXc/PihRP9MvWr/5+pm/n+50Pb0dpj/wLI6/lGgOSwRLA4aUaBJ0lFKUjAtvYnNlcnZhdGlvbpRoByiWYAAAAAAAAADOtF+6wi0tPxIRMz+zZfI+u32MP8NtID9JI6i+6dZmP7KKoz7o/cA/BZsBvI6PI78Ub46+l9sHPWJezz6oj1c9VKzDOb9EiT0Ub46+l9sHPWJezz6oj1c9VKzDOb9EiT2UaA5LBEsGhpRoEnSUUpR1Lg==", "achieved_goal": "[[-8.5337169e-04 6.7647946e-01 6.9947922e-01]\n [-3.2839420e-01 9.0171677e-01 3.1941754e-01]\n [-2.7819121e-01 3.3168402e-02 4.0501696e-01]\n [-2.7819121e-01 3.3168402e-02 4.0501696e-01]]", "desired_goal": "[[ 1.6385689 1.6769783 0.9333889 ]\n [ 1.1526073 1.1837541 0.9670598 ]\n [ 0.8170203 -0.85229224 -1.2029716 ]\n [ 0.05979788 1.2977825 -1.1107464 ]]", "observation": "[[-8.5337169e-04 6.7647946e-01 6.9947922e-01 4.7343215e-01\n 1.0975870e+00 6.2667483e-01]\n [-3.2839420e-01 9.0171677e-01 3.1941754e-01 1.5077486e+00\n -7.9104947e-03 -6.3890922e-01]\n [-2.7819121e-01 3.3168402e-02 4.0501696e-01 5.2627236e-02\n 3.7321693e-04 6.7025654e-02]\n [-2.7819121e-01 3.3168402e-02 4.0501696e-01 5.2627236e-02\n 3.7321693e-04 6.7025654e-02]]"}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYEAAAAAAAAAAAAAQGUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSwSFlIwBQ5R0lFKULg=="}, "_last_original_obs": {":type:": "<class 'collections.OrderedDict'>", ":serialized:": "gAWVuwEAAAAAAACMC2NvbGxlY3Rpb25zlIwLT3JkZXJlZERpY3SUk5QpUpQojA1hY2hpZXZlZF9nb2FslIwSbnVtcHkuY29yZS5udW1lcmljlIwLX2Zyb21idWZmZXKUk5QoljAAAAAAAAAA6nIdPRlsGqxDI0o+6nIdPRlsGqxDI0o+6nIdPRlsGqxDI0o+6nIdPRlsGqxDI0o+lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksESwOGlIwBQ5R0lFKUjAxkZXNpcmVkX2dvYWyUaAcoljAAAAAAAAAAqFS2vbK+rz3s32A+v7h6vLV2Qr1hT7o9v3iCvbrzDL7XI4k9smzivXp1h72Jbq49lGgOSwRLA4aUaBJ0lFKUjAtvYnNlcnZhdGlvbpRoByiWYAAAAAAAAADqch09GWwarEMjSj4AAAAAAAAAgAAAAADqch09GWwarEMjSj4AAAAAAAAAgAAAAADqch09GWwarEMjSj4AAAAAAAAAgAAAAADqch09GWwarEMjSj4AAAAAAAAAgAAAAACUaA5LBEsGhpRoEnSUUpR1Lg==", "achieved_goal": "[[ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]]", "desired_goal": "[[-0.08902866 0.08581294 0.2196042 ]\n [-0.01530284 -0.04747649 0.09097172]\n [-0.06370687 -0.1376485 0.06696289]\n [-0.11055888 -0.06614204 0.08517177]]", "observation": "[[ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]]"}, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": 0.9123600000000001, "_stats_window_size": 100, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWV4AsAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHv+cPYFqzqr2MAWyUSwiMAXSUR0B0CYcT8HfNdX2UKGgGR7+emzjWCmMwaAdLAWgIR0B0CcUpNKywdX2UKGgGR7/ydI9TxXnyaAdLDGgIR0B0BXNPgvUSdX2UKGgGR7/plNtZV4oraAdLCGgIR0B0CExIre67dX2UKGgGR7+f4h2W6bvxaAdLAWgIR0B0CHXsgMc7dX2UKGgGR7/lmvnr6ciGaAdLCGgIR0B0DaUdJaq0dX2UKGgGR7/VUW2w3YL9aAdLBGgIR0B0CSbayrxRdX2UKGgGR7/TZB9kSVW0aAdLBGgIR0B0Dlf8dgfEdX2UKGgGR7/r9f9gnc+JaAdLC2gIR0B0C8WEbo8qdX2UKGgGR7+7gR9PUKAsaAdLAmgIR0B0CX0SRKYidX2UKGgGR7/pXokiUxEfaAdLCGgIR0B0BuxoqTbGdX2UKGgGR7+Y+B6KLsKLaAdLAWgIR0B0CakuYhMbdX2UKGgGR7+9ie/Yao/BaAdLAmgIR0B0Cgt/WlMzdX2UKGgGR7/LF2FFlTWHaAdLA2gIR0B0B3n1WbPQdX2UKGgGR7/ijpC8e0XxaAdLB2gIR0B0D47KaG5+dX2UKGgGR7/TwIdELH+7aAdLA2gIR0B0Coz9CNS7dX2UKGgGR7/rsGxD9fkWaAdLCWgIR0B0DV9Wp6yCdX2UKGgGR7/DtrKvFFUiaAdLAmgIR0B0CvBdld1MdX2UKGgGR7/dy1eBxxT9aAdLBmgIR0B0DmAEt/WldX2UKGgGR7/iR8UmD15CaAdLB2gIR0B0DCNvOyE+dX2UKGgGR7+j8YQ8OkLyaAdLAWgIR0B0DEsZpBX0dX2UKGgGR7/OjW07bL2YaAdLA2gIR0B0DuVD8cdYdX2UKGgGR7/zf2Cdz4lAaAdLDmgIR0B0CebSZ0CBdX2UKGgGR7/IsNlRP421aAdLA2gIR0B0DOaYu01JdX2UKGgGR7/N7YTTOPeYaAdLA2gIR0B0CoOz6ab4dX2UKGgGR7/gLHuJDVpcaAdLB2gIR0B0EEFyJbdKdX2UKGgGR7/A5imVJL/TaAdLAmgIR0B0EI85jpcHdX2UKGgGR7/dR3/xUedTaAdLBmgIR0B0C4+V1Oj7dX2UKGgGR8AB/9itq59WaAdLFmgIR0B0E4+pwS8KdX2UKGgGR7+xmbsniNsFaAdLAmgIR0B0C/sHB1s+dX2UKGgGR7/mlJQLux8laAdLCmgIR0B0Drn5i3G5dX2UKGgGR7/ApMHryDqXaAdLAmgIR0B0DwdwNsnBdX2UKGgGR7/lFwLmZE2HaAdLCGgIR0B0FPZlFtsOdX2UKGgGR7/tMfigkC3gaAdLCmgIR0B0EmOWBz3idX2UKGgGR7/klpPAO8TSaAdLCGgIR0B0DWHUMG5ddX2UKGgGR7/m6VUuL740aAdLB2gIR0B0EFGYrrgPdX2UKGgGR7/L5RCQcPvsaAdLA2gIR0B0FX91loUSdX2UKGgGR7/dsHSncclxaAdLBWgIR0B0Di3pfQa8dX2UKGgGR7/V8G9pRGc4aAdLBGgIR0B0FjtrsSkCdX2UKGgGR7/j5TQ3PzFuaAdLCGgIR0B0E+SEDhcadX2UKGgGR7/Mit7rs0HhaAdLA2gIR0B0DuQZGax5dX2UKGgGR7/iVuBMBZIQaAdLB2gIR0B0EaC9RJmNdX2UKGgGR7/S9t/FzdULaAdLA2gIR0B0D1mapgkUdX2UKGgGR7/WGDtgKF7EaAdLA2gIR0B0Eiw0O3DvdX2UKGgGR7/any/bj94vaAdLBmgIR0B0FOaQV9F4dX2UKGgGR7/lJx3mmtQsaAdLCGgIR0B0F6K508vFdX2UKGgGR7/U3xWkrPMTaAdLBGgIR0B0EAkzGgjAdX2UKGgGR7/YCJXQtz0ZaAdLBGgIR0B0FZV94NZvdX2UKGgGR7/jUf5k9U0faAdLBmgIR0B0EyZ7XxvvdX2UKGgGR7/PhsqJ/G2kaAdLA2gIR0B0EJOgxrSFdX2UKGgGR7/cjS5RTCLuaAdLBGgIR0B0GFVp9JBgdX2UKGgGR7/JoouwosqbaAdLA2gIR0B0GN3+uNgjdX2UKGgGR7/j/CAMDwH8aAdLBmgIR0B0EaNXHR1HdX2UKGgGR7/r0yYXwb2laAdLB2gIR0B0FGFbmlqKdX2UKGgGR7+80fozN2TxaAdLAmgIR0B0EfND+irUdX2UKGgGR7/izG5tm+TNaAdLBmgIR0B0Gfos7MgVdX2UKGgGR7/CQyRB/qgRaAdLAmgIR0B0GlQoCuEFdX2UKGgGR7/aGgBcRlH0aAdLBmgIR0B0FX3XZoPDdX2UKGgGR7/mGY8dPtUoaAdLB2gIR0B0E0aAFxGUdX2UKGgGR7/YVNHpbD/EaAdLBGgIR0B0FjRCx/utdX2UKGgGR7+8pjMFEAo5aAdLAmgIR0B0E6UmlZX/dX2UKGgGR7/jDO1OTJQtaAdLCGgIR0B0G9IatLcsdX2UKGgGR7/Ly8SPEKmbaAdLA2gIR0B0Fs8TzunddX2UKGgGR7/Vu5jH4oJBaAdLBGgIR0B0FGWHDaXbdX2UKGgGR7/T/kNnXd0raAdLBWgIR0B0HKiUPhAGdX2UKGgGR8AFXxQSBbwCaAdLG2gIR0B0Gl/jKgZkdX2UKGgGR7/L0Yj0L+glaAdLA2gIR0B0HSY+jdpJdX2UKGgGR7/j8Cgbp/wzaAdLB2gIR0B0FY8fV7QcdX2UKGgGR7/vwoTfzjFRaAdLCmgIR0B0GH73wkPddX2UKGgGR7+5hF3IMjNZaAdLAmgIR0B0Fez4UN8WdX2UKGgGR7/upV0cOskqaAdLCWgIR0B0HAAmzBykdX2UKGgGR7/gZsbedkJ8aAdLBmgIR0B0GZMEidJ8dX2UKGgGR7/lcrRSgoPTaAdLB2gIR0B0FyOsDGLldX2UKGgGR7/wbA+IMz/IaAdLC2gIR0B0Hxs1sLv1dX2UKGgGR7/LvnbItDlYaAdLA2gIR0B0HIhJRO1wdX2UKGgGR7/Hqlgtvn8saAdLA2gIR0B0F6yJKraNdX2UKGgGR7+2hpQDV6NVaAdLAmgIR0B0HNjoZAIIdX2UKGgGR7/qWPDHfdhzaAdLCGgIR0B0GvBqKxcFdX2UKGgGR7/lWJrLyMDPaAdLCGgIR0B0IG4UeuFIdX2UKGgGR7+i1kUbkwN9aAdLAWgIR0B0IJadMCcPdX2UKGgGR7/qXSa3I+4caAdLCWgIR0B0HmhRIjGDdX2UKGgGR7/nPUrkKeCkaAdLCmgIR0B0GWtEG7jDdX2UKGgGR7+i2phnanJlaAdLAWgIR0B0GZTNt65YdX2UKGgGR7/iBTGYKIBSaAdLB2gIR0B0IeapgkTpdX2UKGgGR7/xeT3Zf2K3aAdLDGgIR0B0HRCCz1K5dX2UKGgGR7/hs+eOGTLXaAdLB2gIR0B0H69WZJCjdX2UKGgGR7/OAo5PuXu3aAdLA2gIR0B0IC4Wk8A8dX2UKGgGR7/o5uQ6p5u7aAdLCmgIR0B0G18Sf16FdX2UKGgGR7/lrFwT/Q0GaAdLCGgIR0B0I0nUlRgrdX2UKGgGR7/iyRbKRuCPaAdLCGgIR0B0HpqDbrTqdX2UKGgGR7/i8HfMwDeTaAdLBWgIR0B0HFMDfWMCdX2UKGgGR7/QGRV6u4gBaAdLA2gIR0B0HN76YVqOdX2UKGgGR7/jZmh/RVp9aAdLB2gIR0B0JKHaews5dX2UKGgGR7/j1lPJq7AdaAdLB2gIR0B0H8mPYFq0dX2UKGgGR7/gdWyTpxFRaAdLBmgIR0B0HeCxu89PdX2UKGgGR7/gE2pAD7qIaAdLBmgIR0B0JaMn7YTTdX2UKGgGR7+8MhHLA57xaAdLAmgIR0B0Hjw4KhL5dX2UKGgGR7+8TQE6kqMFaAdLAmgIR0B0Jf8cdYGMdX2UKGgGR7/mHYYixFAnaAdLCWgIR0B0IXOVxCIDdX2UKGgGR7/QcVgx8D0UaAdLA2gIR0B0Hvifg75mdWUu"}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 4382, "n_steps": 5, "gamma": 0.99, "gae_lambda": 1.0, "ent_coef": 0.0, "vf_coef": 0.5, "max_grad_norm": 0.5, "normalize_advantage": false, "observation_space": {":type:": "<class 'gymnasium.spaces.dict.Dict'>", ":serialized:": "gAWVsAMAAAAAAACMFWd5bW5hc2l1bS5zcGFjZXMuZGljdJSMBERpY3SUk5QpgZR9lCiMBnNwYWNlc5SMC2NvbGxlY3Rpb25zlIwLT3JkZXJlZERpY3SUk5QpUpQojA1hY2hpZXZlZF9nb2FslIwUZ3ltbmFzaXVtLnNwYWNlcy5ib3iUjANCb3iUk5QpgZR9lCiMBWR0eXBllIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYowNYm91bmRlZF9iZWxvd5SMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYDAAAAAAAAAAEBAZRoE4wCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksDhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoHCiWAwAAAAAAAAABAQGUaCBLA4WUaCR0lFKUjAZfc2hhcGWUSwOFlIwDbG93lGgcKJYMAAAAAAAAAAAAIMEAACDBAAAgwZRoFksDhZRoJHSUUpSMBGhpZ2iUaBwolgwAAAAAAAAAAAAgQQAAIEEAACBBlGgWSwOFlGgkdJRSlIwIbG93X3JlcHKUjAUtMTAuMJSMCWhpZ2hfcmVwcpSMBDEwLjCUjApfbnBfcmFuZG9tlE51YowMZGVzaXJlZF9nb2FslGgNKYGUfZQoaBBoFmgZaBwolgMAAAAAAAAAAQEBlGggSwOFlGgkdJRSlGgnaBwolgMAAAAAAAAAAQEBlGggSwOFlGgkdJRSlGgsSwOFlGguaBwolgwAAAAAAAAAAAAgwQAAIMEAACDBlGgWSwOFlGgkdJRSlGgzaBwolgwAAAAAAAAAAAAgQQAAIEEAACBBlGgWSwOFlGgkdJRSlGg4jAUtMTAuMJRoOowEMTAuMJRoPE51YowLb2JzZXJ2YXRpb26UaA0pgZR9lChoEGgWaBloHCiWBgAAAAAAAAABAQEBAQGUaCBLBoWUaCR0lFKUaCdoHCiWBgAAAAAAAAABAQEBAQGUaCBLBoWUaCR0lFKUaCxLBoWUaC5oHCiWGAAAAAAAAAAAACDBAAAgwQAAIMEAACDBAAAgwQAAIMGUaBZLBoWUaCR0lFKUaDNoHCiWGAAAAAAAAAAAACBBAAAgQQAAIEEAACBBAAAgQQAAIEGUaBZLBoWUaCR0lFKUaDiMBS0xMC4wlGg6jAQxMC4wlGg8TnVidWgsTmgQTmg8TnViLg==", "spaces": "OrderedDict([('achieved_goal', Box(-10.0, 10.0, (3,), float32)), ('desired_goal', Box(-10.0, 10.0, (3,), float32)), ('observation', Box(-10.0, 10.0, (6,), float32))])", "_shape": null, "dtype": null, "_np_random": null}, "action_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVnQEAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWAwAAAAAAAAABAQGUaAiMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLA4WUjAFDlHSUUpSMDWJvdW5kZWRfYWJvdmWUaBEolgMAAAAAAAAAAQEBlGgVSwOFlGgZdJRSlIwGX3NoYXBllEsDhZSMA2xvd5RoESiWDAAAAAAAAAAAAIC/AACAvwAAgL+UaAtLA4WUaBl0lFKUjARoaWdolGgRKJYMAAAAAAAAAAAAgD8AAIA/AACAP5RoC0sDhZRoGXSUUpSMCGxvd19yZXBylIwELTEuMJSMCWhpZ2hfcmVwcpSMAzEuMJSMCl9ucF9yYW5kb22UTnViLg==", "dtype": "float32", "bounded_below": "[ True True True]", "bounded_above": "[ True True True]", "_shape": [3], "low": "[-1. -1. -1.]", "high": "[1. 1. 1.]", "low_repr": "-1.0", "high_repr": "1.0", "_np_random": null}, "n_envs": 4, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz9G8AaNuLrHhZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "system_info": {"OS": "Linux-5.10.147+-x86_64-with-glibc2.31 # 1 SMP Sat Dec 10 16:00:40 UTC 2022", "Python": "3.10.11", "Stable-Baselines3": "2.0.0a5", "PyTorch": "2.0.0+cu118", "GPU Enabled": "False", "Numpy": "1.22.4", "Cloudpickle": "2.2.1", "Gymnasium": "0.28.1", "OpenAI Gym": "0.25.2"}}
 
1
+ {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVRQAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMG011bHRpSW5wdXRBY3RvckNyaXRpY1BvbGljeZSTlC4=", "__module__": "stable_baselines3.common.policies", "__doc__": "\n MultiInputActorClass policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space (Tuple)\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Uses the CombinedExtractor\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function MultiInputActorCriticPolicy.__init__ at 0x7fde7562f1c0>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7fde7562a740>"}, "verbose": 1, "policy_kwargs": {":type:": "<class 'dict'>", ":serialized:": "gAWVgQAAAAAAAAB9lCiMD29wdGltaXplcl9jbGFzc5SME3RvcmNoLm9wdGltLnJtc3Byb3CUjAdSTVNwcm9wlJOUjBBvcHRpbWl6ZXJfa3dhcmdzlH2UKIwFYWxwaGGURz/vrhR64UeujANlcHOURz7k+LWI42jxjAx3ZWlnaHRfZGVjYXmUSwB1dS4=", "optimizer_class": "<class 'torch.optim.rmsprop.RMSprop'>", "optimizer_kwargs": {"alpha": 0.99, "eps": 1e-05, "weight_decay": 0}}, "num_timesteps": 79492, "_total_timesteps": 1000000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1683724910010419395, "learning_rate": 0.0007, "tensorboard_log": null, "_last_obs": {":type:": "<class 'collections.OrderedDict'>", ":serialized:": "gAWVuwEAAAAAAACMC2NvbGxlY3Rpb25zlIwLT3JkZXJlZERpY3SUk5QpUpQojA1hY2hpZXZlZF9nb2FslIwSbnVtcHkuY29yZS5udW1lcmljlIwLX2Zyb21idWZmZXKUk5QoljAAAAAAAAAA3jMRvyLeET+Ntzq/eRSVvijvVD6wDPs+45hKvytJqT6v0RM//m0CPrcPdL0CKRg/lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksESwOGlIwBQ5R0lFKUjAxkZXNpcmVkX2dvYWyUaAcoljAAAAAAAAAAKGaRvgzzhD+xd9u/p6KovlCIjz9plqQ/jyO7v+bQZT/Ngys/u0fXP3Tyzr9Mgr0/lGgOSwRLA4aUaBJ0lFKUjAtvYnNlcnZhdGlvbpRoByiWYAAAAAAAAADeMxG/It4RP423Or9htCy/x+6Yuhour795FJW+KO9UPrAM+z5oXcq+AmbiP8fBMz/jmEq/K0mpPq/REz+R54y/LTIivio/kz/+bQI+tw90vQIpGD//iqs/UWzYv7OwQj+UaA5LBEsGhpRoEnSUUpR1Lg==", "achieved_goal": "[[-0.5671977 0.5697957 -0.72936326]\n [-0.29117182 0.20794356 0.49033117]\n [-0.79139537 0.33063635 0.57741827]\n [ 0.12737271 -0.0595853 0.5943757 ]]", "desired_goal": "[[-0.28398252 1.0386672 -1.7145902 ]\n [-0.32936594 1.1213474 1.2858402 ]\n [-1.4620227 0.8977188 0.6699799 ]\n [ 1.6818765 -1.6167741 1.4805388 ]]", "observation": "[[-5.6719768e-01 5.6979573e-01 -7.2936326e-01 -6.7462736e-01\n -1.1667841e-03 -1.3685944e+00]\n [-2.9117182e-01 2.0794356e-01 4.9033117e-01 -3.9524388e-01\n 1.7687380e+00 7.0217556e-01]\n [-7.9139537e-01 3.3063635e-01 5.7741827e-01 -1.1008168e+00\n -1.5839453e-01 1.1503651e+00]\n [ 1.2737271e-01 -5.9585299e-02 5.9437573e-01 1.3401793e+00\n -1.6908056e+00 7.6050872e-01]]"}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYEAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSwSFlIwBQ5R0lFKULg=="}, "_last_original_obs": {":type:": "<class 'collections.OrderedDict'>", ":serialized:": "gAWVuwEAAAAAAACMC2NvbGxlY3Rpb25zlIwLT3JkZXJlZERpY3SUk5QpUpQojA1hY2hpZXZlZF9nb2FslIwSbnVtcHkuY29yZS5udW1lcmljlIwLX2Zyb21idWZmZXKUk5QoljAAAAAAAAAA6nIdPRlsGqxDI0o+6nIdPRlsGqxDI0o+6nIdPRlsGqxDI0o+6nIdPRlsGqxDI0o+lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksESwOGlIwBQ5R0lFKUjAxkZXNpcmVkX2dvYWyUaAcoljAAAAAAAAAAYbrhPYhAkr0gHw8+fMdRPSFiBT4JDDM+Lp3qO7HjoL3EKhM+VMEJvvoQFLyRrGI9lGgOSwRLA4aUaBJ0lFKUjAtvYnNlcnZhdGlvbpRoByiWYAAAAAAAAADqch09GWwarEMjSj4AAAAAAAAAgAAAAADqch09GWwarEMjSj4AAAAAAAAAgAAAAADqch09GWwarEMjSj4AAAAAAAAAgAAAAADqch09GWwarEMjSj4AAAAAAAAAgAAAAACUaA5LBEsGhpRoEnSUUpR1Lg==", "achieved_goal": "[[ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]]", "desired_goal": "[[ 0.11021877 -0.07141215 0.13976717]\n [ 0.05121563 0.13025714 0.1748506 ]\n [ 0.00715985 -0.07855929 0.14371783]\n [-0.13452655 -0.00903725 0.05534035]]", "observation": "[[ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]]"}, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": 0.92052, "_stats_window_size": 100, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWV4AsAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHv9awSrYGt6qMAWyUSwSMAXSUR0Byb34xk/bCdX2UKGgGR7/Vvegte2NOaAdLBWgIR0ByZKdrftQbdX2UKGgGR7/haC17Y02taAdLBmgIR0ByasNx2jfvdX2UKGgGR7/Ar7O3UhFFaAdLAmgIR0ByZUHv+fh/dX2UKGgGR7/O8yvcJtzkaAdLA2gIR0BydaJAMUh3dX2UKGgGR7/TcIZ62OQyaAdLBGgIR0BycJl6JIlMdX2UKGgGR7/R5aNdZ7ojaAdLA2gIR0ByZdn27FsIdX2UKGgGR7/MwA2hqTKUaAdLA2gIR0BydiPjn3cpdX2UKGgGR7/SPNFBppN9aAdLA2gIR0BycRBqsU7CdX2UKGgGR7/fBFuvUz9CaAdLBWgIR0Bya7RtxdY5dX2UKGgGR7+8uf29L6DXaAdLAmgIR0ByZi6RQrMDdX2UKGgGR7/P7MPjGT9saAdLA2gIR0BydrM9r434dX2UKGgGR7/Kj7ALy+YdaAdLA2gIR0BycaF+NLlFdX2UKGgGR7/NV5KODJ2daAdLA2gIR0BybETfzjFRdX2UKGgGR7/XlchTwUg0aAdLBWgIR0ByZwvkBCD3dX2UKGgGR7/PCgK4QSSNaAdLBGgIR0Byd2xQizLPdX2UKGgGR7/HqubI91U3aAdLA2gIR0BybNWsA/9pdX2UKGgGR7+nskY4yXUpaAdLAWgIR0Byd5opQUHqdX2UKGgGR7/a9q1w5vLpaAdLBGgIR0BycmEJ0GNadX2UKGgGR7/M92X9itq6aAdLA2gIR0BybU4uK4x2dX2UKGgGR7/S6DGtITXbaAdLBGgIR0BycxRl6JIldX2UKGgGR7+5uDSPU8V6aAdLAmgIR0BybbezlcQidX2UKGgGR7/gOwgTyrggaAdLBmgIR0ByeJyo4uK5dX2UKGgGR7+80tRNyo4uaAdLAmgIR0Byc2OxSpBHdX2UKGgGR7/kQljVhCtzaAdLCGgIR0ByaH4j8k2QdX2UKGgGR7/ShWHUMG5daAdLBGgIR0ByblwkxASndX2UKGgGR7/Adf9gnc+JaAdLAmgIR0ByaNbY9Pk8dX2UKGgGR7/ZAxBVuJk5aAdLBGgIR0ByeV6v7m+1dX2UKGgGR7/Vsf7rLQokaAdLBGgIR0BydCXUpd8idX2UKGgGR7/BYmLLpzLfaAdLAmgIR0BybstoSL62dX2UKGgGR7/SsniNsFdLaAdLBGgIR0ByaZaX8fmtdX2UKGgGR7/V3juKGcnWaAdLA2gIR0ByeeFGoaUBdX2UKGgGR7/KNQ0oBq9HaAdLA2gIR0BydKlANXo1dX2UKGgGR7/g1XmvGIbgaAdLBWgIR0Byb7VRUFSsdX2UKGgGR7/UiGWUr08OaAdLA2gIR0ByeoHgP3BYdX2UKGgGR7/W+B6KLsKLaAdLBWgIR0ByapDJEH+qdX2UKGgGR7/RZPl+3H7xaAdLA2gIR0ByexWYF7ladX2UKGgGR7/WuWa+evpyaAdLBGgIR0BycH5/LDAKdX2UKGgGR7+mFN+LFXJYaAdLAWgIR0Bye0BxPwd9dX2UKGgGR7/YgB91EE1VaAdLBGgIR0Bya0eYD1XedX2UKGgGR7/lgHVwxWT5aAdLCWgIR0Bydldu5z5odX2UKGgGR7/LGBnSOR1YaAdLBGgIR0BycSDqW1MNdX2UKGgGR7+8GZ/kNnXeaAdLAmgIR0Bya53X7LuAdX2UKGgGR7/Viay8jAzpaAdLBGgIR0Bye/3yqdYodX2UKGgGR7/DRUm2LHdXaAdLAmgIR0BydsTBZZB+dX2UKGgGR7/O7nPmgam5aAdLA2gIR0BycbVsk6cRdX2UKGgGR7/LIQvpQk5ZaAdLA2gIR0BybDC+De0pdX2UKGgGR7/Pos7MgU1yaAdLA2gIR0ByfHuPV/c4dX2UKGgGR7/Jq7iADq4ZaAdLA2gIR0Byd0WhysCDdX2UKGgGR7/R1/2Cdz4laAdLA2gIR0ByfRYYBNmEdX2UKGgGR7/iTJhfBvaUaAdLBGgIR0Bycn5qM3qBdX2UKGgGR7/aUTcqOLiuaAdLBGgIR0BybPpOerdWdX2UKGgGR7/aidJ8OTaCaAdLBGgIR0ByeA0YTCcgdX2UKGgGR7+MjZ+QU5+6aAdLAWgIR0BybSm3vx6OdX2UKGgGR7+h9gF5fMOgaAdLAWgIR0ByeDjT8YQ8dX2UKGgGR7/AVt4zJp35aAdLAmgIR0Byct3r2QGOdX2UKGgGR7/Wiay8jAzpaAdLBGgIR0ByfegOBlMAdX2UKGgGR7/DJIUahpQDaAdLAmgIR0Byc1Tgl4TsdX2UKGgGR7/OL0Bfa6BiaAdLA2gIR0ByeN+kP+XJdX2UKGgGR7+cry1/lQuVaAdLAWgIR0Byc4ZXMhX9dX2UKGgGR7/AUnG8274BaAdLAmgIR0ByfkokRjBmdX2UKGgGR7+je9Ba9sabaAdLAWgIR0ByfnOZ9d/sdX2UKGgGR7/B0se4kNWmaAdLAmgIR0Byc+H1vl2edX2UKGgGR7/GFMZgogFHaAdLA2gIR0ByeX1pTMq0dX2UKGgGR7/HCMPz4DcNaAdLA2gIR0ByfyktVaOhdX2UKGgGR7+99/jKgZjyaAdLAmgIR0ByefDIikftdX2UKGgGR7/K8YAKfFrEaAdLA2gIR0BydJTfixVydX2UKGgGR7/n5D7ZWaMKaAdLCWgIR0BybxF/hESedX2UKGgGR7+79deIEbHZaAdLAmgIR0Byellf7aZhdX2UKGgGR7/IroW56MR6aAdLA2gIR0Byf82m51/2dX2UKGgGR7/RLGaQV9F4aAdLA2gIR0BydUXBP9DQdX2UKGgGR7/Ke7tiQT24aAdLA2gIR0Byb8aNuLrHdX2UKGgGR7++v4dp7CzkaAdLAmgIR0ByevEfkmx/dX2UKGgGR7+7AO8TSLIgaAdLAmgIR0Bydbmig00ndX2UKGgGR7/Pt/FzdUKiaAdLA2gIR0BycFeiSJTEdX2UKGgGR7/XSLZSNwR5aAdLBGgIR0BygKPOpsGgdX2UKGgGR7/PkQwsXizcaAdLA2gIR0Bye3Ot4iX6dX2UKGgGR7/UqQzUI9kjaAdLA2gIR0BydkAU+LWJdX2UKGgGR7/AiYb83uNQaAdLAmgIR0BycLnyNGVidX2UKGgGR7+2NuLrHEMtaAdLAmgIR0BygRkK/mDEdX2UKGgGR7/SH2ys0YTCaAdLA2gIR0ByfAi8nNPhdX2UKGgGR7+8kjX4CZF5aAdLAmgIR0BycSUNayKOdX2UKGgGR7/JiYLLIPsiaAdLA2gIR0BydtbGFSKndX2UKGgGR7+1VtGd7OVxaAdLAmgIR0ByfF6NVBD5dX2UKGgGR7/axzq8lHBlaAdLBGgIR0ByceIfr8iwdX2UKGgGR7/S+jua4MF2aAdLBGgIR0ByfSaEzwc6dX2UKGgGR7/TuRs/IKc/aAdLBWgIR0Byd9DkU9IPdX2UKGgGR7/PyLhrFfiQaAdLA2gIR0BycnOE/SpjdX2UKGgGR7+6+PBBRhttaAdLAmgIR0ByfYKIBRyfdX2UKGgGR7/pGY0EX+ERaAdLCmgIR0BygwPOIInjdX2UKGgGR7+3ND+irT6SaAdLAmgIR0ByffV+Zw4sdX2UKGgGR7/Oo60Y0l7daAdLA2gIR0BycxIOH310dX2UKGgGR7/gJmmLtNSJaAdLBWgIR0ByeM1+AmRedX2UKGgGR7+dVmz0HyEtaAdLAWgIR0Byc05XEIgOdX2UKGgGR7/H0fYBeXzEaAdLA2gIR0Byg5me18b8dX2UKGgGR7/E1stTUAktaAdLAmgIR0ByfmCrcTJydX2UKGgGR792vbGm1pj+aAdLAWgIR0Byg8GKQ7tBdX2UKGgGR7/MGQCCBf8eaAdLA2gIR0ByeWK0lZ5idX2UKGgGR7/LFWn0kGA1aAdLA2gIR0ByfusHSncddX2UKGgGR7/ZrVOKwY+CaAdLBGgIR0BydAYEW69TdWUu"}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 3974, "n_steps": 5, "gamma": 0.99, "gae_lambda": 1.0, "ent_coef": 0.0, "vf_coef": 0.5, "max_grad_norm": 0.5, "normalize_advantage": false, "observation_space": {":type:": "<class 'gymnasium.spaces.dict.Dict'>", ":serialized:": "gAWVsAMAAAAAAACMFWd5bW5hc2l1bS5zcGFjZXMuZGljdJSMBERpY3SUk5QpgZR9lCiMBnNwYWNlc5SMC2NvbGxlY3Rpb25zlIwLT3JkZXJlZERpY3SUk5QpUpQojA1hY2hpZXZlZF9nb2FslIwUZ3ltbmFzaXVtLnNwYWNlcy5ib3iUjANCb3iUk5QpgZR9lCiMBWR0eXBllIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYowNYm91bmRlZF9iZWxvd5SMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYDAAAAAAAAAAEBAZRoE4wCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksDhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoHCiWAwAAAAAAAAABAQGUaCBLA4WUaCR0lFKUjAZfc2hhcGWUSwOFlIwDbG93lGgcKJYMAAAAAAAAAAAAIMEAACDBAAAgwZRoFksDhZRoJHSUUpSMBGhpZ2iUaBwolgwAAAAAAAAAAAAgQQAAIEEAACBBlGgWSwOFlGgkdJRSlIwIbG93X3JlcHKUjAUtMTAuMJSMCWhpZ2hfcmVwcpSMBDEwLjCUjApfbnBfcmFuZG9tlE51YowMZGVzaXJlZF9nb2FslGgNKYGUfZQoaBBoFmgZaBwolgMAAAAAAAAAAQEBlGggSwOFlGgkdJRSlGgnaBwolgMAAAAAAAAAAQEBlGggSwOFlGgkdJRSlGgsSwOFlGguaBwolgwAAAAAAAAAAAAgwQAAIMEAACDBlGgWSwOFlGgkdJRSlGgzaBwolgwAAAAAAAAAAAAgQQAAIEEAACBBlGgWSwOFlGgkdJRSlGg4jAUtMTAuMJRoOowEMTAuMJRoPE51YowLb2JzZXJ2YXRpb26UaA0pgZR9lChoEGgWaBloHCiWBgAAAAAAAAABAQEBAQGUaCBLBoWUaCR0lFKUaCdoHCiWBgAAAAAAAAABAQEBAQGUaCBLBoWUaCR0lFKUaCxLBoWUaC5oHCiWGAAAAAAAAAAAACDBAAAgwQAAIMEAACDBAAAgwQAAIMGUaBZLBoWUaCR0lFKUaDNoHCiWGAAAAAAAAAAAACBBAAAgQQAAIEEAACBBAAAgQQAAIEGUaBZLBoWUaCR0lFKUaDiMBS0xMC4wlGg6jAQxMC4wlGg8TnVidWgsTmgQTmg8TnViLg==", "spaces": "OrderedDict([('achieved_goal', Box(-10.0, 10.0, (3,), float32)), ('desired_goal', Box(-10.0, 10.0, (3,), float32)), ('observation', Box(-10.0, 10.0, (6,), float32))])", "_shape": null, "dtype": null, "_np_random": null}, "action_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVnQEAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWAwAAAAAAAAABAQGUaAiMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLA4WUjAFDlHSUUpSMDWJvdW5kZWRfYWJvdmWUaBEolgMAAAAAAAAAAQEBlGgVSwOFlGgZdJRSlIwGX3NoYXBllEsDhZSMA2xvd5RoESiWDAAAAAAAAAAAAIC/AACAvwAAgL+UaAtLA4WUaBl0lFKUjARoaWdolGgRKJYMAAAAAAAAAAAAgD8AAIA/AACAP5RoC0sDhZRoGXSUUpSMCGxvd19yZXBylIwELTEuMJSMCWhpZ2hfcmVwcpSMAzEuMJSMCl9ucF9yYW5kb22UTnViLg==", "dtype": "float32", "bounded_below": "[ True True True]", "bounded_above": "[ True True True]", "_shape": [3], "low": "[-1. -1. -1.]", "high": "[1. 1. 1.]", "low_repr": "-1.0", "high_repr": "1.0", "_np_random": null}, "n_envs": 4, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVxQIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSS91c3IvbG9jYWwvbGliL3B5dGhvbjMuMTAvZGlzdC1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEuEQwIEAZSMA3ZhbJSFlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjEkvdXNyL2xvY2FsL2xpYi9weXRob24zLjEwL2Rpc3QtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lHVOTmgAjBBfbWFrZV9lbXB0eV9jZWxslJOUKVKUhZR0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaB99lH2UKGgWaA2MDF9fcXVhbG5hbWVfX5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUjA9fX2Fubm90YXRpb25zX1+UfZSMDl9fa3dkZWZhdWx0c19flE6MDF9fZGVmYXVsdHNfX5ROjApfX21vZHVsZV9flGgXjAdfX2RvY19flE6MC19fY2xvc3VyZV9flGgAjApfbWFrZV9jZWxslJOURz9G8AaNuLrHhZRSlIWUjBdfY2xvdWRwaWNrbGVfc3VibW9kdWxlc5RdlIwLX19nbG9iYWxzX1+UfZR1hpSGUjAu"}, "system_info": {"OS": "Linux-5.10.147+-x86_64-with-glibc2.31 # 1 SMP Sat Dec 10 16:00:40 UTC 2022", "Python": "3.10.11", "Stable-Baselines3": "2.0.0a5", "PyTorch": "2.0.0+cu118", "GPU Enabled": "False", "Numpy": "1.22.4", "Cloudpickle": "2.2.1", "Gymnasium": "0.28.1", "OpenAI Gym": "0.25.2"}}
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": -0.3731922900304198, "std_reward": 0.24761006609831218, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2023-05-10T12:56:44.841701"}
 
1
+ {"mean_reward": -0.25809289999999996, "std_reward": 0.12599486341629168, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2023-05-10T13:28:31.373861"}
vec_normalize.pkl CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7213840b5a8056cfcc967e0dd8956e3d47132fcac0941cc332922c9126b12a7d
3
  size 2553
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fba557c9e2c2e0506120d0e41114b972ef6e2586c4cfe742772e0912a2159695
3
  size 2553