pregonas commited on
Commit
13ef26c
1 Parent(s): c61f13a

Initial commit

Browse files
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: PandaReachDense-v2
17
  metrics:
18
  - type: mean_reward
19
- value: -2.53 +/- 0.94
20
  name: mean_reward
21
  verified: false
22
  ---
 
16
  type: PandaReachDense-v2
17
  metrics:
18
  - type: mean_reward
19
+ value: -1.77 +/- 0.25
20
  name: mean_reward
21
  verified: false
22
  ---
a2c-PandaReachDense-v2.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5f118197b1bb5caa6eca22bc8745e61e3b232fb031e2ed1ac29e0c3152f0901d
3
- size 108148
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e559e216484d85442408f9e84220fec0a8a9a691f114dda2d9e76027348b33ba
3
+ size 109425
a2c-PandaReachDense-v2/data CHANGED
@@ -4,9 +4,9 @@
4
  ":serialized:": "gAWVRQAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMG011bHRpSW5wdXRBY3RvckNyaXRpY1BvbGljeZSTlC4=",
5
  "__module__": "stable_baselines3.common.policies",
6
  "__doc__": "\n MultiInputActorClass policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space (Tuple)\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Uses the CombinedExtractor\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
7
- "__init__": "<function MultiInputActorCriticPolicy.__init__ at 0x7fcb3b77f5e0>",
8
  "__abstractmethods__": "frozenset()",
9
- "_abc_impl": "<_abc._abc_data object at 0x7fcb3b781200>"
10
  },
11
  "verbose": 1,
12
  "policy_kwargs": {
@@ -41,24 +41,24 @@
41
  "_np_random": null
42
  },
43
  "n_envs": 4,
44
- "num_timesteps": 1000000,
45
- "_total_timesteps": 1000000,
46
  "_num_timesteps_at_start": 0,
47
  "seed": null,
48
  "action_noise": null,
49
- "start_time": 1680286311978665348,
50
- "learning_rate": 0.0007,
51
  "tensorboard_log": null,
52
  "lr_schedule": {
53
  ":type:": "<class 'function'>",
54
- ":serialized:": "gAWVwwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOS9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS4JDAgABlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOS9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoFmgNjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoF4wHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/RvAGjbi6x4WUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="
55
  },
56
  "_last_obs": {
57
  ":type:": "<class 'collections.OrderedDict'>",
58
- ":serialized:": "gAWVuwEAAAAAAACMC2NvbGxlY3Rpb25zlIwLT3JkZXJlZERpY3SUk5QpUpQojA1hY2hpZXZlZF9nb2FslIwSbnVtcHkuY29yZS5udW1lcmljlIwLX2Zyb21idWZmZXKUk5QoljAAAAAAAAAAYB7SPr7Vt7jJAhM/YB7SPr7Vt7jJAhM/YB7SPr7Vt7jJAhM/YB7SPr7Vt7jJAhM/lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksESwOGlIwBQ5R0lFKUjAxkZXNpcmVkX2dvYWyUaAcoljAAAAAAAAAAl3vYP+62fb/6hX+/ET+QP2RhxD8ybKm/A9wlPrCltb8zyks/xESqv10bNT+x1zu/lGgOSwRLA4aUaBJ0lFKUjAtvYnNlcnZhdGlvbpRoByiWYAAAAAAAAABgHtI+vtW3uMkCEz9uzrM7xau2uklQm7pgHtI+vtW3uMkCEz9uzrM7xau2uklQm7pgHtI+vtW3uMkCEz9uzrM7xau2uklQm7pgHtI+vtW3uMkCEz9uzrM7xau2uklQm7qUaA5LBEsGhpRoEnSUUpR1Lg==",
59
- "achieved_goal": "[[ 4.1038799e-01 -8.7659326e-05 5.7426125e-01]\n [ 4.1038799e-01 -8.7659326e-05 5.7426125e-01]\n [ 4.1038799e-01 -8.7659326e-05 5.7426125e-01]\n [ 4.1038799e-01 -8.7659326e-05 5.7426125e-01]]",
60
- "desired_goal": "[[ 1.6912717 -0.99107254 -0.99813807]\n [ 1.1269246 1.5342221 -1.3236144 ]\n [ 0.16197209 -1.4191189 0.79605407]\n [-1.3302236 0.7074488 -0.73375994]]",
61
- "observation": "[[ 4.1038799e-01 -8.7659326e-05 5.7426125e-01 5.4872548e-03\n -1.3936689e-03 -1.1849488e-03]\n [ 4.1038799e-01 -8.7659326e-05 5.7426125e-01 5.4872548e-03\n -1.3936689e-03 -1.1849488e-03]\n [ 4.1038799e-01 -8.7659326e-05 5.7426125e-01 5.4872548e-03\n -1.3936689e-03 -1.1849488e-03]\n [ 4.1038799e-01 -8.7659326e-05 5.7426125e-01 5.4872548e-03\n -1.3936689e-03 -1.1849488e-03]]"
62
  },
63
  "_last_episode_starts": {
64
  ":type:": "<class 'numpy.ndarray'>",
@@ -66,29 +66,29 @@
66
  },
67
  "_last_original_obs": {
68
  ":type:": "<class 'collections.OrderedDict'>",
69
- ":serialized:": "gAWVuwEAAAAAAACMC2NvbGxlY3Rpb25zlIwLT3JkZXJlZERpY3SUk5QpUpQojA1hY2hpZXZlZF9nb2FslIwSbnVtcHkuY29yZS5udW1lcmljlIwLX2Zyb21idWZmZXKUk5QoljAAAAAAAAAA6nIdPRlsGqxDI0o+6nIdPRlsGqxDI0o+6nIdPRlsGqxDI0o+6nIdPRlsGqxDI0o+lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksESwOGlIwBQ5R0lFKUjAxkZXNpcmVkX2dvYWyUaAcoljAAAAAAAAAAEsYFPRRksj2tMS4+CdEVvZBAKj1UBPQ9cO11vVQPh7zQRKw9xpr2ve04RD03kQI+lGgOSwRLA4aUaBJ0lFKUjAtvYnNlcnZhdGlvbpRoByiWYAAAAAAAAADqch09GWwarEMjSj4AAAAAAAAAgAAAAADqch09GWwarEMjSj4AAAAAAAAAgAAAAADqch09GWwarEMjSj4AAAAAAAAAgAAAAADqch09GWwarEMjSj4AAAAAAAAAgAAAAACUaA5LBEsGhpRoEnSUUpR1Lg==",
70
  "achieved_goal": "[[ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]]",
71
- "desired_goal": "[[ 0.0326596 0.08710495 0.17011137]\n [-0.0365763 0.04156548 0.11914888]\n [-0.06004089 -0.0164868 0.08411562]\n [-0.12041239 0.04790585 0.12750708]]",
72
  "observation": "[[ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]]"
73
  },
74
  "_episode_num": 0,
75
- "use_sde": false,
76
  "sde_sample_freq": -1,
77
  "_current_progress_remaining": 0.0,
78
  "ep_info_buffer": {
79
  ":type:": "<class 'collections.deque'>",
80
- ":serialized:": "gAWVHRAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIWtWSjnIQBsCUhpRSlIwBbJRLMowBdJRHQKcsd2fTTfB1fZQoaAZoCWgPQwgvwakPJO8AwJSGlFKUaBVLMmgWR0CnLCWq94/vdX2UKGgGaAloD0MIQrEVNC2RAsCUhpRSlGgVSzJoFkdApyvTTH80lHV9lChoBmgJaA9DCNyhYTHqWvy/lIaUUpRoFUsyaBZHQKcrdy4nWrh1fZQoaAZoCWgPQwhh+l5DcFwDwJSGlFKUaBVLMmgWR0CnLWxIjGDMdX2UKGgGaAloD0MIlBPtKqRsFsCUhpRSlGgVSzJoFkdApy0aGetjkXV9lChoBmgJaA9DCJEotKz75wPAlIaUUpRoFUsyaBZHQKcsx6WPcSJ1fZQoaAZoCWgPQwgYesToucX8v5SGlFKUaBVLMmgWR0CnLGuv2Xb/dX2UKGgGaAloD0MIqRWm7zUkBcCUhpRSlGgVSzJoFkdApy5lfE4vOHV9lChoBmgJaA9DCIGv6NZrev+/lIaUUpRoFUsyaBZHQKcuE1vVEux1fZQoaAZoCWgPQwi9/48TJqwLwJSGlFKUaBVLMmgWR0CnLcDSgGr0dX2UKGgGaAloD0MIcET3rGtEFsCUhpRSlGgVSzJoFkdApy1kr3CbdHV9lChoBmgJaA9DCMsRMpBndwHAlIaUUpRoFUsyaBZHQKcvVerMkhR1fZQoaAZoCWgPQwjYZfhPNzADwJSGlFKUaBVLMmgWR0CnLwPEjxCqdX2UKGgGaAloD0MIxsGlY86TBsCUhpRSlGgVSzJoFkdApy6xYcNpd3V9lChoBmgJaA9DCB5U4jrGVQfAlIaUUpRoFUsyaBZHQKcuVUxVQyh1fZQoaAZoCWgPQwinP/uRItIFwJSGlFKUaBVLMmgWR0CnMEeS0Sh8dX2UKGgGaAloD0MIZF3cRgOYAMCUhpRSlGgVSzJoFkdApy/1Y6nzhHV9lChoBmgJaA9DCATmIVM+ZAbAlIaUUpRoFUsyaBZHQKcvowD/2kB1fZQoaAZoCWgPQwhegehJmWQQwJSGlFKUaBVLMmgWR0CnL0cNH6MzdX2UKGgGaAloD0MIo5BkVu+QC8CUhpRSlGgVSzJoFkdApzFwP5HmR3V9lChoBmgJaA9DCEgYBiy5ygHAlIaUUpRoFUsyaBZHQKcxHq9Gqgh1fZQoaAZoCWgPQwjs3LQZp6H+v5SGlFKUaBVLMmgWR0CnMMz4+KTCdX2UKGgGaAloD0MIfjUHCOZoD8CUhpRSlGgVSzJoFkdApzBxWHUMHHV9lChoBmgJaA9DCK6f/rPmhwrAlIaUUpRoFUsyaBZHQKcy6aMrEtN1fZQoaAZoCWgPQwjDDI0ngngLwJSGlFKUaBVLMmgWR0CnMpf3N9pidX2UKGgGaAloD0MILoz0ona//7+UhpRSlGgVSzJoFkdApzJGQlruY3V9lChoBmgJaA9DCJmghm9h/QjAlIaUUpRoFUsyaBZHQKcx6ogmqo91fZQoaAZoCWgPQwhKC5dV2Ez4v5SGlFKUaBVLMmgWR0CnNHA6dUbUdX2UKGgGaAloD0MIl631RUJbA8CUhpRSlGgVSzJoFkdApzQeotL+P3V9lChoBmgJaA9DCPeRW5NuSwPAlIaUUpRoFUsyaBZHQKczzRYRuj11fZQoaAZoCWgPQwj2RNeFH4wRwJSGlFKUaBVLMmgWR0CnM3HHvMKUdX2UKGgGaAloD0MIOe//44SJA8CUhpRSlGgVSzJoFkdApzYFymygPHV9lChoBmgJaA9DCFe0Oc5tggLAlIaUUpRoFUsyaBZHQKc1tMEidJ91fZQoaAZoCWgPQwg1ecpqun4EwJSGlFKUaBVLMmgWR0CnNWMWfseGdX2UKGgGaAloD0MIC9KMRdOZ+r+UhpRSlGgVSzJoFkdApzUH2dupCXV9lChoBmgJaA9DCCNNvAM8KQnAlIaUUpRoFUsyaBZHQKc3ruMuOCJ1fZQoaAZoCWgPQwjxhF5/Et//v5SGlFKUaBVLMmgWR0CnN1101ZTydX2UKGgGaAloD0MIgSGrWz0nBcCUhpRSlGgVSzJoFkdApzcLYAbQ1XV9lChoBmgJaA9DCJ9x4UBINg3AlIaUUpRoFUsyaBZHQKc2sAoXsPd1fZQoaAZoCWgPQwgTYFj+fFsHwJSGlFKUaBVLMmgWR0CnOUcuBczJdX2UKGgGaAloD0MIBwlRvqDlAsCUhpRSlGgVSzJoFkdApzj2JrLyMHV9lChoBmgJaA9DCONw5ldzYAnAlIaUUpRoFUsyaBZHQKc4pLEDQqt1fZQoaAZoCWgPQwhkc9U8R8QCwJSGlFKUaBVLMmgWR0CnOEmdI5HVdX2UKGgGaAloD0MIzvxqDhAMAMCUhpRSlGgVSzJoFkdApzrLwvxpc3V9lChoBmgJaA9DCBheSfJcvxPAlIaUUpRoFUsyaBZHQKc6eiOearp1fZQoaAZoCWgPQwhrDaX2Itr9v5SGlFKUaBVLMmgWR0CnOihXr+o+dX2UKGgGaAloD0MI9x4uOe4U+L+UhpRSlGgVSzJoFkdApznMEPlMiHV9lChoBmgJaA9DCPwcHy3O2APAlIaUUpRoFUsyaBZHQKc7w4e9zwN1fZQoaAZoCWgPQwiWlSaloHsKwJSGlFKUaBVLMmgWR0CnO3G4qgAZdX2UKGgGaAloD0MIcv4mFCJgCsCUhpRSlGgVSzJoFkdApzsflp48l3V9lChoBmgJaA9DCNRDNLqDmPe/lIaUUpRoFUsyaBZHQKc6w3Ov+wV1fZQoaAZoCWgPQwgpsWt7u+UCwJSGlFKUaBVLMmgWR0CnPMGTLW7OdX2UKGgGaAloD0MIwHlx4qv9BsCUhpRSlGgVSzJoFkdApzxvY4ACGXV9lChoBmgJaA9DCF8lH7sL1A3AlIaUUpRoFUsyaBZHQKc8Ha0QbuN1fZQoaAZoCWgPQwhGXtbEAp/7v5SGlFKUaBVLMmgWR0CnO8Gp++dtdX2UKGgGaAloD0MIveMUHckFD8CUhpRSlGgVSzJoFkdApz24X668QXV9lChoBmgJaA9DCHgLJCh+LAfAlIaUUpRoFUsyaBZHQKc9Zhhpg1F1fZQoaAZoCWgPQwh8gO7LmQ0CwJSGlFKUaBVLMmgWR0CnPROE/SpjdX2UKGgGaAloD0MIcQFolC6dBsCUhpRSlGgVSzJoFkdApzy3dCVrynV9lChoBmgJaA9DCAyR09fztQ7AlIaUUpRoFUsyaBZHQKc+r9iMHbB1fZQoaAZoCWgPQwh/vFetTJgBwJSGlFKUaBVLMmgWR0CnPl24EwFldX2UKGgGaAloD0MINUbrqGoC/b+UhpRSlGgVSzJoFkdApz4LhzeXRnV9lChoBmgJaA9DCNV5VPzf0f6/lIaUUpRoFUsyaBZHQKc9r2xIJ7d1fZQoaAZoCWgPQwjzjlN0JFcFwJSGlFKUaBVLMmgWR0CnP5Z13dKvdX2UKGgGaAloD0MI+u3rwDkjC8CUhpRSlGgVSzJoFkdApz9EMqjJuHV9lChoBmgJaA9DCJS+EHLeHw7AlIaUUpRoFUsyaBZHQKc+8bcXWOJ1fZQoaAZoCWgPQwjGpL+XwgMKwJSGlFKUaBVLMmgWR0CnPpVstTUBdX2UKGgGaAloD0MIlbpkHCN5CsCUhpRSlGgVSzJoFkdAp0CF+XqqwXV9lChoBmgJaA9DCK+Xpghwuvy/lIaUUpRoFUsyaBZHQKdAM+/QBxR1fZQoaAZoCWgPQwiRD3o2q+4TwJSGlFKUaBVLMmgWR0CnP+Gf5DZ2dX2UKGgGaAloD0MIQdR9AFKrEcCUhpRSlGgVSzJoFkdApz+Fgnc+JXV9lChoBmgJaA9DCEyqtpvgm/q/lIaUUpRoFUsyaBZHQKdBbBTGYKJ1fZQoaAZoCWgPQwh6qkNuhosSwJSGlFKUaBVLMmgWR0CnQRnrIHTrdX2UKGgGaAloD0MIEXNJ1XbzBMCUhpRSlGgVSzJoFkdAp0DHW8RL9XV9lChoBmgJaA9DCFExzt+Egg7AlIaUUpRoFUsyaBZHQKdAaxHG0eF1fZQoaAZoCWgPQwi6TbhX5g0CwJSGlFKUaBVLMmgWR0CnQmLh73PBdX2UKGgGaAloD0MI5xcl6C9UDsCUhpRSlGgVSzJoFkdAp0IQnSfDk3V9lChoBmgJaA9DCLLV5ZSAWP2/lIaUUpRoFUsyaBZHQKdBvlZowmF1fZQoaAZoCWgPQwhcVIuIYlIGwJSGlFKUaBVLMmgWR0CnQWIfbKzSdX2UKGgGaAloD0MI2JyDZ0LT+b+UhpRSlGgVSzJoFkdAp0NSJ9AoonV9lChoBmgJaA9DCIDVkSOdoQfAlIaUUpRoFUsyaBZHQKdDAAG0NSZ1fZQoaAZoCWgPQwgRGsHG9a/4v5SGlFKUaBVLMmgWR0CnQq1kUbkwdX2UKGgGaAloD0MI4UIewY0UBMCUhpRSlGgVSzJoFkdAp0JRUPxx1nV9lChoBmgJaA9DCFLvqZz2dADAlIaUUpRoFUsyaBZHQKdERsXSBsh1fZQoaAZoCWgPQwi9OVyrPRwRwJSGlFKUaBVLMmgWR0CnQ/Sn+AEudX2UKGgGaAloD0MIkiQIV0BhEcCUhpRSlGgVSzJoFkdAp0OiLwWnCXV9lChoBmgJaA9DCAKAY8+eCwvAlIaUUpRoFUsyaBZHQKdDReiSJTF1fZQoaAZoCWgPQwjzVIfcDHf2v5SGlFKUaBVLMmgWR0CnRTHKwIMSdX2UKGgGaAloD0MIy2d5HtwdD8CUhpRSlGgVSzJoFkdAp0Tf1OCXhXV9lChoBmgJaA9DCNhGPNnNjPS/lIaUUpRoFUsyaBZHQKdEjXYlIEt1fZQoaAZoCWgPQwiO6J51jZbzv5SGlFKUaBVLMmgWR0CnRDEwN9YwdX2UKGgGaAloD0MITHFV2XflAcCUhpRSlGgVSzJoFkdAp0Ye49X9znV9lChoBmgJaA9DCNC2mnXGdwLAlIaUUpRoFUsyaBZHQKdFzRBNVR11fZQoaAZoCWgPQwhdaoR+pt71v5SGlFKUaBVLMmgWR0CnRXqIznA7dX2UKGgGaAloD0MI2Xkbmx3pAMCUhpRSlGgVSzJoFkdAp0Ue606YFHV9lChoBmgJaA9DCIWZtn9lZQjAlIaUUpRoFUsyaBZHQKdHCBVdX1d1fZQoaAZoCWgPQwiJRQw7jOkBwJSGlFKUaBVLMmgWR0CnRrXRG+bmdX2UKGgGaAloD0MIBFYOLbLdEcCUhpRSlGgVSzJoFkdAp0ZjTz/ZNHV9lChoBmgJaA9DCOSG3023DBDAlIaUUpRoFUsyaBZHQKdGBvxYq5N1ZS4="
81
  },
82
  "ep_success_buffer": {
83
  ":type:": "<class 'collections.deque'>",
84
  ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
85
  },
86
  "_n_updates": 50000,
87
- "n_steps": 5,
88
  "gamma": 0.99,
89
- "gae_lambda": 1.0,
90
  "ent_coef": 0.0,
91
- "vf_coef": 0.5,
92
  "max_grad_norm": 0.5,
93
  "normalize_advantage": false
94
  }
 
4
  ":serialized:": "gAWVRQAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMG011bHRpSW5wdXRBY3RvckNyaXRpY1BvbGljeZSTlC4=",
5
  "__module__": "stable_baselines3.common.policies",
6
  "__doc__": "\n MultiInputActorClass policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space (Tuple)\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Uses the CombinedExtractor\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
7
+ "__init__": "<function MultiInputActorCriticPolicy.__init__ at 0x7f8249c790d0>",
8
  "__abstractmethods__": "frozenset()",
9
+ "_abc_impl": "<_abc._abc_data object at 0x7f8249c77340>"
10
  },
11
  "verbose": 1,
12
  "policy_kwargs": {
 
41
  "_np_random": null
42
  },
43
  "n_envs": 4,
44
+ "num_timesteps": 2000000,
45
+ "_total_timesteps": 2000000,
46
  "_num_timesteps_at_start": 0,
47
  "seed": null,
48
  "action_noise": null,
49
+ "start_time": 1680290443097352701,
50
+ "learning_rate": 0.00025,
51
  "tensorboard_log": null,
52
  "lr_schedule": {
53
  ":type:": "<class 'function'>",
54
+ ":serialized:": "gAWVwwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOS9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS4JDAgABlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOS9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoFmgNjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoF4wHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/MGJN0vGp/IWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="
55
  },
56
  "_last_obs": {
57
  ":type:": "<class 'collections.OrderedDict'>",
58
+ ":serialized:": "gAWVuwEAAAAAAACMC2NvbGxlY3Rpb25zlIwLT3JkZXJlZERpY3SUk5QpUpQojA1hY2hpZXZlZF9nb2FslIwSbnVtcHkuY29yZS5udW1lcmljlIwLX2Zyb21idWZmZXKUk5QoljAAAAAAAAAAtQSaPsU1DrzOjgk/tQSaPsU1DrzOjgk/tQSaPsU1DrzOjgk/tQSaPsU1DrzOjgk/lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksESwOGlIwBQ5R0lFKUjAxkZXNpcmVkX2dvYWyUaAcoljAAAAAAAAAAM9DHP0f1vD8QKqY/0tjUvpCDj79sJj2/2b+hv0aItL/e8ME/sZuJv7PRjj/v+Ea/lGgOSwRLA4aUaBJ0lFKUjAtvYnNlcnZhdGlvbpRoByiWYAAAAAAAAAC1BJo+xTUOvM6OCT/xHqy7SLVIOsotJju1BJo+xTUOvM6OCT/xHqy7SLVIOsotJju1BJo+xTUOvM6OCT/xHqy7SLVIOsotJju1BJo+xTUOvM6OCT/xHqy7SLVIOsotJjuUaA5LBEsGhpRoEnSUUpR1Lg==",
59
+ "achieved_goal": "[[ 0.30081716 -0.00867981 0.5373353 ]\n [ 0.30081716 -0.00867981 0.5373353 ]\n [ 0.30081716 -0.00867981 0.5373353 ]\n [ 0.30081716 -0.00867981 0.5373353 ]]",
60
+ "desired_goal": "[[ 1.5610412 1.4762353 1.2981586]\n [-0.4157167 -1.1212025 -0.7388675]\n [-1.2636672 -1.4104087 1.5151632]\n [-1.0750638 1.1157745 -0.7772359]]",
61
+ "observation": "[[ 0.30081716 -0.00867981 0.5373353 -0.00525271 0.00076564 0.00253569]\n [ 0.30081716 -0.00867981 0.5373353 -0.00525271 0.00076564 0.00253569]\n [ 0.30081716 -0.00867981 0.5373353 -0.00525271 0.00076564 0.00253569]\n [ 0.30081716 -0.00867981 0.5373353 -0.00525271 0.00076564 0.00253569]]"
62
  },
63
  "_last_episode_starts": {
64
  ":type:": "<class 'numpy.ndarray'>",
 
66
  },
67
  "_last_original_obs": {
68
  ":type:": "<class 'collections.OrderedDict'>",
69
+ ":serialized:": "gAWVuwEAAAAAAACMC2NvbGxlY3Rpb25zlIwLT3JkZXJlZERpY3SUk5QpUpQojA1hY2hpZXZlZF9nb2FslIwSbnVtcHkuY29yZS5udW1lcmljlIwLX2Zyb21idWZmZXKUk5QoljAAAAAAAAAA6nIdPRlsGqxDI0o+6nIdPRlsGqxDI0o+6nIdPRlsGqxDI0o+6nIdPRlsGqxDI0o+lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksESwOGlIwBQ5R0lFKUjAxkZXNpcmVkX2dvYWyUaAcoljAAAAAAAAAAkqUYvgeUDL5WqHU+9uyAPOp/lL1wMx09iejCvbVyzT3JFXI+XiyGvX1Htb3Ka8Q9lGgOSwRLA4aUaBJ0lFKUjAtvYnNlcnZhdGlvbpRoByiWYAAAAAAAAADqch09GWwarEMjSj4AAAAAAAAAgAAAAADqch09GWwarEMjSj4AAAAAAAAAgAAAAADqch09GWwarEMjSj4AAAAAAAAAgAAAAADqch09GWwarEMjSj4AAAAAAAAAgAAAAACUaA5LBEsGhpRoEnSUUpR1Lg==",
70
  "achieved_goal": "[[ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]]",
71
+ "desired_goal": "[[-0.1490691 -0.13728343 0.23989996]\n [ 0.01573799 -0.0725096 0.03837913]\n [-0.09517009 0.10031644 0.23641123]\n [-0.06551431 -0.08851526 0.09590872]]",
72
  "observation": "[[ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]]"
73
  },
74
  "_episode_num": 0,
75
+ "use_sde": true,
76
  "sde_sample_freq": -1,
77
  "_current_progress_remaining": 0.0,
78
  "ep_info_buffer": {
79
  ":type:": "<class 'collections.deque'>",
80
+ ":serialized:": "gAWVHRAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIhQoOL4iI+r+UhpRSlIwBbJRLMowBdJRHQLP0eTEBKcx1fZQoaAZoCWgPQwj4b16c+Kr6v5SGlFKUaBVLMmgWR0Cz9FkQbuMNdX2UKGgGaAloD0MIsmMjEK+r/7+UhpRSlGgVSzJoFkdAs/Q5eyAxz3V9lChoBmgJaA9DCC5U/rW8cvq/lIaUUpRoFUsyaBZHQLP0GO7QLNR1fZQoaAZoCWgPQwiojlVKz7T7v5SGlFKUaBVLMmgWR0Cz9PBPfsNUdX2UKGgGaAloD0MI+igjLgDN+b+UhpRSlGgVSzJoFkdAs/TQLDye7XV9lChoBmgJaA9DCMAHr13aMPy/lIaUUpRoFUsyaBZHQLP0sJuEVWV1fZQoaAZoCWgPQwin5nKDoQ76v5SGlFKUaBVLMmgWR0Cz9JAnMMZxdX2UKGgGaAloD0MI34eDhCgf/7+UhpRSlGgVSzJoFkdAs/Ve8BdUsHV9lChoBmgJaA9DCIapLXWQl/y/lIaUUpRoFUsyaBZHQLP1Ps6q8151fZQoaAZoCWgPQwh56SYxCKz6v5SGlFKUaBVLMmgWR0Cz9R9A5aNddX2UKGgGaAloD0MI7DNnfcpx+L+UhpRSlGgVSzJoFkdAs/T+uGKyfXV9lChoBmgJaA9DCFoqb0c4Lfa/lIaUUpRoFUsyaBZHQLP10L4vexh1fZQoaAZoCWgPQwi4VnvYC0X8v5SGlFKUaBVLMmgWR0Cz9bCSzPa+dX2UKGgGaAloD0MIg8DKoUX2+7+UhpRSlGgVSzJoFkdAs/WQ+UyHmHV9lChoBmgJaA9DCOuoaoKoe/y/lIaUUpRoFUsyaBZHQLP1cGxD9fl1fZQoaAZoCWgPQwiFsBpLWNv8v5SGlFKUaBVLMmgWR0Cz9j+mR/3GdX2UKGgGaAloD0MIkQpjC0HO+b+UhpRSlGgVSzJoFkdAs/Yff3vhInV9lChoBmgJaA9DCDIDlfHvs/i/lIaUUpRoFUsyaBZHQLP1/+XJHRV1fZQoaAZoCWgPQwg8EcR5OIH/v5SGlFKUaBVLMmgWR0Cz9d9cjZ+QdX2UKGgGaAloD0MIGTigpStY/L+UhpRSlGgVSzJoFkdAs/a1i6QNkXV9lChoBmgJaA9DCJNuS+SCs/i/lIaUUpRoFUsyaBZHQLP2lWtEG7l1fZQoaAZoCWgPQwgE54wo7U39v5SGlFKUaBVLMmgWR0Cz9nXb/Ot5dX2UKGgGaAloD0MI/OO9amVC+r+UhpRSlGgVSzJoFkdAs/ZVbJOnEXV9lChoBmgJaA9DCJtyhXe5yPu/lIaUUpRoFUsyaBZHQLP3I9SuQp51fZQoaAZoCWgPQwjy6bEtAw74v5SGlFKUaBVLMmgWR0Cz9wO/UONHdX2UKGgGaAloD0MIKIHNOXgm+r+UhpRSlGgVSzJoFkdAs/bkJC0F83V9lChoBmgJaA9DCEBs6dFUD/u/lIaUUpRoFUsyaBZHQLP2w7gsK9h1fZQoaAZoCWgPQwird7gdGpb5v5SGlFKUaBVLMmgWR0Cz98wxesxPdX2UKGgGaAloD0MI+BisONWa/r+UhpRSlGgVSzJoFkdAs/esSPEKmnV9lChoBmgJaA9DCIfe4uE9R/u/lIaUUpRoFUsyaBZHQLP3jO/tY0V1fZQoaAZoCWgPQwhdFajF4CEAwJSGlFKUaBVLMmgWR0Cz92ytzS1FdX2UKGgGaAloD0MIkZkLXB7r+7+UhpRSlGgVSzJoFkdAs/h2tW+49XV9lChoBmgJaA9DCDGale1D3vu/lIaUUpRoFUsyaBZHQLP4VuiN83N1fZQoaAZoCWgPQwiBzTl4JjT4v5SGlFKUaBVLMmgWR0Cz+DeuieundX2UKGgGaAloD0MI641aYfpe+L+UhpRSlGgVSzJoFkdAs/gXfk3juXV9lChoBmgJaA9DCJSilXuBGfm/lIaUUpRoFUsyaBZHQLP5JzYEnst1fZQoaAZoCWgPQwj9E1ysqEH8v5SGlFKUaBVLMmgWR0Cz+QdbgTAWdX2UKGgGaAloD0MIuwuUFFiA+r+UhpRSlGgVSzJoFkdAs/joPbwjMXV9lChoBmgJaA9DCKRTVz7LEwDAlIaUUpRoFUsyaBZHQLP4yABkqc51fZQoaAZoCWgPQwiDMLd7uU/5v5SGlFKUaBVLMmgWR0Cz+dY1xbSrdX2UKGgGaAloD0MIi/87okI1/L+UhpRSlGgVSzJoFkdAs/m2ZYxL03V9lChoBmgJaA9DCE2CN6RRgQDAlIaUUpRoFUsyaBZHQLP5lyLQ5WB1fZQoaAZoCWgPQwjMm8O12sP6v5SGlFKUaBVLMmgWR0Cz+Xb3PAwgdX2UKGgGaAloD0MIJeoFn+Yk+b+UhpRSlGgVSzJoFkdAs/qRs1sLv3V9lChoBmgJaA9DCH7GhQMhmfe/lIaUUpRoFUsyaBZHQLP6cd7OVxF1fZQoaAZoCWgPQwhhcM0d/W/2v5SGlFKUaBVLMmgWR0Cz+lKg/TsqdX2UKGgGaAloD0MIsoAJ3Lob9r+UhpRSlGgVSzJoFkdAs/oyXVsk6nV9lChoBmgJaA9DCI2chT3tcPa/lIaUUpRoFUsyaBZHQLP7RRGc4HZ1fZQoaAZoCWgPQwiRgTy7fGv6v5SGlFKUaBVLMmgWR0Cz+yU12q1gdX2UKGgGaAloD0MI3QiLijid+r+UhpRSlGgVSzJoFkdAs/sF/tpmE3V9lChoBmgJaA9DCBjrG5jcqPm/lIaUUpRoFUsyaBZHQLP65dGy5Zt1fZQoaAZoCWgPQwj1vvG1Z9b+v5SGlFKUaBVLMmgWR0Cz+/57w8W9dX2UKGgGaAloD0MIv5gtWRXh+7+UhpRSlGgVSzJoFkdAs/veqDK5kXV9lChoBmgJaA9DCOLplbIM8fi/lIaUUpRoFUsyaBZHQLP7v4axX4l1fZQoaAZoCWgPQwg826M33Ef4v5SGlFKUaBVLMmgWR0Cz+59Mj/uLdX2UKGgGaAloD0MI/OHnvwev9b+UhpRSlGgVSzJoFkdAs/yYyGi5/nV9lChoBmgJaA9DCO8DkNrEyfi/lIaUUpRoFUsyaBZHQLP8eKHwgDB1fZQoaAZoCWgPQwiLNzKP/IH8v5SGlFKUaBVLMmgWR0Cz/FkgjhUBdX2UKGgGaAloD0MIIHpSJjV097+UhpRSlGgVSzJoFkdAs/w4oLG7z3V9lChoBmgJaA9DCLB2FOeo4/y/lIaUUpRoFUsyaBZHQLP9B5E+gUV1fZQoaAZoCWgPQwj2J/G5E2z3v5SGlFKUaBVLMmgWR0Cz/OdthuwYdX2UKGgGaAloD0MIscOY9PdS+b+UhpRSlGgVSzJoFkdAs/zH0XgtOHV9lChoBmgJaA9DCLqgvmVO1/y/lIaUUpRoFUsyaBZHQLP8p1QqI8B1fZQoaAZoCWgPQwiY+Q5+4sD3v5SGlFKUaBVLMmgWR0Cz/XcZUDMedX2UKGgGaAloD0MIwjBgyVUs97+UhpRSlGgVSzJoFkdAs/1W7Xg9/3V9lChoBmgJaA9DCLTnMjUJ3v2/lIaUUpRoFUsyaBZHQLP9N04iosJ1fZQoaAZoCWgPQwifr1kuGx38v5SGlFKUaBVLMmgWR0Cz/RbLyMDPdX2UKGgGaAloD0MIoYUEjC4PAMCUhpRSlGgVSzJoFkdAs/3nTNMXanV9lChoBmgJaA9DCAaE1sOXSfa/lIaUUpRoFUsyaBZHQLP9xzNliBp1fZQoaAZoCWgPQwjtLHqnAq76v5SGlFKUaBVLMmgWR0Cz/aeSbH6udX2UKGgGaAloD0MIN+LJbmY0+7+UhpRSlGgVSzJoFkdAs/2HAdn003V9lChoBmgJaA9DCNbm/1VHzvi/lIaUUpRoFUsyaBZHQLP+WT/Q0Gh1fZQoaAZoCWgPQwh9dytLdFb5v5SGlFKUaBVLMmgWR0Cz/jkmhM8HdX2UKGgGaAloD0MI7lpCPuhZ+b+UhpRSlGgVSzJoFkdAs/4ZhgE2YXV9lChoBmgJaA9DCERtG0ZBcPm/lIaUUpRoFUsyaBZHQLP9+QDV6NV1fZQoaAZoCWgPQwhlj1AzpMr7v5SGlFKUaBVLMmgWR0Cz/saT4cm0dX2UKGgGaAloD0MIwjI2dLP/9r+UhpRSlGgVSzJoFkdAs/6miO/+KnV9lChoBmgJaA9DCLdj6q7sAve/lIaUUpRoFUsyaBZHQLP+hyZKFqV1fZQoaAZoCWgPQwg0u+6tSMz2v5SGlFKUaBVLMmgWR0Cz/mah6By0dX2UKGgGaAloD0MIzuFa7WGv/b+UhpRSlGgVSzJoFkdAs/88BuGbkXV9lChoBmgJaA9DCMQI4dHG0fi/lIaUUpRoFUsyaBZHQLP/G+d9Ujt1fZQoaAZoCWgPQwhRMjm1M8z2v5SGlFKUaBVLMmgWR0Cz/vxJ7LMcdX2UKGgGaAloD0MIKT+p9um4/b+UhpRSlGgVSzJoFkdAs/7bwPRRdnV9lChoBmgJaA9DCIRkARO4dfi/lIaUUpRoFUsyaBZHQLP/p3VTaTR1fZQoaAZoCWgPQwj+mqxRD9H8v5SGlFKUaBVLMmgWR0Cz/4dVBD5TdX2UKGgGaAloD0MItCH/zCA++r+UhpRSlGgVSzJoFkdAs/9nvWpZOnV9lChoBmgJaA9DCBVXlX1XRPu/lIaUUpRoFUsyaBZHQLP/R2CuloF1fZQoaAZoCWgPQwivQspPqr33v5SGlFKUaBVLMmgWR0C0ABiliz9kdX2UKGgGaAloD0MIiXssfehC/b+UhpRSlGgVSzJoFkdAs//4eMhounV9lChoBmgJaA9DCJg1scBX9P2/lIaUUpRoFUsyaBZHQLP/2OJLuhN1fZQoaAZoCWgPQwirX+l8eFb4v5SGlFKUaBVLMmgWR0Cz/7haPjn3dX2UKGgGaAloD0MIm6285H9y/r+UhpRSlGgVSzJoFkdAtACFbeMyanV9lChoBmgJaA9DCAjMQ6Z8iPi/lIaUUpRoFUsyaBZHQLQAZU5uIh11fZQoaAZoCWgPQwgvou2Yuuv6v5SGlFKUaBVLMmgWR0C0AEW+j/ModX2UKGgGaAloD0MIVyJQ/YNIAMCUhpRSlGgVSzJoFkdAtAAlOtW+5HV9lChoBmgJaA9DCNNmnIaoQvm/lIaUUpRoFUsyaBZHQLQA9vrGBFx1fZQoaAZoCWgPQwiYUMHhBZH+v5SGlFKUaBVLMmgWR0C0ANbfpD/mdX2UKGgGaAloD0MIETRmEvXC97+UhpRSlGgVSzJoFkdAtAC3TnaFmHV9lChoBmgJaA9DCO5cGOlF7fy/lIaUUpRoFUsyaBZHQLQAltHhCMR1ZS4="
81
  },
82
  "ep_success_buffer": {
83
  ":type:": "<class 'collections.deque'>",
84
  ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
85
  },
86
  "_n_updates": 50000,
87
+ "n_steps": 10,
88
  "gamma": 0.99,
89
+ "gae_lambda": 0.9,
90
  "ent_coef": 0.0,
91
+ "vf_coef": 0.4,
92
  "max_grad_norm": 0.5,
93
  "normalize_advantage": false
94
  }
a2c-PandaReachDense-v2/policy.optimizer.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:696a1fd1cb54c16e1d078081551ca8349b7e0d59ab816d548d3732e55e9762ed
3
- size 44734
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9257339899c48f2b2f2c4a1a9a3fd0d0113d79c1b0596adc62f63470bb9c17f3
3
+ size 45438
a2c-PandaReachDense-v2/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:858a61ff4410857231eb23fd914f48bd68e40b0dcf0eb683a9b8ae4ffa3849ad
3
- size 46014
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:021c53b1fc5ff65c400fa10cb46de1825e53a208ec217ef82503c2838a9191cc
3
+ size 46718
config.json CHANGED
@@ -1 +1 @@
1
- {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVRQAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMG011bHRpSW5wdXRBY3RvckNyaXRpY1BvbGljeZSTlC4=", "__module__": "stable_baselines3.common.policies", "__doc__": "\n MultiInputActorClass policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space (Tuple)\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Uses the CombinedExtractor\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function MultiInputActorCriticPolicy.__init__ at 0x7fcb3b77f5e0>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7fcb3b781200>"}, "verbose": 1, "policy_kwargs": {":type:": "<class 'dict'>", ":serialized:": "gAWVgQAAAAAAAAB9lCiMD29wdGltaXplcl9jbGFzc5SME3RvcmNoLm9wdGltLnJtc3Byb3CUjAdSTVNwcm9wlJOUjBBvcHRpbWl6ZXJfa3dhcmdzlH2UKIwFYWxwaGGURz/vrhR64UeujANlcHOURz7k+LWI42jxjAx3ZWlnaHRfZGVjYXmUSwB1dS4=", "optimizer_class": "<class 'torch.optim.rmsprop.RMSprop'>", "optimizer_kwargs": {"alpha": 0.99, "eps": 1e-05, "weight_decay": 0}}, "observation_space": {":type:": "<class 'gym.spaces.dict.Dict'>", ":serialized:": "gAWVUgMAAAAAAACMD2d5bS5zcGFjZXMuZGljdJSMBERpY3SUk5QpgZR9lCiMBnNwYWNlc5SMC2NvbGxlY3Rpb25zlIwLT3JkZXJlZERpY3SUk5QpUpQojA1hY2hpZXZlZF9nb2FslIwOZ3ltLnNwYWNlcy5ib3iUjANCb3iUk5QpgZR9lCiMBWR0eXBllIwFbnVtcHmUaBCTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYowGX3NoYXBllEsDhZSMA2xvd5SMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYMAAAAAAAAAAAAIMEAACDBAAAgwZRoFUsDhZSMAUOUdJRSlIwEaGlnaJRoHSiWDAAAAAAAAAAAACBBAAAgQQAAIEGUaBVLA4WUaCB0lFKUjA1ib3VuZGVkX2JlbG93lGgdKJYDAAAAAAAAAAEBAZRoEowCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksDhZRoIHSUUpSMDWJvdW5kZWRfYWJvdmWUaB0olgMAAAAAAAAAAQEBlGgsSwOFlGggdJRSlIwKX25wX3JhbmRvbZROdWKMDGRlc2lyZWRfZ29hbJRoDSmBlH2UKGgQaBVoGEsDhZRoGmgdKJYMAAAAAAAAAAAAIMEAACDBAAAgwZRoFUsDhZRoIHSUUpRoI2gdKJYMAAAAAAAAAAAAIEEAACBBAAAgQZRoFUsDhZRoIHSUUpRoKGgdKJYDAAAAAAAAAAEBAZRoLEsDhZRoIHSUUpRoMmgdKJYDAAAAAAAAAAEBAZRoLEsDhZRoIHSUUpRoN051YowLb2JzZXJ2YXRpb26UaA0pgZR9lChoEGgVaBhLBoWUaBpoHSiWGAAAAAAAAAAAACDBAAAgwQAAIMEAACDBAAAgwQAAIMGUaBVLBoWUaCB0lFKUaCNoHSiWGAAAAAAAAAAAACBBAAAgQQAAIEEAACBBAAAgQQAAIEGUaBVLBoWUaCB0lFKUaChoHSiWBgAAAAAAAAABAQEBAQGUaCxLBoWUaCB0lFKUaDJoHSiWBgAAAAAAAAABAQEBAQGUaCxLBoWUaCB0lFKUaDdOdWJ1aBhOaBBOaDdOdWIu", "spaces": "OrderedDict([('achieved_goal', Box([-10. -10. -10.], [10. 10. 10.], (3,), float32)), ('desired_goal', Box([-10. -10. -10.], [10. 10. 10.], (3,), float32)), ('observation', Box([-10. -10. -10. -10. -10. -10.], [10. 10. 10. 10. 10. 10.], (6,), float32))])", "_shape": null, "dtype": null, "_np_random": null}, "action_space": {":type:": "<class 'gym.spaces.box.Box'>", ":serialized:": "gAWVbQEAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLA4WUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWDAAAAAAAAAAAAIC/AACAvwAAgL+UaApLA4WUjAFDlHSUUpSMBGhpZ2iUaBIolgwAAAAAAAAAAACAPwAAgD8AAIA/lGgKSwOFlGgVdJRSlIwNYm91bmRlZF9iZWxvd5RoEiiWAwAAAAAAAAABAQGUaAeMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLA4WUaBV0lFKUjA1ib3VuZGVkX2Fib3ZllGgSKJYDAAAAAAAAAAEBAZRoIUsDhZRoFXSUUpSMCl9ucF9yYW5kb22UTnViLg==", "dtype": "float32", "_shape": [3], "low": "[-1. -1. -1.]", "high": "[1. 1. 1.]", "bounded_below": "[ True True True]", "bounded_above": "[ True True True]", "_np_random": null}, "n_envs": 4, "num_timesteps": 1000000, "_total_timesteps": 1000000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1680286311978665348, "learning_rate": 0.0007, "tensorboard_log": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVwwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOS9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS4JDAgABlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOS9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoFmgNjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoF4wHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/RvAGjbi6x4WUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="}, "_last_obs": {":type:": "<class 'collections.OrderedDict'>", ":serialized:": "gAWVuwEAAAAAAACMC2NvbGxlY3Rpb25zlIwLT3JkZXJlZERpY3SUk5QpUpQojA1hY2hpZXZlZF9nb2FslIwSbnVtcHkuY29yZS5udW1lcmljlIwLX2Zyb21idWZmZXKUk5QoljAAAAAAAAAAYB7SPr7Vt7jJAhM/YB7SPr7Vt7jJAhM/YB7SPr7Vt7jJAhM/YB7SPr7Vt7jJAhM/lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksESwOGlIwBQ5R0lFKUjAxkZXNpcmVkX2dvYWyUaAcoljAAAAAAAAAAl3vYP+62fb/6hX+/ET+QP2RhxD8ybKm/A9wlPrCltb8zyks/xESqv10bNT+x1zu/lGgOSwRLA4aUaBJ0lFKUjAtvYnNlcnZhdGlvbpRoByiWYAAAAAAAAABgHtI+vtW3uMkCEz9uzrM7xau2uklQm7pgHtI+vtW3uMkCEz9uzrM7xau2uklQm7pgHtI+vtW3uMkCEz9uzrM7xau2uklQm7pgHtI+vtW3uMkCEz9uzrM7xau2uklQm7qUaA5LBEsGhpRoEnSUUpR1Lg==", "achieved_goal": "[[ 4.1038799e-01 -8.7659326e-05 5.7426125e-01]\n [ 4.1038799e-01 -8.7659326e-05 5.7426125e-01]\n [ 4.1038799e-01 -8.7659326e-05 5.7426125e-01]\n [ 4.1038799e-01 -8.7659326e-05 5.7426125e-01]]", "desired_goal": "[[ 1.6912717 -0.99107254 -0.99813807]\n [ 1.1269246 1.5342221 -1.3236144 ]\n [ 0.16197209 -1.4191189 0.79605407]\n [-1.3302236 0.7074488 -0.73375994]]", "observation": "[[ 4.1038799e-01 -8.7659326e-05 5.7426125e-01 5.4872548e-03\n -1.3936689e-03 -1.1849488e-03]\n [ 4.1038799e-01 -8.7659326e-05 5.7426125e-01 5.4872548e-03\n -1.3936689e-03 -1.1849488e-03]\n [ 4.1038799e-01 -8.7659326e-05 5.7426125e-01 5.4872548e-03\n -1.3936689e-03 -1.1849488e-03]\n [ 4.1038799e-01 -8.7659326e-05 5.7426125e-01 5.4872548e-03\n -1.3936689e-03 -1.1849488e-03]]"}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYEAAAAAAAAAAEBAQGUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSwSFlIwBQ5R0lFKULg=="}, "_last_original_obs": {":type:": "<class 'collections.OrderedDict'>", ":serialized:": "gAWVuwEAAAAAAACMC2NvbGxlY3Rpb25zlIwLT3JkZXJlZERpY3SUk5QpUpQojA1hY2hpZXZlZF9nb2FslIwSbnVtcHkuY29yZS5udW1lcmljlIwLX2Zyb21idWZmZXKUk5QoljAAAAAAAAAA6nIdPRlsGqxDI0o+6nIdPRlsGqxDI0o+6nIdPRlsGqxDI0o+6nIdPRlsGqxDI0o+lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksESwOGlIwBQ5R0lFKUjAxkZXNpcmVkX2dvYWyUaAcoljAAAAAAAAAAEsYFPRRksj2tMS4+CdEVvZBAKj1UBPQ9cO11vVQPh7zQRKw9xpr2ve04RD03kQI+lGgOSwRLA4aUaBJ0lFKUjAtvYnNlcnZhdGlvbpRoByiWYAAAAAAAAADqch09GWwarEMjSj4AAAAAAAAAgAAAAADqch09GWwarEMjSj4AAAAAAAAAgAAAAADqch09GWwarEMjSj4AAAAAAAAAgAAAAADqch09GWwarEMjSj4AAAAAAAAAgAAAAACUaA5LBEsGhpRoEnSUUpR1Lg==", "achieved_goal": "[[ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]]", "desired_goal": "[[ 0.0326596 0.08710495 0.17011137]\n [-0.0365763 0.04156548 0.11914888]\n [-0.06004089 -0.0164868 0.08411562]\n [-0.12041239 0.04790585 0.12750708]]", "observation": "[[ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]]"}, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": 0.0, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVHRAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIWtWSjnIQBsCUhpRSlIwBbJRLMowBdJRHQKcsd2fTTfB1fZQoaAZoCWgPQwgvwakPJO8AwJSGlFKUaBVLMmgWR0CnLCWq94/vdX2UKGgGaAloD0MIQrEVNC2RAsCUhpRSlGgVSzJoFkdApyvTTH80lHV9lChoBmgJaA9DCNyhYTHqWvy/lIaUUpRoFUsyaBZHQKcrdy4nWrh1fZQoaAZoCWgPQwhh+l5DcFwDwJSGlFKUaBVLMmgWR0CnLWxIjGDMdX2UKGgGaAloD0MIlBPtKqRsFsCUhpRSlGgVSzJoFkdApy0aGetjkXV9lChoBmgJaA9DCJEotKz75wPAlIaUUpRoFUsyaBZHQKcsx6WPcSJ1fZQoaAZoCWgPQwgYesToucX8v5SGlFKUaBVLMmgWR0CnLGuv2Xb/dX2UKGgGaAloD0MIqRWm7zUkBcCUhpRSlGgVSzJoFkdApy5lfE4vOHV9lChoBmgJaA9DCIGv6NZrev+/lIaUUpRoFUsyaBZHQKcuE1vVEux1fZQoaAZoCWgPQwi9/48TJqwLwJSGlFKUaBVLMmgWR0CnLcDSgGr0dX2UKGgGaAloD0MIcET3rGtEFsCUhpRSlGgVSzJoFkdApy1kr3CbdHV9lChoBmgJaA9DCMsRMpBndwHAlIaUUpRoFUsyaBZHQKcvVerMkhR1fZQoaAZoCWgPQwjYZfhPNzADwJSGlFKUaBVLMmgWR0CnLwPEjxCqdX2UKGgGaAloD0MIxsGlY86TBsCUhpRSlGgVSzJoFkdApy6xYcNpd3V9lChoBmgJaA9DCB5U4jrGVQfAlIaUUpRoFUsyaBZHQKcuVUxVQyh1fZQoaAZoCWgPQwinP/uRItIFwJSGlFKUaBVLMmgWR0CnMEeS0Sh8dX2UKGgGaAloD0MIZF3cRgOYAMCUhpRSlGgVSzJoFkdApy/1Y6nzhHV9lChoBmgJaA9DCATmIVM+ZAbAlIaUUpRoFUsyaBZHQKcvowD/2kB1fZQoaAZoCWgPQwhegehJmWQQwJSGlFKUaBVLMmgWR0CnL0cNH6MzdX2UKGgGaAloD0MIo5BkVu+QC8CUhpRSlGgVSzJoFkdApzFwP5HmR3V9lChoBmgJaA9DCEgYBiy5ygHAlIaUUpRoFUsyaBZHQKcxHq9Gqgh1fZQoaAZoCWgPQwjs3LQZp6H+v5SGlFKUaBVLMmgWR0CnMMz4+KTCdX2UKGgGaAloD0MIfjUHCOZoD8CUhpRSlGgVSzJoFkdApzBxWHUMHHV9lChoBmgJaA9DCK6f/rPmhwrAlIaUUpRoFUsyaBZHQKcy6aMrEtN1fZQoaAZoCWgPQwjDDI0ngngLwJSGlFKUaBVLMmgWR0CnMpf3N9pidX2UKGgGaAloD0MILoz0ona//7+UhpRSlGgVSzJoFkdApzJGQlruY3V9lChoBmgJaA9DCJmghm9h/QjAlIaUUpRoFUsyaBZHQKcx6ogmqo91fZQoaAZoCWgPQwhKC5dV2Ez4v5SGlFKUaBVLMmgWR0CnNHA6dUbUdX2UKGgGaAloD0MIl631RUJbA8CUhpRSlGgVSzJoFkdApzQeotL+P3V9lChoBmgJaA9DCPeRW5NuSwPAlIaUUpRoFUsyaBZHQKczzRYRuj11fZQoaAZoCWgPQwj2RNeFH4wRwJSGlFKUaBVLMmgWR0CnM3HHvMKUdX2UKGgGaAloD0MIOe//44SJA8CUhpRSlGgVSzJoFkdApzYFymygPHV9lChoBmgJaA9DCFe0Oc5tggLAlIaUUpRoFUsyaBZHQKc1tMEidJ91fZQoaAZoCWgPQwg1ecpqun4EwJSGlFKUaBVLMmgWR0CnNWMWfseGdX2UKGgGaAloD0MIC9KMRdOZ+r+UhpRSlGgVSzJoFkdApzUH2dupCXV9lChoBmgJaA9DCCNNvAM8KQnAlIaUUpRoFUsyaBZHQKc3ruMuOCJ1fZQoaAZoCWgPQwjxhF5/Et//v5SGlFKUaBVLMmgWR0CnN1101ZTydX2UKGgGaAloD0MIgSGrWz0nBcCUhpRSlGgVSzJoFkdApzcLYAbQ1XV9lChoBmgJaA9DCJ9x4UBINg3AlIaUUpRoFUsyaBZHQKc2sAoXsPd1fZQoaAZoCWgPQwgTYFj+fFsHwJSGlFKUaBVLMmgWR0CnOUcuBczJdX2UKGgGaAloD0MIBwlRvqDlAsCUhpRSlGgVSzJoFkdApzj2JrLyMHV9lChoBmgJaA9DCONw5ldzYAnAlIaUUpRoFUsyaBZHQKc4pLEDQqt1fZQoaAZoCWgPQwhkc9U8R8QCwJSGlFKUaBVLMmgWR0CnOEmdI5HVdX2UKGgGaAloD0MIzvxqDhAMAMCUhpRSlGgVSzJoFkdApzrLwvxpc3V9lChoBmgJaA9DCBheSfJcvxPAlIaUUpRoFUsyaBZHQKc6eiOearp1fZQoaAZoCWgPQwhrDaX2Itr9v5SGlFKUaBVLMmgWR0CnOihXr+o+dX2UKGgGaAloD0MI9x4uOe4U+L+UhpRSlGgVSzJoFkdApznMEPlMiHV9lChoBmgJaA9DCPwcHy3O2APAlIaUUpRoFUsyaBZHQKc7w4e9zwN1fZQoaAZoCWgPQwiWlSaloHsKwJSGlFKUaBVLMmgWR0CnO3G4qgAZdX2UKGgGaAloD0MIcv4mFCJgCsCUhpRSlGgVSzJoFkdApzsflp48l3V9lChoBmgJaA9DCNRDNLqDmPe/lIaUUpRoFUsyaBZHQKc6w3Ov+wV1fZQoaAZoCWgPQwgpsWt7u+UCwJSGlFKUaBVLMmgWR0CnPMGTLW7OdX2UKGgGaAloD0MIwHlx4qv9BsCUhpRSlGgVSzJoFkdApzxvY4ACGXV9lChoBmgJaA9DCF8lH7sL1A3AlIaUUpRoFUsyaBZHQKc8Ha0QbuN1fZQoaAZoCWgPQwhGXtbEAp/7v5SGlFKUaBVLMmgWR0CnO8Gp++dtdX2UKGgGaAloD0MIveMUHckFD8CUhpRSlGgVSzJoFkdApz24X668QXV9lChoBmgJaA9DCHgLJCh+LAfAlIaUUpRoFUsyaBZHQKc9Zhhpg1F1fZQoaAZoCWgPQwh8gO7LmQ0CwJSGlFKUaBVLMmgWR0CnPROE/SpjdX2UKGgGaAloD0MIcQFolC6dBsCUhpRSlGgVSzJoFkdApzy3dCVrynV9lChoBmgJaA9DCAyR09fztQ7AlIaUUpRoFUsyaBZHQKc+r9iMHbB1fZQoaAZoCWgPQwh/vFetTJgBwJSGlFKUaBVLMmgWR0CnPl24EwFldX2UKGgGaAloD0MINUbrqGoC/b+UhpRSlGgVSzJoFkdApz4LhzeXRnV9lChoBmgJaA9DCNV5VPzf0f6/lIaUUpRoFUsyaBZHQKc9r2xIJ7d1fZQoaAZoCWgPQwjzjlN0JFcFwJSGlFKUaBVLMmgWR0CnP5Z13dKvdX2UKGgGaAloD0MI+u3rwDkjC8CUhpRSlGgVSzJoFkdApz9EMqjJuHV9lChoBmgJaA9DCJS+EHLeHw7AlIaUUpRoFUsyaBZHQKc+8bcXWOJ1fZQoaAZoCWgPQwjGpL+XwgMKwJSGlFKUaBVLMmgWR0CnPpVstTUBdX2UKGgGaAloD0MIlbpkHCN5CsCUhpRSlGgVSzJoFkdAp0CF+XqqwXV9lChoBmgJaA9DCK+Xpghwuvy/lIaUUpRoFUsyaBZHQKdAM+/QBxR1fZQoaAZoCWgPQwiRD3o2q+4TwJSGlFKUaBVLMmgWR0CnP+Gf5DZ2dX2UKGgGaAloD0MIQdR9AFKrEcCUhpRSlGgVSzJoFkdApz+Fgnc+JXV9lChoBmgJaA9DCEyqtpvgm/q/lIaUUpRoFUsyaBZHQKdBbBTGYKJ1fZQoaAZoCWgPQwh6qkNuhosSwJSGlFKUaBVLMmgWR0CnQRnrIHTrdX2UKGgGaAloD0MIEXNJ1XbzBMCUhpRSlGgVSzJoFkdAp0DHW8RL9XV9lChoBmgJaA9DCFExzt+Egg7AlIaUUpRoFUsyaBZHQKdAaxHG0eF1fZQoaAZoCWgPQwi6TbhX5g0CwJSGlFKUaBVLMmgWR0CnQmLh73PBdX2UKGgGaAloD0MI5xcl6C9UDsCUhpRSlGgVSzJoFkdAp0IQnSfDk3V9lChoBmgJaA9DCLLV5ZSAWP2/lIaUUpRoFUsyaBZHQKdBvlZowmF1fZQoaAZoCWgPQwhcVIuIYlIGwJSGlFKUaBVLMmgWR0CnQWIfbKzSdX2UKGgGaAloD0MI2JyDZ0LT+b+UhpRSlGgVSzJoFkdAp0NSJ9AoonV9lChoBmgJaA9DCIDVkSOdoQfAlIaUUpRoFUsyaBZHQKdDAAG0NSZ1fZQoaAZoCWgPQwgRGsHG9a/4v5SGlFKUaBVLMmgWR0CnQq1kUbkwdX2UKGgGaAloD0MI4UIewY0UBMCUhpRSlGgVSzJoFkdAp0JRUPxx1nV9lChoBmgJaA9DCFLvqZz2dADAlIaUUpRoFUsyaBZHQKdERsXSBsh1fZQoaAZoCWgPQwi9OVyrPRwRwJSGlFKUaBVLMmgWR0CnQ/Sn+AEudX2UKGgGaAloD0MIkiQIV0BhEcCUhpRSlGgVSzJoFkdAp0OiLwWnCXV9lChoBmgJaA9DCAKAY8+eCwvAlIaUUpRoFUsyaBZHQKdDReiSJTF1fZQoaAZoCWgPQwjzVIfcDHf2v5SGlFKUaBVLMmgWR0CnRTHKwIMSdX2UKGgGaAloD0MIy2d5HtwdD8CUhpRSlGgVSzJoFkdAp0Tf1OCXhXV9lChoBmgJaA9DCNhGPNnNjPS/lIaUUpRoFUsyaBZHQKdEjXYlIEt1fZQoaAZoCWgPQwiO6J51jZbzv5SGlFKUaBVLMmgWR0CnRDEwN9YwdX2UKGgGaAloD0MITHFV2XflAcCUhpRSlGgVSzJoFkdAp0Ye49X9znV9lChoBmgJaA9DCNC2mnXGdwLAlIaUUpRoFUsyaBZHQKdFzRBNVR11fZQoaAZoCWgPQwhdaoR+pt71v5SGlFKUaBVLMmgWR0CnRXqIznA7dX2UKGgGaAloD0MI2Xkbmx3pAMCUhpRSlGgVSzJoFkdAp0Ue606YFHV9lChoBmgJaA9DCIWZtn9lZQjAlIaUUpRoFUsyaBZHQKdHCBVdX1d1fZQoaAZoCWgPQwiJRQw7jOkBwJSGlFKUaBVLMmgWR0CnRrXRG+bmdX2UKGgGaAloD0MIBFYOLbLdEcCUhpRSlGgVSzJoFkdAp0ZjTz/ZNHV9lChoBmgJaA9DCOSG3023DBDAlIaUUpRoFUsyaBZHQKdGBvxYq5N1ZS4="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 50000, "n_steps": 5, "gamma": 0.99, "gae_lambda": 1.0, "ent_coef": 0.0, "vf_coef": 0.5, "max_grad_norm": 0.5, "normalize_advantage": false, "system_info": {"OS": "Linux-5.10.147+-x86_64-with-glibc2.31 # 1 SMP Sat Dec 10 16:00:40 UTC 2022", "Python": "3.9.16", "Stable-Baselines3": "1.7.0", "PyTorch": "1.13.1+cu116", "GPU Enabled": "True", "Numpy": "1.22.4", "Gym": "0.21.0"}}
 
1
+ {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVRQAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMG011bHRpSW5wdXRBY3RvckNyaXRpY1BvbGljeZSTlC4=", "__module__": "stable_baselines3.common.policies", "__doc__": "\n MultiInputActorClass policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space (Tuple)\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Uses the CombinedExtractor\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function MultiInputActorCriticPolicy.__init__ at 0x7f8249c790d0>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7f8249c77340>"}, "verbose": 1, "policy_kwargs": {":type:": "<class 'dict'>", ":serialized:": "gAWVgQAAAAAAAAB9lCiMD29wdGltaXplcl9jbGFzc5SME3RvcmNoLm9wdGltLnJtc3Byb3CUjAdSTVNwcm9wlJOUjBBvcHRpbWl6ZXJfa3dhcmdzlH2UKIwFYWxwaGGURz/vrhR64UeujANlcHOURz7k+LWI42jxjAx3ZWlnaHRfZGVjYXmUSwB1dS4=", "optimizer_class": "<class 'torch.optim.rmsprop.RMSprop'>", "optimizer_kwargs": {"alpha": 0.99, "eps": 1e-05, "weight_decay": 0}}, "observation_space": {":type:": "<class 'gym.spaces.dict.Dict'>", ":serialized:": "gAWVUgMAAAAAAACMD2d5bS5zcGFjZXMuZGljdJSMBERpY3SUk5QpgZR9lCiMBnNwYWNlc5SMC2NvbGxlY3Rpb25zlIwLT3JkZXJlZERpY3SUk5QpUpQojA1hY2hpZXZlZF9nb2FslIwOZ3ltLnNwYWNlcy5ib3iUjANCb3iUk5QpgZR9lCiMBWR0eXBllIwFbnVtcHmUaBCTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYowGX3NoYXBllEsDhZSMA2xvd5SMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYMAAAAAAAAAAAAIMEAACDBAAAgwZRoFUsDhZSMAUOUdJRSlIwEaGlnaJRoHSiWDAAAAAAAAAAAACBBAAAgQQAAIEGUaBVLA4WUaCB0lFKUjA1ib3VuZGVkX2JlbG93lGgdKJYDAAAAAAAAAAEBAZRoEowCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksDhZRoIHSUUpSMDWJvdW5kZWRfYWJvdmWUaB0olgMAAAAAAAAAAQEBlGgsSwOFlGggdJRSlIwKX25wX3JhbmRvbZROdWKMDGRlc2lyZWRfZ29hbJRoDSmBlH2UKGgQaBVoGEsDhZRoGmgdKJYMAAAAAAAAAAAAIMEAACDBAAAgwZRoFUsDhZRoIHSUUpRoI2gdKJYMAAAAAAAAAAAAIEEAACBBAAAgQZRoFUsDhZRoIHSUUpRoKGgdKJYDAAAAAAAAAAEBAZRoLEsDhZRoIHSUUpRoMmgdKJYDAAAAAAAAAAEBAZRoLEsDhZRoIHSUUpRoN051YowLb2JzZXJ2YXRpb26UaA0pgZR9lChoEGgVaBhLBoWUaBpoHSiWGAAAAAAAAAAAACDBAAAgwQAAIMEAACDBAAAgwQAAIMGUaBVLBoWUaCB0lFKUaCNoHSiWGAAAAAAAAAAAACBBAAAgQQAAIEEAACBBAAAgQQAAIEGUaBVLBoWUaCB0lFKUaChoHSiWBgAAAAAAAAABAQEBAQGUaCxLBoWUaCB0lFKUaDJoHSiWBgAAAAAAAAABAQEBAQGUaCxLBoWUaCB0lFKUaDdOdWJ1aBhOaBBOaDdOdWIu", "spaces": "OrderedDict([('achieved_goal', Box([-10. -10. -10.], [10. 10. 10.], (3,), float32)), ('desired_goal', Box([-10. -10. -10.], [10. 10. 10.], (3,), float32)), ('observation', Box([-10. -10. -10. -10. -10. -10.], [10. 10. 10. 10. 10. 10.], (6,), float32))])", "_shape": null, "dtype": null, "_np_random": null}, "action_space": {":type:": "<class 'gym.spaces.box.Box'>", ":serialized:": "gAWVbQEAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lGgFk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLA4WUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWDAAAAAAAAAAAAIC/AACAvwAAgL+UaApLA4WUjAFDlHSUUpSMBGhpZ2iUaBIolgwAAAAAAAAAAACAPwAAgD8AAIA/lGgKSwOFlGgVdJRSlIwNYm91bmRlZF9iZWxvd5RoEiiWAwAAAAAAAAABAQGUaAeMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLA4WUaBV0lFKUjA1ib3VuZGVkX2Fib3ZllGgSKJYDAAAAAAAAAAEBAZRoIUsDhZRoFXSUUpSMCl9ucF9yYW5kb22UTnViLg==", "dtype": "float32", "_shape": [3], "low": "[-1. -1. -1.]", "high": "[1. 1. 1.]", "bounded_below": "[ True True True]", "bounded_above": "[ True True True]", "_np_random": null}, "n_envs": 4, "num_timesteps": 2000000, "_total_timesteps": 2000000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1680290443097352701, "learning_rate": 0.00025, "tensorboard_log": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVwwIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOS9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS4JDAgABlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMSC91c3IvbG9jYWwvbGliL3B5dGhvbjMuOS9kaXN0LXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoFmgNjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoF4wHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/MGJN0vGp/IWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="}, "_last_obs": {":type:": "<class 'collections.OrderedDict'>", ":serialized:": "gAWVuwEAAAAAAACMC2NvbGxlY3Rpb25zlIwLT3JkZXJlZERpY3SUk5QpUpQojA1hY2hpZXZlZF9nb2FslIwSbnVtcHkuY29yZS5udW1lcmljlIwLX2Zyb21idWZmZXKUk5QoljAAAAAAAAAAtQSaPsU1DrzOjgk/tQSaPsU1DrzOjgk/tQSaPsU1DrzOjgk/tQSaPsU1DrzOjgk/lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksESwOGlIwBQ5R0lFKUjAxkZXNpcmVkX2dvYWyUaAcoljAAAAAAAAAAM9DHP0f1vD8QKqY/0tjUvpCDj79sJj2/2b+hv0aItL/e8ME/sZuJv7PRjj/v+Ea/lGgOSwRLA4aUaBJ0lFKUjAtvYnNlcnZhdGlvbpRoByiWYAAAAAAAAAC1BJo+xTUOvM6OCT/xHqy7SLVIOsotJju1BJo+xTUOvM6OCT/xHqy7SLVIOsotJju1BJo+xTUOvM6OCT/xHqy7SLVIOsotJju1BJo+xTUOvM6OCT/xHqy7SLVIOsotJjuUaA5LBEsGhpRoEnSUUpR1Lg==", "achieved_goal": "[[ 0.30081716 -0.00867981 0.5373353 ]\n [ 0.30081716 -0.00867981 0.5373353 ]\n [ 0.30081716 -0.00867981 0.5373353 ]\n [ 0.30081716 -0.00867981 0.5373353 ]]", "desired_goal": "[[ 1.5610412 1.4762353 1.2981586]\n [-0.4157167 -1.1212025 -0.7388675]\n [-1.2636672 -1.4104087 1.5151632]\n [-1.0750638 1.1157745 -0.7772359]]", "observation": "[[ 0.30081716 -0.00867981 0.5373353 -0.00525271 0.00076564 0.00253569]\n [ 0.30081716 -0.00867981 0.5373353 -0.00525271 0.00076564 0.00253569]\n [ 0.30081716 -0.00867981 0.5373353 -0.00525271 0.00076564 0.00253569]\n [ 0.30081716 -0.00867981 0.5373353 -0.00525271 0.00076564 0.00253569]]"}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYEAAAAAAAAAAEBAQGUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSwSFlIwBQ5R0lFKULg=="}, "_last_original_obs": {":type:": "<class 'collections.OrderedDict'>", ":serialized:": "gAWVuwEAAAAAAACMC2NvbGxlY3Rpb25zlIwLT3JkZXJlZERpY3SUk5QpUpQojA1hY2hpZXZlZF9nb2FslIwSbnVtcHkuY29yZS5udW1lcmljlIwLX2Zyb21idWZmZXKUk5QoljAAAAAAAAAA6nIdPRlsGqxDI0o+6nIdPRlsGqxDI0o+6nIdPRlsGqxDI0o+6nIdPRlsGqxDI0o+lIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksESwOGlIwBQ5R0lFKUjAxkZXNpcmVkX2dvYWyUaAcoljAAAAAAAAAAkqUYvgeUDL5WqHU+9uyAPOp/lL1wMx09iejCvbVyzT3JFXI+XiyGvX1Htb3Ka8Q9lGgOSwRLA4aUaBJ0lFKUjAtvYnNlcnZhdGlvbpRoByiWYAAAAAAAAADqch09GWwarEMjSj4AAAAAAAAAgAAAAADqch09GWwarEMjSj4AAAAAAAAAgAAAAADqch09GWwarEMjSj4AAAAAAAAAgAAAAADqch09GWwarEMjSj4AAAAAAAAAgAAAAACUaA5LBEsGhpRoEnSUUpR1Lg==", "achieved_goal": "[[ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01]]", "desired_goal": "[[-0.1490691 -0.13728343 0.23989996]\n [ 0.01573799 -0.0725096 0.03837913]\n [-0.09517009 0.10031644 0.23641123]\n [-0.06551431 -0.08851526 0.09590872]]", "observation": "[[ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]\n [ 3.8439669e-02 -2.1944723e-12 1.9740014e-01 0.0000000e+00\n -0.0000000e+00 0.0000000e+00]]"}, "_episode_num": 0, "use_sde": true, "sde_sample_freq": -1, "_current_progress_remaining": 0.0, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVHRAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIhQoOL4iI+r+UhpRSlIwBbJRLMowBdJRHQLP0eTEBKcx1fZQoaAZoCWgPQwj4b16c+Kr6v5SGlFKUaBVLMmgWR0Cz9FkQbuMNdX2UKGgGaAloD0MIsmMjEK+r/7+UhpRSlGgVSzJoFkdAs/Q5eyAxz3V9lChoBmgJaA9DCC5U/rW8cvq/lIaUUpRoFUsyaBZHQLP0GO7QLNR1fZQoaAZoCWgPQwiojlVKz7T7v5SGlFKUaBVLMmgWR0Cz9PBPfsNUdX2UKGgGaAloD0MI+igjLgDN+b+UhpRSlGgVSzJoFkdAs/TQLDye7XV9lChoBmgJaA9DCMAHr13aMPy/lIaUUpRoFUsyaBZHQLP0sJuEVWV1fZQoaAZoCWgPQwin5nKDoQ76v5SGlFKUaBVLMmgWR0Cz9JAnMMZxdX2UKGgGaAloD0MI34eDhCgf/7+UhpRSlGgVSzJoFkdAs/Ve8BdUsHV9lChoBmgJaA9DCIapLXWQl/y/lIaUUpRoFUsyaBZHQLP1Ps6q8151fZQoaAZoCWgPQwh56SYxCKz6v5SGlFKUaBVLMmgWR0Cz9R9A5aNddX2UKGgGaAloD0MI7DNnfcpx+L+UhpRSlGgVSzJoFkdAs/T+uGKyfXV9lChoBmgJaA9DCFoqb0c4Lfa/lIaUUpRoFUsyaBZHQLP10L4vexh1fZQoaAZoCWgPQwi4VnvYC0X8v5SGlFKUaBVLMmgWR0Cz9bCSzPa+dX2UKGgGaAloD0MIg8DKoUX2+7+UhpRSlGgVSzJoFkdAs/WQ+UyHmHV9lChoBmgJaA9DCOuoaoKoe/y/lIaUUpRoFUsyaBZHQLP1cGxD9fl1fZQoaAZoCWgPQwiFsBpLWNv8v5SGlFKUaBVLMmgWR0Cz9j+mR/3GdX2UKGgGaAloD0MIkQpjC0HO+b+UhpRSlGgVSzJoFkdAs/Yff3vhInV9lChoBmgJaA9DCDIDlfHvs/i/lIaUUpRoFUsyaBZHQLP1/+XJHRV1fZQoaAZoCWgPQwg8EcR5OIH/v5SGlFKUaBVLMmgWR0Cz9d9cjZ+QdX2UKGgGaAloD0MIGTigpStY/L+UhpRSlGgVSzJoFkdAs/a1i6QNkXV9lChoBmgJaA9DCJNuS+SCs/i/lIaUUpRoFUsyaBZHQLP2lWtEG7l1fZQoaAZoCWgPQwgE54wo7U39v5SGlFKUaBVLMmgWR0Cz9nXb/Ot5dX2UKGgGaAloD0MI/OO9amVC+r+UhpRSlGgVSzJoFkdAs/ZVbJOnEXV9lChoBmgJaA9DCJtyhXe5yPu/lIaUUpRoFUsyaBZHQLP3I9SuQp51fZQoaAZoCWgPQwjy6bEtAw74v5SGlFKUaBVLMmgWR0Cz9wO/UONHdX2UKGgGaAloD0MIKIHNOXgm+r+UhpRSlGgVSzJoFkdAs/bkJC0F83V9lChoBmgJaA9DCEBs6dFUD/u/lIaUUpRoFUsyaBZHQLP2w7gsK9h1fZQoaAZoCWgPQwird7gdGpb5v5SGlFKUaBVLMmgWR0Cz98wxesxPdX2UKGgGaAloD0MI+BisONWa/r+UhpRSlGgVSzJoFkdAs/esSPEKmnV9lChoBmgJaA9DCIfe4uE9R/u/lIaUUpRoFUsyaBZHQLP3jO/tY0V1fZQoaAZoCWgPQwhdFajF4CEAwJSGlFKUaBVLMmgWR0Cz92ytzS1FdX2UKGgGaAloD0MIkZkLXB7r+7+UhpRSlGgVSzJoFkdAs/h2tW+49XV9lChoBmgJaA9DCDGale1D3vu/lIaUUpRoFUsyaBZHQLP4VuiN83N1fZQoaAZoCWgPQwiBzTl4JjT4v5SGlFKUaBVLMmgWR0Cz+DeuieundX2UKGgGaAloD0MI641aYfpe+L+UhpRSlGgVSzJoFkdAs/gXfk3juXV9lChoBmgJaA9DCJSilXuBGfm/lIaUUpRoFUsyaBZHQLP5JzYEnst1fZQoaAZoCWgPQwj9E1ysqEH8v5SGlFKUaBVLMmgWR0Cz+QdbgTAWdX2UKGgGaAloD0MIuwuUFFiA+r+UhpRSlGgVSzJoFkdAs/joPbwjMXV9lChoBmgJaA9DCKRTVz7LEwDAlIaUUpRoFUsyaBZHQLP4yABkqc51fZQoaAZoCWgPQwiDMLd7uU/5v5SGlFKUaBVLMmgWR0Cz+dY1xbSrdX2UKGgGaAloD0MIi/87okI1/L+UhpRSlGgVSzJoFkdAs/m2ZYxL03V9lChoBmgJaA9DCE2CN6RRgQDAlIaUUpRoFUsyaBZHQLP5lyLQ5WB1fZQoaAZoCWgPQwjMm8O12sP6v5SGlFKUaBVLMmgWR0Cz+Xb3PAwgdX2UKGgGaAloD0MIJeoFn+Yk+b+UhpRSlGgVSzJoFkdAs/qRs1sLv3V9lChoBmgJaA9DCH7GhQMhmfe/lIaUUpRoFUsyaBZHQLP6cd7OVxF1fZQoaAZoCWgPQwhhcM0d/W/2v5SGlFKUaBVLMmgWR0Cz+lKg/TsqdX2UKGgGaAloD0MIsoAJ3Lob9r+UhpRSlGgVSzJoFkdAs/oyXVsk6nV9lChoBmgJaA9DCI2chT3tcPa/lIaUUpRoFUsyaBZHQLP7RRGc4HZ1fZQoaAZoCWgPQwiRgTy7fGv6v5SGlFKUaBVLMmgWR0Cz+yU12q1gdX2UKGgGaAloD0MI3QiLijid+r+UhpRSlGgVSzJoFkdAs/sF/tpmE3V9lChoBmgJaA9DCBjrG5jcqPm/lIaUUpRoFUsyaBZHQLP65dGy5Zt1fZQoaAZoCWgPQwj1vvG1Z9b+v5SGlFKUaBVLMmgWR0Cz+/57w8W9dX2UKGgGaAloD0MIv5gtWRXh+7+UhpRSlGgVSzJoFkdAs/veqDK5kXV9lChoBmgJaA9DCOLplbIM8fi/lIaUUpRoFUsyaBZHQLP7v4axX4l1fZQoaAZoCWgPQwg826M33Ef4v5SGlFKUaBVLMmgWR0Cz+59Mj/uLdX2UKGgGaAloD0MI/OHnvwev9b+UhpRSlGgVSzJoFkdAs/yYyGi5/nV9lChoBmgJaA9DCO8DkNrEyfi/lIaUUpRoFUsyaBZHQLP8eKHwgDB1fZQoaAZoCWgPQwiLNzKP/IH8v5SGlFKUaBVLMmgWR0Cz/FkgjhUBdX2UKGgGaAloD0MIIHpSJjV097+UhpRSlGgVSzJoFkdAs/w4oLG7z3V9lChoBmgJaA9DCLB2FOeo4/y/lIaUUpRoFUsyaBZHQLP9B5E+gUV1fZQoaAZoCWgPQwj2J/G5E2z3v5SGlFKUaBVLMmgWR0Cz/OdthuwYdX2UKGgGaAloD0MIscOY9PdS+b+UhpRSlGgVSzJoFkdAs/zH0XgtOHV9lChoBmgJaA9DCLqgvmVO1/y/lIaUUpRoFUsyaBZHQLP8p1QqI8B1fZQoaAZoCWgPQwiY+Q5+4sD3v5SGlFKUaBVLMmgWR0Cz/XcZUDMedX2UKGgGaAloD0MIwjBgyVUs97+UhpRSlGgVSzJoFkdAs/1W7Xg9/3V9lChoBmgJaA9DCLTnMjUJ3v2/lIaUUpRoFUsyaBZHQLP9N04iosJ1fZQoaAZoCWgPQwifr1kuGx38v5SGlFKUaBVLMmgWR0Cz/RbLyMDPdX2UKGgGaAloD0MIoYUEjC4PAMCUhpRSlGgVSzJoFkdAs/3nTNMXanV9lChoBmgJaA9DCAaE1sOXSfa/lIaUUpRoFUsyaBZHQLP9xzNliBp1fZQoaAZoCWgPQwjtLHqnAq76v5SGlFKUaBVLMmgWR0Cz/aeSbH6udX2UKGgGaAloD0MIN+LJbmY0+7+UhpRSlGgVSzJoFkdAs/2HAdn003V9lChoBmgJaA9DCNbm/1VHzvi/lIaUUpRoFUsyaBZHQLP+WT/Q0Gh1fZQoaAZoCWgPQwh9dytLdFb5v5SGlFKUaBVLMmgWR0Cz/jkmhM8HdX2UKGgGaAloD0MI7lpCPuhZ+b+UhpRSlGgVSzJoFkdAs/4ZhgE2YXV9lChoBmgJaA9DCERtG0ZBcPm/lIaUUpRoFUsyaBZHQLP9+QDV6NV1fZQoaAZoCWgPQwhlj1AzpMr7v5SGlFKUaBVLMmgWR0Cz/saT4cm0dX2UKGgGaAloD0MIwjI2dLP/9r+UhpRSlGgVSzJoFkdAs/6miO/+KnV9lChoBmgJaA9DCLdj6q7sAve/lIaUUpRoFUsyaBZHQLP+hyZKFqV1fZQoaAZoCWgPQwg0u+6tSMz2v5SGlFKUaBVLMmgWR0Cz/mah6By0dX2UKGgGaAloD0MIzuFa7WGv/b+UhpRSlGgVSzJoFkdAs/88BuGbkXV9lChoBmgJaA9DCMQI4dHG0fi/lIaUUpRoFUsyaBZHQLP/G+d9Ujt1fZQoaAZoCWgPQwhRMjm1M8z2v5SGlFKUaBVLMmgWR0Cz/vxJ7LMcdX2UKGgGaAloD0MIKT+p9um4/b+UhpRSlGgVSzJoFkdAs/7bwPRRdnV9lChoBmgJaA9DCIRkARO4dfi/lIaUUpRoFUsyaBZHQLP/p3VTaTR1fZQoaAZoCWgPQwj+mqxRD9H8v5SGlFKUaBVLMmgWR0Cz/4dVBD5TdX2UKGgGaAloD0MItCH/zCA++r+UhpRSlGgVSzJoFkdAs/9nvWpZOnV9lChoBmgJaA9DCBVXlX1XRPu/lIaUUpRoFUsyaBZHQLP/R2CuloF1fZQoaAZoCWgPQwivQspPqr33v5SGlFKUaBVLMmgWR0C0ABiliz9kdX2UKGgGaAloD0MIiXssfehC/b+UhpRSlGgVSzJoFkdAs//4eMhounV9lChoBmgJaA9DCJg1scBX9P2/lIaUUpRoFUsyaBZHQLP/2OJLuhN1fZQoaAZoCWgPQwirX+l8eFb4v5SGlFKUaBVLMmgWR0Cz/7haPjn3dX2UKGgGaAloD0MIm6285H9y/r+UhpRSlGgVSzJoFkdAtACFbeMyanV9lChoBmgJaA9DCAjMQ6Z8iPi/lIaUUpRoFUsyaBZHQLQAZU5uIh11fZQoaAZoCWgPQwgvou2Yuuv6v5SGlFKUaBVLMmgWR0C0AEW+j/ModX2UKGgGaAloD0MIVyJQ/YNIAMCUhpRSlGgVSzJoFkdAtAAlOtW+5HV9lChoBmgJaA9DCNNmnIaoQvm/lIaUUpRoFUsyaBZHQLQA9vrGBFx1fZQoaAZoCWgPQwiYUMHhBZH+v5SGlFKUaBVLMmgWR0C0ANbfpD/mdX2UKGgGaAloD0MIETRmEvXC97+UhpRSlGgVSzJoFkdAtAC3TnaFmHV9lChoBmgJaA9DCO5cGOlF7fy/lIaUUpRoFUsyaBZHQLQAltHhCMR1ZS4="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 50000, "n_steps": 10, "gamma": 0.99, "gae_lambda": 0.9, "ent_coef": 0.0, "vf_coef": 0.4, "max_grad_norm": 0.5, "normalize_advantage": false, "system_info": {"OS": "Linux-5.10.147+-x86_64-with-glibc2.31 # 1 SMP Sat Dec 10 16:00:40 UTC 2022", "Python": "3.9.16", "Stable-Baselines3": "1.7.0", "PyTorch": "1.13.1+cu116", "GPU Enabled": "True", "Numpy": "1.22.4", "Gym": "0.21.0"}}
replay.mp4 CHANGED
Binary files a/replay.mp4 and b/replay.mp4 differ
 
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": -2.5257808419875802, "std_reward": 0.9416321689202602, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2023-03-31T19:04:46.776355"}
 
1
+ {"mean_reward": -1.766916676098481, "std_reward": 0.2479151268138146, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2023-03-31T20:46:01.724939"}
vec_normalize.pkl CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:adbdc8238009d8a8e3e47a5b6ee0737668a44efdb839fd3450ef98e332c6f091
3
  size 3056
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b3e0f43a55c671d50aa4814a2bcbaa065d9580786fbf9c346b6144d5c0ff1b7e
3
  size 3056