culteejen commited on
Commit
3ba2797
1 Parent(s): 2059226

Upload model to Hugging Face

Browse files
PPO-hardcoded.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:50da7b2bc35086000488ca29981b3f52e453e0634b3a4816f2a1dca680ca33b0
3
- size 142396
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5e5eaeb9b0b013ed736f06dbc73e493b32af6c153fa8cf18ff1ec1b9feac36cd
3
+ size 142364
PPO-hardcoded/data CHANGED
@@ -4,20 +4,20 @@
4
  ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
5
  "__module__": "stable_baselines3.common.policies",
6
  "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
7
- "__init__": "<function ActorCriticPolicy.__init__ at 0x7f30071e8ee0>",
8
- "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f30071e8f70>",
9
- "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f30071e9000>",
10
- "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f30071e9090>",
11
- "_build": "<function ActorCriticPolicy._build at 0x7f30071e9120>",
12
- "forward": "<function ActorCriticPolicy.forward at 0x7f30071e91b0>",
13
- "extract_features": "<function ActorCriticPolicy.extract_features at 0x7f30071e9240>",
14
- "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f30071e92d0>",
15
- "_predict": "<function ActorCriticPolicy._predict at 0x7f30071e9360>",
16
- "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f30071e93f0>",
17
- "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f30071e9480>",
18
- "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f30071e9510>",
19
  "__abstractmethods__": "frozenset()",
20
- "_abc_impl": "<_abc._abc_data object at 0x7f30071ec800>"
21
  },
22
  "verbose": true,
23
  "policy_kwargs": {},
@@ -48,7 +48,7 @@
48
  "_num_timesteps_at_start": 0,
49
  "seed": null,
50
  "action_noise": null,
51
- "start_time": 1681189254138184037,
52
  "learning_rate": 0.0003,
53
  "tensorboard_log": null,
54
  "lr_schedule": {
@@ -57,7 +57,7 @@
57
  },
58
  "_last_obs": {
59
  ":type:": "<class 'numpy.ndarray'>",
60
- ":serialized:": "gAWVxQAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJZQAAAAAAAAAJxigUMYAY8//WcWQtLiHkIAAMhCAICCQ5qZmT+a7CRCmuwkQgAAyELren9DboGgP5gE10H/WNRBihgsQvr1gEM3i5s/3o8ZQk/xEkIAAMhClIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksESwWGlIwBQ5R0lFKULg=="
61
  },
62
  "_last_episode_starts": {
63
  ":type:": "<class 'numpy.ndarray'>",
@@ -70,7 +70,7 @@
70
  "_current_progress_remaining": -0.0035199999999999676,
71
  "ep_info_buffer": {
72
  ":type:": "<class 'collections.deque'>",
73
- ":serialized:": "gAWVbxAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMICtejcD0KFMCUhpRSlIwBbJRN9QGMAXSUR0CFOSrwvxpddX2UKGgGaAloD0MICtejcD0KFMCUhpRSlGgVTfUBaBZHQIVKHE/B3zN1fZQoaAZoCWgPQwgK16NwPQoUwJSGlFKUaBVN9QFoFkdAhUuI3rD633V9lChoBmgJaA9DCArXo3A9ChTAlIaUUpRoFU31AWgWR0CFS6xhUipvdX2UKGgGaAloD0MICtejcD0KFMCUhpRSlGgVTfUBaBZHQIVMNNQCSzR1fZQoaAZoCWgPQwgK16NwPQoUwJSGlFKUaBVN9QFoFkdAhY56aCtihHV9lChoBmgJaA9DCHE9CtejiH/AlIaUUpRoFU3HAWgWR0CFjzFYMfA9dX2UKGgGaAloD0MICtejcD0KFMCUhpRSlGgVTfUBaBZHQIWP/Ehq0t11fZQoaAZoCWgPQwgK16NwPQoUwJSGlFKUaBVN9QFoFkdAhZAQTVUdaXV9lChoBmgJaA9DCFK4HoXrVX/AlIaUUpRoFUuKaBZHQIWSkImgJ1J1fZQoaAZoCWgPQwg9CtejcFl/wJSGlFKUaBVLoGgWR0CFlI1CPZIydX2UKGgGaAloD0MIrkfhehRif8CUhpRSlGgVS9ZoFkdAhZYmBFuvU3V9lChoBmgJaA9DCDMzMzMzZ3/AlIaUUpRoFUv2aBZHQIWbOueSSvF1fZQoaAZoCWgPQwiamZmZmX1/wJSGlFKUaBVNggFoFkdAhZvZEDyOJnV9lChoBmgJaA9DCK5H4XoUXn/AlIaUUpRoFUu9aBZHQIWhm4I8hcJ1fZQoaAZoCWgPQwgfhetRuIZ/wJSGlFKUaBVNuwFoFkdAhaTIbfgrH3V9lChoBmgJaA9DCArXo3A9ChTAlIaUUpRoFU31AWgWR0CFpNLLZBcBdX2UKGgGaAloD0MIMzMzMzNTf8CUhpRSlGgVS3loFkdAhaoDQZ4wAXV9lChoBmgJaA9DCArXo3A9ChTAlIaUUpRoFU31AWgWR0CFrDtPYWcjdX2UKGgGaAloD0MI4XoUrkdhf8CUhpRSlGgVS9FoFkdAhbNsXaakRHV9lChoBmgJaA9DCArXo3A9ChTAlIaUUpRoFU31AWgWR0CFs3vddmg8dX2UKGgGaAloD0MICtejcD0KFMCUhpRSlGgVTfUBaBZHQIW4TcXWOIZ1fZQoaAZoCWgPQwgK16NwPVJ/wJSGlFKUaBVLc2gWR0CFuGc3l0YCdX2UKGgGaAloD0MICtejcD0KFMCUhpRSlGgVTfUBaBZHQIW9os3AEdN1fZQoaAZoCWgPQwhSuB6F611/wJSGlFKUaBVLvGgWR0CFwGn/DLr5dX2UKGgGaAloD0MIXI/C9Shof8CUhpRSlGgVS/xoFkdAhcKNfgJkXnV9lChoBmgJaA9DCAAAAAAAYH/AlIaUUpRoFUvJaBZHQIXF5k3CKrJ1fZQoaAZoCWgPQwgK16NwPQoUwJSGlFKUaBVN9QFoFkdAhcfzyz5XVHV9lChoBmgJaA9DCDMzMzMzZ3/AlIaUUpRoFUv2aBZHQIXJ7iIcinp1fZQoaAZoCWgPQwiamZmZmWl/wJSGlFKUaBVNBQFoFkdAhcyGEPDpDHV9lChoBmgJaA9DCBSuR+F6WH/AlIaUUpRoFUuaaBZHQIXOKPwNLDh1fZQoaAZoCWgPQwi4HoXrUXB/wJSGlFKUaBVNLwFoFkdAhgPITXarWHV9lChoBmgJaA9DCHE9CtejZH/AlIaUUpRoFUvmaBZHQIYE+P7vXsh1fZQoaAZoCWgPQwhcj8L1KGR/wJSGlFKUaBVL42gWR0CGDNNj9XLedX2UKGgGaAloD0MICtejcD0KFMCUhpRSlGgVTfUBaBZHQIYQSQxN7Bx1fZQoaAZoCWgPQwgK16NwPQoUwJSGlFKUaBVN9QFoFkdAhhEIxQBPsXV9lChoBmgJaA9DCArXo3A9ChTAlIaUUpRoFU31AWgWR0CGE2qFRHf/dX2UKGgGaAloD0MIFK5H4Xpsf8CUhpRSlGgVTRcBaBZHQIYZftUn5SF1fZQoaAZoCWgPQwgK16NwPQoUwJSGlFKUaBVN9QFoFkdAhhuYCyQgcXV9lChoBmgJaA9DCDMzMzMza3/AlIaUUpRoFU0PAWgWR0CGG6ZP2wmmdX2UKGgGaAloD0MICtejcD0KFMCUhpRSlGgVTfUBaBZHQIYfPQID5j91fZQoaAZoCWgPQwhxPQrXo0h/wJSGlFKUaBVLN2gWR0CGIQnQY1pCdX2UKGgGaAloD0MICtejcD0KFMCUhpRSlGgVTfUBaBZHQIYq1ObiIcl1fZQoaAZoCWgPQwgK16NwPQoUwJSGlFKUaBVN9QFoFkdAhi1jZUT+N3V9lChoBmgJaA9DCArXo3A9ChTAlIaUUpRoFU31AWgWR0CGLXE61b7kdX2UKGgGaAloD0MICtejcD0KFMCUhpRSlGgVTfUBaBZHQIY06ZBsyi51fZQoaAZoCWgPQwgK16NwPQoUwJSGlFKUaBVN9QFoFkdAhj3O0b961XV9lChoBmgJaA9DCArXo3A9ChTAlIaUUpRoFU31AWgWR0CGQFeBxxT9dX2UKGgGaAloD0MICtejcD0KFMCUhpRSlGgVTfUBaBZHQIZAZRuTA311fZQoaAZoCWgPQwhI4XoUrod/wJSGlFKUaBVNwQFoFkdAhkV0ulGgBnV9lChoBmgJaA9DCAAAAAAAYH/AlIaUUpRoFUvJaBZHQIZFiY9gWrR1fZQoaAZoCWgPQwgfhetRuF5/wJSGlFKUaBVLwWgWR0CGSJllK9PDdX2UKGgGaAloD0MICtejcD0KFMCUhpRSlGgVTfUBaBZHQIaGE34sVcl1fZQoaAZoCWgPQwgK16NwPQoUwJSGlFKUaBVN9QFoFkdAhoqOMdcSoXV9lChoBmgJaA9DCArXo3A9ChTAlIaUUpRoFU31AWgWR0CGirQyhzvJdX2UKGgGaAloD0MICtejcD0KFMCUhpRSlGgVTfUBaBZHQIaNOvdM0xd1fZQoaAZoCWgPQwgK16NwPQoUwJSGlFKUaBVN9QFoFkdAhpiTlcQiA3V9lChoBmgJaA9DCArXo3A9ChTAlIaUUpRoFU31AWgWR0CGnbxG2CumdX2UKGgGaAloD0MICtejcD0KFMCUhpRSlGgVTfUBaBZHQIad0Oqebut1fZQoaAZoCWgPQwgK16NwPQoUwJSGlFKUaBVN9QFoFkdAhqCLYoRZlnV9lChoBmgJaA9DCArXo3A9ChTAlIaUUpRoFU31AWgWR0CGqypd8iOedX2UKGgGaAloD0MICtejcD0KFMCUhpRSlGgVTfUBaBZHQIau4HgP3BZ1fZQoaAZoCWgPQwgK16NwPQoYwJSGlFKUaBVN9QFoFkdAhq71GkN4JXV9lChoBmgJaA9DCArXo3A9ChTAlIaUUpRoFU31AWgWR0CGsXPrOZ9edX2UKGgGaAloD0MICtejcD0KFMCUhpRSlGgVTfUBaBZHQIa7QUN8VpN1fZQoaAZoCWgPQwgK16NwPQoUwJSGlFKUaBVN9QFoFkdAhr9f3evZAnV9lChoBmgJaA9DCArXo3A9ChTAlIaUUpRoFU31AWgWR0CGv3TLns9kdX2UKGgGaAloD0MICtejcD0KFMCUhpRSlGgVTfUBaBZHQIbB6pLmITJ1fZQoaAZoCWgPQwgK16NwPQoUwJSGlFKUaBVN9QFoFkdAhvsqXfIjnnV9lChoBmgJaA9DCArXo3A9ChTAlIaUUpRoFU31AWgWR0CHALIkJKJ3dX2UKGgGaAloD0MICtejcD0KFMCUhpRSlGgVTfUBaBZHQIcAxvWH1vl1fZQoaAZoCWgPQwgK16NwPQoUwJSGlFKUaBVN9QFoFkdAhwLnWz4UOHV9lChoBmgJaA9DCArXo3A9ChTAlIaUUpRoFU31AWgWR0CHD+pBHCoCdX2UKGgGaAloD0MICtejcD0KFMCUhpRSlGgVTfUBaBZHQIcT9u3trsV1fZQoaAZoCWgPQwgK16NwPQoUwJSGlFKUaBVN9QFoFkdAhxQLsjVx0nV9lChoBmgJaA9DCArXo3A9ChjAlIaUUpRoFU31AWgWR0CHF4ZMtbs4dX2UKGgGaAloD0MICtejcD0KFMCUhpRSlGgVTfUBaBZHQIckFr2xptd1fZQoaAZoCWgPQwgK16NwPQoUwJSGlFKUaBVN9QFoFkdAhynLlFMIvHV9lChoBmgJaA9DCArXo3A9ChTAlIaUUpRoFU31AWgWR0CHKeBK+SKWdX2UKGgGaAloD0MICtejcD0KFMCUhpRSlGgVTfUBaBZHQIcr3H/95yF1fZQoaAZoCWgPQwgK16NwPQoUwJSGlFKUaBVN9QFoFkdAhzdkl/pdKXV9lChoBmgJaA9DCArXo3A9ChTAlIaUUpRoFU31AWgWR0CHPXMJQcghdX2UKGgGaAloD0MICtejcD0KGMCUhpRSlGgVTfUBaBZHQIc9l4C6pYN1fZQoaAZoCWgPQwgK16NwPQoUwJSGlFKUaBVN9QFoFkdAh0Ba/yoXK3V9lChoBmgJaA9DCArXo3A9ChTAlIaUUpRoFU31AWgWR0CHd3NnoPkJdX2UKGgGaAloD0MICtejcD0KFMCUhpRSlGgVTfUBaBZHQId7Ie9zwMJ1fZQoaAZoCWgPQwgK16NwPQoUwJSGlFKUaBVN9QFoFkdAh3s2jGkvb3V9lChoBmgJaA9DCArXo3A9ChTAlIaUUpRoFU31AWgWR0CHfRwYtQKsdX2UKGgGaAloD0MICtejcD0KFMCUhpRSlGgVTfUBaBZHQIeH2p84Pwx1fZQoaAZoCWgPQwgK16NwPQoUwJSGlFKUaBVN9QFoFkdAh44kehf0E3V9lChoBmgJaA9DCArXo3A9ChTAlIaUUpRoFU31AWgWR0CHjkB+4LCvdX2UKGgGaAloD0MICtejcD0KFMCUhpRSlGgVTfUBaBZHQIeRJDu0CzV1fZQoaAZoCWgPQwgK16NwPQoUwJSGlFKUaBVN9QFoFkdAh5vHuJDVpnV9lChoBmgJaA9DCArXo3A9ChTAlIaUUpRoFU31AWgWR0CHoFvze40/dX2UKGgGaAloD0MICtejcD0KFMCUhpRSlGgVTfUBaBZHQIegcMAmzB11fZQoaAZoCWgPQwgK16NwPQoYwJSGlFKUaBVN9QFoFkdAh6J79hqj8HV9lChoBmgJaA9DCArXo3A9ChTAlIaUUpRoFU31AWgWR0CHrZf+CK77dX2UKGgGaAloD0MICtejcD0KFMCUhpRSlGgVTfUBaBZHQIeylLnLaEl1fZQoaAZoCWgPQwgK16NwPQoUwJSGlFKUaBVN9QFoFkdAh7KpcxCY1HV9lChoBmgJaA9DCArXo3A9ChjAlIaUUpRoFU31AWgWR0CHtJpSrHU+dWUu"
74
  },
75
  "ep_success_buffer": {
76
  ":type:": "<class 'collections.deque'>",
 
4
  ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==",
5
  "__module__": "stable_baselines3.common.policies",
6
  "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
7
+ "__init__": "<function ActorCriticPolicy.__init__ at 0x7f7b637e0ee0>",
8
+ "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f7b637e0f70>",
9
+ "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f7b637e1000>",
10
+ "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f7b637e1090>",
11
+ "_build": "<function ActorCriticPolicy._build at 0x7f7b637e1120>",
12
+ "forward": "<function ActorCriticPolicy.forward at 0x7f7b637e11b0>",
13
+ "extract_features": "<function ActorCriticPolicy.extract_features at 0x7f7b637e1240>",
14
+ "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f7b637e12d0>",
15
+ "_predict": "<function ActorCriticPolicy._predict at 0x7f7b637e1360>",
16
+ "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f7b637e13f0>",
17
+ "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f7b637e1480>",
18
+ "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f7b637e1510>",
19
  "__abstractmethods__": "frozenset()",
20
+ "_abc_impl": "<_abc._abc_data object at 0x7f7b63aaae00>"
21
  },
22
  "verbose": true,
23
  "policy_kwargs": {},
 
48
  "_num_timesteps_at_start": 0,
49
  "seed": null,
50
  "action_noise": null,
51
+ "start_time": 1681190423033058191,
52
  "learning_rate": 0.0003,
53
  "tensorboard_log": null,
54
  "lr_schedule": {
 
57
  },
58
  "_last_obs": {
59
  ":type:": "<class 'numpy.ndarray'>",
60
+ ":serialized:": "gAWVxQAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJZQAAAAAAAAAD/lmULeG4I/gw6XQdV1TkGaOZtBDsDoQmoW3D7dpJZCH5aEQuDCrEKUe7hCcQGPP0MpA0KU2JJBGM27QRsdu0Kfeps/QIsCQsvsmEG/4cVBlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksESwWGlIwBQ5R0lFKULg=="
61
  },
62
  "_last_episode_starts": {
63
  ":type:": "<class 'numpy.ndarray'>",
 
70
  "_current_progress_remaining": -0.0035199999999999676,
71
  "ep_info_buffer": {
72
  ":type:": "<class 'collections.deque'>",
73
+ ":serialized:": "gAWVVhAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIuB6F61EgbsCUhpRSlIwBbJRN9QGMAXSUR0CGEi1MM7U5dX2UKGgGaAloD0MImpmZmZllg8CUhpRSlGgVTQ8BaBZHQIYTqt1ZDAt1fZQoaAZoCWgPQwi4HoXrUeBtwJSGlFKUaBVN9QFoFkdAhhdT7VJ+UnV9lChoBmgJaA9DCLgehetRAG7AlIaUUpRoFU31AWgWR0CGHz3cpLEldX2UKGgGaAloD0MIuB6F61HgbcCUhpRSlGgVTfUBaBZHQIYjevwEyL11fZQoaAZoCWgPQwi4HoXrUSBuwJSGlFKUaBVN9QFoFkdAhiS/OdGy5nV9lChoBmgJaA9DCJqZmZmZA4PAlIaUUpRoFUv2aBZHQIYnKTGHYYl1fZQoaAZoCWgPQwjD9Shcj9CAwJSGlFKUaBVLbGgWR0CGKPn1WbPQdX2UKGgGaAloD0MIuB6F61HgbcCUhpRSlGgVTfUBaBZHQIYpCLfk3jx1fZQoaAZoCWgPQwg9CtejcJOEwJSGlFKUaBVNWAFoFkdAhjQsFEAo5XV9lChoBmgJaA9DCLgehetR4G3AlIaUUpRoFU31AWgWR0CGNFTisGPgdX2UKGgGaAloD0MIuB6F61HgbcCUhpRSlGgVTfUBaBZHQIY4xBcAzYV1fZQoaAZoCWgPQwi4HoXrUSBuwJSGlFKUaBVN9QFoFkdAhjpL8aXKKnV9lChoBmgJaA9DCLgehetRAG7AlIaUUpRoFU31AWgWR0CGfGZ62OQydX2UKGgGaAloD0MIuB6F61HgbcCUhpRSlGgVTfUBaBZHQIZ8mxbB42V1fZQoaAZoCWgPQwi4HoXrUQBuwJSGlFKUaBVN9QFoFkdAhoJYM4LkS3V9lChoBmgJaA9DCLgehetRAG7AlIaUUpRoFU31AWgWR0CGhCTr3TNMdX2UKGgGaAloD0MIexSuR+HehsCUhpRSlGgVTecBaBZHQIaRB08vEjx1fZQoaAZoCWgPQwi4HoXrUQBuwJSGlFKUaBVN9QFoFkdAhpFQBHTZx3V9lChoBmgJaA9DCOxRuB6FNYDAlIaUUpRoFUtGaBZHQIaThAD7qIJ1fZQoaAZoCWgPQwi4HoXrUSBuwJSGlFKUaBVN9QFoFkdAhpZlJ6IFeXV9lChoBmgJaA9DCLgehetRIG7AlIaUUpRoFU31AWgWR0CGl5clgMMJdX2UKGgGaAloD0MIFK5H4XpggsCUhpRSlGgVS89oFkdAhpmib2Dg63V9lChoBmgJaA9DCOF6FK5HIYTAlIaUUpRoFU09AWgWR0CGpLPpIMBqdX2UKGgGaAloD0MIuB6F61EAbsCUhpRSlGgVTfUBaBZHQIaoIPI4lyB1fZQoaAZoCWgPQwhcj8L1KOh/wJSGlFKUaBVLNGgWR0CGqecdYGMXdX2UKGgGaAloD0MIuB6F61HgbcCUhpRSlGgVTfUBaBZHQIaqJDVpbll1fZQoaAZoCWgPQwi4HoXrUQBuwJSGlFKUaBVN9QFoFkdAhqytdiUgS3V9lChoBmgJaA9DCLgehetR4G3AlIaUUpRoFU31AWgWR0CGtH7MPjGUdX2UKGgGaAloD0MIuB6F61HgbcCUhpRSlGgVTfUBaBZHQIa5dznzQNV1fZQoaAZoCWgPQwi4HoXrUQBuwJSGlFKUaBVN9QFoFkdAhrmylnAZbnV9lChoBmgJaA9DCI/C9Shct3/AlIaUUpRoFUsvaBZHQIa7Mk2P1ct1fZQoaAZoCWgPQwi4HoXrUQBuwJSGlFKUaBVN9QFoFkdAhryyE12q1nV9lChoBmgJaA9DCDMzMzMzJYDAlIaUUpRoFUtCaBZHQIa9M2UB4lh1fZQoaAZoCWgPQwh7FK5H4d6GwJSGlFKUaBVN5wFoFkdAhvaIBRyfc3V9lChoBmgJaA9DCOxRuB6FZYPAlIaUUpRoFU0OAWgWR0CG+HLytmthdX2UKGgGaAloD0MIw/UoXI+YhcCUhpRSlGgVTZgBaBZHQIb59XiiqQ11fZQoaAZoCWgPQwhSuB6F63uBwJSGlFKUaBVLlmgWR0CG/yRxtHhCdX2UKGgGaAloD0MI4XoUrkfzgsCUhpRSlGgVS/JoFkdAhwGfn4fwJHV9lChoBmgJaA9DCLgehetRIG7AlIaUUpRoFU31AWgWR0CHAb0ZFXq8dX2UKGgGaAloD0MIrkfhehTAgMCUhpRSlGgVS2ZoFkdAhwMGorFwUHV9lChoBmgJaA9DCFyPwvUo2H/AlIaUUpRoFUs0aBZHQIcFA0GeMAF1fZQoaAZoCWgPQwjsUbgehT2AwJSGlFKUaBVLRmgWR0CHB2q94/u9dX2UKGgGaAloD0MICtejcD32gcCUhpRSlGgVS7NoFkdAhwfuv2Xb/XV9lChoBmgJaA9DCBSuR+F6boDAlIaUUpRoFUtSaBZHQIcKcwBYFJR1fZQoaAZoCWgPQwhxPQrXo9CAwJSGlFKUaBVLbWgWR0CHDDyEtdzGdX2UKGgGaAloD0MIuB6F61EAbsCUhpRSlGgVTfUBaBZHQIcNbPSlWOp1fZQoaAZoCWgPQwiamZmZmQmBwJSGlFKUaBVLeWgWR0CHEN7j1f3OdX2UKGgGaAloD0MIuB6F61EgbsCUhpRSlGgVTfUBaBZHQIcScjJMg2Z1fZQoaAZoCWgPQwiF61G4HoeAwJSGlFKUaBVLWmgWR0CHE3IcR15jdX2UKGgGaAloD0MIuB6F61FAbsCUhpRSlGgVTfUBaBZHQIcbEKeCkGl1fZQoaAZoCWgPQwi4HoXrUeBtwJSGlFKUaBVN9QFoFkdAhxyMJQcghnV9lChoBmgJaA9DCLgehetRAG7AlIaUUpRoFU31AWgWR0CHJJKWcBludX2UKGgGaAloD0MIuB6F61EgbsCUhpRSlGgVTfUBaBZHQIcmWG9Htnh1fZQoaAZoCWgPQwhI4XoUrkWAwJSGlFKUaBVLSGgWR0CHKJCBwuM/dX2UKGgGaAloD0MIcT0K16N6hMCUhpRSlGgVTU4BaBZHQIcpEt29tdl1fZQoaAZoCWgPQwiamZmZmaeAwJSGlFKUaBVLYGgWR0CHK6etCAtndX2UKGgGaAloD0MIuB6F61FgbsCUhpRSlGgVTfUBaBZHQIctGPaL4vh1fZQoaAZoCWgPQwiuR+F6FF6AwJSGlFKUaBVLTWgWR0CHL9iPyTY/dX2UKGgGaAloD0MIuB6F61EgbsCUhpRSlGgVTfUBaBZHQIc12thd+od1fZQoaAZoCWgPQwi4HoXrUSBuwJSGlFKUaBVN9QFoFkdAhzpq3uuzQnV9lChoBmgJaA9DCLgehetRQG7AlIaUUpRoFU31AWgWR0CHPNzGxUvPdX2UKGgGaAloD0MIj8L1KFzPg8CUhpRSlGgVTSUBaBZHQIdyP2saKk51fZQoaAZoCWgPQwiuR+F6FMaGwJSGlFKUaBVN3QFoFkdAh3Jx6fJ3gXV9lChoBmgJaA9DCAAAAAAAIoHAlIaUUpRoFUt+aBZHQIdziB7NSqF1fZQoaAZoCWgPQwgzMzMzMy2AwJSGlFKUaBVLQmgWR0CHdS/gR9PUdX2UKGgGaAloD0MIpHA9CtdFgMCUhpRSlGgVS0poFkdAh3U3trsSkHV9lChoBmgJaA9DCFyPwvUo2H/AlIaUUpRoFUs0aBZHQId3VjZteld1fZQoaAZoCWgPQwiamZmZmaeAwJSGlFKUaBVLYGgWR0CHd5xaxHG0dX2UKGgGaAloD0MIuB6F61FOgMCUhpRSlGgVS1BoFkdAh3jIKtxMnXV9lChoBmgJaA9DCM3MzMzMFIDAlIaUUpRoFUs9aBZHQId6o/FBIFx1fZQoaAZoCWgPQwikcD0K18d/wJSGlFKUaBVLMmgWR0CHezdHlOoHdX2UKGgGaAloD0MI9ihcj8JFgMCUhpRSlGgVS0loFkdAh33A3T/hl3V9lChoBmgJaA9DCLgehetRIG7AlIaUUpRoFU31AWgWR0CHgMzuWrwOdX2UKGgGaAloD0MIuB6F61HgbcCUhpRSlGgVTfUBaBZHQIeMqdat9x91fZQoaAZoCWgPQwi4HoXrUSBuwJSGlFKUaBVN9QFoFkdAh4+AaWHDaXV9lChoBmgJaA9DCPYoXI/CCYHAlIaUUpRoFUt7aBZHQIeQ6agElmh1fZQoaAZoCWgPQwi4HoXrUQBuwJSGlFKUaBVN9QFoFkdAh5GRfOUt7XV9lChoBmgJaA9DCLgehetRIG7AlIaUUpRoFU31AWgWR0CHk4TlDF6zdX2UKGgGaAloD0MI7FG4HoU9gMCUhpRSlGgVS0ZoFkdAh5Oaol2NenV9lChoBmgJaA9DCLgehetRMoHAlIaUUpRoFUuCaBZHQIeUyJ9Aood1fZQoaAZoCWgPQwjsUbgehQWFwJSGlFKUaBVNcgFoFkdAh5/jZL7GenV9lChoBmgJaA9DCLgehetRAG7AlIaUUpRoFU31AWgWR0CHn/1loUSJdX2UKGgGaAloD0MI16NwPQodgMCUhpRSlGgVS0BoFkdAh6I7+1jRUnV9lChoBmgJaA9DCGZmZmZmXIbAlIaUUpRoFU3IAWgWR0CHo4kpI+W4dX2UKGgGaAloD0MISOF6FK63f8CUhpRSlGgVSzFoFkdAh6XzsQd0aXV9lChoBmgJaA9DCLgehetRIG7AlIaUUpRoFU31AWgWR0CHqCbMottidX2UKGgGaAloD0MIuB6F61EgbsCUhpRSlGgVTfUBaBZHQIe1uH8CPp91fZQoaAZoCWgPQwgAAAAAANh/wJSGlFKUaBVLM2gWR0CHt5MBZIQOdX2UKGgGaAloD0MIuB6F61FAbsCUhpRSlGgVTfUBaBZHQIe352ECeVd1fZQoaAZoCWgPQwjsUbgehbd/wJSGlFKUaBVLMGgWR0CHuP1/2Cd0dX2UKGgGaAloD0MI7FG4HoWnf8CUhpRSlGgVSzBoFkdAh7lndfsu4HV9lChoBmgJaA9DCLgehetR4G3AlIaUUpRoFU31AWgWR0CHustITXardX2UKGgGaAloD0MIFK5H4Xrof8CUhpRSlGgVSzZoFkdAh7vKFqSHM3V9lChoBmgJaA9DCLgehetRIG7AlIaUUpRoFU31AWgWR0CHvBO58Sf2dX2UKGgGaAloD0MIj8L1KFynf8CUhpRSlGgVSy9oFkdAh70hIOH313V9lChoBmgJaA9DCI/C9Shcp3/AlIaUUpRoFUsvaBZHQIe9agsbvPV1fZQoaAZoCWgPQwjD9Shcj0KBwJSGlFKUaBVLhWgWR0CHvbv+fh/BdX2UKGgGaAloD0MImpmZmZkJgcCUhpRSlGgVS3loFkdAh75z5oGpuXV9lChoBmgJaA9DCHE9Ctej6H/AlIaUUpRoFUs3aBZHQIe+/qqwQlN1ZS4="
74
  },
75
  "ep_success_buffer": {
76
  ":type:": "<class 'collections.deque'>",
PPO-hardcoded/policy.optimizer.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1f670145aa6649ce974d592b9fe4fa352e8658d40a6e5889d7dd0b827a9e1604
3
  size 84985
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b827966602eb29756396f59b61bd9f9b88687efecacc7a6deb3268aaab146c31
3
  size 84985
PPO-hardcoded/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9cc9ca21630eac31e812000c4d456c923fc16c9859750e39a853f1d4d49c249a
3
  size 41857
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7fead625f963d2c047deabaed2f743bf93a982d6031de78759a0185934c83ea7
3
  size 41857
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: RoombaAToB-Hardcoded
17
  metrics:
18
  - type: mean_reward
19
- value: -5.01 +/- 0.00
20
  name: mean_reward
21
  verified: false
22
  ---
 
16
  type: RoombaAToB-Hardcoded
17
  metrics:
18
  - type: mean_reward
19
+ value: -239.01 +/- 0.00
20
  name: mean_reward
21
  verified: false
22
  ---
config.json CHANGED
@@ -1 +1 @@
1
- {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7f30071e8ee0>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f30071e8f70>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f30071e9000>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f30071e9090>", "_build": "<function ActorCriticPolicy._build at 0x7f30071e9120>", "forward": "<function ActorCriticPolicy.forward at 0x7f30071e91b0>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x7f30071e9240>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f30071e92d0>", "_predict": "<function ActorCriticPolicy._predict at 0x7f30071e9360>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f30071e93f0>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f30071e9480>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f30071e9510>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7f30071ec800>"}, "verbose": true, "policy_kwargs": {}, "observation_space": {":type:": "<class 'gym.spaces.box.Box'>", ":serialized:": "gAWVhwEAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLBYWUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWFAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAJRoC0sFhZSMAUOUdJRSlIwEaGlnaJRoEyiWFAAAAAAAAAAA6P1I2w9JQAAAyEIAAMhCAADIQpRoC0sFhZRoFnSUUpSMDWJvdW5kZWRfYmVsb3eUaBMolgUAAAAAAAAAAQEBAQGUaAiMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLBYWUaBZ0lFKUjA1ib3VuZGVkX2Fib3ZllGgTKJYFAAAAAAAAAAEBAQEBlGgiSwWFlGgWdJRSlIwKX25wX3JhbmRvbZROdWIu", "dtype": "float32", "_shape": [5], "low": "[0. 0. 0. 0. 0.]", "high": "[5.2000000e+05 3.1415927e+00 1.0000000e+02 1.0000000e+02 1.0000000e+02]", "bounded_below": "[ True True True True True]", "bounded_above": "[ True True True True True]", "_np_random": null}, "action_space": {":type:": "<class 'gym.spaces.discrete.Discrete'>", ":serialized:": "gAWViAAAAAAAAACME2d5bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpRLBIwGX3NoYXBllCmMBWR0eXBllIwFbnVtcHmUjAVkdHlwZZSTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYowKX25wX3JhbmRvbZROdWIu", "n": 4, "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 4, "num_timesteps": 401408, "_total_timesteps": 400000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1681189254138184037, "learning_rate": 0.0003, "tensorboard_log": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWV4QIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMVy9ob21lL25vaXNlYnJpZGdlLy5sb2NhbC9saWIvcHl0aG9uMy4xMC9zaXRlLXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS4JDAgQBlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMVy9ob21lL25vaXNlYnJpZGdlLy5sb2NhbC9saWIvcHl0aG9uMy4xMC9zaXRlLXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoFmgNjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoF4wHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/M6kqMFUyYYWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="}, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVxQAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJZQAAAAAAAAAJxigUMYAY8//WcWQtLiHkIAAMhCAICCQ5qZmT+a7CRCmuwkQgAAyELren9DboGgP5gE10H/WNRBihgsQvr1gEM3i5s/3o8ZQk/xEkIAAMhClIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksESwWGlIwBQ5R0lFKULg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYEAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSwSFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.0035199999999999676, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVbxAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMICtejcD0KFMCUhpRSlIwBbJRN9QGMAXSUR0CFOSrwvxpddX2UKGgGaAloD0MICtejcD0KFMCUhpRSlGgVTfUBaBZHQIVKHE/B3zN1fZQoaAZoCWgPQwgK16NwPQoUwJSGlFKUaBVN9QFoFkdAhUuI3rD633V9lChoBmgJaA9DCArXo3A9ChTAlIaUUpRoFU31AWgWR0CFS6xhUipvdX2UKGgGaAloD0MICtejcD0KFMCUhpRSlGgVTfUBaBZHQIVMNNQCSzR1fZQoaAZoCWgPQwgK16NwPQoUwJSGlFKUaBVN9QFoFkdAhY56aCtihHV9lChoBmgJaA9DCHE9CtejiH/AlIaUUpRoFU3HAWgWR0CFjzFYMfA9dX2UKGgGaAloD0MICtejcD0KFMCUhpRSlGgVTfUBaBZHQIWP/Ehq0t11fZQoaAZoCWgPQwgK16NwPQoUwJSGlFKUaBVN9QFoFkdAhZAQTVUdaXV9lChoBmgJaA9DCFK4HoXrVX/AlIaUUpRoFUuKaBZHQIWSkImgJ1J1fZQoaAZoCWgPQwg9CtejcFl/wJSGlFKUaBVLoGgWR0CFlI1CPZIydX2UKGgGaAloD0MIrkfhehRif8CUhpRSlGgVS9ZoFkdAhZYmBFuvU3V9lChoBmgJaA9DCDMzMzMzZ3/AlIaUUpRoFUv2aBZHQIWbOueSSvF1fZQoaAZoCWgPQwiamZmZmX1/wJSGlFKUaBVNggFoFkdAhZvZEDyOJnV9lChoBmgJaA9DCK5H4XoUXn/AlIaUUpRoFUu9aBZHQIWhm4I8hcJ1fZQoaAZoCWgPQwgfhetRuIZ/wJSGlFKUaBVNuwFoFkdAhaTIbfgrH3V9lChoBmgJaA9DCArXo3A9ChTAlIaUUpRoFU31AWgWR0CFpNLLZBcBdX2UKGgGaAloD0MIMzMzMzNTf8CUhpRSlGgVS3loFkdAhaoDQZ4wAXV9lChoBmgJaA9DCArXo3A9ChTAlIaUUpRoFU31AWgWR0CFrDtPYWcjdX2UKGgGaAloD0MI4XoUrkdhf8CUhpRSlGgVS9FoFkdAhbNsXaakRHV9lChoBmgJaA9DCArXo3A9ChTAlIaUUpRoFU31AWgWR0CFs3vddmg8dX2UKGgGaAloD0MICtejcD0KFMCUhpRSlGgVTfUBaBZHQIW4TcXWOIZ1fZQoaAZoCWgPQwgK16NwPVJ/wJSGlFKUaBVLc2gWR0CFuGc3l0YCdX2UKGgGaAloD0MICtejcD0KFMCUhpRSlGgVTfUBaBZHQIW9os3AEdN1fZQoaAZoCWgPQwhSuB6F611/wJSGlFKUaBVLvGgWR0CFwGn/DLr5dX2UKGgGaAloD0MIXI/C9Shof8CUhpRSlGgVS/xoFkdAhcKNfgJkXnV9lChoBmgJaA9DCAAAAAAAYH/AlIaUUpRoFUvJaBZHQIXF5k3CKrJ1fZQoaAZoCWgPQwgK16NwPQoUwJSGlFKUaBVN9QFoFkdAhcfzyz5XVHV9lChoBmgJaA9DCDMzMzMzZ3/AlIaUUpRoFUv2aBZHQIXJ7iIcinp1fZQoaAZoCWgPQwiamZmZmWl/wJSGlFKUaBVNBQFoFkdAhcyGEPDpDHV9lChoBmgJaA9DCBSuR+F6WH/AlIaUUpRoFUuaaBZHQIXOKPwNLDh1fZQoaAZoCWgPQwi4HoXrUXB/wJSGlFKUaBVNLwFoFkdAhgPITXarWHV9lChoBmgJaA9DCHE9CtejZH/AlIaUUpRoFUvmaBZHQIYE+P7vXsh1fZQoaAZoCWgPQwhcj8L1KGR/wJSGlFKUaBVL42gWR0CGDNNj9XLedX2UKGgGaAloD0MICtejcD0KFMCUhpRSlGgVTfUBaBZHQIYQSQxN7Bx1fZQoaAZoCWgPQwgK16NwPQoUwJSGlFKUaBVN9QFoFkdAhhEIxQBPsXV9lChoBmgJaA9DCArXo3A9ChTAlIaUUpRoFU31AWgWR0CGE2qFRHf/dX2UKGgGaAloD0MIFK5H4Xpsf8CUhpRSlGgVTRcBaBZHQIYZftUn5SF1fZQoaAZoCWgPQwgK16NwPQoUwJSGlFKUaBVN9QFoFkdAhhuYCyQgcXV9lChoBmgJaA9DCDMzMzMza3/AlIaUUpRoFU0PAWgWR0CGG6ZP2wmmdX2UKGgGaAloD0MICtejcD0KFMCUhpRSlGgVTfUBaBZHQIYfPQID5j91fZQoaAZoCWgPQwhxPQrXo0h/wJSGlFKUaBVLN2gWR0CGIQnQY1pCdX2UKGgGaAloD0MICtejcD0KFMCUhpRSlGgVTfUBaBZHQIYq1ObiIcl1fZQoaAZoCWgPQwgK16NwPQoUwJSGlFKUaBVN9QFoFkdAhi1jZUT+N3V9lChoBmgJaA9DCArXo3A9ChTAlIaUUpRoFU31AWgWR0CGLXE61b7kdX2UKGgGaAloD0MICtejcD0KFMCUhpRSlGgVTfUBaBZHQIY06ZBsyi51fZQoaAZoCWgPQwgK16NwPQoUwJSGlFKUaBVN9QFoFkdAhj3O0b961XV9lChoBmgJaA9DCArXo3A9ChTAlIaUUpRoFU31AWgWR0CGQFeBxxT9dX2UKGgGaAloD0MICtejcD0KFMCUhpRSlGgVTfUBaBZHQIZAZRuTA311fZQoaAZoCWgPQwhI4XoUrod/wJSGlFKUaBVNwQFoFkdAhkV0ulGgBnV9lChoBmgJaA9DCAAAAAAAYH/AlIaUUpRoFUvJaBZHQIZFiY9gWrR1fZQoaAZoCWgPQwgfhetRuF5/wJSGlFKUaBVLwWgWR0CGSJllK9PDdX2UKGgGaAloD0MICtejcD0KFMCUhpRSlGgVTfUBaBZHQIaGE34sVcl1fZQoaAZoCWgPQwgK16NwPQoUwJSGlFKUaBVN9QFoFkdAhoqOMdcSoXV9lChoBmgJaA9DCArXo3A9ChTAlIaUUpRoFU31AWgWR0CGirQyhzvJdX2UKGgGaAloD0MICtejcD0KFMCUhpRSlGgVTfUBaBZHQIaNOvdM0xd1fZQoaAZoCWgPQwgK16NwPQoUwJSGlFKUaBVN9QFoFkdAhpiTlcQiA3V9lChoBmgJaA9DCArXo3A9ChTAlIaUUpRoFU31AWgWR0CGnbxG2CumdX2UKGgGaAloD0MICtejcD0KFMCUhpRSlGgVTfUBaBZHQIad0Oqebut1fZQoaAZoCWgPQwgK16NwPQoUwJSGlFKUaBVN9QFoFkdAhqCLYoRZlnV9lChoBmgJaA9DCArXo3A9ChTAlIaUUpRoFU31AWgWR0CGqypd8iOedX2UKGgGaAloD0MICtejcD0KFMCUhpRSlGgVTfUBaBZHQIau4HgP3BZ1fZQoaAZoCWgPQwgK16NwPQoYwJSGlFKUaBVN9QFoFkdAhq71GkN4JXV9lChoBmgJaA9DCArXo3A9ChTAlIaUUpRoFU31AWgWR0CGsXPrOZ9edX2UKGgGaAloD0MICtejcD0KFMCUhpRSlGgVTfUBaBZHQIa7QUN8VpN1fZQoaAZoCWgPQwgK16NwPQoUwJSGlFKUaBVN9QFoFkdAhr9f3evZAnV9lChoBmgJaA9DCArXo3A9ChTAlIaUUpRoFU31AWgWR0CGv3TLns9kdX2UKGgGaAloD0MICtejcD0KFMCUhpRSlGgVTfUBaBZHQIbB6pLmITJ1fZQoaAZoCWgPQwgK16NwPQoUwJSGlFKUaBVN9QFoFkdAhvsqXfIjnnV9lChoBmgJaA9DCArXo3A9ChTAlIaUUpRoFU31AWgWR0CHALIkJKJ3dX2UKGgGaAloD0MICtejcD0KFMCUhpRSlGgVTfUBaBZHQIcAxvWH1vl1fZQoaAZoCWgPQwgK16NwPQoUwJSGlFKUaBVN9QFoFkdAhwLnWz4UOHV9lChoBmgJaA9DCArXo3A9ChTAlIaUUpRoFU31AWgWR0CHD+pBHCoCdX2UKGgGaAloD0MICtejcD0KFMCUhpRSlGgVTfUBaBZHQIcT9u3trsV1fZQoaAZoCWgPQwgK16NwPQoUwJSGlFKUaBVN9QFoFkdAhxQLsjVx0nV9lChoBmgJaA9DCArXo3A9ChjAlIaUUpRoFU31AWgWR0CHF4ZMtbs4dX2UKGgGaAloD0MICtejcD0KFMCUhpRSlGgVTfUBaBZHQIckFr2xptd1fZQoaAZoCWgPQwgK16NwPQoUwJSGlFKUaBVN9QFoFkdAhynLlFMIvHV9lChoBmgJaA9DCArXo3A9ChTAlIaUUpRoFU31AWgWR0CHKeBK+SKWdX2UKGgGaAloD0MICtejcD0KFMCUhpRSlGgVTfUBaBZHQIcr3H/95yF1fZQoaAZoCWgPQwgK16NwPQoUwJSGlFKUaBVN9QFoFkdAhzdkl/pdKXV9lChoBmgJaA9DCArXo3A9ChTAlIaUUpRoFU31AWgWR0CHPXMJQcghdX2UKGgGaAloD0MICtejcD0KGMCUhpRSlGgVTfUBaBZHQIc9l4C6pYN1fZQoaAZoCWgPQwgK16NwPQoUwJSGlFKUaBVN9QFoFkdAh0Ba/yoXK3V9lChoBmgJaA9DCArXo3A9ChTAlIaUUpRoFU31AWgWR0CHd3NnoPkJdX2UKGgGaAloD0MICtejcD0KFMCUhpRSlGgVTfUBaBZHQId7Ie9zwMJ1fZQoaAZoCWgPQwgK16NwPQoUwJSGlFKUaBVN9QFoFkdAh3s2jGkvb3V9lChoBmgJaA9DCArXo3A9ChTAlIaUUpRoFU31AWgWR0CHfRwYtQKsdX2UKGgGaAloD0MICtejcD0KFMCUhpRSlGgVTfUBaBZHQIeH2p84Pwx1fZQoaAZoCWgPQwgK16NwPQoUwJSGlFKUaBVN9QFoFkdAh44kehf0E3V9lChoBmgJaA9DCArXo3A9ChTAlIaUUpRoFU31AWgWR0CHjkB+4LCvdX2UKGgGaAloD0MICtejcD0KFMCUhpRSlGgVTfUBaBZHQIeRJDu0CzV1fZQoaAZoCWgPQwgK16NwPQoUwJSGlFKUaBVN9QFoFkdAh5vHuJDVpnV9lChoBmgJaA9DCArXo3A9ChTAlIaUUpRoFU31AWgWR0CHoFvze40/dX2UKGgGaAloD0MICtejcD0KFMCUhpRSlGgVTfUBaBZHQIegcMAmzB11fZQoaAZoCWgPQwgK16NwPQoYwJSGlFKUaBVN9QFoFkdAh6J79hqj8HV9lChoBmgJaA9DCArXo3A9ChTAlIaUUpRoFU31AWgWR0CHrZf+CK77dX2UKGgGaAloD0MICtejcD0KFMCUhpRSlGgVTfUBaBZHQIeylLnLaEl1fZQoaAZoCWgPQwgK16NwPQoUwJSGlFKUaBVN9QFoFkdAh7KpcxCY1HV9lChoBmgJaA9DCArXo3A9ChjAlIaUUpRoFU31AWgWR0CHtJpSrHU+dWUu"}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 1850, "n_steps": 2048, "gamma": 0.99, "gae_lambda": 0.5, "ent_coef": 0.0, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 10, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWV4QIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMVy9ob21lL25vaXNlYnJpZGdlLy5sb2NhbC9saWIvcHl0aG9uMy4xMC9zaXRlLXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS4JDAgQBlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMVy9ob21lL25vaXNlYnJpZGdlLy5sb2NhbC9saWIvcHl0aG9uMy4xMC9zaXRlLXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoFmgNjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoF4wHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/yZmZmZmZmoWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "system_info": {"OS": "Linux-5.19.0-35-generic-x86_64-with-glibc2.35 # 36~22.04.1-Ubuntu SMP PREEMPT_DYNAMIC Fri Feb 17 15:17:25 UTC 2", "Python": "3.10.9", "Stable-Baselines3": "1.7.0", "PyTorch": "2.0.0", "GPU Enabled": "True", "Numpy": "1.23.5", "Gym": "0.21.0"}}
 
1
+ {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVOwAAAAAAAACMIXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5wb2xpY2llc5SMEUFjdG9yQ3JpdGljUG9saWN5lJOULg==", "__module__": "stable_baselines3.common.policies", "__doc__": "\n Policy class for actor-critic algorithms (has both policy and value prediction).\n Used by A2C, PPO and the likes.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param ortho_init: Whether to use or not orthogonal initialization\n :param use_sde: Whether to use State Dependent Exploration or not\n :param log_std_init: Initial value for the log standard deviation\n :param full_std: Whether to use (n_features x n_actions) parameters\n for the std instead of only (n_features,) when using gSDE\n :param use_expln: Use ``expln()`` function instead of ``exp()`` to ensure\n a positive standard deviation (cf paper). It allows to keep variance\n above zero and prevent it from growing too fast. In practice, ``exp()`` is usually enough.\n :param squash_output: Whether to squash the output using a tanh function,\n this allows to ensure boundaries when using gSDE.\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param share_features_extractor: If True, the features extractor is shared between the policy and value networks.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function ActorCriticPolicy.__init__ at 0x7f7b637e0ee0>", "_get_constructor_parameters": "<function ActorCriticPolicy._get_constructor_parameters at 0x7f7b637e0f70>", "reset_noise": "<function ActorCriticPolicy.reset_noise at 0x7f7b637e1000>", "_build_mlp_extractor": "<function ActorCriticPolicy._build_mlp_extractor at 0x7f7b637e1090>", "_build": "<function ActorCriticPolicy._build at 0x7f7b637e1120>", "forward": "<function ActorCriticPolicy.forward at 0x7f7b637e11b0>", "extract_features": "<function ActorCriticPolicy.extract_features at 0x7f7b637e1240>", "_get_action_dist_from_latent": "<function ActorCriticPolicy._get_action_dist_from_latent at 0x7f7b637e12d0>", "_predict": "<function ActorCriticPolicy._predict at 0x7f7b637e1360>", "evaluate_actions": "<function ActorCriticPolicy.evaluate_actions at 0x7f7b637e13f0>", "get_distribution": "<function ActorCriticPolicy.get_distribution at 0x7f7b637e1480>", "predict_values": "<function ActorCriticPolicy.predict_values at 0x7f7b637e1510>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7f7b63aaae00>"}, "verbose": true, "policy_kwargs": {}, "observation_space": {":type:": "<class 'gym.spaces.box.Box'>", ":serialized:": "gAWVhwEAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLBYWUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWFAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAJRoC0sFhZSMAUOUdJRSlIwEaGlnaJRoEyiWFAAAAAAAAAAA6P1I2w9JQAAAyEIAAMhCAADIQpRoC0sFhZRoFnSUUpSMDWJvdW5kZWRfYmVsb3eUaBMolgUAAAAAAAAAAQEBAQGUaAiMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLBYWUaBZ0lFKUjA1ib3VuZGVkX2Fib3ZllGgTKJYFAAAAAAAAAAEBAQEBlGgiSwWFlGgWdJRSlIwKX25wX3JhbmRvbZROdWIu", "dtype": "float32", "_shape": [5], "low": "[0. 0. 0. 0. 0.]", "high": "[5.2000000e+05 3.1415927e+00 1.0000000e+02 1.0000000e+02 1.0000000e+02]", "bounded_below": "[ True True True True True]", "bounded_above": "[ True True True True True]", "_np_random": null}, "action_space": {":type:": "<class 'gym.spaces.discrete.Discrete'>", ":serialized:": "gAWViAAAAAAAAACME2d5bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpRLBIwGX3NoYXBllCmMBWR0eXBllIwFbnVtcHmUjAVkdHlwZZSTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYowKX25wX3JhbmRvbZROdWIu", "n": 4, "_shape": [], "dtype": "int64", "_np_random": null}, "n_envs": 4, "num_timesteps": 401408, "_total_timesteps": 400000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1681190423033058191, "learning_rate": 0.0003, "tensorboard_log": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWV4QIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMVy9ob21lL25vaXNlYnJpZGdlLy5sb2NhbC9saWIvcHl0aG9uMy4xMC9zaXRlLXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS4JDAgQBlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMVy9ob21lL25vaXNlYnJpZGdlLy5sb2NhbC9saWIvcHl0aG9uMy4xMC9zaXRlLXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoFmgNjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoF4wHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/M6kqMFUyYYWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="}, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVxQAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJZQAAAAAAAAAD/lmULeG4I/gw6XQdV1TkGaOZtBDsDoQmoW3D7dpJZCH5aEQuDCrEKUe7hCcQGPP0MpA0KU2JJBGM27QRsdu0Kfeps/QIsCQsvsmEG/4cVBlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksESwWGlIwBQ5R0lFKULg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYEAAAAAAAAAAAAAACUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSwSFlIwBQ5R0lFKULg=="}, "_last_original_obs": null, "_episode_num": 0, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": -0.0035199999999999676, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVVhAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIuB6F61EgbsCUhpRSlIwBbJRN9QGMAXSUR0CGEi1MM7U5dX2UKGgGaAloD0MImpmZmZllg8CUhpRSlGgVTQ8BaBZHQIYTqt1ZDAt1fZQoaAZoCWgPQwi4HoXrUeBtwJSGlFKUaBVN9QFoFkdAhhdT7VJ+UnV9lChoBmgJaA9DCLgehetRAG7AlIaUUpRoFU31AWgWR0CGHz3cpLEldX2UKGgGaAloD0MIuB6F61HgbcCUhpRSlGgVTfUBaBZHQIYjevwEyL11fZQoaAZoCWgPQwi4HoXrUSBuwJSGlFKUaBVN9QFoFkdAhiS/OdGy5nV9lChoBmgJaA9DCJqZmZmZA4PAlIaUUpRoFUv2aBZHQIYnKTGHYYl1fZQoaAZoCWgPQwjD9Shcj9CAwJSGlFKUaBVLbGgWR0CGKPn1WbPQdX2UKGgGaAloD0MIuB6F61HgbcCUhpRSlGgVTfUBaBZHQIYpCLfk3jx1fZQoaAZoCWgPQwg9CtejcJOEwJSGlFKUaBVNWAFoFkdAhjQsFEAo5XV9lChoBmgJaA9DCLgehetR4G3AlIaUUpRoFU31AWgWR0CGNFTisGPgdX2UKGgGaAloD0MIuB6F61HgbcCUhpRSlGgVTfUBaBZHQIY4xBcAzYV1fZQoaAZoCWgPQwi4HoXrUSBuwJSGlFKUaBVN9QFoFkdAhjpL8aXKKnV9lChoBmgJaA9DCLgehetRAG7AlIaUUpRoFU31AWgWR0CGfGZ62OQydX2UKGgGaAloD0MIuB6F61HgbcCUhpRSlGgVTfUBaBZHQIZ8mxbB42V1fZQoaAZoCWgPQwi4HoXrUQBuwJSGlFKUaBVN9QFoFkdAhoJYM4LkS3V9lChoBmgJaA9DCLgehetRAG7AlIaUUpRoFU31AWgWR0CGhCTr3TNMdX2UKGgGaAloD0MIexSuR+HehsCUhpRSlGgVTecBaBZHQIaRB08vEjx1fZQoaAZoCWgPQwi4HoXrUQBuwJSGlFKUaBVN9QFoFkdAhpFQBHTZx3V9lChoBmgJaA9DCOxRuB6FNYDAlIaUUpRoFUtGaBZHQIaThAD7qIJ1fZQoaAZoCWgPQwi4HoXrUSBuwJSGlFKUaBVN9QFoFkdAhpZlJ6IFeXV9lChoBmgJaA9DCLgehetRIG7AlIaUUpRoFU31AWgWR0CGl5clgMMJdX2UKGgGaAloD0MIFK5H4XpggsCUhpRSlGgVS89oFkdAhpmib2Dg63V9lChoBmgJaA9DCOF6FK5HIYTAlIaUUpRoFU09AWgWR0CGpLPpIMBqdX2UKGgGaAloD0MIuB6F61EAbsCUhpRSlGgVTfUBaBZHQIaoIPI4lyB1fZQoaAZoCWgPQwhcj8L1KOh/wJSGlFKUaBVLNGgWR0CGqecdYGMXdX2UKGgGaAloD0MIuB6F61HgbcCUhpRSlGgVTfUBaBZHQIaqJDVpbll1fZQoaAZoCWgPQwi4HoXrUQBuwJSGlFKUaBVN9QFoFkdAhqytdiUgS3V9lChoBmgJaA9DCLgehetR4G3AlIaUUpRoFU31AWgWR0CGtH7MPjGUdX2UKGgGaAloD0MIuB6F61HgbcCUhpRSlGgVTfUBaBZHQIa5dznzQNV1fZQoaAZoCWgPQwi4HoXrUQBuwJSGlFKUaBVN9QFoFkdAhrmylnAZbnV9lChoBmgJaA9DCI/C9Shct3/AlIaUUpRoFUsvaBZHQIa7Mk2P1ct1fZQoaAZoCWgPQwi4HoXrUQBuwJSGlFKUaBVN9QFoFkdAhryyE12q1nV9lChoBmgJaA9DCDMzMzMzJYDAlIaUUpRoFUtCaBZHQIa9M2UB4lh1fZQoaAZoCWgPQwh7FK5H4d6GwJSGlFKUaBVN5wFoFkdAhvaIBRyfc3V9lChoBmgJaA9DCOxRuB6FZYPAlIaUUpRoFU0OAWgWR0CG+HLytmthdX2UKGgGaAloD0MIw/UoXI+YhcCUhpRSlGgVTZgBaBZHQIb59XiiqQ11fZQoaAZoCWgPQwhSuB6F63uBwJSGlFKUaBVLlmgWR0CG/yRxtHhCdX2UKGgGaAloD0MI4XoUrkfzgsCUhpRSlGgVS/JoFkdAhwGfn4fwJHV9lChoBmgJaA9DCLgehetRIG7AlIaUUpRoFU31AWgWR0CHAb0ZFXq8dX2UKGgGaAloD0MIrkfhehTAgMCUhpRSlGgVS2ZoFkdAhwMGorFwUHV9lChoBmgJaA9DCFyPwvUo2H/AlIaUUpRoFUs0aBZHQIcFA0GeMAF1fZQoaAZoCWgPQwjsUbgehT2AwJSGlFKUaBVLRmgWR0CHB2q94/u9dX2UKGgGaAloD0MICtejcD32gcCUhpRSlGgVS7NoFkdAhwfuv2Xb/XV9lChoBmgJaA9DCBSuR+F6boDAlIaUUpRoFUtSaBZHQIcKcwBYFJR1fZQoaAZoCWgPQwhxPQrXo9CAwJSGlFKUaBVLbWgWR0CHDDyEtdzGdX2UKGgGaAloD0MIuB6F61EAbsCUhpRSlGgVTfUBaBZHQIcNbPSlWOp1fZQoaAZoCWgPQwiamZmZmQmBwJSGlFKUaBVLeWgWR0CHEN7j1f3OdX2UKGgGaAloD0MIuB6F61EgbsCUhpRSlGgVTfUBaBZHQIcScjJMg2Z1fZQoaAZoCWgPQwiF61G4HoeAwJSGlFKUaBVLWmgWR0CHE3IcR15jdX2UKGgGaAloD0MIuB6F61FAbsCUhpRSlGgVTfUBaBZHQIcbEKeCkGl1fZQoaAZoCWgPQwi4HoXrUeBtwJSGlFKUaBVN9QFoFkdAhxyMJQcghnV9lChoBmgJaA9DCLgehetRAG7AlIaUUpRoFU31AWgWR0CHJJKWcBludX2UKGgGaAloD0MIuB6F61EgbsCUhpRSlGgVTfUBaBZHQIcmWG9Htnh1fZQoaAZoCWgPQwhI4XoUrkWAwJSGlFKUaBVLSGgWR0CHKJCBwuM/dX2UKGgGaAloD0MIcT0K16N6hMCUhpRSlGgVTU4BaBZHQIcpEt29tdl1fZQoaAZoCWgPQwiamZmZmaeAwJSGlFKUaBVLYGgWR0CHK6etCAtndX2UKGgGaAloD0MIuB6F61FgbsCUhpRSlGgVTfUBaBZHQIctGPaL4vh1fZQoaAZoCWgPQwiuR+F6FF6AwJSGlFKUaBVLTWgWR0CHL9iPyTY/dX2UKGgGaAloD0MIuB6F61EgbsCUhpRSlGgVTfUBaBZHQIc12thd+od1fZQoaAZoCWgPQwi4HoXrUSBuwJSGlFKUaBVN9QFoFkdAhzpq3uuzQnV9lChoBmgJaA9DCLgehetRQG7AlIaUUpRoFU31AWgWR0CHPNzGxUvPdX2UKGgGaAloD0MIj8L1KFzPg8CUhpRSlGgVTSUBaBZHQIdyP2saKk51fZQoaAZoCWgPQwiuR+F6FMaGwJSGlFKUaBVN3QFoFkdAh3Jx6fJ3gXV9lChoBmgJaA9DCAAAAAAAIoHAlIaUUpRoFUt+aBZHQIdziB7NSqF1fZQoaAZoCWgPQwgzMzMzMy2AwJSGlFKUaBVLQmgWR0CHdS/gR9PUdX2UKGgGaAloD0MIpHA9CtdFgMCUhpRSlGgVS0poFkdAh3U3trsSkHV9lChoBmgJaA9DCFyPwvUo2H/AlIaUUpRoFUs0aBZHQId3VjZteld1fZQoaAZoCWgPQwiamZmZmaeAwJSGlFKUaBVLYGgWR0CHd5xaxHG0dX2UKGgGaAloD0MIuB6F61FOgMCUhpRSlGgVS1BoFkdAh3jIKtxMnXV9lChoBmgJaA9DCM3MzMzMFIDAlIaUUpRoFUs9aBZHQId6o/FBIFx1fZQoaAZoCWgPQwikcD0K18d/wJSGlFKUaBVLMmgWR0CHezdHlOoHdX2UKGgGaAloD0MI9ihcj8JFgMCUhpRSlGgVS0loFkdAh33A3T/hl3V9lChoBmgJaA9DCLgehetRIG7AlIaUUpRoFU31AWgWR0CHgMzuWrwOdX2UKGgGaAloD0MIuB6F61HgbcCUhpRSlGgVTfUBaBZHQIeMqdat9x91fZQoaAZoCWgPQwi4HoXrUSBuwJSGlFKUaBVN9QFoFkdAh4+AaWHDaXV9lChoBmgJaA9DCPYoXI/CCYHAlIaUUpRoFUt7aBZHQIeQ6agElmh1fZQoaAZoCWgPQwi4HoXrUQBuwJSGlFKUaBVN9QFoFkdAh5GRfOUt7XV9lChoBmgJaA9DCLgehetRIG7AlIaUUpRoFU31AWgWR0CHk4TlDF6zdX2UKGgGaAloD0MI7FG4HoU9gMCUhpRSlGgVS0ZoFkdAh5Oaol2NenV9lChoBmgJaA9DCLgehetRMoHAlIaUUpRoFUuCaBZHQIeUyJ9Aood1fZQoaAZoCWgPQwjsUbgehQWFwJSGlFKUaBVNcgFoFkdAh5/jZL7GenV9lChoBmgJaA9DCLgehetRAG7AlIaUUpRoFU31AWgWR0CHn/1loUSJdX2UKGgGaAloD0MI16NwPQodgMCUhpRSlGgVS0BoFkdAh6I7+1jRUnV9lChoBmgJaA9DCGZmZmZmXIbAlIaUUpRoFU3IAWgWR0CHo4kpI+W4dX2UKGgGaAloD0MISOF6FK63f8CUhpRSlGgVSzFoFkdAh6XzsQd0aXV9lChoBmgJaA9DCLgehetRIG7AlIaUUpRoFU31AWgWR0CHqCbMottidX2UKGgGaAloD0MIuB6F61EgbsCUhpRSlGgVTfUBaBZHQIe1uH8CPp91fZQoaAZoCWgPQwgAAAAAANh/wJSGlFKUaBVLM2gWR0CHt5MBZIQOdX2UKGgGaAloD0MIuB6F61FAbsCUhpRSlGgVTfUBaBZHQIe352ECeVd1fZQoaAZoCWgPQwjsUbgehbd/wJSGlFKUaBVLMGgWR0CHuP1/2Cd0dX2UKGgGaAloD0MI7FG4HoWnf8CUhpRSlGgVSzBoFkdAh7lndfsu4HV9lChoBmgJaA9DCLgehetR4G3AlIaUUpRoFU31AWgWR0CHustITXardX2UKGgGaAloD0MIFK5H4Xrof8CUhpRSlGgVSzZoFkdAh7vKFqSHM3V9lChoBmgJaA9DCLgehetRIG7AlIaUUpRoFU31AWgWR0CHvBO58Sf2dX2UKGgGaAloD0MIj8L1KFynf8CUhpRSlGgVSy9oFkdAh70hIOH313V9lChoBmgJaA9DCI/C9Shcp3/AlIaUUpRoFUsvaBZHQIe9agsbvPV1fZQoaAZoCWgPQwjD9Shcj0KBwJSGlFKUaBVLhWgWR0CHvbv+fh/BdX2UKGgGaAloD0MImpmZmZkJgcCUhpRSlGgVS3loFkdAh75z5oGpuXV9lChoBmgJaA9DCHE9Ctej6H/AlIaUUpRoFUs3aBZHQIe+/qqwQlN1ZS4="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 1850, "n_steps": 2048, "gamma": 0.99, "gae_lambda": 0.5, "ent_coef": 0.0, "vf_coef": 0.5, "max_grad_norm": 0.5, "batch_size": 64, "n_epochs": 10, "clip_range": {":type:": "<class 'function'>", ":serialized:": "gAWV4QIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMVy9ob21lL25vaXNlYnJpZGdlLy5sb2NhbC9saWIvcHl0aG9uMy4xMC9zaXRlLXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS4JDAgQBlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMVy9ob21lL25vaXNlYnJpZGdlLy5sb2NhbC9saWIvcHl0aG9uMy4xMC9zaXRlLXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoFmgNjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoF4wHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/yZmZmZmZmoWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="}, "clip_range_vf": null, "normalize_advantage": true, "target_kl": null, "system_info": {"OS": "Linux-5.19.0-35-generic-x86_64-with-glibc2.35 # 36~22.04.1-Ubuntu SMP PREEMPT_DYNAMIC Fri Feb 17 15:17:25 UTC 2", "Python": "3.10.9", "Stable-Baselines3": "1.7.0", "PyTorch": "2.0.0", "GPU Enabled": "True", "Numpy": "1.23.5", "Gym": "0.21.0"}}
replay.mp4 CHANGED
Binary files a/replay.mp4 and b/replay.mp4 differ
 
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": -5.009999999999937, "std_reward": 8.881784197001252e-16, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2023-04-10T22:13:53.022883"}
 
1
+ {"mean_reward": -239.00999999999857, "std_reward": 2.842170943040401e-14, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2023-04-10T22:33:21.424035"}