Upload model to Hugging Face
Browse files- DQN-default.zip +1 -1
- DQN-default/data +19 -19
- DQN-default/policy.optimizer.pth +1 -1
- DQN-default/policy.pth +1 -1
- README.md +1 -1
- config.json +1 -1
- replay.mp4 +0 -0
- results.json +1 -1
DQN-default.zip
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 105963
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a31e8ea220793e410b9636b7630d4655f395bbc9ebb5ee7cd3eeaa2471c89ad2
|
3 |
size 105963
|
DQN-default/data
CHANGED
@@ -4,15 +4,15 @@
|
|
4 |
":serialized:": "gAWVMAAAAAAAAACMHnN0YWJsZV9iYXNlbGluZXMzLmRxbi5wb2xpY2llc5SMCURRTlBvbGljeZSTlC4=",
|
5 |
"__module__": "stable_baselines3.dqn.policies",
|
6 |
"__doc__": "\n Policy class with Q-Value Net and target net for DQN\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
|
7 |
-
"__init__": "<function DQNPolicy.__init__ at
|
8 |
-
"_build": "<function DQNPolicy._build at
|
9 |
-
"make_q_net": "<function DQNPolicy.make_q_net at
|
10 |
-
"forward": "<function DQNPolicy.forward at
|
11 |
-
"_predict": "<function DQNPolicy._predict at
|
12 |
-
"_get_constructor_parameters": "<function DQNPolicy._get_constructor_parameters at
|
13 |
-
"set_training_mode": "<function DQNPolicy.set_training_mode at
|
14 |
"__abstractmethods__": "frozenset()",
|
15 |
-
"_abc_impl": "<_abc._abc_data object at
|
16 |
},
|
17 |
"verbose": true,
|
18 |
"policy_kwargs": {},
|
@@ -31,7 +31,7 @@
|
|
31 |
},
|
32 |
"action_space": {
|
33 |
":type:": "<class 'gym.spaces.discrete.Discrete'>",
|
34 |
-
":serialized:": "gAWVNAsAAAAAAACME2d5bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpRLBIwGX3NoYXBllCmMBWR0eXBllIwFbnVtcHmUjAVkdHlwZZSTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////
|
35 |
"n": 4,
|
36 |
"_shape": [],
|
37 |
"dtype": "int64",
|
@@ -43,7 +43,7 @@
|
|
43 |
"_num_timesteps_at_start": 0,
|
44 |
"seed": null,
|
45 |
"action_noise": null,
|
46 |
-
"start_time":
|
47 |
"learning_rate": 0.0001,
|
48 |
"tensorboard_log": null,
|
49 |
"lr_schedule": {
|
@@ -52,7 +52,7 @@
|
|
52 |
},
|
53 |
"_last_obs": {
|
54 |
":type:": "<class 'numpy.ndarray'>",
|
55 |
-
":serialized:": "
|
56 |
},
|
57 |
"_last_episode_starts": {
|
58 |
":type:": "<class 'numpy.ndarray'>",
|
@@ -60,15 +60,15 @@
|
|
60 |
},
|
61 |
"_last_original_obs": {
|
62 |
":type:": "<class 'numpy.ndarray'>",
|
63 |
-
":serialized:": "
|
64 |
},
|
65 |
-
"_episode_num":
|
66 |
"use_sde": false,
|
67 |
"sde_sample_freq": -1,
|
68 |
"_current_progress_remaining": 0.0,
|
69 |
"ep_info_buffer": {
|
70 |
":type:": "<class 'collections.deque'>",
|
71 |
-
":serialized:": "
|
72 |
},
|
73 |
"ep_success_buffer": {
|
74 |
":type:": "<class 'collections.deque'>",
|
@@ -87,12 +87,12 @@
|
|
87 |
":serialized:": "gAWVNQAAAAAAAACMIHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5idWZmZXJzlIwMUmVwbGF5QnVmZmVylJOULg==",
|
88 |
"__module__": "stable_baselines3.common.buffers",
|
89 |
"__doc__": "\n Replay buffer used in off-policy algorithms like SAC/TD3.\n\n :param buffer_size: Max number of element in the buffer\n :param observation_space: Observation space\n :param action_space: Action space\n :param device: PyTorch device\n :param n_envs: Number of parallel environments\n :param optimize_memory_usage: Enable a memory efficient variant\n of the replay buffer which reduces by almost a factor two the memory used,\n at a cost of more complexity.\n See https://github.com/DLR-RM/stable-baselines3/issues/37#issuecomment-637501195\n and https://github.com/DLR-RM/stable-baselines3/pull/28#issuecomment-637559274\n Cannot be used in combination with handle_timeout_termination.\n :param handle_timeout_termination: Handle timeout termination (due to timelimit)\n separately and treat the task as infinite horizon task.\n https://github.com/DLR-RM/stable-baselines3/issues/284\n ",
|
90 |
-
"__init__": "<function ReplayBuffer.__init__ at
|
91 |
-
"add": "<function ReplayBuffer.add at
|
92 |
-
"sample": "<function ReplayBuffer.sample at
|
93 |
-
"_get_samples": "<function ReplayBuffer._get_samples at
|
94 |
"__abstractmethods__": "frozenset()",
|
95 |
-
"_abc_impl": "<_abc._abc_data object at
|
96 |
},
|
97 |
"replay_buffer_kwargs": {},
|
98 |
"train_freq": {
|
|
|
4 |
":serialized:": "gAWVMAAAAAAAAACMHnN0YWJsZV9iYXNlbGluZXMzLmRxbi5wb2xpY2llc5SMCURRTlBvbGljeZSTlC4=",
|
5 |
"__module__": "stable_baselines3.dqn.policies",
|
6 |
"__doc__": "\n Policy class with Q-Value Net and target net for DQN\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
|
7 |
+
"__init__": "<function DQNPolicy.__init__ at 0x7fe79b873520>",
|
8 |
+
"_build": "<function DQNPolicy._build at 0x7fe79b8735b0>",
|
9 |
+
"make_q_net": "<function DQNPolicy.make_q_net at 0x7fe79b873640>",
|
10 |
+
"forward": "<function DQNPolicy.forward at 0x7fe79b8736d0>",
|
11 |
+
"_predict": "<function DQNPolicy._predict at 0x7fe79b873760>",
|
12 |
+
"_get_constructor_parameters": "<function DQNPolicy._get_constructor_parameters at 0x7fe79b8737f0>",
|
13 |
+
"set_training_mode": "<function DQNPolicy.set_training_mode at 0x7fe79b873880>",
|
14 |
"__abstractmethods__": "frozenset()",
|
15 |
+
"_abc_impl": "<_abc._abc_data object at 0x7fe79b8868c0>"
|
16 |
},
|
17 |
"verbose": true,
|
18 |
"policy_kwargs": {},
|
|
|
31 |
},
|
32 |
"action_space": {
|
33 |
":type:": "<class 'gym.spaces.discrete.Discrete'>",
|
34 |
+
":serialized:": "gAWVNAsAAAAAAACME2d5bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpRLBIwGX3NoYXBllCmMBWR0eXBllIwFbnVtcHmUjAVkdHlwZZSTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYowKX25wX3JhbmRvbZSMFG51bXB5LnJhbmRvbS5fcGlja2xllIwSX19yYW5kb21zdGF0ZV9jdG9ylJOUjAdNVDE5OTM3lIWUUpR9lCiMDWJpdF9nZW5lcmF0b3KUaBSMBXN0YXRllH2UKIwDa2V5lIwSbnVtcHkuY29yZS5udW1lcmljlIwLX2Zyb21idWZmZXKUk5QolsAJAAAAAAAA/HeT+DTgV1KAtu+YENCzNwRvBBq6gIJE8+pP5LxeQewk6CFTYWt3V+fcBAp8D0lSogc8YX1OsiAmQXHwrHjLidCOpnyHlWBCFdq4KWHuv7RZKaREigrmsVb+Hqk79I/U/6j4WCNS7lB1eZap2euPoG5ovOvFtG0j1UMEwQ3PNSc8gsrM4PhN1JL3t3Lvz7fFXfm0rw5/nfC4D6T5SlVZnLGXCYEN0wGBy3fxbGenwdlzbyGxCkIIiu0+4ahwSLtCqXFgEx9oQ/m4ycl3XwnwA0d08J9XzxcdWKcT7qMTDjkw6ZR3AQLVisbkmUKwf2g3CtZ+GWhbRMKdmG5jNDhdZPIqYS6AUe2EfU05zdvxBfDV3f/WyuxMGRi7ClawqPB3yUsv7UQkARDOHxl3LEXvyWi2/2tXP7v0Yu4u2LyYVJRqIa0cDy3JXSoaxwmIK8tUFkT/PRHJbaPikZF/tZhvROASeblCVj9dFeZH1sp6Ya6U8TKNmfXAAJFK5Xn/fFNsNpI+Rfabdudkx0LKToSAtVR5A3mTMx0UCFXegMj1h2U0lFMeN+3nN1rlUEnbNZxtS4isGwH+w26kgXErnvs+V+qnQoriglip/lQYrZx3IiXvjmSqTOienH1QKTB62qxQzro23mx4wKPraN5EZ0iI8qouo2B2H6/92tEdgf9Y4mOSc2rfgilZLBMcvOy3rGqcjBxctnvQECERZJV7osqTpwLWi0q2R6bzWmzOjAmRJ9hZ81RWz8M1vePj4fbLQm7bZlquKL/3RL5b54HYEsR/YjHkF6iirS6dsto4LeU0ntRfUd04qI6gvrFoJ8Xt5QUWrF7EKyWTTRVqVbflMN9zF68GrzOwU25maCon8twXumTcFxpRlKiQHJu5RmDx3W7bvG5Va7iZ8bq5WeZYokJ6zNxjmlkrQ5eSjLw3qohX/ve2LTQVSvnnCP0G06VSAXB995dQfjpuKNUqt45GJxYd9gFw3/H5tIuG4sAydj5PdnW9vRkRujYnYSYEeEIJB947BkzAboYaZ6xcGOzlX43xmSvMEbR3YSTno7T9CbHCJ9mZKAoxHStM23chmw6RgdZhuaQdOhzMBsZn+Ks+p0dMLxEkl53gBkhbGqlLn/2fnuC709Zvxr5wdX1U+kXFoO8faiZ3/hlCkFx/cka/xn17TzxIVcMB50fvz/Fhf15vf9NOGPNKyLiIaSD0X+2/8d2MoGUroQ03up69+cDf+npxcIyoOcX+9lkkgyvcIypininzcyl/+XM7LFWzs0ismfSquwtbh8HqDxPFY7OiItu0/Jz52bL0ZOnvLlQrBE2wJteXkbwFm1DSSe0hZyPFvQ2Y7EEfGSpACPN23oy/5HmJwiyExODxGWjV7acV9GULD5FXIM9hf0ifRgCXfrDMl8QvhDJbGi2Jxt8EdwJOsey3KuKHF1jgNyOaZaaxlQOsKceJOUO6GyTQk3TrzV0wZP/kpXV6x3h9ocfE5XPXdPYTm0XbhYRiwfme495M5UwRZDosjCUqU65KInBP4lhde6fTlU6RAJOt9A/YQBp2x88+NLK7uerInxKl1hTDkN6oGW18AH6NtdLHW6lQFHIp62LRshsxHv+ofQCnt2F3vCaAmnmgIpdbi4P5Nm5EQZo3SRsRr0QjqK3GqQzaEF5GrV9J9ITDf46WUwk+g1wBfVzhZuqRdKtZHCeJmy3kSyzIWskpqeQzpiGHx2QKQ8KfB0RwHl4WeEe1rqSkwxXyqDhSAB/sK/lmhaKBAxdSxUjQob2YpWnAk8BAtyB2A3YZU0eP8Q3end8xtV/EVlFZ8gDc4peZDeLMKEITLA/LhOme/mFRDFpHM+VRTUM85hu8/j3grNemL5+8QCg6yQIK7UMZiTy6rgtIhs1Mg+iFVJ3ABKAAqqa+hM/E5vdnf4+/sv1F3SUEz4uB6ht4Wb5ahC8Y/eThDdxcHszTlp23hSoCS7Cgvvnqq5t9ehR6aCosdtNoWqKzw6roKcOpASAOlV5alGT+eHvZuR2lE0n9z2ywDwUB1HodvkpE7qJjQiav87IaPIaMTAc2zUbop8wUuQRr+CmArTSsp2Yx0BHFa0I5vIndjrAljtx4AARXCw/yHY46KAdfL8SvZV57tVPBadWsGVIbyxh8Jhfe2FuizUK/4Wmk3GU0ThnfpGoyPL9uaPsT7IT+su7LqvPoaDoXM9onlsOhk6epSKDr0jFMJ4QpxlKWsTE69y8vGEe48IkLhf7oAWNxDnmgvb4l3KuUJz15WzZYCubb4NhYozWTuEPgSrv57SPbs2Wz+dAwVgdda8+Z4U2PVxh7pFW0KDWL6vra1PBpQMrfmuGOU7s3ySZ9+GYpxaf5SRHqfGBxzheocWLsbxjpJEjzac/sZasVApeMW3/L4fPKhNdSzI6yZMtN9cfT9ANNl+gcZRClwMcAHR/c3yZZIFRbJLNbspe9Kx0kQdamNhEZecsn3L+D4/RkzKki4YuuzQeGugRZwO6/tEhUGYikozNOtiPIR+JNqmyYcANMGueFoGO1WsC9yr+MY8c5jcDNue59n8Lrq/jP0dwVGVI874XrkGW7WjrRt1bj2N2imFsZ65hsQtPF1A9DssJXl9Xgl9Bind8MHaLQ2MDOvW0o3afH/Sp5o3x5kLc3v1fUppRp1t8AJW1ieJZQVMwSSuT3Qhk6+gDoU/1V3IQRlmAJmkzMLDWmMv3QzCqheQOELpob6y0JQ0aCYhKpaKv9s2OoWJ/bSwS+12YTQmpyAJThLPiIF0iVJmnVy3pfmOupVC+vA3WrjZErUGM0N4AvHyVwAttS82irz+8j27QW4cNcD81VR2f35RDwrQQYEoqoacCriQpKtrdLpvx1V3qdH3Vy90nFX3huhkjBzkH+z5GVKvgkrtWjjTRZb01s1k5htI5RL8d7jc5jjIV629+VPzq7Itbd80qeiofP8zg/QSuapfjU3x9eFyFkgpCf7BZqSxNbf+refFi14ElgOS0hBe3NRfaMXemWFAw9ed0Jtv7Sdbs+NyKsSKMjI6q+lX0VGstSYOIO1Mh0ZcSrcZ/OuF44q6TXjJ8PsMmoHRLazweEWQW7WgkOZX6UwpliVSdar60Xu4SjMUB+7fFBZgNUEAhmRIVMo09Ypq/YCA/3hPRbLhYviK2upGZVNHN2Ja/qGZF2WH4991wTpK1CeXfv4rv6h7FlAU6/PbRcOM4/HlbKUew+BXUKfE/rEfc9XzDx6uB4D8HUbNgjLa/WhGEFIYIIkc6facNrAj75Vp6Ic08Tw6piicsm0GDcWZOJgwUpNyfvU1Hffho01gTteteRmtaYwl9L2vlriHbWvBYTlGgKjAJ1NJSJiIeUUpQoSwNoDk5OTkr/////Sv////9LAHSUYk1wAoWUjAFDlHSUUpSMA3Bvc5RL7HWMCWhhc19nYXVzc5RLAIwFZ2F1c3OURwAAAAAAAAAAdWJ1Yi4=",
|
35 |
"n": 4,
|
36 |
"_shape": [],
|
37 |
"dtype": "int64",
|
|
|
43 |
"_num_timesteps_at_start": 0,
|
44 |
"seed": null,
|
45 |
"action_noise": null,
|
46 |
+
"start_time": 1680996362691066755,
|
47 |
"learning_rate": 0.0001,
|
48 |
"tensorboard_log": null,
|
49 |
"lr_schedule": {
|
|
|
52 |
},
|
53 |
"_last_obs": {
|
54 |
":type:": "<class 'numpy.ndarray'>",
|
55 |
+
":serialized:": "gAWV1QAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJZgAAAAAAAAAPF2pMHo2pxCE622PwAAyELLRdhBxGN2QZBKAUJHGLNCUh+DPzdpEkIAAMhCcWR5Qq3DjUK6ubhCivRQPwAAyEKb8cBCAADIQgCAFEMAAMhC67cXP7g/xUIAAMhCFTK1QpSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGJLBEsGhpSMAUOUdJRSlC4="
|
56 |
},
|
57 |
"_last_episode_starts": {
|
58 |
":type:": "<class 'numpy.ndarray'>",
|
|
|
60 |
},
|
61 |
"_last_original_obs": {
|
62 |
":type:": "<class 'numpy.ndarray'>",
|
63 |
+
":serialized:": "gAWV1QAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJZgAAAAAAAAAHJpmcH7BZ5CvFa0PwAAyEI+6eFBFzOGQfIrB0LbsLNC0GmBP/PyGEIAAMhCOit7Qte/kEJmBrlCx5JOPwAAyEJkC8RCAADIQgAAFkMAAMhCV4cWP9PFxkIAAMhC56a2QpSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGJLBEsGhpSMAUOUdJRSlC4="
|
64 |
},
|
65 |
+
"_episode_num": 3279,
|
66 |
"use_sde": false,
|
67 |
"sde_sample_freq": -1,
|
68 |
"_current_progress_remaining": 0.0,
|
69 |
"ep_info_buffer": {
|
70 |
":type:": "<class 'collections.deque'>",
|
71 |
+
":serialized:": "gAWV4AsAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHwGLb37UG3WqMAWyUSziMAXSUR0Bk0/ZyuIRAdX2UKGgGR8BjwjGza9K3aAdLKmgIR0Bk1i9ugpSadX2UKGgGR8Bg9iL0jC53aAdLPmgIR0Bk2LU5MlC1dX2UKGgGR8BVMGQSzw+daAdLZ2gIR0Bk21iH6/IsdX2UKGgGR8BXCIUahpQDaAdLgmgIR0Bk26dpZfUndX2UKGgGR8Bh2QIWxhUjaAdLa2gIR0Bk3lum78NydX2UKGgGR8BjgfKISDh+aAdLJ2gIR0Bk3m1D0DlpdX2UKGgGR8Bkw0YXO4XoaAdLHmgIR0Bk4KqIacZtdX2UKGgGR8BF5G21D0DmaAdLaGgIR0Bk4MSK3uuzdX2UKGgGR8BkBtId2gWaaAdLJ2gIR0Bk47MJQcghdX2UKGgGR8BDOzbnHNoraAdLV2gIR0Bk5SkZaV2SdX2UKGgGR8BDcJ3HJcPfaAdLR2gIR0Bk5kCNjslcdX2UKGgGR8BVAwGr0aqCaAdLVGgIR0Bk6iA4GUwBdX2UKGgGR8BdP4qgAZKnaAdLRWgIR0Bk6nFefI0ZdX2UKGgGRz/vGcOLBKtgaAdLyWgIR0Bk6zp1RtP6dX2UKGgGR8Bkw0YXO4XoaAdLHmgIR0Bk7NNN8E3bdX2UKGgGR8BQ9ymZVn27aAdLXmgIR0Bk7YEbHZK4dX2UKGgGR8BaUzLOiWVvaAdLVWgIR0Bk8a7I1cdHdX2UKGgGR8BLeKv3ai9JaAdLYWgIR0Bk9LxG2CumdX2UKGgGR8Bi8vcnE2pAaAdLLWgIR0Bk9REc81XOdX2UKGgGR8BYEsCHRCyAaAdLfGgIR0Bk9jSJCSiedX2UKGgGR8Bkf11jiGWVaAdLJWgIR0Bk+PJeVs1sdX2UKGgGR0Bdupc1O0swaAdLyWgIR0Bk+XSQYDT0dX2UKGgGR8BabAYtQKrraAdLR2gIR0Bk+n/tIClrdX2UKGgGR8BjPH6GgzxgaAdLK2gIR0Bk/E+X7cfvdX2UKGgGR0B3T0eXAuZkaAdLhGgIR0Bk/tejVQQ+dX2UKGgGR8BWK07r9l3AaAdLS2gIR0Bk/0IsyzomdX2UKGgGR8Bgh5InSfDlaAdLRWgIR0Bk/9JSR8txdX2UKGgGR8Bd5h6jWTX8aAdLR2gIR0BlAcKzAvcrdX2UKGgGR8BjF1iQT238aAdLK2gIR0BlBPwPRRdhdX2UKGgGR8Bj9cvkBCD3aAdLJGgIR0BlB8Re1KGtdX2UKGgGRz/1A/TspoboaAdLj2gIR0BlCjJ0W/JvdX2UKGgGR0BW/O49X9zfaAdLyWgIR0BlDjPQfIS2dX2UKGgGR8BhlUY2sJY1aAdLOWgIR0BlDoPTXrdFdX2UKGgGR0BgNLYukDZEaAdLyWgIR0BlDyH6/IsAdX2UKGgGR8Bj+DsWweNlaAdLJmgIR0BlESErXlKcdX2UKGgGR8BhIK/qPfbcaAdLRWgIR0BlFF9F4LThdX2UKGgGR0BC08dYGMXKaAdLyWgIR0BlFwLw4KhMdX2UKGgGR8BVkJIczZYgaAdLdmgIR0BlF4dXDFZQdX2UKGgGR8BjJnwNLDhtaAdLL2gIR0BlF/hS9/SZdX2UKGgGR8BV7Fpj+aScaAdLaGgIR0BlGSApazNVdX2UKGgGR8BkoLfLs8gZaAdLH2gIR0BlGZPKuB+XdX2UKGgGR8BkGOkpI+W4aAdLI2gIR0BlGsl9jPOZdX2UKGgGR8BU9S+HrQgLaAdLaWgIR0BlH5R4yGi6dX2UKGgGR8BVyv7aZhKEaAdLXmgIR0BlIFSn+AEudX2UKGgGR8BjNW+wkgOjaAdLKmgIR0BlIsoUi6g/dX2UKGgGR8Bj1okAxSHeaAdLJWgIR0BlIzCYTj//dX2UKGgGR8Bi9xFG5MDfaAdLLGgIR0BlJon2IwdsdX2UKGgGR8BgUiU9pyp8aAdLQWgIR0BlJ9kSVW0adX2UKGgGR0BZ0rw4KhL5aAdLyWgIR0BlKO/cnE2pdX2UKGgGR0BVIpvo/zJ7aAdLyWgIR0BlKieCkGiYdX2UKGgGR8Bis+bLEDQraAdLLmgIR0BlK2xOclPadX2UKGgGR8BldA5ksjFAaAdLG2gIR0BlLYESuhbodX2UKGgGR8BYooX9BKL9aAdLVmgIR0BlL5WxQizLdX2UKGgGR8BhC4iX6ZYxaAdLL2gIR0BlMR0yP+4tdX2UKGgGR8ALlP557gKnaAdLd2gIR0BlM0pkPMB7dX2UKGgGR8Bji85jpcHGaAdLKWgIR0BlNEX7+DODdX2UKGgGR8BfVNRBNVR2aAdLPWgIR0BlNFmFrVOLdX2UKGgGR8BlUQkona37aAdLHmgIR0BlNbs6aLGadX2UKGgGR0BhhZWtEG7jaAdLyWgIR0BlNig2606YdX2UKGgGR8BjgqyhSLqEaAdLKGgIR0BlN3iDM/yHdX2UKGgGR8BikVcY64lQaAdLKGgIR0BlONPxhDw6dX2UKGgGR8BciS8an753aAdLN2gIR0BlOlhVlwtKdX2UKGgGR8BYjFERaouPaAdLXWgIR0BlO3m1YyO8dX2UKGgGR8BkDB6OYIBzaAdLJmgIR0BlO7y8SPELdX2UKGgGR8BAQhC+lCTmaAdLTGgIR0BlPVg4OtnxdX2UKGgGR8Bjtb/yXlbNaAdLJmgIR0BlPV/e+Eh8dX2UKGgGR8Ba/QWrOqvNaAdLK2gIR0BlPul0o0AMdX2UKGgGR8BVdUmY0EX+aAdLQGgIR0BlQLFMqSX/dX2UKGgGR8BjAqT6i0v5aAdLLGgIR0BlQ/+S8rZrdX2UKGgGR8BZcEAT7EYPaAdLWWgIR0BlRDCDVYp2dX2UKGgGR8Bk6ctXgccVaAdLHWgIR0BlRkOG0u14dX2UKGgGR8BkaSTMaCL/aAdLIGgIR0BlRq/wiJO4dX2UKGgGR8BlBkfs/pt8aAdLHWgIR0BlSI6wMYuTdX2UKGgGR8BgtHNA1NxmaAdLIWgIR0BlSTgflp49dX2UKGgGR8Bj8rzf779AaAdLI2gIR0BlSyzE74i5dX2UKGgGR0BanF3pwCKaaAdLyWgIR0BlTMCHRCyAdX2UKGgGR8AI7w2ETQE7aAdLyWgIR0BlTkQ9RrJsdX2UKGgGR8Bjko24uscRaAdLMGgIR0BlTuDe0ojOdX2UKGgGR8BhGSdlNDc/aAdLRWgIR0BlVBSpBHCodX2UKGgGR8BcJw75mAbyaAdLZmgIR0BlVIgJTl1bdX2UKGgGR8BcTVPznRsuaAdLaGgIR0BlViwfQrtmdX2UKGgGR0BKt19nbqQjaAdLyWgIR0BlWHcrRSgodX2UKGgGR8BisOaa1Cw9aAdLNGgIR0BlWiLfk3judX2UKGgGR8BimdK7I1cdaAdLLmgIR0BlXAwfyPMjdX2UKGgGR8BQo/6TGHYZaAdLZGgIR0BlXEBIWgvldX2UKGgGR8Bjtb/yXlbNaAdLJmgIR0BlXSy6cy31dX2UKGgGR8Bj5V1hb4ahaAdLJmgIR0BlXySA6MisdX2UKGgGR8BjwDRYzSCwaAdLMGgIR0BlYM+5e7cxdX2UKGgGR0BBrI/qxC6ZaAdLyWgIR0BlY4WrOqvNdX2UKGgGR8BggO9rXUYsaAdLP2gIR0BlZY287IT5dX2UKGgGR8BkoLfLs8gZaAdLH2gIR0BlZfFcY64ldX2UKGgGR8BSf8GcFyJbaAdLW2gIR0BlZicLBsQ/dX2UKGgGR8BkbW3fAKv3aAdLK2gIR0BlaOWUr08OdX2UKGgGR8BkX4UtZmqYaAdLK2gIR0BlaTWZqmCRdX2UKGgGR8BlLPJNj9XLaAdLHWgIR0Bla3Vf/m1ZdX2UKGgGR8BnAVxCIDYAaAdLyWgIR0Bla4dZJTVEdX2UKGgGR8BbaL4SHuZ1aAdLUGgIR0BlbFDBuXNUdX2UKGgGR8BdYTt1IRRNaAdLJ2gIR0Blbnt4RmK7dX2UKGgGR8BdAhc7hegMaAdLXWgIR0Blco/7iyY5dWUu"
|
72 |
},
|
73 |
"ep_success_buffer": {
|
74 |
":type:": "<class 'collections.deque'>",
|
|
|
87 |
":serialized:": "gAWVNQAAAAAAAACMIHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5idWZmZXJzlIwMUmVwbGF5QnVmZmVylJOULg==",
|
88 |
"__module__": "stable_baselines3.common.buffers",
|
89 |
"__doc__": "\n Replay buffer used in off-policy algorithms like SAC/TD3.\n\n :param buffer_size: Max number of element in the buffer\n :param observation_space: Observation space\n :param action_space: Action space\n :param device: PyTorch device\n :param n_envs: Number of parallel environments\n :param optimize_memory_usage: Enable a memory efficient variant\n of the replay buffer which reduces by almost a factor two the memory used,\n at a cost of more complexity.\n See https://github.com/DLR-RM/stable-baselines3/issues/37#issuecomment-637501195\n and https://github.com/DLR-RM/stable-baselines3/pull/28#issuecomment-637559274\n Cannot be used in combination with handle_timeout_termination.\n :param handle_timeout_termination: Handle timeout termination (due to timelimit)\n separately and treat the task as infinite horizon task.\n https://github.com/DLR-RM/stable-baselines3/issues/284\n ",
|
90 |
+
"__init__": "<function ReplayBuffer.__init__ at 0x7fe79b86f130>",
|
91 |
+
"add": "<function ReplayBuffer.add at 0x7fe79b86f1c0>",
|
92 |
+
"sample": "<function ReplayBuffer.sample at 0x7fe79b86f250>",
|
93 |
+
"_get_samples": "<function ReplayBuffer._get_samples at 0x7fe79b86f2e0>",
|
94 |
"__abstractmethods__": "frozenset()",
|
95 |
+
"_abc_impl": "<_abc._abc_data object at 0x7fe79b9df8c0>"
|
96 |
},
|
97 |
"replay_buffer_kwargs": {},
|
98 |
"train_freq": {
|
DQN-default/policy.optimizer.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 43951
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1fbb4a01d457dd5b85b53c8aad221fa65067e43b448c7b61e5f795dc679ab826
|
3 |
size 43951
|
DQN-default/policy.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 43009
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:34647f4c6bb65abf3a18b725174195a7d0a286af592272bac6f813209b7c0558
|
3 |
size 43009
|
README.md
CHANGED
@@ -16,7 +16,7 @@ model-index:
|
|
16 |
type: RoombaAToB
|
17 |
metrics:
|
18 |
- type: mean_reward
|
19 |
-
value:
|
20 |
name: mean_reward
|
21 |
verified: false
|
22 |
---
|
|
|
16 |
type: RoombaAToB
|
17 |
metrics:
|
18 |
- type: mean_reward
|
19 |
+
value: -117.23 +/- 40.81
|
20 |
name: mean_reward
|
21 |
verified: false
|
22 |
---
|
config.json
CHANGED
@@ -1 +1 @@
|
|
1 |
-
{"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVMAAAAAAAAACMHnN0YWJsZV9iYXNlbGluZXMzLmRxbi5wb2xpY2llc5SMCURRTlBvbGljeZSTlC4=", "__module__": "stable_baselines3.dqn.policies", "__doc__": "\n Policy class with Q-Value Net and target net for DQN\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function DQNPolicy.__init__ at 0x7f271a077520>", "_build": "<function DQNPolicy._build at 0x7f271a0775b0>", "make_q_net": "<function DQNPolicy.make_q_net at 0x7f271a077640>", "forward": "<function DQNPolicy.forward at 0x7f271a0776d0>", "_predict": "<function DQNPolicy._predict at 0x7f271a077760>", "_get_constructor_parameters": "<function DQNPolicy._get_constructor_parameters at 0x7f271a0777f0>", "set_training_mode": "<function DQNPolicy.set_training_mode at 0x7f271a077880>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7f271a47edc0>"}, "verbose": true, "policy_kwargs": {}, "observation_space": {":type:": "<class 'gym.spaces.box.Box'>", ":serialized:": "gAWVkQEAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLBoWUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWGAAAAAAAAAAAABbEAADIwwAAAAAAAAAAAAAAAAAAAACUaAtLBoWUjAFDlHSUUpSMBGhpZ2iUaBMolhgAAAAAAAAAAAAWRAAAyEPbD0lAAADIQgAAyEIAAMhClGgLSwaFlGgWdJRSlIwNYm91bmRlZF9iZWxvd5RoEyiWBgAAAAAAAAABAQEBAQGUaAiMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLBoWUaBZ0lFKUjA1ib3VuZGVkX2Fib3ZllGgTKJYGAAAAAAAAAAEBAQEBAZRoIksGhZRoFnSUUpSMCl9ucF9yYW5kb22UTnViLg==", "dtype": "float32", "_shape": [6], "low": "[-600. -400. 0. 0. 0. 0.]", "high": "[600. 400. 3.1415927 100. 100. 100. ]", "bounded_below": "[ True True True True True True]", "bounded_above": "[ True True True True True True]", "_np_random": null}, "action_space": {":type:": "<class 'gym.spaces.discrete.Discrete'>", ":serialized:": "gAWVNAsAAAAAAACME2d5bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpRLBIwGX3NoYXBllCmMBWR0eXBllIwFbnVtcHmUjAVkdHlwZZSTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYowKX25wX3JhbmRvbZSMFG51bXB5LnJhbmRvbS5fcGlja2xllIwSX19yYW5kb21zdGF0ZV9jdG9ylJOUjAdNVDE5OTM3lIWUUpR9lCiMDWJpdF9nZW5lcmF0b3KUaBSMBXN0YXRllH2UKIwDa2V5lIwSbnVtcHkuY29yZS5udW1lcmljlIwLX2Zyb21idWZmZXKUk5QolsAJAAAAAAAA2oqCETT2zjx0rhixTUVQLKFaEtrmhv3+heEQMj8hgue/95d6rF2ARzDd3z0cTa37qIpoaSxgkTW1BpAL223cqa2ERljmVAZyAnFXW2IM07yRwqK/+S0wL0RuePVCcKVNVT1/zpkGnfXOSjh+xx4kNFEjKapbUGfEoK+PJqbXE7tdRF/eGF+icG+3BEDH+GBAM3ms9OL0H6jI/gNBYxh5SytWm9z5twmXzYmHzrAshORvBeWiEM2Ff7XqBp8OwgQCPrnOGD2Ja5KqigjHJGf5c3TuyW+QVbpdUl/9bD1U5HqXEDbYqwQQJC6EJ+jlYvJ+jV0mFsxtQXRlWP1FdZF0fePKuXTwKpnFnmTn4Jg84iKoPspMWDm0vHqR7h8DTrjOijjR74Hw/JIcW2Acj0bcLurwqtdEt+Du0LA/hNqu3Ogh8dUkpP0QzNhBp+ZyZdwL78VzlzpLAAA6bfu9i8jvBdGOSFQvgMtiEwmZG/TQqrag+8YTSC2xHf+u80Yql4LJT0lDxPpYQlfq2HssBfgGJp+LLQayp86ar5owF6a81Dg7TFse85yvm/kw2DnrFHPyd571wBRRgwLLRfdwxnaJ2yAM8RSwuDbrT4YFL/9QlVXf/usACfc7KUsd3DdGVFfkGPuvPOGD4PMEo9tuwAYUZWY4Of5aVf6eSGqSZxzWeFq5SPuqPG6OJt94ac7O07PoeJWGC1tgU06oxw4phD28P4AFRjtTzmk4I599EV+fnJWFq2OsiQ9omG7WWtjPi9sOqRnaqXOYsoBgofrDcEwRQrwjTUrwxZ4Pum66PxB8MPsPK2yy+YLejfTBT06h9Pbu4R2bXBwOJjoxl0+wPiUZXk5qe9RDRl++hxFw0mr++2C4OyQw9jKg1hFjicOLkNgYhqlPeFCPUWSnxitHjkceXb4fZK5TJrbR2SFdqriItXSgaOQeNjrMj1umOcBgcd/YYs0QvEf8OuyKjEd3PZl7I48SlhO79my5Q3B2qvfiwMLIgmKEp0M1uMafJwz3yFaQuTSIxVaNWfnz3KcEMAw+GZVUC3owIbs+b96qZaZC9k8N5qzSZJnKkXVV5X5G26hMRMEkfbK2cwkIzOWy+8E417tv/QcNMxJa4NoTYyVOJjVd1tObnVHK97zk5essAxpHV0yL1L1AH3cAiQ/5lyWgpCOVr0iCzbuEoBh6NiPs8ijy3Vvk5AFCp3jv3cQZK5Hc+rYAhituTT/r4zDRGsOvojBmbGFsdX+0QFwnCEwo4zCUBYmdaHLuGROOd++2c7DiOqmX/4DvdwTv9vt50sr7b/dJhvnm+owF/LOTHY+EJkoproMOtXDqaN2ss9W4iZLNKUHUEMU8RUSRIyZoUyqkV43BfDE0xgXqtGZ8BaA7dsYY0YiOWrioVdFRm0Q+jBsPsMtAiUwzTpBlH86bU3Yjk+OEWh6V1ZdTxZQiT1ONxGcV1eF1uK5q/AvntDaUBnVBS7GYVZoYgjTfrFwW2IuiTNWClWtQxEjP7MGXeetUFieFWcAxnKfBfvN2uvdCBSORmjAtLJ9pB4DnxcQwJAgTkVSy+KYax/q6ryUYehPMQvOEFv0lRv8Sc/ldDUWJ2n9wBOfzHQxFR4zmeoNA3GEWJrGTiOCXAVaSP6uzE7WsJ1H4MTWp5SBuklyPOIkbds+9Lq7wdYlbNWUsprUyVCbBwbS/ER111HGu0aTIZkyaS1PL6BTY8UfafQuHudI7fq+gUzefASLFykrNix1SrSNP1xfu2JpqnyhUZVcFLkFi4it1bIKVE8QsdRaT6A1RQBi8W0pXe8gDxDKvXJRhlvSSpHepyLfIW6TKxAgJEAnQ+DU/55XZCfD0EZrxdHjPHx2B/2VRJcK9M/DQoIsbcOYtHraPhxedCwjcb57s9ar6W9L0bxsoF+5kmGfsON8tGm8CO9R1hdx3PwJlrk5pAR4RgvjdyQmUjtr2I7UanVd2Ciy6xuPKfCDR9hlIJyK7mpN300buMjkcoiJKmpEOd23UUiywLRnYA7pgoA7RHHBz7jqrc9K8Jqk4sVXnorNnCvqdCqVY5LbZMw+edZ6y7ycTP6zdzXQhyEzwdtt+r57RBqFIJOY+RwVkglGJfde3dpAR7XEuk4VWbrJoEt7MBOMHQUymvoKRasBmAqZe3WENkIBQCZEZ1dgvVhO+YZ5Nca1uT3lmgYvu53R8XVuFBAqPIAhfPb9Bo63GRzGCwDgT24HYiT3QNxPN24bxfQnw694EQlXIHPG4iTpXMTPiXlvyPB1bhvpQSMp+93qiNBTMGzeafdggFfTK2P0MiMX92CTOYjd18rPy9EZkehKQP5rVX55SI0H/qp0G/t9mdVYDJe82Zua7zSB1EWWwmXQPrh5XO0+dREHppH72yUAetFLOMGGBu+K7XCunOtxoK1kp6rGqf1UVlqgCU1zN6yG1J8iZAq1El8b6J+FnaeDUQjYuRliUp6X/STGO0NfaEtdPeqgUclVtUgeN7867438utbWuZ+I6FPm3gK54S9GrmVfRVMCN8d3Ya700F16GDWYMGoOLs84KBrgefmuX+/WA6Pxp83eMrUSIEg+NNICuoMF/sfmcquXh/BwQV5+A6sNPraUPdiFX6v+P0Vh9CcmXdxh+36NOQnJ3brunAeA2RYLKVeXd61DSZ50n8EU6wgAJW6ADVGJipApf9PiYuTH336vgI0SR22n0c+OA7KSFlp+lzGNEng3ELDljbVuokr2f2ex14/hjBk/ehZGhqXw7GntrxbqUd0pUZT7Wb5hUOvcqfz1UhEkVHGEdbNPXZ5iDCWyop+Oo0FB8Zb/YyBAb4T/sQyx2VTNV2joa71yYY845nNgXlB4HdUz2tzsMdnL4c3pk9Ia4mWDbKXp4+q0mHcWOXfn60tMR3whohFsRUd+Bs/aEHhkqNch19amI4CLNTidn2ouUCR6aaGgSgn3t+rwE8y2rEwXkvRmPcL2eBPi145bcrPj4o+ziLKpmCngeRyD+NwIVfeKh0Hid5Fm9hmhfHb4NRlFK8sacS8dYwMG5yU3d5GjpZxpxFr9jamtFFPTPM+WggCWU6nTbPlxYGWlxAK9oSy/DVJQm2dsahVJGU0HtoofeIX1sj1wThdTnbqMt+0WHz5R1M/ZfaMCZJ+TtCg8YRpCvBFoJvEz6i6II5bY4zGAMNfYzVEytS42E0BSGiHr4kebDDWWd3a17vqabmCT+29HHn20O2IaHGib0tOVa2iUoeasPUP37jfZZ9jJU0Kdwc9a64l/DsfR13yayK5LgCmRj+d2ZS7/2lEKsZXsYZKy/ojN53jPU7PYA8WCvrmXdq9woUbXLrRmANO+blGgKjAJ1NJSJiIeUUpQoSwNoDk5OTkr/////Sv////9LAHSUYk1wAoWUjAFDlHSUUpSMA3Bvc5RLFHWMCWhhc19nYXVzc5RLAIwFZ2F1c3OURwAAAAAAAAAAdWJ1Yi4=", "n": 4, "_shape": [], "dtype": "int64", "_np_random": "RandomState(MT19937)"}, "n_envs": 4, "num_timesteps": 300000, "_total_timesteps": 300000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1680996086558856980, "learning_rate": 0.0001, "tensorboard_log": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWV4QIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMVy9ob21lL25vaXNlYnJpZGdlLy5sb2NhbC9saWIvcHl0aG9uMy4xMC9zaXRlLXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS4JDAgQBlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMVy9ob21lL25vaXNlYnJpZGdlLy5sb2NhbC9saWIvcHl0aG9uMy4xMC9zaXRlLXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoFmgNjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoF4wHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/Gjbi6xxDLYWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="}, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWV1QAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJZgAAAAAAAAAAAA8EIAAMhCXtoxPwAAyEIAAMhCBTgpQve9A0KPc3tCNPT5Po7+DUIAAMhCcy6VQsYFjUF8P6xCFwW8PwAAyEIAAMhCAADIQsEFDUP8GcdCpsIDPzVgwkLNWcZCEL+cQpSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGJLBEsGhpSMAUOUdJRSlC4="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYEAAAAAAAAAAEBAQGUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSwSFlIwBQ5R0lFKULg=="}, "_last_original_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWV1QAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJZgAAAAAAAAAAAA80IAAMhCcEowPwAAyEIAAMhCDSsvQq6xCELZ1n5CrPj0Pgy8FEIAAMhCdt6XQsYFjUF8P6xCSjivP8coAEJS6kRCLAkdQtaDDkOoZsdCa6wCP8EQxEIAAMhCa0WfQpSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGJLBEsGhpSMAUOUdJRSlC4="}, "_episode_num": 2728, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": 0.0, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWV4AsAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHwCDHM8ox59qMAWyUS0uMAXSUR0Bkh42MsH0LdX2UKGgGR8BmOWKTB68haAdLGGgIR0BkiVqHoHLSdX2UKGgGR0CEvtPNVzZIaAdLb2gIR0BkjQNmUW2xdX2UKGgGR8BgybTQVsUJaAdLP2gIR0BkjiDM/yG0dX2UKGgGR0B1O8065oXbaAdLyWgIR0Bkj5WNm16WdX2UKGgGR0CFsAz3RG+caAdLyWgIR0BkkSQHRkVfdX2UKGgGR0B//JOuaF23aAdLT2gIR0BkkwBYFJQMdX2UKGgGR0BBxdQ40dilaAdLSGgIR0Bkk5/3FkxzdX2UKGgGR0Bm8m/N7jT8aAdLTWgIR0BkmVpItlI3dX2UKGgGR0BKUjifg75maAdLkmgIR0BkmoyZa3ZxdX2UKGgGR8BegWVJL/S6aAdLR2gIR0Bkn9oi9qUNdX2UKGgGR0B08LteD3/QaAdLyWgIR0BkoD8k2P1ddX2UKGgGR0BoV4NiH6/JaAdLyWgIR0Bkoi+i8FpxdX2UKGgGR0Bk/rpqynk1aAdLMWgIR0Bko/kLhJiBdX2UKGgGR8BjEPbEgntwaAdLKmgIR0BkpyYqoZQ6dX2UKGgGR8BXsDKcNH6NaAdLbmgIR0BkqD5M10kodX2UKGgGR8Bw4XjS5RTCaAdLyWgIR0BkqK1TisGQdX2UKGgGR0Ah8ZXuE25yaAdLWWgIR0BkqQ1P3ztkdX2UKGgGR8BcinGXHBDYaAdLSmgIR0BkrObCrLhadX2UKGgGR0B9L8F8ohIOaAdLPWgIR0BkrRYcNpdsdX2UKGgGR0BptBouf29MaAdLSmgIR0BkrmWv8qFzdX2UKGgGR8Bkr4B1cMVlaAdLGmgIR0BkrxSiudPMdX2UKGgGR0Bz6N7ojfNzaAdLTGgIR0BksrkdV/+bdX2UKGgGR8AxCC3PRiPRaAdLQGgIR0Bks+gFotcwdX2UKGgGR8BZn6uGKyfMaAdLUmgIR0BktLFCLMs6dX2UKGgGR8BSsRagVXV9aAdLMmgIR0Bkt79XLeQ/dX2UKGgGR0BTuoGlhw2maAdLyWgIR0BkuGsvIwM6dX2UKGgGR0B2StE7W/ahaAdLPmgIR0BkuWi35N48dX2UKGgGR0CC7pjABT4taAdLXWgIR0Bkuem1pj+adX2UKGgGR8Bkc8enyd4FaAdLImgIR0BkvIH3UQTVdX2UKGgGR8Bdwq/IsAeaaAdLRmgIR0BkvS1kUbkwdX2UKGgGR0B9p88TzundaAdLVmgIR0Bkwu8M/hVEdX2UKGgGR0BUVwnDziCKaAdLyWgIR0Bkx45PuXu3dX2UKGgGR0BU6xLsa86FaAdLyWgIR0BkyIxi5NGmdX2UKGgGR0BhLZlJ6IFeaAdLIGgIR0BkygagmJFcdX2UKGgGR0BkumEPDpC8aAdLKWgIR0Bky7gAIY3vdX2UKGgGR0BZpdOmBOHnaAdLd2gIR0Bky/w1BMSLdX2UKGgGR0CAiBIH1OCYaAdLyWgIR0BkzFfu1F6SdX2UKGgGR0B1J5Majvd/aAdLUGgIR0Bk0CgXdj5LdX2UKGgGR0B8kDUc4o7WaAdLPGgIR0Bk0OOn2qT9dX2UKGgGR0B7MzBsQ/X5aAdLUGgIR0Bk0ep0fYBedX2UKGgGR0B+zkZR8+ibaAdLT2gIR0Bk0hzRx95RdX2UKGgGR0B9/9RCQcPwaAdLPmgIR0Bk1abz9S/CdX2UKGgGR0BUHCf+S8raaAdLJmgIR0Bk2IIQe3hGdX2UKGgGR0B/WX4k/r0KaAdLWmgIR0Bk3yhQFcIJdX2UKGgGR8BpIYHcDbJwaAdLyWgIR0Bk31utOmBOdX2UKGgGR0B6DBoFmnO0aAdLw2gIR0Bk4LiVB2OidX2UKGgGR0B4vEaCL/CJaAdLyWgIR0Bk4Qht+CsfdX2UKGgGR0BHeN65Xlr/aAdLJmgIR0Bk4+c4HX2/dX2UKGgGR0CATTQuVX3haAdLSGgIR0Bk6UVQAMlUdX2UKGgGR8BRx3pwCKaYaAdLkmgIR0Bk6mw5eZ5SdX2UKGgGR8A+Kh/RVp9JaAdLKmgIR0Bk7ZSP2f03dX2UKGgGR0B3ix3fQ8fWaAdLyWgIR0Bk7nM4cWCVdX2UKGgGR0Bk3jsD4gzQaAdLyWgIR0Bk7/QfIS13dX2UKGgGR8BhE2IMz/IbaAdLMWgIR0Bk8VP+GXXzdX2UKGgGR8BWVr655JK8aAdLG2gIR0Bk82TmnwXqdX2UKGgGR8Awc3S8an76aAdLPGgIR0Bk9I75mAbydX2UKGgGR8BILiAUcn3MaAdLKGgIR0Bk94Ox0MgEdX2UKGgGR0CEtgyQgcLjaAdLumgIR0Bk93pt78ekdX2UKGgGR0A14saKk2xZaAdLOGgIR0Bk97pxFRYSdX2UKGgGR0CTRRdgOSW7aAdLhWgIR0Bk+KU/wAlwdX2UKGgGR0B1sMtVaOghaAdLTWgIR0Bk/WmelKsddX2UKGgGR8Bd9Pgeii7DaAdLRmgIR0Bk/fSYw7DEdX2UKGgGR8BgUPfoA4n4aAdLLmgIR0BlAVa6jFhodX2UKGgGR0COG+iwjdHlaAdLiGgIR0BlAgQUYbbUdX2UKGgGR0BwJyI/JNj9aAdLTWgIR0BlA0oDxLCfdX2UKGgGR0CGRjVo6CDmaAdLrmgIR0BlBLjWCmMwdX2UKGgGR0BxHyg6EJ0GaAdLLWgIR0BlBO6mO2iMdX2UKGgGR0Bhzx3/xUedaAdLLGgIR0BlBX+fh/AkdX2UKGgGR0B0FC74BV+7aAdLNGgIR0BlCLcbiqACdX2UKGgGR0BpruQSzw+daAdLVGgIR0BlCb5Ec81XdX2UKGgGR0B1UwlJHy3DaAdLQmgIR0BlCf6AOJ+EdX2UKGgGR8Bklfp6hQFcaAdLIWgIR0BlC2MwUQCkdX2UKGgGR0BsT1uvUz9CaAdLKGgIR0BlDQ+t8uzydX2UKGgGR8BgiKGUOd5IaAdLRGgIR0BlDwAKfFrEdX2UKGgGR0BhbcO09hZyaAdLM2gIR0BlD0Q04zacdX2UKGgGR0B1xP0mMOwxaAdLM2gIR0BlEuTA31jBdX2UKGgGR0CHXAvaDf3waAdLuGgIR0BlE5YA80UHdX2UKGgGR0BcUGhEjPfLaAdLOmgIR0BlE72exwAEdX2UKGgGR8Bg+x6lchTwaAdLJmgIR0BlFeSr5qM4dX2UKGgGR0BhCKmALApKaAdLIGgIR0BlFhv1lGwzdX2UKGgGR8BiiswlByCGaAdLMWgIR0BlF4OH31zydX2UKGgGR8Bk7aiVSn+AaAdLHGgIR0BlGEwBYFJQdX2UKGgGR8Bk5g9/z8P4aAdLHWgIR0BlGcUqQRwqdX2UKGgGR0Bw/roicG1QaAdLSmgIR0BlG6InBtUGdX2UKGgGR8BKrKeCkGiYaAdLNWgIR0BlHGDvmYBvdX2UKGgGR0CJ6CnF5v9+aAdLyWgIR0BlHKMrEtNBdX2UKGgGR0BhWKTY/Vy4aAdLIWgIR0BlHjNyHVPOdX2UKGgGR8BiiXDP4VRDaAdLMGgIR0BlIBHLA57xdX2UKGgGR0CCAnrtVrAQaAdLR2gIR0BlJWI9C/oJdX2UKGgGR0BQ6575VOsUaAdLtmgIR0BlJ5OYYzi0dX2UKGgGR8AgH/RVp9JCaAdLLWgIR0BlKvcL0BfbdX2UKGgGR0BkUs1AJLM+aAdLyWgIR0BlK9bJOnEVdX2UKGgGR0B8rs8Md92HaAdLwWgIR0BlLNKGtZFHdX2UKGgGR8BgCWQOnVG1aAdLPGgIR0BlMGPHT7VKdX2UKGgGR0B2R6cx0uDjaAdLVWgIR0BlMXhfjS5RdX2UKGgGR8BsmkvduYQbaAdLyWgIR0BlNJ0lqrR0dX2UKGgGR0BVz9YOlO45aAdLSGgIR0BlNdejVQQ+dX2UKGgGR0Bllf/FR51OaAdLvWgIR0BlOwB1cMVldX2UKGgGR0B8Y0AS39aVaAdLY2gIR0BlPAzch1TzdWUu"}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 15625, "buffer_size": 100000, "batch_size": 32, "learning_starts": 50000, "tau": 1.0, "gamma": 0.99, "gradient_steps": 1, "optimize_memory_usage": false, "replay_buffer_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVNQAAAAAAAACMIHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5idWZmZXJzlIwMUmVwbGF5QnVmZmVylJOULg==", "__module__": "stable_baselines3.common.buffers", "__doc__": "\n Replay buffer used in off-policy algorithms like SAC/TD3.\n\n :param buffer_size: Max number of element in the buffer\n :param observation_space: Observation space\n :param action_space: Action space\n :param device: PyTorch device\n :param n_envs: Number of parallel environments\n :param optimize_memory_usage: Enable a memory efficient variant\n of the replay buffer which reduces by almost a factor two the memory used,\n at a cost of more complexity.\n See https://github.com/DLR-RM/stable-baselines3/issues/37#issuecomment-637501195\n and https://github.com/DLR-RM/stable-baselines3/pull/28#issuecomment-637559274\n Cannot be used in combination with handle_timeout_termination.\n :param handle_timeout_termination: Handle timeout termination (due to timelimit)\n separately and treat the task as infinite horizon task.\n https://github.com/DLR-RM/stable-baselines3/issues/284\n ", "__init__": "<function ReplayBuffer.__init__ at 0x7f271a073130>", "add": "<function ReplayBuffer.add at 0x7f271a0731c0>", "sample": "<function ReplayBuffer.sample at 0x7f271a073250>", "_get_samples": "<function ReplayBuffer._get_samples at 0x7f271a0732e0>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7f271a004440>"}, "replay_buffer_kwargs": {}, "train_freq": {":type:": "<class 'stable_baselines3.common.type_aliases.TrainFreq'>", ":serialized:": "gAWVYQAAAAAAAACMJXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi50eXBlX2FsaWFzZXOUjAlUcmFpbkZyZXGUk5RLBGgAjBJUcmFpbkZyZXF1ZW5jeVVuaXSUk5SMBHN0ZXCUhZRSlIaUgZQu"}, "actor": null, "use_sde_at_warmup": false, "exploration_initial_eps": 1.0, "exploration_final_eps": 0.05, "exploration_fraction": 0.1, "target_update_interval": 625, "_n_calls": 75000, "max_grad_norm": 10, "exploration_rate": 0.05, "exploration_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVgQMAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLBEsTQyhkAXwAGACIAWsEcgiIAFMAiAJkAXwAGACIAIgCGAAUAIgBGwAXAFMAlE5LAYaUKYwScHJvZ3Jlc3NfcmVtYWluaW5nlIWUjFcvaG9tZS9ub2lzZWJyaWRnZS8ubG9jYWwvbGliL3B5dGhvbjMuMTAvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEtwQwYMAQQBGAKUjANlbmSUjAxlbmRfZnJhY3Rpb26UjAVzdGFydJSHlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjFcvaG9tZS9ub2lzZWJyaWRnZS8ubG9jYWwvbGliL3B5dGhvbjMuMTAvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUdU5OaACMEF9tYWtlX2VtcHR5X2NlbGyUk5QpUpRoHSlSlGgdKVKUh5R0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaCN9lH2UKGgYaA2MDF9fcXVhbG5hbWVfX5SMG2dldF9saW5lYXJfZm4uPGxvY2Fscz4uZnVuY5SMD19fYW5ub3RhdGlvbnNfX5R9lChoCowIYnVpbHRpbnOUjAVmbG9hdJSTlIwGcmV0dXJulGgvdYwOX19rd2RlZmF1bHRzX1+UTowMX19kZWZhdWx0c19flE6MCl9fbW9kdWxlX1+UaBmMB19fZG9jX1+UTowLX19jbG9zdXJlX1+UaACMCl9tYWtlX2NlbGyUk5RHP6mZmZmZmZqFlFKUaDdHP7mZmZmZmZqFlFKUaDdHP/AAAAAAAACFlFKUh5SMF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="}, "batch_norm_stats": [], "batch_norm_stats_target": [], "system_info": {"OS": "Linux-5.19.0-35-generic-x86_64-with-glibc2.35 # 36~22.04.1-Ubuntu SMP PREEMPT_DYNAMIC Fri Feb 17 15:17:25 UTC 2", "Python": "3.10.9", "Stable-Baselines3": "1.7.0", "PyTorch": "2.0.0", "GPU Enabled": "True", "Numpy": "1.23.5", "Gym": "0.21.0"}}
|
|
|
1 |
+
{"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVMAAAAAAAAACMHnN0YWJsZV9iYXNlbGluZXMzLmRxbi5wb2xpY2llc5SMCURRTlBvbGljeZSTlC4=", "__module__": "stable_baselines3.dqn.policies", "__doc__": "\n Policy class with Q-Value Net and target net for DQN\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function DQNPolicy.__init__ at 0x7fe79b873520>", "_build": "<function DQNPolicy._build at 0x7fe79b8735b0>", "make_q_net": "<function DQNPolicy.make_q_net at 0x7fe79b873640>", "forward": "<function DQNPolicy.forward at 0x7fe79b8736d0>", "_predict": "<function DQNPolicy._predict at 0x7fe79b873760>", "_get_constructor_parameters": "<function DQNPolicy._get_constructor_parameters at 0x7fe79b8737f0>", "set_training_mode": "<function DQNPolicy.set_training_mode at 0x7fe79b873880>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7fe79b8868c0>"}, "verbose": true, "policy_kwargs": {}, "observation_space": {":type:": "<class 'gym.spaces.box.Box'>", ":serialized:": "gAWVkQEAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLBoWUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWGAAAAAAAAAAAABbEAADIwwAAAAAAAAAAAAAAAAAAAACUaAtLBoWUjAFDlHSUUpSMBGhpZ2iUaBMolhgAAAAAAAAAAAAWRAAAyEPbD0lAAADIQgAAyEIAAMhClGgLSwaFlGgWdJRSlIwNYm91bmRlZF9iZWxvd5RoEyiWBgAAAAAAAAABAQEBAQGUaAiMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLBoWUaBZ0lFKUjA1ib3VuZGVkX2Fib3ZllGgTKJYGAAAAAAAAAAEBAQEBAZRoIksGhZRoFnSUUpSMCl9ucF9yYW5kb22UTnViLg==", "dtype": "float32", "_shape": [6], "low": "[-600. -400. 0. 0. 0. 0.]", "high": "[600. 400. 3.1415927 100. 100. 100. ]", "bounded_below": "[ True True True True True True]", "bounded_above": "[ True True True True True True]", "_np_random": null}, "action_space": {":type:": "<class 'gym.spaces.discrete.Discrete'>", ":serialized:": "gAWVNAsAAAAAAACME2d5bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpRLBIwGX3NoYXBllCmMBWR0eXBllIwFbnVtcHmUjAVkdHlwZZSTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYowKX25wX3JhbmRvbZSMFG51bXB5LnJhbmRvbS5fcGlja2xllIwSX19yYW5kb21zdGF0ZV9jdG9ylJOUjAdNVDE5OTM3lIWUUpR9lCiMDWJpdF9nZW5lcmF0b3KUaBSMBXN0YXRllH2UKIwDa2V5lIwSbnVtcHkuY29yZS5udW1lcmljlIwLX2Zyb21idWZmZXKUk5QolsAJAAAAAAAA/HeT+DTgV1KAtu+YENCzNwRvBBq6gIJE8+pP5LxeQewk6CFTYWt3V+fcBAp8D0lSogc8YX1OsiAmQXHwrHjLidCOpnyHlWBCFdq4KWHuv7RZKaREigrmsVb+Hqk79I/U/6j4WCNS7lB1eZap2euPoG5ovOvFtG0j1UMEwQ3PNSc8gsrM4PhN1JL3t3Lvz7fFXfm0rw5/nfC4D6T5SlVZnLGXCYEN0wGBy3fxbGenwdlzbyGxCkIIiu0+4ahwSLtCqXFgEx9oQ/m4ycl3XwnwA0d08J9XzxcdWKcT7qMTDjkw6ZR3AQLVisbkmUKwf2g3CtZ+GWhbRMKdmG5jNDhdZPIqYS6AUe2EfU05zdvxBfDV3f/WyuxMGRi7ClawqPB3yUsv7UQkARDOHxl3LEXvyWi2/2tXP7v0Yu4u2LyYVJRqIa0cDy3JXSoaxwmIK8tUFkT/PRHJbaPikZF/tZhvROASeblCVj9dFeZH1sp6Ya6U8TKNmfXAAJFK5Xn/fFNsNpI+Rfabdudkx0LKToSAtVR5A3mTMx0UCFXegMj1h2U0lFMeN+3nN1rlUEnbNZxtS4isGwH+w26kgXErnvs+V+qnQoriglip/lQYrZx3IiXvjmSqTOienH1QKTB62qxQzro23mx4wKPraN5EZ0iI8qouo2B2H6/92tEdgf9Y4mOSc2rfgilZLBMcvOy3rGqcjBxctnvQECERZJV7osqTpwLWi0q2R6bzWmzOjAmRJ9hZ81RWz8M1vePj4fbLQm7bZlquKL/3RL5b54HYEsR/YjHkF6iirS6dsto4LeU0ntRfUd04qI6gvrFoJ8Xt5QUWrF7EKyWTTRVqVbflMN9zF68GrzOwU25maCon8twXumTcFxpRlKiQHJu5RmDx3W7bvG5Va7iZ8bq5WeZYokJ6zNxjmlkrQ5eSjLw3qohX/ve2LTQVSvnnCP0G06VSAXB995dQfjpuKNUqt45GJxYd9gFw3/H5tIuG4sAydj5PdnW9vRkRujYnYSYEeEIJB947BkzAboYaZ6xcGOzlX43xmSvMEbR3YSTno7T9CbHCJ9mZKAoxHStM23chmw6RgdZhuaQdOhzMBsZn+Ks+p0dMLxEkl53gBkhbGqlLn/2fnuC709Zvxr5wdX1U+kXFoO8faiZ3/hlCkFx/cka/xn17TzxIVcMB50fvz/Fhf15vf9NOGPNKyLiIaSD0X+2/8d2MoGUroQ03up69+cDf+npxcIyoOcX+9lkkgyvcIypininzcyl/+XM7LFWzs0ismfSquwtbh8HqDxPFY7OiItu0/Jz52bL0ZOnvLlQrBE2wJteXkbwFm1DSSe0hZyPFvQ2Y7EEfGSpACPN23oy/5HmJwiyExODxGWjV7acV9GULD5FXIM9hf0ifRgCXfrDMl8QvhDJbGi2Jxt8EdwJOsey3KuKHF1jgNyOaZaaxlQOsKceJOUO6GyTQk3TrzV0wZP/kpXV6x3h9ocfE5XPXdPYTm0XbhYRiwfme495M5UwRZDosjCUqU65KInBP4lhde6fTlU6RAJOt9A/YQBp2x88+NLK7uerInxKl1hTDkN6oGW18AH6NtdLHW6lQFHIp62LRshsxHv+ofQCnt2F3vCaAmnmgIpdbi4P5Nm5EQZo3SRsRr0QjqK3GqQzaEF5GrV9J9ITDf46WUwk+g1wBfVzhZuqRdKtZHCeJmy3kSyzIWskpqeQzpiGHx2QKQ8KfB0RwHl4WeEe1rqSkwxXyqDhSAB/sK/lmhaKBAxdSxUjQob2YpWnAk8BAtyB2A3YZU0eP8Q3end8xtV/EVlFZ8gDc4peZDeLMKEITLA/LhOme/mFRDFpHM+VRTUM85hu8/j3grNemL5+8QCg6yQIK7UMZiTy6rgtIhs1Mg+iFVJ3ABKAAqqa+hM/E5vdnf4+/sv1F3SUEz4uB6ht4Wb5ahC8Y/eThDdxcHszTlp23hSoCS7Cgvvnqq5t9ehR6aCosdtNoWqKzw6roKcOpASAOlV5alGT+eHvZuR2lE0n9z2ywDwUB1HodvkpE7qJjQiav87IaPIaMTAc2zUbop8wUuQRr+CmArTSsp2Yx0BHFa0I5vIndjrAljtx4AARXCw/yHY46KAdfL8SvZV57tVPBadWsGVIbyxh8Jhfe2FuizUK/4Wmk3GU0ThnfpGoyPL9uaPsT7IT+su7LqvPoaDoXM9onlsOhk6epSKDr0jFMJ4QpxlKWsTE69y8vGEe48IkLhf7oAWNxDnmgvb4l3KuUJz15WzZYCubb4NhYozWTuEPgSrv57SPbs2Wz+dAwVgdda8+Z4U2PVxh7pFW0KDWL6vra1PBpQMrfmuGOU7s3ySZ9+GYpxaf5SRHqfGBxzheocWLsbxjpJEjzac/sZasVApeMW3/L4fPKhNdSzI6yZMtN9cfT9ANNl+gcZRClwMcAHR/c3yZZIFRbJLNbspe9Kx0kQdamNhEZecsn3L+D4/RkzKki4YuuzQeGugRZwO6/tEhUGYikozNOtiPIR+JNqmyYcANMGueFoGO1WsC9yr+MY8c5jcDNue59n8Lrq/jP0dwVGVI874XrkGW7WjrRt1bj2N2imFsZ65hsQtPF1A9DssJXl9Xgl9Bind8MHaLQ2MDOvW0o3afH/Sp5o3x5kLc3v1fUppRp1t8AJW1ieJZQVMwSSuT3Qhk6+gDoU/1V3IQRlmAJmkzMLDWmMv3QzCqheQOELpob6y0JQ0aCYhKpaKv9s2OoWJ/bSwS+12YTQmpyAJThLPiIF0iVJmnVy3pfmOupVC+vA3WrjZErUGM0N4AvHyVwAttS82irz+8j27QW4cNcD81VR2f35RDwrQQYEoqoacCriQpKtrdLpvx1V3qdH3Vy90nFX3huhkjBzkH+z5GVKvgkrtWjjTRZb01s1k5htI5RL8d7jc5jjIV629+VPzq7Itbd80qeiofP8zg/QSuapfjU3x9eFyFkgpCf7BZqSxNbf+refFi14ElgOS0hBe3NRfaMXemWFAw9ed0Jtv7Sdbs+NyKsSKMjI6q+lX0VGstSYOIO1Mh0ZcSrcZ/OuF44q6TXjJ8PsMmoHRLazweEWQW7WgkOZX6UwpliVSdar60Xu4SjMUB+7fFBZgNUEAhmRIVMo09Ypq/YCA/3hPRbLhYviK2upGZVNHN2Ja/qGZF2WH4991wTpK1CeXfv4rv6h7FlAU6/PbRcOM4/HlbKUew+BXUKfE/rEfc9XzDx6uB4D8HUbNgjLa/WhGEFIYIIkc6facNrAj75Vp6Ic08Tw6piicsm0GDcWZOJgwUpNyfvU1Hffho01gTteteRmtaYwl9L2vlriHbWvBYTlGgKjAJ1NJSJiIeUUpQoSwNoDk5OTkr/////Sv////9LAHSUYk1wAoWUjAFDlHSUUpSMA3Bvc5RL7HWMCWhhc19nYXVzc5RLAIwFZ2F1c3OURwAAAAAAAAAAdWJ1Yi4=", "n": 4, "_shape": [], "dtype": "int64", "_np_random": "RandomState(MT19937)"}, "n_envs": 4, "num_timesteps": 300000, "_total_timesteps": 300000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1680996362691066755, "learning_rate": 0.0001, "tensorboard_log": null, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWV4QIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMVy9ob21lL25vaXNlYnJpZGdlLy5sb2NhbC9saWIvcHl0aG9uMy4xMC9zaXRlLXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZSMBGZ1bmOUS4JDAgQBlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMVy9ob21lL25vaXNlYnJpZGdlLy5sb2NhbC9saWIvcHl0aG9uMy4xMC9zaXRlLXBhY2thZ2VzL3N0YWJsZV9iYXNlbGluZXMzL2NvbW1vbi91dGlscy5weZR1Tk5oAIwQX21ha2VfZW1wdHlfY2VsbJSTlClSlIWUdJRSlIwcY2xvdWRwaWNrbGUuY2xvdWRwaWNrbGVfZmFzdJSMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGgffZR9lChoFmgNjAxfX3F1YWxuYW1lX1+UjBljb25zdGFudF9mbi48bG9jYWxzPi5mdW5jlIwPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoF4wHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/Gjbi6xxDLYWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="}, "_last_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWV1QAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJZgAAAAAAAAAPF2pMHo2pxCE622PwAAyELLRdhBxGN2QZBKAUJHGLNCUh+DPzdpEkIAAMhCcWR5Qq3DjUK6ubhCivRQPwAAyEKb8cBCAADIQgCAFEMAAMhC67cXP7g/xUIAAMhCFTK1QpSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGJLBEsGhpSMAUOUdJRSlC4="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVdwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYEAAAAAAAAAAEBAQGUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSwSFlIwBQ5R0lFKULg=="}, "_last_original_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWV1QAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJZgAAAAAAAAAHJpmcH7BZ5CvFa0PwAAyEI+6eFBFzOGQfIrB0LbsLNC0GmBP/PyGEIAAMhCOit7Qte/kEJmBrlCx5JOPwAAyEJkC8RCAADIQgAAFkMAAMhCV4cWP9PFxkIAAMhC56a2QpSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGJLBEsGhpSMAUOUdJRSlC4="}, "_episode_num": 3279, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": 0.0, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWV4AsAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHwGLb37UG3WqMAWyUSziMAXSUR0Bk0/ZyuIRAdX2UKGgGR8BjwjGza9K3aAdLKmgIR0Bk1i9ugpSadX2UKGgGR8Bg9iL0jC53aAdLPmgIR0Bk2LU5MlC1dX2UKGgGR8BVMGQSzw+daAdLZ2gIR0Bk21iH6/IsdX2UKGgGR8BXCIUahpQDaAdLgmgIR0Bk26dpZfUndX2UKGgGR8Bh2QIWxhUjaAdLa2gIR0Bk3lum78NydX2UKGgGR8BjgfKISDh+aAdLJ2gIR0Bk3m1D0DlpdX2UKGgGR8Bkw0YXO4XoaAdLHmgIR0Bk4KqIacZtdX2UKGgGR8BF5G21D0DmaAdLaGgIR0Bk4MSK3uuzdX2UKGgGR8BkBtId2gWaaAdLJ2gIR0Bk47MJQcghdX2UKGgGR8BDOzbnHNoraAdLV2gIR0Bk5SkZaV2SdX2UKGgGR8BDcJ3HJcPfaAdLR2gIR0Bk5kCNjslcdX2UKGgGR8BVAwGr0aqCaAdLVGgIR0Bk6iA4GUwBdX2UKGgGR8BdP4qgAZKnaAdLRWgIR0Bk6nFefI0ZdX2UKGgGRz/vGcOLBKtgaAdLyWgIR0Bk6zp1RtP6dX2UKGgGR8Bkw0YXO4XoaAdLHmgIR0Bk7NNN8E3bdX2UKGgGR8BQ9ymZVn27aAdLXmgIR0Bk7YEbHZK4dX2UKGgGR8BaUzLOiWVvaAdLVWgIR0Bk8a7I1cdHdX2UKGgGR8BLeKv3ai9JaAdLYWgIR0Bk9LxG2CumdX2UKGgGR8Bi8vcnE2pAaAdLLWgIR0Bk9REc81XOdX2UKGgGR8BYEsCHRCyAaAdLfGgIR0Bk9jSJCSiedX2UKGgGR8Bkf11jiGWVaAdLJWgIR0Bk+PJeVs1sdX2UKGgGR0Bdupc1O0swaAdLyWgIR0Bk+XSQYDT0dX2UKGgGR8BabAYtQKrraAdLR2gIR0Bk+n/tIClrdX2UKGgGR8BjPH6GgzxgaAdLK2gIR0Bk/E+X7cfvdX2UKGgGR0B3T0eXAuZkaAdLhGgIR0Bk/tejVQQ+dX2UKGgGR8BWK07r9l3AaAdLS2gIR0Bk/0IsyzomdX2UKGgGR8Bgh5InSfDlaAdLRWgIR0Bk/9JSR8txdX2UKGgGR8Bd5h6jWTX8aAdLR2gIR0BlAcKzAvcrdX2UKGgGR8BjF1iQT238aAdLK2gIR0BlBPwPRRdhdX2UKGgGR8Bj9cvkBCD3aAdLJGgIR0BlB8Re1KGtdX2UKGgGRz/1A/TspoboaAdLj2gIR0BlCjJ0W/JvdX2UKGgGR0BW/O49X9zfaAdLyWgIR0BlDjPQfIS2dX2UKGgGR8BhlUY2sJY1aAdLOWgIR0BlDoPTXrdFdX2UKGgGR0BgNLYukDZEaAdLyWgIR0BlDyH6/IsAdX2UKGgGR8Bj+DsWweNlaAdLJmgIR0BlESErXlKcdX2UKGgGR8BhIK/qPfbcaAdLRWgIR0BlFF9F4LThdX2UKGgGR0BC08dYGMXKaAdLyWgIR0BlFwLw4KhMdX2UKGgGR8BVkJIczZYgaAdLdmgIR0BlF4dXDFZQdX2UKGgGR8BjJnwNLDhtaAdLL2gIR0BlF/hS9/SZdX2UKGgGR8BV7Fpj+aScaAdLaGgIR0BlGSApazNVdX2UKGgGR8BkoLfLs8gZaAdLH2gIR0BlGZPKuB+XdX2UKGgGR8BkGOkpI+W4aAdLI2gIR0BlGsl9jPOZdX2UKGgGR8BU9S+HrQgLaAdLaWgIR0BlH5R4yGi6dX2UKGgGR8BVyv7aZhKEaAdLXmgIR0BlIFSn+AEudX2UKGgGR8BjNW+wkgOjaAdLKmgIR0BlIsoUi6g/dX2UKGgGR8Bj1okAxSHeaAdLJWgIR0BlIzCYTj//dX2UKGgGR8Bi9xFG5MDfaAdLLGgIR0BlJon2IwdsdX2UKGgGR8BgUiU9pyp8aAdLQWgIR0BlJ9kSVW0adX2UKGgGR0BZ0rw4KhL5aAdLyWgIR0BlKO/cnE2pdX2UKGgGR0BVIpvo/zJ7aAdLyWgIR0BlKieCkGiYdX2UKGgGR8Bis+bLEDQraAdLLmgIR0BlK2xOclPadX2UKGgGR8BldA5ksjFAaAdLG2gIR0BlLYESuhbodX2UKGgGR8BYooX9BKL9aAdLVmgIR0BlL5WxQizLdX2UKGgGR8BhC4iX6ZYxaAdLL2gIR0BlMR0yP+4tdX2UKGgGR8ALlP557gKnaAdLd2gIR0BlM0pkPMB7dX2UKGgGR8Bji85jpcHGaAdLKWgIR0BlNEX7+DODdX2UKGgGR8BfVNRBNVR2aAdLPWgIR0BlNFmFrVOLdX2UKGgGR8BlUQkona37aAdLHmgIR0BlNbs6aLGadX2UKGgGR0BhhZWtEG7jaAdLyWgIR0BlNig2606YdX2UKGgGR8BjgqyhSLqEaAdLKGgIR0BlN3iDM/yHdX2UKGgGR8BikVcY64lQaAdLKGgIR0BlONPxhDw6dX2UKGgGR8BciS8an753aAdLN2gIR0BlOlhVlwtKdX2UKGgGR8BYjFERaouPaAdLXWgIR0BlO3m1YyO8dX2UKGgGR8BkDB6OYIBzaAdLJmgIR0BlO7y8SPELdX2UKGgGR8BAQhC+lCTmaAdLTGgIR0BlPVg4OtnxdX2UKGgGR8Bjtb/yXlbNaAdLJmgIR0BlPV/e+Eh8dX2UKGgGR8Ba/QWrOqvNaAdLK2gIR0BlPul0o0AMdX2UKGgGR8BVdUmY0EX+aAdLQGgIR0BlQLFMqSX/dX2UKGgGR8BjAqT6i0v5aAdLLGgIR0BlQ/+S8rZrdX2UKGgGR8BZcEAT7EYPaAdLWWgIR0BlRDCDVYp2dX2UKGgGR8Bk6ctXgccVaAdLHWgIR0BlRkOG0u14dX2UKGgGR8BkaSTMaCL/aAdLIGgIR0BlRq/wiJO4dX2UKGgGR8BlBkfs/pt8aAdLHWgIR0BlSI6wMYuTdX2UKGgGR8BgtHNA1NxmaAdLIWgIR0BlSTgflp49dX2UKGgGR8Bj8rzf779AaAdLI2gIR0BlSyzE74i5dX2UKGgGR0BanF3pwCKaaAdLyWgIR0BlTMCHRCyAdX2UKGgGR8AI7w2ETQE7aAdLyWgIR0BlTkQ9RrJsdX2UKGgGR8Bjko24uscRaAdLMGgIR0BlTuDe0ojOdX2UKGgGR8BhGSdlNDc/aAdLRWgIR0BlVBSpBHCodX2UKGgGR8BcJw75mAbyaAdLZmgIR0BlVIgJTl1bdX2UKGgGR8BcTVPznRsuaAdLaGgIR0BlViwfQrtmdX2UKGgGR0BKt19nbqQjaAdLyWgIR0BlWHcrRSgodX2UKGgGR8BisOaa1Cw9aAdLNGgIR0BlWiLfk3judX2UKGgGR8BimdK7I1cdaAdLLmgIR0BlXAwfyPMjdX2UKGgGR8BQo/6TGHYZaAdLZGgIR0BlXEBIWgvldX2UKGgGR8Bjtb/yXlbNaAdLJmgIR0BlXSy6cy31dX2UKGgGR8Bj5V1hb4ahaAdLJmgIR0BlXySA6MisdX2UKGgGR8BjwDRYzSCwaAdLMGgIR0BlYM+5e7cxdX2UKGgGR0BBrI/qxC6ZaAdLyWgIR0BlY4WrOqvNdX2UKGgGR8BggO9rXUYsaAdLP2gIR0BlZY287IT5dX2UKGgGR8BkoLfLs8gZaAdLH2gIR0BlZfFcY64ldX2UKGgGR8BSf8GcFyJbaAdLW2gIR0BlZicLBsQ/dX2UKGgGR8BkbW3fAKv3aAdLK2gIR0BlaOWUr08OdX2UKGgGR8BkX4UtZmqYaAdLK2gIR0BlaTWZqmCRdX2UKGgGR8BlLPJNj9XLaAdLHWgIR0Bla3Vf/m1ZdX2UKGgGR8BnAVxCIDYAaAdLyWgIR0Bla4dZJTVEdX2UKGgGR8BbaL4SHuZ1aAdLUGgIR0BlbFDBuXNUdX2UKGgGR8BdYTt1IRRNaAdLJ2gIR0Blbnt4RmK7dX2UKGgGR8BdAhc7hegMaAdLXWgIR0Blco/7iyY5dWUu"}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 15625, "buffer_size": 100000, "batch_size": 32, "learning_starts": 50000, "tau": 1.0, "gamma": 0.99, "gradient_steps": 1, "optimize_memory_usage": false, "replay_buffer_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVNQAAAAAAAACMIHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5idWZmZXJzlIwMUmVwbGF5QnVmZmVylJOULg==", "__module__": "stable_baselines3.common.buffers", "__doc__": "\n Replay buffer used in off-policy algorithms like SAC/TD3.\n\n :param buffer_size: Max number of element in the buffer\n :param observation_space: Observation space\n :param action_space: Action space\n :param device: PyTorch device\n :param n_envs: Number of parallel environments\n :param optimize_memory_usage: Enable a memory efficient variant\n of the replay buffer which reduces by almost a factor two the memory used,\n at a cost of more complexity.\n See https://github.com/DLR-RM/stable-baselines3/issues/37#issuecomment-637501195\n and https://github.com/DLR-RM/stable-baselines3/pull/28#issuecomment-637559274\n Cannot be used in combination with handle_timeout_termination.\n :param handle_timeout_termination: Handle timeout termination (due to timelimit)\n separately and treat the task as infinite horizon task.\n https://github.com/DLR-RM/stable-baselines3/issues/284\n ", "__init__": "<function ReplayBuffer.__init__ at 0x7fe79b86f130>", "add": "<function ReplayBuffer.add at 0x7fe79b86f1c0>", "sample": "<function ReplayBuffer.sample at 0x7fe79b86f250>", "_get_samples": "<function ReplayBuffer._get_samples at 0x7fe79b86f2e0>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7fe79b9df8c0>"}, "replay_buffer_kwargs": {}, "train_freq": {":type:": "<class 'stable_baselines3.common.type_aliases.TrainFreq'>", ":serialized:": "gAWVYQAAAAAAAACMJXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi50eXBlX2FsaWFzZXOUjAlUcmFpbkZyZXGUk5RLBGgAjBJUcmFpbkZyZXF1ZW5jeVVuaXSUk5SMBHN0ZXCUhZRSlIaUgZQu"}, "actor": null, "use_sde_at_warmup": false, "exploration_initial_eps": 1.0, "exploration_final_eps": 0.05, "exploration_fraction": 0.1, "target_update_interval": 625, "_n_calls": 75000, "max_grad_norm": 10, "exploration_rate": 0.05, "exploration_schedule": {":type:": "<class 'function'>", ":serialized:": "gAWVgQMAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLBEsTQyhkAXwAGACIAWsEcgiIAFMAiAJkAXwAGACIAIgCGAAUAIgBGwAXAFMAlE5LAYaUKYwScHJvZ3Jlc3NfcmVtYWluaW5nlIWUjFcvaG9tZS9ub2lzZWJyaWRnZS8ubG9jYWwvbGliL3B5dGhvbjMuMTAvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlEtwQwYMAQQBGAKUjANlbmSUjAxlbmRfZnJhY3Rpb26UjAVzdGFydJSHlCl0lFKUfZQojAtfX3BhY2thZ2VfX5SMGHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbpSMCF9fbmFtZV9flIwec3RhYmxlX2Jhc2VsaW5lczMuY29tbW9uLnV0aWxzlIwIX19maWxlX1+UjFcvaG9tZS9ub2lzZWJyaWRnZS8ubG9jYWwvbGliL3B5dGhvbjMuMTAvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUdU5OaACMEF9tYWtlX2VtcHR5X2NlbGyUk5QpUpRoHSlSlGgdKVKUh5R0lFKUjBxjbG91ZHBpY2tsZS5jbG91ZHBpY2tsZV9mYXN0lIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaCN9lH2UKGgYaA2MDF9fcXVhbG5hbWVfX5SMG2dldF9saW5lYXJfZm4uPGxvY2Fscz4uZnVuY5SMD19fYW5ub3RhdGlvbnNfX5R9lChoCowIYnVpbHRpbnOUjAVmbG9hdJSTlIwGcmV0dXJulGgvdYwOX19rd2RlZmF1bHRzX1+UTowMX19kZWZhdWx0c19flE6MCl9fbW9kdWxlX1+UaBmMB19fZG9jX1+UTowLX19jbG9zdXJlX1+UaACMCl9tYWtlX2NlbGyUk5RHP6mZmZmZmZqFlFKUaDdHP7mZmZmZmZqFlFKUaDdHP/AAAAAAAACFlFKUh5SMF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="}, "batch_norm_stats": [], "batch_norm_stats_target": [], "system_info": {"OS": "Linux-5.19.0-35-generic-x86_64-with-glibc2.35 # 36~22.04.1-Ubuntu SMP PREEMPT_DYNAMIC Fri Feb 17 15:17:25 UTC 2", "Python": "3.10.9", "Stable-Baselines3": "1.7.0", "PyTorch": "2.0.0", "GPU Enabled": "True", "Numpy": "1.23.5", "Gym": "0.21.0"}}
|
replay.mp4
CHANGED
Binary files a/replay.mp4 and b/replay.mp4 differ
|
|
results.json
CHANGED
@@ -1 +1 @@
|
|
1 |
-
{"mean_reward":
|
|
|
1 |
+
{"mean_reward": -117.23120850000001, "std_reward": 40.80663827865989, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2023-04-08T16:28:53.667165"}
|