Quentin Gallouédec
commited on
Commit
•
c6448fe
1
Parent(s):
b74096c
Initial commit
Browse files- README.md +1 -1
- args.yml +2 -2
- ddpg-AcrobotSwingupDMC-v0.zip +1 -1
- ddpg-AcrobotSwingupDMC-v0/actor.optimizer.pth +1 -1
- ddpg-AcrobotSwingupDMC-v0/critic.optimizer.pth +1 -1
- ddpg-AcrobotSwingupDMC-v0/data +19 -19
- ddpg-AcrobotSwingupDMC-v0/policy.pth +1 -1
- replay.mp4 +2 -2
- results.json +1 -1
- train_eval_metrics.zip +2 -2
README.md
CHANGED
@@ -16,7 +16,7 @@ model-index:
|
|
16 |
type: AcrobotSwingupDMC-v0
|
17 |
metrics:
|
18 |
- type: mean_reward
|
19 |
-
value:
|
20 |
name: mean_reward
|
21 |
verified: false
|
22 |
---
|
|
|
16 |
type: AcrobotSwingupDMC-v0
|
17 |
metrics:
|
18 |
- type: mean_reward
|
19 |
+
value: 63.99 +/- 45.62
|
20 |
name: mean_reward
|
21 |
verified: false
|
22 |
---
|
args.yml
CHANGED
@@ -54,13 +54,13 @@
|
|
54 |
- - save_replay_buffer
|
55 |
- false
|
56 |
- - seed
|
57 |
-
-
|
58 |
- - storage
|
59 |
- null
|
60 |
- - study_name
|
61 |
- null
|
62 |
- - tensorboard_log
|
63 |
-
- runs/AcrobotSwingupDMC-
|
64 |
- - track
|
65 |
- true
|
66 |
- - trained_agent
|
|
|
54 |
- - save_replay_buffer
|
55 |
- false
|
56 |
- - seed
|
57 |
+
- 1984220215
|
58 |
- - storage
|
59 |
- null
|
60 |
- - study_name
|
61 |
- null
|
62 |
- - tensorboard_log
|
63 |
+
- runs/AcrobotSwingupDMC-v0__ddpg__1984220215__1673811006
|
64 |
- - track
|
65 |
- true
|
66 |
- - trained_agent
|
ddpg-AcrobotSwingupDMC-v0.zip
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 3021849
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b7da56762a6d64c601841ab6591fa7559bbcf54f7e25491f156d838b98ec5606
|
3 |
size 3021849
|
ddpg-AcrobotSwingupDMC-v0/actor.optimizer.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 504751
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:30ded1fe78fd888d2ab4b58d62ec8bf80126b0036a156f5bb7c5621cc9c0ccf5
|
3 |
size 504751
|
ddpg-AcrobotSwingupDMC-v0/critic.optimizer.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 995055
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f5c31d67e4ba48bb9c4779097617312b5b32429e1370f8d519565762ceffbf2b
|
3 |
size 995055
|
ddpg-AcrobotSwingupDMC-v0/data
CHANGED
@@ -4,16 +4,16 @@
|
|
4 |
":serialized:": "gAWVMAAAAAAAAACMHnN0YWJsZV9iYXNlbGluZXMzLnRkMy5wb2xpY2llc5SMCVREM1BvbGljeZSTlC4=",
|
5 |
"__module__": "stable_baselines3.td3.policies",
|
6 |
"__doc__": "\n Policy class (with both actor and critic) for TD3.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n :param n_critics: Number of critic networks to create.\n :param share_features_extractor: Whether to share or not the features extractor\n between the actor and the critic (this saves computation time)\n ",
|
7 |
-
"__init__": "<function TD3Policy.__init__ at
|
8 |
-
"_build": "<function TD3Policy._build at
|
9 |
-
"_get_constructor_parameters": "<function TD3Policy._get_constructor_parameters at
|
10 |
-
"make_actor": "<function TD3Policy.make_actor at
|
11 |
-
"make_critic": "<function TD3Policy.make_critic at
|
12 |
-
"forward": "<function TD3Policy.forward at
|
13 |
-
"_predict": "<function TD3Policy._predict at
|
14 |
-
"set_training_mode": "<function TD3Policy.set_training_mode at
|
15 |
"__abstractmethods__": "frozenset()",
|
16 |
-
"_abc_impl": "<_abc._abc_data object at
|
17 |
},
|
18 |
"verbose": 1,
|
19 |
"policy_kwargs": {
|
@@ -31,7 +31,7 @@
|
|
31 |
},
|
32 |
"observation_space": {
|
33 |
":type:": "<class 'gym.spaces.box.Box'>",
|
34 |
-
":serialized:": "gAWVPAwAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLBoWUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWGAAAAAAAAAAAAID/AACA/wAAgP8AAID/AACA/wAAgP+UaAtLBoWUjAFDlHSUUpSMBGhpZ2iUaBMolhgAAAAAAAAAAACAfwAAgH8AAIB/AACAfwAAgH8AAIB/lGgLSwaFlGgWdJRSlIwNYm91bmRlZF9iZWxvd5RoEyiWBgAAAAAAAAAAAAAAAACUaAiMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////
|
35 |
"dtype": "float32",
|
36 |
"_shape": [
|
37 |
6
|
@@ -70,12 +70,12 @@
|
|
70 |
"initial_noise": null,
|
71 |
"noise_prev": "[0.]"
|
72 |
},
|
73 |
-
"start_time":
|
74 |
"learning_rate": {
|
75 |
":type:": "<class 'function'>",
|
76 |
":serialized:": "gAWVCQMAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMay9ncGZzZHN3b3JrL3Byb2plY3RzL3JlY2gvdWxpL3VwZjgyc3AvZW52X2RtYy9saWIvcHl0aG9uMy45L3NpdGUtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5RLgkMCAAGUjAN2YWyUhZQpdJRSlH2UKIwLX19wYWNrYWdlX1+UjBhzdGFibGVfYmFzZWxpbmVzMy5jb21tb26UjAhfX25hbWVfX5SMHnN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi51dGlsc5SMCF9fZmlsZV9flIxrL2dwZnNkc3dvcmsvcHJvamVjdHMvcmVjaC91bGkvdXBmODJzcC9lbnZfZG1jL2xpYi9weXRob24zLjkvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUdU5OaACMEF9tYWtlX2VtcHR5X2NlbGyUk5QpUpSFlHSUUpSMHGNsb3VkcGlja2xlLmNsb3VkcGlja2xlX2Zhc3SUjBJfZnVuY3Rpb25fc2V0c3RhdGWUk5RoH32UfZQoaBZoDYwMX19xdWFsbmFtZV9flIwZY29uc3RhbnRfZm4uPGxvY2Fscz4uZnVuY5SMD19fYW5ub3RhdGlvbnNfX5R9lIwOX19rd2RlZmF1bHRzX1+UTowMX19kZWZhdWx0c19flE6MCl9fbW9kdWxlX1+UaBeMB19fZG9jX1+UTowLX19jbG9zdXJlX1+UaACMCl9tYWtlX2NlbGyUk5RHPxo24uscQy2FlFKUhZSMF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="
|
77 |
},
|
78 |
-
"tensorboard_log": "runs/AcrobotSwingupDMC-
|
79 |
"lr_schedule": {
|
80 |
":type:": "<class 'function'>",
|
81 |
":serialized:": "gAWVCQMAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMay9ncGZzZHN3b3JrL3Byb2plY3RzL3JlY2gvdWxpL3VwZjgyc3AvZW52X2RtYy9saWIvcHl0aG9uMy45L3NpdGUtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5RLgkMCAAGUjAN2YWyUhZQpdJRSlH2UKIwLX19wYWNrYWdlX1+UjBhzdGFibGVfYmFzZWxpbmVzMy5jb21tb26UjAhfX25hbWVfX5SMHnN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi51dGlsc5SMCF9fZmlsZV9flIxrL2dwZnNkc3dvcmsvcHJvamVjdHMvcmVjaC91bGkvdXBmODJzcC9lbnZfZG1jL2xpYi9weXRob24zLjkvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUdU5OaACMEF9tYWtlX2VtcHR5X2NlbGyUk5QpUpSFlHSUUpSMHGNsb3VkcGlja2xlLmNsb3VkcGlja2xlX2Zhc3SUjBJfZnVuY3Rpb25fc2V0c3RhdGWUk5RoH32UfZQoaBZoDYwMX19xdWFsbmFtZV9flIwZY29uc3RhbnRfZm4uPGxvY2Fscz4uZnVuY5SMD19fYW5ub3RhdGlvbnNfX5R9lIwOX19rd2RlZmF1bHRzX1+UTowMX19kZWZhdWx0c19flE6MCl9fbW9kdWxlX1+UaBeMB19fZG9jX1+UTowLX19jbG9zdXJlX1+UaACMCl9tYWtlX2NlbGyUk5RHPxo24uscQy2FlFKUhZSMF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="
|
@@ -87,7 +87,7 @@
|
|
87 |
},
|
88 |
"_last_original_obs": {
|
89 |
":type:": "<class 'numpy.ndarray'>",
|
90 |
-
":serialized:": "
|
91 |
},
|
92 |
"_episode_num": 1000,
|
93 |
"use_sde": false,
|
@@ -95,7 +95,7 @@
|
|
95 |
"_current_progress_remaining": 0.0,
|
96 |
"ep_info_buffer": {
|
97 |
":type:": "<class 'collections.deque'>",
|
98 |
-
":serialized:": "
|
99 |
},
|
100 |
"ep_success_buffer": {
|
101 |
":type:": "<class 'collections.deque'>",
|
@@ -114,12 +114,12 @@
|
|
114 |
":serialized:": "gAWVNQAAAAAAAACMIHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5idWZmZXJzlIwMUmVwbGF5QnVmZmVylJOULg==",
|
115 |
"__module__": "stable_baselines3.common.buffers",
|
116 |
"__doc__": "\n Replay buffer used in off-policy algorithms like SAC/TD3.\n\n :param buffer_size: Max number of element in the buffer\n :param observation_space: Observation space\n :param action_space: Action space\n :param device: PyTorch device\n :param n_envs: Number of parallel environments\n :param optimize_memory_usage: Enable a memory efficient variant\n of the replay buffer which reduces by almost a factor two the memory used,\n at a cost of more complexity.\n See https://github.com/DLR-RM/stable-baselines3/issues/37#issuecomment-637501195\n and https://github.com/DLR-RM/stable-baselines3/pull/28#issuecomment-637559274\n Cannot be used in combination with handle_timeout_termination.\n :param handle_timeout_termination: Handle timeout termination (due to timelimit)\n separately and treat the task as infinite horizon task.\n https://github.com/DLR-RM/stable-baselines3/issues/284\n ",
|
117 |
-
"__init__": "<function ReplayBuffer.__init__ at
|
118 |
-
"add": "<function ReplayBuffer.add at
|
119 |
-
"sample": "<function ReplayBuffer.sample at
|
120 |
-
"_get_samples": "<function ReplayBuffer._get_samples at
|
121 |
"__abstractmethods__": "frozenset()",
|
122 |
-
"_abc_impl": "<_abc._abc_data object at
|
123 |
},
|
124 |
"replay_buffer_kwargs": {},
|
125 |
"train_freq": {
|
|
|
4 |
":serialized:": "gAWVMAAAAAAAAACMHnN0YWJsZV9iYXNlbGluZXMzLnRkMy5wb2xpY2llc5SMCVREM1BvbGljeZSTlC4=",
|
5 |
"__module__": "stable_baselines3.td3.policies",
|
6 |
"__doc__": "\n Policy class (with both actor and critic) for TD3.\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n :param n_critics: Number of critic networks to create.\n :param share_features_extractor: Whether to share or not the features extractor\n between the actor and the critic (this saves computation time)\n ",
|
7 |
+
"__init__": "<function TD3Policy.__init__ at 0x15dd98280>",
|
8 |
+
"_build": "<function TD3Policy._build at 0x15dd98310>",
|
9 |
+
"_get_constructor_parameters": "<function TD3Policy._get_constructor_parameters at 0x15dd983a0>",
|
10 |
+
"make_actor": "<function TD3Policy.make_actor at 0x15dd98430>",
|
11 |
+
"make_critic": "<function TD3Policy.make_critic at 0x15dd984c0>",
|
12 |
+
"forward": "<function TD3Policy.forward at 0x15dd98550>",
|
13 |
+
"_predict": "<function TD3Policy._predict at 0x15dd985e0>",
|
14 |
+
"set_training_mode": "<function TD3Policy.set_training_mode at 0x15dd98670>",
|
15 |
"__abstractmethods__": "frozenset()",
|
16 |
+
"_abc_impl": "<_abc._abc_data object at 0x15dd92ac0>"
|
17 |
},
|
18 |
"verbose": 1,
|
19 |
"policy_kwargs": {
|
|
|
31 |
},
|
32 |
"observation_space": {
|
33 |
":type:": "<class 'gym.spaces.box.Box'>",
|
34 |
+
":serialized:": "gAWVPAwAAAAAAACMDmd5bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMBl9zaGFwZZRLBoWUjANsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWGAAAAAAAAAAAAID/AACA/wAAgP8AAID/AACA/wAAgP+UaAtLBoWUjAFDlHSUUpSMBGhpZ2iUaBMolhgAAAAAAAAAAACAfwAAgH8AAIB/AACAfwAAgH8AAIB/lGgLSwaFlGgWdJRSlIwNYm91bmRlZF9iZWxvd5RoEyiWBgAAAAAAAAAAAAAAAACUaAiMAmIxlImIh5RSlChLA4wBfJROTk5K/////0r/////SwB0lGJLBoWUaBZ0lFKUjA1ib3VuZGVkX2Fib3ZllGgTKJYGAAAAAAAAAAAAAAAAAJRoIksGhZRoFnSUUpSMCl9ucF9yYW5kb22UjBRudW1weS5yYW5kb20uX3BpY2tsZZSMEl9fcmFuZG9tc3RhdGVfY3RvcpSTlIwHTVQxOTkzN5RoLowUX19iaXRfZ2VuZXJhdG9yX2N0b3KUk5SGlFKUfZQojA1iaXRfZ2VuZXJhdG9ylIwHTVQxOTkzN5SMBXN0YXRllH2UKIwDa2V5lGgTKJbACQAAAAAAAAAAAIDO/UUSK+SzQxpEYygPLMsTFdbShBtsgGSc0PxxD1V7WKwUYv60imTyPiF1ZN50ZI2FTYXvAdfFgX0NLJWw/xmDEcbxVcyNIh4vEUl0MOHsN2cjfizqwDVujdvomrcTdl8il+RRAAgG82F8c9Vq0dr5y7O5Z50GPPJMUxdDLtiluncOsSCysn0KXEDS1ugrR5adxHiH46sglf0387AMZIk9mf3gTwF2mquo3cBgkp79eBdKEDa7xTZz3lzxbA723Y+An4Gxhc/NBNZA5EoELW2ThtprS1k6Ixzt8TQLWsvW6rnBG4Q2oHG8A0SurKcyXHtoy77DCgAPIFLnLUndnJyjQzyZ2GJnCTXMgDs5EMlqkVn9Bjs5NZ9Yrqy1/+Q0iz1LSBvr61Fe3hYE9pvraBTPvkfmWuO/ZjL4uhm2LYnwXwUDpU1DzYev0WTh3m13iONz5qD4zMH1qqFSzNWJrpmPC3H28boIBFIaT+tlS349YGNX1ybZTjX/Q9TGgguIlEhS9y+EmxCslxT/2II3ZvUUxvVB6oGp+Gt4ayx4Y4rCSQRPAWpP83KkkntflRhROGBbXctbtTE6pEkWvqyCW3N283nqIhMEO4FjDx9MsVNYi4Zp4QbEbPpgQmdjqbggxm3qHtEriWbGi6dT03K9Xtqwq4tnOVqlCZxT01dKzaEPyqdL5giqt+qdHoADyZ+K4P+mhiiK8ddZKi8s8RWv7Pzzg3VAZMGk/EhViC5kdK/2Kjg2pMhbV3NsVjJ/4Yhbn0EUmAxnbZbllj+QhKAxkgYRKE8M8Z2U7oUUuHojDiuP8PeZ4CfIa53cJrX695AKlhDaap0dsbRzy1iR8ERSls+6+vKpzlpkIJ2WabHgh8Z44Kc36tqWSItD+TnbSt5IEW83IA623KP1BZ8dX+a8WGxBlKp4bimzWVpYo1G/Mo7CYxJEg9pOcHjNT2jvHm1rSk5Y1yUTWes27wmi0nFJYbSp4M6Awqii6zEWgQn9C3/3aCp4+83bsXn/0m+uoOuHoeYeMa58ykVioUHUMnbEWfHoT6pWvdP7gYDxwPHh7WuCOsLpTcjC1ktCQN3kpDc88u5t5LK37AAWIaFT1Sd9NgNKBdKT9CHPHPyt+MeWe/ojHnR4ItrnXGxJfcDDI5e05Vt852e9SCf0p92bRlQgUC0saLbwnTTyGLJ0E3RuKtF/ygQ8Dva2axoUiXUtiRqAk5JlaqijSKfDeRONvygvYrbjU1yGzTCj00JW3q6C5BM1L0XQQ+j2c643ClDP7C3f5B0w1i6AuJWpr+j5OOaDR043F+CnHUTtdnOGFDXKH1C5fCx7bjq2WgrmnWSzAQWXdat9hEfGRE2SGT/FAXgx4T4rO6/NpomltJCHJri6h1ZAm5w0xjQiU72qmL9Nf22HeFV/SsA34HmQ1SyLUNvD6uEqZXcZDpwp2F2+lO53nUiHLTTtvcPLK0ySAaM4BcZVBgdHm1J3bj0NxppSySJFHHd8j+nsyhhVIBTiEamba8xOKuhtZ7BoRCmCxOxyDTCzneBwYUVXII84rJnBrh5fe1qYuqWBRzfn2fWAeYj78WBDpI7/KB8cKF37PWaJAkzBLgqUsFtjgSGM09T/HeqphXFLLpC0Diffru8OE0iK+TxIY93ppW+SttYV8mzXQRtXK0c3YpPw2uYa8wTwIlqpOtq1E8jw0cZVVm/b38RtAbTUPLTfpq1KkRNhjCXFy7+sueMdzJwKuLTUDodt6XDKZJYrOtRFM/7bfOLyInIOBalJI3hTQ0YN4M/wAZys4jyrx0g7QJFqEG0w8eLqzcIL+nzgedSn352hMiqSuW/jdz4IJIzcNNmGHa4zXPp4JYbDMk5xqITlOT5/5ze1QrsP3ApXW5t9YPueGVrXcKKqj9uQ6IQK4eWgxiCIWG0kNckMGjqRQPOrdDHqIrI5DBFO2fvN9ZWS59rJwL/vmwAXOYrsBqnF187ep7wQ23i1cnb5aG551xDv3PWoIXQAlukrzlWV5CWbozskFNoVWSJKk8SND8p4oG+wahutUAa4xN7AlkgBg3niIyOeXpYrmI3E2uoWIRVUVFg5oKBOOPahOAZ747uDhBMKswJUgnwjtKicBlfqY19I9fJcDr64ZOMuNUkl5o10HNFalHEgIP6g3aK3czl4N6dAYg7W0klWtrD15l6bwhCqj6X82+5q2MFYjaaiXwKCf2Ox9flcgJKZHMDFVd9t8iTIB8G8kWdZvCjElCO9PI7eaboONlXedcagcvfAf0LSsJgvIAfyeJs1FdUQzaKncXVoRmh8gfF0xbYe5xoOWrw3srZAnTKVRwKABRx/y25uBO1d+oqEveifeakiSof3gDVA5IfBDoQMWPqFKC6Ot3zC15mZzF1WIMbrcrIOxe8WpHHLYvqXdLAYaFA7M4qjKFpKijY7BH49mUk7QzUBjs6+mo5tk/S5bw67ssFLA+w0vwYl41g4RjiddCXr+UzfwAdA2fsiDZqidcu4pSFhG23n65zWz7LriRpkxWZkAVWVXR2m3JmGXRZDviKd/Ed8eJVLmQzuVJCPmf82erP2U5NriNd2+Do2eHpoqW7OCrBOzQQoPkN5T3gdokZNHi9QvdlhnPPPu6Gyg+DEeUjFaqk02PO5zfxyL/428H8CVsjSCQ5H3yVX5CIRlVQD0GdQI622t/I4JxFZVqrWG3YK3QaWYGPx6LOHqMhG/nMJYiuhwkjKqGgtB3uDPj6BtZcVmqq6iOfZehKhEKc0o9tjMGkAZ3sT4X4jJV6rZrfbpqf4Sz6dRmEKx9nKlZVPQfYUasXiTfjVVi2dsHXN/4RGEFd422YHlqlLvxdo3DyXvb/ZSeV41551UE45Y24OpT0YP7P0Bh7opG8uOii7jIbnpMHbU42DP2x/J+mkfX0dNrFIzyDTx6xYDUEEEL42d85XSN1Ew08iP63AyRXUYkwWnothJTvReq49k0MEPP9EJSCrLMbAvdMjhyGoEyeoX5pVAmLPjOHqWxRq77xCQfKW5mSopJJ/P0PqIZKNVsiozjUrWHf6BMzQDJRgP/Hmeah/a89UFlG9bh6FcE8/jrp/EeiLcr0uuC9GdzUMbWUCnBW6V5I2IrJin5Qv6JZXqVZt2qCCPXQ24KRlsTGEKVbjVd1Brpmh6MEn1wEaU1KYCUdunjpgw+hM+vuXXQb/nja+xBsgpGu6PrG6/8BCZmw+zEkclzmArG0MkbXctvBt2JhLSEp9YhXJTySXlGOdoM1eJyka067nofk7ADD4RwHAxxFTjUftbuE8PYusdI4fW8bZWryLuh+lLrclIUOAkX+azHygzppQfWPQYpRoCIwCdTSUiYiHlFKUKEsDaAxOTk5K/////0r/////SwB0lGJNcAKFlGgWdJRSlIwDcG9zlE1wAnWMCWhhc19nYXVzc5RLAIwFZ2F1c3OURwAAAAAAAAAAdWJ1Yi4=",
|
35 |
"dtype": "float32",
|
36 |
"_shape": [
|
37 |
6
|
|
|
70 |
"initial_noise": null,
|
71 |
"noise_prev": "[0.]"
|
72 |
},
|
73 |
+
"start_time": 1673811008957099024,
|
74 |
"learning_rate": {
|
75 |
":type:": "<class 'function'>",
|
76 |
":serialized:": "gAWVCQMAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMay9ncGZzZHN3b3JrL3Byb2plY3RzL3JlY2gvdWxpL3VwZjgyc3AvZW52X2RtYy9saWIvcHl0aG9uMy45L3NpdGUtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5RLgkMCAAGUjAN2YWyUhZQpdJRSlH2UKIwLX19wYWNrYWdlX1+UjBhzdGFibGVfYmFzZWxpbmVzMy5jb21tb26UjAhfX25hbWVfX5SMHnN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi51dGlsc5SMCF9fZmlsZV9flIxrL2dwZnNkc3dvcmsvcHJvamVjdHMvcmVjaC91bGkvdXBmODJzcC9lbnZfZG1jL2xpYi9weXRob24zLjkvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUdU5OaACMEF9tYWtlX2VtcHR5X2NlbGyUk5QpUpSFlHSUUpSMHGNsb3VkcGlja2xlLmNsb3VkcGlja2xlX2Zhc3SUjBJfZnVuY3Rpb25fc2V0c3RhdGWUk5RoH32UfZQoaBZoDYwMX19xdWFsbmFtZV9flIwZY29uc3RhbnRfZm4uPGxvY2Fscz4uZnVuY5SMD19fYW5ub3RhdGlvbnNfX5R9lIwOX19rd2RlZmF1bHRzX1+UTowMX19kZWZhdWx0c19flE6MCl9fbW9kdWxlX1+UaBeMB19fZG9jX1+UTowLX19jbG9zdXJlX1+UaACMCl9tYWtlX2NlbGyUk5RHPxo24uscQy2FlFKUhZSMF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="
|
77 |
},
|
78 |
+
"tensorboard_log": "runs/AcrobotSwingupDMC-v0__ddpg__4000244894__1673811006/AcrobotSwingupDMC-v0",
|
79 |
"lr_schedule": {
|
80 |
":type:": "<class 'function'>",
|
81 |
":serialized:": "gAWVCQMAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwSIAFMAlE6FlCmMAV+UhZSMay9ncGZzZHN3b3JrL3Byb2plY3RzL3JlY2gvdWxpL3VwZjgyc3AvZW52X2RtYy9saWIvcHl0aG9uMy45L3NpdGUtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5RLgkMCAAGUjAN2YWyUhZQpdJRSlH2UKIwLX19wYWNrYWdlX1+UjBhzdGFibGVfYmFzZWxpbmVzMy5jb21tb26UjAhfX25hbWVfX5SMHnN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi51dGlsc5SMCF9fZmlsZV9flIxrL2dwZnNkc3dvcmsvcHJvamVjdHMvcmVjaC91bGkvdXBmODJzcC9lbnZfZG1jL2xpYi9weXRob24zLjkvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUdU5OaACMEF9tYWtlX2VtcHR5X2NlbGyUk5QpUpSFlHSUUpSMHGNsb3VkcGlja2xlLmNsb3VkcGlja2xlX2Zhc3SUjBJfZnVuY3Rpb25fc2V0c3RhdGWUk5RoH32UfZQoaBZoDYwMX19xdWFsbmFtZV9flIwZY29uc3RhbnRfZm4uPGxvY2Fscz4uZnVuY5SMD19fYW5ub3RhdGlvbnNfX5R9lIwOX19rd2RlZmF1bHRzX1+UTowMX19kZWZhdWx0c19flE6MCl9fbW9kdWxlX1+UaBeMB19fZG9jX1+UTowLX19jbG9zdXJlX1+UaACMCl9tYWtlX2NlbGyUk5RHPxo24uscQy2FlFKUhZSMF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="
|
|
|
87 |
},
|
88 |
"_last_original_obs": {
|
89 |
":type:": "<class 'numpy.ndarray'>",
|
90 |
+
":serialized:": "gAWVjQAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYYAAAAAAAAAGSnUj825ga90XcRv3Pcfz8rYwtAF5AWQZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGJLAUsGhpSMAUOUdJRSlC4="
|
91 |
},
|
92 |
"_episode_num": 1000,
|
93 |
"use_sde": false,
|
|
|
95 |
"_current_progress_remaining": 0.0,
|
96 |
"ep_info_buffer": {
|
97 |
":type:": "<class 'collections.deque'>",
|
98 |
+
":serialized:": "gAWVRAwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHQFN56jWTX8SMAWyUTegDjAF0lEdAwy+kiSq2jXV9lChoBkcAAAAAAAAAAGgHTegDaAhHQMM091jAi3Z1fZQoaAZHQGFUyWRigChoB03oA2gIR0DDOldZJTVEdX2UKGgGR0BhX93yI55raAdN6ANoCEdAwz+1R1oxpXV9lChoBkdAZkBlkpZwGWgHTegDaAhHQMNFFUzCUHJ1fZQoaAZHQFSValk6LfloB03oA2gIR0DDSnaABkqddX2UKGgGR0BZ6qxHG0eEaAdN6ANoCEdAw0/VKDkELnV9lChoBkdAYCEjfNzKcWgHTegDaAhHQMNVM3f642F1fZQoaAZHQFCzUt7KJVNoB03oA2gIR0DDWpRLh73PdX2UKGgGR0BDpU/wAlv7aAdN6ANoCEdAw1/yqlP8AXV9lChoBkdAagk1y/9Hc2gHTegDaAhHQMNlUcWCVbB1fZQoaAZHQDvS+10DEFZoB03oA2gIR0DDaqoPf8/EdX2UKGgGR0ArRaCcwxnGaAdN6ANoCEdAw3AEf4h2XHV9lChoBkdAV4pH4Glhw2gHTegDaAhHQMN1YmZE2Hd1fZQoaAZHQGQyk1uR9w5oB03oA2gIR0DDesEbWEsbdX2UKGgGR0BwFYWEbo8qaAdN6ANoCEdAw4AgDW9UTHV9lChoBkdAWJz0th/iHmgHTegDaAhHQMOFgNapxWF1fZQoaAZHQF7uRbbDdgxoB03oA2gIR0DDit16sySFdX2UKGgGR0BXe0R8MNMHaAdN6ANoCEdAw5A7JBgNPXV9lChoBkdAZWpkz41xbWgHTegDaAhHQMOVnFt8/lh1fZQoaAZHQGKsQgcLjPxoB03oA2gIR0DDmvrzGxUvdX2UKGgGR0Btt3UDuBtlaAdN6ANoCEdAw6BZevZAZHV9lChoBkc/sOv+wTufEmgHTegDaAhHQMOltwQ176Z1fZQoaAZHQGBG0Vi4J/poB03oA2gIR0DDqxWUUwi8dX2UKGgGRz/ZaR6nivPkaAdN6ANoCEdAw7B0nPVurXV9lChoBkdAYHYTtb9qDmgHTegDaAhHQMO46L/S6Ud1fZQoaAZHQEaMIrvsqrloB03oA2gIR0DDvkhL26CldX2UKGgGR0BcAxa1TisGaAdN6ANoCEdAw8On1yNn5HV9lChoBkdAbtDXAdn002gHTegDaAhHQMPJCIpx3mp1fZQoaAZHQGcvVfVqeshoB03oA2gIR0DDzmac/dIodX2UKGgGR0BAdkrGza9LaAdN6ANoCEdAw9PH0lJHy3V9lChoBkdASewkNWluWWgHTegDaAhHQMPZKOzIFNd1fZQoaAZHP7pcxCY1He9oB03oA2gIR0DD3oo5Lh73dX2UKGgGR0BC3DXFtKqXaAdN6ANoCEdAw+PqKw6hg3V9lChoBkdAYKhsFdLQHGgHTegDaAhHQMPpSqk/KQt1fZQoaAZHQFEGe5Fw1ixoB03oA2gIR0DD7qUd5prUdX2UKGgGR0BaH2jsUqQSaAdN6ANoCEdAw/QEzDXOGHV9lChoBkc/k0GeMAFPi2gHTegDaAhHQMP5VZbpu/F1fZQoaAZHQGkHJeNT989oB03oA2gIR0DD/qO0gKWtdX2UKGgGR0AfPABT4tYkaAdN6ANoCEdAxAPvz4k/r3V9lChoBkdAcm6nG8274GgHTegDaAhHQMQJP7p3X7N1fZQoaAZHQDaZ+so2GZhoB03oA2gIR0DEDo3M+u/2dX2UKGgGR0BBcgH/tICmaAdN6ANoCEdAxBPdDm8ujHV9lChoBkdAQ0Fk4FRpDmgHTegDaAhHQMQZLCrDIil1fZQoaAZHQG6GW87IT5BoB03oA2gIR0DEHnhdt2s8dX2UKGgGR0AlMAHVwxWUaAdN6ANoCEdAxCPINoakynV9lChoBkdAGPhgE2YOUmgHTegDaAhHQMQpF4Kpkwx1fZQoaAZHQFpZ4GUwBYFoB03oA2gIR0DELmPcUM5PdX2UKGgGR0B1DrAaef7KaAdN6ANoCEdAxDOxssxwhnV9lChoBkdAYGGSDh99dGgHTegDaAhHQMQ4/7N0NjN1fZQoaAZHP/dzCDVYp2FoB03oA2gIR0DEQV+AVfu1dX2UKGgGRz+25vtMPBi1aAdN6ANoCEdAxEawK5TZQHV9lChoBkdAXaccxTKkmGgHTegDaAhHQMRL/K0+kgx1fZQoaAZHQCqLfzjFQ2xoB03oA2gIR0DEUUQd8zAOdX2UKGgGR0AMDK1XvH94aAdN6ANoCEdAxFaQTJQtSXV9lChoBkdAbliNaQmu1WgHTegDaAhHQMRb3x9oexR1fZQoaAZHP7cg+yJKraNoB03oA2gIR0DEYSrd8Aq/dX2UKGgGR0BbvoUnG828aAdN6ANoCEdAxGZ4LofSyHV9lChoBkdASN5GlQ/HHWgHTegDaAhHQMRrw7Y02tN1fZQoaAZHQGDScgQpWmxoB03oA2gIR0DEcQ8se4kNdX2UKGgGR0BIjIacZtN0aAdN6ANoCEdAxHZe5xzaK3V9lChoBkdAek0i6QNkOWgHTegDaAhHQMR7rOlGgBd1fZQoaAZHP9mgoPTXrdFoB03oA2gIR0DEgPxcu8K5dX2UKGgGRz+yQNkOI68yaAdN6ANoCEdAxIZJ15B1LnV9lChoBkdAKrTW5H3DemgHTegDaAhHQMSLmPw/gR91fZQoaAZHQFSDjt5UtI1oB03oA2gIR0DEkOXUYsNEdX2UKGgGRz+6CSRr8BMjaAdN6ANoCEdAxJY1PGhmG3V9lChoBkdAYSnMCcPOIWgHTegDaAhHQMSbgNOuaF51fZQoaAZHQEEuX+l0o0BoB03oA2gIR0DEoNI5YHPedX2UKGgGR0BZxAs9SuQqaAdN6ANoCEdAxKYfdyDIzXV9lChoBkdAbX5g8bJfY2gHTegDaAhHQMSrbJSiudR1fZQoaAZHQDFS1v2oNutoB03oA2gIR0DEsLoO4G2UdX2UKGgGR0BmApNKyv9taAdN6ANoCEdAxLYJ2A5Jb3V9lChoBkcAAAAAAAAAAGgHTegDaAhHQMS7WD81n/V1fZQoaAZHQFNY/e+Eh7poB03oA2gIR0DEwKMHnlnzdX2UKGgGR0BoYctdzGPxaAdN6ANoCEdAxMkA9nscAHV9lChoBkdATBcsvqTr3WgHTegDaAhHQMTOTSV4X411fZQoaAZHQGrl5YYBNmFoB03oA2gIR0DE05QrrgO0dX2UKGgGR0A8t+MZP2wnaAdN6ANoCEdAxNjbT3qRl3V9lChoBkdAZHunF5v9+GgHTegDaAhHQMTeI30XgtR1fZQoaAZHQE5b6MR6F/RoB03oA2gIR0DE42zY287IdX2UKGgGRwAAAAAAAAAAaAdN6ANoCEdAxOixxGUfP3V9lChoBkdAZeqAtnPE9GgHTegDaAhHQMTt99hRZU11fZQoaAZHQF/ESw4bS7ZoB03oA2gIR0DE8z2Zy+6AdX2UKGgGRz/gtI9TxXnyaAdN6ANoCEdAxPiFmDlHSXV9lChoBkdAU0OVrylN12gHTegDaAhHQMT9zMYl6Z91fZQoaAZHQEQ/SuyNXHRoB03oA2gIR0DFAxV1fVqfdX2UKGgGR0BTAPbCaZx8aAdN6ANoCEdAxQhcIKtxMnV9lChoBkdAWLDsNUfgaWgHTegDaAhHQMUNpFJQLux1fZQoaAZHQAzYkNWluWNoB03oA2gIR0DFEujxoZhsdX2UKGgGRz/hp6Y3Ns3yaAdN6ANoCEdAxRgwgXdj5XV9lChoBkdAaClr7fpD/mgHTegDaAhHQMUdd5yuIRB1fZQoaAZHQFui2v0RODdoB03oA2gIR0DFIsFZX+2mdX2UKGgGR0Bpzi+8Gs3iaAdN6ANoCEdAxSgIRDCxeXV9lChoBkc/5Eth/iHZb2gHTegDaAhHQMUtUCCz1K51fZQoaAZHP3vAGjbi6xxoB03oA2gIR0DFMpQTsY2sdX2UKGgGR0BEoNwzch1UaAdN6ANoCEdAxTfahzvJBHV9lChoBkdAOO8VUMoc72gHTegDaAhHQMU9IiVKPGR1fZQoaAZHQGYgj3M6ikBoB03oA2gIR0DFQmhZGKAKdX2UKGgGR0BNglERaouPaAdN6ANoCEdAxUevJMg2ZXVlLg=="
|
99 |
},
|
100 |
"ep_success_buffer": {
|
101 |
":type:": "<class 'collections.deque'>",
|
|
|
114 |
":serialized:": "gAWVNQAAAAAAAACMIHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5idWZmZXJzlIwMUmVwbGF5QnVmZmVylJOULg==",
|
115 |
"__module__": "stable_baselines3.common.buffers",
|
116 |
"__doc__": "\n Replay buffer used in off-policy algorithms like SAC/TD3.\n\n :param buffer_size: Max number of element in the buffer\n :param observation_space: Observation space\n :param action_space: Action space\n :param device: PyTorch device\n :param n_envs: Number of parallel environments\n :param optimize_memory_usage: Enable a memory efficient variant\n of the replay buffer which reduces by almost a factor two the memory used,\n at a cost of more complexity.\n See https://github.com/DLR-RM/stable-baselines3/issues/37#issuecomment-637501195\n and https://github.com/DLR-RM/stable-baselines3/pull/28#issuecomment-637559274\n Cannot be used in combination with handle_timeout_termination.\n :param handle_timeout_termination: Handle timeout termination (due to timelimit)\n separately and treat the task as infinite horizon task.\n https://github.com/DLR-RM/stable-baselines3/issues/284\n ",
|
117 |
+
"__init__": "<function ReplayBuffer.__init__ at 0x15dd96dd0>",
|
118 |
+
"add": "<function ReplayBuffer.add at 0x15dd96e60>",
|
119 |
+
"sample": "<function ReplayBuffer.sample at 0x15dd96ef0>",
|
120 |
+
"_get_samples": "<function ReplayBuffer._get_samples at 0x15dd96f80>",
|
121 |
"__abstractmethods__": "frozenset()",
|
122 |
+
"_abc_impl": "<_abc._abc_data object at 0x15dd36300>"
|
123 |
},
|
124 |
"replay_buffer_kwargs": {},
|
125 |
"train_freq": {
|
ddpg-AcrobotSwingupDMC-v0/policy.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1498141
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c12f2f779f204501a51d10f296b6efde52e8256d40897cf60a4dd499be096f2e
|
3 |
size 1498141
|
replay.mp4
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ccdeb4ee7dfda830f556731466a081ca5c470f6c684640b37cd6890303c94e6c
|
3 |
+
size 256725
|
results.json
CHANGED
@@ -1 +1 @@
|
|
1 |
-
{"mean_reward":
|
|
|
1 |
+
{"mean_reward": 63.98670130000001, "std_reward": 45.619853380275124, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2023-01-16T08:48:02.395143"}
|
train_eval_metrics.zip
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:258bde2e57f54e78370fa93b9e6f9e82a34c18ba91a077173e1e7b9fa9f53df1
|
3 |
+
size 41438
|