bospoort committed on
Commit
f389de0
1 Parent(s): 4e28e36

Upload DQN LunarLander-v2 trained agent

Browse files
README.md ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ library_name: stable-baselines3
3
+ tags:
4
+ - LunarLander-v2
5
+ - deep-reinforcement-learning
6
+ - reinforcement-learning
7
+ - stable-baselines3
8
+ model-index:
9
+ - name: dqn
10
+ results:
11
+ - task:
12
+ type: reinforcement-learning
13
+ name: reinforcement-learning
14
+ dataset:
15
+ name: LunarLander-v2
16
+ type: LunarLander-v2
17
+ metrics:
18
+ - type: mean_reward
19
+ value: -116.97 +/- 89.45
20
+ name: mean_reward
21
+ verified: false
22
+ ---
23
+
24
+ # **dqn** Agent playing **LunarLander-v2**
25
+ This is a trained model of a **dqn** agent playing **LunarLander-v2**
26
+ using the [stable-baselines3 library](https://github.com/DLR-RM/stable-baselines3).
27
+
28
+ ## Usage (with Stable-baselines3)
29
+ TODO: Add your code
30
+
31
+
32
+ ```python
33
+ from stable_baselines3 import ...
34
+ from huggingface_sb3 import load_from_hub
35
+
36
+ ...
37
+ ```
config.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"policy_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVMAAAAAAAAACMHnN0YWJsZV9iYXNlbGluZXMzLmRxbi5wb2xpY2llc5SMCURRTlBvbGljeZSTlC4=", "__module__": "stable_baselines3.dqn.policies", "__annotations__": "{'q_net': <class 'stable_baselines3.dqn.policies.QNetwork'>, 'q_net_target': <class 'stable_baselines3.dqn.policies.QNetwork'>}", "__doc__": "\n Policy class with Q-Value Net and target net for DQN\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ", "__init__": "<function DQNPolicy.__init__ at 0x7fd5331deb60>", "_build": "<function DQNPolicy._build at 0x7fd5331dec00>", "make_q_net": "<function DQNPolicy.make_q_net at 0x7fd5331deca0>", "forward": "<function DQNPolicy.forward at 0x7fd5331ded40>", "_predict": "<function DQNPolicy._predict at 0x7fd5331dede0>", "_get_constructor_parameters": "<function DQNPolicy._get_constructor_parameters at 0x7fd5331dee80>", "set_training_mode": "<function DQNPolicy.set_training_mode at 0x7fd5331def20>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7fd5331e9940>"}, "verbose": 1, "policy_kwargs": {}, "num_timesteps": 1000000, "_total_timesteps": 1000000, "_num_timesteps_at_start": 0, "seed": null, "action_noise": null, "start_time": 1706575822237294089, "learning_rate": 0.0001, "tensorboard_log": null, "_last_obs": {":type:": 
"<class 'numpy.ndarray'>", ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAANhU7b6sHBY+QI/KvUQn37ssifO74MD0uwAAAAAAAAAASSgbv0wEQz7Shq29PN6Ovef2Brww3Yi8AAAAAAAAAAAznXm9NhQhP3BZ/73AAFO9OmBYPACNA70AAAAAAAAAAM2QpDsZjCo/WhC2vSVWqrzP0bU6S7eQvAAAAAAAAAAAS7JHv2xKKz6PkpG9QyKqPHoy4L0Bt6g9AACAPwAAgD9WTpS+Cx6jPhsokb3d5iC9XJ8hPTrPc7wAAAAAAAAAAEinJb8pwu4+UqMavY0H2r2mIAQ96v8AvAAAAAAAAAAAvHwVv0xypj8dWmG+gF7YvZ/EHb7AgKM8AAAAAAAAAAClDvq+pWqXPvtR47wjAQm9EdnWPKDI1jwAAAAAAAAAANPYyL4Qbag+f4W/vTr9N70Bfna9EnKlPAAAAAAAAAAAmv16PtTHkD+t7yu+bEJbvZUm07sh0ha8AAAAAAAAAACzrLQ9a/dEP3WhYL37+hi9hwXQPKqkTrwAAAAAAAAAAErLrD50PVg/LoXUuxswh72RwQU9Rhg9OwAAAAAAAAAAoDZIvnSg9j7Fvca92VVhvYowqrwazOE8AAAAAAAAAACy1VG/fHFDP1qKvb0etMK9StILvap8bbwAAAAAAAAAAIU+J7/U1l0+IgA1vR3427yEJVE83fGaPAAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="}, "_last_episode_starts": {":type:": "<class 'numpy.ndarray'>", ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAEBAQEBAQEBAQEBAQEBAQGUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="}, "_last_original_obs": {":type:": "<class 'numpy.ndarray'>", ":serialized:": 
"gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAALbS7L7VRBY+54LLvbKtH71UTOe7W4fvuwAAAAAAAAAANPAav7qfRD5wy8S9O2cyvV+O8ruTr+s8AAAAAAAAAADNcHS9MmAhP2DX/L13b069lq9yPEL0AL0AAAAAAAAAAJr9wTvBqio/lhaavRaLgr29yxQ7Ht2XuwAAAAAAAAAAbYZHv8TRKj71foq9Q7yiPACi6L0yL6E9AACAPwAAgD9z8JO+8pGjPqsceL1TpTq9jKskPep437sAAAAAAAAAAEeOJb8m/O8+z+pDvWpLpL1zvQU9zG4FPQAAAAAAAAAAKu0Uv0TApj+Sl2++Kf3zvTrKHr7kOIA8AAAAAAAAAAAD7Pm+Oc2XPlUembwNcNS72RvMPHCSJbwAAAAAAAAAAJZfyL6n8ag+wPPSvSYlj7zcoHq9k45vPQAAAAAAAAAA+rZ8PkzvkD+IwDu+n//CvYMRxLuZNMG8AAAAAAAAAACaz7U9gi5FP6vRW73Tdpm9AzDVPC3EY7wAAAAAAAAAAJrTrD7Jnlg//qRqvCEDI71JKgU9gsMMPQAAAAAAAAAA4DtHvsRC9z5KCeC9S5+mvb96tbx/iY08AAAAAAAAAACQmFG/pP1DPx3N4r3lTs69VdoIvXpd+rwAAAAAAAAAADAiJ78ndV4+8Mv2vCkHVr3wpkE856cBPQAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="}, "_episode_num": 2180, "use_sde": false, "sde_sample_freq": -1, "_current_progress_remaining": 0.0, "_stats_window_size": 100, "ep_info_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": 
"gAWVRAwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHwD6dyOq//NuMAWyUTegDjAF0lEdAsQ1Vvfj0c3V9lChoBkfAZSg/BWPtD2gHTV0DaAhHQLEN7+j/Mnt1fZQoaAZHwFRg5Xlr/KhoB03oA2gIR0CxELe1OTJRdX2UKGgGR8BSrXsolUqAaAdN6ANoCEdAsRHyY6XBxnV9lChoBkfAJFuRDCxeLWgHTegDaAhHQLETYn8baRJ1fZQoaAZHP/w/IbOu7pVoB03oA2gIR0CxFLwEEC/5dX2UKGgGR8BowfPVurIYaAdNpQNoCEdAsRUcWrOqvXV9lChoBkfAJKVkUbkwOGgHTegDaAhHQLEW/WrwOON1fZQoaAZHwB7haHKwIMVoB03oA2gIR0CxFxIeT3ZgdX2UKGgGR8BGWN/FzdULaAdN6ANoCEdAsRceqJdjXnV9lChoBkfAVBBIatLcsWgHTegDaAhHQLEXuZUT+Nt1fZQoaAZHwEcWL3sXzlNoB03oA2gIR0CxGGP7WNFSdX2UKGgGR8BYoUit7rs0aAdN6ANoCEdAsRif4EfT1HV9lChoBkfALlQjD8+A3GgHTegDaAhHQLEav6QeV9p1fZQoaAZHwGjWUhFEy+JoB03CA2gIR0CxHHqqn3tbdX2UKGgGR8BA+IwEhaC+aAdN6ANoCEdAsRyYbrC3w3V9lChoBkfATli2c8TzumgHTegDaAhHQLEfeXu3MIN1fZQoaAZHwFrMe5nUUfxoB03oA2gIR0CxIBUV32VWdX2UKGgGR8AXGlJpWV/uaAdN6ANoCEdAsSLl1QqI8HV9lChoBkdAUU5og3cYZWgHTcUDaAhHQLEjUWAf+0h1fZQoaAZHwGMe3PiT+vRoB01xA2gIR0CxJI8hTwUhdX2UKGgGR8BmvTF+/gzhaAdN9gJoCEdAsSUP987ZF3V9lChoBkfAZCklt0mtyWgHTTMDaAhHQLElUdkauOl1fZQoaAZHwE3y8mKIi1RoB03oA2gIR0CxJW/vjOs1dX2UKGgGR8AqVd30PH1faAdN6ANoCEdAsSZ04tHx0HV9lChoBkfAYSbTNt65XmgHTSEDaAhHQLEnFw++ueV1fZQoaAZHQEQu4EwFkhBoB03IA2gIR0CxJ8ujynUEdX2UKGgGR8BYlrUXpGF0aAdN6ANoCEdAsShjlfZ26nV9lChoBkfATfuzSkTHsGgHTegDaAhHQLEp5DG96C11fZQoaAZHwCSwZVGTcItoB03oA2gIR0CxLPMD8tPIdX2UKGgGR8BRo6Mm4RVZaAdN6ANoCEdAsS8lv2oNu3V9lChoBkfARCIsPJ7swGgHTegDaAhHQLEvS9/z8P51fZQoaAZHwD0v9m6GxlhoB03oA2gIR0CxMo3AymALdX2UKGgGR8BVy5rxiG34aAdN6ANoCEdAsTM4cBEKE3V9lChoBkfAY6gmelKsdWgHTV8DaAhHQLEzds8PnSx1fZQoaAZHP/NdmQKa5PNoB03bA2gIR0CxNagLeANHdX2UKGgGR8Bk7PbZezD5aAdNywNoCEdAsTdetzS1E3V9lChoBkfAVB11QqI8AGgHTegDaAhHQLE3c6w+t8x1fZQoaAZHwGUPm/WUbDNoB03WA2gIR0CxN88rNGExdX2UKGgGR8BWbcenyd4FaAdN6ANoCEdAsTg71nM+vHV9lChoBkfAZ+p3bEgnt2gHTZADaAhHQLE4ZqgRK6F1fZQoaAZHwEa5QHiWE9NoB03oA2gIR0CxOTVOTJQtdX2UKGgGR8BrH9dszl90aAdNvQNoCEdAsTnJHI6sAHV9lChoBkdAT7V4gRsdk2gHTa0DaAhHQLE6Iaef7Jp1fZQoaAZHwEG+jv/io89oB03oA2gIR0CxPJi8e0XxdX2UKGgGR8BlctcdHUc5aAdNPANoCEdAsTy7csUZenV9lChoBkfAZUd1g6U7jmgHTRQDaAhHQLE
9+4nWrfd1fZQoaAZHQFEfomois4loB001A2gIR0CxPnI3aSLZdX2UKGgGR8BjKfa+N96UaAdNuAJoCEdAsT8BcNYr8XV9lChoBkfAYZ7yLhrFfmgHTdgCaAhHQLFCTWnTAnF1fZQoaAZHwGAo2+wkgOloB01uA2gIR0CxQzUjPfKqdX2UKGgGR8BGS1WbPQfIaAdN6ANoCEdAsUWTbUPQOXV9lChoBkfAYtg7xusLfGgHTTADaAhHQLFHLu7HyVh1fZQoaAZHwGB+aKLsKLNoB00WA2gIR0CxR7tP557gdX2UKGgGR8BgqFmvnr6daAdN/QJoCEdAsUgCSxJNCnV9lChoBkfASqohUzbeuWgHTegDaAhHQLFKFZOSGJx1fZQoaAZHwD9XC0ngHeJoB03oA2gIR0CxSi1HrhR7dX2UKGgGR0BEMqbSZ0CBaAdN1wNoCEdAsUo5tP557nV9lChoBkdAVQm5SWJJoWgHTVMDaAhHQLFKcNKh+OR1fZQoaAZHwFDzFCb+cYtoB03oA2gIR0CxSvZ3PiT/dX2UKGgGR8Bt3hI1+AmRaAdNQANoCEdAsU5aYjSofnV9lChoBkfAOM+jmCAc1mgHTegDaAhHQLFQJ5nDiwV1fZQoaAZHwFt09U0elsRoB03oA2gIR0CxUFDHsC1adX2UKGgGR8BmjHlfZ26kaAdNhwNoCEdAsVD6pEQXh3V9lChoBkfASEhMDfWMCWgHTegDaAhHQLFSKSmZVn51fZQoaAZHwGRRUzj3mFJoB00sA2gIR0CxU3mknCwbdX2UKGgGR8BChpI+W4ViaAdN6ANoCEdAsVZz2Cdz4nV9lChoBkfAZHYnTiKiwmgHTRsDaAhHQLFW662OQyR1fZQoaAZHwG1QRoqTbFloB03VA2gIR0CxWYFN5+pgdX2UKGgGR8BlXcnw5NoKaAdNCANoCEdAsVnJAdGRWHV9lChoBkfAWZD0UXYUWWgHTegBaAhHQLFaRYNy5qd1fZQoaAZHwGbwV+AmReVoB00HA2gIR0CxWlTYqXnhdX2UKGgGR8Bcy76DXe3yaAdNWAJoCEdAsVqbnhbW3HV9lChoBkfAbGTZSNwR5GgHTaUDaAhHQLFas2Kl54Z1fZQoaAZHwFPFua4MF2VoB03oA2gIR0CxW5btJFspdX2UKGgGR8Buu+Tkhib2aAdN3wNoCEdAsV0lCkXUIHV9lChoBkfAVyaHwgDA8GgHTegDaAhHQLFdW23azu51fZQoaAZHwEQOIJqqOtJoB03oA2gIR0CxXWR/ZuhsdX2UKGgGR8BWvG74BV+7aAdN8AFoCEdAsV9HPLPldXV9lChoBkfAXWEGKQ7tA2gHTRgCaAhHQLFgRmoR7JJ1fZQoaAZHwGU2/fXPJJZoB00RA2gIR0CxYHwA+6iCdX2UKGgGR8BWMSbDuSfUaAdNuAFoCEdAsWGP3IuGsXV9lChoBkfAQq77yhBZ6mgHTegDaAhHQLFiQ5Lytmt1fZQoaAZHwFI5io86mwdoB03oA2gIR0CxYwpWzWwvdX2UKGgGR8BevVhLGrCFaAdNggJoCEdAsWQmNzbN8nV9lChoBkfAS8B7ojfNzWgHTegDaAhHQLFlVbrC3w11fZQoaAZHwFyP6bvw3HdoB007AmgIR0CxZocry1/ldX2UKGgGR8BjalYSxqwhaAdNGgNoCEdAsWeEo4MnZ3V9lChoBkfAZC0E1VHWjGgHTdkCaAhHQLFnvqQiiZh1fZQoaAZHwGsFavicXnBoB01eA2gIR0CxaA8yFfzCdX2UKGgGR8BlzfpKSPluaAdNVwJoCEdAsWnEBnzxw3V9lChoBkfATiMit7rs0GgHTegDaAhHQLFrXAFgUlB1fZQoaAZHwDVrhVENOM5oB03oA2gIR0Cxa6KzRhMKdX2UKGgGR8BftrVz6rNoaAdNEQJoCEdAsWy+59Vmz3V9lChoBkfAXcIcQyylemgHTUECaAhHQLFsx14gRsd1fZQoaAZ
HwGzvxRVIZqFoB02hA2gIR0CxbXKoVEeAdX2UKGgGR8BooIg/1QIlaAdNBANoCEdAsW50dlum8HV9lChoBkfATilmapgkT2gHTegDaAhHQLFuxqlxffJ1fZQoaAZHwFEgKji4rjJoB03oA2gIR0CxcsAGnn+ydX2UKGgGR8BY1DPBzmwJaAdN6ANoCEdAsXSCtCAtnXVlLg=="}, "ep_success_buffer": {":type:": "<class 'collections.deque'>", ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="}, "_n_updates": 14844, "observation_space": {":type:": "<class 'gymnasium.spaces.box.Box'>", ":serialized:": "gAWVdgIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWCAAAAAAAAAABAQEBAQEBAZRoCIwCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoESiWCAAAAAAAAAABAQEBAQEBAZRoFUsIhZRoGXSUUpSMBl9zaGFwZZRLCIWUjANsb3eUaBEoliAAAAAAAAAAAAC0wgAAtMIAAKDAAACgwNsPScAAAKDAAAAAgAAAAICUaAtLCIWUaBl0lFKUjARoaWdolGgRKJYgAAAAAAAAAAAAtEIAALRCAACgQAAAoEDbD0lAAACgQAAAgD8AAIA/lGgLSwiFlGgZdJRSlIwIbG93X3JlcHKUjFtbLTkwLiAgICAgICAgLTkwLiAgICAgICAgIC01LiAgICAgICAgIC01LiAgICAgICAgIC0zLjE0MTU5MjcgIC01LgogIC0wLiAgICAgICAgIC0wLiAgICAgICBdlIwJaGlnaF9yZXBylIxTWzkwLiAgICAgICAgOTAuICAgICAgICAgNS4gICAgICAgICA1LiAgICAgICAgIDMuMTQxNTkyNyAgNS4KICAxLiAgICAgICAgIDEuICAgICAgIF2UjApfbnBfcmFuZG9tlE51Yi4=", "dtype": "float32", "bounded_below": "[ True True True True True True True True]", "bounded_above": "[ True True True True True True True True]", "_shape": [8], "low": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]", "low_repr": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]", "high_repr": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. 
]", "_np_random": null}, "action_space": {":type:": "<class 'gymnasium.spaces.discrete.Discrete'>", ":serialized:": "gAWVpAEAAAAAAACMGWd5bW5hc2l1bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIBAAAAAAAAACUhpRSlIwFc3RhcnSUaAhoDkMIAAAAAAAAAACUhpRSlIwGX3NoYXBllCmMBWR0eXBllGgOjApfbnBfcmFuZG9tlIwUbnVtcHkucmFuZG9tLl9waWNrbGWUjBBfX2dlbmVyYXRvcl9jdG9ylJOUjAVQQ0c2NJRoG4wUX19iaXRfZ2VuZXJhdG9yX2N0b3KUk5SGlFKUfZQojA1iaXRfZ2VuZXJhdG9ylIwFUENHNjSUjAVzdGF0ZZR9lChoJooRI3gx9nV86k+Av4E0d+Wa3ACMA2luY5SKEAOj7fwhxAH26id6KbEBMzp1jApoYXNfdWludDMylEsAjAh1aW50ZWdlcpSKBYUFMuEAdWJ1Yi4=", "n": "4", "start": "0", "_shape": [], "dtype": "int64", "_np_random": "Generator(PCG64)"}, "n_envs": 16, "buffer_size": 1000000, "batch_size": 64, "learning_starts": 50000, "tau": 1.0, "gamma": 0.999, "gradient_steps": 1, "optimize_memory_usage": false, "replay_buffer_class": {":type:": "<class 'abc.ABCMeta'>", ":serialized:": "gAWVNQAAAAAAAACMIHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5idWZmZXJzlIwMUmVwbGF5QnVmZmVylJOULg==", "__module__": "stable_baselines3.common.buffers", "__doc__": "\n Replay buffer used in off-policy algorithms like SAC/TD3.\n\n :param buffer_size: Max number of element in the buffer\n :param observation_space: Observation space\n :param action_space: Action space\n :param device: PyTorch device\n :param n_envs: Number of parallel environments\n :param optimize_memory_usage: Enable a memory efficient variant\n of the replay buffer which reduces by almost a factor two the memory used,\n at a cost of more complexity.\n See https://github.com/DLR-RM/stable-baselines3/issues/37#issuecomment-637501195\n and https://github.com/DLR-RM/stable-baselines3/pull/28#issuecomment-637559274\n Cannot be used in combination with handle_timeout_termination.\n :param handle_timeout_termination: Handle timeout termination (due to timelimit)\n separately and treat the task as infinite 
horizon task.\n https://github.com/DLR-RM/stable-baselines3/issues/284\n ", "__init__": "<function ReplayBuffer.__init__ at 0x7fd5331ca2a0>", "add": "<function ReplayBuffer.add at 0x7fd5331ca3e0>", "sample": "<function ReplayBuffer.sample at 0x7fd5331ca480>", "_get_samples": "<function ReplayBuffer._get_samples at 0x7fd5331ca520>", "__abstractmethods__": "frozenset()", "_abc_impl": "<_abc._abc_data object at 0x7fd5331c7140>"}, "replay_buffer_kwargs": {}, "train_freq": {":type:": "<class 'stable_baselines3.common.type_aliases.TrainFreq'>", ":serialized:": "gAWVeAAAAAAAAACMJXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi50eXBlX2FsaWFzZXOUjAlUcmFpbkZyZXGUk5RLBIwIYnVpbHRpbnOUjAdnZXRhdHRylJOUaACMElRyYWluRnJlcXVlbmN5VW5pdJSTlIwEU1RFUJSGlFKUhpSBlC4="}, "use_sde_at_warmup": false, "exploration_initial_eps": 1.0, "exploration_final_eps": 0.05, "exploration_fraction": 0.1, "target_update_interval": 625, "_n_calls": 62500, "max_grad_norm": 10, "exploration_rate": 0.05, "lr_schedule": {":type:": "<class 'function'>", ":serialized:": 
"gAWV4QIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwiVAZcAiQFTAJROhZQpjAFflIWUjF4vaG9tZS9hYmJ5L2FuYWNvbmRhMy9lbnZzL2NvbGFiL2xpYi9weXRob24zLjExL3NpdGUtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUS4RDCPiAANgPEogKlEMAlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMXi9ob21lL2FiYnkvYW5hY29uZGEzL2VudnMvY29sYWIvbGliL3B5dGhvbjMuMTEvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUdU5OaACMEF9tYWtlX2VtcHR5X2NlbGyUk5QpUpSFlHSUUpRoAIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaCF9lH2UKGgYaA2MDF9fcXVhbG5hbWVfX5RoDowPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoGYwHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/Gjbi6xxDLYWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="}, "batch_norm_stats": [], "batch_norm_stats_target": [], "exploration_schedule": {":type:": "<class 'function'>", ":serialized:": 
"gAWVwAMAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLBEsTQzyVA5cAZAF8AHoKAACJAmsEAAAAAHICiQFTAIkDZAF8AHoKAACJAYkDegoAAHoFAACJAnoLAAB6AAAAUwCUTksBhpQpjBJwcm9ncmVzc19yZW1haW5pbmeUhZSMXi9ob21lL2FiYnkvYW5hY29uZGEzL2VudnMvY29sYWIvbGliL3B5dGhvbjMuMTEvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlIwbZ2V0X2xpbmVhcl9mbi48bG9jYWxzPi5mdW5jlEtyQzv4gADYDA3QECLRDCKgbNILMvAAAwlTAdgTFohK4BMYmEHQIDLRHDKwc7hVsXvRG0PAbNEbUtETUtAMUpRDAJSMA2VuZJSMDGVuZF9mcmFjdGlvbpSMBXN0YXJ0lIeUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMXi9ob21lL2FiYnkvYW5hY29uZGEzL2VudnMvY29sYWIvbGliL3B5dGhvbjMuMTEvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUdU5OaACMEF9tYWtlX2VtcHR5X2NlbGyUk5QpUpRoHylSlGgfKVKUh5R0lFKUaACMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGglfZR9lChoGmgNjAxfX3F1YWxuYW1lX1+UaA6MD19fYW5ub3RhdGlvbnNfX5R9lChoCowIYnVpbHRpbnOUjAVmbG9hdJSTlIwGcmV0dXJulGgvdYwOX19rd2RlZmF1bHRzX1+UTowMX19kZWZhdWx0c19flE6MCl9fbW9kdWxlX1+UaBuMB19fZG9jX1+UTowLX19jbG9zdXJlX1+UaACMCl9tYWtlX2NlbGyUk5RHP6mZmZmZmZqFlFKUaDdHP7mZmZmZmZqFlFKUaDdHP/AAAAAAAACFlFKUh5SMF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="}, "system_info": {"OS": "Linux-5.15.133.1-microsoft-standard-WSL2-x86_64-with-glibc2.35 # 1 SMP Thu Oct 5 21:02:42 UTC 2023", "Python": "3.11.0", "Stable-Baselines3": "2.0.0a5", "PyTorch": "2.1.2+cu121", "GPU Enabled": "True", "Numpy": "1.26.3", "Cloudpickle": "3.0.0", "Gymnasium": "0.28.1"}}
dqn-LunarLander-v1.zip ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1d742a2f04bf3b44e5739dc99c1ade2b471dce8416e2a766d088cb6b9f6197d0
3
+ size 108209
dqn-LunarLander-v1/_stable_baselines3_version ADDED
@@ -0,0 +1 @@
 
 
1
+ 2.0.0a5
dqn-LunarLander-v1/data ADDED
@@ -0,0 +1,121 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "policy_class": {
3
+ ":type:": "<class 'abc.ABCMeta'>",
4
+ ":serialized:": "gAWVMAAAAAAAAACMHnN0YWJsZV9iYXNlbGluZXMzLmRxbi5wb2xpY2llc5SMCURRTlBvbGljeZSTlC4=",
5
+ "__module__": "stable_baselines3.dqn.policies",
6
+ "__annotations__": "{'q_net': <class 'stable_baselines3.dqn.policies.QNetwork'>, 'q_net_target': <class 'stable_baselines3.dqn.policies.QNetwork'>}",
7
+ "__doc__": "\n Policy class with Q-Value Net and target net for DQN\n\n :param observation_space: Observation space\n :param action_space: Action space\n :param lr_schedule: Learning rate schedule (could be constant)\n :param net_arch: The specification of the policy and value networks.\n :param activation_fn: Activation function\n :param features_extractor_class: Features extractor to use.\n :param features_extractor_kwargs: Keyword arguments\n to pass to the features extractor.\n :param normalize_images: Whether to normalize images or not,\n dividing by 255.0 (True by default)\n :param optimizer_class: The optimizer to use,\n ``th.optim.Adam`` by default\n :param optimizer_kwargs: Additional keyword arguments,\n excluding the learning rate, to pass to the optimizer\n ",
8
+ "__init__": "<function DQNPolicy.__init__ at 0x7fd5331deb60>",
9
+ "_build": "<function DQNPolicy._build at 0x7fd5331dec00>",
10
+ "make_q_net": "<function DQNPolicy.make_q_net at 0x7fd5331deca0>",
11
+ "forward": "<function DQNPolicy.forward at 0x7fd5331ded40>",
12
+ "_predict": "<function DQNPolicy._predict at 0x7fd5331dede0>",
13
+ "_get_constructor_parameters": "<function DQNPolicy._get_constructor_parameters at 0x7fd5331dee80>",
14
+ "set_training_mode": "<function DQNPolicy.set_training_mode at 0x7fd5331def20>",
15
+ "__abstractmethods__": "frozenset()",
16
+ "_abc_impl": "<_abc._abc_data object at 0x7fd5331e9940>"
17
+ },
18
+ "verbose": 1,
19
+ "policy_kwargs": {},
20
+ "num_timesteps": 1000000,
21
+ "_total_timesteps": 1000000,
22
+ "_num_timesteps_at_start": 0,
23
+ "seed": null,
24
+ "action_noise": null,
25
+ "start_time": 1706575822237294089,
26
+ "learning_rate": 0.0001,
27
+ "tensorboard_log": null,
28
+ "_last_obs": {
29
+ ":type:": "<class 'numpy.ndarray'>",
30
+ ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAANhU7b6sHBY+QI/KvUQn37ssifO74MD0uwAAAAAAAAAASSgbv0wEQz7Shq29PN6Ovef2Brww3Yi8AAAAAAAAAAAznXm9NhQhP3BZ/73AAFO9OmBYPACNA70AAAAAAAAAAM2QpDsZjCo/WhC2vSVWqrzP0bU6S7eQvAAAAAAAAAAAS7JHv2xKKz6PkpG9QyKqPHoy4L0Bt6g9AACAPwAAgD9WTpS+Cx6jPhsokb3d5iC9XJ8hPTrPc7wAAAAAAAAAAEinJb8pwu4+UqMavY0H2r2mIAQ96v8AvAAAAAAAAAAAvHwVv0xypj8dWmG+gF7YvZ/EHb7AgKM8AAAAAAAAAAClDvq+pWqXPvtR47wjAQm9EdnWPKDI1jwAAAAAAAAAANPYyL4Qbag+f4W/vTr9N70Bfna9EnKlPAAAAAAAAAAAmv16PtTHkD+t7yu+bEJbvZUm07sh0ha8AAAAAAAAAACzrLQ9a/dEP3WhYL37+hi9hwXQPKqkTrwAAAAAAAAAAErLrD50PVg/LoXUuxswh72RwQU9Rhg9OwAAAAAAAAAAoDZIvnSg9j7Fvca92VVhvYowqrwazOE8AAAAAAAAAACy1VG/fHFDP1qKvb0etMK9StILvap8bbwAAAAAAAAAAIU+J7/U1l0+IgA1vR3427yEJVE83fGaPAAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="
31
+ },
32
+ "_last_episode_starts": {
33
+ ":type:": "<class 'numpy.ndarray'>",
34
+ ":serialized:": "gAWVgwAAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYQAAAAAAAAAAEBAQEBAQEBAQEBAQEBAQGUjAVudW1weZSMBWR0eXBllJOUjAJiMZSJiIeUUpQoSwOMAXyUTk5OSv////9K/////0sAdJRiSxCFlIwBQ5R0lFKULg=="
35
+ },
36
+ "_last_original_obs": {
37
+ ":type:": "<class 'numpy.ndarray'>",
38
+ ":serialized:": "gAWVdQIAAAAAAACMEm51bXB5LmNvcmUubnVtZXJpY5SMC19mcm9tYnVmZmVylJOUKJYAAgAAAAAAALbS7L7VRBY+54LLvbKtH71UTOe7W4fvuwAAAAAAAAAANPAav7qfRD5wy8S9O2cyvV+O8ruTr+s8AAAAAAAAAADNcHS9MmAhP2DX/L13b069lq9yPEL0AL0AAAAAAAAAAJr9wTvBqio/lhaavRaLgr29yxQ7Ht2XuwAAAAAAAAAAbYZHv8TRKj71foq9Q7yiPACi6L0yL6E9AACAPwAAgD9z8JO+8pGjPqsceL1TpTq9jKskPep437sAAAAAAAAAAEeOJb8m/O8+z+pDvWpLpL1zvQU9zG4FPQAAAAAAAAAAKu0Uv0TApj+Sl2++Kf3zvTrKHr7kOIA8AAAAAAAAAAAD7Pm+Oc2XPlUembwNcNS72RvMPHCSJbwAAAAAAAAAAJZfyL6n8ag+wPPSvSYlj7zcoHq9k45vPQAAAAAAAAAA+rZ8PkzvkD+IwDu+n//CvYMRxLuZNMG8AAAAAAAAAACaz7U9gi5FP6vRW73Tdpm9AzDVPC3EY7wAAAAAAAAAAJrTrD7Jnlg//qRqvCEDI71JKgU9gsMMPQAAAAAAAAAA4DtHvsRC9z5KCeC9S5+mvb96tbx/iY08AAAAAAAAAACQmFG/pP1DPx3N4r3lTs69VdoIvXpd+rwAAAAAAAAAADAiJ78ndV4+8Mv2vCkHVr3wpkE856cBPQAAAAAAAAAAlIwFbnVtcHmUjAVkdHlwZZSTlIwCZjSUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYksQSwiGlIwBQ5R0lFKULg=="
39
+ },
40
+ "_episode_num": 2180,
41
+ "use_sde": false,
42
+ "sde_sample_freq": -1,
43
+ "_current_progress_remaining": 0.0,
44
+ "_stats_window_size": 100,
45
+ "ep_info_buffer": {
46
+ ":type:": "<class 'collections.deque'>",
47
+ ":serialized:": "gAWVRAwAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKUKH2UKIwBcpRHwD6dyOq//NuMAWyUTegDjAF0lEdAsQ1Vvfj0c3V9lChoBkfAZSg/BWPtD2gHTV0DaAhHQLEN7+j/Mnt1fZQoaAZHwFRg5Xlr/KhoB03oA2gIR0CxELe1OTJRdX2UKGgGR8BSrXsolUqAaAdN6ANoCEdAsRHyY6XBxnV9lChoBkfAJFuRDCxeLWgHTegDaAhHQLETYn8baRJ1fZQoaAZHP/w/IbOu7pVoB03oA2gIR0CxFLwEEC/5dX2UKGgGR8BowfPVurIYaAdNpQNoCEdAsRUcWrOqvXV9lChoBkfAJKVkUbkwOGgHTegDaAhHQLEW/WrwOON1fZQoaAZHwB7haHKwIMVoB03oA2gIR0CxFxIeT3ZgdX2UKGgGR8BGWN/FzdULaAdN6ANoCEdAsRceqJdjXnV9lChoBkfAVBBIatLcsWgHTegDaAhHQLEXuZUT+Nt1fZQoaAZHwEcWL3sXzlNoB03oA2gIR0CxGGP7WNFSdX2UKGgGR8BYoUit7rs0aAdN6ANoCEdAsRif4EfT1HV9lChoBkfALlQjD8+A3GgHTegDaAhHQLEav6QeV9p1fZQoaAZHwGjWUhFEy+JoB03CA2gIR0CxHHqqn3tbdX2UKGgGR8BA+IwEhaC+aAdN6ANoCEdAsRyYbrC3w3V9lChoBkfATli2c8TzumgHTegDaAhHQLEfeXu3MIN1fZQoaAZHwFrMe5nUUfxoB03oA2gIR0CxIBUV32VWdX2UKGgGR8AXGlJpWV/uaAdN6ANoCEdAsSLl1QqI8HV9lChoBkdAUU5og3cYZWgHTcUDaAhHQLEjUWAf+0h1fZQoaAZHwGMe3PiT+vRoB01xA2gIR0CxJI8hTwUhdX2UKGgGR8BmvTF+/gzhaAdN9gJoCEdAsSUP987ZF3V9lChoBkfAZCklt0mtyWgHTTMDaAhHQLElUdkauOl1fZQoaAZHwE3y8mKIi1RoB03oA2gIR0CxJW/vjOs1dX2UKGgGR8AqVd30PH1faAdN6ANoCEdAsSZ04tHx0HV9lChoBkfAYSbTNt65XmgHTSEDaAhHQLEnFw++ueV1fZQoaAZHQEQu4EwFkhBoB03IA2gIR0CxJ8ujynUEdX2UKGgGR8BYlrUXpGF0aAdN6ANoCEdAsShjlfZ26nV9lChoBkfATfuzSkTHsGgHTegDaAhHQLEp5DG96C11fZQoaAZHwCSwZVGTcItoB03oA2gIR0CxLPMD8tPIdX2UKGgGR8BRo6Mm4RVZaAdN6ANoCEdAsS8lv2oNu3V9lChoBkfARCIsPJ7swGgHTegDaAhHQLEvS9/z8P51fZQoaAZHwD0v9m6GxlhoB03oA2gIR0CxMo3AymALdX2UKGgGR8BVy5rxiG34aAdN6ANoCEdAsTM4cBEKE3V9lChoBkfAY6gmelKsdWgHTV8DaAhHQLEzds8PnSx1fZQoaAZHP/NdmQKa5PNoB03bA2gIR0CxNagLeANHdX2UKGgGR8Bk7PbZezD5aAdNywNoCEdAsTdetzS1E3V9lChoBkfAVB11QqI8AGgHTegDaAhHQLE3c6w+t8x1fZQoaAZHwGUPm/WUbDNoB03WA2gIR0CxN88rNGExdX2UKGgGR8BWbcenyd4FaAdN6ANoCEdAsTg71nM+vHV9lChoBkfAZ+p3bEgnt2gHTZADaAhHQLE4ZqgRK6F1fZQoaAZHwEa5QHiWE9NoB03oA2gIR0CxOTVOTJQtdX2UKGgGR8BrH9dszl90aAdNvQNoCEdAsTnJHI6sAHV9lChoBkdAT7V4gRsdk2gHTa0DaAhHQLE6Iaef7Jp1fZQoaAZHwEG+jv/io89oB03oA2gIR0CxPJi8e0XxdX2UKGgGR8BlctcdHUc5aAdNPANoCEdAsTy7csUZenV9lChoBkfAZUd1g
6U7jmgHTRQDaAhHQLE9+4nWrfd1fZQoaAZHQFEfomois4loB001A2gIR0CxPnI3aSLZdX2UKGgGR8BjKfa+N96UaAdNuAJoCEdAsT8BcNYr8XV9lChoBkfAYZ7yLhrFfmgHTdgCaAhHQLFCTWnTAnF1fZQoaAZHwGAo2+wkgOloB01uA2gIR0CxQzUjPfKqdX2UKGgGR8BGS1WbPQfIaAdN6ANoCEdAsUWTbUPQOXV9lChoBkfAYtg7xusLfGgHTTADaAhHQLFHLu7HyVh1fZQoaAZHwGB+aKLsKLNoB00WA2gIR0CxR7tP557gdX2UKGgGR8BgqFmvnr6daAdN/QJoCEdAsUgCSxJNCnV9lChoBkfASqohUzbeuWgHTegDaAhHQLFKFZOSGJx1fZQoaAZHwD9XC0ngHeJoB03oA2gIR0CxSi1HrhR7dX2UKGgGR0BEMqbSZ0CBaAdN1wNoCEdAsUo5tP557nV9lChoBkdAVQm5SWJJoWgHTVMDaAhHQLFKcNKh+OR1fZQoaAZHwFDzFCb+cYtoB03oA2gIR0CxSvZ3PiT/dX2UKGgGR8Bt3hI1+AmRaAdNQANoCEdAsU5aYjSofnV9lChoBkfAOM+jmCAc1mgHTegDaAhHQLFQJ5nDiwV1fZQoaAZHwFt09U0elsRoB03oA2gIR0CxUFDHsC1adX2UKGgGR8BmjHlfZ26kaAdNhwNoCEdAsVD6pEQXh3V9lChoBkfASEhMDfWMCWgHTegDaAhHQLFSKSmZVn51fZQoaAZHwGRRUzj3mFJoB00sA2gIR0CxU3mknCwbdX2UKGgGR8BChpI+W4ViaAdN6ANoCEdAsVZz2Cdz4nV9lChoBkfAZHYnTiKiwmgHTRsDaAhHQLFW662OQyR1fZQoaAZHwG1QRoqTbFloB03VA2gIR0CxWYFN5+pgdX2UKGgGR8BlXcnw5NoKaAdNCANoCEdAsVnJAdGRWHV9lChoBkfAWZD0UXYUWWgHTegBaAhHQLFaRYNy5qd1fZQoaAZHwGbwV+AmReVoB00HA2gIR0CxWlTYqXnhdX2UKGgGR8Bcy76DXe3yaAdNWAJoCEdAsVqbnhbW3HV9lChoBkfAbGTZSNwR5GgHTaUDaAhHQLFas2Kl54Z1fZQoaAZHwFPFua4MF2VoB03oA2gIR0CxW5btJFspdX2UKGgGR8Buu+Tkhib2aAdN3wNoCEdAsV0lCkXUIHV9lChoBkfAVyaHwgDA8GgHTegDaAhHQLFdW23azu51fZQoaAZHwEQOIJqqOtJoB03oA2gIR0CxXWR/ZuhsdX2UKGgGR8BWvG74BV+7aAdN8AFoCEdAsV9HPLPldXV9lChoBkfAXWEGKQ7tA2gHTRgCaAhHQLFgRmoR7JJ1fZQoaAZHwGU2/fXPJJZoB00RA2gIR0CxYHwA+6iCdX2UKGgGR8BWMSbDuSfUaAdNuAFoCEdAsWGP3IuGsXV9lChoBkfAQq77yhBZ6mgHTegDaAhHQLFiQ5Lytmt1fZQoaAZHwFI5io86mwdoB03oA2gIR0CxYwpWzWwvdX2UKGgGR8BevVhLGrCFaAdNggJoCEdAsWQmNzbN8nV9lChoBkfAS8B7ojfNzWgHTegDaAhHQLFlVbrC3w11fZQoaAZHwFyP6bvw3HdoB007AmgIR0CxZocry1/ldX2UKGgGR8BjalYSxqwhaAdNGgNoCEdAsWeEo4MnZ3V9lChoBkfAZC0E1VHWjGgHTdkCaAhHQLFnvqQiiZh1fZQoaAZHwGsFavicXnBoB01eA2gIR0CxaA8yFfzCdX2UKGgGR8BlzfpKSPluaAdNVwJoCEdAsWnEBnzxw3V9lChoBkfATiMit7rs0GgHTegDaAhHQLFrXAFgUlB1fZQoaAZHwDVrhVENOM5oB03oA2gIR0Cxa6KzRhMKdX2UKGgGR8BftrVz6rNoaAdNEQJoCEdAsWy+59Vmz3V9lChoBkfAXcIcQyylemgHTUECaAhHQ
LFsx14gRsd1fZQoaAZHwGzvxRVIZqFoB02hA2gIR0CxbXKoVEeAdX2UKGgGR8BooIg/1QIlaAdNBANoCEdAsW50dlum8HV9lChoBkfATilmapgkT2gHTegDaAhHQLFuxqlxffJ1fZQoaAZHwFEgKji4rjJoB03oA2gIR0CxcsAGnn+ydX2UKGgGR8BY1DPBzmwJaAdN6ANoCEdAsXSCtCAtnXVlLg=="
48
+ },
49
+ "ep_success_buffer": {
50
+ ":type:": "<class 'collections.deque'>",
51
+ ":serialized:": "gAWVIAAAAAAAAACMC2NvbGxlY3Rpb25zlIwFZGVxdWWUk5QpS2SGlFKULg=="
52
+ },
53
+ "_n_updates": 14844,
54
+ "observation_space": {
55
+ ":type:": "<class 'gymnasium.spaces.box.Box'>",
56
+ ":serialized:": "gAWVdgIAAAAAAACMFGd5bW5hc2l1bS5zcGFjZXMuYm94lIwDQm94lJOUKYGUfZQojAVkdHlwZZSMBW51bXB5lIwFZHR5cGWUk5SMAmY0lImIh5RSlChLA4wBPJROTk5K/////0r/////SwB0lGKMDWJvdW5kZWRfYmVsb3eUjBJudW1weS5jb3JlLm51bWVyaWOUjAtfZnJvbWJ1ZmZlcpSTlCiWCAAAAAAAAAABAQEBAQEBAZRoCIwCYjGUiYiHlFKUKEsDjAF8lE5OTkr/////Sv////9LAHSUYksIhZSMAUOUdJRSlIwNYm91bmRlZF9hYm92ZZRoESiWCAAAAAAAAAABAQEBAQEBAZRoFUsIhZRoGXSUUpSMBl9zaGFwZZRLCIWUjANsb3eUaBEoliAAAAAAAAAAAAC0wgAAtMIAAKDAAACgwNsPScAAAKDAAAAAgAAAAICUaAtLCIWUaBl0lFKUjARoaWdolGgRKJYgAAAAAAAAAAAAtEIAALRCAACgQAAAoEDbD0lAAACgQAAAgD8AAIA/lGgLSwiFlGgZdJRSlIwIbG93X3JlcHKUjFtbLTkwLiAgICAgICAgLTkwLiAgICAgICAgIC01LiAgICAgICAgIC01LiAgICAgICAgIC0zLjE0MTU5MjcgIC01LgogIC0wLiAgICAgICAgIC0wLiAgICAgICBdlIwJaGlnaF9yZXBylIxTWzkwLiAgICAgICAgOTAuICAgICAgICAgNS4gICAgICAgICA1LiAgICAgICAgIDMuMTQxNTkyNyAgNS4KICAxLiAgICAgICAgIDEuICAgICAgIF2UjApfbnBfcmFuZG9tlE51Yi4=",
57
+ "dtype": "float32",
58
+ "bounded_below": "[ True True True True True True True True]",
59
+ "bounded_above": "[ True True True True True True True True]",
60
+ "_shape": [
61
+ 8
62
+ ],
63
+ "low": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]",
64
+ "high": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]",
65
+ "low_repr": "[-90. -90. -5. -5. -3.1415927 -5.\n -0. -0. ]",
66
+ "high_repr": "[90. 90. 5. 5. 3.1415927 5.\n 1. 1. ]",
67
+ "_np_random": null
68
+ },
69
+ "action_space": {
70
+ ":type:": "<class 'gymnasium.spaces.discrete.Discrete'>",
71
+ ":serialized:": "gAWVpAEAAAAAAACMGWd5bW5hc2l1bS5zcGFjZXMuZGlzY3JldGWUjAhEaXNjcmV0ZZSTlCmBlH2UKIwBbpSMFW51bXB5LmNvcmUubXVsdGlhcnJheZSMBnNjYWxhcpSTlIwFbnVtcHmUjAVkdHlwZZSTlIwCaTiUiYiHlFKUKEsDjAE8lE5OTkr/////Sv////9LAHSUYkMIBAAAAAAAAACUhpRSlIwFc3RhcnSUaAhoDkMIAAAAAAAAAACUhpRSlIwGX3NoYXBllCmMBWR0eXBllGgOjApfbnBfcmFuZG9tlIwUbnVtcHkucmFuZG9tLl9waWNrbGWUjBBfX2dlbmVyYXRvcl9jdG9ylJOUjAVQQ0c2NJRoG4wUX19iaXRfZ2VuZXJhdG9yX2N0b3KUk5SGlFKUfZQojA1iaXRfZ2VuZXJhdG9ylIwFUENHNjSUjAVzdGF0ZZR9lChoJooRI3gx9nV86k+Av4E0d+Wa3ACMA2luY5SKEAOj7fwhxAH26id6KbEBMzp1jApoYXNfdWludDMylEsAjAh1aW50ZWdlcpSKBYUFMuEAdWJ1Yi4=",
72
+ "n": "4",
73
+ "start": "0",
74
+ "_shape": [],
75
+ "dtype": "int64",
76
+ "_np_random": "Generator(PCG64)"
77
+ },
78
+ "n_envs": 16,
79
+ "buffer_size": 1000000,
80
+ "batch_size": 64,
81
+ "learning_starts": 50000,
82
+ "tau": 1.0,
83
+ "gamma": 0.999,
84
+ "gradient_steps": 1,
85
+ "optimize_memory_usage": false,
86
+ "replay_buffer_class": {
87
+ ":type:": "<class 'abc.ABCMeta'>",
88
+ ":serialized:": "gAWVNQAAAAAAAACMIHN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi5idWZmZXJzlIwMUmVwbGF5QnVmZmVylJOULg==",
89
+ "__module__": "stable_baselines3.common.buffers",
90
+ "__doc__": "\n Replay buffer used in off-policy algorithms like SAC/TD3.\n\n :param buffer_size: Max number of element in the buffer\n :param observation_space: Observation space\n :param action_space: Action space\n :param device: PyTorch device\n :param n_envs: Number of parallel environments\n :param optimize_memory_usage: Enable a memory efficient variant\n of the replay buffer which reduces by almost a factor two the memory used,\n at a cost of more complexity.\n See https://github.com/DLR-RM/stable-baselines3/issues/37#issuecomment-637501195\n and https://github.com/DLR-RM/stable-baselines3/pull/28#issuecomment-637559274\n Cannot be used in combination with handle_timeout_termination.\n :param handle_timeout_termination: Handle timeout termination (due to timelimit)\n separately and treat the task as infinite horizon task.\n https://github.com/DLR-RM/stable-baselines3/issues/284\n ",
91
+ "__init__": "<function ReplayBuffer.__init__ at 0x7fd5331ca2a0>",
92
+ "add": "<function ReplayBuffer.add at 0x7fd5331ca3e0>",
93
+ "sample": "<function ReplayBuffer.sample at 0x7fd5331ca480>",
94
+ "_get_samples": "<function ReplayBuffer._get_samples at 0x7fd5331ca520>",
95
+ "__abstractmethods__": "frozenset()",
96
+ "_abc_impl": "<_abc._abc_data object at 0x7fd5331c7140>"
97
+ },
98
+ "replay_buffer_kwargs": {},
99
+ "train_freq": {
100
+ ":type:": "<class 'stable_baselines3.common.type_aliases.TrainFreq'>",
101
+ ":serialized:": "gAWVeAAAAAAAAACMJXN0YWJsZV9iYXNlbGluZXMzLmNvbW1vbi50eXBlX2FsaWFzZXOUjAlUcmFpbkZyZXGUk5RLBIwIYnVpbHRpbnOUjAdnZXRhdHRylJOUaACMElRyYWluRnJlcXVlbmN5VW5pdJSTlIwEU1RFUJSGlFKUhpSBlC4="
102
+ },
103
+ "use_sde_at_warmup": false,
104
+ "exploration_initial_eps": 1.0,
105
+ "exploration_final_eps": 0.05,
106
+ "exploration_fraction": 0.1,
107
+ "target_update_interval": 625,
108
+ "_n_calls": 62500,
109
+ "max_grad_norm": 10,
110
+ "exploration_rate": 0.05,
111
+ "lr_schedule": {
112
+ ":type:": "<class 'function'>",
113
+ ":serialized:": "gAWV4QIAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLAUsTQwiVAZcAiQFTAJROhZQpjAFflIWUjF4vaG9tZS9hYmJ5L2FuYWNvbmRhMy9lbnZzL2NvbGFiL2xpYi9weXRob24zLjExL3NpdGUtcGFja2FnZXMvc3RhYmxlX2Jhc2VsaW5lczMvY29tbW9uL3V0aWxzLnB5lIwEZnVuY5SMGWNvbnN0YW50X2ZuLjxsb2NhbHM+LmZ1bmOUS4RDCPiAANgPEogKlEMAlIwDdmFslIWUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMXi9ob21lL2FiYnkvYW5hY29uZGEzL2VudnMvY29sYWIvbGliL3B5dGhvbjMuMTEvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUdU5OaACMEF9tYWtlX2VtcHR5X2NlbGyUk5QpUpSFlHSUUpRoAIwSX2Z1bmN0aW9uX3NldHN0YXRllJOUaCF9lH2UKGgYaA2MDF9fcXVhbG5hbWVfX5RoDowPX19hbm5vdGF0aW9uc19flH2UjA5fX2t3ZGVmYXVsdHNfX5ROjAxfX2RlZmF1bHRzX1+UTowKX19tb2R1bGVfX5RoGYwHX19kb2NfX5ROjAtfX2Nsb3N1cmVfX5RoAIwKX21ha2VfY2VsbJSTlEc/Gjbi6xxDLYWUUpSFlIwXX2Nsb3VkcGlja2xlX3N1Ym1vZHVsZXOUXZSMC19fZ2xvYmFsc19flH2UdYaUhlIwLg=="
114
+ },
115
+ "batch_norm_stats": [],
116
+ "batch_norm_stats_target": [],
117
+ "exploration_schedule": {
118
+ ":type:": "<class 'function'>",
119
+ ":serialized:": "gAWVwAMAAAAAAACMF2Nsb3VkcGlja2xlLmNsb3VkcGlja2xllIwOX21ha2VfZnVuY3Rpb26Uk5QoaACMDV9idWlsdGluX3R5cGWUk5SMCENvZGVUeXBllIWUUpQoSwFLAEsASwFLBEsTQzyVA5cAZAF8AHoKAACJAmsEAAAAAHICiQFTAIkDZAF8AHoKAACJAYkDegoAAHoFAACJAnoLAAB6AAAAUwCUTksBhpQpjBJwcm9ncmVzc19yZW1haW5pbmeUhZSMXi9ob21lL2FiYnkvYW5hY29uZGEzL2VudnMvY29sYWIvbGliL3B5dGhvbjMuMTEvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUjARmdW5jlIwbZ2V0X2xpbmVhcl9mbi48bG9jYWxzPi5mdW5jlEtyQzv4gADYDA3QECLRDCKgbNILMvAAAwlTAdgTFohK4BMYmEHQIDLRHDKwc7hVsXvRG0PAbNEbUtETUtAMUpRDAJSMA2VuZJSMDGVuZF9mcmFjdGlvbpSMBXN0YXJ0lIeUKXSUUpR9lCiMC19fcGFja2FnZV9flIwYc3RhYmxlX2Jhc2VsaW5lczMuY29tbW9ulIwIX19uYW1lX1+UjB5zdGFibGVfYmFzZWxpbmVzMy5jb21tb24udXRpbHOUjAhfX2ZpbGVfX5SMXi9ob21lL2FiYnkvYW5hY29uZGEzL2VudnMvY29sYWIvbGliL3B5dGhvbjMuMTEvc2l0ZS1wYWNrYWdlcy9zdGFibGVfYmFzZWxpbmVzMy9jb21tb24vdXRpbHMucHmUdU5OaACMEF9tYWtlX2VtcHR5X2NlbGyUk5QpUpRoHylSlGgfKVKUh5R0lFKUaACMEl9mdW5jdGlvbl9zZXRzdGF0ZZSTlGglfZR9lChoGmgNjAxfX3F1YWxuYW1lX1+UaA6MD19fYW5ub3RhdGlvbnNfX5R9lChoCowIYnVpbHRpbnOUjAVmbG9hdJSTlIwGcmV0dXJulGgvdYwOX19rd2RlZmF1bHRzX1+UTowMX19kZWZhdWx0c19flE6MCl9fbW9kdWxlX1+UaBuMB19fZG9jX1+UTowLX19jbG9zdXJlX1+UaACMCl9tYWtlX2NlbGyUk5RHP6mZmZmZmZqFlFKUaDdHP7mZmZmZmZqFlFKUaDdHP/AAAAAAAACFlFKUh5SMF19jbG91ZHBpY2tsZV9zdWJtb2R1bGVzlF2UjAtfX2dsb2JhbHNfX5R9lHWGlIZSMC4="
120
+ }
121
+ }
dqn-LunarLander-v1/policy.optimizer.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e01224413da9a8766d030e877361131c644bc5bd76e7e398e57ea9fabfea00e1
3
+ size 45344
dqn-LunarLander-v1/policy.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:46e921fd33a9cd98a37cdc80814c7eb9d9807878d2f53e850bd6179eb44e6d87
3
+ size 44466
dqn-LunarLander-v1/pytorch_variables.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0c35cea3b2e60fb5e7e162d3592df775cd400e575a31c72f359fb9e654ab00c5
3
+ size 864
dqn-LunarLander-v1/system_info.txt ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ - OS: Linux-5.15.133.1-microsoft-standard-WSL2-x86_64-with-glibc2.35 # 1 SMP Thu Oct 5 21:02:42 UTC 2023
2
+ - Python: 3.11.0
3
+ - Stable-Baselines3: 2.0.0a5
4
+ - PyTorch: 2.1.2+cu121
5
+ - GPU Enabled: True
6
+ - Numpy: 1.26.3
7
+ - Cloudpickle: 3.0.0
8
+ - Gymnasium: 0.28.1
results.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"mean_reward": -116.97339803432669, "std_reward": 89.44823287178626, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2024-01-29T17:11:17.538647"}