colinrgodsey committed on
Commit
a717324
1 Parent(s): 32da6cf

Push agent to the Hub

Browse files
Files changed (39) hide show
  1. README.md +11 -15
  2. logs/events.out.tfevents.1719353183.tf-notebook-0.332.0 +3 -0
  3. logs/events.out.tfevents.1719353271.tf-notebook-0.332.1 +3 -0
  4. logs/events.out.tfevents.1719353349.tf-notebook-0.332.2 +3 -0
  5. logs/events.out.tfevents.1719353384.tf-notebook-0.332.3 +3 -0
  6. logs/events.out.tfevents.1719353471.tf-notebook-0.332.4 +3 -0
  7. logs/events.out.tfevents.1719353496.tf-notebook-0.332.5 +3 -0
  8. logs/events.out.tfevents.1719353590.tf-notebook-0.332.6 +3 -0
  9. logs/events.out.tfevents.1719353644.tf-notebook-0.332.7 +3 -0
  10. logs/events.out.tfevents.1719353844.tf-notebook-0.332.8 +3 -0
  11. logs/events.out.tfevents.1719353870.tf-notebook-0.332.9 +3 -0
  12. logs/events.out.tfevents.1719353882.tf-notebook-0.332.10 +3 -0
  13. logs/events.out.tfevents.1719354284.tf-notebook-0.332.11 +3 -0
  14. logs/events.out.tfevents.1719354389.tf-notebook-0.332.12 +3 -0
  15. logs/events.out.tfevents.1719354425.tf-notebook-0.332.13 +3 -0
  16. logs/events.out.tfevents.1719354454.tf-notebook-0.332.14 +3 -0
  17. logs/events.out.tfevents.1719354640.tf-notebook-0.332.15 +3 -0
  18. logs/events.out.tfevents.1719354757.tf-notebook-0.332.16 +3 -0
  19. logs/events.out.tfevents.1719354768.tf-notebook-0.332.17 +3 -0
  20. logs/events.out.tfevents.1719354800.tf-notebook-0.332.18 +3 -0
  21. logs/events.out.tfevents.1719356369.tf-notebook-0.332.19 +3 -0
  22. logs/events.out.tfevents.1719356432.tf-notebook-0.332.20 +3 -0
  23. logs/events.out.tfevents.1719356487.tf-notebook-0.332.21 +3 -0
  24. logs/events.out.tfevents.1719356673.tf-notebook-0.332.22 +3 -0
  25. logs/events.out.tfevents.1719356688.tf-notebook-0.332.23 +3 -0
  26. logs/events.out.tfevents.1719356760.tf-notebook-0.332.24 +3 -0
  27. logs/events.out.tfevents.1719356787.tf-notebook-0.332.25 +3 -0
  28. logs/events.out.tfevents.1719356872.tf-notebook-0.332.26 +3 -0
  29. logs/events.out.tfevents.1719356874.tf-notebook-0.332.27 +3 -0
  30. logs/events.out.tfevents.1719356910.tf-notebook-0.332.28 +3 -0
  31. logs/events.out.tfevents.1719356975.tf-notebook-0.332.29 +3 -0
  32. logs/events.out.tfevents.1719357059.tf-notebook-0.332.30 +3 -0
  33. logs/events.out.tfevents.1719357230.tf-notebook-0.652.0 +3 -0
  34. logs/events.out.tfevents.1719357453.tf-notebook-0.652.1 +3 -0
  35. logs/events.out.tfevents.1719357465.tf-notebook-0.652.2 +3 -0
  36. logs/events.out.tfevents.1719357588.tf-notebook-0.652.3 +3 -0
  37. model.pt +3 -0
  38. replay.mp4 +0 -0
  39. results.json +1 -1
README.md CHANGED
@@ -1,10 +1,11 @@
1
  ---
2
- library_name: stable-baselines3
3
  tags:
4
  - LunarLander-v2
 
5
  - deep-reinforcement-learning
6
  - reinforcement-learning
7
- - stable-baselines3
 
8
  model-index:
9
  - name: PPO
10
  results:
@@ -16,22 +17,17 @@ model-index:
16
  type: LunarLander-v2
17
  metrics:
18
  - type: mean_reward
19
- value: 222.32 +/- 18.92
20
  name: mean_reward
21
  verified: false
22
  ---
23
 
24
- # **PPO** Agent playing **LunarLander-v2**
25
- This is a trained model of a **PPO** agent playing **LunarLander-v2**
26
- using the [stable-baselines3 library](https://github.com/DLR-RM/stable-baselines3).
27
 
28
- ## Usage (with Stable-baselines3)
29
- TODO: Add your code
30
 
31
-
32
- ```python
33
- from stable_baselines3 import ...
34
- from huggingface_sb3 import load_from_hub
35
-
36
- ...
37
- ```
 
1
  ---
 
2
  tags:
3
  - LunarLander-v2
4
+ - ppo
5
  - deep-reinforcement-learning
6
  - reinforcement-learning
7
+ - custom-implementation
8
+ - deep-rl-course
9
  model-index:
10
  - name: PPO
11
  results:
 
17
  type: LunarLander-v2
18
  metrics:
19
  - type: mean_reward
20
+ value: -170.08 +/- 80.20
21
  name: mean_reward
22
  verified: false
23
  ---
24
 
25
+ # PPO Agent Playing LunarLander-v2
 
 
26
 
27
+ This is a trained model of a PPO agent playing LunarLander-v2.
 
28
 
29
+ # Hyperparameters
30
+ ```python
31
+ {'env_id': 'LunarLander-v2'}
32
+ ```
33
+
 
 
logs/events.out.tfevents.1719353183.tf-notebook-0.332.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f2f390b2e73d8a0ca654762cab960d923e14b978a7d85261abe41f34467e3ace
3
+ size 88
logs/events.out.tfevents.1719353271.tf-notebook-0.332.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bed1e0be175a7b2a739343b2cad5ff1d966f156314d65d0a289f611105a06a5d
3
+ size 88
logs/events.out.tfevents.1719353349.tf-notebook-0.332.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d3dde747d208b609eda700497c79bc5346060da9d26a962aa3c842a4777552da
3
+ size 1100
logs/events.out.tfevents.1719353384.tf-notebook-0.332.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8a2af277db06767d4da304235d95376814b473fad4e359f44baa1090c6b85ecb
3
+ size 1100
logs/events.out.tfevents.1719353471.tf-notebook-0.332.4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3d6638b99bb824179b03b472381808c1a90cdcd0f859547a15feea6c76e2032e
3
+ size 1100
logs/events.out.tfevents.1719353496.tf-notebook-0.332.5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bc583af126ce03e6abecb30364cc97457ff8f5f5ac8b5598d609bc00295e8e16
3
+ size 1100
logs/events.out.tfevents.1719353590.tf-notebook-0.332.6 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1f7061b1b4427c51df4497e73060d37349f0fc8d12301e2c94e1fd00836cb34e
3
+ size 1100
logs/events.out.tfevents.1719353644.tf-notebook-0.332.7 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:96c15dc25a09cced1851a9f181430927a63e390c98b168367dbf2405cade3c9b
3
+ size 1100
logs/events.out.tfevents.1719353844.tf-notebook-0.332.8 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b641ed94d069fa5866dcc11662bb9620c8d5aa04783efeb4cde35bd7507d261a
3
+ size 1100
logs/events.out.tfevents.1719353870.tf-notebook-0.332.9 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a928aea0a2ee5b6a0655d98b984a922e1d7d927e3ac9f230c783d12ed15b27bc
3
+ size 1100
logs/events.out.tfevents.1719353882.tf-notebook-0.332.10 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ba82ba81ff260ec5f1606ff14907582afba864ea681169cbcdcdaa2fba5fe6d9
3
+ size 1100
logs/events.out.tfevents.1719354284.tf-notebook-0.332.11 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4a8b931ce823992afbe81a974e2a6402503d8f438808eb1096cbe4440128be0c
3
+ size 1100
logs/events.out.tfevents.1719354389.tf-notebook-0.332.12 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c73995f785b18c0088b065b4977785108226ccdc0d82ae4f8c07c85e2ffe1f2a
3
+ size 1100
logs/events.out.tfevents.1719354425.tf-notebook-0.332.13 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4112932f744acb2d6f54695eba35019626f0a37920686d97f31f1697a3a56cce
3
+ size 1100
logs/events.out.tfevents.1719354454.tf-notebook-0.332.14 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:525c951103ca8698b5257d98d379c54e9e2e4eace01c7d6ad57adb90b2acb3f7
3
+ size 12385
logs/events.out.tfevents.1719354640.tf-notebook-0.332.15 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:977e346aaec56acee618a3f5b9801bf33298383847fb64bd99b2f1ff10bf45b6
3
+ size 31494
logs/events.out.tfevents.1719354757.tf-notebook-0.332.16 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8f9b5bf788405c28609f19db2f7368d9206c8c48a195d2bf3694ebe34cde108c
3
+ size 6259
logs/events.out.tfevents.1719354768.tf-notebook-0.332.17 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6accdedb51a4d2ba98f27c2e5e575a57ec0411d98d09ecf6611d13e6f153b67a
3
+ size 31494
logs/events.out.tfevents.1719354800.tf-notebook-0.332.18 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ea8b7d39c743d4a49a503219e1feaab5dbadd624543f06353fdfdcf008a39911
3
+ size 317424
logs/events.out.tfevents.1719356369.tf-notebook-0.332.19 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:221b493b3fffdfd7c4210b1227f94c06dccd3e23182692de103fd8cd50548dea
3
+ size 88
logs/events.out.tfevents.1719356432.tf-notebook-0.332.20 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:643aca1373738746e3f3d7e682c49f510ffbc195e9b0a82a5c621924f3acecc8
3
+ size 88
logs/events.out.tfevents.1719356487.tf-notebook-0.332.21 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:877c0fd664a761c323a250831d986944f8c6e0f7489fc869d869f70fa5e826cc
3
+ size 88
logs/events.out.tfevents.1719356673.tf-notebook-0.332.22 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cae99f838b2cce01876799a17670a941241b1d514353bb9bcafea12cc030e677
3
+ size 88
logs/events.out.tfevents.1719356688.tf-notebook-0.332.23 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:074aebbe049397370267e883db49c67695649a4d4fa44e48da858be46c79f65d
3
+ size 88
logs/events.out.tfevents.1719356760.tf-notebook-0.332.24 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:582c38c22f7900fc020401d75066659ce492bf37500dc0c3b99a4e54336c1168
3
+ size 88
logs/events.out.tfevents.1719356787.tf-notebook-0.332.25 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:30a2f1687390320bdbc925d63341aebc9ec8d7db6370b4ba9a148987a2bfa7df
3
+ size 88
logs/events.out.tfevents.1719356872.tf-notebook-0.332.26 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b3ca66090a1b67a4088df872098980ce168f0163da847a8886140c9cf88e7e25
3
+ size 88
logs/events.out.tfevents.1719356874.tf-notebook-0.332.27 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1b4d51464b9c74134650f2d21001cdead0852f5ea440c57cb20d40f0a789a63e
3
+ size 88
logs/events.out.tfevents.1719356910.tf-notebook-0.332.28 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0a268ab338a72ca49cb24b07352a67f669462021bdaedf4fae4cf0ae0102366a
3
+ size 88
logs/events.out.tfevents.1719356975.tf-notebook-0.332.29 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:243736f4bc752163d2d81f373a12bd02104aac96fc9fc87183d16ee9d668b37f
3
+ size 88
logs/events.out.tfevents.1719357059.tf-notebook-0.332.30 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e0d40e8f2449a210d189575251ac449e5971488b31859a0a12ef7f9b52e09d73
3
+ size 88
logs/events.out.tfevents.1719357230.tf-notebook-0.652.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6ea080b6d5ededdfd41be46569352a2ffe4dd7af01e233e670d4d893cb3a3d32
3
+ size 88
logs/events.out.tfevents.1719357453.tf-notebook-0.652.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:40d5553cd458d76b2e23a1b258e2e778b8efdd75e6d4f20c9ebcc165e5a0bcc4
3
+ size 88
logs/events.out.tfevents.1719357465.tf-notebook-0.652.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bc15f523957beb89e85eb16cfb51f8e83a1fd67fbe1d85ac07af88253fe4acf9
3
+ size 31494
logs/events.out.tfevents.1719357588.tf-notebook-0.652.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ba9703f8b01a74827f18fededf2b52ff0b743ed26f67e0e0dea2f63297d82661
3
+ size 31494
model.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:653ae816697afc17a6a84170a17cdac4a0ef843a569ddd15091ce1bdfa812508
3
+ size 84812
replay.mp4 CHANGED
Binary files a/replay.mp4 and b/replay.mp4 differ
 
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 222.31539170000002, "std_reward": 18.9212491095876, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2024-06-12T16:47:09.504217"}
 
1
+ {"env_id": "LunarLander-v2", "mean_reward": -170.0832651597297, "std_reward": 80.19670027783228, "n_evaluation_episodes": 10, "eval_datetime": "2024-06-25T23:20:36.087787"}