breathing-vasu444 committed on
Commit
8d66194
1 Parent(s): a5c3aca

Upload PPO Lunarlander-v2 trained agent

Browse files
Files changed (4) hide show
  1. README.md +1 -1
  2. ppo_lunarlander.zip +1 -1
  3. replay.mp4 +0 -0
  4. results.json +1 -1
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: LunarLander-v2
17
  metrics:
18
  - type: mean_reward
19
- value: 109.04 +/- 56.86
20
  name: mean_reward
21
  verified: false
22
  ---
 
16
  type: LunarLander-v2
17
  metrics:
18
  - type: mean_reward
19
+ value: 99.25 +/- 77.41
20
  name: mean_reward
21
  verified: false
22
  ---
ppo_lunarlander.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:08694ecc846f1bf4408a0701dfce82d48c711733ac28452cdb0c826d4506ea99
3
  size 147426
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:742cf2fa0f552a7b829fbae99f70c5bb9625bea169471fb01c668f3c8c370c07
3
  size 147426
replay.mp4 CHANGED
Binary files a/replay.mp4 and b/replay.mp4 differ
 
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 109.0440527, "std_reward": 56.86480596253884, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2024-07-16T11:30:18.836830"}
 
1
+ {"mean_reward": 99.24949939999999, "std_reward": 77.41262730307886, "is_deterministic": true, "n_eval_episodes": 10, "eval_datetime": "2024-07-16T11:36:48.663223"}