jfelgate committed on
Commit
8248e10
1 Parent(s): 722a645

Push agent to the Hub

Browse files
README.md CHANGED
@@ -17,7 +17,7 @@ model-index:
17
  type: LunarLander-v2
18
  metrics:
19
  - type: mean_reward
20
- value: -176.62 +/- 95.81
21
  name: mean_reward
22
  verified: false
23
  ---
@@ -40,7 +40,7 @@ model-index:
40
  'total_timesteps': 50000
41
  'learning_rate': 0.00025
42
  'num_envs': 4
43
- 'num_steps': 1024
44
  'anneal_lr': True
45
  'gae': True
46
  'gamma': 0.9
@@ -55,7 +55,7 @@ model-index:
55
  'max_grad_norm': 0.5
56
  'target_kl': None
57
  'repo_id': 'jfelgate/ppo-LunarLander-v2'
58
- 'batch_size': 4096
59
- 'minibatch_size': 1024}
60
  ```
61
 
 
17
  type: LunarLander-v2
18
  metrics:
19
  - type: mean_reward
20
+ value: -128.94 +/- 87.14
21
  name: mean_reward
22
  verified: false
23
  ---
 
40
  'total_timesteps': 50000
41
  'learning_rate': 0.00025
42
  'num_envs': 4
43
+ 'num_steps': 128
44
  'anneal_lr': True
45
  'gae': True
46
  'gamma': 0.9
 
55
  'max_grad_norm': 0.5
56
  'target_kl': None
57
  'repo_id': 'jfelgate/ppo-LunarLander-v2'
58
+ 'batch_size': 512
59
+ 'minibatch_size': 128}
60
  ```
61
 
logs/events.out.tfevents.1698072626.527fe3665085.25230.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:162f37fec7429b6672114a7f0edee04e50615bcff19eed6006c79f7fb1a6950a
3
+ size 85465
model.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e877e327c37e38355e589831a8bf9a9137c34b031f902e346ce8080cf2c11701
3
  size 43026
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8fa2f6fac6eb7b6411a0149a887c9f7ab56ee6f49340bc59ff494f622b2003c1
3
  size 43026
replay.mp4 CHANGED
Binary files a/replay.mp4 and b/replay.mp4 differ
 
results.json CHANGED
@@ -1 +1 @@
1
- {"env_id": "LunarLander-v2", "mean_reward": -176.61866016938296, "std_reward": 95.81393100407745, "n_evaluation_episodes": 10, "eval_datetime": "2023-10-23T14:47:51.086564"}
 
1
+ {"env_id": "LunarLander-v2", "mean_reward": -128.9358893690048, "std_reward": 87.13581962908091, "n_evaluation_episodes": 10, "eval_datetime": "2023-10-23T14:51:32.531005"}