pm390 committed on
Commit
a49b144
1 Parent(s): 9e51070

Push Reinforce agent to the Hub

Browse files
README.md CHANGED
@@ -17,7 +17,7 @@ model-index:
17
  type: LunarLander-v2
18
  metrics:
19
  - type: mean_reward
20
- value: -140.79 +/- 78.99
21
  name: mean_reward
22
  verified: false
23
  ---
@@ -38,25 +38,25 @@ model-index:
38
  'wandb_entity': None
39
  'capture_video': False
40
  'env_id': 'LunarLander-v2'
41
- 'total_timesteps': 50000
42
- 'learning_rate': 0.00025
43
- 'num_envs': 4
44
- 'num_steps': 128
45
  'anneal_lr': True
46
  'gae': True
47
  'gamma': 0.99
48
  'gae_lambda': 0.95
49
- 'num_minibatches': 4
50
- 'update_epochs': 4
51
  'norm_adv': True
52
- 'clip_coef': 0.2
53
  'clip_vloss': True
54
- 'ent_coef': 0.01
55
- 'vf_coef': 0.5
56
- 'max_grad_norm': 0.5
57
  'target_kl': None
58
  'repo_id': 'pm390/LunarLander-v2'
59
- 'batch_size': 512
60
- 'minibatch_size': 128}
61
  ```
62
 
 
17
  type: LunarLander-v2
18
  metrics:
19
  - type: mean_reward
20
+ value: -162.88 +/- 78.93
21
  name: mean_reward
22
  verified: false
23
  ---
 
38
  'wandb_entity': None
39
  'capture_video': False
40
  'env_id': 'LunarLander-v2'
41
+ 'total_timesteps': 1000000
42
+ 'learning_rate': 0.000125
43
+ 'num_envs': 16
44
+ 'num_steps': 256
45
  'anneal_lr': True
46
  'gae': True
47
  'gamma': 0.99
48
  'gae_lambda': 0.95
49
+ 'num_minibatches': 8
50
+ 'update_epochs': 8
51
  'norm_adv': True
52
+ 'clip_coef': 0.4
53
  'clip_vloss': True
54
+ 'ent_coef': 0.03
55
+ 'vf_coef': 0.6
56
+ 'max_grad_norm': 0.4
57
  'target_kl': None
58
  'repo_id': 'pm390/LunarLander-v2'
59
+ 'batch_size': 4096
60
+ 'minibatch_size': 512}
61
  ```
62
 
logs/events.out.tfevents.1662324684.624f3f3c0672.728.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0937251530d8068e200b4a93dab94b59dd750577916f2fc6fced8147c29f6af6
3
+ size 125018
model.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f40e04bf2b6121fa3344974ae4fe959f9f08a5d324c3f75a801c9ad9df763af4
3
  size 42689
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:06deccbb7adc999536f3496e49815e9b1fad596f4988072376b1b7a751894178
3
  size 42689
replay.mp4 CHANGED
Binary files a/replay.mp4 and b/replay.mp4 differ
 
results.json CHANGED
@@ -1 +1 @@
1
- {"env_id": "LunarLander-v2", "mean_reward": -140.78854956623383, "std_reward": 78.9862128665021, "n_evaluation_episodes": 10, "eval_datetime": "2022-09-04T20:48:23.275011"}
 
1
+ {"env_id": "LunarLander-v2", "mean_reward": -162.88328449226753, "std_reward": 78.92687312975224, "n_evaluation_episodes": 10, "eval_datetime": "2022-09-04T20:52:40.675612"}