jianzhnie committed on
Commit
1765737
1 Parent(s): f25cd1d

Push Reinforce agent to the Hub

Browse files
Files changed (5) hide show
  1. README.md +1 -1
  2. hyperparameters.json +1 -1
  3. model.pt +2 -2
  4. replay.mp4 +2 -2
  5. results.json +1 -1
README.md CHANGED
@@ -10,7 +10,7 @@ model-index:
10
  results:
11
  - metrics:
12
  - type: mean_reward
13
- value: 69.30 +/- 13.76
14
  name: mean_reward
15
  task:
16
  type: reinforcement-learning
 
10
  results:
11
  - metrics:
12
  - type: mean_reward
13
+ value: 81.61 +/- 7.99
14
  name: mean_reward
15
  task:
16
  type: reinforcement-learning
hyperparameters.json CHANGED
@@ -1 +1 @@
1
- {"h_size": 16, "n_training_episodes": 1000, "n_evaluation_episodes": 10, "max_t": 1000, "gamma": 0.995, "lr": 0.01, "env_id": "CartPole-v1", "state_space": 4, "action_space": 2}
 
1
+ {"h_size": 32, "n_training_episodes": 10000, "n_evaluation_episodes": 100, "max_t": 1000, "gamma": 0.995, "lr": 0.01, "env_id": "CartPole-v1", "state_space": 4, "action_space": 2}
model.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:87939259e6c8e408422c33f87263588e6bf4bf32d2867b88fb130f4a28175b6d
3
- size 2655
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:58477eebf4316d8995d4bb9e612dc12baf16708833315614d35a10c7b9b2a944
3
+ size 3103
replay.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:aeb29e06a9bdf2f323bebb1644ab1b937e4b07b257d3a8a3bfe04b8d8888c8de
3
- size 10202
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:973df1a5d7e82ba4abf794e7392bc3a051f2a801db8e3c0c7d47aabfa8044f00
3
+ size 10151
results.json CHANGED
@@ -1 +1 @@
1
- {"env_id": "CartPole-v1", "mean_reward": 69.3, "std_reward": 13.755362590640786, "n_evaluation_episodes": 10, "eval_datetime": "2022-07-28T21:42:26.866139", "hyperparameters": {"h_size": 16, "n_training_episodes": 1000, "n_evaluation_episodes": 10, "max_t": 1000, "gamma": 0.995, "lr": 0.01, "env_id": "CartPole-v1", "state_space": 4, "action_space": 2}}
 
1
+ {"env_id": "CartPole-v1", "mean_reward": 81.61, "std_reward": 7.991113814731961, "n_evaluation_episodes": 100, "eval_datetime": "2022-07-28T21:59:38.194617", "hyperparameters": {"h_size": 32, "n_training_episodes": 10000, "n_evaluation_episodes": 100, "max_t": 1000, "gamma": 0.995, "lr": 0.01, "env_id": "CartPole-v1", "state_space": 4, "action_space": 2}}