bitcloud2 committed on
Commit
aa0bec0
1 Parent(s): cc077aa

Upload . with huggingface_hub

Browse files
Files changed (5) hide show
  1. README.md +5 -6
  2. hyperparameters.json +1 -1
  3. model.pt +1 -1
  4. replay.mp4 +0 -0
  5. results.json +1 -1
README.md CHANGED
@@ -8,17 +8,16 @@ tags:
8
  model-index:
9
  - name: Reinforce-pixelcopter
10
  results:
11
- - task:
 
 
 
 
12
  type: reinforcement-learning
13
  name: reinforcement-learning
14
  dataset:
15
  name: Pixelcopter-PLE-v0
16
  type: Pixelcopter-PLE-v0
17
- metrics:
18
- - type: mean_reward
19
- value: 12.30 +/- 12.51
20
- name: mean_reward
21
- verified: false
22
  ---
23
 
24
  # **Reinforce** Agent playing **Pixelcopter-PLE-v0**
 
8
  model-index:
9
  - name: Reinforce-pixelcopter
10
  results:
11
+ - metrics:
12
+ - type: mean_reward
13
+ value: 5.80 +/- 4.31
14
+ name: mean_reward
15
+ task:
16
  type: reinforcement-learning
17
  name: reinforcement-learning
18
  dataset:
19
  name: Pixelcopter-PLE-v0
20
  type: Pixelcopter-PLE-v0
 
 
 
 
 
21
  ---
22
 
23
  # **Reinforce** Agent playing **Pixelcopter-PLE-v0**
hyperparameters.json CHANGED
@@ -1 +1 @@
1
- {"h_size": 64, "n_training_episodes": 5000, "n_evaluation_episodes": 10, "max_t": 10000, "gamma": 0.99, "lr": 0.0001, "env_id": "Pixelcopter-PLE-v0", "state_space": 7, "action_space": 2}
 
1
+ {"h_size": 64, "n_training_episodes": 1000, "n_evaluation_episodes": 10, "max_t": 10000, "gamma": 0.99, "lr": 0.0001, "env_id": "Pixelcopter-PLE-v0", "state_space": 7, "action_space": 2}
model.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fa8c8491f4584c81373272824bdfbd9c9a073e4e0e8aab8c79530f3303b5c689
3
  size 38983
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:46454ffc528cfb8a89a29d7a7c7682e2c15489266f5f6ed8864c0ff0a1764889
3
  size 38983
replay.mp4 CHANGED
Binary files a/replay.mp4 and b/replay.mp4 differ
 
results.json CHANGED
@@ -1 +1 @@
1
- {"env_id": "Pixelcopter-PLE-v0", "mean_reward": 12.3, "n_evaluation_episodes": 10, "eval_datetime": "2023-01-06T09:15:26.812060"}
 
1
+ {"env_id": "Pixelcopter-PLE-v0", "mean_reward": 5.8, "n_evaluation_episodes": 10, "eval_datetime": "2023-01-06T19:34:59.610045"}