alfredo-wh committed on
Commit
e66e7a0
1 Parent(s): be81626

batchsize 64

Browse files
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: ALE/MsPacman-v5
17
  metrics:
18
  - type: mean_reward
19
- value: 1048.00 +/- 238.91
20
  name: mean_reward
21
  verified: false
22
  ---
@@ -62,7 +62,7 @@ python -m rl_zoo3.push_to_hub --algo dqn --env ALE/MsPacman-v5 -f logs/ -orga al
62
 
63
  ## Hyperparameters
64
  ```python
65
- OrderedDict([('batch_size', 32),
66
  ('buffer_size', 100000),
67
  ('env_wrapper',
68
  ['stable_baselines3.common.atari_wrappers.AtariWrapper']),
 
16
  type: ALE/MsPacman-v5
17
  metrics:
18
  - type: mean_reward
19
+ value: 1353.00 +/- 433.57
20
  name: mean_reward
21
  verified: false
22
  ---
 
62
 
63
  ## Hyperparameters
64
  ```python
65
+ OrderedDict([('batch_size', 64),
66
  ('buffer_size', 100000),
67
  ('env_wrapper',
68
  ['stable_baselines3.common.atari_wrappers.AtariWrapper']),
args.yml CHANGED
@@ -54,7 +54,7 @@
54
  - - save_replay_buffer
55
  - false
56
  - - seed
57
- - 3060910362
58
  - - storage
59
  - null
60
  - - study_name
 
54
  - - save_replay_buffer
55
  - false
56
  - - seed
57
+ - 1567762788
58
  - - storage
59
  - null
60
  - - study_name
config.yml CHANGED
@@ -1,6 +1,6 @@
1
  !!python/object/apply:collections.OrderedDict
2
  - - - batch_size
3
- - 32
4
  - - buffer_size
5
  - 100000
6
  - - env_wrapper
 
1
  !!python/object/apply:collections.OrderedDict
2
  - - - batch_size
3
+ - 64
4
  - - buffer_size
5
  - 100000
6
  - - env_wrapper
dqn-ALE-MsPacman-v5.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:85065e769c818d95e4620d6c98cb7483ca5e4f301d7683b453a3bfaeffbbb487
3
  size 27244716
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ff0a5ecc6b528ad07236e2e879e54d44d295a70ad3d432da56adf99ee1005137
3
  size 27244716
dqn-ALE-MsPacman-v5/data CHANGED
The diff for this file is too large to render. See raw diff
 
dqn-ALE-MsPacman-v5/policy.optimizer.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fac7617570166f4564e66fae9c33df5394015693296db9221cffa5bea16ec692
3
  size 13518524
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2b50f9f096f41b822ed8ff5670f2ee108616cce531ce0173a5074a2e782a4dff
3
  size 13518524
dqn-ALE-MsPacman-v5/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ae253f22325203bbe20d30e4a3dc034b84d2924593035f7c98fe0461e2bb2a2f
3
  size 13517658
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0d767e1379865beef1cbc366382ee591453ca7407e21ef599db7dc7c2a1f481a
3
  size 13517658
replay.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d2edae8b0873b6851eafad54ffd5678422a3269aedbaf8167372baf5b916f0dd
3
- size 310585
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f9f6bef9c006012286411ffa6d5439e359c70e52289ed4b749274ffa2c473e9f
3
+ size 311075
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 1048.0, "std_reward": 238.90583919192935, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2023-12-02T17:31:36.379761"}
 
1
+ {"mean_reward": 1353.0, "std_reward": 433.56775710377724, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2023-12-03T10:47:59.093910"}
train_eval_metrics.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b4d8688db48b9e09d794fd636ddbb44e58bc24c3681407633bc7b3a4dd118fbe
3
- size 78219
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:863197350b47d43ebbe0389b2c28ab2fcc26fda2a4f4af5ac84ad5345e19c480
3
+ size 76647