skyfox committed on
Commit
50a421b
1 Parent(s): 9f1badb

Initial commit

Browse files
README.md CHANGED
@@ -10,7 +10,7 @@ model-index:
10
  results:
11
  - metrics:
12
  - type: mean_reward
13
- value: 203.50 +/- 113.65
14
  name: mean_reward
15
  task:
16
  type: reinforcement-learning
@@ -60,7 +60,7 @@ OrderedDict([('batch_size', 32),
60
  ('gradient_steps', 1),
61
  ('learning_rate', 0.0001),
62
  ('learning_starts', 100000),
63
- ('n_timesteps', 500000),
64
  ('optimize_memory_usage', True),
65
  ('policy', 'CnnPolicy'),
66
  ('target_update_interval', 1000),
 
10
  results:
11
  - metrics:
12
  - type: mean_reward
13
+ value: 767.00 +/- 378.16
14
  name: mean_reward
15
  task:
16
  type: reinforcement-learning
 
60
  ('gradient_steps', 1),
61
  ('learning_rate', 0.0001),
62
  ('learning_starts', 100000),
63
+ ('n_timesteps', 1000000),
64
  ('optimize_memory_usage', True),
65
  ('policy', 'CnnPolicy'),
66
  ('target_update_interval', 1000),
args.yml CHANGED
@@ -50,7 +50,7 @@
50
  - - save_replay_buffer
51
  - false
52
  - - seed
53
- - 3604725529
54
  - - storage
55
  - null
56
  - - study_name
 
50
  - - save_replay_buffer
51
  - false
52
  - - seed
53
+ - 4178693783
54
  - - storage
55
  - null
56
  - - study_name
config.yml CHANGED
@@ -18,7 +18,7 @@
18
  - - learning_starts
19
  - 100000
20
  - - n_timesteps
21
- - 500000
22
  - - optimize_memory_usage
23
  - true
24
  - - policy
 
18
  - - learning_starts
19
  - 100000
20
  - - n_timesteps
21
+ - 1000000
22
  - - optimize_memory_usage
23
  - true
24
  - - policy
dqn-SpaceInvadersNoFrameskip-v4.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5b2397690310d207fb30dda13cfc2809ce479bbd1ffe270196ffb7f13082a7f9
3
- size 27222200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:92bfe95a656fa17231fbe746298384f8a109d503c34bafdd92c81993c484610a
3
+ size 27222203
dqn-SpaceInvadersNoFrameskip-v4/data CHANGED
The diff for this file is too large to render. See raw diff
 
dqn-SpaceInvadersNoFrameskip-v4/policy.optimizer.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:70a7ca177fd0c711d433cec9ac55b477a69f498e67b4b157c0de9313eec968e2
3
  size 13503145
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dea24d48a2e93b9193103f4bb643551ebe420316acb85d8d66ce2bf18d8748d4
3
  size 13503145
dqn-SpaceInvadersNoFrameskip-v4/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5f4d22dc40f89d10ea117dca01b578d9afbdf33b6f28781d9ce8abe24a3b2961
3
  size 13504937
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e0e76ca8d33241d6b18fa9633c805bb0f6f65363c8457a69810267b6c6fd5848
3
  size 13504937
replay.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0f42dd010c7dca9c0defa50ee069de377da0009ef1823bef73ba0cc7619240b5
3
- size 254482
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3a614ce5516aae56dfaf35f1ca2f0979a0ff4d0f97a76dc45972f4230fd902c4
3
+ size 203554
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 203.5, "std_reward": 113.64528146825982, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2022-06-08T17:15:42.183247"}
 
1
+ {"mean_reward": 767.0, "std_reward": 378.16134122884637, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2022-06-08T18:47:09.904974"}
train_eval_metrics.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3c30430c79f6bc237c06e892b39f87b3774c5f9d0c6ae2300285fd23858207e6
3
- size 22261
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:010afc39c7835257ef07ca3e1d95afd15a98faaee8b29d8d55218cbc394770d4
3
+ size 37864