coledie committed on
Commit
ed2fca8
1 Parent(s): 691e492

Initial commit

Browse files
README.md CHANGED
@@ -10,7 +10,7 @@ model-index:
10
  results:
11
  - metrics:
12
  - type: mean_reward
13
- value: 15.50 +/- 12.54
14
  name: mean_reward
15
  task:
16
  type: reinforcement-learning
 
10
  results:
11
  - metrics:
12
  - type: mean_reward
13
+ value: 354.50 +/- 137.76
14
  name: mean_reward
15
  task:
16
  type: reinforcement-learning
args.yml CHANGED
@@ -30,7 +30,7 @@
30
  - - n_startup_trials
31
  - 10
32
  - - n_timesteps
33
- - 100000
34
  - - n_trials
35
  - 500
36
  - - no_optim_plots
@@ -50,7 +50,7 @@
50
  - - save_replay_buffer
51
  - false
52
  - - seed
53
- - 3981732003
54
  - - storage
55
  - null
56
  - - study_name
 
30
  - - n_startup_trials
31
  - 10
32
  - - n_timesteps
33
+ - 500000
34
  - - n_trials
35
  - 500
36
  - - no_optim_plots
 
50
  - - save_replay_buffer
51
  - false
52
  - - seed
53
+ - 1448633258
54
  - - storage
55
  - null
56
  - - study_name
dqn-SpaceInvadersNoFrameskip-v4.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b3077ead92a0ad7126ca9816049c3eef3521aa3e3922c71d82f324d3064f2cde
3
- size 13719479
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e2b41b27146ec12a07b35788c850c6832cc421b9bbb09fa6d787f91365daacbd
3
+ size 27221817
dqn-SpaceInvadersNoFrameskip-v4/data CHANGED
The diff for this file is too large to render. See raw diff
 
dqn-SpaceInvadersNoFrameskip-v4/policy.optimizer.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d2cbea93aa998a3114d7b0e19fbd3e65edc311a58b95199b7b2a09052fe1b3ed
3
- size 623
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:440c5fe0de6c39edece98778b434b01616b08aaaaf60bc90753c0e5affcc5feb
3
+ size 13502953
dqn-SpaceInvadersNoFrameskip-v4/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d0a8dfc23372da75867b6e2c4642bbaff878106fa0ceaebeccb1057fddc20603
3
  size 13504745
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:68a92a279ee96a0444c31c16c4fe3194a2e31aa722bc51733cefd7f9e5f921dd
3
  size 13504745
replay.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7d4afaddf633990f3d270cf9e169f40ac375b39e821b996f71f99ba9161b17f7
3
- size 273553
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e96f4f4c7ecaed8d52a7b6fa8e9b2320d25c1dfc87ea79e5a5e5096c87c84c28
3
+ size 258171
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 15.5, "std_reward": 12.539936203984453, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2022-07-04T00:46:36.314974"}
 
1
+ {"mean_reward": 354.5, "std_reward": 137.75793988006643, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2022-07-04T04:44:54.644401"}
train_eval_metrics.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:765aafd973659b94beeeffe7f0d772e615e0a885604a0dbe8a8a03b68b40d645
3
- size 5695
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8daf1e0a336fc11bbc0f99b60fc1354d61f73f1b40b2d35f568541ec0e79a0a8
3
+ size 22066