custom Q-learning for 4x4 slippery
Browse files- README.md +1 -1
- q-learning.pkl +1 -1
- replay.mp4 +2 -2
- results.json +1 -1
README.md
CHANGED
@@ -9,7 +9,7 @@ model-index:
|
|
9 |
results:
|
10 |
- metrics:
|
11 |
- type: mean_reward
|
12 |
-
value: 0.
|
13 |
name: mean_reward
|
14 |
task:
|
15 |
type: reinforcement-learning
|
|
|
9 |
results:
|
10 |
- metrics:
|
11 |
- type: mean_reward
|
12 |
+
value: 0.80 +/- 0.40
|
13 |
name: mean_reward
|
14 |
task:
|
15 |
type: reinforcement-learning
|
q-learning.pkl
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 921
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c7fe564cb148e8914a739db0b806e1795d932a449ea1f7ee0c842badd0758777
|
3 |
size 921
|
replay.mp4
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d7ddba8e8e3d86fd271aaeeb804ed314d2dee03d5c8d3c5e562b729cc76e3b1f
|
3 |
+
size 34555
|
results.json
CHANGED
@@ -1 +1 @@
|
|
1 |
-
{"env_id": "FrozenLake-v1", "mean_reward": 0.
|
|
|
1 |
+
{"env_id": "FrozenLake-v1", "mean_reward": 0.8041237113402062, "n_eval_episodes": 100, "eval_datetime": "2022-05-21T15:06:44.507392"}
|