tweak epsilon, lr
Browse files- q-learning.pkl +2 -2
- replay.mp4 +2 -2
- results.json +1 -1
q-learning.pkl
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:995c2c39a3920869e9e1d9cc9d0a0e4e1393a8b4ad14be686f5fccca96bcee6c
|
3 |
+
size 24589
|
replay.mp4
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0c608ec1904186d780500aee40e286845a5916d0e53573a7a7063b98a3f6e78f
|
3 |
+
size 100879
|
results.json
CHANGED
@@ -1 +1 @@
|
|
1 |
-
{"env_id": "Taxi-v3", "mean_reward": 7.56, "n_eval_episodes": 100, "eval_datetime": "2022-05-22T09:
|
|
|
1 |
+
{"env_id": "Taxi-v3", "mean_reward": 7.56, "n_eval_episodes": 100, "eval_datetime": "2022-05-22T09:40:41.639162"}
|