Push Q-Learning agent to Hub
Browse files
- README.md +1 -1
- q-learning.pkl +1 -1
- replay.mp4 +2 -2
- results.json +1 -1
README.md
CHANGED
@@ -9,7 +9,7 @@ model-index:
|
|
9 |
results:
|
10 |
- metrics:
|
11 |
- type: mean_reward
|
12 |
-
value: 7.
|
13 |
name: mean_reward
|
14 |
task:
|
15 |
type: reinforcement-learning
|
|
|
9 |
results:
|
10 |
- metrics:
|
11 |
- type: mean_reward
|
12 |
+
value: 7.56 +/- 2.71
|
13 |
name: mean_reward
|
14 |
task:
|
15 |
type: reinforcement-learning
|
q-learning.pkl
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 24589
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:49bd3f98c281d734e5336288eff4589c35609056e49a3a14950e056d0f0eda59
|
3 |
size 24589
|
replay.mp4
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7a6ecdfe734abd6afa20082608d989125016e80bf1765928aaa990423cab4b66
|
3 |
+
size 106886
|
results.json
CHANGED
@@ -1 +1 @@
|
|
1 |
-
{"env_id": "Taxi-v3", "mean_reward": 7.
|
|
|
1 |
+
{"env_id": "Taxi-v3", "mean_reward": 7.56, "n_eval_episodes": 100, "eval_datetime": "2022-06-24T17:32:39.488627"}
|