sofiaoliveira
committed on
Commit
•
cdf6092
1
Parent(s):
f549db8
Push Q-Learning agent to Hub
Browse files
- README.md +1 -1
- q-learning.pkl +2 -2
- replay.mp4 +2 -2
- results.json +1 -1
README.md
CHANGED
@@ -9,7 +9,7 @@ model-index:
|
|
9 |
results:
|
10 |
- metrics:
|
11 |
- type: mean_reward
|
12 |
-
value: 7.
|
13 |
name: mean_reward
|
14 |
task:
|
15 |
type: reinforcement-learning
|
|
|
9 |
results:
|
10 |
- metrics:
|
11 |
- type: mean_reward
|
12 |
+
value: 7.56 +/- 2.71
|
13 |
name: mean_reward
|
14 |
task:
|
15 |
type: reinforcement-learning
|
q-learning.pkl
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:65b80f0cf2d3194385177bd9f2dcbb3f9d3072065392c541262ba76c044ed8df
|
3 |
+
size 24591
|
replay.mp4
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:644d40e0911b5aaca1da5a67154701793e211cb8ef83c6ae0cee2c8643db8b8b
|
3 |
+
size 125538
|
results.json
CHANGED
@@ -1 +1 @@
|
|
1 |
-
{"env_id": "Taxi-v3", "mean_reward": 7.
|
|
|
1 |
+
{"env_id": "Taxi-v3", "mean_reward": 7.56, "n_eval_episodes": 100, "eval_datetime": "2022-08-08T15:01:59.502797"}
|