vwxyzjn committed on
Commit
b37cacc
1 Parent(s): 60e0047

pushing model

Browse files
README.md CHANGED
@@ -30,7 +30,7 @@ found [here](https://github.com/vwxyzjn/cleanrl/blob/master/cleanrl/dqn.py).
30
 
31
  ```bash
32
  curl -OL https://huggingface.co/vwxyzjn/CartPole-v1-dqn-seed1/raw/main/dqn.py
33
- python cleanrl/dqn.py --cuda False --save-model --upload-model --total-timesteps 500
34
  ```
35
 
36
  # Hyperparameters
 
30
 
31
  ```bash
32
  curl -OL https://huggingface.co/vwxyzjn/CartPole-v1-dqn-seed1/raw/main/dqn.py
33
+ python dqn.py --cuda False --save-model --upload-model --total-timesteps 500
34
  ```
35
 
36
  # Hyperparameters
events.out.tfevents.1668621727.pop-os.1063627.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:830b02670954a8f05f7e96b7966dd827f8bd7206f70e7ef00bb70a9b1e1c447a
3
+ size 1805
events.out.tfevents.1668621728.pop-os.1063627.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a4c417780d8220d5655af10b0d08bf71d9ea42beb2b1087f355555cd052abbe6
3
+ size 618
pyproject.toml ADDED
@@ -0,0 +1,96 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [tool.poetry]
2
+ name = "cleanrl"
3
+ version = "1.0.0b2"
4
+ description = "High-quality single file implementation of Deep Reinforcement Learning algorithms with research-friendly features"
5
+ authors = ["Costa Huang <costa.huang@outlook.com>"]
6
+ include = ["cleanrl_utils"]
7
+ keywords = ["reinforcement", "machine", "learning", "research"]
8
+ license="MIT"
9
+ readme = "README.md"
10
+
11
+ [tool.poetry.dependencies]
12
+ python = ">=3.7.1,<3.10"
13
+ tensorboard = "^2.10.0"
14
+ wandb = "^0.13.3"
15
+ gym = {version = "0.23.1", extras = ["classic_control"]}
16
+ torch = "^1.12.1"
17
+ stable-baselines3 = "1.2.0"
18
+
19
+ [tool.poetry.group.dev.dependencies]
20
+ pre-commit = "^2.20.0"
21
+
22
+ [tool.poetry.group.atari]
23
+ optional = true
24
+ [tool.poetry.group.atari.dependencies]
25
+ ale-py = "0.7.4"
26
+ AutoROM = {extras = ["accept-rom-license"], version = "^0.4.2"}
27
+ opencv-python = "^4.6.0.66"
28
+
29
+ [tool.poetry.group.pybullet]
30
+ optional = true
31
+ [tool.poetry.group.pybullet.dependencies]
32
+ pybullet = "3.1.8"
33
+
34
+ [tool.poetry.group.procgen]
35
+ optional = true
36
+ [tool.poetry.group.procgen.dependencies]
37
+ procgen = "^0.10.7"
38
+
39
+ [tool.poetry.group.pytest]
40
+ optional = true
41
+ [tool.poetry.group.pytest.dependencies]
42
+ pytest = "^7.1.3"
43
+
44
+ [tool.poetry.group.mujoco]
45
+ optional = true
46
+ [tool.poetry.group.mujoco.dependencies]
47
+ free-mujoco-py = "^2.1.6"
48
+
49
+ [tool.poetry.group.docs]
50
+ optional = true
51
+ [tool.poetry.group.docs.dependencies]
52
+ mkdocs-material = "^8.4.3"
53
+ markdown-include = "^0.7.0"
54
+
55
+ [tool.poetry.group.jax]
56
+ optional = true
57
+ [tool.poetry.group.jax.dependencies]
58
+ jax = "^0.3.17"
59
+ jaxlib = "^0.3.15"
60
+ flax = "^0.6.0"
61
+
62
+ [tool.poetry.group.optuna]
63
+ optional = true
64
+ [tool.poetry.group.optuna.dependencies]
65
+ optuna = "^3.0.1"
66
+ optuna-dashboard = "^0.7.2"
67
+ rich = "<12.0"
68
+
69
+ [tool.poetry.group.envpool]
70
+ optional = true
71
+ [tool.poetry.group.envpool.dependencies]
72
+ envpool = "^0.6.4"
73
+
74
+ [tool.poetry.group.pettingzoo]
75
+ optional = true
76
+ [tool.poetry.group.pettingzoo.dependencies]
77
+ PettingZoo = "1.18.1"
78
+ SuperSuit = "3.4.0"
79
+ multi-agent-ale-py = "0.1.11"
80
+
81
+
82
+ [tool.poetry.group.cloud]
83
+ optional = true
84
+ [tool.poetry.group.cloud.dependencies]
85
+ boto3 = "^1.24.70"
86
+ awscli = "^1.25.71"
87
+
88
+ [tool.poetry.group.isaacgym]
89
+ optional = true
90
+ [tool.poetry.group.isaacgym.dependencies]
91
+ isaacgymenvs = {git = "https://github.com/vwxyzjn/IsaacGymEnvs.git", rev = "poetry"}
92
+ isaacgym = {path = "cleanrl/ppo_continuous_action_isaacgym/isaacgym", develop = true}
93
+
94
+ [build-system]
95
+ requires = ["poetry-core"]
96
+ build-backend = "poetry.core.masonry.api"
replay.mp4 ADDED
Binary file (10.8 kB). View file
 
videos/CartPole-v1__dqn__1__1668621727-eval/rl-video-episode-0.mp4 ADDED
Binary file (12.6 kB). View file
 
videos/CartPole-v1__dqn__1__1668621727-eval/rl-video-episode-1.mp4 ADDED
Binary file (8.84 kB). View file
 
videos/CartPole-v1__dqn__1__1668621727-eval/rl-video-episode-8.mp4 ADDED
Binary file (10.8 kB). View file