mmorales34
committed on
Commit
•
aa4480b
1
Parent(s):
b085d98
pushing model
Browse files
- dqpn_freq.py +3 -4
- events.out.tfevents.1679277760.rhea.183515.0 → events.out.tfevents.1679289431.redi.466821.0 +1 -1
- videos/{CartPole-v1__CP_DQPN_x1__3__1679277756-eval → CartPole-v1__CP_DQPN_x1__3__1679289427-eval}/rl-video-episode-0.mp4 +0 -0
- videos/{CartPole-v1__CP_DQPN_x1__3__1679277756-eval → CartPole-v1__CP_DQPN_x1__3__1679289427-eval}/rl-video-episode-1.mp4 +0 -0
- videos/{CartPole-v1__CP_DQPN_x1__3__1679277756-eval → CartPole-v1__CP_DQPN_x1__3__1679289427-eval}/rl-video-episode-8.mp4 +0 -0
dqpn_freq.py
CHANGED
@@ -141,17 +141,16 @@ if __name__ == "__main__":
|
|
141 |
wandb.log({name: x, "global_step": y})
|
142 |
|
143 |
# TRY NOT TO MODIFY: seeding
|
144 |
-
random.seed(args.seed)
|
145 |
-
np.random.seed(args.seed)
|
146 |
torch.manual_seed(args.seed)
|
147 |
-
torch.backends.cudnn.deterministic = args.torch_deterministic
|
|
|
|
|
148 |
|
149 |
device = torch.device("cuda" if torch.cuda.is_available() and args.cuda else "cpu")
|
150 |
|
151 |
# env setup
|
152 |
envs = gym.vector.SyncVectorEnv([make_env(args.env_id, args.seed, 0, args.capture_video, run_name)])
|
153 |
assert isinstance(envs.single_action_space, gym.spaces.Discrete), "only discrete action space is supported"
|
154 |
-
envs.seed(args.seed)
|
155 |
|
156 |
q_network = QNetwork(envs).to(device)
|
157 |
optimizer = optim.RMSprop(q_network.parameters(), lr=args.learning_rate)
|
|
|
141 |
wandb.log({name: x, "global_step": y})
|
142 |
|
143 |
# TRY NOT TO MODIFY: seeding
|
|
|
|
|
144 |
torch.manual_seed(args.seed)
|
145 |
+
# torch.backends.cudnn.deterministic = args.torch_deterministic
|
146 |
+
np.random.seed(args.seed)
|
147 |
+
random.seed(args.seed)
|
148 |
|
149 |
device = torch.device("cuda" if torch.cuda.is_available() and args.cuda else "cpu")
|
150 |
|
151 |
# env setup
|
152 |
envs = gym.vector.SyncVectorEnv([make_env(args.env_id, args.seed, 0, args.capture_video, run_name)])
|
153 |
assert isinstance(envs.single_action_space, gym.spaces.Discrete), "only discrete action space is supported"
|
|
|
154 |
|
155 |
q_network = QNetwork(envs).to(device)
|
156 |
optimizer = optim.RMSprop(q_network.parameters(), lr=args.learning_rate)
|
events.out.tfevents.1679277760.rhea.183515.0 → events.out.tfevents.1679289431.redi.466821.0
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 684
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d7f9f851c34b5a4bd724939e309f3f0326129819727edfe81190ec4d3630443b
|
3 |
size 684
|
videos/{CartPole-v1__CP_DQPN_x1__3__1679277756-eval → CartPole-v1__CP_DQPN_x1__3__1679289427-eval}/rl-video-episode-0.mp4
RENAMED
File without changes
|
videos/{CartPole-v1__CP_DQPN_x1__3__1679277756-eval → CartPole-v1__CP_DQPN_x1__3__1679289427-eval}/rl-video-episode-1.mp4
RENAMED
File without changes
|
videos/{CartPole-v1__CP_DQPN_x1__3__1679277756-eval → CartPole-v1__CP_DQPN_x1__3__1679289427-eval}/rl-video-episode-8.mp4
RENAMED
File without changes
|