sdpkjc committed on
Commit
48650fa
•
1 Parent(s): 1009314

pushing model

Browse files
.gitattributes CHANGED
@@ -40,3 +40,6 @@ replay.mp4 filter=lfs diff=lfs merge=lfs -text
40
  videos/HalfCheetah-v4__ppo_fix_continuous_action__5__1704463477-eval/rl-video-episode-8.mp4 filter=lfs diff=lfs merge=lfs -text
41
  videos/HalfCheetah-v4__ppo_fix_continuous_action__5__1704463477-eval/rl-video-episode-1.mp4 filter=lfs diff=lfs merge=lfs -text
42
  videos/HalfCheetah-v4__ppo_fix_continuous_action__5__1704463477-eval/rl-video-episode-0.mp4 filter=lfs diff=lfs merge=lfs -text
 
 
 
 
40
  videos/HalfCheetah-v4__ppo_fix_continuous_action__5__1704463477-eval/rl-video-episode-8.mp4 filter=lfs diff=lfs merge=lfs -text
41
  videos/HalfCheetah-v4__ppo_fix_continuous_action__5__1704463477-eval/rl-video-episode-1.mp4 filter=lfs diff=lfs merge=lfs -text
42
  videos/HalfCheetah-v4__ppo_fix_continuous_action__5__1704463477-eval/rl-video-episode-0.mp4 filter=lfs diff=lfs merge=lfs -text
43
+ videos/HalfCheetah-v4__ppo_fix_continuous_action__5__1705702894-eval/rl-video-episode-0.mp4 filter=lfs diff=lfs merge=lfs -text
44
+ videos/HalfCheetah-v4__ppo_fix_continuous_action__5__1705702894-eval/rl-video-episode-8.mp4 filter=lfs diff=lfs merge=lfs -text
45
+ videos/HalfCheetah-v4__ppo_fix_continuous_action__5__1705702894-eval/rl-video-episode-1.mp4 filter=lfs diff=lfs merge=lfs -text
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: HalfCheetah-v4
17
  metrics:
18
  - type: mean_reward
19
- value: 1640.51 +/- 33.40
20
  name: mean_reward
21
  verified: false
22
  ---
 
16
  type: HalfCheetah-v4
17
  metrics:
18
  - type: mean_reward
19
+ value: 1608.34 +/- 18.25
20
  name: mean_reward
21
  verified: false
22
  ---
events.out.tfevents.1704463487.4090-171.161713.0 → events.out.tfevents.1705702908.3090-172.2625643.0 RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6b45cde0003c0d7c51c38416698b047ed434759ec86f9c9d8b2b37c2bc2b1468
3
  size 376394
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ac8154f9904f7faab5bf6d0286864ce2711a01cc3eeb5c68efecb612fcd78e66
3
  size 376394
ppo_fix_continuous_action.cleanrl_model CHANGED
Binary files a/ppo_fix_continuous_action.cleanrl_model and b/ppo_fix_continuous_action.cleanrl_model differ
 
ppo_fix_continuous_action.py CHANGED
@@ -198,7 +198,7 @@ class NormalizeReward(gym.core.Wrapper, gym.utils.RecordConstructorArgs):
198
  return obs, rews, terminateds, truncateds, infos
199
 
200
  def reset(self, **kwargs):
201
- self.returns = np.zeros(self.num_envs)
202
  return self.env.reset(**kwargs)
203
 
204
  def normalize(self, rews):
 
198
  return obs, rews, terminateds, truncateds, infos
199
 
200
  def reset(self, **kwargs):
201
+ # self.returns = np.zeros(self.num_envs)
202
  return self.env.reset(**kwargs)
203
 
204
  def normalize(self, rews):
replay.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5ef772844b50ee96d27a6886884667389061d311e1c6a35ee22f9ae086fa65ad
3
- size 2058420
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4072ae9c1b8ffff37108e3ad3f2b447111d55e2358efaa4670eb5458d782892d
3
+ size 2047150
videos/{HalfCheetah-v4__ppo_fix_continuous_action__5__1704463477-eval → HalfCheetah-v4__ppo_fix_continuous_action__5__1705702894-eval}/rl-video-episode-0.mp4 RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:67ebe612727bac1af4c3ab8817b0e2ebc24f6771945a415b2900728448719ef1
3
- size 2015752
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3aa3e3aaaf1477ad2c0ec447abc0f5ea43e26089e8ebdcfa2f1df307aa040ec2
3
+ size 2003448
videos/{HalfCheetah-v4__ppo_fix_continuous_action__5__1704463477-eval → HalfCheetah-v4__ppo_fix_continuous_action__5__1705702894-eval}/rl-video-episode-1.mp4 RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:45f277c2ec1a3d4956f68d18cb76b8904e5544dce29897d1c5660033f27a0e59
3
- size 2022201
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:10ce836ea72981ac1232d987301a4108c440ace76b184cbca79bf19ae79321cc
3
+ size 2029003
videos/{HalfCheetah-v4__ppo_fix_continuous_action__5__1704463477-eval → HalfCheetah-v4__ppo_fix_continuous_action__5__1705702894-eval}/rl-video-episode-8.mp4 RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5ef772844b50ee96d27a6886884667389061d311e1c6a35ee22f9ae086fa65ad
3
- size 2058420
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4072ae9c1b8ffff37108e3ad3f2b447111d55e2358efaa4670eb5458d782892d
3
+ size 2047150