zjowowen committed on
Commit
19994eb
1 Parent(s): dcf808a

Upload README.md with huggingface_hub

Browse files
Files changed (1) hide show
  1. README.md +6 -4
README.md CHANGED
@@ -21,7 +21,7 @@ model-index:
21
  type: BreakoutNoFrameskip-v4
22
  metrics:
23
  - type: mean_reward
24
- value: 6.6 +/- 3.58
25
  name: mean_reward
26
  ---
27
 
@@ -175,7 +175,9 @@ exp_config = {
175
  'n_evaluator_episode': 3,
176
  'manager': {
177
  'shared_memory': False
178
- }
 
 
179
  },
180
  'policy': {
181
  'on_policy': False,
@@ -241,7 +243,7 @@ exp_config = {
241
  'root_noise_weight': 0.25,
242
  'random_collect_episode_num': 0,
243
  'eps': {
244
- 'eps_greedy_exploration_in_collect': False,
245
  'type': 'linear',
246
  'start': 1.0,
247
  'end': 0.05,
@@ -290,7 +292,7 @@ exp_config = {
290
  - **Demo:** [video](https://huggingface.co/OpenDILabCommunity/BreakoutNoFrameskip-v4-MuZero/blob/main/replay.mp4)
291
  <!-- Provide the size information for the model. -->
292
  - **Parameters total size:** 24008.38 KB
293
- - **Last Update Date:** 2023-12-20
294
 
295
  ## Environments
296
  <!-- Address questions around what environment the model is intended to be trained and deployed at, including the necessary information needed to be provided for future users. -->
 
21
  type: BreakoutNoFrameskip-v4
22
  metrics:
23
  - type: mean_reward
24
+ value: 416.7 +/- 149.94
25
  name: mean_reward
26
  ---
27
 
 
175
  'n_evaluator_episode': 3,
176
  'manager': {
177
  'shared_memory': False
178
+ },
179
+ 'collect_max_episode_steps': 5000,
180
+ 'eval_max_episode_steps': 20000
181
  },
182
  'policy': {
183
  'on_policy': False,
 
243
  'root_noise_weight': 0.25,
244
  'random_collect_episode_num': 0,
245
  'eps': {
246
+ 'eps_greedy_exploration_in_collect': True,
247
  'type': 'linear',
248
  'start': 1.0,
249
  'end': 0.05,
 
292
  - **Demo:** [video](https://huggingface.co/OpenDILabCommunity/BreakoutNoFrameskip-v4-MuZero/blob/main/replay.mp4)
293
  <!-- Provide the size information for the model. -->
294
  - **Parameters total size:** 24008.38 KB
295
+ - **Last Update Date:** 2023-12-26
296
 
297
  ## Environments
298
  <!-- Address questions around what environment the model is intended to be trained and deployed at, including the necessary information needed to be provided for future users. -->