hishamcse committed on
Commit
4de1db5
1 Parent(s): e34632c

Upload folder using huggingface_hub

Browse files
Files changed (6) hide show
  1. .gitattributes +1 -0
  2. README.md +29 -0
  3. agent.pt +3 -0
  4. hyperparameters.json +1 -0
  5. replay.mp4 +3 -0
  6. results.json +1 -0
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ replay.mp4 filter=lfs diff=lfs merge=lfs -text
README.md ADDED
@@ -0,0 +1,29 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ tags:
3
+ - MontezumaRevengeNoFrameskip-v4
4
+ - RND
5
+ - CNN
6
+ - reinforcement-learning
7
+ - custom-implementation
8
+ - atari
9
+ - MontezumaRevengeNoFrameskip-v4
10
+ model-index:
11
+ - name: RND-MontezumaRevengeNoFrameskip-v4
12
+ results:
13
+ - task:
14
+ type: reinforcement-learning
15
+ name: reinforcement-learning
16
+ dataset:
17
+ name: MontezumaRevengeNoFrameskip-v4
18
+ type: MontezumaRevengeNoFrameskip-v4
19
+ metrics:
20
+ - type: mean_reward
21
+ value: 60.00 +/- 149.67
22
+ name: mean_reward
23
+ verified: false
24
+ ---
25
+
26
+ # **RND with CNN** Agent playing **MontezumaRevengeNoFrameskip-v4**
27
+ This is a trained model of an **RND-CNN** agent playing **MontezumaRevengeNoFrameskip-v4**.
28
+ To learn how to use this model and train your own, check out this notebook on Kaggle: https://www.kaggle.com/code/syedjarullahhisham/drl-extra-personal-unit-5-rnd-montezuma-mario-bros
29
+
agent.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:21d17eef042235eba953472a459d080041e1df0951d2df6c09805d2061e8ce1b
3
+ size 21177478
hyperparameters.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"trainmethod": "RND", "envid": "MontezumaRevengeNoFrameskip-v4", "maxstepperepisode": 4500, "learningrate": 0.0001, "numenv": 1, "numstep": 128, "gamma": 0.999, "intgamma": 0.99, "lambda": 0.95, "usegae": true, "clipgradnorm": 0.5, "entropy": 0.001, "epoch": 4, "minibatch": 4, "ppoeps": 0.1, "extcoef": 2.0, "intcoef": 1.0, "stickyaction": false, "actionprob": 0.25, "lifedone": false, "obsnormstep": 50}
replay.mp4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9bc9698b46aa0f98741d013623f2ac3bcdb85e63ca851a4e6fde4ba90c419d7f
3
+ size 5655334
results.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"env_id": "MontezumaRevengeNoFrameskip-v4", "mean_reward": 60.0, "n_evaluation_episodes": 10, "eval_datetime": "2024-06-23T06:53:37.640281"}