Amu committed on
Commit
fbdbdf4
1 Parent(s): 49e21e2
Files changed (6) hide show
  1. .gitattributes +1 -0
  2. README.md +25 -0
  3. hyperparameters.json +1 -0
  4. model.pt +3 -0
  5. replay.mp4 +3 -0
  6. results.json +1 -0
.gitattributes CHANGED
@@ -32,3 +32,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
32
  *.zip filter=lfs diff=lfs merge=lfs -text
33
  *.zst filter=lfs diff=lfs merge=lfs -text
34
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
32
  *.zip filter=lfs diff=lfs merge=lfs -text
33
  *.zst filter=lfs diff=lfs merge=lfs -text
34
  *tfevents* filter=lfs diff=lfs merge=lfs -text
35
+ *.mp4 filter=lfs diff=lfs merge=lfs -text
README.md ADDED
@@ -0,0 +1,25 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ tags:
3
+ - CartPole-v1
4
+ - reinforce
5
+ - reinforcement-learning
6
+ - custom-implementation
7
+ - deep-rl-class
8
+ model-index:
9
+ - name: tao-ppo-CartPole-v1
10
+ results:
11
+ - task:
12
+ type: reinforcement-learning
13
+ name: reinforcement-learning
14
+ dataset:
15
+ name: CartPole-v1
16
+ type: CartPole-v1
17
+ metrics:
18
+ - type: mean_reward
19
+ value: 254.10 +/- 29.91
20
+ name: mean_reward
21
+ verified: false
22
+ ---
23
+
24
+ # Agent playing **CartPole-v1**
25
+
hyperparameters.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"training": false, "model_name": "PPO", "track": false, "wandb_project_name": "tao", "wandb_entity": null, "env_id": "CartPole-v1", "capture_video": false, "total_timesteps": 500000, "learning_rate": 0.00025, "num_envs": 4, "num_steps": 128, "anneal_lr": true, "gamma": 0.99, "gae_lambda": 0.95, "num_minibatches": 4, "update_epochs": 4, "norm_adv": true, "clip_range": 0.2, "entropy_coef": 0.01, "vf_coef": 0.5, "max_grad_norm": 0.5, "target_kl": null, "seed": 1, "run_name": "CartPole-v1__PPO__1__500000", "device": "cpu", "torch_deterministic": true, "batch_size": 512, "minibatch_size": 128}
model.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bfff2411866bdf14cd72f3fc93c85c3769ff70a7735f8d2ad2daa2749bfecf10
3
+ size 39909
replay.mp4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:767b346e9a995d9d733706e2256b54d12686cf3dddd2c35c960b123adf080e58
3
+ size 57900
results.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"env_id": "CartPole-v1", "mean_reward": 254.10000610351562, "n_evaluation_episodes": 10, "eval_datetime": "2022-12-27T17:51:03.873785"}