Update README.md
Browse files
README.md
CHANGED
@@ -30,39 +30,7 @@ TODO: Add your code
|
|
30 |
|
31 |
```python
|
32 |
|
33 |
-
|
34 |
-
model_architecture = "PPO"
|
35 |
-
model_name = "ppo-LunarLander-v2"
|
36 |
-
|
37 |
-
env = make_vec_env(env_id , n_envs=16)
|
38 |
-
|
39 |
-
model = PPO(
|
40 |
-
policy = "MlpPolicy",
|
41 |
-
env = env,
|
42 |
-
n_steps = 1024,
|
43 |
-
batch_size = 64,
|
44 |
-
n_epochs = 4,
|
45 |
-
gamma = 0.999,
|
46 |
-
gae_lambda = 0.98,
|
47 |
-
ent_coef = 0.01,
|
48 |
-
verbose = 0
|
49 |
-
)
|
50 |
-
|
51 |
-
model.learn(total_timesteps=1_000_000)
|
52 |
-
model.save(model_name)
|
53 |
-
|
54 |
-
eval_env = DummyVecEnv([lambda: gym.make(env_id)])
|
55 |
-
mean_reward, std_reward = evaluate_policy(model, eval_env, n_eval_episodes=10, deterministic=True)
|
56 |
-
print(f"mean_reward={mean_reward:.2f} +/- {std_reward}")
|
57 |
-
|
58 |
-
package_to_hub(model=model,
|
59 |
-
model_name=model_name,
|
60 |
-
model_architecture=model_architecture,
|
61 |
-
env_id=env_id,
|
62 |
-
eval_env=eval_env,
|
63 |
-
repo_id="29thDay/ppo-LunarLander-v2",
|
64 |
-
commit_message="Upload PPO LunarLander-v2 trained agent"
|
65 |
-
)
|
66 |
|
67 |
...
|
68 |
```
|
|
|
30 |
|
31 |
```python
|
32 |
|
33 |
+
# TODO
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
34 |
|
35 |
...
|
36 |
```
|