pkalkman
/

LunarLander-v2-ppo

Reinforcement Learning

stable-baselines3

deep-reinforcement-learning

Eval Results (legacy)

Model card Files Files and versions

LunarLander-v2-ppo / src /upload.py

pkalkman's picture

model with score above 200

7b8c673 over 1 year ago

history blame contribute delete

1.36 kB

	import gymnasium as gym
	from stable_baselines3 import PPO
	from stable_baselines3.common.vec_env import DummyVecEnv
	from stable_baselines3.common.monitor import Monitor # Import Monitor
	from huggingface_sb3 import package_to_hub
	from stable_baselines3.common.vec_env import VecNormalize

	# Define the name of the environment
	env_id = "LunarLander-v2"

	# Define the model architecture we used
	model_architecture = "PPO"

	repo_id = "pkalkman/LunarLander-v2-ppo"

	# Define the commit message
	commit_message = "Upload PPO LunarLander-v2 trained agent"

	# Load the best trained model
	model_name = "ppo-LunarLander-v2"
	model = PPO.load("./logs/best_model/best_model.zip")

	# Create the evaluation environment and wrap it with Monitor
	eval_env = DummyVecEnv([lambda: Monitor(gym.make(env_id, render_mode="rgb_array"))])

	# Load VecNormalize statistics from training
	eval_env = VecNormalize.load("vecnormalize.pkl", eval_env)

	# Push the model to Hugging Face
	package_to_hub(
	model=model, # Our trained model
	model_name=model_name, # The name of our trained model
	model_architecture=model_architecture, # The model architecture we used
	env_id=env_id, # Name of the environment
	eval_env=eval_env, # Evaluation environment
	repo_id=repo_id, # Your Hugging Face repo ID
	commit_message=commit_message # Commit message for the upload
	)