import os
import random
from pathlib import Path

import gradio as gr
import matplotlib
import numpy as np
import torch
import yaml

from models.TD3.TD3 import TD3
from sim import SIM_ENV

# Use a non-interactive backend so animations can be rendered without a display.
matplotlib.use("Agg")

def generate_random_points(num_scenarios=2):
    """Generate random robot poses and goals."""
    robot_poses = []
    robot_goals = []
    for _ in range(num_scenarios):
        # Random pose: x, y, orientation, velocity
        pose = [
            [random.uniform(1, 9)],  # x position
            [random.uniform(1, 9)],  # y position
            [random.uniform(0, 3.14)],  # orientation
            [0],  # initial velocity
        ]
        # Random goal: x, y, orientation
        goal = [
            [random.uniform(1, 9)],  # x position
            [random.uniform(1, 9)],  # y position
            [0],  # orientation
        ]
        robot_poses.append(pose)
        robot_goals.append(goal)
    return robot_poses, robot_goals
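
# Usage sketch: this helper is not wired into run_simulation() below, which
# currently draws from the predefined scenarios instead. The nested
# single-element lists mirror the column-vector format used by
# get_predefined_scenarios() and passed to sim.reset() as robot_state /
# robot_goal.
#
#     poses, goals = generate_random_points(num_scenarios=3)
#     # poses[0] -> [[x], [y], [orientation], [velocity]]
#     # goals[0] -> [[x], [y], [orientation]]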

def get_predefined_scenarios():
    """Return predefined robot poses and goals."""
    robot_poses = [
        [[3], [4], [0], [0]],
        [[8], [1], [1], [0]],
        [[2], [6], [1], [0]],
        [[7], [1], [0], [0]],
        [[7], [6.5], [2], [0]],
        [[9], [9], [3], [0]],
        [[2], [9], [1], [0]],
        [[3], [6], [3], [0]],
        [[1], [7], [0], [0]],
        [[5], [7], [3], [0]],
    ]
    robot_goals = [
        [[8], [8], [0]],
        [[2], [9], [0]],
        [[7], [1], [0]],
        [[7.2], [9], [0]],
        [[1], [1], [0]],
        [[5], [1], [0]],
        [[7], [4], [0]],
        [[9], [4], [0]],
        [[1], [9], [0]],
        [[5], [1], [0]],
    ]
    return robot_poses, robot_goals

def run_simulation():
    """Run one evaluation episode and return the generated GIF path and a statistics dict."""
    action_dim = 2  # number of actions produced by the model
    max_action = 1  # maximum absolute value of output actions
    state_dim = 25  # length of the state vector fed to the neural network
    device = torch.device(
        "cuda" if torch.cuda.is_available() else "cpu"
    )  # use CUDA if available, CPU otherwise
    epoch = 0  # epoch number used for logging
    max_steps = 300  # maximum number of steps in a single episode

    model = TD3(
        state_dim=state_dim,
        action_dim=action_dim,
        max_action=max_action,
        device=device,
        load_model=True,
    )  # instantiate the model and load pretrained weights
    sim = SIM_ENV(world_file="eval_world.yaml", save_ani=True)  # instantiate the environment

    # Random evaluation points could be generated instead of loading the predefined list:
    # num_scenarios = random.randint(2, 5)  # random number of scenarios between 2 and 5

    # Get the predefined scenarios and randomly select one.
    all_poses, all_goals = get_predefined_scenarios()
    scenario_index = random.randint(0, len(all_poses) - 1)
    robot_poses = [all_poses[scenario_index]]
    robot_goals = [all_goals[scenario_index]]
    print(f"Selected scenario {scenario_index + 1} of {len(all_poses)}")

    total_reward = 0.0
    total_steps = 0
    col = 0
    goals = 0
    for idx in range(len(robot_poses)):
        count = 0
        latest_scan, distance, cos, sin, collision, goal, a, reward = sim.reset(
            robot_state=robot_poses[idx],
            robot_goal=robot_goals[idx],
            random_obstacles=False,
        )
        done = False
        while not done and count < max_steps:
            state, terminal = model.prepare_state(
                latest_scan, distance, cos, sin, collision, goal, a
            )
            # Query the policy for an action; the False flag presumably disables exploration noise.
            action = model.get_action(np.array(state), False)
            # Rescale the linear command from [-1, 1] to [0, 0.5]; the angular command is passed through.
            a_in = [(action[0] + 1) / 4, action[1]]
            latest_scan, distance, cos, sin, collision, goal, a, reward = sim.step(
                lin_velocity=a_in[0], ang_velocity=a_in[1]
            )
            total_reward += reward
            total_steps += 1
            count += 1
            if collision:
                col += 1
            if goal:
                goals += 1
            done = collision or goal

    avg_step_reward = total_reward / total_steps
    avg_reward = total_reward / len(robot_poses)
    avg_col = col / len(robot_poses)
    avg_goal = goals / len(robot_poses)
    print(f"Total Reward: {total_reward}")
    print(f"Average Reward: {avg_reward}")
    print(f"Average Step Reward: {avg_step_reward}")
    print(f"Average Collision rate: {avg_col}")
    print(f"Average Goal rate: {avg_goal}")
    print("..............................................")
    model.writer.add_scalar("test/total_reward", total_reward, epoch)
    model.writer.add_scalar("test/avg_reward", avg_reward, epoch)
    model.writer.add_scalar("test/avg_step_reward", avg_step_reward, epoch)
    model.writer.add_scalar("test/avg_col", avg_col, epoch)
    model.writer.add_scalar("test/avg_goal", avg_goal, epoch)
    sim.env.end(ending_time=3)

    # Find the latest generated GIF file in the animation folder.
    animation_dir = Path("animation")
    if animation_dir.exists():
        gif_files = list(animation_dir.glob("*.gif"))
        if gif_files:
            # Pick the newest GIF by creation time.
            latest_gif = max(gif_files, key=lambda x: x.stat().st_ctime)
            return str(latest_gif), {
                "Total Reward": f"{total_reward:.2f}",
                "Average Reward": f"{avg_reward:.2f}",
                "Average Step Reward": f"{avg_step_reward:.2f}",
                "Collision Rate": f"{avg_col:.2f}",
                "Goal Rate": f"{avg_goal:.2f}",
            }
    return None, {"Error": "No GIF file was generated"}
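
# Optional headless check (a minimal sketch, not part of the Gradio flow):
# calling run_simulation() directly prints the episode statistics and the
# path of the rendered GIF without launching the UI.
def run_headless_check():
    gif_path, stats = run_simulation()
    print("Animation:", gif_path)
    for name, value in stats.items():
        print(f"{name}: {value}")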

def get_default_data():
    """Return default animation and statistics data."""
    # Find any existing GIF in the animation folder.
    animation_dir = Path("animation")
    default_gif = None
    if animation_dir.exists():
        gif_files = list(animation_dir.glob("*.gif"))
        if gif_files:
            # Get the most recent GIF.
            default_gif = str(max(gif_files, key=lambda x: x.stat().st_ctime))

    # Default statistics shown before the first run.
    default_stats = {
        "Total Reward": "99.12",
        "Average Reward": "99.12",
        "Average Step Reward": "1.40",
        "Collision Rate": "0.00",
        "Goal Rate": "1.00",
    }
    return default_gif, default_stats

def main(args=None):
    """Main function with the Gradio interface."""
    # Get default data for the initial display.
    default_gif, default_stats = get_default_data()

    with gr.Blocks(title="Robot Navigation Simulation") as demo:
        with gr.Row():
            with gr.Column():
                run_button = gr.Button("Run Simulation", variant="primary")
        with gr.Row():
            with gr.Column():
                output_image = gr.Image(
                    type="filepath",
                    label="Simulation Animation",
                    value=default_gif,  # default value
                )
            with gr.Column():
                output_stats = gr.JSON(
                    label="Simulation Statistics",
                    value=default_stats,  # default value
                )
        run_button.click(
            fn=run_simulation,
            outputs=[output_image, output_stats],
        )

    demo.launch(share=False)


if __name__ == "__main__":
    main()