Text-Gym-Agents / envs /mujoco /pusher_translator.py
CharlesZhang's picture
add: Pusher env
6299d2b
'''Pusher
Action Space Box(-2.0, 2.0, (7,), float32)
Observation Space Box(-inf, inf, (23,), float64)
'''
import math
class BasicLevelTranslator:
def __init__(self):
pass
def translate(self, state):
joint_angles = state[:7]
joint_velocities = state[7:14]
fingertip_coords = state[14:17]
object_coords = state[17:20]
goal_coords = state[20:]
joint_angle_degrees = [math.degrees(angle) for angle in joint_angles]
joint_velocity_degrees = [math.degrees(velocity) for velocity in joint_velocities]
res = (f"Rotation of the panning shoulder: {joint_angle_degrees[0]:.2f} degrees, "
f"Rotation of the shoulder lifting joint: {joint_angle_degrees[1]:.2f} degrees, "
f"Rotation of the shoulder rolling joint: {joint_angle_degrees[2]:.2f} degrees, "
f"Rotation of the elbow joint: {joint_angle_degrees[3]:.2f} degrees, "
f"Rotation of the forearm rolling joint: {joint_angle_degrees[4]:.2f} degrees, "
f"Rotation of the wrist flexing joint: {joint_angle_degrees[5]:.2f} degrees, "
f"Rotation of the wrist rolling joint: {joint_angle_degrees[6]:.2f} degrees, "
f"Rotational velocity of the panning shoulder: {joint_velocity_degrees[0]:.2f} degrees/s, "
f"Rotational velocity of the shoulder lifting joint: {joint_velocity_degrees[1]:.2f} degrees/s, "
f"Rotational velocity of the shoulder rolling joint: {joint_velocity_degrees[2]:.2f} degrees/s, "
f"Rotational velocity of the elbow joint: {joint_velocity_degrees[3]:.2f} degrees/s, "
f"Rotational velocity of the forearm rolling joint: {joint_velocity_degrees[4]:.2f} degrees/s, "
f"Rotational velocity of the wrist flexing joint: {joint_velocity_degrees[5]:.2f} degrees/s, "
f"Rotational velocity of the wrist rolling joint: {joint_velocity_degrees[6]:.2f} degrees/s, "
f"Fingertip coordinates (x, y, z): ({fingertip_coords[0]:.2f}, {fingertip_coords[1]:.2f}, {fingertip_coords[2]:.2f}), "
f"Object coordinates (x, y, z): ({object_coords[0]:.2f}, {object_coords[1]:.2f}, {object_coords[2]:.2f}), "
f"Goal coordinates (x, y, z): ({goal_coords[0]:.2f}, {goal_coords[1]:.2f}, {goal_coords[2]:.2f}).")
return res
class GameDescriber:
def __init__(self, args):
self.is_only_local_obs = args.is_only_local_obs == 1
self.max_episode_len = args.max_episode_len
self.action_desc_dict = {
}
self.reward_desc_dict = {
}
def translate_terminate_state(self, state, episode_len, max_episode_len):
return ""
def translate_potential_next_state(self, state, action):
return ""
def describe_goal(self):
return "The goal is to move the target cylinder (object) to the goal position using the robot's end effector (fingertip)."
def describe_game(self):
return ("In the Pusher game, you control a multi-jointed robot arm to manipulate a target cylinder (object) "
"and place it in a goal position using the robot's fingertip (end effector). The robot has shoulder, elbow, "
"forearm, and wrist joints that you can control with torque values. The observation space includes joint angles, "
"angular velocities of joints, fingertip coordinates, object coordinates, and goal coordinates. The reward is "
"based on the distance between the fingertip and the object, the distance between the object and the goal, "
"and control penalties for large actions.")
def describe_action(self):
return ("Your next move: \n Please provide a list of 7 numerical values within the range [-2, 2], "
"representing the torques applied to the robot's joints (shoulder, elbow, forearm, and wrist).")
class BasicStateSequenceTranslator(BasicLevelTranslator):
def translate(self, infos, is_current=False):
descriptions = []
if is_current:
state_desc = BasicLevelTranslator().translate(infos[-1]['state'])
return state_desc
for info in infos:
assert 'state' in info, "info should contain state information"
state_desc = BasicLevelTranslator().translate(info['state'])
action_desc = ("Take Action: Apply Torques - "
"Shoulder Pan: {:.2f}, Shoulder Lift: {:.2f}, Shoulder Roll: {:.2f}, "
"Elbow Flex: {:.2f}, Forearm Roll: {:.2f}, Wrist Flex: {:.2f}, Wrist Roll: {:.2f}"
).format(info['action'][0], info['action'][1], info['action'][2], info['action'][3],
info['action'][4], info['action'][5], info['action'][6])
reward_desc = f"Result: Reward of {info['reward']:.2f}"
next_state_desc = BasicLevelTranslator().translate(info['next_state'])
descriptions.append(f"{state_desc}\n{action_desc}\n{reward_desc}\nTransit to {next_state_desc}")
return descriptions