Text-Gym-Agents / envs /mujoco /halfcheetah_translator.py
CharlesZhang's picture
add 5 more envs: halfcheetah, hopper, walker2d, invertedPendulum, invertedDoublePendulum.
2ec5014
class BasicLevelTranslator:
def __init__(self):
pass
def translate(self, state):
(front_tip_z, front_tip_angle, back_thigh_angle_1, back_shin_angle_1,
tip_velocity_x, tip_velocity_y, front_tip_angular_velocity,
back_thigh_angular_velocity_1, front_tip_x, front_tip_y, front_tip_angle_2,
back_thigh_angle_2, back_shin_angle_2, tip_velocity_angular_x,
tip_velocity_angular_y, front_tip_angular_velocity_2,
back_thigh_angular_velocity_2) = state[:17]
res = (
f"The front tip is at a z-coordinate of {front_tip_z:.2f} meters. "
f"The angle of the front tip is {front_tip_angle:.2f} radians. "
f"The angles of the back thigh are {back_thigh_angle_1:.2f} and {back_thigh_angle_2:.2f} radians. "
f"The angles of the back shin are {back_shin_angle_1:.2f} and {back_shin_angle_2:.2f} radians. "
f"The tip has velocity along the x-axis of {tip_velocity_x:.2f} m/s. "
f"The tip has velocity along the y-axis of {tip_velocity_y:.2f} m/s. "
f"The angular velocity of the front tip is {front_tip_angular_velocity:.2f} radians/s. "
f"The angular velocities of the back thigh are {back_thigh_angular_velocity_1:.2f} and {back_thigh_angular_velocity_2:.2f} radians/s. "
f"The x-coordinate of the front tip is {front_tip_x:.2f} meters. "
f"The y-coordinate of the front tip is {front_tip_y:.2f} meters. "
f"The angle of the front tip is {front_tip_angle_2:.2f} radians. "
f"The angular velocity of the tip along the x-axis is {tip_velocity_angular_x:.2f} radians/s. "
f"The angular velocity of the tip along the y-axis is {tip_velocity_angular_y:.2f} radians/s. "
f"The angular velocity of the back shin is {front_tip_angular_velocity_2:.2f} radians/s."
)
return res
class GameDescriber:
def __init__(self, args):
self.is_only_local_obs = args.is_only_local_obs == 1
self.max_episode_len = args.max_episode_len
self.action_desc_dict = {
}
self.reward_desc_dict = {
}
def translate_terminate_state(self, state, episode_len, max_episode_len):
return ""
def translate_potential_next_state(self, state, action):
return ""
def describe_goal(self):
return "The goal is to make the Half-Cheetah run forward (right) as fast as possible."
def describe_game(self):
return (
"In the Half-Cheetah game, you control a 2-dimensional robot with 9 links and 8 joints. "
"The goal is to apply torque to the joints to make the cheetah run forward (right) as fast as possible. "
"You can control the back thigh, back shin, and back foot rotors for the back legs, and the front thigh, "
"front shin, and front foot rotors for the front legs. The episode ends after 1000 timesteps. "
"Your reward is based on how much forward progress you make and how much control effort you apply."
)
def describe_action(self):
return (
"Your next move: \n"
"Please select six numerical values, each one within the range of [-1,1], "
"which represents the torque being applied to the back thigh rotor, "
"back shin rotor, back foot rotor, front thigh rotor, front shin rotor, "
"and front foot rotor respectively."
)
class BasicStateSequenceTranslator(BasicLevelTranslator):
def translate(self, infos, is_current=False):
descriptions = []
if is_current:
state_desc = BasicLevelTranslator().translate(infos[-1]['state'])
return state_desc
for i, info in enumerate(infos):
assert 'state' in info, "info should contain state information"
state_desc = BasicLevelTranslator().translate(info['state'])
action_desc = (
"Take Action: "
"Apply Back Thigh Torque: {:.2f}, "
"Apply Back Shin Torque: {:.2f}, "
"Apply Back Foot Torque: {:.2f}, "
"Apply Front Thigh Torque: {:.2f}, "
"Apply Front Shin Torque: {:.2f}, "
"Apply Front Foot Torque: {:.2f}"
).format(
info['action'][0], info['action'][1], info['action'][2],
info['action'][3], info['action'][4], info['action'][5]
)
reward_desc = f"Result: Forward Reward of {info['forward_reward']:.2f}, "
ctrl_cost_desc = f"Control Cost of {info['ctrl_cost']:.2f}, "
total_reward_desc = f"Total Reward of {info['reward']:.2f}, "
next_state_desc = BasicLevelTranslator().translate(info['next_state'])
descriptions.append(f"{state_desc}.\\n {action_desc} \\n {reward_desc} {ctrl_cost_desc} {total_reward_desc} \\n Transit to {next_state_desc}")
return descriptions