Spaces:

MAIL-CS-ECNU
/

Text-Gym-Agents

Runtime error

Text-Gym-Agents / envs /toy_text /frozenlake_translator.py

Jarvis-K

init

2a33798 over 1 year ago

4.4 kB

	class BasicLevelTranslator:
	    """Turn a flat FrozenLake state index into a one-sentence position description."""

	    def __init__(self):
	        pass

	    def translate(self, state, nrow=4, ncol=4):
	        """Describe the grid cell addressed by ``state``.

	        Args:
	            state: Flat cell index. It is decoded as row-major, i.e.
	                ``state == row * ncol + col`` (the layout used by the
	                Gym/Gymnasium FrozenLake environment).
	            nrow: Number of grid rows. Kept for interface compatibility;
	                a row-major index is decoded with the column count only.
	            ncol: Number of grid columns.

	        Returns:
	            A sentence naming the zero-based row and column of the player.
	        """
	        # Both coordinates come from the column count: the previous
	        # ``state // nrow`` was only right when the grid happened to be square.
	        row, col = divmod(state, ncol)
	        return f"The current position of the player is at row {row}, column {col}."

	class GameDescriber:
	    """Build the natural-language prompts that describe the 4x4 FrozenLake game.

	    When ``args.is_only_local_obs`` equals 1 the descriptions omit the
	    coordinates of the goal and of the holes; otherwise they are spelled out.
	    """

	    # Layout of the hard-coded 4x4 map that every method of this class assumes.
	    _GRID_SIZE = 4
	    _GOAL = (3, 3)
	    _HOLES = frozenset({(1, 1), (1, 3), (2, 3), (3, 0)})
	    # (row delta, column delta) per action code, matching ``describe_action``.
	    _ACTION_DELTAS = {
	        '1': (0, -1),  # left
	        '2': (1, 0),   # down
	        '3': (0, 1),   # right
	        '4': (-1, 0),  # up
	    }

	    def __init__(self, args):
	        """Store the observation mode and episode limit read from ``args``.

	        Args:
	            args: Object exposing ``is_only_local_obs`` (compared against 1)
	                and ``max_episode_len`` attributes.
	        """
	        self.is_only_local_obs = args.is_only_local_obs == 1
	        self.max_episode_len = args.max_episode_len
	        self.action_desc_dict = {
	            1: "Move left",
	            2: "Move down",
	            3: "Move right",
	            4: "Move up",
	        }
	        self.reward_desc_dict = {
	            1: "which lets him reach the goal and receive 1 reward",
	            0: "which lets him receive 0 reward",
	        }

	    def describe_goal(self):
	        """Return the one-sentence objective of the game."""
	        # The separating space/comma belongs to the optional fragment so that
	        # local-observation mode does not leave a doubled space behind.
	        goal_hint = "" if self.is_only_local_obs else " located at (3,3)"
	        holes_hint = (
	            "" if self.is_only_local_obs
	            else ", which are located at (1,1), (1,3), (2,3) and (3,0)"
	        )
	        return (
	            "The goal is to navigate across the frozen lake and reach the goal position"
	            f"{goal_hint} without falling into any holes{holes_hint}."
	        )

	    def translate_terminate_state(self, state, episode_len, max_episode_len):
	        """Explain why the episode ended in ``state``.

	        Args:
	            state: Flat cell index on the 4x4 grid (anything ``int()`` accepts).
	            episode_len: Number reported in the "max episode length" message.
	            max_episode_len: Accepted for interface compatibility; not used.

	        Returns:
	            The goal message for cell (3, 3), the hole message for a hole
	            cell, and the max-episode-length message for every other cell
	            (no check is made that the limit was actually reached).
	        """
	        position = divmod(int(state), self._GRID_SIZE)
	        if position == self._GOAL:
	            row, col = position
	            return f"The player reaches the goal location ({row}, {col}) in the grid world."
	        if position in self._HOLES:
	            return f"The game ends due to step into a hole locating at {position}."
	        return f"The game ends due to reach the max episode length {episode_len} and the player does not reach the goal."

	    def translate_potential_next_state(self, state, action):
	        """Describe the cell the player attempts to enter from ``state``.

	        Args:
	            state: Flat cell index on the 4x4 grid (anything ``int()`` accepts).
	            action: Action code 1-4, given as an int or a string.

	        Returns:
	            A sentence fragment with the targeted (row, column). The target is
	            not clamped to the grid, and an unrecognised action leaves the
	            coordinates unchanged.
	        """
	        row, col = divmod(int(state), self._GRID_SIZE)
	        d_row, d_col = self._ACTION_DELTAS.get(str(action), (0, 0))
	        return f"He tries to step into location ({row + d_row}, {col + d_col}),"

	    def describe_game(self):
	        """Return the general description of the FrozenLake rules."""
	        # As in describe_goal, the optional fragments carry their own leading
	        # separator so local-observation mode does not emit "position ."
	        goal_hint = "" if self.is_only_local_obs else " located at (3,3)"
	        holes_hint = (
	            "" if self.is_only_local_obs
	            else ". These holes are located at (1,1), (1,3), (2,3) and (3,0)"
	        )
	        return (
	            "In the FrozenLake game, the player starts at the start position of the grid and tries to reach the"
	            f" goal position{goal_hint}. There are holes which the player must avoid{holes_hint}. The frozen lake is "
	            "slippery, meaning that the player might not always move in the intended direction. The game ends"
	            " when the player reaches the goal or falls into a hole."
	        )

	    def describe_action(self):
	        """Return the prompt listing the four valid actions and their effect."""
	        return (
	            "Your Next Move: \n Please choose an action. For current position ('x', 'y'), the action means the player try to step into the next position. The possible actions are:"
	            "\n '1': Move left, which means ('x', 'y-1'), "
	            "\n '2': Move down, which means ('x+1', 'y'),"
	            "\n '3': Move right, which means ('x', 'y+1'),"
	            "\n '4': Move up, which means trying to step into ('x-1', 'y')."
	            " Ensure you only provide the action number from the valid action list, i.e., [1, 2, 3, 4]."
	        )

	class BasicStateSequenceTranslator(BasicLevelTranslator):
	    """Describe a sequence of transition records, or just the most recent state."""

	    # Index i holds the direction word for action code i + 1.
	    _ACTION_DIRECTIONS = ('left', 'down', 'right', 'up')

	    def translate(self, infos, is_current=False):
	        """Translate transition records into text.

	        Args:
	            infos: Sequence of dicts. Each record is read for the keys
	                ``'state'``, ``'action'`` (1-based code), ``'reward'`` and
	                ``'next_state'``; with ``is_current`` only ``'state'`` of the
	                last record is read.
	            is_current: When true, return only the description of the last
	                record's state.

	        Returns:
	            A single sentence (``str``) when ``is_current`` is true,
	            otherwise a list with one multi-line description per record.

	        Raises:
	            AssertionError: If a record has no ``'state'`` key (history mode).
	        """
	        # One shared position translator instead of a fresh instance per call.
	        position_translator = BasicLevelTranslator()
	        if is_current:
	            return position_translator.translate(infos[-1]['state'])

	        descriptions = []
	        for info in infos:
	            assert 'state' in info, "info should contain state information"

	            state_desc = position_translator.translate(info['state'])
	            direction = self._ACTION_DIRECTIONS[info['action'] - 1]
	            action_desc = f"Take Action: Move {direction} ({info['action']})."
	            reward_desc = f"Result: Reward of {info['reward']}, "
	            next_state_desc = position_translator.translate(info['next_state'])
	            # state_desc already ends with a period, so none is added here
	            # (the entry previously read "... column 0..").
	            descriptions.append(
	                f"{state_desc}\n {action_desc} \n {reward_desc} \n Transit to {next_state_desc}"
	            )
	        return descriptions