Spaces:
Runtime error
Runtime error
File size: 8,237 Bytes
4bdab37 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 |
from typing import List, Union
import re
from tenacity import RetryError
import logging
import uuid
from abc import abstractmethod
import asyncio
from .backends import IntelligenceBackend, load_backend
from .message import Message, SYSTEM_NAME
from .config import AgentConfig, Configurable, BackendConfig
# Sentinel string a player sends when it cannot continue the conversation and
# requests that the conversation be ended.
# A random UUID is appended so that players cannot reproduce (and thereby exploit)
# the signal. The UUID is generated once, when this module is loaded.
SIGNAL_END_OF_CONVERSATION = f"<<<<<<END_OF_CONVERSATION>>>>>>{uuid.uuid4()}"
class Agent(Configurable):
    """
    Abstract base class shared by every agent in the chatArena environment.

    It records the identity fields common to all agents (name, role description and
    the optional global prompt) and hands the same fields to the ``Configurable`` base.
    """

    @abstractmethod
    def __init__(self, name: str, role_desc: str, global_prompt: str = None, *args, **kwargs):
        """
        Set up the fields common to all agents.

        Parameters:
            name (str): The name of the agent.
            role_desc (str): Description of the agent's role.
            global_prompt (str): A universal prompt that applies to all agents. Defaults to None.
            *args: Accepted for signature compatibility; not forwarded to the base class.
            **kwargs: Extra keyword fields forwarded unchanged to the base class initializer.
        """
        # The base class receives the common fields together with any extra keyword fields.
        common_fields = dict(name=name, role_desc=role_desc, global_prompt=global_prompt)
        super().__init__(**common_fields, **kwargs)

        # Mirror the common fields as plain attributes for direct access.
        self.name, self.role_desc, self.global_prompt = name, role_desc, global_prompt
class Player(Agent):
    """
    The Player class represents a player in the chatArena environment. A player can observe the environment
    and perform an action (generate a response) based on the observation.
    """

    def __init__(self, name: str, role_desc: str, backend: Union[BackendConfig, IntelligenceBackend],
                 global_prompt: str = None, **kwargs):
        """
        Initialize the player with a name, role description, backend, and a global prompt.

        Parameters:
            name (str): The name of the player.
            role_desc (str): Description of the player's role.
            backend (Union[BackendConfig, IntelligenceBackend]): The backend that will be used for decision making. It can be either a LLM backend or a Human backend.
            global_prompt (str): A universal prompt that applies to all players. Defaults to None.
            **kwargs: Extra keyword fields forwarded to the ``Agent`` initializer.

        Raises:
            ValueError: If ``backend`` is neither a BackendConfig nor an IntelligenceBackend.
            AssertionError: If ``name`` equals the reserved SYSTEM_NAME.
        """
        # Normalize the backend argument so that we end up with both a live backend
        # object and its config, regardless of which of the two was passed in.
        if isinstance(backend, BackendConfig):
            backend_config = backend
            backend = load_backend(backend_config)
        elif isinstance(backend, IntelligenceBackend):
            backend_config = backend.to_config()
        else:
            raise ValueError(f"backend must be a BackendConfig or an IntelligenceBackend, but got {type(backend)}")

        assert name != SYSTEM_NAME, f"Player name cannot be {SYSTEM_NAME}, which is reserved for the system."

        # Register the fields in the _config
        super().__init__(name=name, role_desc=role_desc, backend=backend_config,
                         global_prompt=global_prompt, **kwargs)

        self.backend = backend

    def to_config(self) -> AgentConfig:
        """
        Build an AgentConfig from the player's name, role description, backend config and global prompt.

        Returns:
            AgentConfig: The configuration describing this player.
        """
        return AgentConfig(
            name=self.name,
            role_desc=self.role_desc,
            backend=self.backend.to_config(),
            global_prompt=self.global_prompt,
        )

    def _failure_response(self, error: RetryError) -> str:
        """
        Log a backend failure and build the end-of-conversation response for it.

        Parameters:
            error (RetryError): The retry error raised by the backend query.

        Returns:
            str: SIGNAL_END_OF_CONVERSATION followed by the error description.
        """
        err_msg = f"Agent {self.name} failed to generate a response. Error: {error.last_attempt.exception()}. Sending signal to end the conversation."
        logging.warning(err_msg)
        return SIGNAL_END_OF_CONVERSATION + err_msg

    def act(self, observation: List[Message]) -> str:
        """
        Take an action based on the observation (Generate a response), which can later be parsed to actual actions that affect the game dynamics.

        Parameters:
            observation (List[Message]): The messages that the player has observed from the environment.

        Returns:
            str: The action (response) of the player. If the backend raises a RetryError, the
                response is SIGNAL_END_OF_CONVERSATION followed by the error description.
        """
        try:
            response = self.backend.query(agent_name=self.name, role_desc=self.role_desc,
                                          history_messages=observation, global_prompt=self.global_prompt,
                                          request_msg=None)
        except RetryError as e:
            response = self._failure_response(e)

        return response

    def __call__(self, observation: List[Message]) -> str:
        """Shorthand for ``act(observation)``."""
        return self.act(observation)

    async def async_act(self, observation: List[Message]) -> str:
        """
        Async version of act(). This is used when you want to generate a response asynchronously.

        Parameters:
            observation (List[Message]): The messages that the player has observed from the environment.

        Returns:
            str: The action (response) of the player. If the backend raises a RetryError, the
                response is SIGNAL_END_OF_CONVERSATION followed by the error description.
        """
        import inspect

        try:
            response = self.backend.async_query(agent_name=self.name, role_desc=self.role_desc,
                                                history_messages=observation, global_prompt=self.global_prompt,
                                                request_msg=None)
            # The query result must be awaited inside the try block: otherwise this method
            # would hand back an un-run awaitable instead of a str, and a RetryError raised
            # while the query runs would escape the handler below.
            if inspect.isawaitable(response):
                response = await response
        except RetryError as e:
            response = self._failure_response(e)

        return response

    def reset(self):
        """
        Reset the player's backend in case they are not stateless.
        This is usually called at the end of each episode.
        """
        self.backend.reset()
class Moderator(Player):
    """
    The Moderator class represents a special type of player that moderates the conversation.
    It is usually used as a component of the environment when the transition dynamics is conditioned on natural language that are not easy to parse programmatically.
    """

    # Matches a response that starts (after optional whitespace) with an affirmative word.
    # The trailing \b keeps words that merely begin with "y" or "ok" (e.g. "You", "yet")
    # from being read as "y"/"ok".
    _AFFIRMATIVE_RESPONSE = re.compile(
        r"\s*(?:yes|y|yea|yeah|yep|yup|sure|ok|okay|alright)\b", re.IGNORECASE)

    def __init__(self, role_desc: str, backend: Union[BackendConfig, IntelligenceBackend],
                 terminal_condition: str, global_prompt: str = None, **kwargs):
        """
        Initialize the moderator with a role description, backend, terminal condition, and a global prompt.

        Parameters:
            role_desc (str): Description of the moderator's role.
            backend (Union[BackendConfig, IntelligenceBackend]): The backend that will be used for decision making.
            terminal_condition (str): The condition that signifies the end of the conversation.
            global_prompt (str): A universal prompt that applies to the moderator. Defaults to None.
            **kwargs: Extra keyword fields forwarded to the ``Player`` initializer.
        """
        # The moderator always uses this fixed name.
        name = "Moderator"
        super().__init__(name=name, role_desc=role_desc, backend=backend, global_prompt=global_prompt, **kwargs)

        self.terminal_condition = terminal_condition

    def to_config(self) -> AgentConfig:
        """
        Build an AgentConfig for the moderator, including its terminal condition.

        Returns:
            AgentConfig: The configuration describing this moderator.
        """
        return AgentConfig(
            name=self.name,
            role_desc=self.role_desc,
            backend=self.backend.to_config(),
            terminal_condition=self.terminal_condition,
            global_prompt=self.global_prompt,
        )

    def is_terminal(self, history: List[Message], *args, **kwargs) -> bool:
        """
        Check whether an episode is terminated based on the terminal condition.

        Parameters:
            history (List[Message]): The conversation history.
            *args, **kwargs: Forwarded unchanged to the backend query.

        Returns:
            bool: True if the conversation is over, otherwise False.
        """
        # If the last message carries the end-of-conversation signal, the conversation is over.
        # Players append an error description after the signal, so test the prefix rather
        # than exact equality. An empty history simply has no signal to check.
        if history:
            last_content = history[-1].content
            if isinstance(last_content, str) and last_content.startswith(SIGNAL_END_OF_CONVERSATION):
                return True

        # Ask the backend whether the terminal condition holds for this history.
        request_msg = Message(agent_name=self.name, content=self.terminal_condition, turn=-1)
        try:
            response = self.backend.query(*args, agent_name=self.name, role_desc=self.role_desc,
                                          history_messages=history, global_prompt=self.global_prompt,
                                          request_msg=request_msg, **kwargs)
        except RetryError as e:
            logging.warning(f"Agent {self.name} failed to generate a response. "
                            f"Error: {e.last_attempt.exception()}.")
            # A backend that cannot answer ends the episode.
            return True

        # An affirmative answer means the terminal condition is met.
        return bool(self._AFFIRMATIVE_RESPONSE.match(response))
|