Spaces:
Build error
Build error
import copy | |
import logging | |
import os | |
import re | |
import sys | |
import traceback | |
from datetime import datetime | |
from types import TracebackType | |
from typing import Any, Literal, Mapping, MutableMapping, TextIO | |
import litellm | |
from pythonjsonlogger.json import JsonFormatter | |
from termcolor import colored | |
LOG_LEVEL = os.getenv('LOG_LEVEL', 'INFO').upper() | |
DEBUG = os.getenv('DEBUG', 'False').lower() in ['true', '1', 'yes'] | |
DEBUG_LLM = os.getenv('DEBUG_LLM', 'False').lower() in ['true', '1', 'yes'] | |
# Structured logs with JSON, disabled by default | |
LOG_JSON = os.getenv('LOG_JSON', 'False').lower() in ['true', '1', 'yes'] | |
LOG_JSON_LEVEL_KEY = os.getenv('LOG_JSON_LEVEL_KEY', 'level') | |
# Configure litellm logging based on DEBUG_LLM | |
if DEBUG_LLM: | |
confirmation = input( | |
'\n⚠️ WARNING: You are enabling DEBUG_LLM which may expose sensitive information like API keys.\n' | |
'This should NEVER be enabled in production.\n' | |
"Type 'y' to confirm you understand the risks: " | |
) | |
if confirmation.lower() == 'y': | |
litellm.suppress_debug_info = False | |
litellm.set_verbose = True | |
else: | |
print('DEBUG_LLM disabled due to lack of confirmation') | |
litellm.suppress_debug_info = True | |
litellm.set_verbose = False | |
else: | |
litellm.suppress_debug_info = True | |
litellm.set_verbose = False | |
if DEBUG: | |
LOG_LEVEL = 'DEBUG' | |
LOG_TO_FILE = os.getenv('LOG_TO_FILE', 'False').lower() in ['true', '1', 'yes'] | |
DISABLE_COLOR_PRINTING = False | |
LOG_ALL_EVENTS = os.getenv('LOG_ALL_EVENTS', 'False').lower() in ['true', '1', 'yes'] | |
# Controls whether to stream Docker container logs | |
DEBUG_RUNTIME = os.getenv('DEBUG_RUNTIME', 'False').lower() in ['true', '1', 'yes'] | |
ColorType = Literal[ | |
'red', | |
'green', | |
'yellow', | |
'blue', | |
'magenta', | |
'cyan', | |
'light_grey', | |
'dark_grey', | |
'light_red', | |
'light_green', | |
'light_yellow', | |
'light_blue', | |
'light_magenta', | |
'light_cyan', | |
'white', | |
] | |
LOG_COLORS: Mapping[str, ColorType] = { | |
'ACTION': 'green', | |
'USER_ACTION': 'light_red', | |
'OBSERVATION': 'yellow', | |
'USER_OBSERVATION': 'light_green', | |
'DETAIL': 'cyan', | |
'ERROR': 'red', | |
'PLAN': 'light_magenta', | |
} | |
class StackInfoFilter(logging.Filter): | |
def filter(self, record: logging.LogRecord) -> bool: | |
if record.levelno >= logging.ERROR: | |
# Only add stack trace info if there's an actual exception | |
exc_info = sys.exc_info() | |
if exc_info and exc_info[0] is not None: | |
# Capture the current stack trace as a string | |
stack = traceback.format_stack() | |
# Remove the last entries which are related to the logging machinery | |
stack = stack[:-3] # Adjust this number if needed | |
# Join the stack frames into a single string | |
stack_str = ''.join(stack) | |
setattr(record, 'stack_info', stack_str) | |
setattr(record, 'exc_info', exc_info) | |
return True | |
class NoColorFormatter(logging.Formatter): | |
"""Formatter for non-colored logging in files.""" | |
def format(self, record: logging.LogRecord) -> str: | |
# Create a deep copy of the record to avoid modifying the original | |
new_record = _fix_record(record) | |
# Strip ANSI color codes from the message | |
new_record.msg = strip_ansi(new_record.msg) | |
return super().format(new_record) | |
def strip_ansi(s: str) -> str: | |
"""Remove ANSI escape sequences (terminal color/formatting codes) from string. | |
Removes ANSI escape sequences from str, as defined by ECMA-048 in | |
http://www.ecma-international.org/publications/files/ECMA-ST/Ecma-048.pdf | |
# https://github.com/ewen-lbh/python-strip-ansi/blob/master/strip_ansi/__init__.py | |
""" | |
pattern = re.compile(r'\x1B\[\d+(;\d+){0,2}m') | |
stripped = pattern.sub('', s) | |
return stripped | |
class ColoredFormatter(logging.Formatter): | |
def format(self, record: logging.LogRecord) -> str: | |
msg_type = record.__dict__.get('msg_type', '') | |
event_source = record.__dict__.get('event_source', '') | |
if event_source: | |
new_msg_type = f'{event_source.upper()}_{msg_type}' | |
if new_msg_type in LOG_COLORS: | |
msg_type = new_msg_type | |
if msg_type in LOG_COLORS and not DISABLE_COLOR_PRINTING: | |
msg_type_color = colored(msg_type, LOG_COLORS[msg_type]) | |
msg = colored(record.msg, LOG_COLORS[msg_type]) | |
time_str = colored( | |
self.formatTime(record, self.datefmt), LOG_COLORS[msg_type] | |
) | |
name_str = colored(record.name, LOG_COLORS[msg_type]) | |
level_str = colored(record.levelname, LOG_COLORS[msg_type]) | |
if msg_type in ['ERROR'] or DEBUG: | |
return f'{time_str} - {name_str}:{level_str}: {record.filename}:{record.lineno}\n{msg_type_color}\n{msg}' | |
return f'{time_str} - {msg_type_color}\n{msg}' | |
elif msg_type == 'STEP': | |
if LOG_ALL_EVENTS: | |
msg = '\n\n==============\n' + record.msg + '\n' | |
return f'{msg}' | |
else: | |
return record.msg | |
new_record = _fix_record(record) | |
return super().format(new_record) | |
def _fix_record(record: logging.LogRecord) -> logging.LogRecord: | |
new_record = copy.copy(record) | |
# The formatter expects non boolean values, and will raise an exception if there is a boolean - so we fix these | |
# LogRecord attributes are dynamically typed | |
if getattr(new_record, 'exc_info', None) is True: | |
setattr(new_record, 'exc_info', sys.exc_info()) | |
setattr(new_record, 'stack_info', None) | |
return new_record | |
file_formatter = NoColorFormatter( | |
'%(asctime)s - %(name)s:%(levelname)s: %(filename)s:%(lineno)s - %(message)s', | |
datefmt='%H:%M:%S', | |
) | |
llm_formatter = logging.Formatter('%(message)s') | |
class RollingLogger: | |
max_lines: int | |
char_limit: int | |
log_lines: list[str] | |
all_lines: str | |
def __init__(self, max_lines: int = 10, char_limit: int = 80) -> None: | |
self.max_lines = max_lines | |
self.char_limit = char_limit | |
self.log_lines = [''] * self.max_lines | |
self.all_lines = '' | |
def is_enabled(self) -> bool: | |
return DEBUG and sys.stdout.isatty() | |
def start(self, message: str = '') -> None: | |
if message: | |
print(message) | |
self._write('\n' * self.max_lines) | |
self._flush() | |
def add_line(self, line: str) -> None: | |
self.log_lines.pop(0) | |
self.log_lines.append(line[: self.char_limit]) | |
self.print_lines() | |
self.all_lines += line + '\n' | |
def write_immediately(self, line: str) -> None: | |
self._write(line) | |
self._flush() | |
def print_lines(self) -> None: | |
"""Display the last n log_lines in the console (not for file logging). | |
This will create the effect of a rolling display in the console. | |
""" | |
self.move_back() | |
for line in self.log_lines: | |
self.replace_current_line(line) | |
def move_back(self, amount: int = -1) -> None: | |
r"""'\033[F' moves the cursor up one line.""" | |
if amount == -1: | |
amount = self.max_lines | |
self._write('\033[F' * (self.max_lines)) | |
self._flush() | |
def replace_current_line(self, line: str = '') -> None: | |
r"""'\033[2K\r' clears the line and moves the cursor to the beginning of the line.""" | |
self._write('\033[2K' + line + '\n') | |
self._flush() | |
def _write(self, line: str) -> None: | |
if not self.is_enabled(): | |
return | |
sys.stdout.write(line) | |
def _flush(self) -> None: | |
if not self.is_enabled(): | |
return | |
sys.stdout.flush() | |
class SensitiveDataFilter(logging.Filter): | |
def filter(self, record: logging.LogRecord) -> bool: | |
# Gather sensitive values which should not ever appear in the logs. | |
sensitive_values = [] | |
for key, value in os.environ.items(): | |
key_upper = key.upper() | |
if ( | |
len(value) > 2 | |
and value != 'default' | |
and any(s in key_upper for s in ('SECRET', '_KEY', '_CODE', '_TOKEN')) | |
): | |
sensitive_values.append(value) | |
# Replace sensitive values from env! | |
msg = record.getMessage() | |
for sensitive_value in sensitive_values: | |
msg = msg.replace(sensitive_value, '******') | |
# Replace obvious sensitive values from log itself... | |
sensitive_patterns = [ | |
'api_key', | |
'aws_access_key_id', | |
'aws_secret_access_key', | |
'e2b_api_key', | |
'github_token', | |
'jwt_secret', | |
'modal_api_token_id', | |
'modal_api_token_secret', | |
'llm_api_key', | |
'sandbox_env_github_token', | |
'daytona_api_key', | |
] | |
# add env var names | |
env_vars = [attr.upper() for attr in sensitive_patterns] | |
sensitive_patterns.extend(env_vars) | |
for attr in sensitive_patterns: | |
pattern = rf"{attr}='?([\w-]+)'?" | |
msg = re.sub(pattern, f"{attr}='******'", msg) | |
# Update the record | |
record.msg = msg | |
record.args = () | |
return True | |
def get_console_handler(log_level: int = logging.INFO) -> logging.StreamHandler: | |
"""Returns a console handler for logging.""" | |
console_handler = logging.StreamHandler() | |
console_handler.setLevel(log_level) | |
formatter_str = '\033[92m%(asctime)s - %(name)s:%(levelname)s\033[0m: %(filename)s:%(lineno)s - %(message)s' | |
console_handler.setFormatter(ColoredFormatter(formatter_str, datefmt='%H:%M:%S')) | |
return console_handler | |
def get_file_handler( | |
log_dir: str, log_level: int = logging.INFO | |
) -> logging.FileHandler: | |
"""Returns a file handler for logging.""" | |
os.makedirs(log_dir, exist_ok=True) | |
timestamp = datetime.now().strftime('%Y-%m-%d') | |
file_name = f'openhands_{timestamp}.log' | |
file_handler = logging.FileHandler(os.path.join(log_dir, file_name)) | |
file_handler.setLevel(log_level) | |
if LOG_JSON: | |
file_handler.setFormatter(json_formatter()) | |
else: | |
file_handler.setFormatter(file_formatter) | |
return file_handler | |
def json_formatter() -> JsonFormatter: | |
return JsonFormatter( | |
'{message}{levelname}', | |
style='{', | |
rename_fields={'levelname': LOG_JSON_LEVEL_KEY}, | |
timestamp=True, | |
) | |
def json_log_handler( | |
level: int = logging.INFO, | |
_out: TextIO = sys.stdout, | |
) -> logging.Handler: | |
""" | |
Configure logger instance for structured logging as json lines. | |
""" | |
handler = logging.StreamHandler(_out) | |
handler.setLevel(level) | |
handler.setFormatter(json_formatter()) | |
return handler | |
# Set up logging | |
logging.basicConfig(level=logging.ERROR) | |
def log_uncaught_exceptions( | |
ex_cls: type[BaseException], ex: BaseException, tb: TracebackType | None | |
) -> Any: | |
"""Logs uncaught exceptions along with the traceback. | |
Args: | |
ex_cls: The type of the exception. | |
ex: The exception instance. | |
tb: The traceback object. | |
Returns: | |
None | |
""" | |
if tb: # Add check since tb can be None | |
logging.error(''.join(traceback.format_tb(tb))) | |
logging.error('{0}: {1}'.format(ex_cls, ex)) | |
sys.excepthook = log_uncaught_exceptions | |
openhands_logger = logging.getLogger('openhands') | |
current_log_level = logging.INFO | |
if LOG_LEVEL in logging.getLevelNamesMapping(): | |
current_log_level = logging.getLevelNamesMapping()[LOG_LEVEL] | |
openhands_logger.setLevel(current_log_level) | |
if DEBUG: | |
openhands_logger.addFilter(StackInfoFilter()) | |
if current_log_level == logging.DEBUG: | |
LOG_TO_FILE = True | |
openhands_logger.debug('DEBUG mode enabled.') | |
if LOG_JSON: | |
openhands_logger.addHandler(json_log_handler(current_log_level)) | |
else: | |
openhands_logger.addHandler(get_console_handler(current_log_level)) | |
openhands_logger.addFilter(SensitiveDataFilter(openhands_logger.name)) | |
openhands_logger.propagate = False | |
openhands_logger.debug('Logging initialized') | |
LOG_DIR = os.path.join( | |
# parent dir of openhands/core (i.e., root of the repo) | |
os.path.dirname(os.path.dirname(os.path.dirname(os.path.abspath(__file__)))), | |
'logs', | |
) | |
if LOG_TO_FILE: | |
openhands_logger.addHandler( | |
get_file_handler(LOG_DIR, current_log_level) | |
) # default log to project root | |
openhands_logger.debug(f'Logging to file in: {LOG_DIR}') | |
# Exclude LiteLLM from logging output as it can leak keys | |
logging.getLogger('LiteLLM').disabled = True | |
logging.getLogger('LiteLLM Router').disabled = True | |
logging.getLogger('LiteLLM Proxy').disabled = True | |
# Exclude loquacious loggers | |
LOQUACIOUS_LOGGERS = [ | |
'engineio', | |
'engineio.server', | |
'socketio', | |
'socketio.client', | |
'socketio.server', | |
] | |
for logger_name in LOQUACIOUS_LOGGERS: | |
logging.getLogger(logger_name).setLevel('WARNING') | |
class LlmFileHandler(logging.FileHandler): | |
"""LLM prompt and response logging.""" | |
def __init__( | |
self, | |
filename: str, | |
mode: str = 'a', | |
encoding: str = 'utf-8', | |
delay: bool = False, | |
) -> None: | |
"""Initializes an instance of LlmFileHandler. | |
Args: | |
filename (str): The name of the log file. | |
mode (str, optional): The file mode. Defaults to 'a'. | |
encoding (str, optional): The file encoding. Defaults to None. | |
delay (bool, optional): Whether to delay file opening. Defaults to False. | |
""" | |
self.filename = filename | |
self.message_counter = 1 | |
if DEBUG: | |
self.session = datetime.now().strftime('%y-%m-%d_%H-%M') | |
else: | |
self.session = 'default' | |
self.log_directory = os.path.join(LOG_DIR, 'llm', self.session) | |
os.makedirs(self.log_directory, exist_ok=True) | |
if not DEBUG: | |
# Clear the log directory if not in debug mode | |
for file in os.listdir(self.log_directory): | |
file_path = os.path.join(self.log_directory, file) | |
try: | |
os.unlink(file_path) | |
except Exception as e: | |
openhands_logger.error( | |
'Failed to delete %s. Reason: %s', file_path, e | |
) | |
filename = f'{self.filename}_{self.message_counter:03}.log' | |
self.baseFilename = os.path.join(self.log_directory, filename) | |
super().__init__(self.baseFilename, mode, encoding, delay) | |
def emit(self, record: logging.LogRecord) -> None: | |
"""Emits a log record. | |
Args: | |
record (logging.LogRecord): The log record to emit. | |
""" | |
filename = f'{self.filename}_{self.message_counter:03}.log' | |
self.baseFilename = os.path.join(self.log_directory, filename) | |
self.stream = self._open() | |
super().emit(record) | |
self.stream.close() | |
openhands_logger.debug('Logging to %s', self.baseFilename) | |
self.message_counter += 1 | |
def _get_llm_file_handler(name: str, log_level: int) -> LlmFileHandler: | |
# The 'delay' parameter, when set to True, postpones the opening of the log file | |
# until the first log message is emitted. | |
llm_file_handler = LlmFileHandler(name, delay=True) | |
llm_file_handler.setFormatter(llm_formatter) | |
llm_file_handler.setLevel(log_level) | |
return llm_file_handler | |
def _setup_llm_logger(name: str, log_level: int) -> logging.Logger: | |
logger = logging.getLogger(name) | |
logger.propagate = False | |
logger.setLevel(log_level) | |
if LOG_TO_FILE: | |
logger.addHandler(_get_llm_file_handler(name, log_level)) | |
return logger | |
llm_prompt_logger = _setup_llm_logger('prompt', current_log_level) | |
llm_response_logger = _setup_llm_logger('response', current_log_level) | |
class OpenHandsLoggerAdapter(logging.LoggerAdapter): | |
extra: dict | |
def __init__( | |
self, logger: logging.Logger = openhands_logger, extra: dict | None = None | |
) -> None: | |
self.logger = logger | |
self.extra = extra or {} | |
def process( | |
self, msg: str, kwargs: MutableMapping[str, Any] | |
) -> tuple[str, MutableMapping[str, Any]]: | |
""" | |
If 'extra' is supplied in kwargs, merge it with the adapters 'extra' dict | |
Starting in Python 3.13, LoggerAdapter's merge_extra option will do this. | |
""" | |
if 'extra' in kwargs and isinstance(kwargs['extra'], dict): | |
kwargs['extra'] = {**self.extra, **kwargs['extra']} | |
else: | |
kwargs['extra'] = self.extra | |
return msg, kwargs | |