logger.py 7.9 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246
  1. import logging
  2. import os
  3. import re
  4. import sys
  5. import traceback
  6. from datetime import datetime
  7. from typing import Literal, Mapping
  8. from termcolor import colored
# When True, ColoredFormatter skips its colored branch even for message types
# that have an entry in LOG_COLORS.
DISABLE_COLOR_PRINTING = False

# Module-wide debug switch: the handlers and loggers built in this module are
# set to DEBUG level when it is True, and the LLM log directory handling
# changes (timestamped session directory, no clearing of old files).
DEBUG = False

# Closed set of color names allowed as values in LOG_COLORS.
ColorType = Literal[
    'red',
    'green',
    'yellow',
    'blue',
    'magenta',
    'cyan',
    'light_grey',
    'dark_grey',
    'light_red',
    'light_green',
    'light_yellow',
    'light_blue',
    'light_magenta',
    'light_cyan',
    'white',
]

# Maps a record's message type to the color ColoredFormatter uses for it.
# Keys prefixed with 'USER_' are looked up when the record carries an
# event_source whose upper-cased value is 'USER'.
LOG_COLORS: Mapping[str, ColorType] = {
    'ACTION': 'green',
    'USER_ACTION': 'light_red',
    'OBSERVATION': 'yellow',
    'USER_OBSERVATION': 'light_green',
    'DETAIL': 'cyan',
    'ERROR': 'red',
    'PLAN': 'light_magenta',
}
  37. class ColoredFormatter(logging.Formatter):
  38. def format(self, record):
  39. msg_type = record.__dict__.get('msg_type')
  40. event_source = record.__dict__.get('event_source')
  41. if event_source:
  42. new_msg_type = f'{event_source.upper()}_{msg_type}'
  43. if new_msg_type in LOG_COLORS:
  44. msg_type = new_msg_type
  45. if msg_type in LOG_COLORS and not DISABLE_COLOR_PRINTING:
  46. msg_type_color = colored(msg_type, LOG_COLORS[msg_type])
  47. msg = colored(record.msg, LOG_COLORS[msg_type])
  48. time_str = colored(
  49. self.formatTime(record, self.datefmt), LOG_COLORS[msg_type]
  50. )
  51. name_str = colored(record.name, LOG_COLORS[msg_type])
  52. level_str = colored(record.levelname, LOG_COLORS[msg_type])
  53. if msg_type in ['ERROR'] or DEBUG:
  54. return f'{time_str} - {name_str}:{level_str}: {record.filename}:{record.lineno}\n{msg_type_color}\n{msg}'
  55. return f'{time_str} - {msg_type_color}\n{msg}'
  56. elif msg_type == 'STEP':
  57. msg = '\n\n==============\n' + record.msg + '\n'
  58. return f'{msg}'
  59. return super().format(record)
# Console formatter: ColoredFormatter falls back to this format string for
# records it does not color; the timestamp/name/level prefix is wrapped in the
# ANSI escape codes \033[92m ... \033[0m.
console_formatter = ColoredFormatter(
    '\033[92m%(asctime)s - %(name)s:%(levelname)s\033[0m: %(filename)s:%(lineno)s - %(message)s',
    datefmt='%H:%M:%S',
)

# File formatter: same fields as the console format, without escape codes.
file_formatter = logging.Formatter(
    '%(asctime)s - %(name)s:%(levelname)s: %(filename)s:%(lineno)s - %(message)s',
    datefmt='%H:%M:%S',
)

# LLM prompt/response logs contain only the message text.
llm_formatter = logging.Formatter('%(message)s')
  69. class SensitiveDataFilter(logging.Filter):
  70. def filter(self, record):
  71. # start with attributes
  72. sensitive_patterns = [
  73. 'api_key',
  74. 'aws_access_key_id',
  75. 'aws_secret_access_key',
  76. 'e2b_api_key',
  77. 'github_token',
  78. 'jwt_secret',
  79. 'ssh_password',
  80. ]
  81. # add env var names
  82. env_vars = [attr.upper() for attr in sensitive_patterns]
  83. sensitive_patterns.extend(env_vars)
  84. # and some special cases
  85. sensitive_patterns.append('JWT_SECRET')
  86. sensitive_patterns.append('LLM_API_KEY')
  87. sensitive_patterns.append('GITHUB_TOKEN')
  88. sensitive_patterns.append('SANDBOX_ENV_GITHUB_TOKEN')
  89. # this also formats the message with % args
  90. msg = record.getMessage()
  91. record.args = ()
  92. for attr in sensitive_patterns:
  93. pattern = rf"{attr}='?([\w-]+)'?"
  94. msg = re.sub(pattern, f"{attr}='******'", msg)
  95. # passed with msg
  96. record.msg = msg
  97. return True
  98. def get_console_handler():
  99. """Returns a console handler for logging."""
  100. console_handler = logging.StreamHandler()
  101. console_handler.setLevel(logging.INFO)
  102. if DEBUG:
  103. console_handler.setLevel(logging.DEBUG)
  104. console_handler.setFormatter(console_formatter)
  105. return console_handler
  106. def get_file_handler(log_dir=None):
  107. """Returns a file handler for logging."""
  108. log_dir = os.path.join(os.getcwd(), 'logs') if log_dir is None else log_dir
  109. os.makedirs(log_dir, exist_ok=True)
  110. timestamp = datetime.now().strftime('%Y-%m-%d')
  111. file_name = f'opendevin_{timestamp}.log'
  112. file_handler = logging.FileHandler(os.path.join(log_dir, file_name))
  113. if DEBUG:
  114. file_handler.setLevel(logging.DEBUG)
  115. file_handler.setFormatter(file_formatter)
  116. return file_handler
# Set up logging
# Configure the root logger at ERROR level; log_uncaught_exceptions reports
# through the root logger via logging.error.
logging.basicConfig(level=logging.ERROR)
  119. def log_uncaught_exceptions(ex_cls, ex, tb):
  120. """Logs uncaught exceptions along with the traceback.
  121. Args:
  122. ex_cls (type): The type of the exception.
  123. ex (Exception): The exception instance.
  124. tb (traceback): The traceback object.
  125. Returns:
  126. None
  127. """
  128. logging.error(''.join(traceback.format_tb(tb)))
  129. logging.error('{0}: {1}'.format(ex_cls, ex))
  130. sys.excepthook = log_uncaught_exceptions
  131. opendevin_logger = logging.getLogger('opendevin')
  132. opendevin_logger.setLevel(logging.INFO)
  133. if DEBUG:
  134. opendevin_logger.setLevel(logging.DEBUG)
  135. opendevin_logger.addHandler(get_file_handler())
  136. opendevin_logger.addHandler(get_console_handler())
  137. opendevin_logger.addFilter(SensitiveDataFilter(opendevin_logger.name))
  138. opendevin_logger.propagate = False
  139. opendevin_logger.debug('Logging initialized')
  140. opendevin_logger.debug(
  141. 'Logging to %s', os.path.join(os.getcwd(), 'logs', 'opendevin.log')
  142. )
  143. # Exclude LiteLLM from logging output
  144. logging.getLogger('LiteLLM').disabled = True
  145. logging.getLogger('LiteLLM Router').disabled = True
  146. logging.getLogger('LiteLLM Proxy').disabled = True
  147. class LlmFileHandler(logging.FileHandler):
  148. """# LLM prompt and response logging"""
  149. def __init__(self, filename, mode='a', encoding='utf-8', delay=False):
  150. """Initializes an instance of LlmFileHandler.
  151. Args:
  152. filename (str): The name of the log file.
  153. mode (str, optional): The file mode. Defaults to 'a'.
  154. encoding (str, optional): The file encoding. Defaults to None.
  155. delay (bool, optional): Whether to delay file opening. Defaults to False.
  156. """
  157. self.filename = filename
  158. self.message_counter = 1
  159. if DEBUG:
  160. self.session = datetime.now().strftime('%y-%m-%d_%H-%M')
  161. else:
  162. self.session = 'default'
  163. self.log_directory = os.path.join(os.getcwd(), 'logs', 'llm', self.session)
  164. os.makedirs(self.log_directory, exist_ok=True)
  165. if not DEBUG:
  166. # Clear the log directory if not in debug mode
  167. for file in os.listdir(self.log_directory):
  168. file_path = os.path.join(self.log_directory, file)
  169. try:
  170. os.unlink(file_path)
  171. except Exception as e:
  172. opendevin_logger.error(
  173. 'Failed to delete %s. Reason: %s', file_path, e
  174. )
  175. filename = f'{self.filename}_{self.message_counter:03}.log'
  176. self.baseFilename = os.path.join(self.log_directory, filename)
  177. super().__init__(self.baseFilename, mode, encoding, delay)
  178. def emit(self, record):
  179. """Emits a log record.
  180. Args:
  181. record (logging.LogRecord): The log record to emit.
  182. """
  183. filename = f'{self.filename}_{self.message_counter:03}.log'
  184. self.baseFilename = os.path.join(self.log_directory, filename)
  185. self.stream = self._open()
  186. super().emit(record)
  187. self.stream.close()
  188. opendevin_logger.debug('Logging to %s', self.baseFilename)
  189. self.message_counter += 1
  190. def _get_llm_file_handler(name, debug_level=logging.DEBUG):
  191. # The 'delay' parameter, when set to True, postpones the opening of the log file
  192. # until the first log message is emitted.
  193. llm_file_handler = LlmFileHandler(name, delay=True)
  194. llm_file_handler.setFormatter(llm_formatter)
  195. llm_file_handler.setLevel(debug_level)
  196. return llm_file_handler
  197. def _setup_llm_logger(name, debug_level=logging.DEBUG):
  198. logger = logging.getLogger(name)
  199. logger.propagate = False
  200. logger.setLevel(debug_level)
  201. logger.addHandler(_get_llm_file_handler(name, debug_level))
  202. return logger
# Dedicated loggers for LLM traffic: records sent to them are written by an
# LlmFileHandler to files whose names start with 'prompt' and 'response'
# respectively.
llm_prompt_logger = _setup_llm_logger('prompt', logging.DEBUG)
llm_response_logger = _setup_llm_logger('response', logging.DEBUG)