Small refactoring (#1614)

* move MemoryCondenser, LongTermMemory, and json out of the monologue

* PlannerAgent and Microagents use the custom json.loads/dumps

* Move short term history out of monologue agent...

* move memory modules into their own package

* add __init__
Engel Nyst, 1 year ago
commit 98adbf54ec

+ 4 - 17
agenthub/micro/agent.py

@@ -1,10 +1,11 @@
-import json
+from json import JSONDecodeError

 from jinja2 import BaseLoader, Environment

 from opendevin.controller.agent import Agent
 from opendevin.controller.state.state import State
 from opendevin.core.exceptions import LLMOutputError
+from opendevin.core.utils import json
 from opendevin.events.action import Action, action_from_dict
 from opendevin.llm.llm import LLM

@@ -28,32 +29,18 @@ def parse_response(orig_response: str) -> Action:
                     action_dict = json.loads(response)
                     action = action_from_dict(action_dict)
                     return action
-                except json.JSONDecodeError as e:
+                except JSONDecodeError as e:
                     raise LLMOutputError(
                         'Invalid JSON in response. Please make sure the response is a valid JSON object.'
                     ) from e
     raise LLMOutputError('No valid JSON object found in response.')


-def my_encoder(obj):
-    """
-    Encodes objects as dictionaries
-
-    Parameters:
-    - obj (Object): An object that will be converted
-
-    Returns:
-    - dict: If the object can be converted it is returned in dict format
-    """
-    if hasattr(obj, 'to_dict'):
-        return obj.to_dict()
-
-
 def to_json(obj, **kwargs):
     """
     Serialize an object to str format
     """
-    return json.dumps(obj, default=my_encoder, **kwargs)
+    return json.dumps(obj, **kwargs)


 class MicroAgent(Agent):
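
The removed `my_encoder` helper is presumably not gone but folded into the shared wrapper: `to_json` can drop its `default=` argument only if `opendevin.core.utils.json` applies an equivalent `to_dict`-aware encoder itself. A minimal sketch of that assumption (the wrapper module's body is not part of this diff, so names here are hypothetical):

import json as _json


def _default(obj):
    # Mirror the removed my_encoder: objects exposing to_dict() are
    # serialized via their dict representation.
    if hasattr(obj, 'to_dict'):
        return obj.to_dict()
    raise TypeError(f'{type(obj).__name__} is not JSON serializable')


def dumps(obj, **kwargs):
    # Bake the default encoder in, so callers can simply call json.dumps(obj).
    return _json.dumps(obj, default=_default, **kwargs)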

+ 23 - 15
agenthub/monologue_agent/agent.py

@@ -1,5 +1,4 @@
 import agenthub.monologue_agent.utils.prompts as prompts
-from agenthub.monologue_agent.utils.monologue import Monologue
 from opendevin.controller.agent import Agent
 from opendevin.controller.state.state import State
 from opendevin.core.config import config
@@ -24,9 +23,11 @@ from opendevin.events.observation import (
     Observation,
 )
 from opendevin.llm.llm import LLM
+from opendevin.memory.condenser import MemoryCondenser
+from opendevin.memory.history import ShortTermHistory

 if config.agent.memory_enabled:
-    from agenthub.monologue_agent.utils.memory import LongTermMemory
+    from opendevin.memory.memory import LongTermMemory

 MAX_TOKEN_COUNT_PADDING = 512
 MAX_OUTPUT_LENGTH = 5000
@@ -85,8 +86,9 @@ class MonologueAgent(Agent):
     """

     _initialized = False
-    monologue: Monologue
+    monologue: ShortTermHistory
     memory: 'LongTermMemory | None'
+    memory_condenser: MemoryCondenser

     def __init__(self, llm: LLM):
         """
@@ -97,7 +99,7 @@ class MonologueAgent(Agent):
         """
         super().__init__(llm)

-    def _add_event(self, event: dict):
+    def _add_event(self, event_dict: dict):
         """
         Adds a new event to the agent's monologue and memory.
         Monologue automatically condenses when it gets too large.
@@ -107,29 +109,33 @@ class MonologueAgent(Agent):
         """

         if (
-            'args' in event
-            and 'output' in event['args']
-            and len(event['args']['output']) > MAX_OUTPUT_LENGTH
+            'args' in event_dict
+            and 'output' in event_dict['args']
+            and len(event_dict['args']['output']) > MAX_OUTPUT_LENGTH
         ):
-            event['args']['output'] = (
-                event['args']['output'][:MAX_OUTPUT_LENGTH] + '...'
+            event_dict['args']['output'] = (
+                event_dict['args']['output'][:MAX_OUTPUT_LENGTH] + '...'
             )

-        self.monologue.add_event(event)
+        self.monologue.add_event(event_dict)
         if self.memory is not None:
-            self.memory.add_event(event)
+            self.memory.add_event(event_dict)

         # Test monologue token length
         prompt = prompts.get_request_action_prompt(
             '',
-            self.monologue.get_thoughts(),
+            self.monologue.get_events(),
             [],
         )
         messages = [{'content': prompt, 'role': 'user'}]
         token_count = self.llm.get_token_count(messages)

         if token_count + MAX_TOKEN_COUNT_PADDING > self.llm.max_input_tokens:
-            self.monologue.condense(self.llm)
+            prompt = prompts.get_summarize_monologue_prompt(self.monologue.events)
+            summary_response = self.memory_condenser.condense(
+                summarize_prompt=prompt, llm=self.llm
+            )
+            self.monologue.events = prompts.parse_summary_response(summary_response)

     def _initialize(self, task: str):
         """
@@ -151,12 +157,14 @@ class MonologueAgent(Agent):
         if task is None or task == '':
             raise AgentNoInstructionError()

-        self.monologue = Monologue()
+        self.monologue = ShortTermHistory()
         if config.agent.memory_enabled:
             self.memory = LongTermMemory()
         else:
             self.memory = None

+        self.memory_condenser = MemoryCondenser()
+
         self._add_initial_thoughts(task)
         self._initialized = True

@@ -226,7 +234,7 @@ class MonologueAgent(Agent):

         prompt = prompts.get_request_action_prompt(
             state.plan.main_goal,
-            self.monologue.get_thoughts(),
+            self.monologue.get_events(),
             state.background_commands_obs,
         )
         messages = [{'content': prompt, 'role': 'user'}]
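
Condensation was previously a single `self.monologue.condense(self.llm)` call owned by the monologue itself; after this change the agent orchestrates it, with prompt building and response parsing staying in `prompts` while `MemoryCondenser` owns only the LLM round trip. A sketch of the flow, using only names visible in this diff (not runnable on its own):

# Inside MonologueAgent._add_event, once the next prompt would overflow
# the context window:
prompt = prompts.get_summarize_monologue_prompt(self.monologue.events)
summary = self.memory_condenser.condense(summarize_prompt=prompt, llm=self.llm)
self.monologue.events = prompts.parse_summary_response(summary)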

+ 0 - 79
agenthub/monologue_agent/utils/monologue.py

@@ -1,79 +0,0 @@
-import agenthub.monologue_agent.utils.json as json
-import agenthub.monologue_agent.utils.prompts as prompts
-from opendevin.core.exceptions import AgentEventTypeError
-from opendevin.core.logger import opendevin_logger as logger
-from opendevin.llm.llm import LLM
-
-
-class Monologue:
-    """
-    The monologue is a representation for the agent's internal monologue where it can think.
-    The agent has the capability of using this monologue for whatever it wants.
-    """
-
-    def __init__(self):
-        """
-        Initialize the empty list of thoughts
-        """
-        self.thoughts = []
-
-    def add_event(self, t: dict):
-        """
-        Adds an event to memory if it is a valid event.
-
-        Parameters:
-        - t (dict): The thought that we want to add to memory
-
-        Raises:
-        - AgentEventTypeError: If t is not a dict
-        """
-        if not isinstance(t, dict):
-            raise AgentEventTypeError()
-        self.thoughts.append(t)
-
-    def get_thoughts(self):
-        """
-        Get the current thoughts of the agent.
-
-        Returns:
-        - list: The list of thoughts that the agent has.
-        """
-        return self.thoughts
-
-    def get_total_length(self):
-        """
-        Gives the total number of characters in all thoughts
-
-        Returns:
-        - Int: Total number of chars in thoughts.
-        """
-        total_length = 0
-        for t in self.thoughts:
-            try:
-                total_length += len(json.dumps(t))
-            except TypeError as e:
-                logger.error('Error serializing thought: %s', str(e), exc_info=False)
-        return total_length
-
-    def condense(self, llm: LLM):
-        """
-        Attempts to condense the monologue by using the llm
-
-        Parameters:
-        - llm (LLM): llm to be used for summarization
-
-        Raises:
-        - Exception: the same exception as it got from the llm or processing the response
-        """
-
-        try:
-            prompt = prompts.get_summarize_monologue_prompt(self.thoughts)
-            messages = [{'content': prompt, 'role': 'user'}]
-            resp = llm.completion(messages=messages)
-            summary_resp = resp['choices'][0]['message']['content']
-            self.thoughts = prompts.parse_summary_response(summary_resp)
-        except Exception as e:
-            logger.error('Error condensing thoughts: %s', str(e), exc_info=False)
-
-            # TODO If the llm fails with ContextWindowExceededError, we can try to condense the monologue chunk by chunk
-            raise

+ 1 - 2
agenthub/monologue_agent/utils/prompts.py

@@ -3,6 +3,7 @@ from json import JSONDecodeError

 from opendevin.core.config import config
 from opendevin.core.exceptions import LLMOutputError
+from opendevin.core.utils import json
 from opendevin.events.action import (
     Action,
     action_from_dict,
@@ -11,8 +12,6 @@ from opendevin.events.observation import (
     CmdOutputObservation,
 )

-from . import json
-
 ACTION_PROMPT = """
 You're a thoughtful robot. Your main task is this:
 %(task)s

+ 1 - 5
agenthub/planner_agent/prompt.py

@@ -1,8 +1,7 @@
-import json
-
 from opendevin.controller.state.plan import Plan
 from opendevin.core.logger import opendevin_logger as logger
 from opendevin.core.schema import ActionType
+from opendevin.core.utils import json
 from opendevin.events.action import (
     Action,
     NullAction,
@@ -176,9 +175,6 @@ def parse_response(response: str) -> Action:
     Returns:
     - Action: A valid next action to perform from model output
     """
-    json_start = response.find('{')
-    json_end = response.rfind('}') + 1
-    response = response[json_start:json_end]
     action_dict = json.loads(response)
     if 'contents' in action_dict:
         # The LLM gets confused here. Might as well be robust
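
The deleted `find('{')`/`rfind('}')` slicing implies that extracting a JSON object from surrounding prose is now the shared loader's job. A hypothetical sketch of such a tolerant `loads`, assuming `opendevin.core.utils.json` behaves this way (its body is not shown in this diff):

import json as _json


def loads(text: str, **kwargs):
    # Hypothetical tolerant loader: strict parse first, then fall back to the
    # outermost {...} span, mirroring the slicing removed from parse_response.
    try:
        return _json.loads(text, **kwargs)
    except _json.JSONDecodeError:
        start, end = text.find('{'), text.rfind('}') + 1
        if start == -1 or end == 0:
            raise
        return _json.loads(text[start:end], **kwargs)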

+ 0 - 0
agenthub/monologue_agent/utils/json.py → opendevin/core/utils/json.py


+ 5 - 0
opendevin/memory/__init__.py

@@ -0,0 +1,5 @@
+from .condenser import MemoryCondenser
+from .history import ShortTermHistory
+from .memory import LongTermMemory
+
+__all__ = ['LongTermMemory', 'ShortTermHistory', 'MemoryCondenser']
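
The re-exports give the three classes a stable home, so callers can import them from the package root instead of reaching into individual modules:

from opendevin.memory import LongTermMemory, MemoryCondenser, ShortTermHistory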

+ 26 - 0
opendevin/memory/condenser.py

@@ -0,0 +1,26 @@
+from opendevin.core.logger import opendevin_logger as logger
+from opendevin.llm.llm import LLM
+
+
+class MemoryCondenser:
+    def condense(self, summarize_prompt: str, llm: LLM):
+        """
+        Attempts to condense the monologue by using the llm
+
+        Parameters:
+        - llm (LLM): llm to be used for summarization
+
+        Raises:
+        - Exception: the same exception as it got from the llm or processing the response
+        """
+
+        try:
+            messages = [{'content': summarize_prompt, 'role': 'user'}]
+            resp = llm.completion(messages=messages)
+            summary_response = resp['choices'][0]['message']['content']
+            return summary_response
+        except Exception as e:
+            logger.error('Error condensing thoughts: %s', str(e), exc_info=False)
+
+            # TODO If the llm fails with ContextWindowExceededError, we can try to condense the monologue chunk by chunk
+            raise
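
Because `condense` only reads the OpenAI-style `resp['choices'][0]['message']['content']` shape, it is easy to exercise in isolation. A hedged usage sketch with a hypothetical stub standing in for a real `LLM` (assuming the `opendevin` package is importable):

from opendevin.memory.condenser import MemoryCondenser


class StubLLM:
    # Hypothetical stand-in that mimics the response shape condense() reads.
    def completion(self, messages):
        return {'choices': [{'message': {'content': 'condensed summary'}}]}


condenser = MemoryCondenser()
print(condenser.condense(summarize_prompt='Summarize these events: ...', llm=StubLLM()))
# -> condensed summary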

+ 54 - 0
opendevin/memory/history.py

@@ -0,0 +1,54 @@
+import opendevin.core.utils.json as json
+from opendevin.core.exceptions import AgentEventTypeError
+from opendevin.core.logger import opendevin_logger as logger
+
+
+class ShortTermHistory:
+    """
+    The short term history is the most recent series of events.
+    An agent can send this in the prompt or use it for other purposes.
+    """
+
+    def __init__(self):
+        """
+        Initialize the empty list of events
+        """
+        self.events = []
+
+    def add_event(self, event_dict: dict):
+        """
+        Adds an event to memory if it is a valid event.
+
+        Parameters:
+        - event_dict (dict): The event that we want to add to memory
+
+        Raises:
+        - AgentEventTypeError: If event_dict is not a dict
+        """
+        if not isinstance(event_dict, dict):
+            raise AgentEventTypeError()
+        self.events.append(event_dict)
+
+    def get_events(self):
+        """
+        Get the events in the agent's recent history.
+
+        Returns:
+        - List: The list of events that the agent remembers easily.
+        """
+        return self.events
+
+    def get_total_length(self):
+        """
+        Gives the total number of characters in all history
+
+        Returns:
+        - Int: Total number of characters of the recent history.
+        """
+        total_length = 0
+        for t in self.events:
+            try:
+                total_length += len(json.dumps(t))
+            except TypeError as e:
+                logger.error('Error serializing event: %s', str(e), exc_info=False)
+        return total_length
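
A short usage sketch of the extracted class (assuming the `opendevin` package is importable); note that `add_event` raises `AgentEventTypeError` for anything that is not a dict:

from opendevin.memory.history import ShortTermHistory

history = ShortTermHistory()
history.add_event({'action': 'run', 'args': {'command': 'ls'}})
history.add_event({'observation': 'run', 'content': 'README.md'})

print(len(history.get_events()))   # 2
print(history.get_total_length())  # total characters across the serialized events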

+ 1 - 2
agenthub/monologue_agent/utils/memory.py → opendevin/memory/memory.py

@@ -15,8 +15,7 @@ from tenacity import (

 from opendevin.core.config import config
 from opendevin.core.logger import opendevin_logger as logger
-
-from . import json
+from opendevin.core.utils import json

 num_retries = config.llm.num_retries
 retry_min_wait = config.llm.retry_min_wait