| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177 |
- import os
- import asyncio
- from typing import Optional, Dict, Type
- from fastapi import WebSocketDisconnect
- from opendevin.action import (
- Action,
- NullAction,
- CmdRunAction,
- CmdKillAction,
- BrowseURLAction,
- FileReadAction,
- FileWriteAction,
- AgentRecallAction,
- AgentThinkAction,
- AgentFinishAction,
- )
- from opendevin.agent import Agent
- from opendevin.controller import AgentController
- from opendevin.llm.llm import LLM
- from opendevin.observation import (
- Observation,
- UserMessageObservation
- )
# NOTE: this is a temporary solution - but hopefully we can use Action/Observation throughout the codebase
# Maps the short action name used in websocket messages to the Action
# subclass that represents it.
ACTION_TYPE_TO_CLASS: Dict[str, Type[Action]] = {
    "run": CmdRunAction,
    "kill": CmdKillAction,
    "browse": BrowseURLAction,
    "read": FileReadAction,
    "write": FileWriteAction,
    "recall": AgentRecallAction,
    "think": AgentThinkAction,
    "finish": AgentFinishAction,
}

# Workspace used when a client does not name one: $WORKSPACE_DIR if set,
# otherwise "<cwd at import time>/workspace".
DEFAULT_WORKSPACE_DIR = os.environ.get(
    "WORKSPACE_DIR",
    os.path.join(os.getcwd(), "workspace"),
)

# Model name handed to LLM() when a client does not name one: $LLM_MODEL if
# set, otherwise the hard-coded default below.
LLM_MODEL = os.environ.get("LLM_MODEL", "gpt-4-0125-preview")
def parse_event(data):
    """Normalize a decoded websocket message into an event dict.

    Args:
        data: The value decoded from the client's JSON message. Only a
            dict containing an ``"action"`` key is considered a valid event.

    Returns:
        ``None`` when ``data`` is not a dict or has no ``"action"`` key.
        Otherwise a dict with exactly three keys:

        * ``"action"``  -- ``data["action"]`` unchanged.
        * ``"args"``    -- ``data["args"]`` if present, else ``{}``.
        * ``"message"`` -- ``data["message"]`` if present, else ``None``.
    """
    # Valid JSON may decode to a list, string, number, bool or None. Those can
    # never be events, and probing them with ``in`` / ``[...]`` would either
    # raise TypeError or (for strings) match on a substring.
    if not isinstance(data, dict) or "action" not in data:
        return None

    return {
        "action": data["action"],
        "args": data.get("args", {}),
        "message": data.get("message"),
    }
class Session:
    """State for one client websocket and the agent controller it drives.

    A session receives JSON events from the websocket, creates an
    ``AgentController`` on request, starts the agent loop as a background
    task, and forwards every agent event back to the client as JSON.
    """

    # Class name reported by ``event.to_dict()["action"]`` -> short name sent
    # to the client. Names not listed here are forwarded unchanged.
    _ACTION_NAMES = {
        "CmdRunAction": "run",
        "CmdKillAction": "kill",
        "BrowseURLAction": "browse",
        "FileReadAction": "read",
        "FileWriteAction": "write",
        "AgentFinishAction": "finish",
        "AgentRecallAction": "recall",
        "AgentThinkAction": "think",
    }

    # Same idea for ``event.to_dict()["observation"]``.
    _OBSERVATION_NAMES = {
        "UserMessageObservation": "chat",
        "AgentMessageObservation": "chat",
        "CmdOutputObservation": "run",
        "FileReadObservation": "read",
    }

    def __init__(self, websocket):
        """Bind the session to ``websocket`` and begin creating a controller.

        Must be called while an asyncio event loop is running, because it
        schedules ``create_controller()`` as a background task.
        """
        self.websocket = websocket
        self.controller: Optional[AgentController] = None
        self.agent: Optional[Agent] = None
        self.agent_task = None
        # Strong references to fire-and-forget tasks; the event loop only
        # keeps weak references, so an unreferenced task may be collected
        # before it finishes.
        self._background_tasks: set = set()
        # FIXME: starting the docker container synchronously causes a websocket error...
        self._spawn(self.create_controller(), name="create controller")

    def _spawn(self, coro, name):
        """Schedule ``coro`` as a task and hold a reference until it is done."""
        task = asyncio.create_task(coro, name=name)
        self._background_tasks.add(task)
        task.add_done_callback(self._background_tasks.discard)
        return task

    @staticmethod
    def _event_args(event):
        """Return the ``args`` dict of ``event``, or ``{}`` if it has none.

        Accepts the dict produced by ``parse_event`` as well as objects that
        expose an ``args`` attribute. A missing or non-dict ``args`` (for
        example JSON ``null``) yields an empty dict.
        """
        if event is None:
            return {}
        if isinstance(event, dict):
            args = event.get("args")
        else:
            args = getattr(event, "args", None)
        return args if isinstance(args, dict) else {}

    async def send_error(self, message):
        """Send ``message`` to the client flagged as an error."""
        await self.send({"error": True, "message": message})

    async def send_message(self, message):
        """Send a plain informational ``message`` to the client."""
        await self.send({"message": message})

    async def send(self, data):
        """Send ``data`` to the client as JSON, best effort.

        Does nothing once the websocket has been cleared after a disconnect.
        Any exception raised while sending is printed and not propagated.
        """
        if self.websocket is None:
            return
        try:
            await self.websocket.send_json(data)
        except Exception as e:
            print("Error sending data to client", e)

    async def start_listening(self):
        """Receive and dispatch client events until the websocket disconnects.

        Dispatch rules:

        * ``"initialize"`` -- (re)create the controller from the event args.
        * ``"start"``      -- start the agent loop on the given task.
        * ``"chat"``       -- append the user's message to the controller
          history (requires a controller).

        Malformed JSON and messages without an ``"action"`` are reported to
        the client and skipped. On ``WebSocketDisconnect`` the websocket is
        cleared and any running agent task is cancelled.

        Raises:
            NotImplementedError: for any other action received while a
                controller exists.
        """
        try:
            while True:
                try:
                    data = await self.websocket.receive_json()
                except ValueError:
                    await self.send_error("Invalid JSON")
                    continue

                event = parse_event(data)
                if event is None:
                    await self.send_error("Invalid event")
                    continue

                action = event["action"]
                if action == "initialize":
                    await self.create_controller(event)
                elif action == "start":
                    await self.start_task(event)
                elif self.controller is None:
                    await self.send_error("No agent started. Please wait a second...")
                elif action == "chat":
                    self.controller.add_history(
                        NullAction(), UserMessageObservation(event["message"])
                    )
                else:
                    # TODO: we only need to implement user message for now
                    # since even Devin does not support having the user taking other
                    # actions (e.g., edit files) while the agent is running
                    raise NotImplementedError
        except WebSocketDisconnect as e:
            self.websocket = None
            if self.agent_task:
                self.agent_task.cancel()
            print("Client websocket disconnected", e)

    async def create_controller(self, start_event=None):
        """Build the agent and its controller, then notify the client.

        Args:
            start_event: Optional event whose ``args`` may override
                ``directory`` (default ``DEFAULT_WORKSPACE_DIR``),
                ``agent_cls`` (default ``"LangchainsAgent"``) and ``model``
                (default ``LLM_MODEL``).

        The workspace directory is created if missing and then passed to the
        controller as a path relative to the current working directory.
        """
        # The event is the plain dict built by parse_event, so its args must
        # be read by key rather than by attribute.
        args = self._event_args(start_event)
        directory = args.get("directory", DEFAULT_WORKSPACE_DIR)
        agent_cls = args.get("agent_cls", "LangchainsAgent")
        model = args.get("model", LLM_MODEL)

        if not os.path.exists(directory):
            print(f"Workspace directory {directory} does not exist. Creating it...")
            # exist_ok: another session may create it between check and call.
            os.makedirs(directory, exist_ok=True)
        directory = os.path.relpath(directory, os.getcwd())

        llm = LLM(model)
        AgentCls = Agent.get_cls(agent_cls)
        self.agent = AgentCls(llm)
        self.controller = AgentController(
            self.agent, workdir=directory, callbacks=[self.on_agent_event]
        )
        await self.send({"action": "initialize", "message": "Control loop started."})

    async def start_task(self, start_event):
        """Start the agent loop on the task named in ``start_event``.

        Sends an error to the client, and starts nothing, when the event
        carries no ``task`` argument or when no controller exists yet.
        Otherwise the loop runs as a background task stored in
        ``self.agent_task``.
        """
        args = self._event_args(start_event)
        if "task" not in args:
            await self.send_error("No task specified")
            return
        await self.send_message("Starting new task...")
        task = args["task"]
        if self.controller is None:
            await self.send_error("No agent started. Please wait a second...")
            return
        self.agent_task = asyncio.create_task(
            self.controller.start_loop(task), name="agent loop"
        )

    def on_agent_event(self, event: "Observation | Action"):
        """Controller callback: forward an agent event to the client.

        The event is serialized with ``to_dict()``, its ``"action"`` /
        ``"observation"`` class name is replaced by the short client-facing
        name when one is known, and the result is sent from a background task
        (this callback is synchronous, so it cannot await the send itself).
        """
        # FIXME: we need better serialization
        event_dict = event.to_dict()
        if "action" in event_dict:
            name = event_dict["action"]
            event_dict["action"] = self._ACTION_NAMES.get(name, name)
        if "observation" in event_dict:
            name = event_dict["observation"]
            event_dict["observation"] = self._OBSERVATION_NAMES.get(name, name)
        self._spawn(self.send(event_dict), name="send event in callback")
|