1 год назад · 62ce183c2d
--- a/opendevin/events/action/commands.py
+++ b/opendevin/events/action/commands.py
@@ -10,6 +10,14 @@ from .action import Action, ActionConfirmationStatus
 
															 class CmdRunAction(Action):
														
 
															     command: str
														
 
															     thought: str = ''
														
 
															+    keep_prompt: bool = True
														
 
															+    # if True, the command prompt will be kept in the command output observation
														
 
															+    # Example of command output:
														
 
															+    # root@sandbox:~# ls
														
 
															+    # file1.txt
														
 
															+    # file2.txt
														
 
															+    # root@sandbox:~# <-- this is the command prompt
														
 
															+
														
 
															     action: str = ActionType.RUN
														
 
															     runnable: ClassVar[bool] = True
														
 
															     is_confirmed: ActionConfirmationStatus = ActionConfirmationStatus.CONFIRMED
														
--- a/opendevin/runtime/client/client.py
+++ b/opendevin/runtime/client/client.py
@@ -170,8 +170,7 @@ class RuntimeClient:
 
															             matched is not None
														
 
															         ), f'Failed to parse bash prompt: {ps1}. This should not happen.'
														
 
															         username, hostname, working_dir = matched.groups()
														
 
															-        self._prev_pwd = self.pwd
														
 
															-        self.pwd = working_dir
														
 
															+        self.pwd = os.path.expanduser(working_dir)
														
 
															         # re-assemble the prompt
														
 
															         prompt = f'{username}@{hostname}:{working_dir} '
														
@@ -192,8 +191,10 @@ class RuntimeClient:
 
															         self.shell.expect(self.__bash_expect_regex, timeout=timeout)
														
 
															         output = self.shell.before
														
 
															+
														
 
															+        bash_prompt = self._get_bash_prompt_and_update_pwd()
														
 
															         if keep_prompt:
														
 
															-            output += '\r\n' + self._get_bash_prompt_and_update_pwd()
														
 
															+            output += '\r\n' + bash_prompt
														
 
															         logger.debug(f'Command output: {output}')
														
 
															         # Get exit code
														
@@ -218,7 +219,11 @@ class RuntimeClient:
 
															             commands = split_bash_commands(action.command)
														
 
															             all_output = ''
														
 
															             for command in commands:
														
 
															-                output, exit_code = self._execute_bash(command, timeout=action.timeout)
														
 
															+                output, exit_code = self._execute_bash(
														
 
															+                    command,
														
 
															+                    timeout=action.timeout,
														
 
															+                    keep_prompt=action.keep_prompt,
														
 
															+                )
														
 
															                 if all_output:
														
 
															                     # previous output already exists with prompt "user@hostname:working_dir #""
														
 
															                     # we need to add the command to the previous output,
														
@@ -240,15 +245,19 @@ class RuntimeClient:
 
															     async def run_ipython(self, action: IPythonRunCellAction) -> Observation:
														
 
															         if 'jupyter' in self.plugins:
														
 
															             _jupyter_plugin: JupyterPlugin = self.plugins['jupyter']  # type: ignore
														
 
															-
														
 
															             # This is used to make AgentSkills in Jupyter aware of the
														
 
															             # current working directory in Bash
														
 
															-            if not hasattr(self, '_prev_pwd') or self.pwd != self._prev_pwd:
														
 
															-                reset_jupyter_pwd_code = (
														
 
															-                    f'import os; os.environ["JUPYTER_PWD"] = "{self.pwd}"\n\n'
														
 
															+            if self.pwd != getattr(self, '_jupyter_pwd', None):
														
 
															+                logger.debug(
														
 
															+                    f"{self.pwd} != {getattr(self, '_jupyter_pwd', None)} -> reset Jupyter PWD"
														
 
															                 )
														
 
															+                reset_jupyter_pwd_code = f'import os; os.environ["JUPYTER_PWD"] = os.path.abspath("{self.pwd}")'
														
 
															                 _aux_action = IPythonRunCellAction(code=reset_jupyter_pwd_code)
														
 
															-                _ = await _jupyter_plugin.run(_aux_action)
														
 
															+                _reset_obs = await _jupyter_plugin.run(_aux_action)
														
 
															+                logger.debug(
														
 
															+                    f'Changed working directory in IPython to: {self.pwd}. Output: {_reset_obs}'
														
 
															+                )
														
 
															+                self._jupyter_pwd = self.pwd
														
 
															             obs: IPythonRunCellObservation = await _jupyter_plugin.run(action)
														
 
															             return obs
														
--- a/tests/integration/mock/eventstream_runtime/DelegatorAgent/test_edits/prompt_002.log
+++ b/tests/integration/mock/eventstream_runtime/DelegatorAgent/test_edits/prompt_002.log
@@ -41,7 +41,7 @@ as well as observations you've made. This only includes the MOST RECENT
 
															 actions and observations--more may have happened before that.
														
 
															 They are time-ordered, with your most recent action at the bottom.
														
 
															-[{"source": "agent", "action": "run", "args": {"command": "ls", "thought": "", "is_confirmed": "confirmed"}}, {"source": "agent", "observation": "run", "content": "bad.txt\r\n\r\nopendevin@docker-desktop:/workspace $ ", "extras": {"command_id": -1, "command": "ls", "exit_code": 0}}]
														
 
															+[{"source": "agent", "action": "run", "args": {"command": "ls", "thought": "", "keep_prompt": true, "is_confirmed": "confirmed"}}, {"source": "agent", "observation": "run", "content": "bad.txt\r\n\r\nopendevin@docker-desktop:/workspace $ ", "extras": {"command_id": -1, "command": "ls", "exit_code": 0}}]
														
 
															 ## Format
														
 
															 Your response MUST be in JSON format. It must be an object, and it must contain two fields:
														
--- a/tests/integration/mock/eventstream_runtime/DelegatorAgent/test_edits/prompt_003.log
+++ b/tests/integration/mock/eventstream_runtime/DelegatorAgent/test_edits/prompt_003.log
@@ -41,7 +41,7 @@ as well as observations you've made. This only includes the MOST RECENT
 
															 actions and observations--more may have happened before that.
														
 
															 They are time-ordered, with your most recent action at the bottom.
														
 
															-[{"source": "agent", "action": "run", "args": {"command": "ls", "thought": "", "is_confirmed": "confirmed"}}, {"source": "agent", "observation": "run", "content": "bad.txt\r\n\r\nopendevin@docker-desktop:/workspace $ ", "extras": {"command_id": -1, "command": "ls", "exit_code": 0}}, {"source": "agent", "action": "read", "args": {"path": "bad.txt", "start": 0, "end": -1, "thought": ""}}, {"source": "agent", "observation": "read", "content": "This is a stupid typoo.\nReally?\nNo mor typos!\nEnjoy!\n", "extras": {"path": "/workspace/bad.txt"}}]
														
 
															+[{"source": "agent", "action": "run", "args": {"command": "ls", "thought": "", "keep_prompt": true, "is_confirmed": "confirmed"}}, {"source": "agent", "observation": "run", "content": "bad.txt\r\n\r\nopendevin@docker-desktop:/workspace $ ", "extras": {"command_id": -1, "command": "ls", "exit_code": 0}}, {"source": "agent", "action": "read", "args": {"path": "bad.txt", "start": 0, "end": -1, "thought": ""}}, {"source": "agent", "observation": "read", "content": "This is a stupid typoo.\nReally?\nNo mor typos!\nEnjoy!\n", "extras": {"path": "/workspace/bad.txt"}}]
														
 
															 ## Format
														
 
															 Your response MUST be in JSON format. It must be an object, and it must contain two fields:
														
--- a/tests/integration/mock/eventstream_runtime/DelegatorAgent/test_write_simple_script/prompt_002.log
+++ b/tests/integration/mock/eventstream_runtime/DelegatorAgent/test_write_simple_script/prompt_002.log
@@ -41,7 +41,7 @@ as well as observations you've made. This only includes the MOST RECENT
 
															 actions and observations--more may have happened before that.
														
 
															 They are time-ordered, with your most recent action at the bottom.
														
 
															-[{"source": "agent", "action": "run", "args": {"command": "ls", "thought": "", "is_confirmed": "confirmed"}}, {"source": "agent", "observation": "run", "content": "\r\nopendevin@docker-desktop:/workspace $ ", "extras": {"command_id": -1, "command": "ls", "exit_code": 0}}]
														
 
															+[{"source": "agent", "action": "run", "args": {"command": "ls", "thought": "", "keep_prompt": true, "is_confirmed": "confirmed"}}, {"source": "agent", "observation": "run", "content": "\r\nopendevin@docker-desktop:/workspace $ ", "extras": {"command_id": -1, "command": "ls", "exit_code": 0}}]
														
 
															 ## Format
														
 
															 Your response MUST be in JSON format. It must be an object, and it must contain two fields:
														
--- a/tests/integration/mock/eventstream_runtime/DelegatorAgent/test_write_simple_script/prompt_005.log
+++ b/tests/integration/mock/eventstream_runtime/DelegatorAgent/test_write_simple_script/prompt_005.log
@@ -41,7 +41,7 @@ as well as observations you've made. This only includes the MOST RECENT
 
															 actions and observations--more may have happened before that.
														
 
															 They are time-ordered, with your most recent action at the bottom.
														
 
															-[{"source": "agent", "action": "write", "args": {"path": "hello.sh", "content": "#!/bin/bash\n\necho 'hello'", "start": 0, "end": -1, "thought": ""}}, {"source": "agent", "observation": "write", "content": "", "extras": {"path": "/workspace/hello.sh"}}, {"source": "agent", "action": "run", "args": {"command": "chmod +x hello.sh", "thought": "", "is_confirmed": "confirmed"}}, {"source": "agent", "observation": "run", "content": "\r\nopendevin@docker-desktop:/workspace $ ", "extras": {"command_id": -1, "command": "chmod +x hello.sh", "exit_code": 0}}]
														
 
															+[{"source": "agent", "action": "write", "args": {"path": "hello.sh", "content": "#!/bin/bash\n\necho 'hello'", "start": 0, "end": -1, "thought": ""}}, {"source": "agent", "observation": "write", "content": "", "extras": {"path": "/workspace/hello.sh"}}, {"source": "agent", "action": "run", "args": {"command": "chmod +x hello.sh", "thought": "", "keep_prompt": true, "is_confirmed": "confirmed"}}, {"source": "agent", "observation": "run", "content": "\r\nopendevin@docker-desktop:/workspace $ ", "extras": {"command_id": -1, "command": "chmod +x hello.sh", "exit_code": 0}}]
														
 
															 ## Format
														
 
															 Your response MUST be in JSON format. It must be an object, and it must contain two fields:
														
--- a/tests/integration/mock/eventstream_runtime/DelegatorAgent/test_write_simple_script/prompt_006.log
+++ b/tests/integration/mock/eventstream_runtime/DelegatorAgent/test_write_simple_script/prompt_006.log
@@ -41,7 +41,7 @@ as well as observations you've made. This only includes the MOST RECENT
 
															 actions and observations--more may have happened before that.
														
 
															 They are time-ordered, with your most recent action at the bottom.
														
 
															-[{"source": "agent", "action": "write", "args": {"path": "hello.sh", "content": "#!/bin/bash\n\necho 'hello'", "start": 0, "end": -1, "thought": ""}}, {"source": "agent", "observation": "write", "content": "", "extras": {"path": "/workspace/hello.sh"}}, {"source": "agent", "action": "run", "args": {"command": "chmod +x hello.sh", "thought": "", "is_confirmed": "confirmed"}}, {"source": "agent", "observation": "run", "content": "\r\nopendevin@docker-desktop:/workspace $ ", "extras": {"command_id": -1, "command": "chmod +x hello.sh", "exit_code": 0}}, {"source": "agent", "action": "run", "args": {"command": "./hello.sh", "thought": "", "is_confirmed": "confirmed"}}, {"source": "agent", "observation": "run", "content": "hello\r\n\r\nopendevin@docker-desktop:/workspace $ ", "extras": {"command_id": -1, "command": "./hello.sh", "exit_code": 0}}]
														
 
															+[{"source": "agent", "action": "write", "args": {"path": "hello.sh", "content": "#!/bin/bash\n\necho 'hello'", "start": 0, "end": -1, "thought": ""}}, {"source": "agent", "observation": "write", "content": "", "extras": {"path": "/workspace/hello.sh"}}, {"source": "agent", "action": "run", "args": {"command": "chmod +x hello.sh", "thought": "", "keep_prompt": true, "is_confirmed": "confirmed"}}, {"source": "agent", "observation": "run", "content": "\r\nopendevin@docker-desktop:/workspace $ ", "extras": {"command_id": -1, "command": "chmod +x hello.sh", "exit_code": 0}}, {"source": "agent", "action": "run", "args": {"command": "./hello.sh", "thought": "", "keep_prompt": true, "is_confirmed": "confirmed"}}, {"source": "agent", "observation": "run", "content": "hello\r\n\r\nopendevin@docker-desktop:/workspace $ ", "extras": {"command_id": -1, "command": "./hello.sh", "exit_code": 0}}]
														
 
															 ## Format
														
 
															 Your response MUST be in JSON format. It must be an object, and it must contain two fields:
														
--- a/tests/integration/mock/eventstream_runtime/DelegatorAgent/test_write_simple_script/prompt_009.log
+++ b/tests/integration/mock/eventstream_runtime/DelegatorAgent/test_write_simple_script/prompt_009.log
@@ -39,7 +39,7 @@ as well as observations you've made. This only includes the MOST RECENT
 
															 actions and observations--more may have happened before that.
														
 
															 They are time-ordered, with your most recent action at the bottom.
														
 
															-[{"source": "agent", "action": "read", "args": {"path": "hello.sh", "start": 0, "end": -1, "thought": ""}}, {"source": "agent", "observation": "read", "content": "#!/bin/bash\n\necho 'hello'\n", "extras": {"path": "/workspace/hello.sh"}}, {"source": "agent", "action": "run", "args": {"command": "bash hello.sh", "thought": "", "is_confirmed": "confirmed"}}, {"source": "agent", "observation": "run", "content": "hello\r\n\r\nopendevin@docker-desktop:/workspace $ ", "extras": {"command_id": -1, "command": "bash hello.sh", "exit_code": 0}}]
														
 
															+[{"source": "agent", "action": "read", "args": {"path": "hello.sh", "start": 0, "end": -1, "thought": ""}}, {"source": "agent", "observation": "read", "content": "#!/bin/bash\n\necho 'hello'\n", "extras": {"path": "/workspace/hello.sh"}}, {"source": "agent", "action": "run", "args": {"command": "bash hello.sh", "thought": "", "keep_prompt": true, "is_confirmed": "confirmed"}}, {"source": "agent", "observation": "run", "content": "hello\r\n\r\nopendevin@docker-desktop:/workspace $ ", "extras": {"command_id": -1, "command": "bash hello.sh", "exit_code": 0}}]
														
 
															 ## Format
														
 
															 Your response MUST be in JSON format. It must be an object, and it must contain two fields:
														
--- a/tests/integration/mock/eventstream_runtime/ManagerAgent/test_simple_task_rejection/prompt_003.log
+++ b/tests/integration/mock/eventstream_runtime/ManagerAgent/test_simple_task_rejection/prompt_003.log
@@ -28,7 +28,7 @@ as well as observations you've made. This only includes the MOST RECENT
 
															 actions and observations--more may have happened before that.
														
 
															 They are time-ordered, with your most recent action at the bottom.
														
 
															-[{"source": "agent", "action": "run", "args": {"command": "git status", "thought": "", "is_confirmed": "confirmed"}}, {"source": "agent", "observation": "run", "content": "fatal: not a git repository (or any parent up to mount point /)\r\nStopping at filesystem boundary (GIT_DISCOVERY_ACROSS_FILESYSTEM not set).\r\n\r\nopendevin@docker-desktop:/workspace $ ", "extras": {"command_id": -1, "command": "git status", "exit_code": 128}}]
														
 
															+[{"source": "agent", "action": "run", "args": {"command": "git status", "thought": "", "keep_prompt": true, "is_confirmed": "confirmed"}}, {"source": "agent", "observation": "run", "content": "fatal: not a git repository (or any parent up to mount point /)\r\nStopping at filesystem boundary (GIT_DISCOVERY_ACROSS_FILESYSTEM not set).\r\n\r\nopendevin@docker-desktop:/workspace $ ", "extras": {"command_id": -1, "command": "git status", "exit_code": 128}}]
														
 
															 If the last item in the history is an error, you should try to fix it.
														
--- a/tests/integration/mock/eventstream_runtime/ManagerAgent/test_simple_task_rejection/prompt_004.log
+++ b/tests/integration/mock/eventstream_runtime/ManagerAgent/test_simple_task_rejection/prompt_004.log
@@ -28,7 +28,7 @@ as well as observations you've made. This only includes the MOST RECENT
 
															 actions and observations--more may have happened before that.
														
 
															 They are time-ordered, with your most recent action at the bottom.
														
 
															-[{"source": "agent", "action": "run", "args": {"command": "git status", "thought": "", "is_confirmed": "confirmed"}}, {"source": "agent", "observation": "run", "content": "fatal: not a git repository (or any parent up to mount point /)\r\nStopping at filesystem boundary (GIT_DISCOVERY_ACROSS_FILESYSTEM not set).\r\n\r\nopendevin@docker-desktop:/workspace $ ", "extras": {"command_id": -1, "command": "git status", "exit_code": 128}}, {"source": "agent", "observation": "error", "content": "action={'action': 'reject', 'args': {'reason': 'Not a valid git repository.'}} has the wrong arguments", "extras": {}}]
														
 
															+[{"source": "agent", "action": "run", "args": {"command": "git status", "thought": "", "keep_prompt": true, "is_confirmed": "confirmed"}}, {"source": "agent", "observation": "run", "content": "fatal: not a git repository (or any parent up to mount point /)\r\nStopping at filesystem boundary (GIT_DISCOVERY_ACROSS_FILESYSTEM not set).\r\n\r\nopendevin@docker-desktop:/workspace $ ", "extras": {"command_id": -1, "command": "git status", "exit_code": 128}}, {"source": "agent", "observation": "error", "content": "action={'action': 'reject', 'args': {'reason': 'Not a valid git repository.'}} has the wrong arguments", "extras": {}}]
														
 
															 If the last item in the history is an error, you should try to fix it.
														
--- a/tests/integration/mock/eventstream_runtime/ManagerAgent/test_simple_task_rejection/prompt_005.log
+++ b/tests/integration/mock/eventstream_runtime/ManagerAgent/test_simple_task_rejection/prompt_005.log
@@ -28,7 +28,7 @@ as well as observations you've made. This only includes the MOST RECENT
 
															 actions and observations--more may have happened before that.
														
 
															 They are time-ordered, with your most recent action at the bottom.
														
 
															-[{"source": "agent", "action": "run", "args": {"command": "git status", "thought": "", "is_confirmed": "confirmed"}}, {"source": "agent", "observation": "run", "content": "fatal: not a git repository (or any parent up to mount point /)\r\nStopping at filesystem boundary (GIT_DISCOVERY_ACROSS_FILESYSTEM not set).\r\n\r\nopendevin@docker-desktop:/workspace $ ", "extras": {"command_id": -1, "command": "git status", "exit_code": 128}}, {"source": "agent", "observation": "error", "content": "action={'action': 'reject', 'args': {'reason': 'Not a valid git repository.'}} has the wrong arguments", "extras": {}}, {"source": "agent", "observation": "error", "content": "action={'action': 'reject', 'args': {'reason': 'Not a valid git repository.'}} has the wrong arguments", "extras": {}}]
														
 
															+[{"source": "agent", "action": "run", "args": {"command": "git status", "thought": "", "keep_prompt": true, "is_confirmed": "confirmed"}}, {"source": "agent", "observation": "run", "content": "fatal: not a git repository (or any parent up to mount point /)\r\nStopping at filesystem boundary (GIT_DISCOVERY_ACROSS_FILESYSTEM not set).\r\n\r\nopendevin@docker-desktop:/workspace $ ", "extras": {"command_id": -1, "command": "git status", "exit_code": 128}}, {"source": "agent", "observation": "error", "content": "action={'action': 'reject', 'args': {'reason': 'Not a valid git repository.'}} has the wrong arguments", "extras": {}}, {"source": "agent", "observation": "error", "content": "action={'action': 'reject', 'args': {'reason': 'Not a valid git repository.'}} has the wrong arguments", "extras": {}}]
														
 
															 If the last item in the history is an error, you should try to fix it.
														
--- a/tests/integration/mock/eventstream_runtime/ManagerAgent/test_simple_task_rejection/prompt_006.log
+++ b/tests/integration/mock/eventstream_runtime/ManagerAgent/test_simple_task_rejection/prompt_006.log
@@ -28,7 +28,7 @@ as well as observations you've made. This only includes the MOST RECENT
 
															 actions and observations--more may have happened before that.
														
 
															 They are time-ordered, with your most recent action at the bottom.
														
 
															-[{"source": "agent", "action": "run", "args": {"command": "git status", "thought": "", "is_confirmed": "confirmed"}}, {"source": "agent", "observation": "run", "content": "fatal: not a git repository (or any parent up to mount point /)\r\nStopping at filesystem boundary (GIT_DISCOVERY_ACROSS_FILESYSTEM not set).\r\n\r\nopendevin@docker-desktop:/workspace $ ", "extras": {"command_id": -1, "command": "git status", "exit_code": 128}}, {"source": "agent", "observation": "error", "content": "action={'action': 'reject', 'args': {'reason': 'Not a valid git repository.'}} has the wrong arguments", "extras": {}}, {"source": "agent", "observation": "error", "content": "action={'action': 'reject', 'args': {'reason': 'Not a valid git repository.'}} has the wrong arguments", "extras": {}}, {"source": "agent", "observation": "error", "content": "action={'action': 'reject', 'args': {'reason': 'Not a valid git repository.'}} has the wrong arguments", "extras": {}}]
														
 
															+[{"source": "agent", "action": "run", "args": {"command": "git status", "thought": "", "keep_prompt": true, "is_confirmed": "confirmed"}}, {"source": "agent", "observation": "run", "content": "fatal: not a git repository (or any parent up to mount point /)\r\nStopping at filesystem boundary (GIT_DISCOVERY_ACROSS_FILESYSTEM not set).\r\n\r\nopendevin@docker-desktop:/workspace $ ", "extras": {"command_id": -1, "command": "git status", "exit_code": 128}}, {"source": "agent", "observation": "error", "content": "action={'action': 'reject', 'args': {'reason': 'Not a valid git repository.'}} has the wrong arguments", "extras": {}}, {"source": "agent", "observation": "error", "content": "action={'action': 'reject', 'args': {'reason': 'Not a valid git repository.'}} has the wrong arguments", "extras": {}}, {"source": "agent", "observation": "error", "content": "action={'action': 'reject', 'args': {'reason': 'Not a valid git repository.'}} has the wrong arguments", "extras": {}}]
														
 
															 If the last item in the history is an error, you should try to fix it.
														
--- a/tests/integration/mock/eventstream_runtime/ManagerAgent/test_simple_task_rejection/prompt_007.log
+++ b/tests/integration/mock/eventstream_runtime/ManagerAgent/test_simple_task_rejection/prompt_007.log
@@ -28,7 +28,7 @@ as well as observations you've made. This only includes the MOST RECENT
 
															 actions and observations--more may have happened before that.
														
 
															 They are time-ordered, with your most recent action at the bottom.
														
 
															-[{"source": "agent", "action": "run", "args": {"command": "git status", "thought": "", "is_confirmed": "confirmed"}}, {"source": "agent", "observation": "run", "content": "fatal: not a git repository (or any parent up to mount point /)\r\nStopping at filesystem boundary (GIT_DISCOVERY_ACROSS_FILESYSTEM not set).\r\n\r\nopendevin@docker-desktop:/workspace $ ", "extras": {"command_id": -1, "command": "git status", "exit_code": 128}}, {"source": "agent", "observation": "error", "content": "action={'action': 'reject', 'args': {'reason': 'Not a valid git repository.'}} has the wrong arguments", "extras": {}}, {"source": "agent", "observation": "error", "content": "action={'action': 'reject', 'args': {'reason': 'Not a valid git repository.'}} has the wrong arguments", "extras": {}}, {"source": "agent", "observation": "error", "content": "action={'action': 'reject', 'args': {'reason': 'Not a valid git repository.'}} has the wrong arguments", "extras": {}}, {"source": "agent", "observation": "error", "content": "action={'action': 'reject', 'args': {'reason': 'Not a valid git repository.'}} has the wrong arguments", "extras": {}}]
														
 
															+[{"source": "agent", "action": "run", "args": {"command": "git status", "thought": "", "keep_prompt": true, "is_confirmed": "confirmed"}}, {"source": "agent", "observation": "run", "content": "fatal: not a git repository (or any parent up to mount point /)\r\nStopping at filesystem boundary (GIT_DISCOVERY_ACROSS_FILESYSTEM not set).\r\n\r\nopendevin@docker-desktop:/workspace $ ", "extras": {"command_id": -1, "command": "git status", "exit_code": 128}}, {"source": "agent", "observation": "error", "content": "action={'action': 'reject', 'args': {'reason': 'Not a valid git repository.'}} has the wrong arguments", "extras": {}}, {"source": "agent", "observation": "error", "content": "action={'action': 'reject', 'args': {'reason': 'Not a valid git repository.'}} has the wrong arguments", "extras": {}}, {"source": "agent", "observation": "error", "content": "action={'action': 'reject', 'args': {'reason': 'Not a valid git repository.'}} has the wrong arguments", "extras": {}}, {"source": "agent", "observation": "error", "content": "action={'action': 'reject', 'args': {'reason': 'Not a valid git repository.'}} has the wrong arguments", "extras": {}}]
														
 
															 If the last item in the history is an error, you should try to fix it.
														
--- a/tests/integration/mock/eventstream_runtime/PlannerAgent/test_write_simple_script/prompt_010.log
+++ b/tests/integration/mock/eventstream_runtime/PlannerAgent/test_write_simple_script/prompt_010.log
@@ -198,6 +198,7 @@ ten actions--more happened before that.
 
															     "args": {
														
 
															       "command": "bash hello.sh",
														
 
															       "thought": "",
														
 
															+      "keep_prompt": true,
														
 
															       "is_confirmed": "confirmed"
														
 
															     }
														
 
															   },
														
--- a/tests/integration/mock/eventstream_runtime/PlannerAgent/test_write_simple_script/prompt_011.log
+++ b/tests/integration/mock/eventstream_runtime/PlannerAgent/test_write_simple_script/prompt_011.log
@@ -197,6 +197,7 @@ ten actions--more happened before that.
 
															     "args": {
														
 
															       "command": "bash hello.sh",
														
 
															       "thought": "",
														
 
															+      "keep_prompt": true,
														
 
															       "is_confirmed": "confirmed"
														
 
															     }
														
 
															   },
														
--- a/tests/integration/mock/server_runtime/DelegatorAgent/test_edits/prompt_002.log
+++ b/tests/integration/mock/server_runtime/DelegatorAgent/test_edits/prompt_002.log
@@ -41,7 +41,7 @@ as well as observations you've made. This only includes the MOST RECENT
 
															 actions and observations--more may have happened before that.
														
 
															 They are time-ordered, with your most recent action at the bottom.
														
 
															-[{"source": "agent", "action": "run", "args": {"command": "ls", "thought": "", "is_confirmed": "confirmed"}}, {"source": "agent", "observation": "run", "content": "bad.txt", "extras": {"command_id": -1, "command": "ls", "exit_code": 0}}]
														
 
															+[{"source": "agent", "action": "run", "args": {"command": "ls", "thought": "", "keep_prompt": true, "is_confirmed": "confirmed"}}, {"source": "agent", "observation": "run", "content": "bad.txt", "extras": {"command_id": -1, "command": "ls", "exit_code": 0}}]
														
 
															 ## Format
														
 
															 Your response MUST be in JSON format. It must be an object, and it must contain two fields:
														
--- a/tests/integration/mock/server_runtime/DelegatorAgent/test_edits/prompt_003.log
+++ b/tests/integration/mock/server_runtime/DelegatorAgent/test_edits/prompt_003.log
@@ -41,7 +41,7 @@ as well as observations you've made. This only includes the MOST RECENT
 
															 actions and observations--more may have happened before that.
														
 
															 They are time-ordered, with your most recent action at the bottom.
														
 
															-[{"source": "agent", "action": "run", "args": {"command": "ls", "thought": "", "is_confirmed": "confirmed"}}, {"source": "agent", "observation": "run", "content": "bad.txt", "extras": {"command_id": -1, "command": "ls", "exit_code": 0}}, {"source": "agent", "action": "read", "args": {"path": "bad.txt", "start": 0, "end": -1, "thought": ""}}, {"source": "agent", "observation": "read", "content": "This is a stupid typoo.\nReally?\nNo mor typos!\nEnjoy!\n", "extras": {"path": "bad.txt"}}]
														
 
															+[{"source": "agent", "action": "run", "args": {"command": "ls", "thought": "", "keep_prompt": true, "is_confirmed": "confirmed"}}, {"source": "agent", "observation": "run", "content": "bad.txt", "extras": {"command_id": -1, "command": "ls", "exit_code": 0}}, {"source": "agent", "action": "read", "args": {"path": "bad.txt", "start": 0, "end": -1, "thought": ""}}, {"source": "agent", "observation": "read", "content": "This is a stupid typoo.\nReally?\nNo mor typos!\nEnjoy!\n", "extras": {"path": "bad.txt"}}]
														
 
															 ## Format
														
 
															 Your response MUST be in JSON format. It must be an object, and it must contain two fields:
														
--- a/tests/integration/mock/server_runtime/DelegatorAgent/test_write_simple_script/prompt_002.log
+++ b/tests/integration/mock/server_runtime/DelegatorAgent/test_write_simple_script/prompt_002.log
@@ -41,7 +41,7 @@ as well as observations you've made. This only includes the MOST RECENT
 
															 actions and observations--more may have happened before that.
														
 
															 They are time-ordered, with your most recent action at the bottom.
														
 
															-[{"source": "agent", "action": "run", "args": {"command": "ls", "thought": "", "is_confirmed": "confirmed"}}, {"source": "agent", "observation": "run", "content": "", "extras": {"command_id": -1, "command": "ls", "exit_code": 0}}]
														
 
															+[{"source": "agent", "action": "run", "args": {"command": "ls", "thought": "", "keep_prompt": true, "is_confirmed": "confirmed"}}, {"source": "agent", "observation": "run", "content": "", "extras": {"command_id": -1, "command": "ls", "exit_code": 0}}]
														
 
															 ## Format
														
 
															 Your response MUST be in JSON format. It must be an object, and it must contain two fields:
														
--- a/tests/integration/mock/server_runtime/DelegatorAgent/test_write_simple_script/prompt_005.log
+++ b/tests/integration/mock/server_runtime/DelegatorAgent/test_write_simple_script/prompt_005.log
@@ -41,7 +41,7 @@ as well as observations you've made. This only includes the MOST RECENT
 
															 actions and observations--more may have happened before that.
														
 
															 They are time-ordered, with your most recent action at the bottom.
														
 
															-[{"source": "agent", "action": "write", "args": {"path": "hello.sh", "content": "#!/bin/bash\n\n# Print hello\necho 'hello'", "start": 0, "end": -1, "thought": ""}}, {"source": "agent", "observation": "write", "content": "", "extras": {"path": "hello.sh"}}, {"source": "agent", "action": "run", "args": {"command": "chmod +x hello.sh", "thought": "", "is_confirmed": "confirmed"}}, {"source": "agent", "observation": "run", "content": "", "extras": {"command_id": -1, "command": "chmod +x hello.sh", "exit_code": 0}}]
														
 
															+[{"source": "agent", "action": "write", "args": {"path": "hello.sh", "content": "#!/bin/bash\n\n# Print hello\necho 'hello'", "start": 0, "end": -1, "thought": ""}}, {"source": "agent", "observation": "write", "content": "", "extras": {"path": "hello.sh"}}, {"source": "agent", "action": "run", "args": {"command": "chmod +x hello.sh", "thought": "", "keep_prompt": true, "is_confirmed": "confirmed"}}, {"source": "agent", "observation": "run", "content": "", "extras": {"command_id": -1, "command": "chmod +x hello.sh", "exit_code": 0}}]
														
 
															 ## Format
														
 
															 Your response MUST be in JSON format. It must be an object, and it must contain two fields:
														
--- a/tests/integration/mock/server_runtime/DelegatorAgent/test_write_simple_script/prompt_006.log
+++ b/tests/integration/mock/server_runtime/DelegatorAgent/test_write_simple_script/prompt_006.log
@@ -41,7 +41,7 @@ as well as observations you've made. This only includes the MOST RECENT
 
															 actions and observations--more may have happened before that.
														
 
															 They are time-ordered, with your most recent action at the bottom.
														
 
															-[{"source": "agent", "action": "write", "args": {"path": "hello.sh", "content": "#!/bin/bash\n\n# Print hello\necho 'hello'", "start": 0, "end": -1, "thought": ""}}, {"source": "agent", "observation": "write", "content": "", "extras": {"path": "hello.sh"}}, {"source": "agent", "action": "run", "args": {"command": "chmod +x hello.sh", "thought": "", "is_confirmed": "confirmed"}}, {"source": "agent", "observation": "run", "content": "", "extras": {"command_id": -1, "command": "chmod +x hello.sh", "exit_code": 0}}, {"source": "agent", "action": "run", "args": {"command": "./hello.sh", "thought": "", "is_confirmed": "confirmed"}}, {"source": "agent", "observation": "run", "content": "hello", "extras": {"command_id": -1, "command": "./hello.sh", "exit_code": 0}}]
														
 
															+[{"source": "agent", "action": "write", "args": {"path": "hello.sh", "content": "#!/bin/bash\n\n# Print hello\necho 'hello'", "start": 0, "end": -1, "thought": ""}}, {"source": "agent", "observation": "write", "content": "", "extras": {"path": "hello.sh"}}, {"source": "agent", "action": "run", "args": {"command": "chmod +x hello.sh", "thought": "", "keep_prompt": true, "is_confirmed": "confirmed"}}, {"source": "agent", "observation": "run", "content": "", "extras": {"command_id": -1, "command": "chmod +x hello.sh", "exit_code": 0}}, {"source": "agent", "action": "run", "args": {"command": "./hello.sh", "thought": "", "keep_prompt": true, "is_confirmed": "confirmed"}}, {"source": "agent", "observation": "run", "content": "hello", "extras": {"command_id": -1, "command": "./hello.sh", "exit_code": 0}}]
														
 
															 ## Format
														
 
															 Your response MUST be in JSON format. It must be an object, and it must contain two fields:
														
--- a/tests/integration/mock/server_runtime/DelegatorAgent/test_write_simple_script/prompt_009.log
+++ b/tests/integration/mock/server_runtime/DelegatorAgent/test_write_simple_script/prompt_009.log
@@ -39,7 +39,7 @@ as well as observations you've made. This only includes the MOST RECENT
 
															 actions and observations--more may have happened before that.
														
 
															 They are time-ordered, with your most recent action at the bottom.
														
 
															-[{"source": "agent", "action": "read", "args": {"path": "hello.sh", "start": 0, "end": -1, "thought": ""}}, {"source": "agent", "observation": "read", "content": "#!/bin/bash\n\n# Print hello\necho 'hello'\n", "extras": {"path": "hello.sh"}}, {"source": "agent", "action": "run", "args": {"command": "bash hello.sh", "thought": "", "is_confirmed": "confirmed"}}, {"source": "agent", "observation": "run", "content": "hello", "extras": {"command_id": -1, "command": "bash hello.sh", "exit_code": 0}}]
														
 
															+[{"source": "agent", "action": "read", "args": {"path": "hello.sh", "start": 0, "end": -1, "thought": ""}}, {"source": "agent", "observation": "read", "content": "#!/bin/bash\n\n# Print hello\necho 'hello'\n", "extras": {"path": "hello.sh"}}, {"source": "agent", "action": "run", "args": {"command": "bash hello.sh", "thought": "", "keep_prompt": true, "is_confirmed": "confirmed"}}, {"source": "agent", "observation": "run", "content": "hello", "extras": {"command_id": -1, "command": "bash hello.sh", "exit_code": 0}}]
														
 
															 ## Format
														
 
															 Your response MUST be in JSON format. It must be an object, and it must contain two fields:
														
--- a/tests/integration/mock/server_runtime/ManagerAgent/test_simple_task_rejection/prompt_003.log
+++ b/tests/integration/mock/server_runtime/ManagerAgent/test_simple_task_rejection/prompt_003.log
@@ -28,7 +28,7 @@ as well as observations you've made. This only includes the MOST RECENT
 
															 actions and observations--more may have happened before that.
														
 
															 They are time-ordered, with your most recent action at the bottom.
														
 
															-[{"source": "agent", "action": "run", "args": {"command": "git status", "thought": "", "is_confirmed": "confirmed"}}, {"source": "agent", "observation": "run", "content": "fatal: not a git repository (or any parent up to mount point /)\r\nStopping at filesystem boundary (GIT_DISCOVERY_ACROSS_FILESYSTEM not set).", "extras": {"command_id": -1, "command": "git status", "exit_code": 128}}]
														
 
															+[{"source": "agent", "action": "run", "args": {"command": "git status", "thought": "", "keep_prompt": true, "is_confirmed": "confirmed"}}, {"source": "agent", "observation": "run", "content": "fatal: not a git repository (or any parent up to mount point /)\r\nStopping at filesystem boundary (GIT_DISCOVERY_ACROSS_FILESYSTEM not set).", "extras": {"command_id": -1, "command": "git status", "exit_code": 128}}]
														
 
															 If the last item in the history is an error, you should try to fix it.
														
--- a/tests/integration/mock/server_runtime/ManagerAgent/test_simple_task_rejection/prompt_004.log
+++ b/tests/integration/mock/server_runtime/ManagerAgent/test_simple_task_rejection/prompt_004.log
@@ -28,7 +28,7 @@ as well as observations you've made. This only includes the MOST RECENT
 
															 actions and observations--more may have happened before that.
														
 
															 They are time-ordered, with your most recent action at the bottom.
														
 
															-[{"source": "agent", "action": "run", "args": {"command": "git status", "thought": "", "is_confirmed": "confirmed"}}, {"source": "agent", "observation": "run", "content": "fatal: not a git repository (or any parent up to mount point /)\r\nStopping at filesystem boundary (GIT_DISCOVERY_ACROSS_FILESYSTEM not set).", "extras": {"command_id": -1, "command": "git status", "exit_code": 128}}, {"source": "agent", "observation": "error", "content": "action={'action': 'reject', 'args': {'reason': 'Not a valid git repository.'}} has the wrong arguments", "extras": {}}]
														
 
															+[{"source": "agent", "action": "run", "args": {"command": "git status", "thought": "", "keep_prompt": true, "is_confirmed": "confirmed"}}, {"source": "agent", "observation": "run", "content": "fatal: not a git repository (or any parent up to mount point /)\r\nStopping at filesystem boundary (GIT_DISCOVERY_ACROSS_FILESYSTEM not set).", "extras": {"command_id": -1, "command": "git status", "exit_code": 128}}, {"source": "agent", "observation": "error", "content": "action={'action': 'reject', 'args': {'reason': 'Not a valid git repository.'}} has the wrong arguments", "extras": {}}]
														
 
															 If the last item in the history is an error, you should try to fix it.
														
--- a/tests/integration/mock/server_runtime/ManagerAgent/test_simple_task_rejection/prompt_005.log
+++ b/tests/integration/mock/server_runtime/ManagerAgent/test_simple_task_rejection/prompt_005.log
@@ -28,7 +28,7 @@ as well as observations you've made. This only includes the MOST RECENT
 
															 actions and observations--more may have happened before that.
														
 
															 They are time-ordered, with your most recent action at the bottom.
														
 
															-[{"source": "agent", "action": "run", "args": {"command": "git status", "thought": "", "is_confirmed": "confirmed"}}, {"source": "agent", "observation": "run", "content": "fatal: not a git repository (or any parent up to mount point /)\r\nStopping at filesystem boundary (GIT_DISCOVERY_ACROSS_FILESYSTEM not set).", "extras": {"command_id": -1, "command": "git status", "exit_code": 128}}, {"source": "agent", "observation": "error", "content": "action={'action': 'reject', 'args': {'reason': 'Not a valid git repository.'}} has the wrong arguments", "extras": {}}, {"source": "agent", "observation": "error", "content": "action={'action': 'reject', 'args': {'reason': 'Not a valid git repository.'}} has the wrong arguments", "extras": {}}]
														
 
															+[{"source": "agent", "action": "run", "args": {"command": "git status", "thought": "", "keep_prompt": true, "is_confirmed": "confirmed"}}, {"source": "agent", "observation": "run", "content": "fatal: not a git repository (or any parent up to mount point /)\r\nStopping at filesystem boundary (GIT_DISCOVERY_ACROSS_FILESYSTEM not set).", "extras": {"command_id": -1, "command": "git status", "exit_code": 128}}, {"source": "agent", "observation": "error", "content": "action={'action': 'reject', 'args': {'reason': 'Not a valid git repository.'}} has the wrong arguments", "extras": {}}, {"source": "agent", "observation": "error", "content": "action={'action': 'reject', 'args': {'reason': 'Not a valid git repository.'}} has the wrong arguments", "extras": {}}]
														
 
															 If the last item in the history is an error, you should try to fix it.
														
--- a/tests/integration/mock/server_runtime/PlannerAgent/test_write_simple_script/prompt_010.log
+++ b/tests/integration/mock/server_runtime/PlannerAgent/test_write_simple_script/prompt_010.log
@@ -198,6 +198,7 @@ ten actions--more happened before that.
 
															     "args": {
														
 
															       "command": "bash hello.sh",
														
 
															       "thought": "",
														
 
															+      "keep_prompt": true,
														
 
															       "is_confirmed": "confirmed"
														
 
															     }
														
 
															   },
														
--- a/tests/integration/mock/server_runtime/PlannerAgent/test_write_simple_script/prompt_011.log
+++ b/tests/integration/mock/server_runtime/PlannerAgent/test_write_simple_script/prompt_011.log
@@ -197,6 +197,7 @@ ten actions--more happened before that.
 
															     "args": {
														
 
															       "command": "bash hello.sh",
														
 
															       "thought": "",
														
 
															+      "keep_prompt": true,
														
 
															       "is_confirmed": "confirmed"
														
 
															     }
														
 
															   },
														
--- a/tests/unit/test_action_serialization.py
+++ b/tests/unit/test_action_serialization.py
@@ -86,6 +86,7 @@ def test_cmd_run_action_serialization_deserialization():
 
															         'args': {
														
 
															             'command': 'echo "Hello world"',
														
 
															             'thought': '',
														
 
															+            'keep_prompt': True,
														
 
															             'is_confirmed': ActionConfirmationStatus.CONFIRMED,
														
 
															         },
														
 
															     }
														
--- a/tests/unit/test_runtime.py
+++ b/tests/unit/test_runtime.py
@@ -844,6 +844,9 @@ async def test_ipython_simple(temp_dir, box_class):
 
															     logger.info(obs, extra={'msg_type': 'OBSERVATION'})
														
 
															     assert obs.content.strip() == '1'
														
 
															+    await runtime.close()
														
 
															+    await asyncio.sleep(1)
														
 
															+
														
 
															 async def _test_ipython_agentskills_fileop_pwd_impl(
														
 
															     runtime: ServerRuntime | EventStreamRuntime, enable_auto_lint: bool
														
@@ -954,6 +957,9 @@ DO NOT re-run the same failed edit command. Running it again will lead to the sa
 
															     logger.info(obs, extra={'msg_type': 'OBSERVATION'})
														
 
															     assert obs.exit_code == 0
														
 
															+    await runtime.close()
														
 
															+    await asyncio.sleep(1)
														
 
															+
														
 
															 @pytest.mark.asyncio
														
 
															 async def test_ipython_agentskills_fileop_pwd(temp_dir, box_class, enable_auto_lint):
														
@@ -967,6 +973,72 @@ async def test_ipython_agentskills_fileop_pwd(temp_dir, box_class, enable_auto_l
 
															     await asyncio.sleep(1)
														
 
															+@pytest.mark.asyncio
														
 
															+async def test_ipython_agentskills_fileop_pwd_with_userdir(temp_dir, box_class):
														
 
															+    """Make sure that cd in bash also updates the current working directory in ipython.
														
 
															+
														
 
															+    Handle special case where the pwd is provided as "~", which should be expanded using os.path.expanduser
														
 
															+    on the client side.
														
 
															+    """
														
 
															+
														
 
															+    runtime = await _load_runtime(
														
 
															+        temp_dir,
														
 
															+        box_class,
														
 
															+        run_as_devin=False,
														
 
															+    )
														
 
															+
														
 
															+    action = CmdRunAction(command='cd ~')
														
 
															+    logger.info(action, extra={'msg_type': 'ACTION'})
														
 
															+    obs = await runtime.run_action(action)
														
 
															+    logger.info(obs, extra={'msg_type': 'OBSERVATION'})
														
 
															+    assert obs.exit_code == 0
														
 
															+
														
 
															+    action = CmdRunAction(command='mkdir test && ls -la')
														
 
															+    logger.info(action, extra={'msg_type': 'ACTION'})
														
 
															+    obs = await runtime.run_action(action)
														
 
															+    logger.info(obs, extra={'msg_type': 'OBSERVATION'})
														
 
															+    assert isinstance(obs, CmdOutputObservation)
														
 
															+    assert obs.exit_code == 0
														
 
															+
														
 
															+    action = IPythonRunCellAction(code="create_file('hello.py')")
														
 
															+    logger.info(action, extra={'msg_type': 'ACTION'})
														
 
															+    obs = await runtime.run_action(action)
														
 
															+    logger.info(obs, extra={'msg_type': 'OBSERVATION'})
														
 
															+    assert isinstance(obs, IPythonRunCellObservation)
														
 
															+    assert obs.content.replace('\r\n', '\n').strip().split('\n') == (
														
 
															+        '[File: /root/hello.py (1 lines total)]\n'
														
 
															+        '(this is the beginning of the file)\n'
														
 
															+        '1|\n'
														
 
															+        '(this is the end of the file)\n'
														
 
															+        '[File hello.py created.]\n'
														
 
															+    ).strip().split('\n')
														
 
															+
														
 
															+    action = CmdRunAction(command='cd test')
														
 
															+    logger.info(action, extra={'msg_type': 'ACTION'})
														
 
															+    obs = await runtime.run_action(action)
														
 
															+    logger.info(obs, extra={'msg_type': 'OBSERVATION'})
														
 
															+    assert isinstance(obs, CmdOutputObservation)
														
 
															+    assert obs.exit_code == 0
														
 
															+
														
 
															+    # This should create a file in the current working directory
														
 
															+    # i.e., /root/test/hello.py instead of /root/hello.py
														
 
															+    action = IPythonRunCellAction(code="create_file('hello.py')")
														
 
															+    logger.info(action, extra={'msg_type': 'ACTION'})
														
 
															+    obs = await runtime.run_action(action)
														
 
															+    logger.info(obs, extra={'msg_type': 'OBSERVATION'})
														
 
															+    assert isinstance(obs, IPythonRunCellObservation)
														
 
															+    assert obs.content.replace('\r\n', '\n').strip().split('\n') == (
														
 
															+        '[File: /root/test/hello.py (1 lines total)]\n'
														
 
															+        '(this is the beginning of the file)\n'
														
 
															+        '1|\n'
														
 
															+        '(this is the end of the file)\n'
														
 
															+        '[File hello.py created.]\n'
														
 
															+    ).strip().split('\n')
														
 
															+
														
 
															+    await runtime.close()
														
 
															+    await asyncio.sleep(1)
														
 
															+
														
 
															+
														
 
															 @pytest.mark.skipif(
														
 
															     TEST_RUNTIME.lower() == 'eventstream',
														
 
															     reason='Skip this if we want to test EventStreamRuntime',
														
@@ -1082,6 +1154,9 @@ async def test_copy_single_file(temp_dir, box_class):
 
															     assert obs.exit_code == 0
														
 
															     assert 'Hello, World!' in obs.content
														
 
															+    await runtime.close()
														
 
															+    await asyncio.sleep(1)
														
 
															+
														
 
															 def _create_test_dir_with_files(host_temp_dir):
														
 
															     os.mkdir(os.path.join(host_temp_dir, 'test_dir'))
														
@@ -1129,6 +1204,9 @@ async def test_copy_directory_recursively(temp_dir, box_class):
 
															     assert obs.exit_code == 0
														
 
															     assert 'File 1 content' in obs.content
														
 
															+    await runtime.close()
														
 
															+    await asyncio.sleep(1)
														
 
															+
														
 
															 @pytest.mark.asyncio
														
 
															 async def test_copy_to_non_existent_directory(temp_dir, box_class):
														
@@ -1148,6 +1226,9 @@ async def test_copy_to_non_existent_directory(temp_dir, box_class):
 
															     assert obs.exit_code == 0
														
 
															     assert 'Hello, World!' in obs.content
														
 
															+    await runtime.close()
														
 
															+    await asyncio.sleep(1)
														
 
															+
														
 
															 @pytest.mark.asyncio
														
 
															 async def test_overwrite_existing_file(temp_dir, box_class):
														
@@ -1183,6 +1264,9 @@ async def test_overwrite_existing_file(temp_dir, box_class):
 
															     assert obs.exit_code == 0
														
 
															     assert 'Hello, World!' in obs.content
														
 
															+    await runtime.close()
														
 
															+    await asyncio.sleep(1)
														
 
															+
														
 
															 @pytest.mark.asyncio
														
 
															 async def test_copy_non_existent_file(temp_dir, box_class):
														
@@ -1200,3 +1284,33 @@ async def test_copy_non_existent_file(temp_dir, box_class):
 
															     logger.info(obs, extra={'msg_type': 'OBSERVATION'})
														
 
															     assert isinstance(obs, CmdOutputObservation)
														
 
															     assert obs.exit_code != 0  # File should not exist
														
 
															+
														
 
															+    await runtime.close()
														
 
															+    await asyncio.sleep(1)
														
 
															+
														
 
															+
														
 
															+@pytest.mark.asyncio
														
 
															+async def test_keep_prompt(temp_dir):
														
 
															+    # only EventStreamRuntime supports keep_prompt
														
 
															+    runtime = await _load_runtime(
														
 
															+        temp_dir, box_class=EventStreamRuntime, run_as_devin=False
														
 
															+    )
														
 
															+
														
 
															+    action = CmdRunAction(command='touch /workspace/test_file.txt')
														
 
															+    logger.info(action, extra={'msg_type': 'ACTION'})
														
 
															+    obs = await runtime.run_action(action)
														
 
															+    logger.info(obs, extra={'msg_type': 'OBSERVATION'})
														
 
															+    assert isinstance(obs, CmdOutputObservation)
														
 
															+    assert obs.exit_code == 0
														
 
															+    assert 'root@' in obs.content
														
 
															+
														
 
															+    action = CmdRunAction(command='cat /workspace/test_file.txt', keep_prompt=False)
														
 
															+    logger.info(action, extra={'msg_type': 'ACTION'})
														
 
															+    obs = await runtime.run_action(action)
														
 
															+    logger.info(obs, extra={'msg_type': 'OBSERVATION'})
														
 
															+    assert isinstance(obs, CmdOutputObservation)
														
 
															+    assert obs.exit_code == 0
														
 
															+    assert 'root@' not in obs.content
														
 
															+
														
 
															+    await runtime.close()
														
 
															+    await asyncio.sleep(1)