2026-01-15 14:37:00 +08:00
|
|
|
import re
|
|
|
|
|
|
2026-01-14 12:32:34 +08:00
|
|
|
from langchain.tools import ToolRuntime, tool
|
|
|
|
|
from langgraph.typing import ContextT
|
2026-01-14 07:19:34 +08:00
|
|
|
|
2026-01-15 14:37:00 +08:00
|
|
|
from src.agents.thread_state import ThreadDataState, ThreadState
|
2026-01-17 23:23:12 +08:00
|
|
|
from src.sandbox.exceptions import (
|
|
|
|
|
SandboxError,
|
|
|
|
|
SandboxFileError,
|
|
|
|
|
SandboxFileNotFoundError,
|
|
|
|
|
SandboxNotFoundError,
|
|
|
|
|
SandboxRuntimeError,
|
|
|
|
|
)
|
2026-01-14 12:32:34 +08:00
|
|
|
from src.sandbox.sandbox import Sandbox
|
2026-01-14 07:19:34 +08:00
|
|
|
from src.sandbox.sandbox_provider import get_sandbox_provider
|
|
|
|
|
|
2026-01-15 14:37:00 +08:00
|
|
|
# Virtual path prefix used in sandbox environments
VIRTUAL_PATH_PREFIX = "/mnt/user-data"


def replace_virtual_path(path: str, thread_data: ThreadDataState | None) -> str:
    """Replace a virtual /mnt/user-data path with the actual thread data path.

    Mapping:
        /mnt/user-data/workspace/* -> thread_data['workspace_path']/*
        /mnt/user-data/uploads/* -> thread_data['uploads_path']/*
        /mnt/user-data/outputs/* -> thread_data['outputs_path']/*

    The path is returned unchanged when ``thread_data`` is None, when the path
    is not located under the virtual prefix, when it names no known
    subdirectory (including the bare prefix itself), or when the matching
    ``thread_data`` entry is missing or None.

    Args:
        path: The path that may contain virtual path prefix.
        thread_data: The thread data containing actual paths.

    Returns:
        The path with virtual prefix replaced by actual path.
    """
    if thread_data is None or not path.startswith(VIRTUAL_PATH_PREFIX):
        return path

    remainder = path[len(VIRTUAL_PATH_PREFIX) :]
    # The prefix must end on a path-component boundary. Without this check a
    # sibling such as "/mnt/user-dataworkspace/x" would have the prefix sliced
    # off and be mapped into the workspace directory by mistake.
    if remainder and not remainder.startswith("/"):
        return path

    # First component selects the mapped directory; everything after the
    # first "/" is carried over verbatim.
    subdir, _, rest = remainder.lstrip("/").partition("/")
    if not subdir:
        return path

    # Virtual subdirectory name -> key holding its real location in thread_data.
    thread_data_keys = {
        "workspace": "workspace_path",
        "uploads": "uploads_path",
        "outputs": "outputs_path",
    }
    key = thread_data_keys.get(subdir)
    actual_base = thread_data.get(key) if key is not None else None
    if actual_base is None:
        return path

    return f"{actual_base}/{rest}" if rest else actual_base
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
def replace_virtual_paths_in_command(command: str, thread_data: ThreadDataState | None) -> str:
    """Rewrite every virtual /mnt/user-data path found in a command string.

    Each occurrence of the virtual prefix (together with the path characters
    that follow it) is passed through ``replace_virtual_path``.

    Args:
        command: The command string that may contain virtual paths.
        thread_data: The thread data containing actual paths.

    Returns:
        The command with all virtual paths replaced; the command itself when
        there is no thread data or the prefix does not occur in it.
    """
    # Nothing to rewrite without thread data or without the prefix in the text.
    if thread_data is None or VIRTUAL_PATH_PREFIX not in command:
        return command

    # The prefix, optionally followed by "/" and a run of characters that are
    # neither whitespace, quotes, nor the shell metacharacters ; & | < > ( ).
    virtual_path_re = re.compile(rf"{re.escape(VIRTUAL_PATH_PREFIX)}(/[^\s\"';&|<>()]*)?")
    return virtual_path_re.sub(
        lambda found: replace_virtual_path(found.group(0), thread_data),
        command,
    )
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
def get_thread_data(runtime: ToolRuntime[ContextT, ThreadState] | None) -> ThreadDataState | None:
    """Return the ``thread_data`` entry of the runtime state.

    Args:
        runtime: The tool runtime, or None when no runtime is available.

    Returns:
        ``runtime.state.get("thread_data")``, or None when ``runtime`` is None.
    """
    return None if runtime is None else runtime.state.get("thread_data")
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
def is_local_sandbox(runtime: ToolRuntime[ContextT, ThreadState] | None) -> bool:
    """Tell whether the sandbox recorded in the runtime state is the local one.

    Path replacement is only needed for local sandbox since aio sandbox
    already has /mnt/user-data mounted in the container.

    Args:
        runtime: The tool runtime, or None when no runtime is available.

    Returns:
        True only when the runtime has a "sandbox" state entry whose
        "sandbox_id" equals "local"; False in every other case.
    """
    state = None if runtime is None else runtime.state.get("sandbox")
    if state is None:
        return False
    return state.get("sandbox_id") == "local"
|
|
|
|
|
|
2026-01-14 07:19:34 +08:00
|
|
|
|
2026-01-14 12:32:34 +08:00
|
|
|
def sandbox_from_runtime(runtime: ToolRuntime[ContextT, ThreadState] | None = None) -> Sandbox:
    """Look up the sandbox instance referenced by the tool runtime state.

    The sandbox ID is read from ``runtime.state["sandbox"]["sandbox_id"]`` and
    resolved through the sandbox provider.

    Args:
        runtime: The tool runtime carrying the thread state.

    Returns:
        The sandbox registered with the provider under the stored ID.

    Raises:
        SandboxRuntimeError: If runtime is not available or sandbox state is missing.
        SandboxNotFoundError: If sandbox with the given ID cannot be found.
    """
    if runtime is None:
        raise SandboxRuntimeError("Tool runtime not available")

    state = runtime.state.get("sandbox")
    if state is None:
        raise SandboxRuntimeError("Sandbox state not initialized in runtime")

    sandbox_id = state.get("sandbox_id")
    if sandbox_id is None:
        raise SandboxRuntimeError("Sandbox ID not found in state")

    found = get_sandbox_provider().get(sandbox_id)
    if found is not None:
        return found
    raise SandboxNotFoundError(f"Sandbox with ID '{sandbox_id}' not found", sandbox_id=sandbox_id)
|
|
|
|
|
|
|
|
|
|
|
2026-01-14 07:19:34 +08:00
|
|
|
# NOTE: the docstring below is handed to @tool(parse_docstring=True), so it is
# presumably what the model sees as the tool description and argument help.
# Treat it as runtime text rather than as ordinary documentation.
@tool("bash", parse_docstring=True)
def bash_tool(runtime: ToolRuntime[ContextT, ThreadState], description: str, command: str) -> str:
    """Execute a bash command in a Linux environment.


    - Use `python` to run Python code.
    - Use `pip install` to install Python packages.

    Args:
        description: Explain why you are running this command in short words. ALWAYS PROVIDE THIS PARAMETER FIRST.
        command: The bash command to execute. Always use absolute paths for files and directories.
    """
    # Every failure is reported back as an "Error: ..." string instead of being
    # raised, so the caller always receives text.
    try:
        sandbox = sandbox_from_runtime(runtime)
        # Only the local sandbox needs /mnt/user-data paths rewritten to the
        # real thread directories.
        if is_local_sandbox(runtime):
            command = replace_virtual_paths_in_command(command, get_thread_data(runtime))
        return sandbox.execute_command(command)
    except SandboxError as err:
        return f"Error: {err}"
    except Exception as err:
        return f"Error: Unexpected error executing command: {type(err).__name__}: {err}"
|
2026-01-14 07:19:34 +08:00
|
|
|
|
|
|
|
|
|
|
|
|
|
# NOTE: the docstring below is handed to @tool(parse_docstring=True), so it is
# presumably what the model sees as the tool description and argument help.
# Treat it as runtime text rather than as ordinary documentation.
@tool("ls", parse_docstring=True)
def ls_tool(runtime: ToolRuntime[ContextT, ThreadState], description: str, path: str) -> str:
    """List the contents of a directory up to 2 levels deep in tree format.

    Args:
        description: Explain why you are listing this directory in short words. ALWAYS PROVIDE THIS PARAMETER FIRST.
        path: The **absolute** path to the directory to list.
    """
    # Every failure is reported back as an "Error: ..." string instead of being
    # raised, so the caller always receives text.
    try:
        sandbox = sandbox_from_runtime(runtime)
        # Only the local sandbox needs /mnt/user-data paths rewritten. `path`
        # is rebound, so the error messages below show the rewritten path.
        if is_local_sandbox(runtime):
            path = replace_virtual_path(path, get_thread_data(runtime))
        entries = sandbox.list_dir(path)
        return "\n".join(entries) if entries else "(empty)"
    except SandboxError as err:
        return f"Error: {err}"
    except FileNotFoundError:
        return f"Error: Directory not found: {path}"
    except PermissionError:
        return f"Error: Permission denied: {path}"
    except Exception as err:
        return f"Error: Unexpected error listing directory: {type(err).__name__}: {err}"
|
2026-01-14 07:19:34 +08:00
|
|
|
|
|
|
|
|
|
|
|
|
|
def _select_line_range(content: str, start_line: int | None, end_line: int | None) -> str:
    """Return the requested 1-indexed, inclusive line range of ``content``.

    A bound left as None is open-ended, so either bound may be given alone.
    ``start_line`` values below 1 are clamped to the first line and negative
    ``end_line`` values are clamped to 0, because a negative slice index would
    otherwise count from the end of the file and return unrelated lines.

    Args:
        content: The full text to cut lines from.
        start_line: First line to keep (1-indexed, inclusive), or None.
        end_line: Last line to keep (1-indexed, inclusive), or None.

    Returns:
        ``content`` unchanged when both bounds are None, otherwise the selected
        lines joined with "\\n".
    """
    if start_line is None and end_line is None:
        return content
    first = 0 if start_line is None else max(start_line, 1) - 1
    last = None if end_line is None else max(end_line, 0)
    return "\n".join(content.splitlines()[first:last])


# NOTE: the docstring below is handed to @tool(parse_docstring=True), so it is
# presumably what the model sees as the tool description and argument help.
# Treat it as runtime text rather than as ordinary documentation.
@tool("read_file", parse_docstring=True)
def read_file_tool(
    runtime: ToolRuntime[ContextT, ThreadState],
    description: str,
    path: str,
    start_line: int | None = None,
    end_line: int | None = None,
) -> str:
    """Read the contents of a text file. Use this to examine source code, configuration files, logs, or any text-based file.

    Args:
        description: Explain why you are reading this file in short words. ALWAYS PROVIDE THIS PARAMETER FIRST.
        path: The **absolute** path to the file to read.
        start_line: Optional starting line number (1-indexed, inclusive). Use with end_line to read a specific range.
        end_line: Optional ending line number (1-indexed, inclusive). Use with start_line to read a specific range.
    """
    # Every failure is reported back as an "Error: ..." string instead of being
    # raised, so the caller always receives text.
    try:
        sandbox = sandbox_from_runtime(runtime)
        # Only the local sandbox needs /mnt/user-data paths rewritten. `path`
        # is rebound, so the error messages below show the rewritten path.
        if is_local_sandbox(runtime):
            path = replace_virtual_path(path, get_thread_data(runtime))
        content = sandbox.read_file(path)
        if not content:
            return "(empty)"
        # Honour each bound on its own and clamp out-of-range values instead of
        # ignoring a lone bound or slicing with a negative index.
        return _select_line_range(content, start_line, end_line)
    except SandboxError as err:
        return f"Error: {err}"
    except FileNotFoundError:
        return f"Error: File not found: {path}"
    except PermissionError:
        return f"Error: Permission denied reading file: {path}"
    except IsADirectoryError:
        return f"Error: Path is a directory, not a file: {path}"
    except Exception as err:
        return f"Error: Unexpected error reading file: {type(err).__name__}: {err}"
|
2026-01-14 07:19:34 +08:00
|
|
|
|
|
|
|
|
|
|
|
|
|
# NOTE: the docstring below is handed to @tool(parse_docstring=True), so it is
# presumably what the model sees as the tool description and argument help.
# Treat it as runtime text rather than as ordinary documentation.
# NOTE(review): `append` has no entry in the Args section - confirm whether it
# should be described there.
@tool("write_file", parse_docstring=True)
def write_file_tool(
    runtime: ToolRuntime[ContextT, ThreadState],
    description: str,
    path: str,
    content: str,
    append: bool = False,
) -> str:
    """Write text content to a file.

    Args:
        description: Explain why you are writing to this file in short words. ALWAYS PROVIDE THIS PARAMETER FIRST.
        path: The **absolute** path to the file to write to. ALWAYS PROVIDE THIS PARAMETER SECOND.
        content: The content to write to the file. ALWAYS PROVIDE THIS PARAMETER THIRD.
    """
    # Every failure is reported back as an "Error: ..." string instead of being
    # raised, so the caller always receives text.
    try:
        sandbox = sandbox_from_runtime(runtime)
        # Only the local sandbox needs /mnt/user-data paths rewritten. `path`
        # is rebound, so the error messages below show the rewritten path.
        if is_local_sandbox(runtime):
            path = replace_virtual_path(path, get_thread_data(runtime))
        # `append` is forwarded unchanged as the third positional argument.
        sandbox.write_file(path, content, append)
    except SandboxError as err:
        return f"Error: {err}"
    except PermissionError:
        return f"Error: Permission denied writing to file: {path}"
    except IsADirectoryError:
        return f"Error: Path is a directory, not a file: {path}"
    except OSError as err:
        # Must stay after the two OSError subclasses handled above.
        return f"Error: Failed to write file '{path}': {err}"
    except Exception as err:
        return f"Error: Unexpected error writing file: {type(err).__name__}: {err}"
    return "OK"
|
2026-01-14 07:19:34 +08:00
|
|
|
|
|
|
|
|
|
|
|
|
|
# NOTE: the docstring below is handed to @tool(parse_docstring=True), so it is
# presumably what the model sees as the tool description and argument help.
# Treat it as runtime text rather than as ordinary documentation.
# NOTE(review): the docstring says the substring must appear exactly once when
# replace_all is False, but the code only replaces the first occurrence and
# does not check uniqueness - confirm which behaviour is intended.
@tool("str_replace", parse_docstring=True)
def str_replace_tool(
    runtime: ToolRuntime[ContextT, ThreadState],
    description: str,
    path: str,
    old_str: str,
    new_str: str,
    replace_all: bool = False,
) -> str:
    """Replace a substring in a file with another substring.
    If `replace_all` is False (default), the substring to replace must appear **exactly once** in the file.

    Args:
        description: Explain why you are replacing the substring in short words. ALWAYS PROVIDE THIS PARAMETER FIRST.
        path: The **absolute** path to the file to replace the substring in. ALWAYS PROVIDE THIS PARAMETER SECOND.
        old_str: The substring to replace. ALWAYS PROVIDE THIS PARAMETER THIRD.
        new_str: The new substring. ALWAYS PROVIDE THIS PARAMETER FOURTH.
        replace_all: Whether to replace all occurrences of the substring. If False, only the first occurrence will be replaced. Default is False.
    """
    # Every failure is reported back as an "Error: ..." string instead of being
    # raised, so the caller always receives text.
    try:
        sandbox = sandbox_from_runtime(runtime)
        # Only the local sandbox needs /mnt/user-data paths rewritten. `path`
        # is rebound, so the error messages below show the rewritten path.
        if is_local_sandbox(runtime):
            path = replace_virtual_path(path, get_thread_data(runtime))

        # A falsy read result is treated as empty text. An empty file then
        # goes through the same "not found" check as any other file instead of
        # reporting "OK" although nothing was replaced.
        content = sandbox.read_file(path) or ""
        if old_str not in content:
            return f"Error: String to replace not found in file: {path}"

        # str.replace treats a negative count as "replace every occurrence".
        max_replacements = -1 if replace_all else 1
        sandbox.write_file(path, content.replace(old_str, new_str, max_replacements))
        return "OK"
    except SandboxError as err:
        return f"Error: {err}"
    except FileNotFoundError:
        return f"Error: File not found: {path}"
    except PermissionError:
        return f"Error: Permission denied accessing file: {path}"
    except Exception as err:
        return f"Error: Unexpected error replacing string: {type(err).__name__}: {err}"
|