# backend/src/tools/builtins/task_tool.py

"""Task tool for delegating work to subagents."""

import logging
import time
import uuid
from typing import Annotated, Literal

from langchain.tools import InjectedToolCallId, ToolRuntime, tool
from langgraph.typing import ContextT
from langgraph.config import get_stream_writer

from src.agents.thread_state import ThreadState
from src.subagents import SubagentExecutor, get_subagent_config
from src.subagents.executor import SubagentStatus, get_background_task_result

logger = logging.getLogger(__name__)


@tool("task", parse_docstring=True)
def task_tool(
    runtime: ToolRuntime[ContextT, ThreadState],
    description: str,
    prompt: str,
    subagent_type: Literal["general-purpose", "bash"],
    tool_call_id: Annotated[str, InjectedToolCallId],
    max_turns: int | None = None,
) -> str:
    """Delegate a task to a specialized subagent that runs in its own context.

    Subagents help you:
    - Preserve context by keeping exploration and implementation separate
    - Handle complex multi-step tasks autonomously
    - Execute commands or operations in isolated contexts

    Available subagent types:
    - **general-purpose**: A capable agent for complex, multi-step tasks that require
      both exploration and action. Use when the task requires complex reasoning,
      multiple dependent steps, or would benefit from isolated context.
    - **bash**: Command execution specialist for running bash commands. Use for
      git operations, build processes, or when command output would be verbose.

    When to use this tool:
    - Complex tasks requiring multiple steps or tools
    - Tasks that produce verbose output
    - When you want to isolate context from the main conversation
    - Parallel research or exploration tasks

    When NOT to use this tool:
    - Simple, single-step operations (use tools directly)
    - Tasks requiring user interaction or clarification

    Args:
        description: A short (3-5 word) description of the task for logging/display. ALWAYS PROVIDE THIS PARAMETER FIRST.
        prompt: The task description for the subagent. Be specific and clear about what needs to be done. ALWAYS PROVIDE THIS PARAMETER SECOND.
        subagent_type: The type of subagent to use. ALWAYS PROVIDE THIS PARAMETER THIRD.
        max_turns: Optional maximum number of agent turns. Defaults to subagent's configured max.
    """
    # NOTE(review): the docstring above is handed to ``@tool(parse_docstring=True)``,
    # so it is presumably model-facing text; it is intentionally left untouched.
    #
    # Flow: resolve the subagent config, start the subagent in the background,
    # then poll its result here and return a plain string describing the outcome
    # (success, failure, disappearance, or timeout). Progress is mirrored to the
    # stream writer as ``task_*`` events.

    # Polling policy. The timeout message below says "5 minutes", so keep
    # poll_interval_seconds * max_polls == 300.
    poll_interval_seconds = 5
    max_polls = 60  # 60 * 5s = 5 minutes

    # Get subagent configuration
    config = get_subagent_config(subagent_type)
    if config is None:
        return f"Error: Unknown subagent type '{subagent_type}'. Available: general-purpose, bash"

    # Override max_turns if specified
    if max_turns is not None:
        # Create a copy with updated max_turns instead of mutating the looked-up config
        from dataclasses import replace

        config = replace(config, max_turns=max_turns)

    # Extract parent context from runtime
    sandbox_state = None
    thread_data = None
    thread_id = None
    parent_model = None
    trace_id = None

    if runtime is not None:
        sandbox_state = runtime.state.get("sandbox")
        thread_data = runtime.state.get("thread_data")
        thread_id = runtime.context.get("thread_id")

        # Try to get parent model from the run metadata
        metadata = runtime.config.get("metadata", {})
        parent_model = metadata.get("model_name")

        # Reuse the caller's trace_id when present, otherwise generate a short one
        trace_id = metadata.get("trace_id") or str(uuid.uuid4())[:8]

    # Get available tools (excluding task tool to prevent nesting)
    # Lazy import to avoid circular dependency
    from src.tools import get_available_tools

    # Subagents should not have subagent tools enabled (prevent recursive nesting)
    tools = get_available_tools(model_name=parent_model, subagent_enabled=False)

    # Create executor
    executor = SubagentExecutor(
        config=config,
        tools=tools,
        parent_model=parent_model,
        sandbox_state=sandbox_state,
        thread_data=thread_data,
        thread_id=thread_id,
        trace_id=trace_id,
    )

    # Start background execution (always async to prevent blocking)
    # Use tool_call_id as task_id for better traceability
    task_id = executor.execute_async(prompt, task_id=tool_call_id)
    logger.info("[trace=%s] Started background task %s, polling for completion...", trace_id, task_id)

    # Poll for task completion in backend (removes need for LLM to poll)
    poll_count = 0
    last_status = None

    writer = get_stream_writer()
    # Send Task Started message
    writer({"type": "task_started", "task_id": task_id, "description": description})

    while True:
        result = get_background_task_result(task_id)

        if result is None:
            logger.error("[trace=%s] Task %s not found in background tasks", trace_id, task_id)
            writer({"type": "task_failed", "task_id": task_id, "error": "Task disappeared from background tasks"})
            return f"Error: Task {task_id} disappeared from background tasks"

        # Log status changes for debugging
        if result.status != last_status:
            logger.info("[trace=%s] Task %s status: %s", trace_id, task_id, result.status.value)
            last_status = result.status

        # Check if task completed or failed
        if result.status == SubagentStatus.COMPLETED:
            writer({"type": "task_completed", "task_id": task_id, "result": result.result})
            logger.info("[trace=%s] Task %s completed after %s polls", trace_id, task_id, poll_count)
            return f"Task Succeeded. Result: {result.result}"
        if result.status == SubagentStatus.FAILED:
            writer({"type": "task_failed", "task_id": task_id, "error": result.error})
            logger.error("[trace=%s] Task %s failed: %s", trace_id, task_id, result.error)
            return f"Task failed. Error: {result.error}"

        # Timeout protection. Checked *after* the fresh status read above and
        # *before* sleeping, so that (a) a task finishing during the final wait
        # is still reported as completed/failed rather than timed out, and
        # (b) the loop gives up after exactly max_polls sleeps (5 minutes),
        # not one interval later.
        if poll_count >= max_polls:
            logger.warning("[trace=%s] Task %s timed out after %s polls", trace_id, task_id, poll_count)
            writer({"type": "task_timed_out", "task_id": task_id})
            return f"Task timed out after 5 minutes. Status: {result.status.value}"

        # Still running, wait before next poll
        writer({"type": "task_running", "task_id": task_id, "poll_count": poll_count})
        time.sleep(poll_interval_seconds)
        poll_count += 1
feat: support sub agent mechanism 2026-02-05 19:59:25 +08:00			`"""Task tool for delegating work to subagents."""`

feat: fix task polling issue 2026-02-06 16:03:35 +08:00			`import logging`
			`import time`
feat: support sub agent mechanism 2026-02-05 19:59:25 +08:00			`import uuid`
refactor: optimize task tool parameter order and improve task tracking - Reorder task tool parameters to prioritize description first for better usability - Add tool_call_id injection for better task traceability - Use tool_call_id as task_id in executor for consistent tracking - Simplify event messages by removing redundant task_type field - Update task examples in prompt to reflect new parameter order Co-Authored-By: Claude Sonnet 4.5 <noreply@anthropic.com> 2026-02-07 16:04:36 +08:00			`from typing import Annotated, Literal`
feat: support sub agent mechanism 2026-02-05 19:59:25 +08:00
refactor: optimize task tool parameter order and improve task tracking - Reorder task tool parameters to prioritize description first for better usability - Add tool_call_id injection for better task traceability - Use tool_call_id as task_id in executor for consistent tracking - Simplify event messages by removing redundant task_type field - Update task examples in prompt to reflect new parameter order Co-Authored-By: Claude Sonnet 4.5 <noreply@anthropic.com> 2026-02-07 16:04:36 +08:00			`from langchain.tools import InjectedToolCallId, ToolRuntime, tool`
feat: support sub agent mechanism 2026-02-05 19:59:25 +08:00			`from langgraph.typing import ContextT`
feat: send custom event 2026-02-06 17:44:20 +08:00			`from langgraph.config import get_stream_writer`
feat: support sub agent mechanism 2026-02-05 19:59:25 +08:00
			`from src.agents.thread_state import ThreadState`
			`from src.subagents import SubagentExecutor, get_subagent_config`
			`from src.subagents.executor import SubagentStatus, get_background_task_result`

feat: fix task polling issue 2026-02-06 16:03:35 +08:00			`logger = logging.getLogger(__name__)`

feat: support sub agent mechanism 2026-02-05 19:59:25 +08:00
			`@tool("task", parse_docstring=True)`
			`def task_tool(`
			`runtime: ToolRuntime[ContextT, ThreadState],`
			`description: str,`
refactor: optimize task tool parameter order and improve task tracking - Reorder task tool parameters to prioritize description first for better usability - Add tool_call_id injection for better task traceability - Use tool_call_id as task_id in executor for consistent tracking - Simplify event messages by removing redundant task_type field - Update task examples in prompt to reflect new parameter order Co-Authored-By: Claude Sonnet 4.5 <noreply@anthropic.com> 2026-02-07 16:04:36 +08:00			`prompt: str,`
			`subagent_type: Literal["general-purpose", "bash"],`
			`tool_call_id: Annotated[str, InjectedToolCallId],`
feat: support sub agent mechanism 2026-02-05 19:59:25 +08:00			`max_turns: int \| None = None,`
			`) -> str:`
			`"""Delegate a task to a specialized subagent that runs in its own context.`

			`Subagents help you:`
			`- Preserve context by keeping exploration and implementation separate`
			`- Handle complex multi-step tasks autonomously`
			`- Execute commands or operations in isolated contexts`

			`Available subagent types:`
			`- general-purpose: A capable agent for complex, multi-step tasks that require`
			`both exploration and action. Use when the task requires complex reasoning,`
			`multiple dependent steps, or would benefit from isolated context.`
			`- bash: Command execution specialist for running bash commands. Use for`
			`git operations, build processes, or when command output would be verbose.`

			`When to use this tool:`
			`- Complex tasks requiring multiple steps or tools`
			`- Tasks that produce verbose output`
			`- When you want to isolate context from the main conversation`
			`- Parallel research or exploration tasks`

			`When NOT to use this tool:`
			`- Simple, single-step operations (use tools directly)`
			`- Tasks requiring user interaction or clarification`

			`Args:`
refactor: optimize task tool parameter order and improve task tracking - Reorder task tool parameters to prioritize description first for better usability - Add tool_call_id injection for better task traceability - Use tool_call_id as task_id in executor for consistent tracking - Simplify event messages by removing redundant task_type field - Update task examples in prompt to reflect new parameter order Co-Authored-By: Claude Sonnet 4.5 <noreply@anthropic.com> 2026-02-07 16:04:36 +08:00			`description: A short (3-5 word) description of the task for logging/display. ALWAYS PROVIDE THIS PARAMETER FIRST.`
			`prompt: The task description for the subagent. Be specific and clear about what needs to be done. ALWAYS PROVIDE THIS PARAMETER SECOND.`
			`subagent_type: The type of subagent to use. ALWAYS PROVIDE THIS PARAMETER THIRD.`
feat: support sub agent mechanism 2026-02-05 19:59:25 +08:00			`max_turns: Optional maximum number of agent turns. Defaults to subagent's configured max.`
			`"""`
			`# Get subagent configuration`
			`config = get_subagent_config(subagent_type)`
			`if config is None:`
			`return f"Error: Unknown subagent type '{subagent_type}'. Available: general-purpose, bash"`

			`# Override max_turns if specified`
			`if max_turns is not None:`
			`# Create a copy with updated max_turns`
			`from dataclasses import replace`

			`config = replace(config, max_turns=max_turns)`

			`# Extract parent context from runtime`
			`sandbox_state = None`
			`thread_data = None`
			`thread_id = None`
			`parent_model = None`
			`trace_id = None`

			`if runtime is not None:`
			`sandbox_state = runtime.state.get("sandbox")`
			`thread_data = runtime.state.get("thread_data")`
			`thread_id = runtime.context.get("thread_id")`

			`# Try to get parent model from configurable`
			`metadata = runtime.config.get("metadata", {})`
			`parent_model = metadata.get("model_name")`

			`# Get or generate trace_id for distributed tracing`
			`trace_id = metadata.get("trace_id") or str(uuid.uuid4())[:8]`

			`# Get available tools (excluding task tool to prevent nesting)`
			`# Lazy import to avoid circular dependency`
			`from src.tools import get_available_tools`

feat: add ultra mode 2026-02-06 15:42:53 +08:00			`# Subagents should not have subagent tools enabled (prevent recursive nesting)`
			`tools = get_available_tools(model_name=parent_model, subagent_enabled=False)`
feat: support sub agent mechanism 2026-02-05 19:59:25 +08:00
			`# Create executor`
			`executor = SubagentExecutor(`
			`config=config,`
			`tools=tools,`
			`parent_model=parent_model,`
			`sandbox_state=sandbox_state,`
			`thread_data=thread_data,`
			`thread_id=thread_id,`
			`trace_id=trace_id,`
			`)`

feat: fix task polling issue 2026-02-06 16:03:35 +08:00			`# Start background execution (always async to prevent blocking)`
refactor: optimize task tool parameter order and improve task tracking - Reorder task tool parameters to prioritize description first for better usability - Add tool_call_id injection for better task traceability - Use tool_call_id as task_id in executor for consistent tracking - Simplify event messages by removing redundant task_type field - Update task examples in prompt to reflect new parameter order Co-Authored-By: Claude Sonnet 4.5 <noreply@anthropic.com> 2026-02-07 16:04:36 +08:00			`# Use tool_call_id as task_id for better traceability`
			`task_id = executor.execute_async(prompt, task_id=tool_call_id)`
feat: fix task polling issue 2026-02-06 16:03:35 +08:00			`logger.info(f"[trace={trace_id}] Started background task {task_id}, polling for completion...")`

			`# Poll for task completion in backend (removes need for LLM to poll)`
			`poll_count = 0`
			`last_status = None`

feat: send custom event 2026-02-06 17:44:20 +08:00			`writer = get_stream_writer()`
			`# Send Task Started message'`
refactor: optimize task tool parameter order and improve task tracking - Reorder task tool parameters to prioritize description first for better usability - Add tool_call_id injection for better task traceability - Use tool_call_id as task_id in executor for consistent tracking - Simplify event messages by removing redundant task_type field - Update task examples in prompt to reflect new parameter order Co-Authored-By: Claude Sonnet 4.5 <noreply@anthropic.com> 2026-02-07 16:04:36 +08:00			`writer({"type": "task_started", "task_id": task_id, "description": description})`
feat: send custom event 2026-02-06 17:44:20 +08:00

feat: fix task polling issue 2026-02-06 16:03:35 +08:00			`while True:`
			`result = get_background_task_result(task_id)`

			`if result is None:`
			`logger.error(f"[trace={trace_id}] Task {task_id} not found in background tasks")`
refactor: optimize task tool parameter order and improve task tracking - Reorder task tool parameters to prioritize description first for better usability - Add tool_call_id injection for better task traceability - Use tool_call_id as task_id in executor for consistent tracking - Simplify event messages by removing redundant task_type field - Update task examples in prompt to reflect new parameter order Co-Authored-By: Claude Sonnet 4.5 <noreply@anthropic.com> 2026-02-07 16:04:36 +08:00			`writer({"type": "task_failed", "task_id": task_id, "error": "Task disappeared from background tasks"})`
feat: fix task polling issue 2026-02-06 16:03:35 +08:00			`return f"Error: Task {task_id} disappeared from background tasks"`

			`# Log status changes for debugging`
			`if result.status != last_status:`
			`logger.info(f"[trace={trace_id}] Task {task_id} status: {result.status.value}")`
			`last_status = result.status`

			`# Check if task completed or failed`
			`if result.status == SubagentStatus.COMPLETED:`
refactor: optimize task tool parameter order and improve task tracking - Reorder task tool parameters to prioritize description first for better usability - Add tool_call_id injection for better task traceability - Use tool_call_id as task_id in executor for consistent tracking - Simplify event messages by removing redundant task_type field - Update task examples in prompt to reflect new parameter order Co-Authored-By: Claude Sonnet 4.5 <noreply@anthropic.com> 2026-02-07 16:04:36 +08:00			`writer({"type": "task_completed", "task_id": task_id, "result": result.result})`
feat: fix task polling issue 2026-02-06 16:03:35 +08:00			`logger.info(f"[trace={trace_id}] Task {task_id} completed after {poll_count} polls")`
			`return f"Task Succeeded. Result: {result.result}"`
			`elif result.status == SubagentStatus.FAILED:`
refactor: optimize task tool parameter order and improve task tracking - Reorder task tool parameters to prioritize description first for better usability - Add tool_call_id injection for better task traceability - Use tool_call_id as task_id in executor for consistent tracking - Simplify event messages by removing redundant task_type field - Update task examples in prompt to reflect new parameter order Co-Authored-By: Claude Sonnet 4.5 <noreply@anthropic.com> 2026-02-07 16:04:36 +08:00			`writer({"type": "task_failed", "task_id": task_id, "error": result.error})`
feat: fix task polling issue 2026-02-06 16:03:35 +08:00			`logger.error(f"[trace={trace_id}] Task {task_id} failed: {result.error}")`
			`return f"Task failed. Error: {result.error}"`

			`# Still running, wait before next poll`
refactor: optimize task tool parameter order and improve task tracking - Reorder task tool parameters to prioritize description first for better usability - Add tool_call_id injection for better task traceability - Use tool_call_id as task_id in executor for consistent tracking - Simplify event messages by removing redundant task_type field - Update task examples in prompt to reflect new parameter order Co-Authored-By: Claude Sonnet 4.5 <noreply@anthropic.com> 2026-02-07 16:04:36 +08:00			`writer({"type": "task_running", "task_id": task_id, "poll_count": poll_count})`
feat: send custom event 2026-02-06 17:44:20 +08:00			`time.sleep(5) # Poll every 5 seconds`
feat: fix task polling issue 2026-02-06 16:03:35 +08:00			`poll_count += 1`

			`# Optional: Add timeout protection (e.g., max 5 minutes)`
feat: send custom event 2026-02-06 17:44:20 +08:00			`if poll_count > 60: # 60 * 5s = 5 minutes`
feat: fix task polling issue 2026-02-06 16:03:35 +08:00			`logger.warning(f"[trace={trace_id}] Task {task_id} timed out after {poll_count} polls")`
refactor: optimize task tool parameter order and improve task tracking - Reorder task tool parameters to prioritize description first for better usability - Add tool_call_id injection for better task traceability - Use tool_call_id as task_id in executor for consistent tracking - Simplify event messages by removing redundant task_type field - Update task examples in prompt to reflect new parameter order Co-Authored-By: Claude Sonnet 4.5 <noreply@anthropic.com> 2026-02-07 16:04:36 +08:00			`writer({"type": "task_timed_out", "task_id": task_id})`
feat: fix task polling issue 2026-02-06 16:03:35 +08:00			`return f"Task timed out after 5 minutes. Status: {result.status.value}"`