backend/packages/harness/deerflow/agents/middlewares/title_middleware.py

"""Middleware for automatic thread title generation."""

from typing import NotRequired, override

from langchain.agents import AgentState
from langchain.agents.middleware import AgentMiddleware
from langgraph.runtime import Runtime

from deerflow.config.title_config import get_title_config
from deerflow.models import create_chat_model


class TitleMiddlewareState(AgentState):
    """Compatible with the `ThreadState` schema."""

    title: NotRequired[str | None]


class TitleMiddleware(AgentMiddleware[TitleMiddlewareState]):
    """Automatically generate a title for the thread after the first user message."""

    state_schema = TitleMiddlewareState

    def _should_generate_title(self, state: TitleMiddlewareState) -> bool:
        """Check if we should generate a title for this thread."""
        config = get_title_config()
        if not config.enabled:
            return False

        # Check if thread already has a title in state
        if state.get("title"):
            return False

        # Check if this is the first turn (has at least one user message and one assistant response)
        messages = state.get("messages", [])
        if len(messages) < 2:
            return False

        # Count user and assistant messages
        user_messages = [m for m in messages if m.type == "human"]
        assistant_messages = [m for m in messages if m.type == "ai"]

        # Generate title after first complete exchange
        return len(user_messages) == 1 and len(assistant_messages) >= 1

    async def _generate_title(self, state: TitleMiddlewareState) -> str:
        """Generate a concise title based on the conversation."""
        config = get_title_config()
        messages = state.get("messages", [])

        # Get first user message and first assistant response
        user_msg_content = next((m.content for m in messages if m.type == "human"), "")
        assistant_msg_content = next((m.content for m in messages if m.type == "ai"), "")

        # Ensure content is string (LangChain messages can have list content)
        user_msg = str(user_msg_content) if user_msg_content else ""
        assistant_msg = str(assistant_msg_content) if assistant_msg_content else ""

        # Use a lightweight model to generate title
        model = create_chat_model(thinking_enabled=False)

        prompt = config.prompt_template.format(
            max_words=config.max_words,
            user_msg=user_msg[:500],
            assistant_msg=assistant_msg[:500],
        )

        try:
            response = await model.ainvoke(prompt)
            # Ensure response content is string
            title_content = str(response.content) if response.content else ""
            title = title_content.strip().strip('"').strip("'")
            # Limit to max characters
            return title[: config.max_chars] if len(title) > config.max_chars else title
        except Exception as e:
            print(f"Failed to generate title: {e}")
            # Fallback: use first part of user message (by character count)
            fallback_chars = min(config.max_chars, 50)  # Use max_chars or 50, whichever is smaller
            if len(user_msg) > fallback_chars:
                return user_msg[:fallback_chars].rstrip() + "..."
            return user_msg if user_msg else "New Conversation"

    @override
    async def aafter_model(self, state: TitleMiddlewareState, runtime: Runtime) -> dict | None:
        """Generate and set thread title after the first agent response."""
        if self._should_generate_title(state):
            title = await self._generate_title(state)
            print(f"Generated thread title: {title}")

            # Store title in state (will be persisted by checkpointer if configured)
            return {"title": title}

        return None
feat: add AIO sandbox provider and auto title generation (#1) - Add AioSandboxProvider for Docker-based sandbox execution with configurable container lifecycle, volume mounts, and port management - Add TitleMiddleware to auto-generate thread titles after first user-assistant exchange using LLM - Add Claude Code documentation (CLAUDE.md, AGENTS.md) - Extend SandboxConfig with Docker-specific options (image, port, mounts) - Fix hardcoded mount path to use expanduser - Add agent-sandbox and dotenv dependencies Co-authored-by: Claude Opus 4.5 <noreply@anthropic.com> 2026-01-14 23:29:18 +08:00			`"""Middleware for automatic thread title generation."""`

			`from typing import NotRequired, override`

			`from langchain.agents import AgentState`
			`from langchain.agents.middleware import AgentMiddleware`
			`from langgraph.runtime import Runtime`

refactor: split backend into harness (deerflow.) and app (app.) (#1131) * refactor: extract shared utils to break harness→app cross-layer imports Move _validate_skill_frontmatter to src/skills/validation.py and CONVERTIBLE_EXTENSIONS + convert_file_to_markdown to src/utils/file_conversion.py. This eliminates the two reverse dependencies from client.py (harness layer) into gateway/routers/ (app layer), preparing for the harness/app package split. Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com> * refactor: split backend/src into harness (deerflow.) and app (app.) Physically split the monolithic backend/src/ package into two layers: - Harness (`packages/harness/deerflow/`): publishable agent framework package with import prefix `deerflow.`. Contains agents, sandbox, tools, models, MCP, skills, config, and all core infrastructure. - App* (`app/`): unpublished application code with import prefix `app.`. Contains gateway (FastAPI REST API) and channels (IM integrations). Key changes: - Move 13 harness modules to packages/harness/deerflow/ via git mv - Move gateway + channels to app/ via git mv - Rename all imports: src. → deerflow.* (harness) / app.* (app layer) - Set up uv workspace with deerflow-harness as workspace member - Update langgraph.json, config.example.yaml, all scripts, Docker files - Add build-system (hatchling) to harness pyproject.toml - Add PYTHONPATH=. to gateway startup commands for app.* resolution - Update ruff.toml with known-first-party for import sorting - Update all documentation to reflect new directory structure Boundary rule enforced: harness code never imports from app. All 429 tests pass. Lint clean. Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com> * chore: add harness→app boundary check test and update docs Add test_harness_boundary.py that scans all Python files in packages/harness/deerflow/ and fails if any `from app.` or `import app.` statement is found. This enforces the architectural rule that the harness layer never depends on the app layer. Update CLAUDE.md to document the harness/app split architecture, import conventions, and the boundary enforcement test. Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com> * feat: add config versioning with auto-upgrade on startup When config.example.yaml schema changes, developers' local config.yaml files can silently become outdated. This adds a config_version field and auto-upgrade mechanism so breaking changes (like src.* → deerflow.* renames) are applied automatically before services start. - Add config_version: 1 to config.example.yaml - Add startup version check warning in AppConfig.from_file() - Add scripts/config-upgrade.sh with migration registry for value replacements - Add `make config-upgrade` target - Auto-run config-upgrade in serve.sh and start-daemon.sh before starting services - Add config error hints in service failure messages Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com> * fix comments * fix: update src.* import in test_sandbox_tools_security to deerflow.* Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com> * fix: handle empty config and search parent dirs for config.example.yaml Address Copilot review comments on PR #1131: - Guard against yaml.safe_load() returning None for empty config files - Search parent directories for config.example.yaml instead of only looking next to config.yaml, fixing detection in common setups Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com> * fix: correct skills root path depth and config_version type coercion - loader.py: fix get_skills_root_path() to use 5 parent levels (was 3) after harness split, file lives at packages/harness/deerflow/skills/ so parent×3 resolved to backend/packages/harness/ instead of backend/ - app_config.py: coerce config_version to int() before comparison in _check_config_version() to prevent TypeError when YAML stores value as string (e.g. config_version: "1") - tests: add regression tests for both fixes Co-Authored-By: Claude Sonnet 4.6 <noreply@anthropic.com> * fix: update test imports from src.* to deerflow./app. after harness refactor Co-Authored-By: Claude Sonnet 4.6 <noreply@anthropic.com> --------- Co-authored-by: Claude Opus 4.6 <noreply@anthropic.com> 2026-03-14 22:55:52 +08:00			`from deerflow.config.title_config import get_title_config`
			`from deerflow.models import create_chat_model`
feat: add AIO sandbox provider and auto title generation (#1) - Add AioSandboxProvider for Docker-based sandbox execution with configurable container lifecycle, volume mounts, and port management - Add TitleMiddleware to auto-generate thread titles after first user-assistant exchange using LLM - Add Claude Code documentation (CLAUDE.md, AGENTS.md) - Extend SandboxConfig with Docker-specific options (image, port, mounts) - Fix hardcoded mount path to use expanduser - Add agent-sandbox and dotenv dependencies Co-authored-by: Claude Opus 4.5 <noreply@anthropic.com> 2026-01-14 23:29:18 +08:00

			`class TitleMiddlewareState(AgentState):`
			"""Compatible with the `ThreadState` schema."""

			`title: NotRequired[str \| None]`


			`class TitleMiddleware(AgentMiddleware[TitleMiddlewareState]):`
			`"""Automatically generate a title for the thread after the first user message."""`

			`state_schema = TitleMiddlewareState`

			`def _should_generate_title(self, state: TitleMiddlewareState) -> bool:`
			`"""Check if we should generate a title for this thread."""`
			`config = get_title_config()`
			`if not config.enabled:`
			`return False`

			`# Check if thread already has a title in state`
			`if state.get("title"):`
			`return False`

			`# Check if this is the first turn (has at least one user message and one assistant response)`
			`messages = state.get("messages", [])`
			`if len(messages) < 2:`
			`return False`

			`# Count user and assistant messages`
			`user_messages = [m for m in messages if m.type == "human"]`
			`assistant_messages = [m for m in messages if m.type == "ai"]`

			`# Generate title after first complete exchange`
			`return len(user_messages) == 1 and len(assistant_messages) >= 1`

Enhance chat UI and compatible anthropic thinking messages (#1018) 2026-03-08 20:19:31 +08:00			`async def _generate_title(self, state: TitleMiddlewareState) -> str:`
feat: add AIO sandbox provider and auto title generation (#1) - Add AioSandboxProvider for Docker-based sandbox execution with configurable container lifecycle, volume mounts, and port management - Add TitleMiddleware to auto-generate thread titles after first user-assistant exchange using LLM - Add Claude Code documentation (CLAUDE.md, AGENTS.md) - Extend SandboxConfig with Docker-specific options (image, port, mounts) - Fix hardcoded mount path to use expanduser - Add agent-sandbox and dotenv dependencies Co-authored-by: Claude Opus 4.5 <noreply@anthropic.com> 2026-01-14 23:29:18 +08:00			`"""Generate a concise title based on the conversation."""`
			`config = get_title_config()`
			`messages = state.get("messages", [])`

			`# Get first user message and first assistant response`
			`user_msg_content = next((m.content for m in messages if m.type == "human"), "")`
			`assistant_msg_content = next((m.content for m in messages if m.type == "ai"), "")`

			`# Ensure content is string (LangChain messages can have list content)`
			`user_msg = str(user_msg_content) if user_msg_content else ""`
			`assistant_msg = str(assistant_msg_content) if assistant_msg_content else ""`

			`# Use a lightweight model to generate title`
			`model = create_chat_model(thinking_enabled=False)`

			`prompt = config.prompt_template.format(`
			`max_words=config.max_words,`
			`user_msg=user_msg[:500],`
			`assistant_msg=assistant_msg[:500],`
			`)`

			`try:`
Enhance chat UI and compatible anthropic thinking messages (#1018) 2026-03-08 20:19:31 +08:00			`response = await model.ainvoke(prompt)`
feat: add AIO sandbox provider and auto title generation (#1) - Add AioSandboxProvider for Docker-based sandbox execution with configurable container lifecycle, volume mounts, and port management - Add TitleMiddleware to auto-generate thread titles after first user-assistant exchange using LLM - Add Claude Code documentation (CLAUDE.md, AGENTS.md) - Extend SandboxConfig with Docker-specific options (image, port, mounts) - Fix hardcoded mount path to use expanduser - Add agent-sandbox and dotenv dependencies Co-authored-by: Claude Opus 4.5 <noreply@anthropic.com> 2026-01-14 23:29:18 +08:00			`# Ensure response content is string`
			`title_content = str(response.content) if response.content else ""`
			`title = title_content.strip().strip('"').strip("'")`
			`# Limit to max characters`
			`return title[: config.max_chars] if len(title) > config.max_chars else title`
			`except Exception as e:`
			`print(f"Failed to generate title: {e}")`
			`# Fallback: use first part of user message (by character count)`
			`fallback_chars = min(config.max_chars, 50) # Use max_chars or 50, whichever is smaller`
			`if len(user_msg) > fallback_chars:`
			`return user_msg[:fallback_chars].rstrip() + "..."`
			`return user_msg if user_msg else "New Conversation"`

			`@override`
Enhance chat UI and compatible anthropic thinking messages (#1018) 2026-03-08 20:19:31 +08:00			`async def aafter_model(self, state: TitleMiddlewareState, runtime: Runtime) -> dict \| None:`
feat: add AIO sandbox provider and auto title generation (#1) - Add AioSandboxProvider for Docker-based sandbox execution with configurable container lifecycle, volume mounts, and port management - Add TitleMiddleware to auto-generate thread titles after first user-assistant exchange using LLM - Add Claude Code documentation (CLAUDE.md, AGENTS.md) - Extend SandboxConfig with Docker-specific options (image, port, mounts) - Fix hardcoded mount path to use expanduser - Add agent-sandbox and dotenv dependencies Co-authored-by: Claude Opus 4.5 <noreply@anthropic.com> 2026-01-14 23:29:18 +08:00			`"""Generate and set thread title after the first agent response."""`
			`if self._should_generate_title(state):`
Enhance chat UI and compatible anthropic thinking messages (#1018) 2026-03-08 20:19:31 +08:00			`title = await self._generate_title(state)`
feat: add AIO sandbox provider and auto title generation (#1) - Add AioSandboxProvider for Docker-based sandbox execution with configurable container lifecycle, volume mounts, and port management - Add TitleMiddleware to auto-generate thread titles after first user-assistant exchange using LLM - Add Claude Code documentation (CLAUDE.md, AGENTS.md) - Extend SandboxConfig with Docker-specific options (image, port, mounts) - Fix hardcoded mount path to use expanduser - Add agent-sandbox and dotenv dependencies Co-authored-by: Claude Opus 4.5 <noreply@anthropic.com> 2026-01-14 23:29:18 +08:00			`print(f"Generated thread title: {title}")`

			`# Store title in state (will be persisted by checkpointer if configured)`
			`return {"title": title}`

			`return None`