feat: support dify in rag module (#550)

Co-authored-by: Willem Jiang <willem.jiang@gmail.com>
This commit is contained in:
Chayton Bai
2025-09-16 20:30:45 +08:00
committed by GitHub
parent 5085bf8ee9
commit 7694bb5d72
19 changed files with 407 additions and 87 deletions

View File

@@ -41,13 +41,18 @@ TAVILY_API_KEY=tvly-xxx
# RAGFLOW_RETRIEVAL_SIZE=10
# RAGFLOW_CROSS_LANGUAGES=English,Chinese,Spanish,French,German,Japanese,Korean # Optional. To use RAGFlow's cross-language search, please separate each language with a single comma
# RAG_PROVIDER=dify
# DIFY_API_URL="https://api.dify.ai/v1"
# DIFY_API_KEY="dataset-xxx"
# MOI is a hybrid database that mainly serves enterprise users (https://www.matrixorigin.io/matrixone-intelligence)
# RAG_PROVIDER=moi
# MOI_API_URL="https://freetier-01.cn-hangzhou.cluster.matrixonecloud.cn"
# MOI_API_URL="https://cluster.matrixonecloud.cn"
# MOI_API_KEY="xxx-xxx-xxx-xxx"
# MOI_RETRIEVAL_SIZE=10
# MOI_LIST_LIMIT=10
# RAG_PROVIDER: milvus (using free milvus instance on zilliz cloud: https://docs.zilliz.com/docs/quick-start )
# RAG_PROVIDER=milvus
# MILVUS_URI=<endpoint_of_self_hosted_milvus_or_zilliz_cloud>

View File

@@ -4,10 +4,11 @@
"""
Server script for running the DeerFlow API.
"""
import os
import asyncio
import argparse
import asyncio
import logging
import os
import signal
import sys

View File

@@ -8,9 +8,9 @@ from typing import Any, Optional
from langchain_core.runnables import RunnableConfig
from src.config.loader import get_bool_env, get_int_env, get_str_env
from src.config.report_style import ReportStyle
from src.rag.retriever import Resource
from src.config.loader import get_str_env, get_int_env, get_bool_env
logger = logging.getLogger(__name__)

View File

@@ -22,6 +22,7 @@ SELECTED_SEARCH_ENGINE = os.getenv("SEARCH_API", SearchEngine.TAVILY.value)
class RAGProvider(enum.Enum):
DIFY = "dify"
RAGFLOW = "ragflow"
VIKINGDB_KNOWLEDGE_BASE = "vikingdb_knowledge_base"
MOI = "moi"

View File

@@ -6,10 +6,12 @@ import logging
import uuid
from datetime import datetime
from typing import List, Optional, Tuple
import psycopg
from langgraph.store.memory import InMemoryStore
from psycopg.rows import dict_row
from pymongo import MongoClient
from langgraph.store.memory import InMemoryStore
from src.config.loader import get_bool_env, get_str_env

View File

@@ -10,7 +10,6 @@ from langchain_core.language_models import BaseChatModel
from langchain_deepseek import ChatDeepSeek
from langchain_google_genai import ChatGoogleGenerativeAI
from langchain_openai import AzureChatOpenAI, ChatOpenAI
from typing import get_args
from src.config import load_yaml_config
from src.config.agents import LLMType

View File

@@ -211,7 +211,6 @@ class ChatDashscope(ChatOpenAI):
and hasattr(response.choices[0], "message")
and hasattr(response.choices[0].message, "reasoning_content")
):
reasoning_content = response.choices[0].message.reasoning_content
if reasoning_content and chat_result.generations:
chat_result.generations[0].message.additional_kwargs[

View File

@@ -2,6 +2,7 @@
# SPDX-License-Identifier: MIT
from .builder import build_retriever
from .dify import DifyProvider
from .ragflow import RAGFlowProvider
from .moi import MOIProvider
from .retriever import Chunk, Document, Resource, Retriever
@@ -11,6 +12,7 @@ __all__ = [
Retriever,
Document,
Resource,
DifyProvider,
RAGFlowProvider,
MOIProvider,
VikingDBKnowledgeBaseProvider,

View File

@@ -2,14 +2,17 @@
# SPDX-License-Identifier: MIT
from src.config.tools import SELECTED_RAG_PROVIDER, RAGProvider
from src.rag.dify import DifyProvider
from src.rag.milvus import MilvusProvider
from src.rag.ragflow import RAGFlowProvider
from src.rag.moi import MOIProvider
from src.rag.retriever import Retriever
from src.rag.vikingdb_knowledge_base import VikingDBKnowledgeBaseProvider
from src.rag.milvus import MilvusProvider
def build_retriever() -> Retriever | None:
if SELECTED_RAG_PROVIDER == RAGProvider.DIFY.value:
return DifyProvider()
if SELECTED_RAG_PROVIDER == RAGProvider.RAGFLOW.value:
return RAGFlowProvider()
elif SELECTED_RAG_PROVIDER == RAGProvider.MOI.value:

132
src/rag/dify.py Normal file
View File

@@ -0,0 +1,132 @@
# Copyright (c) 2025 Bytedance Ltd. and/or its affiliates
# SPDX-License-Identifier: MIT
import os
from urllib.parse import urlparse
import requests
from src.rag.retriever import Chunk, Document, Resource, Retriever
class DifyProvider(Retriever):
    """
    DifyProvider is a provider that uses dify to retrieve documents.

    Configuration comes from the environment:
      * DIFY_API_URL - base URL of the Dify API (e.g. https://api.dify.ai/v1)
      * DIFY_API_KEY - dataset API key ("dataset-...")
    """

    api_url: str
    api_key: str

    def __init__(self):
        """Read the Dify endpoint and credentials from the environment.

        Raises:
            ValueError: if DIFY_API_URL or DIFY_API_KEY is not set.
        """
        api_url = os.getenv("DIFY_API_URL")
        if not api_url:
            raise ValueError("DIFY_API_URL is not set")
        self.api_url = api_url

        api_key = os.getenv("DIFY_API_KEY")
        if not api_key:
            raise ValueError("DIFY_API_KEY is not set")
        self.api_key = api_key

    def query_relevant_documents(
        self, query: str, resources: list[Resource] | None = None
    ) -> list[Document]:
        """Retrieve chunks for *query* from every dataset in *resources*.

        Args:
            query: Natural-language search query.
            resources: Resources whose URIs name the Dify datasets to
                search ("rag://dataset/<id>"). An empty or None value
                short-circuits to an empty result.

        Returns:
            One Document per distinct source document, each carrying the
            matching chunks and their similarity scores.

        Raises:
            Exception: if the Dify API responds with a non-200 status.
        """
        # NOTE: default changed from a mutable `[]` literal to None to avoid
        # the shared-mutable-default pitfall; observable behavior is identical.
        if not resources:
            return []

        headers = {
            "Authorization": f"Bearer {self.api_key}",
            "Content-Type": "application/json",
        }

        # Aggregate chunks by source-document id across all queried datasets.
        all_documents: dict[str, Document] = {}

        for resource in resources:
            dataset_id, _ = parse_uri(resource.uri)

            payload = {
                "query": query,
                "retrieval_model": {
                    "search_method": "hybrid_search",
                    "reranking_enable": False,
                    "weights": {
                        "weight_type": "customized",
                        "keyword_setting": {"keyword_weight": 0.3},
                        "vector_setting": {"vector_weight": 0.7},
                    },
                    "top_k": 3,
                    "score_threshold_enabled": True,
                    "score_threshold": 0.5,
                },
            }

            response = requests.post(
                f"{self.api_url}/datasets/{dataset_id}/retrieve",
                headers=headers,
                json=payload,
            )

            if response.status_code != 200:
                raise Exception(f"Failed to query documents: {response.text}")

            result = response.json()
            # Fixed default: "records" is a list in the API response, not a
            # dict (the original `{}` default only worked by accident because
            # iterating an empty dict yields nothing).
            records = result.get("records", [])
            for record in records:
                segment = record.get("segment")
                if not segment:
                    continue

                document_info = segment.get("document")
                if not document_info:
                    continue

                doc_id = document_info.get("id")
                doc_name = document_info.get("name")
                if not doc_id or not doc_name:
                    continue

                if doc_id not in all_documents:
                    all_documents[doc_id] = Document(
                        id=doc_id, title=doc_name, chunks=[]
                    )

                chunk = Chunk(
                    content=segment.get("content", ""),
                    similarity=record.get("score", 0.0),
                )
                all_documents[doc_id].chunks.append(chunk)

        return list(all_documents.values())

    def list_resources(self, query: str | None = None) -> list[Resource]:
        """List the datasets available through the configured Dify API.

        Args:
            query: Optional keyword used to filter datasets server-side.

        Returns:
            One Resource per dataset, with a "rag://dataset/<id>" URI.

        Raises:
            Exception: if the Dify API responds with a non-200 status.
        """
        headers = {
            "Authorization": f"Bearer {self.api_key}",
            "Content-Type": "application/json",
        }

        params = {}
        if query:
            params["keyword"] = query

        response = requests.get(
            f"{self.api_url}/datasets", headers=headers, params=params
        )

        if response.status_code != 200:
            raise Exception(f"Failed to list resources: {response.text}")

        result = response.json()
        resources = []
        # Loop variable renamed: the original reused `item` for both the raw
        # API record and the Resource built from it (shadowing).
        for dataset in result.get("data", []):
            resources.append(
                Resource(
                    uri=f"rag://dataset/{dataset.get('id')}",
                    title=dataset.get("name", ""),
                    description=dataset.get("description", ""),
                )
            )

        return resources
def parse_uri(uri: str) -> tuple[str, str]:
    """Split a ``rag://dataset/<id>#<doc>`` URI into (dataset_id, document_id).

    Args:
        uri: Resource URI of the form ``rag://dataset/<dataset_id>#<doc_id>``.

    Returns:
        Tuple of (dataset_id, fragment); the fragment is "" when absent.

    Raises:
        ValueError: if the scheme is not ``rag`` or no dataset id is present.
    """
    parsed = urlparse(uri)
    if parsed.scheme != "rag":
        raise ValueError(f"Invalid URI: {uri}")
    segments = parsed.path.split("/")
    # Path looks like "/<dataset_id>"; guard against a missing id so a
    # malformed URI raises ValueError instead of an opaque IndexError.
    if len(segments) < 2 or not segments[1]:
        raise ValueError(f"Invalid URI: {uri}")
    return segments[1], parsed.fragment

View File

@@ -7,11 +7,12 @@ from pathlib import Path
from typing import Any, Dict, Iterable, List, Optional, Sequence, Set
from langchain_milvus.vectorstores import Milvus as LangchainMilvus
from pymilvus import MilvusClient, CollectionSchema, FieldSchema, DataType
from langchain_openai import OpenAIEmbeddings
from openai import OpenAI
from pymilvus import CollectionSchema, DataType, FieldSchema, MilvusClient
from src.config.loader import get_bool_env, get_int_env, get_str_env
from src.rag.retriever import Chunk, Document, Resource, Retriever
from src.config.loader import get_bool_env, get_str_env, get_int_env
logger = logging.getLogger(__name__)
@@ -466,7 +467,7 @@ class MilvusRetriever(Retriever):
resources.append(
Resource(
uri=r.get(self.url_field, "")
or f"milvus://{r.get(self.id_field,'')}",
or f"milvus://{r.get(self.id_field, '')}",
title=r.get(self.title_field, "")
or r.get(self.id_field, "Unnamed"),
description="Stored Milvus document",
@@ -476,21 +477,23 @@ class MilvusRetriever(Retriever):
# Use similarity_search_by_vector for lightweight listing.
# If a query is provided embed it; else use a zero vector.
docs: Iterable[Any] = self.client.similarity_search(
query, k=100, expr="source == 'examples'" # Limit to 100 results
query,
k=100,
expr="source == 'examples'", # Limit to 100 results
)
for d in docs:
meta = getattr(d, "metadata", {}) or {}
# check if the resource is in the list of resources
if resources and any(
r.uri == meta.get(self.url_field, "")
or r.uri == f"milvus://{meta.get(self.id_field,'')}"
or r.uri == f"milvus://{meta.get(self.id_field, '')}"
for r in resources
):
continue
resources.append(
Resource(
uri=meta.get(self.url_field, "")
or f"milvus://{meta.get(self.id_field,'')}",
or f"milvus://{meta.get(self.id_field, '')}",
title=meta.get(self.title_field, "")
or meta.get(self.id_field, "Unnamed"),
description="Stored Milvus document",

View File

@@ -11,10 +11,10 @@ from fastapi import FastAPI, HTTPException, Query
from fastapi.middleware.cors import CORSMiddleware
from fastapi.responses import Response, StreamingResponse
from langchain_core.messages import AIMessageChunk, BaseMessage, ToolMessage
from langgraph.types import Command
from langgraph.store.memory import InMemoryStore
from langgraph.checkpoint.mongodb import AsyncMongoDBSaver
from langgraph.checkpoint.postgres.aio import AsyncPostgresSaver
from langgraph.store.memory import InMemoryStore
from langgraph.types import Command
from psycopg_pool import AsyncConnectionPool
from src.config.configuration import get_recursion_limit
@@ -22,6 +22,7 @@ from src.config.loader import get_bool_env, get_str_env
from src.config.report_style import ReportStyle
from src.config.tools import SELECTED_RAG_PROVIDER
from src.graph.builder import build_graph_with_memory
from src.graph.checkpoint import chat_stream_message
from src.llms.llm import get_configured_llm_models
from src.podcast.graph.builder import build_graph as build_podcast_graph
from src.ppt.graph.builder import build_graph as build_ppt_graph
@@ -47,7 +48,6 @@ from src.server.rag_request import (
RAGResourcesResponse,
)
from src.tools import VolcengineTTS
from src.graph.checkpoint import chat_stream_message
from src.utils.json_utils import sanitize_args
logger = logging.getLogger(__name__)

View File

@@ -97,7 +97,8 @@ async def load_mcp_tools(
)
return await _get_tools_from_client_session(
sse_client(url=url, headers=headers, timeout=timeout_seconds), timeout_seconds
sse_client(url=url, headers=headers, timeout=timeout_seconds),
timeout_seconds,
)
elif server_type == "streamable_http":
@@ -107,7 +108,10 @@ async def load_mcp_tools(
)
return await _get_tools_from_client_session(
streamablehttp_client(url=url, headers=headers, timeout=timeout_seconds), timeout_seconds,
streamablehttp_client(
url=url, headers=headers, timeout=timeout_seconds
),
timeout_seconds,
)
else:

View File

@@ -4,6 +4,7 @@
import json
import logging
from typing import Any
import json_repair
logger = logging.getLogger(__name__)

View File

@@ -1,81 +1,85 @@
# Copyright (c) 2025 Bytedance Ltd. and/or its affiliates
# SPDX-License-Identifier: MIT
import pytest
import tempfile
import shutil
import tempfile
from pathlib import Path
from typing import Any, Dict, Optional
from unittest.mock import MagicMock, patch
from typing import Dict, Any, Optional
import psycopg
import pytest
class PostgreSQLMockInstance:
"""Utility class for managing PostgreSQL mock instances."""
def __init__(self, database_name: str = "test_db"):
self.database_name = database_name
self.temp_dir: Optional[Path] = None
self.mock_connection: Optional[MagicMock] = None
self.mock_data: Dict[str, Any] = {}
self._setup_mock_data()
def _setup_mock_data(self):
"""Initialize mock data storage."""
self.mock_data = {
"chat_streams": {}, # thread_id -> record
"table_exists": False,
"connection_active": True
"connection_active": True,
}
def connect(self) -> MagicMock:
"""Create a mock PostgreSQL connection."""
self.mock_connection = MagicMock()
self._setup_mock_methods()
return self.mock_connection
def _setup_mock_methods(self):
"""Setup mock methods for PostgreSQL operations."""
if not self.mock_connection:
return
# Mock cursor context manager
mock_cursor = MagicMock()
mock_cursor.__enter__ = MagicMock(return_value=mock_cursor)
mock_cursor.__exit__ = MagicMock(return_value=False)
# Setup cursor operations
mock_cursor.execute = MagicMock(side_effect=self._mock_execute)
mock_cursor.fetchone = MagicMock(side_effect=self._mock_fetchone)
mock_cursor.rowcount = 0
# Setup connection operations
self.mock_connection.cursor = MagicMock(return_value=mock_cursor)
self.mock_connection.commit = MagicMock()
self.mock_connection.rollback = MagicMock()
self.mock_connection.close = MagicMock()
# Store cursor for external access
self._mock_cursor = mock_cursor
def _mock_execute(self, sql: str, params=None):
"""Mock SQL execution."""
sql_upper = sql.upper().strip()
if "CREATE TABLE" in sql_upper:
self.mock_data["table_exists"] = True
self._mock_cursor.rowcount = 0
elif "SELECT" in sql_upper and "chat_streams" in sql_upper:
# Mock SELECT query
if params and len(params) > 0:
thread_id = params[0]
if thread_id in self.mock_data["chat_streams"]:
self._mock_cursor._fetch_result = self.mock_data["chat_streams"][thread_id]
self._mock_cursor._fetch_result = self.mock_data["chat_streams"][
thread_id
]
else:
self._mock_cursor._fetch_result = None
else:
self._mock_cursor._fetch_result = None
elif "UPDATE" in sql_upper and "chat_streams" in sql_upper:
# Mock UPDATE query
if params and len(params) >= 2:
@@ -84,12 +88,12 @@ class PostgreSQLMockInstance:
self.mock_data["chat_streams"][thread_id] = {
"id": thread_id,
"thread_id": thread_id,
"messages": messages
"messages": messages,
}
self._mock_cursor.rowcount = 1
else:
self._mock_cursor.rowcount = 0
elif "INSERT" in sql_upper and "chat_streams" in sql_upper:
# Mock INSERT query
if params and len(params) >= 2:
@@ -97,30 +101,30 @@ class PostgreSQLMockInstance:
self.mock_data["chat_streams"][thread_id] = {
"id": thread_id,
"thread_id": thread_id,
"messages": messages
"messages": messages,
}
self._mock_cursor.rowcount = 1
def _mock_fetchone(self):
"""Mock fetchone operation."""
return getattr(self._mock_cursor, '_fetch_result', None)
return getattr(self._mock_cursor, "_fetch_result", None)
def disconnect(self):
"""Cleanup mock connection."""
if self.mock_connection:
self.mock_connection.close()
self._setup_mock_data() # Reset data
def reset_data(self):
"""Reset all mock data."""
self._setup_mock_data()
def get_table_count(self, table_name: str) -> int:
"""Get record count in a table."""
if table_name == "chat_streams":
return len(self.mock_data["chat_streams"])
return 0
def create_test_data(self, table_name: str, records: list):
"""Insert test data into a table."""
if table_name == "chat_streams":
@@ -129,6 +133,7 @@ class PostgreSQLMockInstance:
if thread_id:
self.mock_data["chat_streams"][thread_id] = record
@pytest.fixture
def mock_postgresql():
"""Create a PostgreSQL mock instance."""
@@ -137,6 +142,7 @@ def mock_postgresql():
yield instance
instance.disconnect()
@pytest.fixture
def clean_mock_postgresql():
"""Create a clean PostgreSQL mock instance that resets between tests."""
@@ -144,4 +150,4 @@ def clean_mock_postgresql():
instance.connect()
instance.reset_data()
yield instance
instance.disconnect()
instance.disconnect()

View File

@@ -2,15 +2,18 @@
# SPDX-License-Identifier: MIT
import os
import pytest
from unittest.mock import MagicMock, patch
import mongomock
from unittest.mock import patch, MagicMock
import src.graph.checkpoint as checkpoint
import pytest
from postgres_mock_utils import PostgreSQLMockInstance
import src.graph.checkpoint as checkpoint
POSTGRES_URL = "postgresql://postgres:postgres@localhost:5432/checkpointing_db"
MONGO_URL = "mongodb://admin:admin@localhost:27017/checkpointing_db?authSource=admin"
def has_real_db_connection():
# Check the environment if the MongoDB server is available
enabled = os.getenv("DB_TESTS_ENABLED", "false")
@@ -18,27 +21,28 @@ def has_real_db_connection():
return True
return False
def test_with_local_postgres_db():
"""Ensure the ChatStreamManager can be initialized with a local PostgreSQL DB."""
with patch('psycopg.connect') as mock_connect:
with patch("psycopg.connect") as mock_connect:
# Setup mock PostgreSQL connection
pg_mock = PostgreSQLMockInstance()
mock_connect.return_value = pg_mock.connect()
manager = checkpoint.ChatStreamManager(
checkpoint_saver=True,
db_uri=POSTGRES_URL,
)
)
assert manager.postgres_conn is not None
assert manager.mongo_client is None
def test_with_local_mongo_db():
"""Ensure the ChatStreamManager can be initialized with a local MongoDB."""
with patch('src.graph.checkpoint.MongoClient') as mock_mongo_client:
with patch("src.graph.checkpoint.MongoClient") as mock_mongo_client:
# Setup mongomock
mock_client = mongomock.MongoClient()
mock_mongo_client.return_value = mock_client
manager = checkpoint.ChatStreamManager(
checkpoint_saver=True,
db_uri=MONGO_URL,
@@ -80,7 +84,7 @@ def test_process_stream_partial_buffer_postgres(monkeypatch):
def test_process_stream_partial_buffer_mongo():
"""Partial chunks should be buffered; Use mongomock instead of real MongoDB."""
with patch('src.graph.checkpoint.MongoClient') as mock_mongo_client:
with patch("src.graph.checkpoint.MongoClient") as mock_mongo_client:
# Setup mongomock
mock_client = mongomock.MongoClient()
mock_mongo_client.return_value = mock_client
@@ -96,7 +100,10 @@ def test_process_stream_partial_buffer_mongo():
values = [it.dict()["value"] for it in items]
assert "hello" in values
@pytest.mark.skipif(not has_real_db_connection(), reason="PostgreSQL Server is not available")
@pytest.mark.skipif(
not has_real_db_connection(), reason="PostgreSQL Server is not available"
)
def test_persist_postgresql_local_db():
"""Ensure that the ChatStreamManager can persist to a local PostgreSQL DB."""
manager = checkpoint.ChatStreamManager(
@@ -116,7 +123,9 @@ def test_persist_postgresql_local_db():
assert result is True
@pytest.mark.skipif(not has_real_db_connection(), reason="PostgreSQL Server is not available")
@pytest.mark.skipif(
not has_real_db_connection(), reason="PostgreSQL Server is not available"
)
def test_persist_postgresql_called_with_aggregated_chunks():
"""On 'stop', aggregated chunks should be passed to PostgreSQL persist method."""
manager = checkpoint.ChatStreamManager(
@@ -151,40 +160,42 @@ def test_persist_not_attempted_when_saver_disabled():
def test_persist_mongodb_local_db():
"""Ensure that the ChatStreamManager can persist to a mocked MongoDB."""
with patch('src.graph.checkpoint.MongoClient') as mock_mongo_client:
with patch("src.graph.checkpoint.MongoClient") as mock_mongo_client:
# Setup mongomock
mock_client = mongomock.MongoClient()
mock_mongo_client.return_value = mock_client
manager = checkpoint.ChatStreamManager(
checkpoint_saver=True,
db_uri=MONGO_URL,
)
assert manager.mongo_db is not None
assert manager.postgres_conn is None
# Simulate a message to persist
thread_id = "test_thread"
messages = ["This is a test message."]
result = manager._persist_to_mongodb(thread_id, messages)
assert result is True
# Verify data was persisted in mock
collection = manager.mongo_db.chat_streams
doc = collection.find_one({"thread_id": thread_id})
assert doc is not None
assert doc["messages"] == messages
# Simulate a message with existing thread
result = manager._persist_to_mongodb(thread_id, ["Another message."])
assert result is True
# Verify update worked
doc = collection.find_one({"thread_id": thread_id})
assert doc["messages"] == ["Another message."]
@pytest.mark.skipif(not has_real_db_connection(), reason="MongoDB server is not available")
@pytest.mark.skipif(
not has_real_db_connection(), reason="MongoDB server is not available"
)
def test_persist_mongodb_called_with_aggregated_chunks():
"""On 'stop', aggregated chunks should be passed to MongoDB persist method."""
@@ -239,11 +250,11 @@ def test_unsupported_db_uri_scheme():
def test_process_stream_with_interrupt_finish_reason():
"""Test that 'interrupt' finish_reason triggers persistence like 'stop'."""
with patch('src.graph.checkpoint.MongoClient') as mock_mongo_client:
with patch("src.graph.checkpoint.MongoClient") as mock_mongo_client:
# Setup mongomock
mock_client = mongomock.MongoClient()
mock_mongo_client.return_value = mock_client
manager = checkpoint.ChatStreamManager(
checkpoint_saver=True,
db_uri=MONGO_URL,
@@ -263,7 +274,7 @@ def test_process_stream_with_interrupt_finish_reason():
)
is True
)
# Verify persistence occurred
collection = manager.mongo_db.chat_streams
doc = collection.find_one({"thread_id": "int_test"})
@@ -395,7 +406,7 @@ def test_multiple_threads_isolation():
def test_mongodb_insert_and_update_paths():
"""Exercise MongoDB insert, update, and exception branches using mongomock."""
with patch('src.graph.checkpoint.MongoClient') as mock_mongo_client:
with patch("src.graph.checkpoint.MongoClient") as mock_mongo_client:
# Setup mongomock
mock_client = mongomock.MongoClient()
mock_mongo_client.return_value = mock_client
@@ -404,7 +415,7 @@ def test_mongodb_insert_and_update_paths():
# Insert success (new thread)
assert manager._persist_to_mongodb("th1", ["message1"]) is True
# Verify insert worked
collection = manager.mongo_db.chat_streams
doc = collection.find_one({"thread_id": "th1"})
@@ -413,7 +424,7 @@ def test_mongodb_insert_and_update_paths():
# Update success (existing thread)
assert manager._persist_to_mongodb("th1", ["message2"]) is True
# Verify update worked
doc = collection.find_one({"thread_id": "th1"})
assert doc["messages"] == ["message2"]
@@ -421,9 +432,9 @@ def test_mongodb_insert_and_update_paths():
# Test error case by mocking collection methods
original_find_one = collection.find_one
collection.find_one = MagicMock(side_effect=RuntimeError("Database error"))
assert manager._persist_to_mongodb("th2", ["message"]) is False
# Restore original method
collection.find_one = original_find_one
@@ -591,19 +602,19 @@ def test_context_manager_calls_close(monkeypatch):
def test_init_mongodb_success_and_failure(monkeypatch):
"""MongoDB init should succeed with mongomock and fail gracefully with errors."""
# Success path with mongomock
with patch('src.graph.checkpoint.MongoClient') as mock_mongo_client:
with patch("src.graph.checkpoint.MongoClient") as mock_mongo_client:
mock_client = mongomock.MongoClient()
mock_mongo_client.return_value = mock_client
manager = checkpoint.ChatStreamManager(checkpoint_saver=True, db_uri=MONGO_URL)
assert manager.mongo_db is not None
# Failure path
with patch('src.graph.checkpoint.MongoClient') as mock_mongo_client:
with patch("src.graph.checkpoint.MongoClient") as mock_mongo_client:
mock_mongo_client.side_effect = RuntimeError("Connection failed")
manager = checkpoint.ChatStreamManager(checkpoint_saver=True, db_uri=MONGO_URL)
# Should have no mongo_db set on failure
assert getattr(manager, "mongo_db", None) is None

View File

@@ -2,23 +2,21 @@
# SPDX-License-Identifier: MIT
import pytest
from langchain_core.messages import (
AIMessageChunk,
ChatMessageChunk,
FunctionMessageChunk,
HumanMessageChunk,
SystemMessageChunk,
FunctionMessageChunk,
ToolMessageChunk,
)
from src.llms import llm as llm_module
from langchain_core.messages import ChatMessageChunk
from src.llms.providers import dashscope as dashscope_module
from src.llms.providers.dashscope import (
ChatDashscope,
_convert_delta_to_message_chunk,
_convert_chunk_to_generation_chunk,
_convert_delta_to_message_chunk,
)

154
tests/unit/rag/test_dify.py Normal file
View File

@@ -0,0 +1,154 @@
# Copyright (c) 2025 Bytedance Ltd. and/or its affiliates
# SPDX-License-Identifier: MIT
from unittest.mock import MagicMock, patch
import pytest
from src.rag.dify import DifyProvider, parse_uri
# Dummy classes to mock dependencies
class DummyResource:
    """Minimal stand-in for the rag Resource class used by these tests."""

    def __init__(self, uri, title="", description=""):
        self.uri, self.title, self.description = uri, title, description
class DummyChunk:
    """Minimal stand-in for the rag Chunk class used by these tests."""

    def __init__(self, content, similarity):
        self.content, self.similarity = content, similarity
class DummyDocument:
    """Minimal stand-in for the rag Document class used by these tests."""

    def __init__(self, id, title, chunks=None):
        self.id = id
        self.title = title
        # Falsy chunks (None or []) become a fresh empty list, matching the
        # original `chunks or []` semantics.
        self.chunks = chunks if chunks else []
# Patch imports in dify.py to use dummy classes
@pytest.fixture(autouse=True)
def patch_imports(monkeypatch):
    """Swap the rag data classes inside src.rag.dify for lightweight dummies.

    Fixed to use monkeypatch.setattr so the real classes are restored after
    each test; the previous direct attribute assignment leaked the dummy
    classes into every later test that imported src.rag.dify.
    """
    import src.rag.dify as dify

    monkeypatch.setattr(dify, "Resource", DummyResource)
    monkeypatch.setattr(dify, "Chunk", DummyChunk)
    monkeypatch.setattr(dify, "Document", DummyDocument)
    yield
def test_parse_uri_valid():
    """A well-formed rag:// URI yields its dataset id and fragment."""
    dataset_id, document_id = parse_uri("rag://dataset/123#abc")
    assert (dataset_id, document_id) == ("123", "abc")
def test_parse_uri_invalid():
    """URIs with a non-rag scheme are rejected with ValueError."""
    bad_uri = "http://dataset/123#abc"
    with pytest.raises(ValueError):
        parse_uri(bad_uri)
def test_init_env_vars(monkeypatch):
    """The provider reads its endpoint and key from the environment."""
    monkeypatch.setenv("DIFY_API_KEY", "key")
    monkeypatch.setenv("DIFY_API_URL", "http://api")

    dify = DifyProvider()

    assert dify.api_url == "http://api"
    assert dify.api_key == "key"
def test_init_missing_env(monkeypatch):
    """Construction fails fast when either environment variable is absent."""
    # Missing URL, key present.
    monkeypatch.delenv("DIFY_API_URL", raising=False)
    monkeypatch.setenv("DIFY_API_KEY", "key")
    with pytest.raises(ValueError):
        DifyProvider()

    # URL present, missing key.
    monkeypatch.setenv("DIFY_API_URL", "http://api")
    monkeypatch.delenv("DIFY_API_KEY", raising=False)
    with pytest.raises(ValueError):
        DifyProvider()
@patch("src.rag.dify.requests.post")
def test_query_relevant_documents_success(mock_post, monkeypatch):
    """A 200 retrieval response is folded into Document/Chunk objects."""
    monkeypatch.setenv("DIFY_API_URL", "http://api")
    monkeypatch.setenv("DIFY_API_KEY", "key")

    api_payload = {
        "records": [
            {
                "segment": {
                    "content": "chunk text",
                    "document": {
                        "id": "doc456",
                        "name": "Doc Title",
                    },
                },
                "score": 0.9,
            }
        ]
    }
    response = MagicMock(status_code=200)
    response.json.return_value = api_payload
    mock_post.return_value = response

    provider = DifyProvider()
    docs = provider.query_relevant_documents(
        "query", [DummyResource("rag://dataset/123#doc456")]
    )

    assert len(docs) == 1
    doc = docs[0]
    assert (doc.id, doc.title) == ("doc456", "Doc Title")
    assert len(doc.chunks) == 1
    assert (doc.chunks[0].content, doc.chunks[0].similarity) == ("chunk text", 0.9)
@patch("src.rag.dify.requests.post")
def test_query_relevant_documents_error(mock_post, monkeypatch):
    """A non-200 retrieval response surfaces as an exception."""
    monkeypatch.setenv("DIFY_API_URL", "http://api")
    monkeypatch.setenv("DIFY_API_KEY", "key")

    failure = MagicMock(status_code=400, text="error")
    mock_post.return_value = failure

    provider = DifyProvider()
    with pytest.raises(Exception):
        provider.query_relevant_documents(
            "query", [DummyResource("rag://dataset/123#doc456")]
        )
@patch("src.rag.dify.requests.get")
def test_list_resources_success(mock_get, monkeypatch):
    """Datasets from the API are mapped to rag:// Resource entries."""
    monkeypatch.setenv("DIFY_API_URL", "http://api")
    monkeypatch.setenv("DIFY_API_KEY", "key")

    response = MagicMock(status_code=200)
    response.json.return_value = {
        "data": [
            {"id": "123", "name": "Dataset1", "description": "desc1"},
            {"id": "456", "name": "Dataset2", "description": "desc2"},
        ]
    }
    mock_get.return_value = response

    resources = DifyProvider().list_resources()

    assert len(resources) == 2
    expected = [
        ("rag://dataset/123", "Dataset1", "desc1"),
        ("rag://dataset/456", "Dataset2", "desc2"),
    ]
    for resource, (uri, title, description) in zip(resources, expected):
        assert resource.uri == uri
        assert resource.title == title
        assert resource.description == description
@patch("src.rag.dify.requests.get")
def test_list_resources_error(mock_get, monkeypatch):
    """A non-200 listing response surfaces as an exception."""
    monkeypatch.setenv("DIFY_API_URL", "http://api")
    monkeypatch.setenv("DIFY_API_KEY", "key")

    failure = MagicMock(status_code=500, text="fail")
    mock_get.return_value = failure

    with pytest.raises(Exception):
        DifyProvider().list_resources()

View File

@@ -2,9 +2,11 @@
# SPDX-License-Identifier: MIT
from __future__ import annotations
from uuid import uuid4
from types import SimpleNamespace
from pathlib import Path
from types import SimpleNamespace
from uuid import uuid4
import pytest
import src.rag.milvus as milvus_mod
@@ -13,7 +15,6 @@ from src.rag.retriever import Resource
class DummyEmbedding:
def __init__(self, **kwargs):
self.kwargs = kwargs
@@ -369,9 +370,7 @@ def test_create_collection_lite(monkeypatch):
def list_collections(self): # noqa: D401
return [] # empty triggers creation
def create_collection(
self, collection_name, schema, index_params
): # noqa: D401
def create_collection(self, collection_name, schema, index_params): # noqa: D401
created["name"] = collection_name
created["schema"] = schema
created["index"] = index_params