# src/llms/llm.py

# Copyright (c) 2025 Bytedance Ltd. and/or its affiliates
# SPDX-License-Identifier: MIT

from pathlib import Path
from typing import Any, Dict
import os
import ssl
import httpx

from langchain_openai import ChatOpenAI
from langchain_deepseek import ChatDeepSeek
from typing import get_args

from src.config import load_yaml_config
from src.config.agents import LLMType

# Cache of constructed LLM clients keyed by LLM type. It is filled by
# get_llm_by_type(), which returns the stored instance on later calls.
# Values may be ChatDeepSeek as well as ChatOpenAI (the "reasoning" type).
_llm_cache: dict[LLMType, ChatOpenAI | ChatDeepSeek] = {}


def _get_config_file_path() -> str:
    """Return the resolved path of ``conf.yaml`` as a string.

    The file is located three parent levels above this module's own path.
    """
    directory = Path(__file__)
    # Climb three levels: module file -> its directory -> two more parents.
    for _ in range(3):
        directory = directory.parent
    config_file = directory / "conf.yaml"
    return str(config_file.resolve())


def _get_llm_type_config_keys() -> dict[str, str]:
    """Return a fresh mapping from LLM type name to its configuration key."""
    type_key_pairs = (
        ("reasoning", "REASONING_MODEL"),
        ("basic", "BASIC_MODEL"),
        ("vision", "VISION_MODEL"),
    )
    return dict(type_key_pairs)


def _get_env_llm_conf(llm_type: str) -> Dict[str, Any]:
    """
    Collect the settings for one LLM type from environment variables.

    Variables are selected by the prefix ``{LLM_TYPE}_MODEL__``, where
    ``{LLM_TYPE}`` is ``llm_type`` upper-cased, e.g. ``BASIC_MODEL__api_key``
    and ``BASIC_MODEL__base_url`` for ``llm_type="basic"``. The prefix is
    stripped and the remainder lower-cased to form the setting name.

    Args:
        llm_type: LLM type name such as ``"basic"``.

    Returns:
        Mapping of lower-cased setting name to the raw environment value
        (always a string); empty when no variable carries the prefix.
    """
    env_prefix = f"{llm_type.upper()}_MODEL__"
    prefix_len = len(env_prefix)
    return {
        name[prefix_len:].lower(): raw_value
        for name, raw_value in os.environ.items()
        if name.startswith(env_prefix)
    }


def _create_llm_use_conf(
    llm_type: LLMType, conf: Dict[str, Any]
) -> ChatOpenAI | ChatDeepSeek:
    """Create an LLM client for ``llm_type`` from YAML and environment settings.

    The section of ``conf`` for this type (e.g. ``BASIC_MODEL``) is merged
    with the matching environment variables, with environment values taking
    precedence. The merged mapping is passed as keyword arguments to
    ``ChatDeepSeek`` for the ``"reasoning"`` type and to ``ChatOpenAI`` for
    every other type.

    Two settings are handled specially:

    * ``base_url`` is renamed to ``api_base`` for the ``"reasoning"`` type.
    * ``verify_ssl`` is consumed here; when it is false, custom ``httpx``
      clients with certificate verification disabled are supplied.

    Args:
        llm_type: LLM type name; must be a key of
            ``_get_llm_type_config_keys()``.
        conf: Parsed configuration keyed by section name.

    Returns:
        A newly constructed chat model instance.

    Raises:
        ValueError: If ``llm_type`` is unknown, its section in ``conf`` is
            neither a mapping nor ``None``, or no settings are found in
            either source.
    """
    config_key = _get_llm_type_config_keys().get(llm_type)
    if not config_key:
        raise ValueError(f"Unknown LLM type: {llm_type}")

    llm_conf = conf.get(config_key)
    if llm_conf is None:
        # A key whose value is None (typically an empty YAML section) is
        # treated like a missing section so environment variables alone can
        # still configure this type.
        llm_conf = {}
    if not isinstance(llm_conf, dict):
        raise ValueError(f"Invalid LLM configuration for {llm_type}: {llm_conf}")

    # Get configuration from environment variables
    env_conf = _get_env_llm_conf(llm_type)

    # Merge configurations, with environment variables taking precedence
    merged_conf = {**llm_conf, **env_conf}

    if not merged_conf:
        raise ValueError(f"No configuration found for LLM type: {llm_type}")

    if llm_type == "reasoning" and "base_url" in merged_conf:
        # Rename only when base_url was actually supplied: otherwise an
        # explicit api_base would be overwritten and api_base=None would be
        # passed to the client instead of leaving it unset.
        merged_conf["api_base"] = merged_conf.pop("base_url")

    # Handle SSL verification settings
    verify_ssl = merged_conf.pop("verify_ssl", True)
    if isinstance(verify_ssl, str):
        # Environment variables are always strings, so "false" would be
        # truthy; interpret the common spellings of "off" explicitly.
        verify_ssl = verify_ssl.strip().lower() not in ("", "0", "false", "no", "off")

    # Create custom HTTP clients if SSL verification is disabled
    if not verify_ssl:
        merged_conf["http_client"] = httpx.Client(verify=False)
        merged_conf["http_async_client"] = httpx.AsyncClient(verify=False)

    llm_class = ChatDeepSeek if llm_type == "reasoning" else ChatOpenAI
    return llm_class(**merged_conf)


def get_llm_by_type(
    llm_type: LLMType,
) -> ChatOpenAI | ChatDeepSeek:
    """
    Get the LLM instance for ``llm_type``, creating and caching it on first use.

    Args:
        llm_type: LLM type name to look up.

    Returns:
        The cached instance if one exists for ``llm_type``; otherwise a new
        instance built from the YAML configuration file and environment
        variables. This is a ``ChatDeepSeek`` for the ``"reasoning"`` type
        and a ``ChatOpenAI`` for the others.

    Raises:
        ValueError: Propagated from ``_create_llm_use_conf`` when the type is
            unknown or has no usable configuration. Nothing is cached in
            that case.
    """
    if llm_type in _llm_cache:
        return _llm_cache[llm_type]

    # The configuration file is only read on a cache miss.
    conf = load_yaml_config(_get_config_file_path())
    llm = _create_llm_use_conf(llm_type, conf)
    _llm_cache[llm_type] = llm
    return llm


def get_configured_llm_models() -> dict[str, list[str]]:
    """
    Get all configured LLM models grouped by type.

    For every LLM type in ``LLMType``, the YAML section and the matching
    environment variables are merged (environment values take precedence)
    and the ``model`` setting, if non-empty, is reported.

    Returns:
        Dictionary mapping LLM type to list of configured model names.
        Types without a ``model`` setting are omitted. An empty dictionary
        is returned if loading the configuration fails.
    """
    try:
        conf = load_yaml_config(_get_config_file_path())
        llm_type_config_keys = _get_llm_type_config_keys()

        configured_models: dict[str, list[str]] = {}

        for llm_type in get_args(LLMType):
            # Get configuration from YAML file
            config_key = llm_type_config_keys.get(llm_type, "")
            yaml_conf = conf.get(config_key, {}) if config_key else {}
            if not isinstance(yaml_conf, dict):
                # A section that is not a mapping (e.g. an empty YAML section
                # parsed as None) cannot be unpacked below. Ignore just that
                # section instead of failing the whole listing.
                yaml_conf = {}

            # Get configuration from environment variables
            env_conf = _get_env_llm_conf(llm_type)

            # Merge configurations, with environment variables taking precedence
            merged_conf = {**yaml_conf, **env_conf}

            # Check if model is configured
            model_name = merged_conf.get("model")
            if model_name:
                configured_models.setdefault(llm_type, []).append(model_name)

        return configured_models

    except Exception as e:
        # Deliberate best-effort: report the problem and return an empty dict
        # to avoid breaking the application.
        print(f"Warning: Failed to load LLM configuration: {e}")
        return {}


# In the future, we will use reasoning_llm and vl_llm for different purposes
# reasoning_llm = get_llm_by_type("reasoning")
# vl_llm = get_llm_by_type("vision")
chore: add license headers 2025-04-17 11:34:42 +08:00			`# Copyright (c) 2025 Bytedance Ltd. and/or its affiliates`
			`# SPDX-License-Identifier: MIT`

feat: remove `reasoning_llm` and `vl_llm` for now 2025-05-07 17:23:25 +08:00			`from pathlib import Path`
			`from typing import Any, Dict`
feat: support llm env in env file (#251) 2025-05-28 01:21:40 -07:00			`import os`
Add support for self-signed certs from model providers (#276) * Add support for self-signed certs from model providers * cleanup --------- Co-authored-by: tonydoesathing <tmastromarino@cpacket.com> Co-authored-by: Willem Jiang <willem.jiang@gmail.com> 2025-06-25 19:17:26 -07:00			`import ssl`
			`import httpx`
feat: remove `reasoning_llm` and `vl_llm` for now 2025-05-07 17:23:25 +08:00
feat: lite deep researcher implementation 2025-04-07 16:25:55 +08:00			`from langchain_openai import ChatOpenAI`
feat: add deep think feature (#311) * feat: implement backend logic * feat: implement api/config endpoint * rename the symbol * feat: re-implement configuration at client-side * feat: add client-side of deep thinking * fix backend bug * feat: add reasoning block * docs: update readme * fix: translate into English * fix: change icon to lightbulb * feat: ignore more bad cases * feat: adjust thinking layout, and implement auto scrolling * docs: add comments --------- Co-authored-by: Henry Li <henry1943@163.com> 2025-06-14 13:12:43 +08:00			`from langchain_deepseek import ChatDeepSeek`
			`from typing import get_args`
feat: remove `reasoning_llm` and `vl_llm` for now 2025-05-07 17:23:25 +08:00
feat: lite deep researcher implementation 2025-04-07 16:25:55 +08:00			`from src.config import load_yaml_config`
			`from src.config.agents import LLMType`

			`# Cache for LLM instances`
			`_llm_cache: dict[LLMType, ChatOpenAI] = {}`


feat: add deep think feature (#311) * feat: implement backend logic * feat: implement api/config endpoint * rename the symbol * feat: re-implement configuration at client-side * feat: add client-side of deep thinking * fix backend bug * feat: add reasoning block * docs: update readme * fix: translate into English * fix: change icon to lightbulb * feat: ignore more bad cases * feat: adjust thinking layout, and implement auto scrolling * docs: add comments --------- Co-authored-by: Henry Li <henry1943@163.com> 2025-06-14 13:12:43 +08:00			`def _get_config_file_path() -> str:`
			`"""Get the path to the configuration file."""`
			`return str((Path(__file__).parent.parent.parent / "conf.yaml").resolve())`


			`def _get_llm_type_config_keys() -> dict[str, str]:`
			`"""Get mapping of LLM types to their configuration keys."""`
			`return {`
			`"reasoning": "REASONING_MODEL",`
			`"basic": "BASIC_MODEL",`
			`"vision": "VISION_MODEL",`
			`}`


feat: support llm env in env file (#251) 2025-05-28 01:21:40 -07:00			`def _get_env_llm_conf(llm_type: str) -> Dict[str, Any]:`
			`"""`
			`Get LLM configuration from environment variables.`
			`Environment variables should follow the format: {LLM_TYPE}__{KEY}`
			`e.g., BASIC_MODEL__api_key, BASIC_MODEL__base_url`
			`"""`
			`prefix = f"{llm_type.upper()}_MODEL__"`
			`conf = {}`
			`for key, value in os.environ.items():`
			`if key.startswith(prefix):`
			`conf_key = key[len(prefix) :].lower()`
			`conf[conf_key] = value`
			`return conf`


feat: add deep think feature (#311) * feat: implement backend logic * feat: implement api/config endpoint * rename the symbol * feat: re-implement configuration at client-side * feat: add client-side of deep thinking * fix backend bug * feat: add reasoning block * docs: update readme * fix: translate into English * fix: change icon to lightbulb * feat: ignore more bad cases * feat: adjust thinking layout, and implement auto scrolling * docs: add comments --------- Co-authored-by: Henry Li <henry1943@163.com> 2025-06-14 13:12:43 +08:00			`def _create_llm_use_conf(`
			`llm_type: LLMType, conf: Dict[str, Any]`
			`) -> ChatOpenAI \| ChatDeepSeek:`
			`"""Create LLM instance using configuration."""`
			`llm_type_config_keys = _get_llm_type_config_keys()`
			`config_key = llm_type_config_keys.get(llm_type)`

			`if not config_key:`
			`raise ValueError(f"Unknown LLM type: {llm_type}")`

			`llm_conf = conf.get(config_key, {})`
feat: lite deep researcher implementation 2025-04-07 16:25:55 +08:00			`if not isinstance(llm_conf, dict):`
feat: add deep think feature (#311) * feat: implement backend logic * feat: implement api/config endpoint * rename the symbol * feat: re-implement configuration at client-side * feat: add client-side of deep thinking * fix backend bug * feat: add reasoning block * docs: update readme * fix: translate into English * fix: change icon to lightbulb * feat: ignore more bad cases * feat: adjust thinking layout, and implement auto scrolling * docs: add comments --------- Co-authored-by: Henry Li <henry1943@163.com> 2025-06-14 13:12:43 +08:00			`raise ValueError(f"Invalid LLM configuration for {llm_type}: {llm_conf}")`

feat: support llm env in env file (#251) 2025-05-28 01:21:40 -07:00			`# Get configuration from environment variables`
			`env_conf = _get_env_llm_conf(llm_type)`

			`# Merge configurations, with environment variables taking precedence`
			`merged_conf = {llm_conf, env_conf}`

			`if not merged_conf:`
feat: add deep think feature (#311) * feat: implement backend logic * feat: implement api/config endpoint * rename the symbol * feat: re-implement configuration at client-side * feat: add client-side of deep thinking * fix backend bug * feat: add reasoning block * docs: update readme * fix: translate into English * fix: change icon to lightbulb * feat: ignore more bad cases * feat: adjust thinking layout, and implement auto scrolling * docs: add comments --------- Co-authored-by: Henry Li <henry1943@163.com> 2025-06-14 13:12:43 +08:00			`raise ValueError(f"No configuration found for LLM type: {llm_type}")`
feat: support llm env in env file (#251) 2025-05-28 01:21:40 -07:00
feat: add deep think feature (#311) * feat: implement backend logic * feat: implement api/config endpoint * rename the symbol * feat: re-implement configuration at client-side * feat: add client-side of deep thinking * fix backend bug * feat: add reasoning block * docs: update readme * fix: translate into English * fix: change icon to lightbulb * feat: ignore more bad cases * feat: adjust thinking layout, and implement auto scrolling * docs: add comments --------- Co-authored-by: Henry Li <henry1943@163.com> 2025-06-14 13:12:43 +08:00			`if llm_type == "reasoning":`
			`merged_conf["api_base"] = merged_conf.pop("base_url", None)`

Add support for self-signed certs from model providers (#276) * Add support for self-signed certs from model providers * cleanup --------- Co-authored-by: tonydoesathing <tmastromarino@cpacket.com> Co-authored-by: Willem Jiang <willem.jiang@gmail.com> 2025-06-25 19:17:26 -07:00			`# Handle SSL verification settings`
			`verify_ssl = merged_conf.pop("verify_ssl", True)`
fix: the lint error of llm.py (#369) 2025-06-26 10:36:26 +08:00
Add support for self-signed certs from model providers (#276) * Add support for self-signed certs from model providers * cleanup --------- Co-authored-by: tonydoesathing <tmastromarino@cpacket.com> Co-authored-by: Willem Jiang <willem.jiang@gmail.com> 2025-06-25 19:17:26 -07:00			`# Create custom HTTP client if SSL verification is disabled`
			`if not verify_ssl:`
			`http_client = httpx.Client(verify=False)`
			`http_async_client = httpx.AsyncClient(verify=False)`
			`merged_conf["http_client"] = http_client`
			`merged_conf["http_async_client"] = http_async_client`

feat: add deep think feature (#311) * feat: implement backend logic * feat: implement api/config endpoint * rename the symbol * feat: re-implement configuration at client-side * feat: add client-side of deep thinking * fix backend bug * feat: add reasoning block * docs: update readme * fix: translate into English * fix: change icon to lightbulb * feat: ignore more bad cases * feat: adjust thinking layout, and implement auto scrolling * docs: add comments --------- Co-authored-by: Henry Li <henry1943@163.com> 2025-06-14 13:12:43 +08:00			`return (`
			`ChatOpenAI(**merged_conf)`
			`if llm_type != "reasoning"`
			`else ChatDeepSeek(**merged_conf)`
			`)`
feat: lite deep researcher implementation 2025-04-07 16:25:55 +08:00

			`def get_llm_by_type(`
			`llm_type: LLMType,`
			`) -> ChatOpenAI:`
			`"""`
			`Get LLM instance by type. Returns cached instance if available.`
			`"""`
			`if llm_type in _llm_cache:`
			`return _llm_cache[llm_type]`

feat: add deep think feature (#311) * feat: implement backend logic * feat: implement api/config endpoint * rename the symbol * feat: re-implement configuration at client-side * feat: add client-side of deep thinking * fix backend bug * feat: add reasoning block * docs: update readme * fix: translate into English * fix: change icon to lightbulb * feat: ignore more bad cases * feat: adjust thinking layout, and implement auto scrolling * docs: add comments --------- Co-authored-by: Henry Li <henry1943@163.com> 2025-06-14 13:12:43 +08:00			`conf = load_yaml_config(_get_config_file_path())`
feat: lite deep researcher implementation 2025-04-07 16:25:55 +08:00			`llm = _create_llm_use_conf(llm_type, conf)`
			`_llm_cache[llm_type] = llm`
			`return llm`


feat: add deep think feature (#311) * feat: implement backend logic * feat: implement api/config endpoint * rename the symbol * feat: re-implement configuration at client-side * feat: add client-side of deep thinking * fix backend bug * feat: add reasoning block * docs: update readme * fix: translate into English * fix: change icon to lightbulb * feat: ignore more bad cases * feat: adjust thinking layout, and implement auto scrolling * docs: add comments --------- Co-authored-by: Henry Li <henry1943@163.com> 2025-06-14 13:12:43 +08:00			`def get_configured_llm_models() -> dict[str, list[str]]:`
			`"""`
			`Get all configured LLM models grouped by type.`

			`Returns:`
			`Dictionary mapping LLM type to list of configured model names.`
			`"""`
			`try:`
			`conf = load_yaml_config(_get_config_file_path())`
			`llm_type_config_keys = _get_llm_type_config_keys()`

			`configured_models: dict[str, list[str]] = {}`

			`for llm_type in get_args(LLMType):`
			`# Get configuration from YAML file`
			`config_key = llm_type_config_keys.get(llm_type, "")`
			`yaml_conf = conf.get(config_key, {}) if config_key else {}`

			`# Get configuration from environment variables`
			`env_conf = _get_env_llm_conf(llm_type)`

			`# Merge configurations, with environment variables taking precedence`
			`merged_conf = {yaml_conf, env_conf}`

			`# Check if model is configured`
			`model_name = merged_conf.get("model")`
			`if model_name:`
			`configured_models.setdefault(llm_type, []).append(model_name)`

			`return configured_models`

			`except Exception as e:`
			`# Log error and return empty dict to avoid breaking the application`
			`print(f"Warning: Failed to load LLM configuration: {e}")`
			`return {}`


feat: remove `reasoning_llm` and `vl_llm` for now 2025-05-07 17:23:25 +08:00			`# In the future, we will use reasoning_llm and vl_llm for different purposes`
			`# reasoning_llm = get_llm_by_type("reasoning")`
			`# vl_llm = get_llm_by_type("vision")`