zhenxun_bot/zhenxun/services/llm/config/generation.py

"""
LLM 生成配置相关类和函数
"""

from typing import Any

from pydantic import BaseModel, Field

from zhenxun.services.log import logger
from zhenxun.utils.pydantic_compat import model_dump

from ..types.enums import ResponseFormat
from ..types.exceptions import LLMErrorCode, LLMException


class ModelConfigOverride(BaseModel):
    """模型配置覆盖参数"""

    temperature: float | None = Field(
        default=None, ge=0.0, le=2.0, description="生成温度"
    )
    max_tokens: int | None = Field(default=None, gt=0, description="最大输出token数")
    top_p: float | None = Field(default=None, ge=0.0, le=1.0, description="核采样参数")
    top_k: int | None = Field(default=None, gt=0, description="Top-K采样参数")
    frequency_penalty: float | None = Field(
        default=None, ge=-2.0, le=2.0, description="频率惩罚"
    )
    presence_penalty: float | None = Field(
        default=None, ge=-2.0, le=2.0, description="存在惩罚"
    )
    repetition_penalty: float | None = Field(
        default=None, ge=0.0, le=2.0, description="重复惩罚"
    )

    stop: list[str] | str | None = Field(default=None, description="停止序列")

    response_format: ResponseFormat | dict[str, Any] | None = Field(
        default=None, description="期望的响应格式"
    )
    response_mime_type: str | None = Field(
        default=None, description="响应MIME类型（Gemini专用）"
    )
    response_schema: dict[str, Any] | None = Field(
        default=None, description="JSON响应模式"
    )
    thinking_budget: float | None = Field(
        default=None, ge=0.0, le=1.0, description="思考预算"
    )
    include_thoughts: bool | None = Field(
        default=None, description="是否在响应中包含思维过程（Gemini专用）"
    )
    safety_settings: dict[str, str] | None = Field(default=None, description="安全设置")
    response_modalities: list[str] | None = Field(
        default=None, description="响应模态类型"
    )

    enable_code_execution: bool | None = Field(
        default=None, description="是否启用代码执行"
    )
    enable_grounding: bool | None = Field(
        default=None, description="是否启用信息来源关联"
    )
    enable_caching: bool | None = Field(default=None, description="是否启用响应缓存")

    custom_params: dict[str, Any] | None = Field(default=None, description="自定义参数")

    def to_dict(self) -> dict[str, Any]:
        """转换为字典，排除None值"""

        model_data = model_dump(self, exclude_none=True)

        result = {}
        for key, value in model_data.items():
            if key == "custom_params" and isinstance(value, dict):
                result.update(value)
            else:
                result[key] = value

        return result

    def merge_with_base_config(
        self,
        base_temperature: float | None = None,
        base_max_tokens: int | None = None,
    ) -> dict[str, Any]:
        """与基础配置合并，覆盖参数优先"""
        merged = {}

        if base_temperature is not None:
            merged["temperature"] = base_temperature
        if base_max_tokens is not None:
            merged["max_tokens"] = base_max_tokens

        override_dict = self.to_dict()
        merged.update(override_dict)

        return merged


class LLMGenerationConfig(ModelConfigOverride):
    """LLM 生成配置，继承模型配置覆盖参数"""

    def to_api_params(self, api_type: str, model_name: str) -> dict[str, Any]:
        """转换为API参数，支持不同API类型的参数名映射"""
        _ = model_name
        params = {}

        if self.temperature is not None:
            params["temperature"] = self.temperature

        if self.max_tokens is not None:
            if api_type == "gemini":
                params["maxOutputTokens"] = self.max_tokens
            else:
                params["max_tokens"] = self.max_tokens

        if api_type == "gemini":
            if self.top_k is not None:
                params["topK"] = self.top_k
            if self.top_p is not None:
                params["topP"] = self.top_p
        else:
            if self.top_k is not None:
                params["top_k"] = self.top_k
            if self.top_p is not None:
                params["top_p"] = self.top_p

        if api_type in ["openai", "deepseek", "zhipu", "general_openai_compat"]:
            if self.frequency_penalty is not None:
                params["frequency_penalty"] = self.frequency_penalty
            if self.presence_penalty is not None:
                params["presence_penalty"] = self.presence_penalty

            if self.repetition_penalty is not None:
                if api_type == "openai":
                    logger.warning("OpenAI官方API不支持repetition_penalty参数，已忽略")
                else:
                    params["repetition_penalty"] = self.repetition_penalty

        if self.response_format is not None:
            if isinstance(self.response_format, dict):
                if api_type in ["openai", "zhipu", "deepseek", "general_openai_compat"]:
                    params["response_format"] = self.response_format
                    logger.debug(
                        f"为 {api_type} 使用自定义 response_format: "
                        f"{self.response_format}"
                    )
            elif self.response_format == ResponseFormat.JSON:
                if api_type in ["openai", "zhipu", "deepseek", "general_openai_compat"]:
                    params["response_format"] = {"type": "json_object"}
                    logger.debug(f"为 {api_type} 启用 JSON 对象输出模式")
                elif api_type == "gemini":
                    params["responseMimeType"] = "application/json"
                    if self.response_schema:
                        params["responseSchema"] = self.response_schema
                    logger.debug(f"为 {api_type} 启用 JSON MIME 类型输出模式")

        if self.custom_params:
            custom_mapped = apply_api_specific_mappings(self.custom_params, api_type)
            params.update(custom_mapped)

        if api_type == "gemini":
            if (
                self.response_format != ResponseFormat.JSON
                and self.response_mime_type is not None
            ):
                params["responseMimeType"] = self.response_mime_type
                logger.debug(
                    f"使用显式设置的 responseMimeType: {self.response_mime_type}"
                )

            if self.response_schema is not None and "responseSchema" not in params:
                params["responseSchema"] = self.response_schema

            if self.thinking_budget is not None or self.include_thoughts is not None:
                thinking_config = params.setdefault("thinkingConfig", {})

                if self.thinking_budget is not None:
                    max_budget = 24576
                    budget_value = int(self.thinking_budget * max_budget)
                    thinking_config["thinkingBudget"] = budget_value
                    logger.debug(
                        f"已将 thinking_budget (float: {self.thinking_budget}) "
                        f"转换为 Gemini API 的整数格式: {budget_value}"
                    )

                if self.include_thoughts is not None:
                    thinking_config["includeThoughts"] = self.include_thoughts
                    logger.debug(f"已设置 includeThoughts: {self.include_thoughts}")

            if self.safety_settings is not None:
                params["safetySettings"] = self.safety_settings
            if self.response_modalities is not None:
                params["responseModalities"] = self.response_modalities

        logger.debug(f"为{api_type}转换配置参数: {len(params)}个参数")
        return params


def validate_override_params(
    override_config: dict[str, Any] | LLMGenerationConfig | None,
) -> LLMGenerationConfig:
    """验证和标准化覆盖参数"""
    if override_config is None:
        return LLMGenerationConfig()

    if isinstance(override_config, dict):
        try:
            filtered_config = {
                k: v for k, v in override_config.items() if v is not None
            }
            return LLMGenerationConfig(**filtered_config)
        except Exception as e:
            logger.warning(f"覆盖配置参数验证失败: {e}")
            raise LLMException(
                f"无效的覆盖配置参数: {e}",
                code=LLMErrorCode.CONFIGURATION_ERROR,
                cause=e,
            )

    return override_config


def apply_api_specific_mappings(
    params: dict[str, Any], api_type: str
) -> dict[str, Any]:
    """应用API特定的参数映射"""
    mapped_params = params.copy()

    if api_type == "gemini":
        if "max_tokens" in mapped_params:
            mapped_params["maxOutputTokens"] = mapped_params.pop("max_tokens")
        if "top_k" in mapped_params:
            mapped_params["topK"] = mapped_params.pop("top_k")
        if "top_p" in mapped_params:
            mapped_params["topP"] = mapped_params.pop("top_p")

        unsupported = ["frequency_penalty", "presence_penalty", "repetition_penalty"]
        for param in unsupported:
            if param in mapped_params:
                logger.warning(f"Gemini 原生API不支持参数 '{param}'，已忽略")
                mapped_params.pop(param)

    elif api_type in ["openai", "deepseek", "zhipu", "general_openai_compat"]:
        if "repetition_penalty" in mapped_params and api_type == "openai":
            logger.warning("OpenAI官方API不支持repetition_penalty参数，已忽略")
            mapped_params.pop("repetition_penalty")

        if "stop" in mapped_params:
            stop_value = mapped_params["stop"]
            if isinstance(stop_value, str):
                mapped_params["stop"] = [stop_value]

    return mapped_params


def create_generation_config_from_kwargs(**kwargs) -> LLMGenerationConfig:
    """从关键字参数创建生成配置"""
    model_fields = getattr(LLMGenerationConfig, "model_fields", {})
    known_fields = set(model_fields.keys())
    known_params = {}
    custom_params = {}

    for key, value in kwargs.items():
        if key in known_fields:
            known_params[key] = value
        else:
            custom_params[key] = value

    if custom_params:
        known_params["custom_params"] = custom_params

    return LLMGenerationConfig(**known_params)
-												✨ feat(llm): 实现LLM服务模块，支持多提供商统一接口和高级功能 (#1923)

* ✨ feat(llm): 实现LLM服务模块，支持多提供商统一接口和高级功能

* 🎨 Ruff

* :sparkles: Config配置类支持BaseModel存储

* :art: 代码格式化

* :art: 代码格式化

* :art: 格式化代码

* ✨ feat(llm): 添加 AI 对话历史管理

* ✨ feat(llmConfig): 引入 LLM 配置模型及管理功能

* 🎨 Ruff

---------

Co-authored-by: fccckaug <xxxmio123123@gmail.com>
Co-authored-by: HibiKier <45528451+HibiKier@users.noreply.github.com>
Co-authored-by: HibiKier <775757368@qq.com>
Co-authored-by: fccckaug <xxxmcsmiomio3@gmail.com>
Co-authored-by: webjoin111 <455457521@qq.com>
											
										
										
											2025-06-21 16:33:21 +08:00
+								"""
 								LLM 生成配置相关类和函数
 								"""
 								from typing import Any
 								from pydantic import BaseModel, Field
 								from zhenxun.services.log import logger
-												♻️ refactor!: 重构LLM服务架构并统一Pydantic兼容性处理 (#2002)

* ♻️ refactor(pydantic): 提取 Pydantic 兼容函数到独立模块

* ♻️ refactor!(llm): 重构LLM服务，引入现代化工具和执行器架构

🏗️ **架构变更**
- 引入ToolProvider/ToolExecutable协议，取代ToolRegistry
- 新增LLMToolExecutor，分离工具调用逻辑
- 新增BaseMemory抽象，解耦会话状态管理

🔄 **API重构**
- 移除：analyze, analyze_multimodal, pipeline_chat
- 新增：generate_structured, run_with_tools
- 重构：chat, search, code变为无状态调用

🛠️ **工具系统**
- 新增@function_tool装饰器
- 统一工具定义到ToolExecutable协议
- 移除MCP工具系统和mcp_tools.json

---------

Co-authored-by: webjoin111 <455457521@qq.com>
											
										
										
											2025-08-04 23:36:12 +08:00
+								from zhenxun.utils.pydantic_compat import model_dump
-												✨ feat(llm): 实现LLM服务模块，支持多提供商统一接口和高级功能 (#1923)

* ✨ feat(llm): 实现LLM服务模块，支持多提供商统一接口和高级功能

* 🎨 Ruff

* :sparkles: Config配置类支持BaseModel存储

* :art: 代码格式化

* :art: 代码格式化

* :art: 格式化代码

* ✨ feat(llm): 添加 AI 对话历史管理

* ✨ feat(llmConfig): 引入 LLM 配置模型及管理功能

* 🎨 Ruff

---------

Co-authored-by: fccckaug <xxxmio123123@gmail.com>
Co-authored-by: HibiKier <45528451+HibiKier@users.noreply.github.com>
Co-authored-by: HibiKier <775757368@qq.com>
Co-authored-by: fccckaug <xxxmcsmiomio3@gmail.com>
Co-authored-by: webjoin111 <455457521@qq.com>
											
										
										
											2025-06-21 16:33:21 +08:00
 								from ..types.enums import ResponseFormat
 								from ..types.exceptions import LLMErrorCode, LLMException
 								class ModelConfigOverride(BaseModel):
 								    """模型配置覆盖参数"""
 								    temperature: float | None = Field(
 								        default=None, ge=0.0, le=2.0, description="生成温度"
 								    )
 								    max_tokens: int | None = Field(default=None, gt=0, description="最大输出token数")
 								    top_p: float | None = Field(default=None, ge=0.0, le=1.0, description="核采样参数")
 								    top_k: int | None = Field(default=None, gt=0, description="Top-K采样参数")
 								    frequency_penalty: float | None = Field(
 								        default=None, ge=-2.0, le=2.0, description="频率惩罚"
 								    )
 								    presence_penalty: float | None = Field(
 								        default=None, ge=-2.0, le=2.0, description="存在惩罚"
 								    )
 								    repetition_penalty: float | None = Field(
 								        default=None, ge=0.0, le=2.0, description="重复惩罚"
 								    )
 								    stop: list[str] | str | None = Field(default=None, description="停止序列")
 								    response_format: ResponseFormat | dict[str, Any] | None = Field(
 								        default=None, description="期望的响应格式"
 								    )
 								    response_mime_type: str | None = Field(
 								        default=None, description="响应MIME类型（Gemini专用）"
 								    )
 								    response_schema: dict[str, Any] | None = Field(
 								        default=None, description="JSON响应模式"
 								    )
 								    thinking_budget: float | None = Field(
 								        default=None, ge=0.0, le=1.0, description="思考预算"
 								    )
-												♻️ refactor!: 重构LLM服务架构并统一Pydantic兼容性处理 (#2002)

* ♻️ refactor(pydantic): 提取 Pydantic 兼容函数到独立模块

* ♻️ refactor!(llm): 重构LLM服务，引入现代化工具和执行器架构

🏗️ **架构变更**
- 引入ToolProvider/ToolExecutable协议，取代ToolRegistry
- 新增LLMToolExecutor，分离工具调用逻辑
- 新增BaseMemory抽象，解耦会话状态管理

🔄 **API重构**
- 移除：analyze, analyze_multimodal, pipeline_chat
- 新增：generate_structured, run_with_tools
- 重构：chat, search, code变为无状态调用

🛠️ **工具系统**
- 新增@function_tool装饰器
- 统一工具定义到ToolExecutable协议
- 移除MCP工具系统和mcp_tools.json

---------

Co-authored-by: webjoin111 <455457521@qq.com>
											
										
										
											2025-08-04 23:36:12 +08:00
+								    include_thoughts: bool | None = Field(
 								        default=None, description="是否在响应中包含思维过程（Gemini专用）"
 								    )
-												✨ feat(llm): 实现LLM服务模块，支持多提供商统一接口和高级功能 (#1923)

* ✨ feat(llm): 实现LLM服务模块，支持多提供商统一接口和高级功能

* 🎨 Ruff

* :sparkles: Config配置类支持BaseModel存储

* :art: 代码格式化

* :art: 代码格式化

* :art: 格式化代码

* ✨ feat(llm): 添加 AI 对话历史管理

* ✨ feat(llmConfig): 引入 LLM 配置模型及管理功能

* 🎨 Ruff

---------

Co-authored-by: fccckaug <xxxmio123123@gmail.com>
Co-authored-by: HibiKier <45528451+HibiKier@users.noreply.github.com>
Co-authored-by: HibiKier <775757368@qq.com>
Co-authored-by: fccckaug <xxxmcsmiomio3@gmail.com>
Co-authored-by: webjoin111 <455457521@qq.com>
											
										
										
											2025-06-21 16:33:21 +08:00
+								    safety_settings: dict[str, str] | None = Field(default=None, description="安全设置")
 								    response_modalities: list[str] | None = Field(
 								        default=None, description="响应模态类型"
 								    )
 								    enable_code_execution: bool | None = Field(
 								        default=None, description="是否启用代码执行"
 								    )
 								    enable_grounding: bool | None = Field(
 								        default=None, description="是否启用信息来源关联"
 								    )
 								    enable_caching: bool | None = Field(default=None, description="是否启用响应缓存")
 								    custom_params: dict[str, Any] | None = Field(default=None, description="自定义参数")
 								    def to_dict(self) -> dict[str, Any]:
 								        """转换为字典，排除None值"""
-												♻️ refactor!: 重构LLM服务架构并统一Pydantic兼容性处理 (#2002)

* ♻️ refactor(pydantic): 提取 Pydantic 兼容函数到独立模块

* ♻️ refactor!(llm): 重构LLM服务，引入现代化工具和执行器架构

🏗️ **架构变更**
- 引入ToolProvider/ToolExecutable协议，取代ToolRegistry
- 新增LLMToolExecutor，分离工具调用逻辑
- 新增BaseMemory抽象，解耦会话状态管理

🔄 **API重构**
- 移除：analyze, analyze_multimodal, pipeline_chat
- 新增：generate_structured, run_with_tools
- 重构：chat, search, code变为无状态调用

🛠️ **工具系统**
- 新增@function_tool装饰器
- 统一工具定义到ToolExecutable协议
- 移除MCP工具系统和mcp_tools.json

---------

Co-authored-by: webjoin111 <455457521@qq.com>
											
										
										
											2025-08-04 23:36:12 +08:00
 								        model_data = model_dump(self, exclude_none=True)
-												✨ feat(llm): 实现LLM服务模块，支持多提供商统一接口和高级功能 (#1923)

* ✨ feat(llm): 实现LLM服务模块，支持多提供商统一接口和高级功能

* 🎨 Ruff

* :sparkles: Config配置类支持BaseModel存储

* :art: 代码格式化

* :art: 代码格式化

* :art: 格式化代码

* ✨ feat(llm): 添加 AI 对话历史管理

* ✨ feat(llmConfig): 引入 LLM 配置模型及管理功能

* 🎨 Ruff

---------

Co-authored-by: fccckaug <xxxmio123123@gmail.com>
Co-authored-by: HibiKier <45528451+HibiKier@users.noreply.github.com>
Co-authored-by: HibiKier <775757368@qq.com>
Co-authored-by: fccckaug <xxxmcsmiomio3@gmail.com>
Co-authored-by: webjoin111 <455457521@qq.com>
											
										
										
											2025-06-21 16:33:21 +08:00
+								        result = {}
 								        for key, value in model_data.items():
-												♻️ refactor!: 重构LLM服务架构并统一Pydantic兼容性处理 (#2002)

* ♻️ refactor(pydantic): 提取 Pydantic 兼容函数到独立模块

* ♻️ refactor!(llm): 重构LLM服务，引入现代化工具和执行器架构

🏗️ **架构变更**
- 引入ToolProvider/ToolExecutable协议，取代ToolRegistry
- 新增LLMToolExecutor，分离工具调用逻辑
- 新增BaseMemory抽象，解耦会话状态管理

🔄 **API重构**
- 移除：analyze, analyze_multimodal, pipeline_chat
- 新增：generate_structured, run_with_tools
- 重构：chat, search, code变为无状态调用

🛠️ **工具系统**
- 新增@function_tool装饰器
- 统一工具定义到ToolExecutable协议
- 移除MCP工具系统和mcp_tools.json

---------

Co-authored-by: webjoin111 <455457521@qq.com>
											
										
										
											2025-08-04 23:36:12 +08:00
+								            if key == "custom_params" and isinstance(value, dict):
 								                result.update(value)
 								            else:
 								                result[key] = value
-												✨ feat(llm): 实现LLM服务模块，支持多提供商统一接口和高级功能 (#1923)

* ✨ feat(llm): 实现LLM服务模块，支持多提供商统一接口和高级功能

* 🎨 Ruff

* :sparkles: Config配置类支持BaseModel存储

* :art: 代码格式化

* :art: 代码格式化

* :art: 格式化代码

* ✨ feat(llm): 添加 AI 对话历史管理

* ✨ feat(llmConfig): 引入 LLM 配置模型及管理功能

* 🎨 Ruff

---------

Co-authored-by: fccckaug <xxxmio123123@gmail.com>
Co-authored-by: HibiKier <45528451+HibiKier@users.noreply.github.com>
Co-authored-by: HibiKier <775757368@qq.com>
Co-authored-by: fccckaug <xxxmcsmiomio3@gmail.com>
Co-authored-by: webjoin111 <455457521@qq.com>
											
										
										
											2025-06-21 16:33:21 +08:00
+								        return result
 								    def merge_with_base_config(
 								        self,
 								        base_temperature: float | None = None,
 								        base_max_tokens: int | None = None,
 								    ) -> dict[str, Any]:
 								        """与基础配置合并，覆盖参数优先"""
 								        merged = {}
 								        if base_temperature is not None:
 								            merged["temperature"] = base_temperature
 								        if base_max_tokens is not None:
 								            merged["max_tokens"] = base_max_tokens
 								        override_dict = self.to_dict()
 								        merged.update(override_dict)
 								        return merged
 								class LLMGenerationConfig(ModelConfigOverride):
 								    """LLM 生成配置，继承模型配置覆盖参数"""
 								    def to_api_params(self, api_type: str, model_name: str) -> dict[str, Any]:
 								        """转换为API参数，支持不同API类型的参数名映射"""
 								        _ = model_name
 								        params = {}
 								        if self.temperature is not None:
 								            params["temperature"] = self.temperature
 								        if self.max_tokens is not None:
-												✨ feat(llm): 全面重构LLM服务模块，增强多模态与工具支持 (#1953)

* ✨ feat(llm): 全面重构LLM服务模块，增强多模态与工具支持

🚀 核心功能增强
- 多模型链式调用：新增 `pipeline_chat` 支持复杂任务流处理
- 扩展提供商支持：新增 ARK(火山方舟)、SiliconFlow(硅基流动) 适配器
- 多模态处理增强：支持URL媒体文件下载转换，提升输入灵活性
- 历史对话支持：AI.analyze 方法支持历史消息上下文和可选 UniMessage 参数
- 文本嵌入功能：新增 `embed`、`analyze_multimodal`、`search_multimodal` 等API
- 模型能力系统：新增 `ModelCapabilities` 统一管理模型特性（多模态、工具调用等）

🔧 架构重构与优化
- MCP工具系统重构：配置独立化至 `data/llm/mcp_tools.json`，预置常用工具
- API调用逻辑统一：提取通用 `_perform_api_call` 方法，消除代码重复
- 跨平台兼容：Windows平台MCP工具npx命令自动包装处理
- HTTP客户端增强：兼容不同版本httpx代理配置（0.28+版本适配）

🛠️ API与配置完善
- 统一返回类型：`AI.analyze` 统一返回 `LLMResponse` 类型
- 消息转换工具：新增 `message_to_unimessage` 转换函数
- Gemini适配器增强：URL图片下载编码、动态安全阈值配置
- 缓存管理：新增模型实例缓存和管理功能
- 配置预设：扩展 CommonOverrides 预设配置选项
- 历史管理优化：支持多模态内容占位符替换，提升效率

📚 文档与开发体验
- README全面重写：新增完整使用指南、API参考和架构概览
- 文档内容扩充：补充嵌入模型、缓存管理、工具注册等功能说明
- 日志记录增强：支持详细调试信息输出
- API简化：移除冗余函数，优化接口设计

* 🎨  feat(llm): 统一LLM服务函数文档格式

* ✨ feat(llm): 添加新模型并简化提供者配置加载

* :rotating_light: auto fix by pre-commit hooks

---------

Co-authored-by: webjoin111 <455457521@qq.com>
Co-authored-by: pre-commit-ci[bot] <66853113+pre-commit-ci[bot]@users.noreply.github.com>
											
										
										
											2025-07-08 11:15:15 +08:00
+								            if api_type == "gemini":
-												✨ feat(llm): 实现LLM服务模块，支持多提供商统一接口和高级功能 (#1923)

* ✨ feat(llm): 实现LLM服务模块，支持多提供商统一接口和高级功能

* 🎨 Ruff

* :sparkles: Config配置类支持BaseModel存储

* :art: 代码格式化

* :art: 代码格式化

* :art: 格式化代码

* ✨ feat(llm): 添加 AI 对话历史管理

* ✨ feat(llmConfig): 引入 LLM 配置模型及管理功能

* 🎨 Ruff

---------

Co-authored-by: fccckaug <xxxmio123123@gmail.com>
Co-authored-by: HibiKier <45528451+HibiKier@users.noreply.github.com>
Co-authored-by: HibiKier <775757368@qq.com>
Co-authored-by: fccckaug <xxxmcsmiomio3@gmail.com>
Co-authored-by: webjoin111 <455457521@qq.com>
											
										
										
											2025-06-21 16:33:21 +08:00
+								                params["maxOutputTokens"] = self.max_tokens
 								            else:
 								                params["max_tokens"] = self.max_tokens
-												✨ feat(llm): 全面重构LLM服务模块，增强多模态与工具支持 (#1953)

* ✨ feat(llm): 全面重构LLM服务模块，增强多模态与工具支持

🚀 核心功能增强
- 多模型链式调用：新增 `pipeline_chat` 支持复杂任务流处理
- 扩展提供商支持：新增 ARK(火山方舟)、SiliconFlow(硅基流动) 适配器
- 多模态处理增强：支持URL媒体文件下载转换，提升输入灵活性
- 历史对话支持：AI.analyze 方法支持历史消息上下文和可选 UniMessage 参数
- 文本嵌入功能：新增 `embed`、`analyze_multimodal`、`search_multimodal` 等API
- 模型能力系统：新增 `ModelCapabilities` 统一管理模型特性（多模态、工具调用等）

🔧 架构重构与优化
- MCP工具系统重构：配置独立化至 `data/llm/mcp_tools.json`，预置常用工具
- API调用逻辑统一：提取通用 `_perform_api_call` 方法，消除代码重复
- 跨平台兼容：Windows平台MCP工具npx命令自动包装处理
- HTTP客户端增强：兼容不同版本httpx代理配置（0.28+版本适配）

🛠️ API与配置完善
- 统一返回类型：`AI.analyze` 统一返回 `LLMResponse` 类型
- 消息转换工具：新增 `message_to_unimessage` 转换函数
- Gemini适配器增强：URL图片下载编码、动态安全阈值配置
- 缓存管理：新增模型实例缓存和管理功能
- 配置预设：扩展 CommonOverrides 预设配置选项
- 历史管理优化：支持多模态内容占位符替换，提升效率

📚 文档与开发体验
- README全面重写：新增完整使用指南、API参考和架构概览
- 文档内容扩充：补充嵌入模型、缓存管理、工具注册等功能说明
- 日志记录增强：支持详细调试信息输出
- API简化：移除冗余函数，优化接口设计

* 🎨  feat(llm): 统一LLM服务函数文档格式

* ✨ feat(llm): 添加新模型并简化提供者配置加载

* :rotating_light: auto fix by pre-commit hooks

---------

Co-authored-by: webjoin111 <455457521@qq.com>
Co-authored-by: pre-commit-ci[bot] <66853113+pre-commit-ci[bot]@users.noreply.github.com>
											
										
										
											2025-07-08 11:15:15 +08:00
+								        if api_type == "gemini":
-												✨ feat(llm): 实现LLM服务模块，支持多提供商统一接口和高级功能 (#1923)

* ✨ feat(llm): 实现LLM服务模块，支持多提供商统一接口和高级功能

* 🎨 Ruff

* :sparkles: Config配置类支持BaseModel存储

* :art: 代码格式化

* :art: 代码格式化

* :art: 格式化代码

* ✨ feat(llm): 添加 AI 对话历史管理

* ✨ feat(llmConfig): 引入 LLM 配置模型及管理功能

* 🎨 Ruff

---------

Co-authored-by: fccckaug <xxxmio123123@gmail.com>
Co-authored-by: HibiKier <45528451+HibiKier@users.noreply.github.com>
Co-authored-by: HibiKier <775757368@qq.com>
Co-authored-by: fccckaug <xxxmcsmiomio3@gmail.com>
Co-authored-by: webjoin111 <455457521@qq.com>
											
										
										
											2025-06-21 16:33:21 +08:00
+								            if self.top_k is not None:
 								                params["topK"] = self.top_k
 								            if self.top_p is not None:
 								                params["topP"] = self.top_p
 								        else:
 								            if self.top_k is not None:
 								                params["top_k"] = self.top_k
 								            if self.top_p is not None:
 								                params["top_p"] = self.top_p
 								        if api_type in ["openai", "deepseek", "zhipu", "general_openai_compat"]:
 								            if self.frequency_penalty is not None:
 								                params["frequency_penalty"] = self.frequency_penalty
 								            if self.presence_penalty is not None:
 								                params["presence_penalty"] = self.presence_penalty
 								            if self.repetition_penalty is not None:
 								                if api_type == "openai":
 								                    logger.warning("OpenAI官方API不支持repetition_penalty参数，已忽略")
 								                else:
 								                    params["repetition_penalty"] = self.repetition_penalty
 								        if self.response_format is not None:
 								            if isinstance(self.response_format, dict):
 								                if api_type in ["openai", "zhipu", "deepseek", "general_openai_compat"]:
 								                    params["response_format"] = self.response_format
 								                    logger.debug(
 								                        f"为 {api_type} 使用自定义 response_format: "
 								                        f"{self.response_format}"
 								                    )
 								            elif self.response_format == ResponseFormat.JSON:
 								                if api_type in ["openai", "zhipu", "deepseek", "general_openai_compat"]:
 								                    params["response_format"] = {"type": "json_object"}
 								                    logger.debug(f"为 {api_type} 启用 JSON 对象输出模式")
-												✨ feat(llm): 全面重构LLM服务模块，增强多模态与工具支持 (#1953)

* ✨ feat(llm): 全面重构LLM服务模块，增强多模态与工具支持

🚀 核心功能增强
- 多模型链式调用：新增 `pipeline_chat` 支持复杂任务流处理
- 扩展提供商支持：新增 ARK(火山方舟)、SiliconFlow(硅基流动) 适配器
- 多模态处理增强：支持URL媒体文件下载转换，提升输入灵活性
- 历史对话支持：AI.analyze 方法支持历史消息上下文和可选 UniMessage 参数
- 文本嵌入功能：新增 `embed`、`analyze_multimodal`、`search_multimodal` 等API
- 模型能力系统：新增 `ModelCapabilities` 统一管理模型特性（多模态、工具调用等）

🔧 架构重构与优化
- MCP工具系统重构：配置独立化至 `data/llm/mcp_tools.json`，预置常用工具
- API调用逻辑统一：提取通用 `_perform_api_call` 方法，消除代码重复
- 跨平台兼容：Windows平台MCP工具npx命令自动包装处理
- HTTP客户端增强：兼容不同版本httpx代理配置（0.28+版本适配）

🛠️ API与配置完善
- 统一返回类型：`AI.analyze` 统一返回 `LLMResponse` 类型
- 消息转换工具：新增 `message_to_unimessage` 转换函数
- Gemini适配器增强：URL图片下载编码、动态安全阈值配置
- 缓存管理：新增模型实例缓存和管理功能
- 配置预设：扩展 CommonOverrides 预设配置选项
- 历史管理优化：支持多模态内容占位符替换，提升效率

📚 文档与开发体验
- README全面重写：新增完整使用指南、API参考和架构概览
- 文档内容扩充：补充嵌入模型、缓存管理、工具注册等功能说明
- 日志记录增强：支持详细调试信息输出
- API简化：移除冗余函数，优化接口设计

* 🎨  feat(llm): 统一LLM服务函数文档格式

* ✨ feat(llm): 添加新模型并简化提供者配置加载

* :rotating_light: auto fix by pre-commit hooks

---------

Co-authored-by: webjoin111 <455457521@qq.com>
Co-authored-by: pre-commit-ci[bot] <66853113+pre-commit-ci[bot]@users.noreply.github.com>
											
										
										
											2025-07-08 11:15:15 +08:00
+								                elif api_type == "gemini":
-												✨ feat(llm): 实现LLM服务模块，支持多提供商统一接口和高级功能 (#1923)

* ✨ feat(llm): 实现LLM服务模块，支持多提供商统一接口和高级功能

* 🎨 Ruff

* :sparkles: Config配置类支持BaseModel存储

* :art: 代码格式化

* :art: 代码格式化

* :art: 格式化代码

* ✨ feat(llm): 添加 AI 对话历史管理

* ✨ feat(llmConfig): 引入 LLM 配置模型及管理功能

* 🎨 Ruff

---------

Co-authored-by: fccckaug <xxxmio123123@gmail.com>
Co-authored-by: HibiKier <45528451+HibiKier@users.noreply.github.com>
Co-authored-by: HibiKier <775757368@qq.com>
Co-authored-by: fccckaug <xxxmcsmiomio3@gmail.com>
Co-authored-by: webjoin111 <455457521@qq.com>
											
										
										
											2025-06-21 16:33:21 +08:00
+								                    params["responseMimeType"] = "application/json"
 								                    if self.response_schema:
 								                        params["responseSchema"] = self.response_schema
 								                    logger.debug(f"为 {api_type} 启用 JSON MIME 类型输出模式")
-												♻️ refactor!: 重构LLM服务架构并统一Pydantic兼容性处理 (#2002)

* ♻️ refactor(pydantic): 提取 Pydantic 兼容函数到独立模块

* ♻️ refactor!(llm): 重构LLM服务，引入现代化工具和执行器架构

🏗️ **架构变更**
- 引入ToolProvider/ToolExecutable协议，取代ToolRegistry
- 新增LLMToolExecutor，分离工具调用逻辑
- 新增BaseMemory抽象，解耦会话状态管理

🔄 **API重构**
- 移除：analyze, analyze_multimodal, pipeline_chat
- 新增：generate_structured, run_with_tools
- 重构：chat, search, code变为无状态调用

🛠️ **工具系统**
- 新增@function_tool装饰器
- 统一工具定义到ToolExecutable协议
- 移除MCP工具系统和mcp_tools.json

---------

Co-authored-by: webjoin111 <455457521@qq.com>
											
										
										
											2025-08-04 23:36:12 +08:00
+								        if self.custom_params:
 								            custom_mapped = apply_api_specific_mappings(self.custom_params, api_type)
 								            params.update(custom_mapped)
-												✨ feat(llm): 全面重构LLM服务模块，增强多模态与工具支持 (#1953)

* ✨ feat(llm): 全面重构LLM服务模块，增强多模态与工具支持

🚀 核心功能增强
- 多模型链式调用：新增 `pipeline_chat` 支持复杂任务流处理
- 扩展提供商支持：新增 ARK(火山方舟)、SiliconFlow(硅基流动) 适配器
- 多模态处理增强：支持URL媒体文件下载转换，提升输入灵活性
- 历史对话支持：AI.analyze 方法支持历史消息上下文和可选 UniMessage 参数
- 文本嵌入功能：新增 `embed`、`analyze_multimodal`、`search_multimodal` 等API
- 模型能力系统：新增 `ModelCapabilities` 统一管理模型特性（多模态、工具调用等）

🔧 架构重构与优化
- MCP工具系统重构：配置独立化至 `data/llm/mcp_tools.json`，预置常用工具
- API调用逻辑统一：提取通用 `_perform_api_call` 方法，消除代码重复
- 跨平台兼容：Windows平台MCP工具npx命令自动包装处理
- HTTP客户端增强：兼容不同版本httpx代理配置（0.28+版本适配）

🛠️ API与配置完善
- 统一返回类型：`AI.analyze` 统一返回 `LLMResponse` 类型
- 消息转换工具：新增 `message_to_unimessage` 转换函数
- Gemini适配器增强：URL图片下载编码、动态安全阈值配置
- 缓存管理：新增模型实例缓存和管理功能
- 配置预设：扩展 CommonOverrides 预设配置选项
- 历史管理优化：支持多模态内容占位符替换，提升效率

📚 文档与开发体验
- README全面重写：新增完整使用指南、API参考和架构概览
- 文档内容扩充：补充嵌入模型、缓存管理、工具注册等功能说明
- 日志记录增强：支持详细调试信息输出
- API简化：移除冗余函数，优化接口设计

* 🎨  feat(llm): 统一LLM服务函数文档格式

* ✨ feat(llm): 添加新模型并简化提供者配置加载

* :rotating_light: auto fix by pre-commit hooks

---------

Co-authored-by: webjoin111 <455457521@qq.com>
Co-authored-by: pre-commit-ci[bot] <66853113+pre-commit-ci[bot]@users.noreply.github.com>
											
										
										
											2025-07-08 11:15:15 +08:00
+								        if api_type == "gemini":
-												✨ feat(llm): 实现LLM服务模块，支持多提供商统一接口和高级功能 (#1923)

* ✨ feat(llm): 实现LLM服务模块，支持多提供商统一接口和高级功能

* 🎨 Ruff

* :sparkles: Config配置类支持BaseModel存储

* :art: 代码格式化

* :art: 代码格式化

* :art: 格式化代码

* ✨ feat(llm): 添加 AI 对话历史管理

* ✨ feat(llmConfig): 引入 LLM 配置模型及管理功能

* 🎨 Ruff

---------

Co-authored-by: fccckaug <xxxmio123123@gmail.com>
Co-authored-by: HibiKier <45528451+HibiKier@users.noreply.github.com>
Co-authored-by: HibiKier <775757368@qq.com>
Co-authored-by: fccckaug <xxxmcsmiomio3@gmail.com>
Co-authored-by: webjoin111 <455457521@qq.com>
											
										
										
											2025-06-21 16:33:21 +08:00
+								            if (
 								                self.response_format != ResponseFormat.JSON
 								                and self.response_mime_type is not None
 								            ):
 								                params["responseMimeType"] = self.response_mime_type
 								                logger.debug(
 								                    f"使用显式设置的 responseMimeType: {self.response_mime_type}"
 								                )
 								            if self.response_schema is not None and "responseSchema" not in params:
 								                params["responseSchema"] = self.response_schema
-												♻️ refactor!: 重构LLM服务架构并统一Pydantic兼容性处理 (#2002)

* ♻️ refactor(pydantic): 提取 Pydantic 兼容函数到独立模块

* ♻️ refactor!(llm): 重构LLM服务，引入现代化工具和执行器架构

🏗️ **架构变更**
- 引入ToolProvider/ToolExecutable协议，取代ToolRegistry
- 新增LLMToolExecutor，分离工具调用逻辑
- 新增BaseMemory抽象，解耦会话状态管理

🔄 **API重构**
- 移除：analyze, analyze_multimodal, pipeline_chat
- 新增：generate_structured, run_with_tools
- 重构：chat, search, code变为无状态调用

🛠️ **工具系统**
- 新增@function_tool装饰器
- 统一工具定义到ToolExecutable协议
- 移除MCP工具系统和mcp_tools.json

---------

Co-authored-by: webjoin111 <455457521@qq.com>
											
										
										
											2025-08-04 23:36:12 +08:00
 								            if self.thinking_budget is not None or self.include_thoughts is not None:
 								                thinking_config = params.setdefault("thinkingConfig", {})
 								                if self.thinking_budget is not None:
 								                    max_budget = 24576
 								                    budget_value = int(self.thinking_budget * max_budget)
 								                    thinking_config["thinkingBudget"] = budget_value
 								                    logger.debug(
 								                        f"已将 thinking_budget (float: {self.thinking_budget}) "
 								                        f"转换为 Gemini API 的整数格式: {budget_value}"
 								                    )
 								                if self.include_thoughts is not None:
 								                    thinking_config["includeThoughts"] = self.include_thoughts
 								                    logger.debug(f"已设置 includeThoughts: {self.include_thoughts}")
-												✨ feat(llm): 实现LLM服务模块，支持多提供商统一接口和高级功能 (#1923)

* ✨ feat(llm): 实现LLM服务模块，支持多提供商统一接口和高级功能

* 🎨 Ruff

* :sparkles: Config配置类支持BaseModel存储

* :art: 代码格式化

* :art: 代码格式化

* :art: 格式化代码

* ✨ feat(llm): 添加 AI 对话历史管理

* ✨ feat(llmConfig): 引入 LLM 配置模型及管理功能

* 🎨 Ruff

---------

Co-authored-by: fccckaug <xxxmio123123@gmail.com>
Co-authored-by: HibiKier <45528451+HibiKier@users.noreply.github.com>
Co-authored-by: HibiKier <775757368@qq.com>
Co-authored-by: fccckaug <xxxmcsmiomio3@gmail.com>
Co-authored-by: webjoin111 <455457521@qq.com>
											
										
										
											2025-06-21 16:33:21 +08:00
+								            if self.safety_settings is not None:
 								                params["safetySettings"] = self.safety_settings
 								            if self.response_modalities is not None:
 								                params["responseModalities"] = self.response_modalities
 								        logger.debug(f"为{api_type}转换配置参数: {len(params)}个参数")
 								        return params
 								def validate_override_params(
 								    override_config: dict[str, Any] | LLMGenerationConfig | None,
 								) -> LLMGenerationConfig:
 								    """验证和标准化覆盖参数"""
 								    if override_config is None:
 								        return LLMGenerationConfig()
 								    if isinstance(override_config, dict):
 								        try:
 								            filtered_config = {
 								                k: v for k, v in override_config.items() if v is not None
 								            }
 								            return LLMGenerationConfig(**filtered_config)
 								        except Exception as e:
 								            logger.warning(f"覆盖配置参数验证失败: {e}")
 								            raise LLMException(
 								                f"无效的覆盖配置参数: {e}",
 								                code=LLMErrorCode.CONFIGURATION_ERROR,
 								                cause=e,
 								            )
 								    return override_config
 								def apply_api_specific_mappings(
 								    params: dict[str, Any], api_type: str
 								) -> dict[str, Any]:
 								    """应用API特定的参数映射"""
 								    mapped_params = params.copy()
-												✨ feat(llm): 全面重构LLM服务模块，增强多模态与工具支持 (#1953)

* ✨ feat(llm): 全面重构LLM服务模块，增强多模态与工具支持

🚀 核心功能增强
- 多模型链式调用：新增 `pipeline_chat` 支持复杂任务流处理
- 扩展提供商支持：新增 ARK(火山方舟)、SiliconFlow(硅基流动) 适配器
- 多模态处理增强：支持URL媒体文件下载转换，提升输入灵活性
- 历史对话支持：AI.analyze 方法支持历史消息上下文和可选 UniMessage 参数
- 文本嵌入功能：新增 `embed`、`analyze_multimodal`、`search_multimodal` 等API
- 模型能力系统：新增 `ModelCapabilities` 统一管理模型特性（多模态、工具调用等）

🔧 架构重构与优化
- MCP工具系统重构：配置独立化至 `data/llm/mcp_tools.json`，预置常用工具
- API调用逻辑统一：提取通用 `_perform_api_call` 方法，消除代码重复
- 跨平台兼容：Windows平台MCP工具npx命令自动包装处理
- HTTP客户端增强：兼容不同版本httpx代理配置（0.28+版本适配）

🛠️ API与配置完善
- 统一返回类型：`AI.analyze` 统一返回 `LLMResponse` 类型
- 消息转换工具：新增 `message_to_unimessage` 转换函数
- Gemini适配器增强：URL图片下载编码、动态安全阈值配置
- 缓存管理：新增模型实例缓存和管理功能
- 配置预设：扩展 CommonOverrides 预设配置选项
- 历史管理优化：支持多模态内容占位符替换，提升效率

📚 文档与开发体验
- README全面重写：新增完整使用指南、API参考和架构概览
- 文档内容扩充：补充嵌入模型、缓存管理、工具注册等功能说明
- 日志记录增强：支持详细调试信息输出
- API简化：移除冗余函数，优化接口设计

* 🎨  feat(llm): 统一LLM服务函数文档格式

* ✨ feat(llm): 添加新模型并简化提供者配置加载

* :rotating_light: auto fix by pre-commit hooks

---------

Co-authored-by: webjoin111 <455457521@qq.com>
Co-authored-by: pre-commit-ci[bot] <66853113+pre-commit-ci[bot]@users.noreply.github.com>
											
										
										
											2025-07-08 11:15:15 +08:00
+								    if api_type == "gemini":
-												✨ feat(llm): 实现LLM服务模块，支持多提供商统一接口和高级功能 (#1923)

* ✨ feat(llm): 实现LLM服务模块，支持多提供商统一接口和高级功能

* 🎨 Ruff

* :sparkles: Config配置类支持BaseModel存储

* :art: 代码格式化

* :art: 代码格式化

* :art: 格式化代码

* ✨ feat(llm): 添加 AI 对话历史管理

* ✨ feat(llmConfig): 引入 LLM 配置模型及管理功能

* 🎨 Ruff

---------

Co-authored-by: fccckaug <xxxmio123123@gmail.com>
Co-authored-by: HibiKier <45528451+HibiKier@users.noreply.github.com>
Co-authored-by: HibiKier <775757368@qq.com>
Co-authored-by: fccckaug <xxxmcsmiomio3@gmail.com>
Co-authored-by: webjoin111 <455457521@qq.com>
											
										
										
											2025-06-21 16:33:21 +08:00
+								        if "max_tokens" in mapped_params:
 								            mapped_params["maxOutputTokens"] = mapped_params.pop("max_tokens")
 								        if "top_k" in mapped_params:
 								            mapped_params["topK"] = mapped_params.pop("top_k")
 								        if "top_p" in mapped_params:
 								            mapped_params["topP"] = mapped_params.pop("top_p")
 								        unsupported = ["frequency_penalty", "presence_penalty", "repetition_penalty"]
 								        for param in unsupported:
 								            if param in mapped_params:
 								                logger.warning(f"Gemini 原生API不支持参数 '{param}'，已忽略")
 								                mapped_params.pop(param)
 								    elif api_type in ["openai", "deepseek", "zhipu", "general_openai_compat"]:
 								        if "repetition_penalty" in mapped_params and api_type == "openai":
 								            logger.warning("OpenAI官方API不支持repetition_penalty参数，已忽略")
 								            mapped_params.pop("repetition_penalty")
 								        if "stop" in mapped_params:
 								            stop_value = mapped_params["stop"]
 								            if isinstance(stop_value, str):
 								                mapped_params["stop"] = [stop_value]
 								    return mapped_params
 								def create_generation_config_from_kwargs(**kwargs) -> LLMGenerationConfig:
 								    """从关键字参数创建生成配置"""
 								    model_fields = getattr(LLMGenerationConfig, "model_fields", {})
 								    known_fields = set(model_fields.keys())
 								    known_params = {}
 								    custom_params = {}
 								    for key, value in kwargs.items():
 								        if key in known_fields:
 								            known_params[key] = value
 								        else:
 								            custom_params[key] = value
 								    if custom_params:
 								        known_params["custom_params"] = custom_params
 								    return LLMGenerationConfig(**known_params)