agent/core/llm.py

"""
ZhipuAI LLM Client for B2B Shopping AI Assistant
"""
import concurrent.futures
from typing import Any, Optional
from dataclasses import dataclass

from zhipuai import ZhipuAI

from config import settings
from utils.logger import get_logger

logger = get_logger(__name__)


@dataclass
class Message:
    """Chat message structure"""
    role: str  # "system", "user", "assistant"
    content: str


@dataclass
class LLMResponse:
    """LLM response structure"""
    content: str
    finish_reason: str
    usage: dict[str, int]


class ZhipuLLMClient:
    """ZhipuAI LLM Client wrapper"""

    DEFAULT_TIMEOUT = 30  # seconds

    def __init__(
        self,
        api_key: Optional[str] = None,
        model: Optional[str] = None,
        timeout: Optional[int] = None
    ):
        self.api_key = api_key or settings.zhipu_api_key
        self.model = model or settings.zhipu_model
        self.timeout = timeout or self.DEFAULT_TIMEOUT
        self._client = ZhipuAI(api_key=self.api_key)
        logger.info("ZhipuAI client initialized", model=self.model, timeout=self.timeout)

    async def chat(
        self,
        messages: list[Message],
        temperature: float = 0.7,
        max_tokens: int = 2048,
        top_p: float = 0.9,
        **kwargs: Any
    ) -> LLMResponse:
        """Send chat completion request"""
        formatted_messages = [
            {"role": msg.role, "content": msg.content}
            for msg in messages
        ]

        logger.info(
            "Sending chat request",
            model=self.model,
            message_count=len(messages),
            temperature=temperature
        )

        def _make_request():
            return self._client.chat.completions.create(
                model=self.model,
                messages=formatted_messages,
                temperature=temperature,
                max_tokens=max_tokens,
                top_p=top_p,
                **kwargs
            )

        try:
            with concurrent.futures.ThreadPoolExecutor(max_workers=1) as executor:
                future = executor.submit(_make_request)
                response = future.result(timeout=self.timeout)

            choice = response.choices[0]
            content = choice.message.content

            logger.info(
                "Chat response received",
                finish_reason=choice.finish_reason,
                content_length=len(content) if content else 0,
                usage=response.usage.__dict__ if hasattr(response, 'usage') else {}
            )

            if not content:
                logger.warning("LLM returned empty content")

            return LLMResponse(
                content=content or "",
                finish_reason=choice.finish_reason,
                usage={
                    "prompt_tokens": response.usage.prompt_tokens,
                    "completion_tokens": response.usage.completion_tokens,
                    "total_tokens": response.usage.total_tokens
                }
            )

        except concurrent.futures.TimeoutError:
            logger.error("Chat request timed out", timeout=self.timeout)
            raise TimeoutError(f"Request timed out after {self.timeout} seconds")

        except Exception as e:
            logger.error("Chat request failed", error=str(e))
            raise

    async def chat_with_tools(
        self,
        messages: list[Message],
        tools: list[dict[str, Any]],
        temperature: float = 0.7,
        **kwargs: Any
    ) -> tuple[LLMResponse, None]:
        """Send chat completion request with tool calling"""
        formatted_messages = [
            {"role": msg.role, "content": msg.content}
            for msg in messages
        ]

        logger.info(
            "Sending chat request with tools",
            model=self.model,
            tool_count=len(tools)
        )

        try:
            response = self._client.chat.completions.create(
                model=self.model,
                messages=formatted_messages,
                tools=tools,
                temperature=temperature,
                **kwargs
            )

            choice = response.choices[0]
            content = choice.message.content or ""

            return LLMResponse(
                content=content,
                finish_reason=choice.finish_reason,
                usage={
                    "prompt_tokens": response.usage.prompt_tokens,
                    "completion_tokens": response.usage.completion_tokens,
                    "total_tokens": response.usage.total_tokens
                }
            ), None

        except Exception as e:
            logger.error("Chat with tools request failed", error=str(e))
            raise


llm_client: Optional[ZhipuLLMClient] = None


def get_llm_client() -> ZhipuLLMClient:
    """Get or create global LLM client instance"""
    global llm_client
    if llm_client is None:
        llm_client = ZhipuLLMClient()
    return llm_client
feat: 初始化 B2B AI Shopping Assistant 项目 - 配置 Docker Compose 多服务编排 - 实现 Chatwoot + Agent 集成 - 配置 Strapi MCP 知识库 - 支持 7 种语言的 FAQ 系统 - 实现 LangGraph AI 工作流 Co-Authored-By: Claude Sonnet 4.5 <noreply@anthropic.com> 2026-01-14 19:25:22 +08:00			`"""`
			`ZhipuAI LLM Client for B2B Shopping AI Assistant`
			`"""`
feat: 添加物流查询功能和完善 token 传递 - 添加 get_logistics 工具查询 Mall API /mall/api/order/parcel - 修复 Cookie token 传递到 MCP 的问题 - 增强 LLM 客户端超时处理和日志 - 移除 MALL_API_TOKEN，使用用户登录 token - 更新测试页面使用 setUser 设置用户属性 - 增强 webhook 调试日志 2026-01-16 18:36:17 +08:00			`import concurrent.futures`
			`from typing import Any, Optional`
feat: 初始化 B2B AI Shopping Assistant 项目 - 配置 Docker Compose 多服务编排 - 实现 Chatwoot + Agent 集成 - 配置 Strapi MCP 知识库 - 支持 7 种语言的 FAQ 系统 - 实现 LangGraph AI 工作流 Co-Authored-By: Claude Sonnet 4.5 <noreply@anthropic.com> 2026-01-14 19:25:22 +08:00			`from dataclasses import dataclass`

			`from zhipuai import ZhipuAI`

			`from config import settings`
			`from utils.logger import get_logger`

			`logger = get_logger(__name__)`


			`@dataclass`
			`class Message:`
			`"""Chat message structure"""`
			`role: str # "system", "user", "assistant"`
			`content: str`


			`@dataclass`
			`class LLMResponse:`
			`"""LLM response structure"""`
			`content: str`
			`finish_reason: str`
			`usage: dict[str, int]`


			`class ZhipuLLMClient:`
			`"""ZhipuAI LLM Client wrapper"""`
feat: 添加物流查询功能和完善 token 传递 - 添加 get_logistics 工具查询 Mall API /mall/api/order/parcel - 修复 Cookie token 传递到 MCP 的问题 - 增强 LLM 客户端超时处理和日志 - 移除 MALL_API_TOKEN，使用用户登录 token - 更新测试页面使用 setUser 设置用户属性 - 增强 webhook 调试日志 2026-01-16 18:36:17 +08:00
			`DEFAULT_TIMEOUT = 30 # seconds`

feat: 初始化 B2B AI Shopping Assistant 项目 - 配置 Docker Compose 多服务编排 - 实现 Chatwoot + Agent 集成 - 配置 Strapi MCP 知识库 - 支持 7 种语言的 FAQ 系统 - 实现 LangGraph AI 工作流 Co-Authored-By: Claude Sonnet 4.5 <noreply@anthropic.com> 2026-01-14 19:25:22 +08:00			`def __init__(`
			`self,`
			`api_key: Optional[str] = None,`
feat: 添加物流查询功能和完善 token 传递 - 添加 get_logistics 工具查询 Mall API /mall/api/order/parcel - 修复 Cookie token 传递到 MCP 的问题 - 增强 LLM 客户端超时处理和日志 - 移除 MALL_API_TOKEN，使用用户登录 token - 更新测试页面使用 setUser 设置用户属性 - 增强 webhook 调试日志 2026-01-16 18:36:17 +08:00			`model: Optional[str] = None,`
			`timeout: Optional[int] = None`
feat: 初始化 B2B AI Shopping Assistant 项目 - 配置 Docker Compose 多服务编排 - 实现 Chatwoot + Agent 集成 - 配置 Strapi MCP 知识库 - 支持 7 种语言的 FAQ 系统 - 实现 LangGraph AI 工作流 Co-Authored-By: Claude Sonnet 4.5 <noreply@anthropic.com> 2026-01-14 19:25:22 +08:00			`):`
			`self.api_key = api_key or settings.zhipu_api_key`
			`self.model = model or settings.zhipu_model`
feat: 添加物流查询功能和完善 token 传递 - 添加 get_logistics 工具查询 Mall API /mall/api/order/parcel - 修复 Cookie token 传递到 MCP 的问题 - 增强 LLM 客户端超时处理和日志 - 移除 MALL_API_TOKEN，使用用户登录 token - 更新测试页面使用 setUser 设置用户属性 - 增强 webhook 调试日志 2026-01-16 18:36:17 +08:00			`self.timeout = timeout or self.DEFAULT_TIMEOUT`
feat: 初始化 B2B AI Shopping Assistant 项目 - 配置 Docker Compose 多服务编排 - 实现 Chatwoot + Agent 集成 - 配置 Strapi MCP 知识库 - 支持 7 种语言的 FAQ 系统 - 实现 LangGraph AI 工作流 Co-Authored-By: Claude Sonnet 4.5 <noreply@anthropic.com> 2026-01-14 19:25:22 +08:00			`self._client = ZhipuAI(api_key=self.api_key)`
feat: 添加物流查询功能和完善 token 传递 - 添加 get_logistics 工具查询 Mall API /mall/api/order/parcel - 修复 Cookie token 传递到 MCP 的问题 - 增强 LLM 客户端超时处理和日志 - 移除 MALL_API_TOKEN，使用用户登录 token - 更新测试页面使用 setUser 设置用户属性 - 增强 webhook 调试日志 2026-01-16 18:36:17 +08:00			`logger.info("ZhipuAI client initialized", model=self.model, timeout=self.timeout)`

feat: 初始化 B2B AI Shopping Assistant 项目 - 配置 Docker Compose 多服务编排 - 实现 Chatwoot + Agent 集成 - 配置 Strapi MCP 知识库 - 支持 7 种语言的 FAQ 系统 - 实现 LangGraph AI 工作流 Co-Authored-By: Claude Sonnet 4.5 <noreply@anthropic.com> 2026-01-14 19:25:22 +08:00			`async def chat(`
			`self,`
			`messages: list[Message],`
			`temperature: float = 0.7,`
			`max_tokens: int = 2048,`
			`top_p: float = 0.9,`
			`**kwargs: Any`
			`) -> LLMResponse:`
feat: 添加物流查询功能和完善 token 传递 - 添加 get_logistics 工具查询 Mall API /mall/api/order/parcel - 修复 Cookie token 传递到 MCP 的问题 - 增强 LLM 客户端超时处理和日志 - 移除 MALL_API_TOKEN，使用用户登录 token - 更新测试页面使用 setUser 设置用户属性 - 增强 webhook 调试日志 2026-01-16 18:36:17 +08:00			`"""Send chat completion request"""`
feat: 初始化 B2B AI Shopping Assistant 项目 - 配置 Docker Compose 多服务编排 - 实现 Chatwoot + Agent 集成 - 配置 Strapi MCP 知识库 - 支持 7 种语言的 FAQ 系统 - 实现 LangGraph AI 工作流 Co-Authored-By: Claude Sonnet 4.5 <noreply@anthropic.com> 2026-01-14 19:25:22 +08:00			`formatted_messages = [`
			`{"role": msg.role, "content": msg.content}`
			`for msg in messages`
			`]`
feat: 添加物流查询功能和完善 token 传递 - 添加 get_logistics 工具查询 Mall API /mall/api/order/parcel - 修复 Cookie token 传递到 MCP 的问题 - 增强 LLM 客户端超时处理和日志 - 移除 MALL_API_TOKEN，使用用户登录 token - 更新测试页面使用 setUser 设置用户属性 - 增强 webhook 调试日志 2026-01-16 18:36:17 +08:00
			`logger.info(`
feat: 初始化 B2B AI Shopping Assistant 项目 - 配置 Docker Compose 多服务编排 - 实现 Chatwoot + Agent 集成 - 配置 Strapi MCP 知识库 - 支持 7 种语言的 FAQ 系统 - 实现 LangGraph AI 工作流 Co-Authored-By: Claude Sonnet 4.5 <noreply@anthropic.com> 2026-01-14 19:25:22 +08:00			`"Sending chat request",`
			`model=self.model,`
			`message_count=len(messages),`
			`temperature=temperature`
			`)`
feat: 添加物流查询功能和完善 token 传递 - 添加 get_logistics 工具查询 Mall API /mall/api/order/parcel - 修复 Cookie token 传递到 MCP 的问题 - 增强 LLM 客户端超时处理和日志 - 移除 MALL_API_TOKEN，使用用户登录 token - 更新测试页面使用 setUser 设置用户属性 - 增强 webhook 调试日志 2026-01-16 18:36:17 +08:00
			`def _make_request():`
			`return self._client.chat.completions.create(`
feat: 初始化 B2B AI Shopping Assistant 项目 - 配置 Docker Compose 多服务编排 - 实现 Chatwoot + Agent 集成 - 配置 Strapi MCP 知识库 - 支持 7 种语言的 FAQ 系统 - 实现 LangGraph AI 工作流 Co-Authored-By: Claude Sonnet 4.5 <noreply@anthropic.com> 2026-01-14 19:25:22 +08:00			`model=self.model,`
			`messages=formatted_messages,`
			`temperature=temperature,`
			`max_tokens=max_tokens,`
			`top_p=top_p,`
			`**kwargs`
			`)`
feat: 添加物流查询功能和完善 token 传递 - 添加 get_logistics 工具查询 Mall API /mall/api/order/parcel - 修复 Cookie token 传递到 MCP 的问题 - 增强 LLM 客户端超时处理和日志 - 移除 MALL_API_TOKEN，使用用户登录 token - 更新测试页面使用 setUser 设置用户属性 - 增强 webhook 调试日志 2026-01-16 18:36:17 +08:00
			`try:`
			`with concurrent.futures.ThreadPoolExecutor(max_workers=1) as executor:`
			`future = executor.submit(_make_request)`
			`response = future.result(timeout=self.timeout)`

feat: 初始化 B2B AI Shopping Assistant 项目 - 配置 Docker Compose 多服务编排 - 实现 Chatwoot + Agent 集成 - 配置 Strapi MCP 知识库 - 支持 7 种语言的 FAQ 系统 - 实现 LangGraph AI 工作流 Co-Authored-By: Claude Sonnet 4.5 <noreply@anthropic.com> 2026-01-14 19:25:22 +08:00			`choice = response.choices[0]`
feat: 添加物流查询功能和完善 token 传递 - 添加 get_logistics 工具查询 Mall API /mall/api/order/parcel - 修复 Cookie token 传递到 MCP 的问题 - 增强 LLM 客户端超时处理和日志 - 移除 MALL_API_TOKEN，使用用户登录 token - 更新测试页面使用 setUser 设置用户属性 - 增强 webhook 调试日志 2026-01-16 18:36:17 +08:00			`content = choice.message.content`

			`logger.info(`
			`"Chat response received",`
			`finish_reason=choice.finish_reason,`
			`content_length=len(content) if content else 0,`
			`usage=response.usage.__dict__ if hasattr(response, 'usage') else {}`
			`)`

			`if not content:`
			`logger.warning("LLM returned empty content")`

			`return LLMResponse(`
			`content=content or "",`
feat: 初始化 B2B AI Shopping Assistant 项目 - 配置 Docker Compose 多服务编排 - 实现 Chatwoot + Agent 集成 - 配置 Strapi MCP 知识库 - 支持 7 种语言的 FAQ 系统 - 实现 LangGraph AI 工作流 Co-Authored-By: Claude Sonnet 4.5 <noreply@anthropic.com> 2026-01-14 19:25:22 +08:00			`finish_reason=choice.finish_reason,`
			`usage={`
			`"prompt_tokens": response.usage.prompt_tokens,`
			`"completion_tokens": response.usage.completion_tokens,`
			`"total_tokens": response.usage.total_tokens`
			`}`
			`)`
feat: 添加物流查询功能和完善 token 传递 - 添加 get_logistics 工具查询 Mall API /mall/api/order/parcel - 修复 Cookie token 传递到 MCP 的问题 - 增强 LLM 客户端超时处理和日志 - 移除 MALL_API_TOKEN，使用用户登录 token - 更新测试页面使用 setUser 设置用户属性 - 增强 webhook 调试日志 2026-01-16 18:36:17 +08:00
			`except concurrent.futures.TimeoutError:`
			`logger.error("Chat request timed out", timeout=self.timeout)`
			`raise TimeoutError(f"Request timed out after {self.timeout} seconds")`

feat: 初始化 B2B AI Shopping Assistant 项目 - 配置 Docker Compose 多服务编排 - 实现 Chatwoot + Agent 集成 - 配置 Strapi MCP 知识库 - 支持 7 种语言的 FAQ 系统 - 实现 LangGraph AI 工作流 Co-Authored-By: Claude Sonnet 4.5 <noreply@anthropic.com> 2026-01-14 19:25:22 +08:00			`except Exception as e:`
			`logger.error("Chat request failed", error=str(e))`
			`raise`
feat: 添加物流查询功能和完善 token 传递 - 添加 get_logistics 工具查询 Mall API /mall/api/order/parcel - 修复 Cookie token 传递到 MCP 的问题 - 增强 LLM 客户端超时处理和日志 - 移除 MALL_API_TOKEN，使用用户登录 token - 更新测试页面使用 setUser 设置用户属性 - 增强 webhook 调试日志 2026-01-16 18:36:17 +08:00
feat: 初始化 B2B AI Shopping Assistant 项目 - 配置 Docker Compose 多服务编排 - 实现 Chatwoot + Agent 集成 - 配置 Strapi MCP 知识库 - 支持 7 种语言的 FAQ 系统 - 实现 LangGraph AI 工作流 Co-Authored-By: Claude Sonnet 4.5 <noreply@anthropic.com> 2026-01-14 19:25:22 +08:00			`async def chat_with_tools(`
			`self,`
			`messages: list[Message],`
			`tools: list[dict[str, Any]],`
			`temperature: float = 0.7,`
			`**kwargs: Any`
feat: 添加物流查询功能和完善 token 传递 - 添加 get_logistics 工具查询 Mall API /mall/api/order/parcel - 修复 Cookie token 传递到 MCP 的问题 - 增强 LLM 客户端超时处理和日志 - 移除 MALL_API_TOKEN，使用用户登录 token - 更新测试页面使用 setUser 设置用户属性 - 增强 webhook 调试日志 2026-01-16 18:36:17 +08:00			`) -> tuple[LLMResponse, None]:`
			`"""Send chat completion request with tool calling"""`
feat: 初始化 B2B AI Shopping Assistant 项目 - 配置 Docker Compose 多服务编排 - 实现 Chatwoot + Agent 集成 - 配置 Strapi MCP 知识库 - 支持 7 种语言的 FAQ 系统 - 实现 LangGraph AI 工作流 Co-Authored-By: Claude Sonnet 4.5 <noreply@anthropic.com> 2026-01-14 19:25:22 +08:00			`formatted_messages = [`
			`{"role": msg.role, "content": msg.content}`
			`for msg in messages`
			`]`
feat: 添加物流查询功能和完善 token 传递 - 添加 get_logistics 工具查询 Mall API /mall/api/order/parcel - 修复 Cookie token 传递到 MCP 的问题 - 增强 LLM 客户端超时处理和日志 - 移除 MALL_API_TOKEN，使用用户登录 token - 更新测试页面使用 setUser 设置用户属性 - 增强 webhook 调试日志 2026-01-16 18:36:17 +08:00
			`logger.info(`
feat: 初始化 B2B AI Shopping Assistant 项目 - 配置 Docker Compose 多服务编排 - 实现 Chatwoot + Agent 集成 - 配置 Strapi MCP 知识库 - 支持 7 种语言的 FAQ 系统 - 实现 LangGraph AI 工作流 Co-Authored-By: Claude Sonnet 4.5 <noreply@anthropic.com> 2026-01-14 19:25:22 +08:00			`"Sending chat request with tools",`
			`model=self.model,`
			`tool_count=len(tools)`
			`)`
feat: 添加物流查询功能和完善 token 传递 - 添加 get_logistics 工具查询 Mall API /mall/api/order/parcel - 修复 Cookie token 传递到 MCP 的问题 - 增强 LLM 客户端超时处理和日志 - 移除 MALL_API_TOKEN，使用用户登录 token - 更新测试页面使用 setUser 设置用户属性 - 增强 webhook 调试日志 2026-01-16 18:36:17 +08:00
feat: 初始化 B2B AI Shopping Assistant 项目 - 配置 Docker Compose 多服务编排 - 实现 Chatwoot + Agent 集成 - 配置 Strapi MCP 知识库 - 支持 7 种语言的 FAQ 系统 - 实现 LangGraph AI 工作流 Co-Authored-By: Claude Sonnet 4.5 <noreply@anthropic.com> 2026-01-14 19:25:22 +08:00			`try:`
			`response = self._client.chat.completions.create(`
			`model=self.model,`
			`messages=formatted_messages,`
			`tools=tools,`
			`temperature=temperature,`
			`**kwargs`
			`)`
feat: 添加物流查询功能和完善 token 传递 - 添加 get_logistics 工具查询 Mall API /mall/api/order/parcel - 修复 Cookie token 传递到 MCP 的问题 - 增强 LLM 客户端超时处理和日志 - 移除 MALL_API_TOKEN，使用用户登录 token - 更新测试页面使用 setUser 设置用户属性 - 增强 webhook 调试日志 2026-01-16 18:36:17 +08:00
feat: 初始化 B2B AI Shopping Assistant 项目 - 配置 Docker Compose 多服务编排 - 实现 Chatwoot + Agent 集成 - 配置 Strapi MCP 知识库 - 支持 7 种语言的 FAQ 系统 - 实现 LangGraph AI 工作流 Co-Authored-By: Claude Sonnet 4.5 <noreply@anthropic.com> 2026-01-14 19:25:22 +08:00			`choice = response.choices[0]`
feat: 添加物流查询功能和完善 token 传递 - 添加 get_logistics 工具查询 Mall API /mall/api/order/parcel - 修复 Cookie token 传递到 MCP 的问题 - 增强 LLM 客户端超时处理和日志 - 移除 MALL_API_TOKEN，使用用户登录 token - 更新测试页面使用 setUser 设置用户属性 - 增强 webhook 调试日志 2026-01-16 18:36:17 +08:00			`content = choice.message.content or ""`

			`return LLMResponse(`
			`content=content,`
feat: 初始化 B2B AI Shopping Assistant 项目 - 配置 Docker Compose 多服务编排 - 实现 Chatwoot + Agent 集成 - 配置 Strapi MCP 知识库 - 支持 7 种语言的 FAQ 系统 - 实现 LangGraph AI 工作流 Co-Authored-By: Claude Sonnet 4.5 <noreply@anthropic.com> 2026-01-14 19:25:22 +08:00			`finish_reason=choice.finish_reason,`
			`usage={`
			`"prompt_tokens": response.usage.prompt_tokens,`
			`"completion_tokens": response.usage.completion_tokens,`
			`"total_tokens": response.usage.total_tokens`
			`}`
feat: 添加物流查询功能和完善 token 传递 - 添加 get_logistics 工具查询 Mall API /mall/api/order/parcel - 修复 Cookie token 传递到 MCP 的问题 - 增强 LLM 客户端超时处理和日志 - 移除 MALL_API_TOKEN，使用用户登录 token - 更新测试页面使用 setUser 设置用户属性 - 增强 webhook 调试日志 2026-01-16 18:36:17 +08:00			`), None`

feat: 初始化 B2B AI Shopping Assistant 项目 - 配置 Docker Compose 多服务编排 - 实现 Chatwoot + Agent 集成 - 配置 Strapi MCP 知识库 - 支持 7 种语言的 FAQ 系统 - 实现 LangGraph AI 工作流 Co-Authored-By: Claude Sonnet 4.5 <noreply@anthropic.com> 2026-01-14 19:25:22 +08:00			`except Exception as e:`
			`logger.error("Chat with tools request failed", error=str(e))`
			`raise`


			`llm_client: Optional[ZhipuLLMClient] = None`


			`def get_llm_client() -> ZhipuLLMClient:`
			`"""Get or create global LLM client instance"""`
			`global llm_client`
			`if llm_client is None:`
			`llm_client = ZhipuLLMClient()`
			`return llm_client`