Files
iot-device-management-service/app/services/agent_dispatcher.py
16337 8156f54004 重构 Agent:引入 LangGraph StateGraph 替代手写 FC 循环
架构变更:
- 新增 app/services/agent/ 模块(state/prompts/graph/tools)
- 7 个工具从 _tool_xxx 方法提取为 @tool 装饰器函数
- 构建 assistant + ToolNode 的 ReAct 图
- agent_dispatcher.py 改为薄壳入口,支持 USE_LANGGRAPH 开关
- MemorySaver checkpoint 持久化对话(thread_id=wechat-{user_id})
- 新增依赖:langchain-core, langchain-openai, langgraph

向后兼容:
- USE_LANGGRAPH=false 可切回旧版 FC 循环
- LangGraph 初始化失败自动降级到 Legacy 模式
- 企微图片处理/VLM分析逻辑不变
2026-03-25 13:52:55 +08:00

374 lines
14 KiB
Python
Raw Blame History

This file contains ambiguous Unicode characters

This file contains Unicode characters that might be confused with other characters. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.

"""
交互Agent调度器
支持两种模式(通过 USE_LANGGRAPH 环境变量切换):
- LangGraph 模式(默认):基于 StateGraph 的 ReAct agent
- Legacy 模式:手写 Function Calling 循环(向后兼容)
企微入口适配层处理图片上传、VLM分析等企微特有逻辑
核心对话由 LangGraph 图处理。
"""
import json
import os
import time
from typing import Dict, List, Optional
from openai import AsyncOpenAI
from app.config import settings
from app.services.session_manager import get_session_manager
from app.utils.logger import logger
from app.utils.timezone import beijing_now
# Feature flag: route conversations through the LangGraph graph (default)
# or fall back to the legacy hand-written function-calling loop.
_TRUTHY = {"true", "1", "yes"}
USE_LANGGRAPH = os.environ.get("USE_LANGGRAPH", "true").lower() in _TRUTHY
class AgentDispatcher:
    """Singleton-style dispatcher for the interactive agent.

    Routes WeChat Work messages either through the LangGraph ReAct graph
    (default) or through the legacy hand-written function-calling loop.
    """

    def __init__(self):
        # Set to True by init() only when config enables the agent.
        self._enabled = False
        # VLM client used for image analysis (shared by both modes).
        self._vlm_client: Optional[AsyncOpenAI] = None
        # Compiled LangGraph graph instance (None in legacy mode).
        self._graph = None
        # OpenAI client driving the legacy function-calling loop.
        self._legacy_client: Optional[AsyncOpenAI] = None
        # Per-user queue of image URLs to push after a reply (both modes).
        self._pending_images: Dict[str, List[str]] = {}
def init(self, config):
    """Initialize the agent from runtime config.

    The dispatcher becomes enabled only when the config flag is on AND a
    VLM API key is present. In LangGraph mode a graph build failure
    automatically degrades to the legacy loop.
    """
    self._enabled = config.enabled and bool(config.vlm_api_key)
    if not self._enabled:
        logger.info("交互Agent未启用AGENT_ENABLED=false 或缺少 API Key")
        return
    # VLM client for image analysis, shared by both modes.
    self._vlm_client = AsyncOpenAI(
        api_key=config.vlm_api_key,
        base_url=config.vlm_base_url,
    )
    if not USE_LANGGRAPH:
        self._init_legacy(config)
        return
    try:
        from app.services.agent.graph import create_default_graph
        self._graph = create_default_graph()
        logger.info(f"交互Agent已启用(LangGraph模式): model={config.model}")
    except Exception as e:
        # Graph construction failed — degrade to the legacy FC loop.
        logger.error(f"LangGraph 初始化失败降级到Legacy模式: {e}", exc_info=True)
        self._init_legacy(config)
def _init_legacy(self, config):
    """Set up the legacy function-calling mode (no LangGraph graph)."""
    # No graph in legacy mode; handle_message falls through to _legacy_chat.
    self._graph = None
    self._legacy_client = AsyncOpenAI(
        base_url=config.vlm_base_url,
        api_key=config.vlm_api_key,
    )
    logger.info(f"交互Agent已启用(Legacy模式): model={config.model}")
@property
def enabled(self) -> bool:
return self._enabled
# ==================== 消息入口 ====================
async def handle_message(self, user_id: str, content: str) -> str:
"""处理文字消息"""
if not self._enabled:
return "AI助手未启用请联系管理员配置。"
self._pending_images[user_id] = []
try:
if self._graph:
reply = await self._langgraph_chat(user_id, content)
else:
reply = await self._legacy_chat(user_id, content)
except Exception as e:
logger.error(f"Agent对话失败: {e}", exc_info=True)
reply = "抱歉AI助手暂时无法响应请稍后重试。"
# 发送待发图片
pending = self._pending_images.pop(user_id, [])
if pending:
await self._send_images_to_user(user_id, pending)
return reply
async def handle_image(self, user_id: str, media_id: str) -> str:
"""处理图片消息(两种模式共用)"""
if not self._enabled:
return "AI助手未启用请联系管理员配置。"
session = get_session_manager().get(user_id)
# 1. 下载图片
from app.services.wechat_service import get_wechat_service
wechat = get_wechat_service()
image_data = await wechat.download_media(media_id)
if not image_data:
return "图片下载失败,请重新发送。"
# 2. 上传 COS 持久化
from app.services.oss_storage import get_oss_storage
oss = get_oss_storage()
object_key = f"agent/{user_id}/{int(time.time())}.jpg"
try:
oss.upload_file(image_data, object_key, content_type="image/jpeg")
except Exception as e:
logger.error(f"Agent图片上传COS失败: {e}")
return "图片保存失败,请重新发送。"
permanent_url = oss.get_permanent_url(object_key)
presign_url = oss.get_presigned_url(object_key)
# 3. 检查用户是否有待处理工单
handling_alarm_id = self._find_handling_alarm(user_id)
if handling_alarm_id:
session.pending_images.append(permanent_url)
reply = f"收到图片,是否作为【告警 {handling_alarm_id[:20]}...】的处理结果提交?\n回复「是」确认提交,或继续发送更多图片。"
session.pending_alarm_id = handling_alarm_id
return reply
# 4. VLM 分析
from app.services.agent.prompts import IMAGE_ANALYZE_PROMPT
analysis = await self._analyze_image(presign_url, IMAGE_ANALYZE_PROMPT)
if analysis.get("has_anomaly"):
desc = analysis.get("description", "异常情况")
reply = f"检测到异常:{desc}\n\n如需上报,请描述具体位置和情况。"
else:
reply = "未检测到明显安全隐患。如有疑问请描述情况。"
return reply
# ==================== LangGraph 模式 ====================
async def _langgraph_chat(self, user_id: str, content: str) -> str:
"""LangGraph 图调用"""
config = {
"configurable": {
"thread_id": f"wechat-{user_id}",
"user_id": user_id,
}
}
result = await self._graph.ainvoke(
{
"messages": [{"role": "user", "content": content}],
"user_id": user_id,
"pending_images": [],
"user_uploaded_images": [],
},
config=config,
)
# 从工具返回中提取截图 URLget_alarm_detail 返回的 snapshot_url
self._extract_pending_images(user_id, result)
# 获取最终回复
last_msg = result["messages"][-1]
reply = last_msg.content if hasattr(last_msg, "content") else str(last_msg)
return reply.strip() if reply else "处理完成"
def _extract_pending_images(self, user_id: str, result):
"""从 LangGraph 结果中提取需要发送的截图"""
for msg in result.get("messages", []):
# ToolMessage 的 content 可能包含 snapshot_url
if hasattr(msg, "type") and msg.type == "tool" and msg.name == "get_alarm_detail":
try:
data = json.loads(msg.content) if isinstance(msg.content, str) else msg.content
url = data.get("snapshot_url", "")
if url:
if user_id not in self._pending_images:
self._pending_images[user_id] = []
self._pending_images[user_id].append(url)
except Exception:
pass
# ==================== Legacy mode (kept for backward compatibility) ====================
async def _legacy_chat(self, user_id: str, content: str) -> str:
    """Run one turn of the legacy hand-written function-calling loop.

    Sends the session history plus the new user message to the chat
    model, executes any requested tool calls for up to ``max_rounds``
    rounds, and returns the model's final text reply. All replies are
    appended to the session history.

    Fix: removed the unused imports of ALARM_TYPE_NAMES /
    ALARM_LEVEL_NAMES / ALARM_STATUS_NAMES (dead code in the original).
    """
    from app.services.agent.prompts import SYSTEM_PROMPT
    session = get_session_manager().get(user_id)
    session.add_history("user", content)
    messages = [{"role": "system", "content": SYSTEM_PROMPT}]
    messages.extend(session.get_history_for_vlm())
    tools = self._get_legacy_tools()
    max_rounds = 5  # hard cap on tool-call rounds per turn
    for _ in range(max_rounds):
        resp = await self._legacy_client.chat.completions.create(
            model=settings.agent.model,
            messages=messages,
            tools=tools,
            timeout=settings.agent.timeout,
        )
        choice = resp.choices[0]
        if choice.finish_reason == "stop":
            reply = (choice.message.content or "").strip()
            session.add_history("assistant", reply)
            return reply
        if not choice.message.tool_calls:
            # Model neither stopped nor called a tool — give up gracefully.
            reply = (choice.message.content or "处理超时,请重试").strip()
            session.add_history("assistant", reply)
            return reply
        # Execute each requested tool and feed the results back.
        messages.append(choice.message)
        for tc in choice.message.tool_calls:
            try:
                args = json.loads(tc.function.arguments) if tc.function.arguments else {}
            except json.JSONDecodeError:
                args = {}  # malformed arguments from the model — treat as empty
            result = await self._legacy_execute_tool(tc.function.name, args, user_id)
            messages.append({
                "role": "tool",
                "tool_call_id": tc.id,
                "content": json.dumps(result, ensure_ascii=False),
            })
    # Tool-call budget exhausted without a final answer.
    reply = "处理超时,请重试"
    session.add_history("assistant", reply)
    return reply
async def _legacy_execute_tool(self, name: str, args: dict, user_id: str) -> dict:
    """Execute one legacy tool call by delegating to the shared @tool functions.

    Returns the tool's result as a dict; failures are captured and
    reported as ``{"error": ...}`` instead of raising.
    """
    try:
        from langchain_core.runnables import RunnableConfig
        from app.services.agent.tools import all_tools
        registry = {t.name: t for t in all_tools}
        tool_fn = registry.get(name)
        if not tool_fn:
            return {"error": f"未知工具: {name}"}
        # The tools take the runnable config as an explicit argument
        # (it is filtered out of the LLM-facing schema), so inject it.
        args["config"] = RunnableConfig(configurable={"user_id": user_id})
        raw = await tool_fn.ainvoke(args)
        return json.loads(raw) if isinstance(raw, str) else raw
    except Exception as e:
        logger.error(f"Legacy工具执行失败: {name}, error={e}", exc_info=True)
        return {"error": f"执行失败: {str(e)}"}
@staticmethod
def _get_legacy_tools():
    """Build OpenAI function-calling tool specs from the @tool functions."""
    from app.services.agent.tools import all_tools
    specs = []
    for t in all_tools:
        if t.args_schema:
            schema = t.args_schema.schema()
        else:
            schema = {"type": "object", "properties": {}}
        # Hide the injected `config` parameter from the model.
        params = {
            "type": "object",
            "properties": {
                k: v
                for k, v in schema.get("properties", {}).items()
                if k != "config"
            },
            "required": [r for r in schema.get("required", []) if r != "config"],
        }
        specs.append({
            "type": "function",
            "function": {
                "name": t.name,
                "description": t.description or "",
                "parameters": params,
            },
        })
    return specs
# ==================== Shared helpers ====================
async def _analyze_image(self, image_url: str, prompt: str) -> Dict:
    """Analyze an image with the VLM and return the parsed JSON verdict.

    On any failure (API error, unparseable model output) returns a
    neutral "no anomaly" result instead of raising.
    """
    try:
        resp = await self._vlm_client.chat.completions.create(
            model=settings.agent.vlm_model,
            messages=[
                {"role": "system", "content": prompt},
                {"role": "user", "content": [
                    {"type": "image_url", "image_url": {"url": image_url}},
                    {"type": "text", "text": "请分析这张图片"},
                ]},
            ],
            timeout=settings.agent.vlm_timeout,
        )
        text = resp.choices[0].message.content.strip()
        # Strip a markdown code fence and an optional "json" language tag.
        if "```" in text:
            text = text.split("```")[1].strip()
        if text.startswith("json"):
            text = text[4:].strip()
        return json.loads(text)
    except Exception as e:
        logger.error(f"VLM图片分析失败: {e}")
        return {"has_anomaly": False, "description": "", "alarm_type": ""}
async def _send_images_to_user(self, user_id: str, image_urls: List[str]):
    """Push image messages to a user via WeChat Work (best effort).

    Each URL is uploaded as temporary media, then sent through the
    message-send API. Per-image failures are logged and skipped so one
    bad image does not block the rest.

    Fix: ``import httpx`` was inside the per-image loop; hoisted as a
    loop-invariant import.
    """
    import httpx
    from app.services.wechat_service import get_wechat_service
    wechat = get_wechat_service()
    if not wechat.enabled:
        return
    for url in image_urls:
        try:
            media_id = await wechat.upload_media_from_url(url)
            if not media_id:
                continue
            # NOTE(review): relies on the service's private
            # _get_access_token; consider exposing a public send-image
            # API on the WeChat service instead.
            access_token = await wechat._get_access_token()
            payload = {
                "touser": user_id,
                "msgtype": "image",
                "agentid": wechat.agent_id_int,
                "image": {"media_id": media_id},
            }
            api_url = f"https://qyapi.weixin.qq.com/cgi-bin/message/send?access_token={access_token}"
            async with httpx.AsyncClient(timeout=10) as client:
                await client.post(api_url, json=payload)
        except Exception as e:
            logger.error(f"发送告警截图失败: user={user_id}, error={e}")
@staticmethod
def _find_handling_alarm(user_id: str) -> str:
    """Return the id of the most recent alarm the user is handling.

    Returns "" when the user has no alarm in HANDLING state or when the
    query fails (failures are logged, never raised).
    """
    from app.models import get_session, AlarmEvent
    db = get_session()
    try:
        row = (
            db.query(AlarmEvent)
            .filter(
                AlarmEvent.handler == user_id,
                AlarmEvent.handle_status == "HANDLING",
            )
            .order_by(AlarmEvent.event_time.desc())
            .first()
        )
        return row.alarm_id if row else ""
    except Exception as e:
        logger.error(f"查询待处理告警失败: user={user_id}, error={e}")
        return ""
    finally:
        db.close()
# Process-wide singleton instance, created lazily.
_agent_dispatcher: Optional[AgentDispatcher] = None


def get_agent_dispatcher() -> AgentDispatcher:
    """Return the process-wide AgentDispatcher, creating it on first use."""
    global _agent_dispatcher
    if _agent_dispatcher is None:
        _agent_dispatcher = AgentDispatcher()
    return _agent_dispatcher