Add brain memory services and APIs

Introduce the backend pieces for brain memory ingestion, routing, and system telemetry so the new knowledge workflows can project data into a brain view. The supporting tests lock in the new behavior and keep the expanded backend surface stable.

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>
2026-03-22 13:47:34 +08:00
parent e3691b01bb
commit d2447ee635
28 changed files with 2278 additions and 197 deletions
--- a/backend/app/services/agent_service.py
+++ b/backend/app/services/agent_service.py
@@ -6,15 +6,60 @@ Jarvis Agent 服务层
 import json
 import uuid
 from datetime import datetime
-from typing import AsyncGenerator
+from typing import Any, AsyncGenerator
+import asyncio
 from sqlalchemy.ext.asyncio import AsyncSession
 from sqlalchemy import select
 from langchain_core.messages import HumanMessage, AIMessage
+from langchain_openai import ChatOpenAI
+from langchain_anthropic import ChatAnthropic
+from langchain_ollama import ChatOllama
+import httpx
+
+from app.database import async_session

 from app.models.conversation import Conversation, Message
+from app.models.user import User
 from app.agents.graph import get_agent_graph
 from app.agents.context import set_current_user, clear_current_user
 from app.services import memory_service
+from app.services.brain_service import BrainService
+
+
+def _create_llm_from_config(config: dict):
+    """Build a LangChain chat model from one user model-config entry.
+
+    Reads the ``provider``, ``model``, ``api_key`` and ``base_url`` keys of
+    ``config``. ``"claude"`` yields a ``ChatAnthropic`` and ``"ollama"`` a
+    ``ChatOllama``; every other provider value (``"openai"``, ``"deepseek"``,
+    ``"custom"``, or anything unrecognized) yields a ``ChatOpenAI``.
+    """
+    vendor = config.get("provider", "openai")
+    model_id = config.get("model", "")
+    secret = config.get("api_key", "")
+    endpoint = config.get("base_url", "")
+
+    if vendor == "claude":
+        # NOTE(review): confirm ChatAnthropic accepts an httpx.Timeout here
+        # rather than only a float number of seconds.
+        return ChatAnthropic(
+            api_key=secret,
+            model=model_id,
+            timeout=httpx.Timeout(60.0, connect=10.0),
+        )
+
+    if vendor == "ollama":
+        # An empty base_url falls back to the local default endpoint.
+        # NOTE(review): confirm ChatOllama honors a ``timeout`` keyword.
+        return ChatOllama(
+            base_url=endpoint or "http://localhost:11434",
+            model=model_id,
+            timeout=httpx.Timeout(120.0, connect=10.0),
+        )
+
+    # OpenAI-style client: covers openai, deepseek, custom, and any provider
+    # value not matched above. An empty base_url is passed as None.
+    return ChatOpenAI(
+        api_key=secret,
+        model=model_id,
+        base_url=endpoint or None,
+        timeout=httpx.Timeout(60.0, connect=10.0),
+    )


 class AgentService:
@@ -23,12 +68,70 @@ class AgentService:
    def __init__(self, db: AsyncSession):
        self.db = db

+    async def _try_auto_summarize_background(self, user_id: str, conversation_id: str) -> None:
+        """Run auto-summarization on a session separate from ``self.db``.
+
+        Opens a new session from ``async_session`` and hands it to
+        ``memory_service.try_auto_summarize`` together with the user and
+        conversation ids; the session is closed when the call returns.
+        """
+        async with async_session() as background_session:
+            await memory_service.try_auto_summarize(
+                background_session, user_id, conversation_id
+            )
+
+    def _build_progress_event(
+        self,
+        stage: str,
+        label: str,
+        *,
+        agent: str | None = None,
+        tool_name: str | None = None,
+        step: str | None = None,
+        steps: list[str] | None = None,
+    ) -> dict[str, Any]:
+        """Assemble a ``"progress"`` event dict for the streaming response.
+
+        The result always carries the keys ``type``, ``stage``, ``label``,
+        ``agent``, ``tool_name``, ``step`` and ``steps`` (in that order).
+        ``steps`` is an empty list when the argument is ``None`` or empty.
+        """
+        event: dict[str, Any] = dict(
+            type="progress",
+            stage=stage,
+            label=label,
+            agent=agent,
+            tool_name=tool_name,
+            step=step,
+        )
+        event["steps"] = steps if steps else []
+        return event
+
+    async def _get_user_llm_config(self, user_id: str, model_name: str | None = None) -> dict | None:
+        """Look up one model entry from the user's stored LLM configuration.
+
+        Loads the ``User`` row for ``user_id`` and reads its ``llm_config``.
+        Entries are scanned in the ``"chat"`` section first, then ``"vlm"``.
+        With ``model_name`` given, the first entry whose ``"name"`` equals it
+        is returned; otherwise the first entry with a truthy ``"enabled"``.
+
+        Returns:
+            The matching entry, or ``None`` when the user or configuration
+            is missing or nothing matches (so callers can tell that no
+            configuration exists).
+        """
+        lookup = await self.db.execute(select(User).where(User.id == user_id))
+        account = lookup.scalar_one_or_none()
+        if not account or not account.llm_config:
+            return None
+
+        settings = account.llm_config
+
+        # Lazy walk over every entry: all "chat" entries, then all "vlm".
+        candidates = (
+            entry
+            for section in ("chat", "vlm")
+            for entry in settings.get(section, [])
+        )
+
+        if model_name:
+            # An explicit name must match exactly; there is no fallback.
+            return next(
+                (entry for entry in candidates if entry.get("name") == model_name),
+                None,
+            )
+
+        # No name requested: take the first enabled entry.
+        return next((entry for entry in candidates if entry.get("enabled")), None)
+
    async def chat(
        self,
        user_id: str,
        message: str,
        conversation_id: str | None = None,
-    ) -> tuple[str, str, AsyncGenerator[str, None]]:
+        file_ids: list[str] | None = None,
+        model_name: str | None = None,
+    ) -> tuple[str, str, AsyncGenerator[dict[str, Any], None]]:
        """
        处理对话请求（流式）

@@ -53,22 +156,54 @@ class AgentService:
        else:
            conversation_id = conv.id

+        # 如果有文件，读取内容作为上下文
+        file_context = ""
+        if file_ids:
+            from app.services.document_service import DocumentService
+            doc_svc = DocumentService(self.db)
+            for file_id in file_ids:
+                content = await doc_svc.get_document_content(user_id, file_id)
+                if content:
+                    file_context += f"\n\n[用户上传文件内容]\n{content}\n[/文件内容]"
+
+        full_message = f"{message}\n{file_context}" if file_context else message
+
        # 存储用户消息
        user_msg = Message(
            conversation_id=conversation_id,
            role="user",
            content=message,
+            attachments=[{"file_ids": file_ids}] if file_ids else None,
        )
        self.db.add(user_msg)
        await self.db.commit()
        await self.db.refresh(user_msg)

+        brain_service = BrainService(self.db)
+        await brain_service.create_event(
+            user_id,
+            source_type="conversation",
+            source_id=conversation_id,
+            event_type="message_created",
+            title="User message",
+            content_summary=message[:500],
+            raw_excerpt=message[:2000],
+            metadata_={"role": "user"},
+            importance_signal=1.0,
+        )
+        await self.db.commit()
+
        # 预创建助手消息（后续更新内容）
+        user_llm_config = await self._get_user_llm_config(user_id, model_name)
+        model_name_used = model_name
+        if user_llm_config:
+            model_name_used = user_llm_config.get("name", model_name)
+
        assistant_msg = Message(
            conversation_id=conversation_id,
            role="assistant",
            content="",
-            model="jarvis",
+            model=model_name_used or "jarvis",
        )
        self.db.add(assistant_msg)
        await self.db.commit()
@@ -85,7 +220,7 @@ class AgentService:
            try:
                graph = get_agent_graph()
                langgraph_state = {
-                    "messages": [HumanMessage(content=message)],  # type: ignore[arg-type]
+                    "messages": [HumanMessage(content=full_message)],  # type: ignore[arg-type]
                    "user_id": user_id,
                    "conversation_id": conversation_id,
                    "current_agent": "master",
@@ -102,33 +237,81 @@ class AgentService:
                    "final_response": None,
                    "should_respond": True,
                    "memory_context": memory_ctx,
+                    "user_llm_config": user_llm_config,
                }

+                yield self._build_progress_event("thinking", "Jarvis 正在分析请求", agent="master", step="理解你的问题")
+
                collected = ""
                async for event in graph.astream_events(langgraph_state, version="v2"):
                    kind = event.get("event")
-                    if kind == "on_chat_model_end":
-                        content = event.get("data", {}).get("output", {})
-                        if isinstance(content, dict):
-                            content = content.get("content", "")
-                        if content:
-                            delta = content[len(collected):]
-                            if delta:
-                                collected += delta
-                                yield delta
+                    event_name = event.get("name", "")
+                    metadata = event.get("metadata", {})
+                    data = event.get("data", {})
+
+                    if kind == "on_chain_start" and event_name in {"master", "planner", "executor", "librarian", "analyst"}:
+                        stage_map = {
+                            "master": ("thinking", "Jarvis 正在理解请求"),
+                            "planner": ("planning", "Jarvis 正在拆解步骤"),
+                            "executor": ("tool", "Jarvis 正在执行操作"),
+                            "librarian": ("tool", "Jarvis 正在检索知识"),
+                            "analyst": ("thinking", "Jarvis 正在分析信息"),
+                        }
+                        stage, label = stage_map[event_name]
+                        yield self._build_progress_event(stage, label, agent=event_name, step=label)
+                    elif kind == "on_tool_start":
+                        tool_input = data.get("input")
+                        step = None
+                        if isinstance(tool_input, dict) and tool_input:
+                            step = f"调用工具 {event_name}"
+                        yield self._build_progress_event("tool", f"Jarvis 正在调用工具 {event_name}", agent="executor", tool_name=event_name, step=step)
                    elif kind == "on_tool_end":
-                        name = event.get("name", "")
-                        yield f"\n[工具执行: {name}]\n"
+                        yield self._build_progress_event("tool", f"工具 {event_name} 已完成", agent="executor", tool_name=event_name, step=f"已获得 {event_name} 结果")
+                    elif kind == "on_chain_end" and event_name == "planner":
+                        output = data.get("output") or {}
+                        plan_steps = output.get("plan_steps") or []
+                        steps = [item.get("description", "") for item in plan_steps if item.get("description")]
+                        yield self._build_progress_event("planning", "Jarvis 已生成处理步骤", agent="planner", step=steps[0] if steps else "正在整理计划", steps=steps[:4])
+                    elif kind == "on_chat_model_stream":
+                        chunk = data.get("chunk")
+                        content = getattr(chunk, "content", "") if chunk else ""
+                        if isinstance(content, list):
+                            text_parts = []
+                            for item in content:
+                                if isinstance(item, dict):
+                                    text_parts.append(item.get("text", ""))
+                                else:
+                                    text_parts.append(str(item))
+                            content = "".join(text_parts)
+                        if content:
+                            collected += content
+                            yield {"type": "chunk", "content": content}
+                    elif kind == "on_chat_model_end" and not collected:
+                        output = data.get("output")
+                        content = getattr(output, "content", "") if output else ""
+                        if isinstance(content, list):
+                            text_parts = []
+                            for item in content:
+                                if isinstance(item, dict):
+                                    text_parts.append(item.get("text", ""))
+                                else:
+                                    text_parts.append(str(item))
+                            content = "".join(text_parts)
+                        if content:
+                            collected = content
+                            yield {"type": "chunk", "content": content}
+                    elif kind == "on_chain_end" and event_name in {"executor", "librarian", "analyst"}:
+                        yield self._build_progress_event("responding", "Jarvis 正在整理最终回答", agent=event_name, step="生成回复")
            except Exception as e:
-                yield f"\n执行出错: {str(e)}"
+                fallback = f"抱歉，发生错误: {str(e)}"
+                collected = fallback
+                yield {"type": "error", "error": str(e)}
+                yield {"type": "chunk", "content": fallback}
            finally:
                clear_current_user()
-                # 异步触发自动摘要和记忆提取（不阻塞响应）
-                import asyncio
                try:
-                    loop = asyncio.get_running_loop()
-                    loop.create_task(
-                        memory_service.try_auto_summarize(self.db, user_id, conversation_id)
+                    asyncio.get_running_loop().create_task(
+                        self._try_auto_summarize_background(user_id, conversation_id)
                    )
                except Exception:
                    pass
@@ -143,6 +326,18 @@ class AgentService:
                    if msg:
                        msg.content = collected
                        await self.db.commit()
+                        await brain_service.create_event(
+                            user_id,
+                            source_type="conversation",
+                            source_id=conversation_id,
+                            event_type="message_created",
+                            title="Assistant message",
+                            content_summary=collected[:500],
+                            raw_excerpt=collected[:2000],
+                            metadata_={"role": "assistant"},
+                            importance_signal=1.0,
+                        )
+                        await self.db.commit()
                except Exception:
                    pass

@@ -154,12 +349,13 @@ class AgentService:
        message: str,
        conversation_id: str | None = None,
        file_ids: list[str] | None = None,
-    ) -> tuple[str, str, str]:
+        model_name: str | None = None,
+    ) -> tuple[str, str, str, str | None]:
        """
        简单同步版对话（无流式）

        Returns:
-            (conversation_id, message_id, response_content)
+            (conversation_id, message_id, response_content, model_name_used)
        """
        # 获取或创建对话
        if conversation_id:
@@ -203,11 +399,31 @@ class AgentService:
        await self.db.commit()
        await self.db.refresh(user_msg)

+        brain_service = BrainService(self.db)
+        await brain_service.create_event(
+            user_id,
+            source_type="conversation",
+            source_id=conversation_id,
+            event_type="message_created",
+            title="User message",
+            content_summary=message[:500],
+            raw_excerpt=message[:2000],
+            metadata_={"role": "user"},
+            importance_signal=1.0,
+        )
+        await self.db.commit()
+
        # 加载记忆上下文
        memory_ctx = await memory_service.build_memory_context(
            self.db, user_id, conversation_id, message
        )

+        # 获取用户配置的 LLM
+        user_llm_config = await self._get_user_llm_config(user_id, model_name)
+        model_name_used = model_name
+        if user_llm_config:
+            model_name_used = user_llm_config.get("name", model_name)
+
        # 调用 LangGraph Agent
        set_current_user(user_id)
        graph = get_agent_graph()
@@ -229,6 +445,7 @@ class AgentService:
            "final_response": None,
            "should_respond": True,
            "memory_context": memory_ctx,
+            "user_llm_config": user_llm_config,  # 传递用户 LLM 配置
        }

        try:
@@ -238,11 +455,9 @@ class AgentService:
            response_content = f"抱歉，发生错误: {str(e)}"
        finally:
            clear_current_user()
-            # 异步触发自动摘要
-            import asyncio
            try:
                asyncio.get_running_loop().create_task(
-                    memory_service.try_auto_summarize(self.db, user_id, conversation_id)
+                    self._try_auto_summarize_background(user_id, conversation_id)
                )
            except Exception:
                pass
@@ -252,10 +467,23 @@ class AgentService:
            conversation_id=conversation_id,
            role="assistant",
            content=response_content,
-            model="jarvis",
+            model=model_name_used or "jarvis",
        )
        self.db.add(assistant_msg)
        await self.db.commit()
        await self.db.refresh(assistant_msg)

-        return conversation_id, assistant_msg.id, response_content
+        await brain_service.create_event(
+            user_id,
+            source_type="conversation",
+            source_id=conversation_id,
+            event_type="message_created",
+            title="Assistant message",
+            content_summary=response_content[:500],
+            raw_excerpt=response_content[:2000],
+            metadata_={"role": "assistant"},
+            importance_signal=1.0,
+        )
+        await self.db.commit()
+
+        return conversation_id, assistant_msg.id, response_content, model_name_used