Persist streaming chat state during generator cleanup, close the SSE inner stream safely, and reject cross-user conversation access while locking the behavior with focused regressions.
593 lines
23 KiB
Python
593 lines
23 KiB
Python
"""
Jarvis Agent service layer.

Handles LangGraph agent invocation, streaming output, and conversation history management.
"""
|
|
|
|
import json
|
|
import uuid
|
|
import logging
|
|
from datetime import UTC, datetime
|
|
from typing import Any, AsyncGenerator
|
|
import asyncio
|
|
from openai import BadRequestError
|
|
from sqlalchemy.ext.asyncio import AsyncSession
|
|
from sqlalchemy import select
|
|
from langchain_core.messages import HumanMessage, AIMessage
|
|
|
|
from app.database import async_session
|
|
from app.logging_utils import summarize_llm_config
|
|
|
|
from app.models.conversation import Conversation, Message
|
|
from app.models.user import User
|
|
from app.agents.graph import get_agent_graph
|
|
from app.agents.context import set_current_user, clear_current_user
|
|
from app.services import memory_service
|
|
from app.services.brain_service import BrainService
|
|
from app.services.llm_service import create_llm_from_config, resolve_provider_capabilities
|
|
from app.agents.tools.time_reasoning import extract_reference_datetime
|
|
from app.agents.state import initial_state
|
|
|
|
logger = logging.getLogger(__name__)
|
|
|
|
|
|
def _is_streaming_rejection_error(error: Exception, user_llm_config: dict | None) -> bool:
    """Heuristically decide whether ``error`` looks like a rejected streaming call.

    The lower-cased error text is scanned for a fixed list of marker
    substrings. For a ``BadRequestError`` the match only counts when the
    ``provider`` attribute of the resolved capabilities is neither
    ``"openai"`` nor ``"claude"``; any other exception type is classified on
    the marker match alone.

    Args:
        error: The exception raised while streaming.
        user_llm_config: The user's model configuration, forwarded to
            ``resolve_provider_capabilities``.

    Returns:
        ``True`` when the error should be treated as a streaming rejection.
    """
    capabilities = resolve_provider_capabilities(user_llm_config)
    lowered = str(error).lower()
    rejection_markers = (
        "invalid chat setting",
        "invalid params",
        "stream",
        "streaming",
        "unsupported",
        "bad_request_error",
        "http 400",
        "error code: 400",
    )

    marker_found = False
    for marker in rejection_markers:
        if marker in lowered:
            marker_found = True
            break

    if not isinstance(error, BadRequestError):
        return marker_found

    # A 400 from these two providers is never treated as a streaming rejection.
    if getattr(capabilities, "provider", None) in {"openai", "claude"}:
        return False
    return marker_found
|
|
|
|
|
|
def _coerce_event_text(content: Any) -> str:
|
|
if isinstance(content, str):
|
|
return content
|
|
if isinstance(content, list):
|
|
parts: list[str] = []
|
|
for item in content:
|
|
if isinstance(item, str):
|
|
parts.append(item)
|
|
elif isinstance(item, dict):
|
|
text = item.get("text")
|
|
if isinstance(text, str):
|
|
parts.append(text)
|
|
return "".join(parts)
|
|
return str(content) if content else ""
|
|
|
|
|
|
_CONTINUITY_STATE_VERSION = 1
|
|
_CONTINUITY_SNAPSHOT_FIELDS = (
|
|
"turn_context",
|
|
"routing_decision",
|
|
"continuity_state",
|
|
"pending_action",
|
|
"last_completed_action",
|
|
"clarification_context",
|
|
"tool_outcomes",
|
|
"pending_tasks",
|
|
"completed_tasks",
|
|
"created_entities",
|
|
"current_agent",
|
|
"next_step",
|
|
"agent_trace",
|
|
)
|
|
|
|
|
|
def _build_continuity_snapshot(state: dict[str, Any]) -> dict[str, Any] | None:
    """Build the versioned continuity envelope for ``state``.

    Only the keys listed in ``_CONTINUITY_SNAPSHOT_FIELDS`` whose value is not
    ``None`` are kept.

    Returns:
        ``{"version": ..., "state": {...}}``, or ``None`` when no listed field
        has a value.
    """
    captured: dict[str, Any] = {}
    for field in _CONTINUITY_SNAPSHOT_FIELDS:
        value = state.get(field)
        if value is not None:
            captured[field] = value

    if not captured:
        return None
    return {"version": _CONTINUITY_STATE_VERSION, "state": captured}
|
|
|
|
|
|
def _extract_continuity_snapshot(payload: Any) -> dict[str, Any] | None:
|
|
if isinstance(payload, list):
|
|
for item in payload:
|
|
snapshot = _extract_continuity_snapshot(item)
|
|
if snapshot:
|
|
return snapshot
|
|
return None
|
|
if not isinstance(payload, dict):
|
|
return None
|
|
if payload.get("kind") != "agent_continuity_state":
|
|
return None
|
|
if payload.get("version") != _CONTINUITY_STATE_VERSION:
|
|
return None
|
|
state = payload.get("state")
|
|
if isinstance(state, dict):
|
|
return state
|
|
return None
|
|
|
|
|
|
class AgentService:
|
|
"""对话 Agent 服务"""
|
|
|
|
def __init__(self, db: AsyncSession):
|
|
self.db = db
|
|
|
|
async def _try_auto_summarize_background(self, user_id: str, conversation_id: str) -> None:
|
|
async with async_session() as session:
|
|
await memory_service.try_auto_summarize(session, user_id, conversation_id)
|
|
|
|
def _build_progress_event(
|
|
self,
|
|
stage: str,
|
|
label: str,
|
|
*,
|
|
agent: str | None = None,
|
|
tool_name: str | None = None,
|
|
step: str | None = None,
|
|
steps: list[str] | None = None,
|
|
) -> dict[str, Any]:
|
|
return {
|
|
"type": "progress",
|
|
"stage": stage,
|
|
"label": label,
|
|
"agent": agent,
|
|
"tool_name": tool_name,
|
|
"step": step,
|
|
"steps": steps or [],
|
|
}
|
|
|
|
def _build_current_datetime_context(self) -> tuple[str, dict[str, str]]:
|
|
now_utc = datetime.now(UTC)
|
|
reference = {
|
|
"current_time_iso": now_utc.isoformat(),
|
|
"current_date_iso": now_utc.date().isoformat(),
|
|
}
|
|
context = (
|
|
"【当前时间】\n"
|
|
f"- current_time_utc: {reference['current_time_iso']}\n"
|
|
f"- current_date_utc: {reference['current_date_iso']}\n"
|
|
"说明:解析‘今天/明天/后天/本周/下周’等相对时间时,请以 current_time_utc 为准。"
|
|
)
|
|
return context, reference
|
|
|
|
async def _get_user_llm_config(self, user_id: str, model_name: str | None = None) -> dict | None:
|
|
"""获取用户的 LLM 模型配置"""
|
|
user = await self.db.get(User, user_id)
|
|
if not user or not user.llm_config:
|
|
return None
|
|
|
|
llm_config = user.llm_config
|
|
|
|
if model_name:
|
|
models = llm_config.get("chat", [])
|
|
for m in models:
|
|
if m.get("name") == model_name:
|
|
return m
|
|
return None
|
|
|
|
chat_models = llm_config.get("chat", [])
|
|
for m in chat_models:
|
|
if m.get("enabled"):
|
|
return m
|
|
|
|
return None
|
|
|
|
async def _load_continuity_snapshot(self, conversation: Conversation) -> dict[str, Any] | None:
|
|
snapshot = _extract_continuity_snapshot(conversation.agent_state)
|
|
if snapshot:
|
|
return snapshot
|
|
|
|
result = await self.db.execute(
|
|
select(Message)
|
|
.where(Message.conversation_id == conversation.id, Message.role == "assistant")
|
|
.order_by(Message.created_at.desc())
|
|
)
|
|
for message in result.scalars():
|
|
snapshot = _extract_continuity_snapshot(message.attachments)
|
|
if snapshot:
|
|
return snapshot
|
|
return None
|
|
|
|
async def _build_agent_state(
|
|
self,
|
|
*,
|
|
user_id: str,
|
|
conversation: Conversation,
|
|
full_message: str,
|
|
memory_context: str | None,
|
|
current_datetime_context: str,
|
|
current_datetime_reference: dict[str, str],
|
|
user_llm_config: dict | None,
|
|
) -> dict[str, Any]:
|
|
state = initial_state(user_id, conversation.id)
|
|
state.update({
|
|
"messages": [HumanMessage(content=full_message)],
|
|
"memory_context": memory_context,
|
|
"current_datetime_context": current_datetime_context,
|
|
"current_datetime_reference": current_datetime_reference,
|
|
"user_llm_config": user_llm_config,
|
|
})
|
|
previous_snapshot = await self._load_continuity_snapshot(conversation)
|
|
if previous_snapshot:
|
|
state.update(previous_snapshot)
|
|
state["messages"] = [HumanMessage(content=full_message)]
|
|
return state
|
|
|
|
async def chat(
|
|
self,
|
|
user_id: str,
|
|
message: str,
|
|
conversation_id: str | None = None,
|
|
file_ids: list[str] | None = None,
|
|
model_name: str | None = None,
|
|
) -> tuple[str, str, AsyncGenerator[dict[str, Any], None]]:
|
|
"""
|
|
处理对话请求(流式)
|
|
"""
|
|
user_llm_config = await self._get_user_llm_config(user_id, model_name)
|
|
model_name_used = model_name
|
|
if model_name and not user_llm_config:
|
|
raise ValueError("所选模型不可用于聊天,请切换到聊天模型")
|
|
if user_llm_config:
|
|
model_name_used = user_llm_config.get("name", model_name)
|
|
|
|
logger.info(
|
|
"agent_chat_started",
|
|
extra={
|
|
"details": {
|
|
"mode": "stream",
|
|
"requested_model_name": model_name,
|
|
"resolved_model_name": model_name_used,
|
|
"message_length": len(message or ""),
|
|
}
|
|
},
|
|
)
|
|
|
|
if conversation_id:
|
|
result = await self.db.execute(
|
|
select(Conversation).where(
|
|
Conversation.id == conversation_id,
|
|
Conversation.user_id == user_id,
|
|
)
|
|
)
|
|
conv = result.scalar_one_or_none()
|
|
if conv is None:
|
|
raise ValueError("会话不存在或无权访问")
|
|
else:
|
|
conv = None
|
|
|
|
if not conv:
|
|
conv = Conversation(user_id=user_id, title=message[:50])
|
|
self.db.add(conv)
|
|
await self.db.commit()
|
|
await self.db.refresh(conv)
|
|
conversation_id = conv.id
|
|
else:
|
|
conversation_id = conv.id
|
|
|
|
file_context = ""
|
|
if file_ids:
|
|
from app.services.document_service import DocumentService
|
|
doc_svc = DocumentService(self.db)
|
|
for file_id in file_ids:
|
|
content = await doc_svc.get_document_content(user_id, file_id)
|
|
if content:
|
|
file_context += f"\n\n[用户上传文件内容]\n{content}\n[/文件内容]"
|
|
|
|
full_message = f"{message}\n{file_context}" if file_context else message
|
|
|
|
user_msg = Message(
|
|
conversation_id=conversation_id,
|
|
role="user",
|
|
content=message,
|
|
attachments=[{"file_ids": file_ids}] if file_ids else None,
|
|
)
|
|
self.db.add(user_msg)
|
|
await self.db.commit()
|
|
await self.db.refresh(user_msg)
|
|
|
|
brain_service = BrainService(self.db)
|
|
await brain_service.create_event(
|
|
user_id,
|
|
source_type="conversation",
|
|
source_id=conversation_id,
|
|
event_type="message_created",
|
|
title="User message",
|
|
content_summary=message[:500],
|
|
raw_excerpt=message[:2000],
|
|
metadata_={"role": "user"},
|
|
importance_signal=1.0,
|
|
)
|
|
await self.db.commit()
|
|
|
|
memory_ctx = await memory_service.build_memory_context(
|
|
self.db, user_id, conversation_id, message
|
|
)
|
|
|
|
assistant_msg = Message(
|
|
conversation_id=conversation_id,
|
|
role="assistant",
|
|
content="",
|
|
model=model_name_used or "jarvis",
|
|
attachments=None,
|
|
)
|
|
self.db.add(assistant_msg)
|
|
await self.db.commit()
|
|
await self.db.refresh(assistant_msg)
|
|
|
|
def _build_assistant_event_payload(content: str) -> dict[str, Any]:
|
|
return {
|
|
"source_type": "conversation",
|
|
"source_id": conversation_id,
|
|
"event_type": "message_created",
|
|
"title": "Assistant message",
|
|
"content_summary": content[:500],
|
|
"raw_excerpt": content[:2000],
|
|
"metadata_": {"role": "assistant"},
|
|
"importance_signal": 0.8,
|
|
}
|
|
|
|
async def run_agent():
|
|
collected = ""
|
|
state: dict[str, Any] | None = None
|
|
set_current_user(user_id)
|
|
try:
|
|
graph = get_agent_graph()
|
|
current_datetime_context, current_datetime_reference = self._build_current_datetime_context()
|
|
|
|
state = await self._build_agent_state(
|
|
user_id=user_id,
|
|
conversation=conv,
|
|
full_message=full_message,
|
|
memory_context=memory_ctx,
|
|
current_datetime_context=current_datetime_context,
|
|
current_datetime_reference=current_datetime_reference,
|
|
user_llm_config=user_llm_config,
|
|
)
|
|
|
|
yield self._build_progress_event("thinking", "Jarvis 正在分析请求", agent="master", step="理解你的问题")
|
|
|
|
try:
|
|
async for event in graph.astream_events(state, version="v2"):
|
|
kind = event.get("event")
|
|
event_name = event.get("name", "")
|
|
metadata = event.get("metadata", {})
|
|
data = event.get("data", {})
|
|
|
|
if kind == "on_chain_start" and event_name in {"master", "schedule_planner", "executor", "librarian", "analyst"}:
|
|
stage_map = {
|
|
"master": ("thinking", "Jarvis 正在理解请求"),
|
|
"schedule_planner": ("planning", "Jarvis 正在编排日程"),
|
|
"executor": ("tool", "Jarvis 正在执行操作"),
|
|
"librarian": ("tool", "Jarvis 正在检索知识"),
|
|
"analyst": ("thinking", "Jarvis 正在分析信息"),
|
|
}
|
|
stage, label = stage_map.get(event_name, ("thinking", "Jarvis 正在思考"))
|
|
yield self._build_progress_event(stage, label, agent=event_name, step=label)
|
|
|
|
elif kind == "on_tool_start":
|
|
yield self._build_progress_event(
|
|
"tool",
|
|
f"Jarvis 正在调用工具 {event_name}",
|
|
agent="executor",
|
|
tool_name=event_name,
|
|
step=f"正在执行 {event_name}",
|
|
)
|
|
|
|
elif kind == "on_tool_end":
|
|
tool_result = data.get("output")
|
|
step = f"已完成 {event_name}"
|
|
if isinstance(tool_result, str) and len(tool_result) > 0:
|
|
step = tool_result[:100]
|
|
yield self._build_progress_event(
|
|
"tool",
|
|
f"工具 {event_name} 已完成",
|
|
agent="executor",
|
|
tool_name=event_name,
|
|
step=step,
|
|
)
|
|
|
|
elif kind == "on_chat_model_stream":
|
|
chunk = data.get("chunk")
|
|
content = _coerce_event_text(getattr(chunk, "content", "") if chunk else "")
|
|
if content:
|
|
collected += content
|
|
yield {"type": "chunk", "content": content}
|
|
|
|
elif kind == "on_chain_end":
|
|
output = data.get("output")
|
|
final_resp = None
|
|
if isinstance(output, dict):
|
|
state.update(output)
|
|
final_resp = output.get("final_response")
|
|
if final_resp:
|
|
final_text = str(final_resp)
|
|
if final_text != collected:
|
|
collected = final_text
|
|
yield {"type": "chunk", "content": final_text}
|
|
|
|
elif kind == "on_chat_model_end":
|
|
output = data.get("output")
|
|
final_content = _coerce_event_text(getattr(output, "content", "") if output else "")
|
|
if final_content:
|
|
final_text = final_content
|
|
if final_text != collected:
|
|
collected = final_text
|
|
yield {"type": "chunk", "content": final_text}
|
|
|
|
except Exception as e:
|
|
if _is_streaming_rejection_error(e, user_llm_config) and not collected:
|
|
yield self._build_progress_event("responding", "Jarvis 正在生成回复", agent="master", step="fallback")
|
|
try:
|
|
result_state = await graph.ainvoke(state)
|
|
if isinstance(result_state, dict):
|
|
state.update(result_state)
|
|
fallback_content = result_state.get("final_response") or str(result_state.get("messages", [AIMessage(content="")])[-1].content)
|
|
collected = str(fallback_content)
|
|
yield {"type": "chunk", "content": collected}
|
|
except Exception:
|
|
logger.exception("llm_sync_fallback_failed")
|
|
safe_error = "模型服务暂不可用,请稍后再试。"
|
|
yield {"type": "error", "error": safe_error}
|
|
collected = f"抱歉,发生错误: {safe_error}"
|
|
yield {"type": "chunk", "content": collected}
|
|
else:
|
|
logger.exception("agent_streaming_failed")
|
|
if not collected:
|
|
safe_error = "模型服务暂不可用,请稍后再试。"
|
|
yield {"type": "error", "error": safe_error}
|
|
collected = f"抱歉,发生错误: {safe_error}"
|
|
yield {"type": "chunk", "content": collected}
|
|
else:
|
|
yield {"type": "error", "error": str(e)}
|
|
finally:
|
|
clear_current_user()
|
|
try:
|
|
if collected:
|
|
assistant_msg.content = collected
|
|
continuity_snapshot = _build_continuity_snapshot(state or {})
|
|
assistant_msg.attachments = ([{
|
|
"kind": "agent_continuity_state",
|
|
**continuity_snapshot,
|
|
}] if continuity_snapshot else None)
|
|
conv.agent_state = continuity_snapshot
|
|
await BrainService(self.db).create_event(
|
|
user_id,
|
|
**_build_assistant_event_payload(collected),
|
|
)
|
|
await self.db.commit()
|
|
await self.db.refresh(assistant_msg)
|
|
except Exception:
|
|
logger.exception("save_assistant_message_failed")
|
|
asyncio.create_task(self._try_auto_summarize_background(user_id, conversation_id))
|
|
|
|
return conversation_id, assistant_msg.id, run_agent()
|
|
|
|
async def chat_simple(
|
|
self,
|
|
user_id: str,
|
|
message: str,
|
|
conversation_id: str | None = None,
|
|
file_ids: list[str] | None = None,
|
|
model_name: str | None = None,
|
|
) -> tuple[str, str, str, str | None]:
|
|
"""
|
|
简单同步版对话
|
|
"""
|
|
user_llm_config = await self._get_user_llm_config(user_id, model_name)
|
|
model_name_used = model_name
|
|
if model_name and not user_llm_config:
|
|
raise ValueError("所选模型不可用于聊天,请切换到聊天模型")
|
|
if user_llm_config:
|
|
model_name_used = user_llm_config.get("name", model_name)
|
|
|
|
if conversation_id:
|
|
result = await self.db.execute(
|
|
select(Conversation).where(
|
|
Conversation.id == conversation_id,
|
|
Conversation.user_id == user_id,
|
|
)
|
|
)
|
|
conv = result.scalar_one_or_none()
|
|
if conv is None:
|
|
raise ValueError("会话不存在或无权访问")
|
|
else:
|
|
conv = None
|
|
|
|
if not conv:
|
|
conv = Conversation(user_id=user_id, title=message[:50])
|
|
self.db.add(conv)
|
|
await self.db.commit()
|
|
await self.db.refresh(conv)
|
|
conversation_id = conv.id
|
|
else:
|
|
conversation_id = conv.id
|
|
|
|
user_msg = Message(conversation_id=conversation_id, role="user", content=message)
|
|
self.db.add(user_msg)
|
|
|
|
assistant_msg = Message(
|
|
conversation_id=conversation_id,
|
|
role="assistant",
|
|
content="",
|
|
model=model_name_used or "jarvis",
|
|
attachments=None,
|
|
)
|
|
self.db.add(assistant_msg)
|
|
|
|
brain_service = BrainService(self.db)
|
|
await brain_service.create_event(
|
|
user_id,
|
|
source_type="conversation",
|
|
source_id=conversation_id,
|
|
event_type="message_created",
|
|
title="User message",
|
|
content_summary=message[:500],
|
|
raw_excerpt=message[:2000],
|
|
metadata_={"role": "user"},
|
|
importance_signal=1.0,
|
|
)
|
|
|
|
memory_ctx = await memory_service.build_memory_context(self.db, user_id, conversation_id, message)
|
|
|
|
set_current_user(user_id)
|
|
try:
|
|
graph = get_agent_graph()
|
|
current_datetime_context, current_datetime_reference = self._build_current_datetime_context()
|
|
state = await self._build_agent_state(
|
|
user_id=user_id,
|
|
conversation=conv,
|
|
full_message=message,
|
|
memory_context=memory_ctx,
|
|
current_datetime_context=current_datetime_context,
|
|
current_datetime_reference=current_datetime_reference,
|
|
user_llm_config=user_llm_config,
|
|
)
|
|
|
|
result_state = await graph.ainvoke(state)
|
|
response_content = result_state.get("final_response") or str(result_state.get("messages", [AIMessage(content="")])[-1].content)
|
|
except Exception as e:
|
|
logger.exception("agent_chat_simple_failed")
|
|
response_content = "抱歉,发生错误。"
|
|
finally:
|
|
clear_current_user()
|
|
|
|
brain_service = BrainService(self.db)
|
|
await brain_service.create_event(
|
|
user_id,
|
|
source_type="conversation",
|
|
source_id=conversation_id,
|
|
event_type="message_created",
|
|
title="Assistant message",
|
|
content_summary=response_content[:500],
|
|
raw_excerpt=response_content[:2000],
|
|
metadata_={"role": "assistant"},
|
|
importance_signal=0.8,
|
|
)
|
|
|
|
assistant_msg.content = response_content
|
|
continuity_snapshot = _build_continuity_snapshot(result_state) if 'result_state' in locals() else None
|
|
assistant_msg.attachments = ([{
|
|
"kind": "agent_continuity_state",
|
|
**continuity_snapshot,
|
|
}] if continuity_snapshot else None)
|
|
conv.agent_state = continuity_snapshot
|
|
await self.db.commit()
|
|
await self.db.refresh(assistant_msg)
|
|
|
|
return conversation_id, assistant_msg.id, response_content, model_name_used
|