feat: 重构知识库系统，移除Hermes集成，增强RAG和同步功能

主要变更: - 移除Hermes智能体及相关回调服务 - 新增知识库RAG、同步、调度、规范化和索引任务服务 - 重构orchestrator服务，增强运行时聊天功能 - 更新前端聊天、政策制度、设置等页面样式和逻辑 - 更新expense_claims和document_intelligence服务 - 删除llm_wiki相关服务和测试文件 - 更新docker-compose配置和启动脚本
2026-05-17 08:38:41 +00:00
parent 212c935308
commit 68f663f2f4
308 changed files with 83729 additions and 13588 deletions
--- a/.tmp/lightrag_inspect/lightrag_pkg/lightrag/llm/voyageai.py
+++ b/.tmp/lightrag_inspect/lightrag_pkg/lightrag/llm/voyageai.py
@@ -0,0 +1,197 @@
+import os
+import numpy as np
+import pipmaster as pm  # Pipmaster for dynamic library install
+
+# Add Voyage AI import
+if not pm.is_installed("voyageai"):
+    pm.install("voyageai")
+
+import voyageai
+from voyageai.error import (
+    APIConnectionError,
+    RateLimitError,
+    ServerError,
+    ServiceUnavailableError,
+    Timeout,
+    TryAgain,
+)
+
+from tenacity import (
+    retry,
+    stop_after_attempt,
+    wait_exponential,
+    retry_if_exception_type,
+)
+from lightrag.utils import wrap_embedding_func_with_attrs, logger
+
+
+# Custom exceptions for VoyageAI errors
+class VoyageAIError(Exception):
+    """Generic VoyageAI API error"""
+
+    pass
+
+
+@wrap_embedding_func_with_attrs(
+    embedding_dim=1024, max_token_size=32000, supports_asymmetric=True
+)
+@retry(
+    stop=stop_after_attempt(3),
+    wait=wait_exponential(multiplier=1, min=4, max=60),
+    retry=retry_if_exception_type(
+        (
+            APIConnectionError,
+            RateLimitError,
+            ServerError,
+            ServiceUnavailableError,
+            Timeout,
+            TryAgain,
+        )
+    ),
+)
+async def voyageai_embed(
+    texts: list[str],
+    model: str = "voyage-3",
+    api_key: str | None = None,
+    embedding_dim: int | None = None,
+    input_type: str | None = None,
+    truncation: bool | None = True,
+    context: str | None = None,
+) -> np.ndarray:
+    """Generate embeddings for a list of texts using VoyageAI's API.
+
+    Args:
+        texts: List of texts to embed.
+        model: The VoyageAI embedding model to use. Options include:
+            - "voyage-3": General purpose (1024 dims, 32K context)
+            - "voyage-3-lite": Lightweight (512 dims, 32K context)
+            - "voyage-3-large": Highest accuracy (1024 dims, 32K context)
+            - "voyage-code-3": Code optimized (1024 dims, 32K context)
+            - "voyage-law-2": Legal documents (1024 dims, 16K context)
+            - "voyage-finance-2": Finance (1024 dims, 32K context)
+        api_key: Optional VoyageAI API key. If None, falls back to the
+            ``VOYAGE_API_KEY`` environment variable (the name VoyageAI's own
+            SDK uses), then to ``VOYAGEAI_API_KEY`` for backward compatibility.
+        embedding_dim: Optional Matryoshka output dimension. Only honored by
+            models that support dimension reduction (e.g. voyage-3-large);
+            ignored otherwise. The decorator default is 1024 to match
+            ``voyage-3``; if you select ``voyage-3-lite`` (512 dims) override
+            ``EMBEDDING_DIM`` accordingly so the vector store size matches.
+        input_type: Optional input type hint for the model. Options:
+            - "query": For search queries
+            - "document": For documents to be indexed
+            - None: Let the model decide (default)
+        truncation: Whether the API should truncate texts that exceed the model's
+            token limit. Defaults to True (matches the VoyageAI SDK default).
+        context: Optional LightRAG embedding context. When ``input_type`` is not
+            set, "query" maps to ``input_type="query"`` and "document" maps to
+            ``input_type="document"``.
+
+    Returns:
+        A numpy array of embeddings, one per input text.
+
+    Raises:
+        VoyageAIError: If the API call fails or returns invalid data.
+
+    """
+    if not api_key:
+        api_key = os.environ.get("VOYAGE_API_KEY") or os.environ.get("VOYAGEAI_API_KEY")
+        if not api_key:
+            logger.error(
+                "VoyageAI API key not provided and neither VOYAGE_API_KEY nor "
+                "VOYAGEAI_API_KEY environment variable is set"
+            )
+            raise ValueError(
+                "VoyageAI API key is required: pass api_key, or set the "
+                "VOYAGE_API_KEY (preferred) or VOYAGEAI_API_KEY environment variable"
+            )
+
+    if input_type is None and context in {"query", "document"}:
+        input_type = context
+
+    try:
+        client = voyageai.AsyncClient(api_key=api_key)
+
+        total_chars = sum(len(t) for t in texts)
+        avg_chars = total_chars / len(texts) if texts else 0
+        logger.debug(
+            f"VoyageAI embedding request: {len(texts)} texts, "
+            f"total_chars={total_chars}, avg_chars={avg_chars:.0f}, model={model}, "
+            f"input_type={input_type}"
+        )
+
+        # Prepare API call parameters
+        embed_params = dict(
+            texts=texts,
+            model=model,
+            # Optional parameters -- if None, voyageai client uses defaults
+            output_dimension=embedding_dim,
+            truncation=truncation,
+            input_type=input_type,
+        )
+        # Make API call with timing
+        result = await client.embed(**embed_params)
+
+        if not result.embeddings:
+            err_msg = "VoyageAI API returned empty embeddings"
+            logger.error(err_msg)
+            raise VoyageAIError(err_msg)
+
+        if len(result.embeddings) != len(texts):
+            err_msg = f"VoyageAI API returned {len(result.embeddings)} embeddings for {len(texts)} texts"
+            logger.error(err_msg)
+            raise VoyageAIError(err_msg)
+
+        # Convert to numpy array with timing
+        embeddings = np.array(result.embeddings, dtype=np.float32)
+        logger.debug(f"VoyageAI embeddings generated: shape {embeddings.shape}")
+
+        return embeddings
+
+    except Exception as e:
+        logger.error(f"VoyageAI embedding error: {e}")
+        raise
+
+
+# Optional: a helper function to get available embedding models
+def get_available_embedding_models() -> dict[str, dict]:
+    """
+    Returns a dictionary of available Voyage AI embedding models and their properties.
+    """
+    return {
+        "voyage-3-large": {
+            "context_length": 32000,
+            "dimension": 1024,
+            "description": "Best general-purpose and multilingual",
+        },
+        "voyage-3": {
+            "context_length": 32000,
+            "dimension": 1024,
+            "description": "General-purpose and multilingual",
+        },
+        "voyage-3-lite": {
+            "context_length": 32000,
+            "dimension": 512,
+            "description": "Optimized for latency and cost",
+        },
+        "voyage-code-3": {
+            "context_length": 32000,
+            "dimension": 1024,
+            "description": "Optimized for code",
+        },
+        "voyage-finance-2": {
+            "context_length": 32000,
+            "dimension": 1024,
+            "description": "Optimized for finance",
+        },
+        "voyage-law-2": {
+            "context_length": 16000,
+            "dimension": 1024,
+            "description": "Optimized for legal",
+        },
+        "voyage-multimodal-3": {
+            "context_length": 32000,
+            "dimension": 1024,
+            "description": "Multimodal text and images",
+        },
+    }