.tmp/lightrag_inspect/lightrag_pkg/lightrag/llm/voyageai.py

import os
import numpy as np
import pipmaster as pm  # Pipmaster for dynamic library install

# Add Voyage AI import
if not pm.is_installed("voyageai"):
    pm.install("voyageai")

import voyageai
from voyageai.error import (
    APIConnectionError,
    RateLimitError,
    ServerError,
    ServiceUnavailableError,
    Timeout,
    TryAgain,
)

from tenacity import (
    retry,
    stop_after_attempt,
    wait_exponential,
    retry_if_exception_type,
)
from lightrag.utils import wrap_embedding_func_with_attrs, logger


# Custom exceptions for VoyageAI errors
class VoyageAIError(Exception):
    """Generic VoyageAI API error"""

    pass


@wrap_embedding_func_with_attrs(
    embedding_dim=1024, max_token_size=32000, supports_asymmetric=True
)
@retry(
    stop=stop_after_attempt(3),
    wait=wait_exponential(multiplier=1, min=4, max=60),
    retry=retry_if_exception_type(
        (
            APIConnectionError,
            RateLimitError,
            ServerError,
            ServiceUnavailableError,
            Timeout,
            TryAgain,
        )
    ),
)
async def voyageai_embed(
    texts: list[str],
    model: str = "voyage-3",
    api_key: str | None = None,
    embedding_dim: int | None = None,
    input_type: str | None = None,
    truncation: bool | None = True,
    context: str | None = None,
) -> np.ndarray:
    """Generate embeddings for a list of texts using VoyageAI's API.

    Args:
        texts: List of texts to embed.
        model: The VoyageAI embedding model to use. Options include:
            - "voyage-3": General purpose (1024 dims, 32K context)
            - "voyage-3-lite": Lightweight (512 dims, 32K context)
            - "voyage-3-large": Highest accuracy (1024 dims, 32K context)
            - "voyage-code-3": Code optimized (1024 dims, 32K context)
            - "voyage-law-2": Legal documents (1024 dims, 16K context)
            - "voyage-finance-2": Finance (1024 dims, 32K context)
        api_key: Optional VoyageAI API key. If None, falls back to the
            ``VOYAGE_API_KEY`` environment variable (the name VoyageAI's own
            SDK uses), then to ``VOYAGEAI_API_KEY`` for backward compatibility.
        embedding_dim: Optional Matryoshka output dimension. Only honored by
            models that support dimension reduction (e.g. voyage-3-large);
            ignored otherwise. The decorator default is 1024 to match
            ``voyage-3``; if you select ``voyage-3-lite`` (512 dims) override
            ``EMBEDDING_DIM`` accordingly so the vector store size matches.
        input_type: Optional input type hint for the model. Options:
            - "query": For search queries
            - "document": For documents to be indexed
            - None: Let the model decide (default)
        truncation: Whether the API should truncate texts that exceed the model's
            token limit. Defaults to True (matches the VoyageAI SDK default).
        context: Optional LightRAG embedding context. When ``input_type`` is not
            set, "query" maps to ``input_type="query"`` and "document" maps to
            ``input_type="document"``.

    Returns:
        A numpy array of embeddings, one per input text.

    Raises:
        VoyageAIError: If the API call fails or returns invalid data.

    """
    if not api_key:
        api_key = os.environ.get("VOYAGE_API_KEY") or os.environ.get("VOYAGEAI_API_KEY")
        if not api_key:
            logger.error(
                "VoyageAI API key not provided and neither VOYAGE_API_KEY nor "
                "VOYAGEAI_API_KEY environment variable is set"
            )
            raise ValueError(
                "VoyageAI API key is required: pass api_key, or set the "
                "VOYAGE_API_KEY (preferred) or VOYAGEAI_API_KEY environment variable"
            )

    if input_type is None and context in {"query", "document"}:
        input_type = context

    try:
        client = voyageai.AsyncClient(api_key=api_key)

        total_chars = sum(len(t) for t in texts)
        avg_chars = total_chars / len(texts) if texts else 0
        logger.debug(
            f"VoyageAI embedding request: {len(texts)} texts, "
            f"total_chars={total_chars}, avg_chars={avg_chars:.0f}, model={model}, "
            f"input_type={input_type}"
        )

        # Prepare API call parameters
        embed_params = dict(
            texts=texts,
            model=model,
            # Optional parameters -- if None, voyageai client uses defaults
            output_dimension=embedding_dim,
            truncation=truncation,
            input_type=input_type,
        )
        # Make API call with timing
        result = await client.embed(**embed_params)

        if not result.embeddings:
            err_msg = "VoyageAI API returned empty embeddings"
            logger.error(err_msg)
            raise VoyageAIError(err_msg)

        if len(result.embeddings) != len(texts):
            err_msg = f"VoyageAI API returned {len(result.embeddings)} embeddings for {len(texts)} texts"
            logger.error(err_msg)
            raise VoyageAIError(err_msg)

        # Convert to numpy array with timing
        embeddings = np.array(result.embeddings, dtype=np.float32)
        logger.debug(f"VoyageAI embeddings generated: shape {embeddings.shape}")

        return embeddings

    except Exception as e:
        logger.error(f"VoyageAI embedding error: {e}")
        raise


# Optional: a helper function to get available embedding models
def get_available_embedding_models() -> dict[str, dict]:
    """
    Returns a dictionary of available Voyage AI embedding models and their properties.
    """
    return {
        "voyage-3-large": {
            "context_length": 32000,
            "dimension": 1024,
            "description": "Best general-purpose and multilingual",
        },
        "voyage-3": {
            "context_length": 32000,
            "dimension": 1024,
            "description": "General-purpose and multilingual",
        },
        "voyage-3-lite": {
            "context_length": 32000,
            "dimension": 512,
            "description": "Optimized for latency and cost",
        },
        "voyage-code-3": {
            "context_length": 32000,
            "dimension": 1024,
            "description": "Optimized for code",
        },
        "voyage-finance-2": {
            "context_length": 32000,
            "dimension": 1024,
            "description": "Optimized for finance",
        },
        "voyage-law-2": {
            "context_length": 16000,
            "dimension": 1024,
            "description": "Optimized for legal",
        },
        "voyage-multimodal-3": {
            "context_length": 32000,
            "dimension": 1024,
            "description": "Multimodal text and images",
        },
    }
feat: 重构知识库系统，移除Hermes集成，增强RAG和同步功能主要变更: - 移除Hermes智能体及相关回调服务 - 新增知识库RAG、同步、调度、规范化和索引任务服务 - 重构orchestrator服务，增强运行时聊天功能 - 更新前端聊天、政策制度、设置等页面样式和逻辑 - 更新expense_claims和document_intelligence服务 - 删除llm_wiki相关服务和测试文件 - 更新docker-compose配置和启动脚本 2026-05-17 08:38:41 +00:00			`import os`
			`import numpy as np`
			`import pipmaster as pm # Pipmaster for dynamic library install`

			`# Add Voyage AI import`
			`if not pm.is_installed("voyageai"):`
			`pm.install("voyageai")`

			`import voyageai`
			`from voyageai.error import (`
			`APIConnectionError,`
			`RateLimitError,`
			`ServerError,`
			`ServiceUnavailableError,`
			`Timeout,`
			`TryAgain,`
			`)`

			`from tenacity import (`
			`retry,`
			`stop_after_attempt,`
			`wait_exponential,`
			`retry_if_exception_type,`
			`)`
			`from lightrag.utils import wrap_embedding_func_with_attrs, logger`


			`# Custom exceptions for VoyageAI errors`
			`class VoyageAIError(Exception):`
			`"""Generic VoyageAI API error"""`

			`pass`


			`@wrap_embedding_func_with_attrs(`
			`embedding_dim=1024, max_token_size=32000, supports_asymmetric=True`
			`)`
			`@retry(`
			`stop=stop_after_attempt(3),`
			`wait=wait_exponential(multiplier=1, min=4, max=60),`
			`retry=retry_if_exception_type(`
			`(`
			`APIConnectionError,`
			`RateLimitError,`
			`ServerError,`
			`ServiceUnavailableError,`
			`Timeout,`
			`TryAgain,`
			`)`
			`),`
			`)`
			`async def voyageai_embed(`
			`texts: list[str],`
			`model: str = "voyage-3",`
			`api_key: str \| None = None,`
			`embedding_dim: int \| None = None,`
			`input_type: str \| None = None,`
			`truncation: bool \| None = True,`
			`context: str \| None = None,`
			`) -> np.ndarray:`
			`"""Generate embeddings for a list of texts using VoyageAI's API.`

			`Args:`
			`texts: List of texts to embed.`
			`model: The VoyageAI embedding model to use. Options include:`
			`- "voyage-3": General purpose (1024 dims, 32K context)`
			`- "voyage-3-lite": Lightweight (512 dims, 32K context)`
			`- "voyage-3-large": Highest accuracy (1024 dims, 32K context)`
			`- "voyage-code-3": Code optimized (1024 dims, 32K context)`
			`- "voyage-law-2": Legal documents (1024 dims, 16K context)`
			`- "voyage-finance-2": Finance (1024 dims, 32K context)`
			`api_key: Optional VoyageAI API key. If None, falls back to the`
			``VOYAGE_API_KEY`` environment variable (the name VoyageAI's own
			SDK uses), then to ``VOYAGEAI_API_KEY`` for backward compatibility.
			`embedding_dim: Optional Matryoshka output dimension. Only honored by`
			`models that support dimension reduction (e.g. voyage-3-large);`
			`ignored otherwise. The decorator default is 1024 to match`
			``voyage-3``; if you select ``voyage-3-lite`` (512 dims) override
			``EMBEDDING_DIM`` accordingly so the vector store size matches.
			`input_type: Optional input type hint for the model. Options:`
			`- "query": For search queries`
			`- "document": For documents to be indexed`
			`- None: Let the model decide (default)`
			`truncation: Whether the API should truncate texts that exceed the model's`
			`token limit. Defaults to True (matches the VoyageAI SDK default).`
			context: Optional LightRAG embedding context. When ``input_type`` is not
			set, "query" maps to ``input_type="query"`` and "document" maps to
			``input_type="document"``.

			`Returns:`
			`A numpy array of embeddings, one per input text.`

			`Raises:`
			`VoyageAIError: If the API call fails or returns invalid data.`

			`"""`
			`if not api_key:`
			`api_key = os.environ.get("VOYAGE_API_KEY") or os.environ.get("VOYAGEAI_API_KEY")`
			`if not api_key:`
			`logger.error(`
			`"VoyageAI API key not provided and neither VOYAGE_API_KEY nor "`
			`"VOYAGEAI_API_KEY environment variable is set"`
			`)`
			`raise ValueError(`
			`"VoyageAI API key is required: pass api_key, or set the "`
			`"VOYAGE_API_KEY (preferred) or VOYAGEAI_API_KEY environment variable"`
			`)`

			`if input_type is None and context in {"query", "document"}:`
			`input_type = context`

			`try:`
			`client = voyageai.AsyncClient(api_key=api_key)`

			`total_chars = sum(len(t) for t in texts)`
			`avg_chars = total_chars / len(texts) if texts else 0`
			`logger.debug(`
			`f"VoyageAI embedding request: {len(texts)} texts, "`
			`f"total_chars={total_chars}, avg_chars={avg_chars:.0f}, model={model}, "`
			`f"input_type={input_type}"`
			`)`

			`# Prepare API call parameters`
			`embed_params = dict(`
			`texts=texts,`
			`model=model,`
			`# Optional parameters -- if None, voyageai client uses defaults`
			`output_dimension=embedding_dim,`
			`truncation=truncation,`
			`input_type=input_type,`
			`)`
			`# Make API call with timing`
			`result = await client.embed(**embed_params)`

			`if not result.embeddings:`
			`err_msg = "VoyageAI API returned empty embeddings"`
			`logger.error(err_msg)`
			`raise VoyageAIError(err_msg)`

			`if len(result.embeddings) != len(texts):`
			`err_msg = f"VoyageAI API returned {len(result.embeddings)} embeddings for {len(texts)} texts"`
			`logger.error(err_msg)`
			`raise VoyageAIError(err_msg)`

			`# Convert to numpy array with timing`
			`embeddings = np.array(result.embeddings, dtype=np.float32)`
			`logger.debug(f"VoyageAI embeddings generated: shape {embeddings.shape}")`

			`return embeddings`

			`except Exception as e:`
			`logger.error(f"VoyageAI embedding error: {e}")`
			`raise`


			`# Optional: a helper function to get available embedding models`
			`def get_available_embedding_models() -> dict[str, dict]:`
			`"""`
			`Returns a dictionary of available Voyage AI embedding models and their properties.`
			`"""`
			`return {`
			`"voyage-3-large": {`
			`"context_length": 32000,`
			`"dimension": 1024,`
			`"description": "Best general-purpose and multilingual",`
			`},`
			`"voyage-3": {`
			`"context_length": 32000,`
			`"dimension": 1024,`
			`"description": "General-purpose and multilingual",`
			`},`
			`"voyage-3-lite": {`
			`"context_length": 32000,`
			`"dimension": 512,`
			`"description": "Optimized for latency and cost",`
			`},`
			`"voyage-code-3": {`
			`"context_length": 32000,`
			`"dimension": 1024,`
			`"description": "Optimized for code",`
			`},`
			`"voyage-finance-2": {`
			`"context_length": 32000,`
			`"dimension": 1024,`
			`"description": "Optimized for finance",`
			`},`
			`"voyage-law-2": {`
			`"context_length": 16000,`
			`"dimension": 1024,`
			`"description": "Optimized for legal",`
			`},`
			`"voyage-multimodal-3": {`
			`"context_length": 32000,`
			`"dimension": 1024,`
			`"description": "Multimodal text and images",`
			`},`
			`}`