# LightRAG/lightrag/llm/anthropic.py

from ..utils import verbose_debug, VERBOSE_DEBUG
import sys
import os
import logging
import numpy as np
from typing import Any, Union, AsyncIterator
import pipmaster as pm  # Pipmaster for dynamic library install

if sys.version_info < (3, 9):
    from typing import AsyncIterator
else:
    from collections.abc import AsyncIterator

# Install Anthropic SDK if not present
if not pm.is_installed("anthropic"):
    pm.install("anthropic")

# Add Voyage AI import
if not pm.is_installed("voyageai"):
    pm.install("voyageai")
import voyageai

from anthropic import (
    AsyncAnthropic,
    APIConnectionError,
    RateLimitError,
    APITimeoutError,
)
from tenacity import (
    retry,
    stop_after_attempt,
    wait_exponential,
    retry_if_exception_type,
)
from lightrag.utils import (
    safe_unicode_decode,
    logger,
)
from lightrag.api import __api_version__


# Custom exception for retry mechanism
class InvalidResponseError(Exception):
    """Signal an unusable LLM response.

    This type is listed in the retry policy of the completion function in
    this module, so raising it from inside that call makes the call be
    attempted again.
    """


# Core Anthropic completion function with retry
@retry(
    stop=stop_after_attempt(3),
    wait=wait_exponential(multiplier=1, min=4, max=10),
    retry=retry_if_exception_type(
        (RateLimitError, APIConnectionError, APITimeoutError, InvalidResponseError)
    ),
)
async def anthropic_complete_if_cache(
    model: str,
    prompt: str,
    system_prompt: str | None = None,
    history_messages: list[dict[str, Any]] | None = None,
    base_url: str | None = None,
    api_key: str | None = None,
    **kwargs: Any,
) -> Union[str, AsyncIterator[str]]:
    """Open a streaming Anthropic Messages request and return its text stream.

    The conversation sent to the API is ``history_messages`` followed by a
    final user turn containing ``prompt``. The system prompt is passed through
    the API's top-level ``system`` parameter rather than as a message, because
    the Messages API only accepts ``user``/``assistant`` roles in ``messages``.

    Args:
        model: Anthropic model identifier.
        prompt: Text of the new user turn.
        system_prompt: Optional system instructions; skipped when empty.
        history_messages: Earlier turns as ``{"role", "content"}`` dicts.
        base_url: Optional API endpoint override for the client.
        api_key: API key; falls back to the ``ANTHROPIC_API_KEY`` environment
            variable when empty.
        **kwargs: Forwarded verbatim to ``messages.create`` after removing
            ``hashing_kv``.
            NOTE(review): the Messages API requires ``max_tokens``; it has to
            arrive through these kwargs - confirm callers supply it.

    Returns:
        An async generator yielding text fragments as they arrive. (The wider
        ``Union`` annotation is kept for signature compatibility.)

    Raises:
        Any exception raised while creating the request is logged and
        re-raised. The retry policy above only covers creating the stream;
        errors raised later, while the returned generator is being consumed,
        are logged and propagated without a retry.
    """
    if history_messages is None:
        history_messages = []
    if not api_key:
        api_key = os.environ.get("ANTHROPIC_API_KEY")

    default_headers = {
        "User-Agent": f"Mozilla/5.0 (Macintosh; Intel Mac OS X 10_15_8) LightRAG/{__api_version__}",
        "Content-Type": "application/json",
    }

    # Set logger level to INFO when VERBOSE_DEBUG is off
    if not VERBOSE_DEBUG and logger.level == logging.DEBUG:
        logging.getLogger("anthropic").setLevel(logging.INFO)

    client_options: dict[str, Any] = {
        "default_headers": default_headers,
        "api_key": api_key,
    }
    if base_url is not None:
        client_options["base_url"] = base_url
    anthropic_async_client = AsyncAnthropic(**client_options)

    kwargs.pop("hashing_kv", None)

    # Only user/assistant turns belong in `messages`; the system prompt is
    # sent separately below.
    messages: list[dict[str, Any]] = [
        *history_messages,
        {"role": "user", "content": prompt},
    ]

    # Copy so the logged kwargs stay exactly what the caller passed in.
    request_options: dict[str, Any] = dict(kwargs)
    if system_prompt:
        request_options["system"] = system_prompt

    logger.debug("===== Sending Query to Anthropic LLM =====")
    logger.debug(f"Model: {model}   Base URL: {base_url}")
    logger.debug(f"Additional kwargs: {kwargs}")
    verbose_debug(f"Query: {prompt}")
    verbose_debug(f"System prompt: {system_prompt}")

    response = None
    try:
        response = await anthropic_async_client.messages.create(
            model=model, messages=messages, stream=True, **request_options
        )
    # APITimeoutError derives from APIConnectionError in the SDK, so it must
    # be matched first or its handler can never run.
    except APITimeoutError as e:
        logger.error(f"Anthropic API Timeout Error: {e}")
        raise
    except APIConnectionError as e:
        logger.error(f"Anthropic API Connection Error: {e}")
        raise
    except RateLimitError as e:
        logger.error(f"Anthropic API Rate Limit Error: {e}")
        raise
    except Exception as e:
        logger.error(
            f"Anthropic API Call Failed,\nModel: {model},\nParams: {kwargs}, Got: {e}"
        )
        raise
    finally:
        # No stream was obtained, so nothing else will ever release the client.
        if response is None:
            await anthropic_async_client.close()

    async def stream_response():
        """Yield the text carried by each streamed event, skipping the rest."""
        try:
            async for event in response:
                # Not every event has a delta, and not every delta has text
                # (e.g. the closing message_delta event), so probe both
                # levels instead of assuming `.delta.text` exists.
                delta = getattr(event, "delta", None)
                content = getattr(delta, "text", None)
                if not content:
                    continue
                if r"\u" in content:
                    content = safe_unicode_decode(content.encode("utf-8"))
                yield content
        except Exception as e:
            logger.error(f"Error in stream response: {str(e)}")
            raise
        finally:
            # The client was created for this single request; release its
            # connections once the stream is finished or abandoned.
            await anthropic_async_client.close()

    return stream_response()


# Generic Anthropic completion function
async def anthropic_complete(
    prompt: str,
    system_prompt: str | None = None,
    history_messages: list[dict[str, Any]] | None = None,
    **kwargs: Any,
) -> Union[str, AsyncIterator[str]]:
    """Run a completion with the model named in the LightRAG configuration.

    The model name is read from
    ``kwargs["hashing_kv"].global_config["llm_model_name"]``, so a
    ``hashing_kv`` keyword argument is mandatory (a missing one raises
    ``KeyError``). Everything else is forwarded unchanged to
    ``anthropic_complete_if_cache``.

    Args:
        prompt: Text of the new user turn.
        system_prompt: Optional system instructions.
        history_messages: Earlier turns; ``None`` is treated as no history.
        **kwargs: Must contain ``hashing_kv``; forwarded along with any other
            options.

    Returns:
        Whatever ``anthropic_complete_if_cache`` returns.
    """
    configured_model = kwargs["hashing_kv"].global_config["llm_model_name"]
    prior_turns = [] if history_messages is None else history_messages
    return await anthropic_complete_if_cache(
        configured_model,
        prompt,
        system_prompt=system_prompt,
        history_messages=prior_turns,
        **kwargs,
    )


# Claude 3 Opus specific completion
async def claude_3_opus_complete(
    prompt: str,
    system_prompt: str | None = None,
    history_messages: list[dict[str, Any]] | None = None,
    **kwargs: Any,
) -> Union[str, AsyncIterator[str]]:
    """Run a completion pinned to the ``claude-3-opus-20240229`` model.

    Thin wrapper: a missing history becomes an empty list and every other
    argument is forwarded as-is to ``anthropic_complete_if_cache``.
    """
    opus_model = "claude-3-opus-20240229"
    prior_turns = [] if history_messages is None else history_messages
    return await anthropic_complete_if_cache(
        opus_model,
        prompt,
        system_prompt=system_prompt,
        history_messages=prior_turns,
        **kwargs,
    )


# Claude 3 Sonnet specific completion
async def claude_3_sonnet_complete(
    prompt: str,
    system_prompt: str | None = None,
    history_messages: list[dict[str, Any]] | None = None,
    **kwargs: Any,
) -> Union[str, AsyncIterator[str]]:
    """Run a completion pinned to the ``claude-3-sonnet-20240229`` model.

    Thin wrapper: a missing history becomes an empty list and every other
    argument is forwarded as-is to ``anthropic_complete_if_cache``.
    """
    sonnet_model = "claude-3-sonnet-20240229"
    prior_turns = [] if history_messages is None else history_messages
    return await anthropic_complete_if_cache(
        sonnet_model,
        prompt,
        system_prompt=system_prompt,
        history_messages=prior_turns,
        **kwargs,
    )


# Claude 3 Haiku specific completion
async def claude_3_haiku_complete(
    prompt: str,
    system_prompt: str | None = None,
    history_messages: list[dict[str, Any]] | None = None,
    **kwargs: Any,
) -> Union[str, AsyncIterator[str]]:
    """Run a completion pinned to the ``claude-3-haiku-20240307`` model.

    Thin wrapper: a missing history becomes an empty list and every other
    argument is forwarded as-is to ``anthropic_complete_if_cache``.
    """
    haiku_model = "claude-3-haiku-20240307"
    prior_turns = [] if history_messages is None else history_messages
    return await anthropic_complete_if_cache(
        haiku_model,
        prompt,
        system_prompt=system_prompt,
        history_messages=prior_turns,
        **kwargs,
    )


# Embedding function (backed by Voyage AI, as Anthropic does not provide embeddings)
@retry(
    stop=stop_after_attempt(3),
    wait=wait_exponential(multiplier=1, min=4, max=60),
    # The request goes to Voyage AI, so the transient failures worth retrying
    # are the Voyage client's own error types, not the Anthropic SDK's.
    retry=retry_if_exception_type(
        (
            voyageai.error.RateLimitError,
            voyageai.error.ServiceUnavailableError,
            voyageai.error.Timeout,
        )
    ),
)
async def anthropic_embed(
    texts: list[str],
    model: str = "voyage-3",  # Default to voyage-3 as a good general-purpose model
    base_url: str | None = None,
    api_key: str | None = None,
) -> np.ndarray:
    """
    Generate embeddings using Voyage AI since Anthropic doesn't provide native embedding support.

    Args:
        texts: List of text strings to embed
        model: Voyage AI model name (e.g., "voyage-3", "voyage-3-large", "voyage-code-3")
        base_url: Accepted for signature compatibility; not used by this function
        api_key: API key for Voyage AI (defaults to VOYAGE_API_KEY environment variable)

    Returns:
        float32 numpy array built from the embeddings returned by Voyage AI,
        one row per input text

    Raises:
        ValueError: If no API key is passed and VOYAGE_API_KEY is not set.
        Exception: Any error raised by the Voyage AI client is logged and
            re-raised; the error types listed in the retry policy above are
            retried up to three attempts first.
    """
    if not api_key:
        api_key = os.environ.get("VOYAGE_API_KEY")
        if not api_key:
            logger.error("VOYAGE_API_KEY environment variable not set")
            raise ValueError(
                "VOYAGE_API_KEY environment variable is required for embeddings"
            )

    try:
        # Use the async client so the HTTP round-trip does not block the
        # event loop this coroutine runs on.
        voyage_client = voyageai.AsyncClient(api_key=api_key)

        # Get embeddings
        result = await voyage_client.embed(
            texts,
            model=model,
            input_type="document",  # Assuming document context; could be made configurable
        )

        # Convert list of embeddings to numpy array
        embeddings = np.array(result.embeddings, dtype=np.float32)

        logger.debug(f"Generated embeddings for {len(texts)} texts using {model}")
        verbose_debug(f"Embedding shape: {embeddings.shape}")

        return embeddings

    except Exception as e:
        logger.error(f"Voyage AI embedding failed: {str(e)}")
        raise


# Optional: a helper function to get available embedding models
def get_available_embedding_models() -> dict[str, dict]:
    """
    Describe the Voyage AI embedding models known to this module.

    Returns:
        A freshly built mapping from model name to a dict with the keys
        "context_length", "dimension" and "description".
    """
    # One row per model: (name, context length, embedding dimension, summary).
    catalog = (
        ("voyage-3-large", 32000, 1024, "Best general-purpose and multilingual"),
        ("voyage-3", 32000, 1024, "General-purpose and multilingual"),
        ("voyage-3-lite", 32000, 512, "Optimized for latency and cost"),
        ("voyage-code-3", 32000, 1024, "Optimized for code"),
        ("voyage-finance-2", 32000, 1024, "Optimized for finance"),
        ("voyage-law-2", 16000, 1024, "Optimized for legal"),
        ("voyage-multimodal-3", 32000, 1024, "Multimodal text and images"),
    )
    return {
        model_name: {
            "context_length": context_length,
            "dimension": dimension,
            "description": summary,
        }
        for model_name, context_length, dimension, summary in catalog
    }
Create anthropic.py 2025-03-17 10:21:01 +01:00			`from ..utils import verbose_debug, VERBOSE_DEBUG`
			`import sys`
			`import os`
			`import logging`
			`import numpy as np`
			`from typing import Any, Union, AsyncIterator`
			`import pipmaster as pm # Pipmaster for dynamic library install`

			`if sys.version_info < (3, 9):`
			`from typing import AsyncIterator`
			`else:`
			`from collections.abc import AsyncIterator`

			`# Install Anthropic SDK if not present`
			`if not pm.is_installed("anthropic"):`
			`pm.install("anthropic")`

			`# Add Voyage AI import`
			`if not pm.is_installed("voyageai"):`
			`pm.install("voyageai")`
			`import voyageai`

			`from anthropic import (`
			`AsyncAnthropic,`
			`APIConnectionError,`
			`RateLimitError,`
			`APITimeoutError,`
			`)`
			`from tenacity import (`
			`retry,`
			`stop_after_attempt,`
			`wait_exponential,`
			`retry_if_exception_type,`
			`)`
			`from lightrag.utils import (`
			`safe_unicode_decode,`
			`logger,`
			`)`
			`from lightrag.api import __api_version__`

Update webui assets 2025-03-22 00:36:38 +08:00
Create anthropic.py 2025-03-17 10:21:01 +01:00			`# Custom exception for retry mechanism`
			`class InvalidResponseError(Exception):`
			`"""Custom exception class for triggering retry mechanism"""`
Update webui assets 2025-03-22 00:36:38 +08:00
Create anthropic.py 2025-03-17 10:21:01 +01:00			`pass`

Update webui assets 2025-03-22 00:36:38 +08:00
Create anthropic.py 2025-03-17 10:21:01 +01:00			`# Core Anthropic completion function with retry`
			`@retry(`
			`stop=stop_after_attempt(3),`
			`wait=wait_exponential(multiplier=1, min=4, max=10),`
			`retry=retry_if_exception_type(`
			`(RateLimitError, APIConnectionError, APITimeoutError, InvalidResponseError)`
			`),`
			`)`
			`async def anthropic_complete_if_cache(`
			`model: str,`
			`prompt: str,`
			`system_prompt: str \| None = None,`
			`history_messages: list[dict[str, Any]] \| None = None,`
			`base_url: str \| None = None,`
			`api_key: str \| None = None,`
			`**kwargs: Any,`
			`) -> Union[str, AsyncIterator[str]]:`
			`if history_messages is None:`
			`history_messages = []`
			`if not api_key:`
			`api_key = os.environ.get("ANTHROPIC_API_KEY")`

			`default_headers = {`
			`"User-Agent": f"Mozilla/5.0 (Macintosh; Intel Mac OS X 10_15_8) LightRAG/{__api_version__}",`
			`"Content-Type": "application/json",`
			`}`

			`# Set logger level to INFO when VERBOSE_DEBUG is off`
			`if not VERBOSE_DEBUG and logger.level == logging.DEBUG:`
			`logging.getLogger("anthropic").setLevel(logging.INFO)`

			`anthropic_async_client = (`
			`AsyncAnthropic(default_headers=default_headers, api_key=api_key)`
			`if base_url is None`
			`else AsyncAnthropic(`
			`base_url=base_url, default_headers=default_headers, api_key=api_key`
			`)`
			`)`
			`kwargs.pop("hashing_kv", None)`
			`messages: list[dict[str, Any]] = []`
			`if system_prompt:`
			`messages.append({"role": "system", "content": system_prompt})`
			`messages.extend(history_messages)`
			`messages.append({"role": "user", "content": prompt})`

			`logger.debug("===== Sending Query to Anthropic LLM =====")`
			`logger.debug(f"Model: {model} Base URL: {base_url}")`
			`logger.debug(f"Additional kwargs: {kwargs}")`
			`verbose_debug(f"Query: {prompt}")`
			`verbose_debug(f"System prompt: {system_prompt}")`

			`try:`
			`response = await anthropic_async_client.messages.create(`
Update webui assets 2025-03-22 00:36:38 +08:00			`model=model, messages=messages, stream=True, **kwargs`
Create anthropic.py 2025-03-17 10:21:01 +01:00			`)`
			`except APIConnectionError as e:`
			`logger.error(f"Anthropic API Connection Error: {e}")`
			`raise`
			`except RateLimitError as e:`
			`logger.error(f"Anthropic API Rate Limit Error: {e}")`
			`raise`
			`except APITimeoutError as e:`
			`logger.error(f"Anthropic API Timeout Error: {e}")`
			`raise`
			`except Exception as e:`
			`logger.error(`
			`f"Anthropic API Call Failed,\nModel: {model},\nParams: {kwargs}, Got: {e}"`
			`)`
			`raise`

			`async def stream_response():`
			`try:`
			`async for event in response:`
Update webui assets 2025-03-22 00:36:38 +08:00			`content = (`
			`event.delta.text`
			`if hasattr(event, "delta") and event.delta.text`
			`else None`
			`)`
Create anthropic.py 2025-03-17 10:21:01 +01:00			`if content is None:`
			`continue`
			`if r"\u" in content:`
			`content = safe_unicode_decode(content.encode("utf-8"))`
			`yield content`
			`except Exception as e:`
			`logger.error(f"Error in stream response: {str(e)}")`
			`raise`

			`return stream_response()`

Update webui assets 2025-03-22 00:36:38 +08:00
Create anthropic.py 2025-03-17 10:21:01 +01:00			`# Generic Anthropic completion function`
			`async def anthropic_complete(`
			`prompt: str,`
			`system_prompt: str \| None = None,`
			`history_messages: list[dict[str, Any]] \| None = None,`
			`**kwargs: Any,`
			`) -> Union[str, AsyncIterator[str]]:`
			`if history_messages is None:`
			`history_messages = []`
			`model_name = kwargs["hashing_kv"].global_config["llm_model_name"]`
			`return await anthropic_complete_if_cache(`
			`model_name,`
			`prompt,`
			`system_prompt=system_prompt,`
			`history_messages=history_messages,`
			`**kwargs,`
			`)`

Update webui assets 2025-03-22 00:36:38 +08:00
Create anthropic.py 2025-03-17 10:21:01 +01:00			`# Claude 3 Opus specific completion`
			`async def claude_3_opus_complete(`
			`prompt: str,`
			`system_prompt: str \| None = None,`
			`history_messages: list[dict[str, Any]] \| None = None,`
			`**kwargs: Any,`
			`) -> Union[str, AsyncIterator[str]]:`
			`if history_messages is None:`
			`history_messages = []`
			`return await anthropic_complete_if_cache(`
			`"claude-3-opus-20240229",`
			`prompt,`
			`system_prompt=system_prompt,`
			`history_messages=history_messages,`
			`**kwargs,`
			`)`

Update webui assets 2025-03-22 00:36:38 +08:00
Create anthropic.py 2025-03-17 10:21:01 +01:00			`# Claude 3 Sonnet specific completion`
			`async def claude_3_sonnet_complete(`
			`prompt: str,`
			`system_prompt: str \| None = None,`
			`history_messages: list[dict[str, Any]] \| None = None,`
			`**kwargs: Any,`
			`) -> Union[str, AsyncIterator[str]]:`
			`if history_messages is None:`
			`history_messages = []`
			`return await anthropic_complete_if_cache(`
			`"claude-3-sonnet-20240229",`
			`prompt,`
			`system_prompt=system_prompt,`
			`history_messages=history_messages,`
			`**kwargs,`
			`)`

Update webui assets 2025-03-22 00:36:38 +08:00
Create anthropic.py 2025-03-17 10:21:01 +01:00			`# Claude 3 Haiku specific completion`
			`async def claude_3_haiku_complete(`
			`prompt: str,`
			`system_prompt: str \| None = None,`
			`history_messages: list[dict[str, Any]] \| None = None,`
			`**kwargs: Any,`
			`) -> Union[str, AsyncIterator[str]]:`
			`if history_messages is None:`
			`history_messages = []`
			`return await anthropic_complete_if_cache(`
			`"claude-3-haiku-20240307",`
			`prompt,`
			`system_prompt=system_prompt,`
			`history_messages=history_messages,`
			`**kwargs,`
			`)`

Update webui assets 2025-03-22 00:36:38 +08:00
Create anthropic.py 2025-03-17 10:21:01 +01:00			`# Embedding function (placeholder, as Anthropic does not provide embeddings)`
			`@retry(`
			`stop=stop_after_attempt(3),`
			`wait=wait_exponential(multiplier=1, min=4, max=60),`
			`retry=retry_if_exception_type(`
			`(RateLimitError, APIConnectionError, APITimeoutError)`
			`),`
			`)`
			`async def anthropic_embed(`
			`texts: list[str],`
			`model: str = "voyage-3", # Default to voyage-3 as a good general-purpose model`
			`base_url: str = None,`
			`api_key: str = None,`
			`) -> np.ndarray:`
			`"""`
			`Generate embeddings using Voyage AI since Anthropic doesn't provide native embedding support.`
Update webui assets 2025-03-22 00:36:38 +08:00
Create anthropic.py 2025-03-17 10:21:01 +01:00			`Args:`
			`texts: List of text strings to embed`
			`model: Voyage AI model name (e.g., "voyage-3", "voyage-3-large", "voyage-code-3")`
			`base_url: Optional custom base URL (not used for Voyage AI)`
			`api_key: API key for Voyage AI (defaults to VOYAGE_API_KEY environment variable)`
Update webui assets 2025-03-22 00:36:38 +08:00
Create anthropic.py 2025-03-17 10:21:01 +01:00			`Returns:`
			`numpy array of shape (len(texts), embedding_dimension) containing the embeddings`
			`"""`
			`if not api_key:`
			`api_key = os.environ.get("VOYAGE_API_KEY")`
			`if not api_key:`
			`logger.error("VOYAGE_API_KEY environment variable not set")`
Update webui assets 2025-03-22 00:36:38 +08:00			`raise ValueError(`
			`"VOYAGE_API_KEY environment variable is required for embeddings"`
			`)`
Create anthropic.py 2025-03-17 10:21:01 +01:00
			`try:`
			`# Initialize Voyage AI client`
			`voyage_client = voyageai.Client(api_key=api_key)`
Update webui assets 2025-03-22 00:36:38 +08:00
Create anthropic.py 2025-03-17 10:21:01 +01:00			`# Get embeddings`
			`result = voyage_client.embed(`
			`texts,`
			`model=model,`
Update webui assets 2025-03-22 00:36:38 +08:00			`input_type="document", # Assuming document context; could be made configurable`
Create anthropic.py 2025-03-17 10:21:01 +01:00			`)`
Update webui assets 2025-03-22 00:36:38 +08:00
Create anthropic.py 2025-03-17 10:21:01 +01:00			`# Convert list of embeddings to numpy array`
			`embeddings = np.array(result.embeddings, dtype=np.float32)`
Update webui assets 2025-03-22 00:36:38 +08:00
Create anthropic.py 2025-03-17 10:21:01 +01:00			`logger.debug(f"Generated embeddings for {len(texts)} texts using {model}")`
			`verbose_debug(f"Embedding shape: {embeddings.shape}")`
Update webui assets 2025-03-22 00:36:38 +08:00
Create anthropic.py 2025-03-17 10:21:01 +01:00			`return embeddings`

			`except Exception as e:`
			`logger.error(f"Voyage AI embedding failed: {str(e)}")`
			`raise`

Update webui assets 2025-03-22 00:36:38 +08:00
Create anthropic.py 2025-03-17 10:21:01 +01:00			`# Optional: a helper function to get available embedding models`
			`def get_available_embedding_models() -> dict[str, dict]:`
			`"""`
			`Returns a dictionary of available Voyage AI embedding models and their properties.`
			`"""`
			`return {`
Update webui assets 2025-03-22 00:36:38 +08:00			`"voyage-3-large": {`
			`"context_length": 32000,`
			`"dimension": 1024,`
			`"description": "Best general-purpose and multilingual",`
			`},`
			`"voyage-3": {`
			`"context_length": 32000,`
			`"dimension": 1024,`
			`"description": "General-purpose and multilingual",`
			`},`
			`"voyage-3-lite": {`
			`"context_length": 32000,`
			`"dimension": 512,`
			`"description": "Optimized for latency and cost",`
			`},`
			`"voyage-code-3": {`
			`"context_length": 32000,`
			`"dimension": 1024,`
			`"description": "Optimized for code",`
			`},`
			`"voyage-finance-2": {`
			`"context_length": 32000,`
			`"dimension": 1024,`
			`"description": "Optimized for finance",`
			`},`
			`"voyage-law-2": {`
			`"context_length": 16000,`
			`"dimension": 1024,`
			`"description": "Optimized for legal",`
			`},`
			`"voyage-multimodal-3": {`
			`"context_length": 32000,`
			`"dimension": 1024,`
			`"description": "Multimodal text and images",`
			`},`
Create anthropic.py 2025-03-17 10:21:01 +01:00			`}`