Mirror of https://github.com/getzep/graphiti.git (synced 2025-07-25 01:49:57 +00:00)
64 lines · 2.1 KiB · Python
"""
|
||
|
Copyright 2024, Zep Software, Inc.
|
||
|
|
||
|
Licensed under the Apache License, Version 2.0 (the "License");
|
||
|
you may not use this file except in compliance with the License.
|
||
|
You may obtain a copy of the License at
|
||
|
|
||
|
http://www.apache.org/licenses/LICENSE-2.0
|
||
|
|
||
|
Unless required by applicable law or agreed to in writing, software
|
||
|
distributed under the License is distributed on an "AS IS" BASIS,
|
||
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||
|
See the License for the specific language governing permissions and
|
||
|
limitations under the License.
|
||
|
"""
|
||
|

import json
import logging
import typing

from groq import AsyncGroq
from groq.types.chat import ChatCompletionMessageParam
from openai import AsyncOpenAI

from ..prompts.models import Message
from .client import LLMClient
from .config import LLMConfig

logger = logging.getLogger(__name__)


class GroqClient(LLMClient):
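    # Editorial note: this class adapts Groq's OpenAI-compatible chat
    # completions API to the LLMClient interface; embeddings are delegated
    # to OpenAI via get_embedder below.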
    def __init__(self, config: LLMConfig | None = None):
        if config is None:
            config = LLMConfig()
        self.client = AsyncGroq(api_key=config.api_key)
        self.model = config.model

    def get_embedder(self) -> typing.Any:
        # Embeddings are served by OpenAI rather than Groq; AsyncOpenAI()
        # with no arguments reads OPENAI_API_KEY from the environment.
        openai_client = AsyncOpenAI()
        return openai_client.embeddings
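
    # Editorial note: the request below enables Groq's JSON mode
    # (response_format={'type': 'json_object'}), so prompts are expected to
    # ask for JSON output; the raw completion text is parsed with json.loads.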
    async def generate_response(self, messages: list[Message]) -> dict[str, typing.Any]:
        openai_messages: list[ChatCompletionMessageParam] = []
        for m in messages:
            if m.role == 'user':
                openai_messages.append({'role': 'user', 'content': m.content})
            elif m.role == 'system':
                openai_messages.append({'role': 'system', 'content': m.content})
        try:
            response = await self.client.chat.completions.create(
                # Prefer the configured model; fall back to the previously
                # hardcoded default when none was set.
                model=self.model or 'llama-3.1-70b-versatile',
                messages=openai_messages,
                temperature=0.0,
                max_tokens=4096,
                response_format={'type': 'json_object'},
            )
            result = response.choices[0].message.content or ''
            return json.loads(result)
        except Exception as e:
            logger.debug(f'Failing input messages: {openai_messages}')
            logger.error(f'Error in generating LLM response: {e}')
            raise
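

# Usage sketch (editorial, not part of the mirrored file): assumes LLMConfig
# accepts an api_key and that Message is constructed with 'role' and
# 'content' fields, as the conversion loop above implies.
#
#     import asyncio
#
#     async def main() -> None:
#         client = GroqClient(LLMConfig(api_key='gsk-...'))
#         data = await client.generate_response(
#             [
#                 Message(role='system', content='Respond with a JSON object.'),
#                 Message(role='user', content='List three graph databases.'),
#             ]
#         )
#         print(data)
#
#     asyncio.run(main())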