
import json
import logging
import os
from dataclasses import asdict
from datetime import datetime
from typing import Any, Dict, List, Literal
from agnext.application.logging.events import LLMCallEvent
from agnext.components import Image
from agnext.components.models import (
AzureOpenAIChatCompletionClient,
ChatCompletionClient,
ModelCapabilities,
OpenAIChatCompletionClient,
)
from .messages import (
AssistantContent,
FunctionExecutionContent,
OrchestrationEvent,
SystemContent,
UserContent,
WebSurferEvent,
)
# Name of the environment variable selecting the provider ("openai" or "azure"; defaults to "openai")
ENVIRON_KEY_CHAT_COMPLETION_PROVIDER = "CHAT_COMPLETION_PROVIDER"
# Name of the environment variable holding a JSON object of ChatCompletionClient kwargs
ENVIRON_KEY_CHAT_COMPLETION_KWARGS_JSON = "CHAT_COMPLETION_KWARGS_JSON"
# The singleton _default_azure_ad_token_provider, which will be created if needed
# (lazily, on first Azure request that asks for the 'DEFAULT' token provider)
_default_azure_ad_token_provider = None
# Create a model client based on information provided in environment variables.
def create_completion_client_from_env(env: Dict[str, str] | None = None, **kwargs: Any) -> ChatCompletionClient:
global _default_azure_ad_token_provider
"""
Create a model client based on information provided in environment variables.
env (Optional): When provied, read from this dictionary rather than os.environ
kwargs**: ChatClient arguments to override (e.g., model)
NOTE: If 'azure_ad_token_provider' is included, and euquals the string 'DEFAULT' then replace it with
azure.identity.get_bearer_token_provider(DefaultAzureCredential(), "https://cognitiveservices.azure.com/.default")
"""
# If a dictionary was not provided, load it from the environment
if env is None:
env = dict()
env.update(os.environ)
# Load the kwargs, and override with provided kwargs
_kwargs = json.loads(env.get(ENVIRON_KEY_CHAT_COMPLETION_KWARGS_JSON, "{}"))
_kwargs.update(kwargs)
# If model capabilities were provided, deserialize them as well
if "model_capabilities" in _kwargs:
_kwargs["model_capabilities"] = ModelCapabilities(
vision=_kwargs["model_capabilities"].get("vision"),
function_calling=_kwargs["model_capabilities"].get("function_calling"),
json_output=_kwargs["model_capabilities"].get("json_output"),
)
# Figure out what provider we are using. Default to OpenAI
_provider = env.get(ENVIRON_KEY_CHAT_COMPLETION_PROVIDER, "openai").lower().strip()
# Instantiate the correct client
if _provider == "openai":
return OpenAIChatCompletionClient(**_kwargs)
elif _provider == "azure":
if _kwargs.get("azure_ad_token_provider", "").lower() == "default":
if _default_azure_ad_token_provider is None:
from azure.identity import DefaultAzureCredential, get_bearer_token_provider
_default_azure_ad_token_provider = get_bearer_token_provider(
DefaultAzureCredential(), "https://cognitiveservices.azure.com/.default"
)
_kwargs["azure_ad_token_provider"] = _default_azure_ad_token_provider
return AzureOpenAIChatCompletionClient(**_kwargs)
else:
raise ValueError(f"Unknown OAI provider '{_provider}'")
# Convert UserContent to a string
def message_content_to_str(
    message_content: "UserContent | AssistantContent | SystemContent | FunctionExecutionContent",
) -> str:
    """Convert a message content payload to a plain string.

    A plain string is returned unchanged. A list is flattened to one line per
    item: strings are right-stripped, Image objects are rendered as the
    placeholder "<Image>", and anything else is str()-ified and right-stripped.

    Raises:
        AssertionError: If the content is neither a string nor a list.
    """
    if isinstance(message_content, str):
        return message_content
    # isinstance must use the builtin `list`, not typing.List (deprecated as a runtime class)
    elif isinstance(message_content, list):
        converted: List[str] = []
        for item in message_content:
            if isinstance(item, str):
                converted.append(item.rstrip())
            elif isinstance(item, Image):
                converted.append("<Image>")
            else:
                converted.append(str(item).rstrip())
        return "\n".join(converted)
    else:
        raise AssertionError("Unexpected response type.")
# TeamOne log event handler
class LogHandler(logging.FileHandler):
    """A logging.FileHandler that persists TeamOne events as JSON lines.

    Recognized record payloads (OrchestrationEvent, WebSurferEvent,
    LLMCallEvent) are serialized to one JSON object per line in the log file;
    Orchestration and WebSurfer events are additionally echoed to the console
    with ANSI coloring. Records whose msg is not one of these event types are
    silently dropped (this handler only logs TeamOne events).
    """

    def __init__(self, filename: str = "log.jsonl") -> None:
        super().__init__(filename)

    def emit(self, record: logging.LogRecord) -> None:
        """Serialize a recognized event record to JSON and emit it to the file."""
        try:
            ts = datetime.fromtimestamp(record.created).isoformat()
            # The branches are mutually exclusive, so chain them with elif.
            if isinstance(record.msg, OrchestrationEvent):
                console_message = (
                    f"\n{'-'*75} \n" f"\033[91m[{ts}], {record.msg.source}:\033[0m\n" f"\n{record.msg.message}"
                )
                print(console_message, flush=True)
                # Replace the event object with its JSON form before delegating to FileHandler
                record.msg = json.dumps(
                    {
                        "timestamp": ts,
                        "source": record.msg.source,
                        "message": record.msg.message,
                        "type": "OrchestrationEvent",
                    }
                )
                super().emit(record)
            elif isinstance(record.msg, WebSurferEvent):
                console_message = f"\033[96m[{ts}], {record.msg.source}: {record.msg.message}\033[0m"
                print(console_message, flush=True)
                payload: Dict[str, Any] = {
                    "timestamp": ts,
                    "type": "WebSurferEvent",
                }
                # WebSurferEvent is a dataclass; flatten all of its fields into the payload
                payload.update(asdict(record.msg))
                record.msg = json.dumps(payload)
                super().emit(record)
            elif isinstance(record.msg, LLMCallEvent):
                record.msg = json.dumps(
                    {
                        "timestamp": ts,
                        "prompt_tokens": record.msg.prompt_tokens,
                        "completion_tokens": record.msg.completion_tokens,
                        "type": "LLMCallEvent",
                    }
                )
                super().emit(record)
        except Exception:
            # Standard logging-handler convention: never let logging errors propagate
            self.handleError(record)
class SentinelMeta(type):
    """Metaclass for sentinel classes that cooperate with type hints.

    Declare a new sentinel like this:
    ```
    class MY_DEFAULT(metaclass=SentinelMeta):
        pass
    foo: list[str] | None | type[MY_DEFAULT] = MY_DEFAULT
    ```
    Sentinel classes are always falsy and display as "<Name>".
    Reference: https://stackoverflow.com/questions/69239403/type-hinting-parameters-with-a-sentinel-value-as-the-default
    """

    def __repr__(cls) -> str:
        # Show the sentinel as "<ClassName>" instead of the default class repr.
        return "<" + cls.__name__ + ">"

    def __bool__(cls) -> Literal[False]:
        # Sentinels are falsy, so `if not value:` treats them like None/empty.
        return False