autogen/python/packages/agbench/benchmarks/GAIA/Templates/SelectorGroupChat/scenario.py

import asyncio
import os
import yaml
import warnings
from typing import Sequence
from autogen_ext.agents.magentic_one import MagenticOneCoderAgent
from autogen_agentchat.teams import SelectorGroupChat
from autogen_agentchat.conditions import MaxMessageTermination
from autogen_agentchat.ui import Console
from autogen_agentchat.utils import content_to_str
from autogen_core.models import ModelFamily
from autogen_ext.code_executors.local import LocalCommandLineCodeExecutor
from autogen_agentchat.conditions import TextMentionTermination
from autogen_agentchat.base import TerminationCondition, TerminatedException
from autogen_core.models import ChatCompletionClient
from autogen_ext.agents.web_surfer import MultimodalWebSurfer
from autogen_ext.agents.file_surfer import FileSurfer
from autogen_agentchat.agents import CodeExecutorAgent
from autogen_agentchat.messages import TextMessage, BaseAgentEvent, BaseChatMessage, HandoffMessage, MultiModalMessage, StopMessage
from autogen_core.models import LLMMessage, UserMessage, AssistantMessage

# Suppress warnings about the requests.Session() not being closed
warnings.filterwarnings(action="ignore", message="unclosed", category=ResourceWarning)

async def main() -> None:

    # Load model configuration and create the model client.
    with open("config.yaml", "r") as f:
        config = yaml.safe_load(f)

    orchestrator_client = ChatCompletionClient.load_component(config["orchestrator_client"])
    coder_client = ChatCompletionClient.load_component(config["coder_client"])
    web_surfer_client = ChatCompletionClient.load_component(config["web_surfer_client"])
    file_surfer_client = ChatCompletionClient.load_component(config["file_surfer_client"])
    
    # Read the prompt
    prompt = ""
    with open("prompt.txt", "rt") as fh:
        prompt = fh.read().strip()
    filename = "__FILE_NAME__".strip()

    # Set up the team
    coder = MagenticOneCoderAgent(
        "Assistant",
        model_client = coder_client,
    )

    executor = CodeExecutorAgent("ComputerTerminal", code_executor=LocalCommandLineCodeExecutor())

    file_surfer = FileSurfer(
        name="FileSurfer",
        model_client = file_surfer_client,
    )
                
    web_surfer = MultimodalWebSurfer(
        name="WebSurfer",
        model_client = web_surfer_client,
        downloads_folder=os.getcwd(),
        debug_dir="logs",
        to_save_screenshots=True,
    )

    # Prepare the prompt
    filename_prompt = ""
    if len(filename) > 0:
        filename_prompt = f"The question is about a file, document or image, which can be accessed by the filename '{filename}' in the current working directory."
    task = f"{prompt}\n\n{filename_prompt}"

    # Termination conditions
    max_messages_termination = MaxMessageTermination(max_messages=20)
    llm_termination = LLMTermination(
        prompt=f"""Consider the following task:
{task.strip()}

Does the above conversation suggest that the task has been solved?
If so, reply "TERMINATE", otherwise reply "CONTINUE"
""",
        model_client=orchestrator_client
    )

    termination = max_messages_termination | llm_termination

    # Create the team
    team = SelectorGroupChat(
        [coder, executor, file_surfer, web_surfer],
        model_client=orchestrator_client,
        termination_condition=termination,
    )

    # Run the task
    stream = team.run_stream(task=task.strip())
    result = await Console(stream)

    # Do one more inference to format the results
    final_context: Sequence[LLMMessage] = []
    for message in result.messages:
        if isinstance(message, TextMessage):
            final_context.append(UserMessage(content=message.content, source=message.source))
        elif isinstance(message, MultiModalMessage):
            if orchestrator_client.model_info["vision"]:
                final_context.append(UserMessage(content=message.content, source=message.source))
            else:
                final_context.append(UserMessage(content=content_to_str(message.content), source=message.source))
    final_context.append(UserMessage(
        content=f"""We have completed the following task:
{prompt}

The above messages contain the conversation that took place to complete the task.
Read the above conversation and output a FINAL ANSWER to the question.
To output the final answer, use the following template: FINAL ANSWER: [YOUR FINAL ANSWER]
Your FINAL ANSWER should be a number OR as few words as possible OR a comma separated list of numbers and/or strings.
ADDITIONALLY, your FINAL ANSWER MUST adhere to any formatting instructions specified in the original question (e.g., alphabetization, sequencing, units, rounding, decimal places, etc.)
If you are asked for a number, express it numerically (i.e., with digits rather than words), don't use commas, and don't include units such as $ or percent signs unless specified otherwise.
If you are asked for a string, don't use articles or abbreviations (e.g. for cities), unless specified otherwise. Don't output any final sentence punctuation such as '.', '!', or '?'.
If you are asked for a comma separated list, apply the above rules depending on whether the elements are numbers or strings.
#""".strip(),
        source="user"))

    # Call the model to evaluate
    response = await orchestrator_client.create(final_context)
    print(response.content, flush=True)


class LLMTermination(TerminationCondition):
    """Terminate the conversation if an LLM determines the task is complete.

    Args:
        prompt: The prompt to evaluate in the llm
        model_client: The LLM model_client to use
        termination_phrase: The phrase to look for in the LLM output to trigger termination
    """

    def __init__(self, prompt: str, model_client: ChatCompletionClient, termination_phrase: str = "TERMINATE") -> None:
        self._prompt = prompt
        self._model_client = model_client
        self._termination_phrase = termination_phrase
        self._terminated = False
        self._context: Sequence[LLMMessage] = []

    @property
    def terminated(self) -> bool:
        return self._terminated

    async def __call__(self, messages: Sequence[BaseAgentEvent | BaseChatMessage]) -> StopMessage | None:
        if self._terminated:
            raise TerminatedException("Termination condition has already been reached")

        # Build the context
        for message in messages:
            if isinstance(message, TextMessage):
                self._context.append(UserMessage(content=message.content, source=message.source))
            elif isinstance(message, MultiModalMessage):
                if self._model_client.model_info["vision"]:
                    self._context.append(UserMessage(content=message.content, source=message.source))
                else:
                    self._context.append(UserMessage(content=content_to_str(message.content), source=message.source))

        if len(self._context) == 0:
            return None

        # Call the model to evaluate
        response = await self._model_client.create(self._context + [UserMessage(content=self._prompt, source="user")]) 

        # Check for termination
        if isinstance(message.content, str) and self._termination_phrase in response.content:
            self._terminated = True
            return StopMessage(content=message.content, source="LLMTermination")
        return None

    async def reset(self) -> None:
        self._terminated = False
        self._context = []


if __name__ == "__main__":
    asyncio.run(main())
Significant updates to agbench. (#5313) - Updated HumanEval template to use AgentChat - Update templates to use config.yaml for model and other configuration - Read environment from ENV.yaml (ENV.json still supported but deprecated) - Temporarily removed WebArena and AssistantBench. Neither had viable Templates after `autogen_magentic_one` was removed. Templates need to be update to AgentChat (in a future PR, but this PR is getting big enough already) 2025-02-07 10:01:44 -08:00			`import asyncio`
			`import os`
			`import yaml`
			`import warnings`
			`from typing import Sequence`
			`from autogen_ext.agents.magentic_one import MagenticOneCoderAgent`
			`from autogen_agentchat.teams import SelectorGroupChat`
			`from autogen_agentchat.conditions import MaxMessageTermination`
			`from autogen_agentchat.ui import Console`
			`from autogen_agentchat.utils import content_to_str`
			`from autogen_core.models import ModelFamily`
			`from autogen_ext.code_executors.local import LocalCommandLineCodeExecutor`
			`from autogen_agentchat.conditions import TextMentionTermination`
			`from autogen_agentchat.base import TerminationCondition, TerminatedException`
			`from autogen_core.models import ChatCompletionClient`
			`from autogen_ext.agents.web_surfer import MultimodalWebSurfer`
			`from autogen_ext.agents.file_surfer import FileSurfer`
			`from autogen_agentchat.agents import CodeExecutorAgent`
Rename to use BaseChatMessage and BaseAgentEvent. Bring back union types. (#6144) Rename the `ChatMessage` and `AgentEvent` base classes to `BaseChatMessage` and `BaseAgentEvent`. Bring back the `ChatMessage` and `AgentEvent` as union of built-in concrete types to avoid breaking existing applications that depends on Pydantic serialization. Why? Many existing code uses containers like this: ```python class AppMessage(BaseModel): name: str message: ChatMessage # Serialization is this: m = AppMessage(...) m.model_dump_json() # Fields like HandoffMessage.target will be lost because it is now treated as a base class without content or target fields. ``` The assumption on `ChatMessage` or `AgentEvent` to be a union of concrete types could be in many existing code bases. So this PR brings back the union types, while keep method type hints such as those on `on_messages` to use the `BaseChatMessage` and `BaseAgentEvent` base classes for flexibility. 2025-03-30 09:34:40 -07:00			`from autogen_agentchat.messages import TextMessage, BaseAgentEvent, BaseChatMessage, HandoffMessage, MultiModalMessage, StopMessage`
Significant updates to agbench. (#5313) - Updated HumanEval template to use AgentChat - Update templates to use config.yaml for model and other configuration - Read environment from ENV.yaml (ENV.json still supported but deprecated) - Temporarily removed WebArena and AssistantBench. Neither had viable Templates after `autogen_magentic_one` was removed. Templates need to be update to AgentChat (in a future PR, but this PR is getting big enough already) 2025-02-07 10:01:44 -08:00			`from autogen_core.models import LLMMessage, UserMessage, AssistantMessage`

			`# Suppress warnings about the requests.Session() not being closed`
			`warnings.filterwarnings(action="ignore", message="unclosed", category=ResourceWarning)`

			`async def main() -> None:`

			`# Load model configuration and create the model client.`
			`with open("config.yaml", "r") as f:`
			`config = yaml.safe_load(f)`

			`orchestrator_client = ChatCompletionClient.load_component(config["orchestrator_client"])`
			`coder_client = ChatCompletionClient.load_component(config["coder_client"])`
			`web_surfer_client = ChatCompletionClient.load_component(config["web_surfer_client"])`
			`file_surfer_client = ChatCompletionClient.load_component(config["file_surfer_client"])`

			`# Read the prompt`
			`prompt = ""`
			`with open("prompt.txt", "rt") as fh:`
			`prompt = fh.read().strip()`
			`filename = "__FILE_NAME__".strip()`

			`# Set up the team`
			`coder = MagenticOneCoderAgent(`
			`"Assistant",`
			`model_client = coder_client,`
			`)`

			`executor = CodeExecutorAgent("ComputerTerminal", code_executor=LocalCommandLineCodeExecutor())`

			`file_surfer = FileSurfer(`
			`name="FileSurfer",`
			`model_client = file_surfer_client,`
			`)`

			`web_surfer = MultimodalWebSurfer(`
			`name="WebSurfer",`
			`model_client = web_surfer_client,`
			`downloads_folder=os.getcwd(),`
			`debug_dir="logs",`
			`to_save_screenshots=True,`
			`)`

			`# Prepare the prompt`
			`filename_prompt = ""`
			`if len(filename) > 0:`
			`filename_prompt = f"The question is about a file, document or image, which can be accessed by the filename '{filename}' in the current working directory."`
			`task = f"{prompt}\n\n{filename_prompt}"`

			`# Termination conditions`
			`max_messages_termination = MaxMessageTermination(max_messages=20)`
			`llm_termination = LLMTermination(`
			`prompt=f"""Consider the following task:`
			`{task.strip()}`

			`Does the above conversation suggest that the task has been solved?`
			`If so, reply "TERMINATE", otherwise reply "CONTINUE"`
			`""",`
			`model_client=orchestrator_client`
			`)`

			`termination = max_messages_termination \| llm_termination`

			`# Create the team`
			`team = SelectorGroupChat(`
			`[coder, executor, file_surfer, web_surfer],`
			`model_client=orchestrator_client,`
			`termination_condition=termination,`
			`)`

			`# Run the task`
			`stream = team.run_stream(task=task.strip())`
			`result = await Console(stream)`

			`# Do one more inference to format the results`
			`final_context: Sequence[LLMMessage] = []`
			`for message in result.messages:`
			`if isinstance(message, TextMessage):`
			`final_context.append(UserMessage(content=message.content, source=message.source))`
			`elif isinstance(message, MultiModalMessage):`
			`if orchestrator_client.model_info["vision"]:`
			`final_context.append(UserMessage(content=message.content, source=message.source))`
			`else:`
			`final_context.append(UserMessage(content=content_to_str(message.content), source=message.source))`
			`final_context.append(UserMessage(`
			`content=f"""We have completed the following task:`
			`{prompt}`

			`The above messages contain the conversation that took place to complete the task.`
			`Read the above conversation and output a FINAL ANSWER to the question.`
			`To output the final answer, use the following template: FINAL ANSWER: [YOUR FINAL ANSWER]`
			`Your FINAL ANSWER should be a number OR as few words as possible OR a comma separated list of numbers and/or strings.`
			`ADDITIONALLY, your FINAL ANSWER MUST adhere to any formatting instructions specified in the original question (e.g., alphabetization, sequencing, units, rounding, decimal places, etc.)`
			`If you are asked for a number, express it numerically (i.e., with digits rather than words), don't use commas, and don't include units such as $ or percent signs unless specified otherwise.`
			`If you are asked for a string, don't use articles or abbreviations (e.g. for cities), unless specified otherwise. Don't output any final sentence punctuation such as '.', '!', or '?'.`
			`If you are asked for a comma separated list, apply the above rules depending on whether the elements are numbers or strings.`
			`#""".strip(),`
			`source="user"))`

			`# Call the model to evaluate`
			`response = await orchestrator_client.create(final_context)`
			`print(response.content, flush=True)`


			`class LLMTermination(TerminationCondition):`
			`"""Terminate the conversation if an LLM determines the task is complete.`

			`Args:`
			`prompt: The prompt to evaluate in the llm`
			`model_client: The LLM model_client to use`
			`termination_phrase: The phrase to look for in the LLM output to trigger termination`
			`"""`

			`def __init__(self, prompt: str, model_client: ChatCompletionClient, termination_phrase: str = "TERMINATE") -> None:`
			`self._prompt = prompt`
			`self._model_client = model_client`
			`self._termination_phrase = termination_phrase`
			`self._terminated = False`
			`self._context: Sequence[LLMMessage] = []`

			`@property`
			`def terminated(self) -> bool:`
			`return self._terminated`

Rename to use BaseChatMessage and BaseAgentEvent. Bring back union types. (#6144) Rename the `ChatMessage` and `AgentEvent` base classes to `BaseChatMessage` and `BaseAgentEvent`. Bring back the `ChatMessage` and `AgentEvent` as union of built-in concrete types to avoid breaking existing applications that depends on Pydantic serialization. Why? Many existing code uses containers like this: ```python class AppMessage(BaseModel): name: str message: ChatMessage # Serialization is this: m = AppMessage(...) m.model_dump_json() # Fields like HandoffMessage.target will be lost because it is now treated as a base class without content or target fields. ``` The assumption on `ChatMessage` or `AgentEvent` to be a union of concrete types could be in many existing code bases. So this PR brings back the union types, while keep method type hints such as those on `on_messages` to use the `BaseChatMessage` and `BaseAgentEvent` base classes for flexibility. 2025-03-30 09:34:40 -07:00			`async def __call__(self, messages: Sequence[BaseAgentEvent \| BaseChatMessage]) -> StopMessage \| None:`
Significant updates to agbench. (#5313) - Updated HumanEval template to use AgentChat - Update templates to use config.yaml for model and other configuration - Read environment from ENV.yaml (ENV.json still supported but deprecated) - Temporarily removed WebArena and AssistantBench. Neither had viable Templates after `autogen_magentic_one` was removed. Templates need to be update to AgentChat (in a future PR, but this PR is getting big enough already) 2025-02-07 10:01:44 -08:00			`if self._terminated:`
			`raise TerminatedException("Termination condition has already been reached")`

			`# Build the context`
			`for message in messages:`
			`if isinstance(message, TextMessage):`
			`self._context.append(UserMessage(content=message.content, source=message.source))`
			`elif isinstance(message, MultiModalMessage):`
			`if self._model_client.model_info["vision"]:`
			`self._context.append(UserMessage(content=message.content, source=message.source))`
			`else:`
			`self._context.append(UserMessage(content=content_to_str(message.content), source=message.source))`

			`if len(self._context) == 0:`
			`return None`

			`# Call the model to evaluate`
			`response = await self._model_client.create(self._context + [UserMessage(content=self._prompt, source="user")])`

			`# Check for termination`
			`if isinstance(message.content, str) and self._termination_phrase in response.content:`
			`self._terminated = True`
			`return StopMessage(content=message.content, source="LLMTermination")`
			`return None`

			`async def reset(self) -> None:`
			`self._terminated = False`
			`self._context = []`


			`if __name__ == "__main__":`
			`asyncio.run(main())`