mirror of
https://github.com/microsoft/autogen.git
synced 2025-07-04 07:26:28 +00:00

_(EXPERIMENTAL, RESEARCH IN PROGRESS)_ In 2023 AutoGen introduced [Teachable Agents](https://microsoft.github.io/autogen/0.2/blog/2023/10/26/TeachableAgent/) that users could teach new facts, preferences and skills. But teachable agents were limited in several ways: They could only be `ConversableAgent` subclasses, they couldn't learn a new skill unless the user stated (in a single turn) both the task and how to solve it, and they couldn't learn on their own. **Task-Centric Memory** overcomes these limitations, allowing users to teach arbitrary agents (or teams) more flexibly and reliably, and enabling agents to learn from their own trial-and-error experiences. This PR is large and complex. All of the files are new, and most of the added components depend on the others to run at all. But the review process can be accelerated if approached in the following order. 1. Start with the [Task-Centric Memory README](https://github.com/microsoft/autogen/tree/agentic_memory/python/packages/autogen-ext/src/autogen_ext/task_centric_memory). 1. Install the memory extension locally, since it won't be in pypi until it's merged. In the `agentic_memory` branch, and the `python/packages` directory: - `pip install -e autogen-agentchat` - `pip install -e autogen-ext[openai]` - `pip install -e autogen-ext[task-centric-memory]` 2. Run the Quickstart sample code, then immediately open the `./pagelogs/quick/0 Call Tree.html` file in a browser to view the work in progress. 3. Click through the web page links to see the details. 2. Continue through the rest of the main README to get a high-level overview of the architecture. 3. Read through the [code samples README](https://github.com/microsoft/autogen/tree/agentic_memory/python/samples/task_centric_memory), running each of the 4 code samples while viewing their page logs. 4. Skim through the 4 code samples, along with their corresponding yaml config files: 1. `chat_with_teachable_agent.py` 2. `eval_retrieval.py` 3. `eval_teachability.py` 4. `eval_learning_from_demonstration.py` 5. `eval_self_teaching.py` 6. Read `task_centric_memory_controller.py`, referring back to the previously generated page logs as needed. This is the most important and complex file in the PR. 7. Read the remaining core files. 1. `_task_centric_memory_bank.py` 2. `_string_similarity_map.py` 3. `_prompter.py` 8. Read the supporting files in the utils dir. 1. `teachability.py` 2. `apprentice.py` 3. `grader.py` 4. `page_logger.py` 5. `_functions.py`
113 lines
4.1 KiB
Python
113 lines
4.1 KiB
Python
import asyncio
|
|
import sys
|
|
from typing import Any, Dict
|
|
|
|
from autogen_core.models import (
|
|
ChatCompletionClient,
|
|
)
|
|
from autogen_ext.experimental.task_centric_memory.utils import Apprentice, Grader, PageLogger
|
|
|
|
from utils import create_oai_client, load_yaml_file
|
|
|
|
|
|
"""
|
|
This code sample connects task-centric memory to a selectable agent with no changes to that agent's code.
|
|
See the block diagram in the README for an overview of the components and their interactions.
|
|
See the config file configs/eval_teachability.yaml for an overall view of the structure and settings in this sample.
|
|
|
|
Execute the sample with this command:
|
|
python eval_teachability.py configs/eval_teachability.yaml
|
|
|
|
Teachable agents use memory to learn quickly from user teachings, hints, and advice.
|
|
The function below passes user instructions (loaded from a file) to the agent by calling Apprentice.handle_user_message().
|
|
If adapting this sample code to a new setting, the Apprentice class can be used or completely replaced by other code.
|
|
|
|
1. In the first conversation, the agent is expected to fail because it lacks the necessary knowledge.
|
|
2. In the second conversation (starting with an empty context window), the user provides the missing insight.
|
|
3. In the third conversation, the agent is expected to succeed after retrieving the key insight from memory.
|
|
"""
|
|
|
|
|
|
async def eval_teachability(
|
|
apprentice: Apprentice, client: ChatCompletionClient, logger: PageLogger, config: Dict[str, Any]
|
|
) -> str:
|
|
"""
|
|
Evaluates the ability to learn quickly from user teachings, hints, and advice.
|
|
"""
|
|
logger.enter_function()
|
|
|
|
# Load the specified data.
|
|
task_dict = load_yaml_file(config["task_file"])
|
|
task_description = task_dict["task_description"]
|
|
expected_answer = task_dict["expected_answer"]
|
|
|
|
insight_dict = load_yaml_file(config["insight_file"])
|
|
insight = insight_dict["insight"]
|
|
|
|
# First test without memory.
|
|
apprentice.reset_memory()
|
|
logger.info("\nClear memory, then ask the question.")
|
|
response = await apprentice.handle_user_message(task_description)
|
|
|
|
# Check the response.
|
|
grader = Grader(client, logger)
|
|
response_is_correct, extracted_answer = await grader.is_response_correct(
|
|
task_description, response, expected_answer
|
|
)
|
|
logger.info("Extracted answer: {}".format(extracted_answer))
|
|
if response_is_correct:
|
|
results_str_1 = "Answer before teaching is CORRECT."
|
|
else:
|
|
results_str_1 = "Answer before teaching is INCORRECT."
|
|
logger.info(results_str_1 + "\n")
|
|
|
|
# Give advice that should help solve this task.
|
|
logger.info("Give the advice.")
|
|
await apprentice.handle_user_message(insight)
|
|
|
|
# Now ask the question again to see if the advice helps.
|
|
logger.info("\nAsk the question again to see if the advice helps.")
|
|
response = await apprentice.handle_user_message(task_description)
|
|
|
|
# Check the response.
|
|
response_is_correct, extracted_answer = await grader.is_response_correct(
|
|
task_description, response, expected_answer
|
|
)
|
|
logger.info("Extracted answer: {}".format(extracted_answer))
|
|
if response_is_correct:
|
|
results_str_2 = "Answer after teaching is CORRECT."
|
|
else:
|
|
results_str_2 = "Answer after teaching is INCORRECT."
|
|
logger.info(results_str_2 + "\n")
|
|
|
|
logger.leave_function()
|
|
return "\neval_teachability\n" + results_str_1 + "\n" + results_str_2
|
|
|
|
|
|
async def run_example(config_filepath: str) -> None:
|
|
"""
|
|
Runs the code example with the necessary components.
|
|
"""
|
|
config = load_yaml_file(config_filepath)
|
|
|
|
# Create the necessary components.
|
|
logger = PageLogger(config["PageLogger"])
|
|
client = create_oai_client(config["client"])
|
|
apprentice = Apprentice(client, config["Apprentice"], logger)
|
|
|
|
# Call the example function.
|
|
results = await eval_teachability(apprentice, client, logger, config["test"])
|
|
|
|
# Finish up.
|
|
print(results)
|
|
|
|
|
|
if __name__ == "__main__":
|
|
args = sys.argv[1:]
|
|
if len(args) != 1:
|
|
# Print usage information.
|
|
print("Usage: amt.py <path to *.yaml file>")
|
|
else:
|
|
# Run the code example.
|
|
asyncio.run(run_example(config_filepath=args[0]))
|