mirror of
https://github.com/microsoft/autogen.git
synced 2025-08-13 03:01:30 +00:00

* Standardize printing of MessageTransforms * Fix pre-commit black failure * Add test for transform_messages printing * Return str instead of printing * Rename to_print_stats to verbose * Cleanup * t i# This is a combination of 3 commits. Update requirements * Remove lazy-fixture * Avoid calling apply_transform in two code paths * Format * Replace stats with logs * Handle no content messages in TokenLimiter get_logs() * Move tests from test_transform_messages to test_transforms --------- Co-authored-by: Wael Karkoub <wael.karkoub96@gmail.com>
123 lines
4.9 KiB
Python
123 lines
4.9 KiB
Python
import copy
|
|
from typing import Dict, List
|
|
|
|
import pytest
|
|
|
|
from autogen.agentchat.contrib.capabilities.transforms import MessageHistoryLimiter, MessageTokenLimiter, _count_tokens
|
|
|
|
|
|
def get_long_messages() -> List[Dict]:
|
|
return [
|
|
{"role": "assistant", "content": [{"type": "text", "text": "are you doing?"}]},
|
|
{"role": "user", "content": "very very very very very very long string"},
|
|
{"role": "user", "content": "hello"},
|
|
{"role": "assistant", "content": [{"type": "text", "text": "there"}]},
|
|
{"role": "user", "content": "how"},
|
|
]
|
|
|
|
|
|
def get_short_messages() -> List[Dict]:
|
|
return [
|
|
{"role": "user", "content": "hello"},
|
|
{"role": "assistant", "content": [{"type": "text", "text": "there"}]},
|
|
{"role": "user", "content": "how"},
|
|
]
|
|
|
|
|
|
def get_no_content_messages() -> List[Dict]:
|
|
return [{"role": "user", "function_call": "example"}, {"role": "assistant", "content": None}]
|
|
|
|
|
|
@pytest.fixture
|
|
def message_history_limiter() -> MessageHistoryLimiter:
|
|
return MessageHistoryLimiter(max_messages=3)
|
|
|
|
|
|
@pytest.fixture
|
|
def message_token_limiter() -> MessageTokenLimiter:
|
|
return MessageTokenLimiter(max_tokens_per_message=3)
|
|
|
|
|
|
# MessageHistoryLimiter tests
|
|
|
|
|
|
@pytest.mark.parametrize(
|
|
"messages, expected_messages_len",
|
|
[(get_long_messages(), 3), (get_short_messages(), 3), (get_no_content_messages(), 2)],
|
|
)
|
|
def test_message_history_limiter_apply_transform(message_history_limiter, messages, expected_messages_len):
|
|
transformed_messages = message_history_limiter.apply_transform(messages)
|
|
assert len(transformed_messages) == expected_messages_len
|
|
|
|
|
|
@pytest.mark.parametrize(
|
|
"messages, expected_logs, expected_effect",
|
|
[
|
|
(get_long_messages(), "Removed 2 messages. Number of messages reduced from 5 to 3.", True),
|
|
(get_short_messages(), "No messages were removed.", False),
|
|
(get_no_content_messages(), "No messages were removed.", False),
|
|
],
|
|
)
|
|
def test_message_history_limiter_get_logs(message_history_limiter, messages, expected_logs, expected_effect):
|
|
pre_transform_messages = copy.deepcopy(messages)
|
|
transformed_messages = message_history_limiter.apply_transform(messages)
|
|
logs_str, had_effect = message_history_limiter.get_logs(pre_transform_messages, transformed_messages)
|
|
assert had_effect == expected_effect
|
|
assert logs_str == expected_logs
|
|
|
|
|
|
# MessageTokenLimiter tests
|
|
|
|
|
|
@pytest.mark.parametrize(
|
|
"messages, expected_token_count, expected_messages_len",
|
|
[(get_long_messages(), 9, 5), (get_short_messages(), 3, 3), (get_no_content_messages(), 0, 2)],
|
|
)
|
|
def test_message_token_limiter_apply_transform(
|
|
message_token_limiter, messages, expected_token_count, expected_messages_len
|
|
):
|
|
transformed_messages = message_token_limiter.apply_transform(messages)
|
|
assert (
|
|
sum(_count_tokens(msg["content"]) for msg in transformed_messages if "content" in msg) == expected_token_count
|
|
)
|
|
assert len(transformed_messages) == expected_messages_len
|
|
|
|
|
|
@pytest.mark.parametrize(
|
|
"messages, expected_logs, expected_effect",
|
|
[
|
|
(get_long_messages(), "Truncated 6 tokens. Number of tokens reduced from 15 to 9", True),
|
|
(get_short_messages(), "No tokens were truncated.", False),
|
|
(get_no_content_messages(), "No tokens were truncated.", False),
|
|
],
|
|
)
|
|
def test_message_token_limiter_get_logs(message_token_limiter, messages, expected_logs, expected_effect):
|
|
pre_transform_messages = copy.deepcopy(messages)
|
|
transformed_messages = message_token_limiter.apply_transform(messages)
|
|
logs_str, had_effect = message_token_limiter.get_logs(pre_transform_messages, transformed_messages)
|
|
assert had_effect == expected_effect
|
|
assert logs_str == expected_logs
|
|
|
|
|
|
if __name__ == "__main__":
|
|
long_messages = get_long_messages()
|
|
short_messages = get_short_messages()
|
|
message_history_limiter = MessageHistoryLimiter(max_messages=3)
|
|
message_token_limiter = MessageTokenLimiter(max_tokens_per_message=3)
|
|
|
|
# Call the MessageHistoryLimiter tests
|
|
test_message_history_limiter_apply_transform(message_history_limiter, long_messages, 3)
|
|
test_message_history_limiter_apply_transform(message_history_limiter, short_messages, 3)
|
|
test_message_history_limiter_get_logs(
|
|
message_history_limiter, long_messages, "Removed 2 messages. Number of messages reduced from 5 to 3.", True
|
|
)
|
|
test_message_history_limiter_get_logs(message_history_limiter, short_messages, "No messages were removed.", False)
|
|
|
|
# Call the MessageTokenLimiter tests
|
|
test_message_token_limiter_apply_transform(message_token_limiter, long_messages, 9)
|
|
test_message_token_limiter_apply_transform(message_token_limiter, short_messages, 3)
|
|
test_message_token_limiter_get_logs(
|
|
message_token_limiter, long_messages, "Truncated 6 tokens. Number of tokens reduced from 15 to 9", True
|
|
)
|
|
test_message_token_limiter_get_logs(message_token_limiter, short_messages, "No tokens were truncated.", False)
|