2024-02-14 19:54:17 -05:00
|
|
|
import json
|
2024-04-15 05:34:26 -07:00
|
|
|
import os
|
2024-04-05 10:26:06 +08:00
|
|
|
import sqlite3
|
2024-02-14 19:54:17 -05:00
|
|
|
import sys
|
|
|
|
import uuid
|
|
|
|
|
2024-04-05 10:26:06 +08:00
|
|
|
import pytest
|
2024-02-14 19:54:17 -05:00
|
|
|
|
2024-04-15 05:34:26 -07:00
|
|
|
sys.path.append(os.path.join(os.path.dirname(__file__), ".."))
|
|
|
|
sys.path.append(os.path.join(os.path.dirname(__file__), "../.."))
|
2024-05-16 11:24:05 +05:30
|
|
|
|
|
|
|
|
2024-04-15 05:34:26 -07:00
|
|
|
from conftest import skip_openai # noqa: E402
|
|
|
|
from test_assistant_agent import KEY_LOC, OAI_CONFIG_LIST # noqa: E402
|
|
|
|
|
2024-05-16 11:24:05 +05:30
|
|
|
import autogen
|
|
|
|
import autogen.runtime_logging
|
|
|
|
|
2024-02-14 19:54:17 -05:00
|
|
|
TEACHER_MESSAGE = """
|
|
|
|
You are roleplaying a math teacher, and your job is to help your students with linear algebra.
|
|
|
|
Keep your explanations short.
|
|
|
|
"""
|
|
|
|
|
|
|
|
STUDENT_MESSAGE = """
|
|
|
|
You are roleplaying a high school student strugling with linear algebra.
|
|
|
|
Regardless how well the teacher explains things to you, you just don't quite get it.
|
|
|
|
Keep your questions short.
|
|
|
|
"""
|
|
|
|
|
|
|
|
CHAT_COMPLETIONS_QUERY = """SELECT id, invocation_id, client_id, wrapper_id, session_id,
|
|
|
|
request, response, is_cached, cost, start_time, end_time FROM chat_completions;"""
|
|
|
|
|
|
|
|
AGENTS_QUERY = "SELECT id, agent_id, wrapper_id, session_id, name, class, init_args, timestamp FROM agents"
|
|
|
|
|
|
|
|
OAI_CLIENTS_QUERY = "SELECT id, client_id, wrapper_id, session_id, class, init_args, timestamp FROM oai_clients"
|
|
|
|
|
|
|
|
OAI_WRAPPERS_QUERY = "SELECT id, wrapper_id, session_id, init_args, timestamp FROM oai_wrappers"
|
|
|
|
|
2024-04-23 18:27:47 -04:00
|
|
|
EVENTS_QUERY = (
|
|
|
|
"SELECT source_id, source_name, event_name, agent_module, agent_class_name, json_state, timestamp FROM events"
|
|
|
|
)
|
2024-02-14 19:54:17 -05:00
|
|
|
|
|
|
|
if not skip_openai:
|
|
|
|
config_list = autogen.config_list_from_json(
|
|
|
|
OAI_CONFIG_LIST,
|
|
|
|
filter_dict={
|
2024-06-14 11:58:17 -04:00
|
|
|
"tags": ["gpt-3.5-turbo"],
|
2024-02-14 19:54:17 -05:00
|
|
|
},
|
|
|
|
file_location=KEY_LOC,
|
|
|
|
)
|
|
|
|
|
|
|
|
llm_config = {"config_list": config_list}
|
|
|
|
|
|
|
|
num_of_configs = len(config_list)
|
|
|
|
###############################################################
|
|
|
|
|
|
|
|
|
|
|
|
@pytest.fixture(scope="function")
|
|
|
|
def db_connection():
|
|
|
|
autogen.runtime_logging.start(config={"dbname": ":memory:"})
|
|
|
|
con = autogen.runtime_logging.get_connection()
|
|
|
|
con.row_factory = sqlite3.Row
|
|
|
|
yield con
|
|
|
|
|
|
|
|
autogen.runtime_logging.stop()
|
|
|
|
|
|
|
|
|
|
|
|
@pytest.mark.skipif(
|
|
|
|
sys.platform in ["darwin", "win32"] or skip_openai,
|
|
|
|
reason="do not run on MacOS or windows OR dependency is not installed OR requested to skip",
|
|
|
|
)
|
|
|
|
def test_two_agents_logging(db_connection):
|
|
|
|
cur = db_connection.cursor()
|
|
|
|
|
|
|
|
teacher = autogen.AssistantAgent(
|
|
|
|
"teacher",
|
|
|
|
system_message=TEACHER_MESSAGE,
|
|
|
|
is_termination_msg=lambda x: x.get("content", "").find("TERMINATE") >= 0,
|
|
|
|
llm_config=llm_config,
|
|
|
|
max_consecutive_auto_reply=2,
|
|
|
|
)
|
|
|
|
|
|
|
|
student = autogen.AssistantAgent(
|
|
|
|
"student",
|
|
|
|
system_message=STUDENT_MESSAGE,
|
|
|
|
is_termination_msg=lambda x: x.get("content", "").find("TERMINATE") >= 0,
|
|
|
|
llm_config=llm_config,
|
|
|
|
max_consecutive_auto_reply=1,
|
|
|
|
)
|
|
|
|
|
|
|
|
student.initiate_chat(
|
|
|
|
teacher,
|
|
|
|
message="Can you explain the difference between eigenvalues and singular values again?",
|
|
|
|
)
|
|
|
|
|
|
|
|
# Verify log completions table
|
|
|
|
cur.execute(CHAT_COMPLETIONS_QUERY)
|
|
|
|
rows = cur.fetchall()
|
|
|
|
|
2024-02-15 13:51:38 -05:00
|
|
|
assert len(rows) >= 3 # some config may fail
|
2024-02-14 19:54:17 -05:00
|
|
|
session_id = rows[0]["session_id"]
|
|
|
|
|
|
|
|
for idx, row in enumerate(rows):
|
|
|
|
assert (
|
|
|
|
row["invocation_id"] and str(uuid.UUID(row["invocation_id"], version=4)) == row["invocation_id"]
|
|
|
|
), "invocation id is not valid uuid"
|
|
|
|
assert row["client_id"], "client id is empty"
|
|
|
|
assert row["wrapper_id"], "wrapper id is empty"
|
|
|
|
assert row["session_id"] and row["session_id"] == session_id
|
|
|
|
|
|
|
|
request = json.loads(row["request"])
|
|
|
|
first_request_message = request["messages"][0]["content"]
|
|
|
|
first_request_role = request["messages"][0]["role"]
|
|
|
|
|
2024-04-05 06:41:14 -07:00
|
|
|
# some config may fail
|
|
|
|
if idx == 0 or idx == len(rows) - 1:
|
2024-02-14 19:54:17 -05:00
|
|
|
assert first_request_message == TEACHER_MESSAGE
|
2024-04-05 06:41:14 -07:00
|
|
|
elif idx == 1 and len(rows) == 3:
|
2024-02-14 19:54:17 -05:00
|
|
|
assert first_request_message == STUDENT_MESSAGE
|
2024-04-05 06:41:14 -07:00
|
|
|
else:
|
|
|
|
assert first_request_message in (TEACHER_MESSAGE, STUDENT_MESSAGE)
|
2024-02-14 19:54:17 -05:00
|
|
|
assert first_request_role == "system"
|
|
|
|
|
|
|
|
response = json.loads(row["response"])
|
2024-03-16 21:27:00 -04:00
|
|
|
|
|
|
|
if "response" in response: # config failed or response was empty
|
|
|
|
assert response["response"] is None or "error_code" in response["response"]
|
|
|
|
else:
|
|
|
|
assert "choices" in response and len(response["choices"]) > 0
|
2024-02-14 19:54:17 -05:00
|
|
|
|
2024-04-04 10:36:46 -04:00
|
|
|
assert row["cost"] >= 0.0
|
2024-02-14 19:54:17 -05:00
|
|
|
assert row["start_time"], "start timestamp is empty"
|
|
|
|
assert row["end_time"], "end timestamp is empty"
|
|
|
|
|
|
|
|
# Verify agents table
|
|
|
|
cur.execute(AGENTS_QUERY)
|
|
|
|
rows = cur.fetchall()
|
|
|
|
|
|
|
|
assert len(rows) == 2
|
|
|
|
|
|
|
|
session_id = rows[0]["session_id"]
|
|
|
|
for idx, row in enumerate(rows):
|
|
|
|
assert row["wrapper_id"], "wrapper id is empty"
|
|
|
|
assert row["session_id"] and row["session_id"] == session_id
|
|
|
|
|
|
|
|
agent = json.loads(row["init_args"])
|
|
|
|
if idx == 0:
|
|
|
|
assert row["name"] == "teacher"
|
|
|
|
assert agent["name"] == "teacher"
|
|
|
|
agent["system_message"] == TEACHER_MESSAGE
|
|
|
|
elif idx == 1:
|
|
|
|
assert row["name"] == "student"
|
|
|
|
assert agent["name"] == "student"
|
|
|
|
agent["system_message"] = STUDENT_MESSAGE
|
|
|
|
|
|
|
|
assert "api_key" not in row["init_args"]
|
|
|
|
assert row["timestamp"], "timestamp is empty"
|
|
|
|
|
|
|
|
# Verify oai client table
|
|
|
|
cur.execute(OAI_CLIENTS_QUERY)
|
|
|
|
rows = cur.fetchall()
|
|
|
|
|
|
|
|
assert len(rows) == num_of_configs * 2 # two agents
|
|
|
|
|
|
|
|
session_id = rows[0]["session_id"]
|
|
|
|
for row in rows:
|
|
|
|
assert row["client_id"], "client id is empty"
|
|
|
|
assert row["wrapper_id"], "wrapper id is empty"
|
|
|
|
assert row["session_id"] and row["session_id"] == session_id
|
|
|
|
assert row["class"] in ["AzureOpenAI", "OpenAI"]
|
|
|
|
init_args = json.loads(row["init_args"])
|
2024-03-26 23:39:55 +01:00
|
|
|
if row["class"] == "AzureOpenAI":
|
|
|
|
assert "api_version" in init_args
|
2024-02-14 19:54:17 -05:00
|
|
|
assert row["timestamp"], "timestamp is empty"
|
|
|
|
|
|
|
|
# Verify oai wrapper table
|
|
|
|
cur.execute(OAI_WRAPPERS_QUERY)
|
|
|
|
rows = cur.fetchall()
|
|
|
|
|
|
|
|
session_id = rows[0]["session_id"]
|
|
|
|
|
|
|
|
for row in rows:
|
|
|
|
assert row["wrapper_id"], "wrapper id is empty"
|
|
|
|
assert row["session_id"] and row["session_id"] == session_id
|
|
|
|
init_args = json.loads(row["init_args"])
|
|
|
|
assert "config_list" in init_args
|
|
|
|
assert len(init_args["config_list"]) > 0
|
|
|
|
assert row["timestamp"], "timestamp is empty"
|
|
|
|
|
|
|
|
|
|
|
|
@pytest.mark.skipif(
|
|
|
|
sys.platform in ["darwin", "win32"] or skip_openai,
|
|
|
|
reason="do not run on MacOS or windows OR dependency is not installed OR requested to skip",
|
|
|
|
)
|
|
|
|
def test_groupchat_logging(db_connection):
|
|
|
|
cur = db_connection.cursor()
|
|
|
|
|
|
|
|
teacher = autogen.AssistantAgent(
|
|
|
|
"teacher",
|
|
|
|
system_message=TEACHER_MESSAGE,
|
|
|
|
is_termination_msg=lambda x: x.get("content", "").find("TERMINATE") >= 0,
|
|
|
|
llm_config=llm_config,
|
|
|
|
max_consecutive_auto_reply=2,
|
|
|
|
)
|
|
|
|
|
|
|
|
student = autogen.AssistantAgent(
|
|
|
|
"student",
|
|
|
|
system_message=STUDENT_MESSAGE,
|
|
|
|
is_termination_msg=lambda x: x.get("content", "").find("TERMINATE") >= 0,
|
|
|
|
llm_config=llm_config,
|
|
|
|
max_consecutive_auto_reply=1,
|
|
|
|
)
|
|
|
|
|
|
|
|
groupchat = autogen.GroupChat(
|
|
|
|
agents=[teacher, student], messages=[], max_round=3, speaker_selection_method="round_robin"
|
|
|
|
)
|
|
|
|
|
|
|
|
group_chat_manager = autogen.GroupChatManager(groupchat=groupchat, llm_config=llm_config)
|
|
|
|
|
|
|
|
student.initiate_chat(
|
|
|
|
group_chat_manager,
|
|
|
|
message="Can you explain the difference between eigenvalues and singular values again?",
|
|
|
|
)
|
|
|
|
|
|
|
|
# Verify chat_completions message
|
|
|
|
cur.execute(CHAT_COMPLETIONS_QUERY)
|
|
|
|
rows = cur.fetchall()
|
2024-02-14 20:51:22 -08:00
|
|
|
assert len(rows) >= 2 # some config may fail
|
2024-02-14 19:54:17 -05:00
|
|
|
|
|
|
|
# Verify group chat manager agent
|
|
|
|
cur.execute(AGENTS_QUERY)
|
|
|
|
rows = cur.fetchall()
|
|
|
|
assert len(rows) == 3
|
|
|
|
|
|
|
|
chat_manager_query = "SELECT agent_id, name, class, init_args FROM agents WHERE name = 'chat_manager'"
|
|
|
|
cur.execute(chat_manager_query)
|
|
|
|
rows = cur.fetchall()
|
|
|
|
assert len(rows) == 1
|
|
|
|
|
|
|
|
# Verify oai clients
|
|
|
|
cur.execute(OAI_CLIENTS_QUERY)
|
|
|
|
rows = cur.fetchall()
|
|
|
|
assert len(rows) == num_of_configs * 3 # three agents
|
|
|
|
|
|
|
|
# Verify oai wrappers
|
|
|
|
cur.execute(OAI_WRAPPERS_QUERY)
|
|
|
|
rows = cur.fetchall()
|
|
|
|
assert len(rows) == 3
|
|
|
|
|
2024-04-23 18:27:47 -04:00
|
|
|
# Verify events
|
|
|
|
cur.execute(EVENTS_QUERY)
|
|
|
|
rows = cur.fetchall()
|
|
|
|
json_state = json.loads(rows[0]["json_state"])
|
|
|
|
assert rows[0]["event_name"] == "received_message"
|
|
|
|
assert json_state["message"] == "Can you explain the difference between eigenvalues and singular values again?"
|
|
|
|
assert len(rows) == 15
|
|
|
|
|
2024-02-14 19:54:17 -05:00
|
|
|
# Verify schema version
|
|
|
|
version_query = "SELECT id, version_number from version"
|
|
|
|
cur.execute(version_query)
|
|
|
|
rows = cur.fetchall()
|
|
|
|
assert len(rows) == 1
|
|
|
|
assert rows[0]["id"] == 1 and rows[0]["version_number"] == 1
|