# Copyright (c) 2024 Microsoft Corporation.
# Licensed under the MIT License
2024-10-09 13:46:44 -07:00
|
|
|
|
|
|
|
import pytest
|
|
|
|
|
2025-01-06 10:58:59 -08:00
|
|
|
from graphrag.callbacks.noop_workflow_callbacks import NoopWorkflowCallbacks
|
2025-01-03 13:59:26 -08:00
|
|
|
from graphrag.config.create_graphrag_config import create_graphrag_config
|
2024-10-09 13:46:44 -07:00
|
|
|
from graphrag.config.enums import LLMType
|
2024-12-18 16:21:41 -08:00
|
|
|
from graphrag.index.operations.summarize_communities.community_reports_extractor.community_reports_extractor import (
|
2024-12-05 16:07:47 -08:00
|
|
|
CommunityReportResponse,
|
|
|
|
FindingModel,
|
|
|
|
)
|
2025-01-03 13:59:26 -08:00
|
|
|
from graphrag.index.run.derive_from_rows import ParallelizationError
|
|
|
|
from graphrag.index.workflows.create_final_community_reports import (
|
|
|
|
run_workflow,
|
2024-09-30 10:46:07 -07:00
|
|
|
workflow_name,
|
|
|
|
)
|
2025-01-03 13:59:26 -08:00
|
|
|
from graphrag.utils.storage import load_table_from_storage
|
2024-09-30 10:46:07 -07:00
|
|
|
|
|
|
|
from .util import (
|
|
|
|
compare_outputs,
|
2025-01-03 13:59:26 -08:00
|
|
|
create_test_context,
|
2024-12-05 09:57:26 -08:00
|
|
|
load_test_table,
|
2024-09-30 10:46:07 -07:00
|
|
|
)
|
|
|
|
|
2024-10-09 13:46:44 -07:00
|
|
|
# Canned community-report responses handed to the mock LLM configuration below.
# Every field holds an angle-bracketed placeholder so the tests can recognise
# mock values when they show up in the workflow output.
MOCK_RESPONSES = [
    CommunityReportResponse(
        title="<report_title>",
        summary="<executive_summary>",
        rating=2,
        rating_explanation="<rating_explanation>",
        findings=[
            FindingModel(
                summary="<insight_1_summary>",
                explanation="<insight_1_explanation>",
            ),
            FindingModel(
                summary="<insight_2_summary>",
                explanation="<insight_2_explanation>",
            ),
        ],
    )
]
|
|
|
|
|
2024-12-05 16:07:47 -08:00
|
|
|
# LLM settings plugged into the community-reports strategy by the tests in
# this module. The responses come from MOCK_RESPONSES; presumably the
# StaticResponse type replays them instead of calling a real model
# (NOTE(review): confirm against the LLMType definition).
MOCK_LLM_CONFIG = {
    "type": LLMType.StaticResponse,
    "responses": MOCK_RESPONSES,
    "parse_json": True,
}
|
2024-10-09 13:46:44 -07:00
|
|
|
|
2024-09-30 10:46:07 -07:00
|
|
|
|
|
|
|
async def test_create_final_community_reports():
    """Run the community-reports workflow with the mock LLM config and check its output.

    The workflow result is read back from the test context's storage and
    compared with the stored expected table: the column count must match, the
    "community" and "level" columns are compared via compare_outputs, and the
    first row's rank fields must carry the values from MOCK_RESPONSES.
    """
    input_tables = [
        "create_final_nodes",
        "create_final_covariates",
        "create_final_relationships",
        "create_final_entities",
        "create_final_communities",
    ]

    expected = load_test_table(workflow_name)
    context = await create_test_context(storage=input_tables)

    # Point the community-reports strategy at the mock LLM configuration.
    config = create_graphrag_config()
    strategy = {
        "type": "graph_intelligence",
        "llm": MOCK_LLM_CONFIG,
    }
    config.community_reports.strategy = strategy

    await run_workflow(config, context, NoopWorkflowCallbacks())

    actual = await load_table_from_storage(workflow_name, context.storage)

    assert len(actual.columns) == len(expected.columns)

    # only assert a couple of columns that are not mock - most of this table is LLM-generated
    compare_outputs(actual, expected, columns=["community", "level"])

    # assert a handful of mock data items to confirm they get put in the right spot
    first_rank = actual["rank"][:1][0]
    first_rank_explanation = actual["rank_explanation"][:1][0]
    assert first_rank == 2
    assert first_rank_explanation == "<rating_explanation>"
|
|
|
|
|
|
|
|
|
2024-10-09 13:46:44 -07:00
|
|
|
async def test_create_final_community_reports_missing_llm_throws():
    """Expect ParallelizationError when the strategy has no "llm" entry.

    The workflow is run with a community-reports strategy that specifies only
    its "type", and the call must raise ParallelizationError.
    """
    input_tables = [
        "create_final_nodes",
        "create_final_covariates",
        "create_final_relationships",
        "create_final_entities",
        "create_final_communities",
    ]
    context = await create_test_context(storage=input_tables)

    config = create_graphrag_config()
    # The "llm" key is deliberately left out of the strategy.
    config.community_reports.strategy = {"type": "graph_intelligence"}

    with pytest.raises(ParallelizationError):
        await run_workflow(config, context, NoopWorkflowCallbacks())
|