mirror of
https://github.com/microsoft/autogen.git
synced 2025-07-04 07:26:28 +00:00
159 lines
5.1 KiB
Python
159 lines
5.1 KiB
Python
![]() |
#
|
||
|
# Run this file to download the human_eval dataset, and create a corresponding testbed scenario:
|
||
|
# (default: ../scenarios/human_eval_two_agents_gpt4.jsonl and ./scenarios/human_eval_two_agents_gpt35.jsonl)
|
||
|
#
|
||
|
|
||
|
import json
|
||
|
import os
|
||
|
import re
|
||
|
import sys
|
||
|
|
||
|
from huggingface_hub import snapshot_download
|
||
|
|
||
|
SCRIPT_PATH = os.path.realpath(__file__)
|
||
|
SCRIPT_NAME = os.path.basename(SCRIPT_PATH)
|
||
|
SCRIPT_DIR = os.path.dirname(SCRIPT_PATH)
|
||
|
|
||
|
SCENARIO_DIR = os.path.realpath(os.path.join(SCRIPT_DIR, os.path.pardir))
|
||
|
TEMPLATES_DIR = os.path.join(SCENARIO_DIR, "Templates")
|
||
|
TASKS_DIR = os.path.join(SCENARIO_DIR, "Tasks")
|
||
|
DOWNLOADS_DIR = os.path.join(SCENARIO_DIR, "Downloads")
|
||
|
REPO_DIR = os.path.join(DOWNLOADS_DIR, "GAIA")
|
||
|
|
||
|
|
||
|
def download_gaia():
|
||
|
"""Download the GAIA benchmark from Hugging Face."""
|
||
|
|
||
|
if not os.path.isdir(DOWNLOADS_DIR):
|
||
|
os.mkdir(DOWNLOADS_DIR)
|
||
|
|
||
|
"""Download the GAIA dataset from Hugging Face Hub"""
|
||
|
snapshot_download(
|
||
|
repo_id="gaia-benchmark/GAIA",
|
||
|
repo_type="dataset",
|
||
|
local_dir=REPO_DIR,
|
||
|
local_dir_use_symlinks=True,
|
||
|
)
|
||
|
|
||
|
|
||
|
def create_jsonl(name, tasks, files_dir, template):
|
||
|
"""Creates a JSONL scenario file with a given name, and template path."""
|
||
|
|
||
|
if not os.path.isdir(TASKS_DIR):
|
||
|
os.mkdir(TASKS_DIR)
|
||
|
|
||
|
with open(os.path.join(TASKS_DIR, name + ".jsonl"), "wt") as fh:
|
||
|
for task in tasks:
|
||
|
print(f"Converting: [{name}] {task['task_id']}")
|
||
|
|
||
|
# Figure out what files we need to copy
|
||
|
template_cp_list = [template]
|
||
|
if len(task["file_name"].strip()) > 0:
|
||
|
template_cp_list.append(
|
||
|
[
|
||
|
os.path.join(files_dir, task["file_name"].strip()),
|
||
|
task["file_name"].strip(),
|
||
|
#os.path.join("coding", task["file_name"].strip()),
|
||
|
]
|
||
|
)
|
||
|
|
||
|
record = {
|
||
|
"id": task["task_id"],
|
||
|
"template": template_cp_list,
|
||
|
"substitutions": {
|
||
|
"scenario.py": {
|
||
|
"__FILE_NAME__": task["file_name"],
|
||
|
},
|
||
|
"expected_answer.txt": {"__EXPECTED_ANSWER__": task["Final answer"]},
|
||
|
"prompt.txt": {"__PROMPT__": task["Question"]},
|
||
|
},
|
||
|
}
|
||
|
|
||
|
fh.write(json.dumps(record).strip() + "\n")
|
||
|
|
||
|
|
||
|
###############################################################################
|
||
|
def main():
|
||
|
gaia_validation_files = os.path.join(REPO_DIR, "2023", "validation")
|
||
|
gaia_test_files = os.path.join(REPO_DIR, "2023", "test")
|
||
|
|
||
|
if not os.path.isdir(gaia_validation_files) or not os.path.isdir(gaia_test_files):
|
||
|
download_gaia()
|
||
|
|
||
|
if not os.path.isdir(gaia_validation_files) or not os.path.isdir(gaia_test_files):
|
||
|
sys.exit(f"Error: '{REPO_DIR}' does not appear to be a copy of the GAIA repository.")
|
||
|
|
||
|
# Load the GAIA data
|
||
|
gaia_validation_tasks = [[], [], []]
|
||
|
with open(os.path.join(gaia_validation_files, "metadata.jsonl")) as fh:
|
||
|
for line in fh:
|
||
|
data = json.loads(line)
|
||
|
gaia_validation_tasks[data["Level"] - 1].append(data)
|
||
|
|
||
|
gaia_test_tasks = [[], [], []]
|
||
|
with open(os.path.join(gaia_test_files, "metadata.jsonl")) as fh:
|
||
|
for line in fh:
|
||
|
data = json.loads(line)
|
||
|
|
||
|
# A welcome message -- not a real task
|
||
|
if data["task_id"] == "0-0-0-0-0":
|
||
|
continue
|
||
|
|
||
|
gaia_test_tasks[data["Level"] - 1].append(data)
|
||
|
|
||
|
# list all directories in the Templates directory
|
||
|
# and populate a dictionary with the name and path
|
||
|
templates = {}
|
||
|
for entry in os.scandir(TEMPLATES_DIR):
|
||
|
if entry.is_dir():
|
||
|
templates[re.sub(r"\s", "", entry.name)] = entry.path
|
||
|
|
||
|
# Add coding directories if needed (these are usually empty and left out of the repo)
|
||
|
#for template in templates.values():
|
||
|
# code_dir_path = os.path.join(template, "coding")
|
||
|
# if not os.path.isdir(code_dir_path):
|
||
|
# os.mkdir(code_dir_path)
|
||
|
|
||
|
# Create the various combinations of [models] x [templates]
|
||
|
for t in templates.items():
|
||
|
create_jsonl(
|
||
|
f"gaia_validation_level_1__{t[0]}",
|
||
|
gaia_validation_tasks[0],
|
||
|
gaia_validation_files,
|
||
|
t[1],
|
||
|
)
|
||
|
create_jsonl(
|
||
|
f"gaia_validation_level_2__{t[0]}",
|
||
|
gaia_validation_tasks[1],
|
||
|
gaia_validation_files,
|
||
|
t[1],
|
||
|
)
|
||
|
create_jsonl(
|
||
|
f"gaia_validation_level_3__{t[0]}",
|
||
|
gaia_validation_tasks[2],
|
||
|
gaia_validation_files,
|
||
|
t[1],
|
||
|
)
|
||
|
create_jsonl(
|
||
|
f"gaia_test_level_1__{t[0]}",
|
||
|
gaia_test_tasks[0],
|
||
|
gaia_test_files,
|
||
|
t[1],
|
||
|
)
|
||
|
create_jsonl(
|
||
|
f"gaia_test_level_2__{t[0]}",
|
||
|
gaia_test_tasks[1],
|
||
|
gaia_test_files,
|
||
|
t[1],
|
||
|
)
|
||
|
create_jsonl(
|
||
|
f"gaia_test_level_3__{t[0]}",
|
||
|
gaia_test_tasks[2],
|
||
|
gaia_test_files,
|
||
|
t[1],
|
||
|
)
|
||
|
|
||
|
|
||
|
if __name__ == "__main__" and __package__ is None:
|
||
|
main()
|