mirror of
				https://github.com/microsoft/autogen.git
				synced 2025-10-25 06:49:13 +00:00 
			
		
		
		
	
		
			
	
	
		
			159 lines
		
	
	
		
			5.1 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
		
		
			
		
	
	
			159 lines
		
	
	
		
			5.1 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
|   | # | ||
|  | # Run this file to download the human_eval dataset, and create a corresponding testbed scenario: | ||
|  | # (default: ../scenarios/human_eval_two_agents_gpt4.jsonl and ./scenarios/human_eval_two_agents_gpt35.jsonl) | ||
|  | # | ||
|  | 
 | ||
|  | import json | ||
|  | import os | ||
|  | import re | ||
|  | import sys | ||
|  | 
 | ||
|  | from huggingface_hub import snapshot_download | ||
|  | 
 | ||
|  | SCRIPT_PATH = os.path.realpath(__file__) | ||
|  | SCRIPT_NAME = os.path.basename(SCRIPT_PATH) | ||
|  | SCRIPT_DIR = os.path.dirname(SCRIPT_PATH) | ||
|  | 
 | ||
|  | SCENARIO_DIR = os.path.realpath(os.path.join(SCRIPT_DIR, os.path.pardir)) | ||
|  | TEMPLATES_DIR = os.path.join(SCENARIO_DIR, "Templates") | ||
|  | TASKS_DIR = os.path.join(SCENARIO_DIR, "Tasks") | ||
|  | DOWNLOADS_DIR = os.path.join(SCENARIO_DIR, "Downloads") | ||
|  | REPO_DIR = os.path.join(DOWNLOADS_DIR, "GAIA") | ||
|  | 
 | ||
|  | 
 | ||
|  | def download_gaia(): | ||
|  |     """Download the GAIA benchmark from Hugging Face.""" | ||
|  | 
 | ||
|  |     if not os.path.isdir(DOWNLOADS_DIR): | ||
|  |         os.mkdir(DOWNLOADS_DIR) | ||
|  | 
 | ||
|  |     """Download the GAIA dataset from Hugging Face Hub""" | ||
|  |     snapshot_download( | ||
|  |         repo_id="gaia-benchmark/GAIA", | ||
|  |         repo_type="dataset", | ||
|  |         local_dir=REPO_DIR, | ||
|  |         local_dir_use_symlinks=True, | ||
|  |     ) | ||
|  | 
 | ||
|  | 
 | ||
|  | def create_jsonl(name, tasks, files_dir, template): | ||
|  |     """Creates a JSONL scenario file with a given name, and template path.""" | ||
|  | 
 | ||
|  |     if not os.path.isdir(TASKS_DIR): | ||
|  |         os.mkdir(TASKS_DIR) | ||
|  | 
 | ||
|  |     with open(os.path.join(TASKS_DIR, name + ".jsonl"), "wt") as fh: | ||
|  |         for task in tasks: | ||
|  |             print(f"Converting: [{name}] {task['task_id']}") | ||
|  | 
 | ||
|  |             # Figure out what files we need to copy | ||
|  |             template_cp_list = [template] | ||
|  |             if len(task["file_name"].strip()) > 0: | ||
|  |                 template_cp_list.append( | ||
|  |                     [ | ||
|  |                         os.path.join(files_dir, task["file_name"].strip()), | ||
|  |                         task["file_name"].strip(), | ||
|  |                         #os.path.join("coding", task["file_name"].strip()), | ||
|  |                     ] | ||
|  |                 ) | ||
|  | 
 | ||
|  |             record = { | ||
|  |                 "id": task["task_id"], | ||
|  |                 "template": template_cp_list, | ||
|  |                 "substitutions": { | ||
|  |                     "scenario.py": { | ||
|  |                         "__FILE_NAME__": task["file_name"], | ||
|  |                     }, | ||
|  |                     "expected_answer.txt": {"__EXPECTED_ANSWER__": task["Final answer"]}, | ||
|  |                     "prompt.txt": {"__PROMPT__": task["Question"]}, | ||
|  |                 }, | ||
|  |             } | ||
|  | 
 | ||
|  |             fh.write(json.dumps(record).strip() + "\n") | ||
|  | 
 | ||
|  | 
 | ||
|  | ############################################################################### | ||
|  | def main(): | ||
|  |     gaia_validation_files = os.path.join(REPO_DIR, "2023", "validation") | ||
|  |     gaia_test_files = os.path.join(REPO_DIR, "2023", "test") | ||
|  | 
 | ||
|  |     if not os.path.isdir(gaia_validation_files) or not os.path.isdir(gaia_test_files): | ||
|  |         download_gaia() | ||
|  | 
 | ||
|  |     if not os.path.isdir(gaia_validation_files) or not os.path.isdir(gaia_test_files): | ||
|  |         sys.exit(f"Error: '{REPO_DIR}' does not appear to be a copy of the GAIA repository.") | ||
|  | 
 | ||
|  |     # Load the GAIA data | ||
|  |     gaia_validation_tasks = [[], [], []] | ||
|  |     with open(os.path.join(gaia_validation_files, "metadata.jsonl")) as fh: | ||
|  |         for line in fh: | ||
|  |             data = json.loads(line) | ||
|  |             gaia_validation_tasks[data["Level"] - 1].append(data) | ||
|  | 
 | ||
|  |     gaia_test_tasks = [[], [], []] | ||
|  |     with open(os.path.join(gaia_test_files, "metadata.jsonl")) as fh: | ||
|  |         for line in fh: | ||
|  |             data = json.loads(line) | ||
|  | 
 | ||
|  |             # A welcome message -- not a real task | ||
|  |             if data["task_id"] == "0-0-0-0-0": | ||
|  |                 continue | ||
|  | 
 | ||
|  |             gaia_test_tasks[data["Level"] - 1].append(data) | ||
|  | 
 | ||
|  |     # list all directories in the Templates directory | ||
|  |     # and populate a dictionary with the name and path | ||
|  |     templates = {} | ||
|  |     for entry in os.scandir(TEMPLATES_DIR): | ||
|  |         if entry.is_dir(): | ||
|  |             templates[re.sub(r"\s", "", entry.name)] = entry.path | ||
|  | 
 | ||
|  |     # Add coding directories if needed (these are usually empty and left out of the repo) | ||
|  |     #for template in templates.values(): | ||
|  |     #    code_dir_path = os.path.join(template, "coding") | ||
|  |     #    if not os.path.isdir(code_dir_path): | ||
|  |     #        os.mkdir(code_dir_path) | ||
|  | 
 | ||
|  |     # Create the various combinations of [models] x [templates] | ||
|  |     for t in templates.items(): | ||
|  |         create_jsonl( | ||
|  |             f"gaia_validation_level_1__{t[0]}", | ||
|  |             gaia_validation_tasks[0], | ||
|  |             gaia_validation_files, | ||
|  |             t[1], | ||
|  |         ) | ||
|  |         create_jsonl( | ||
|  |             f"gaia_validation_level_2__{t[0]}", | ||
|  |             gaia_validation_tasks[1], | ||
|  |             gaia_validation_files, | ||
|  |             t[1], | ||
|  |         ) | ||
|  |         create_jsonl( | ||
|  |             f"gaia_validation_level_3__{t[0]}", | ||
|  |             gaia_validation_tasks[2], | ||
|  |             gaia_validation_files, | ||
|  |             t[1], | ||
|  |         ) | ||
|  |         create_jsonl( | ||
|  |             f"gaia_test_level_1__{t[0]}", | ||
|  |             gaia_test_tasks[0], | ||
|  |             gaia_test_files, | ||
|  |             t[1], | ||
|  |         ) | ||
|  |         create_jsonl( | ||
|  |             f"gaia_test_level_2__{t[0]}", | ||
|  |             gaia_test_tasks[1], | ||
|  |             gaia_test_files, | ||
|  |             t[1], | ||
|  |         ) | ||
|  |         create_jsonl( | ||
|  |             f"gaia_test_level_3__{t[0]}", | ||
|  |             gaia_test_tasks[2], | ||
|  |             gaia_test_files, | ||
|  |             t[1], | ||
|  |         ) | ||
|  | 
 | ||
|  | 
 | ||
|  | if __name__ == "__main__" and __package__ is None: | ||
|  |     main() |