| 
									
										
										
										
											2024-10-07 18:55:43 +08:00
										 |  |  | from openai import OpenAI | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2024-10-08 14:39:05 +08:00
										 |  |  | # os.environ["OPENAI_API_KEY"] = "" | 
					
						
							| 
									
										
										
										
											2024-10-07 18:55:43 +08:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2024-10-19 09:43:17 +05:30
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2024-10-07 18:55:43 +08:00
										 |  |  | def openai_complete_if_cache( | 
					
						
							|  |  |  |     model="gpt-4o-mini", prompt=None, system_prompt=None, history_messages=[], **kwargs | 
					
						
							|  |  |  | ) -> str: | 
					
						
							|  |  |  |     openai_client = OpenAI() | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     messages = [] | 
					
						
							|  |  |  |     if system_prompt: | 
					
						
							|  |  |  |         messages.append({"role": "system", "content": system_prompt}) | 
					
						
							|  |  |  |     messages.extend(history_messages) | 
					
						
							|  |  |  |     messages.append({"role": "user", "content": prompt}) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     response = openai_client.chat.completions.create( | 
					
						
							|  |  |  |         model=model, messages=messages, **kwargs | 
					
						
							|  |  |  |     ) | 
					
						
							|  |  |  |     return response.choices[0].message.content | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | if __name__ == "__main__": | 
					
						
							|  |  |  |     description = "" | 
					
						
							|  |  |  |     prompt = f"""
 | 
					
						
							|  |  |  |     Given the following description of a dataset: | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     {description} | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     Please identify 5 potential users who would engage with this dataset. For each user, list 5 tasks they would perform with this dataset. Then, for each (user, task) combination, generate 5 questions that require a high-level understanding of the entire dataset. | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     Output the results in the following structure: | 
					
						
							|  |  |  |     - User 1: [user description] | 
					
						
							|  |  |  |         - Task 1: [task description] | 
					
						
							|  |  |  |             - Question 1: | 
					
						
							|  |  |  |             - Question 2: | 
					
						
							|  |  |  |             - Question 3: | 
					
						
							|  |  |  |             - Question 4: | 
					
						
							|  |  |  |             - Question 5: | 
					
						
							|  |  |  |         - Task 2: [task description] | 
					
						
							|  |  |  |             ... | 
					
						
							|  |  |  |         - Task 5: [task description] | 
					
						
							|  |  |  |     - User 2: [user description] | 
					
						
							|  |  |  |         ... | 
					
						
							|  |  |  |     - User 5: [user description] | 
					
						
							|  |  |  |         ... | 
					
						
							|  |  |  |     """
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2024-10-19 09:43:17 +05:30
										 |  |  |     result = openai_complete_if_cache(model="gpt-4o-mini", prompt=prompt) | 
					
						
							| 
									
										
										
										
											2024-10-07 18:55:43 +08:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2024-10-19 09:43:17 +05:30
										 |  |  |     file_path = "./queries.txt" | 
					
						
							| 
									
										
										
										
											2024-10-07 18:55:43 +08:00
										 |  |  |     with open(file_path, "w") as file: | 
					
						
							|  |  |  |         file.write(result) | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2024-10-19 09:43:17 +05:30
										 |  |  |     print(f"Queries written to {file_path}") |