mirror of
				https://github.com/deepset-ai/haystack.git
				synced 2025-10-31 09:49:48 +00:00 
			
		
		
		
	 a75b9dd4bb
			
		
	
	
		a75b9dd4bb
		
			
		
	
	
	
	
		
			
			* Add content type resolution, pdf handler, user agent switching --------- Co-authored-by: Daria Fokina <daria.fokina@deepset.ai> Co-authored-by: ZanSara <sara.zanzottera@deepset.ai>
		
			
				
	
	
		
			35 lines
		
	
	
		
			1.3 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
			
		
		
	
	
			35 lines
		
	
	
		
			1.3 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
# Example script: fetch research papers by URL and summarize each one with an
# Anthropic model through a two-node Haystack pipeline (fetcher -> prompt node).
import os

from haystack.nodes import PromptNode, LinkContentFetcher, PromptTemplate
from haystack import Pipeline

# The Anthropic API key is mandatory; abort immediately when it is missing or empty.
anthropic_key = os.getenv("ANTHROPIC_API_KEY")
if not anthropic_key:
    raise ValueError("Please set the ANTHROPIC_API_KEY environment variable")

# Extra user-agent string handed to the fetcher.
# NOTE(review): presumably tried as an alternative when the default agent is
# rejected by the server - confirm against the LinkContentFetcher docs.
alt_user_agents = [
    "Mozilla/5.0 (Macintosh; Intel Mac OS X 13_4_1) AppleWebKit/605.1.15 (KHTML, like Gecko) Version/16.5 Safari/605.1.15"
]
retriever = LinkContentFetcher(user_agents=alt_user_agents)

# Summary instructions; the fetched content is substituted for {documents}.
summary_prompt = (
    "Given the content below, create a summary consisting of three sections: Objectives, "
    "Implementation and Learnings/Conclusions.\n"
    "Each section should have at least three bullet points. \n"
    "In the content below disregard References section.\n\n: {documents}"
)
pt = PromptTemplate(summary_prompt)

# Streaming is requested via model_kwargs; the return value of pipeline.run()
# is not printed below.
# NOTE(review): presumably the streamed tokens are echoed to stdout by the
# node's default handler - confirm.
prompt_node = PromptNode(
    "claude-instant-1",
    api_key=anthropic_key,
    max_length=512,
    default_prompt_template=pt,
    model_kwargs={"stream": True},
)

# Wire the pipeline: Query -> Retriever -> PromptNode.
pipeline = Pipeline()
pipeline.add_node(component=retriever, name="Retriever", inputs=["Query"])
pipeline.add_node(component=prompt_node, name="PromptNode", inputs=["Retriever"])

research_papers = [
    "https://arxiv.org/pdf/2307.03172.pdf",
    "https://arxiv.org/pdf/1706.03762.pdf",
]

# Each URL is passed to the pipeline as the query; a header line precedes every
# run and blank lines separate consecutive runs.
for research_paper in research_papers:
    print(f"Research paper summary: {research_paper}")
    pipeline.run(research_paper)
    print("\n\n\n")