mirror of
https://github.com/deepset-ai/haystack.git
synced 2025-06-26 22:00:13 +00:00

* Add content type resolution, pdf handler, user agent switching --------- Co-authored-by: Daria Fokina <daria.fokina@deepset.ai> Co-authored-by: ZanSara <sara.zanzottera@deepset.ai>
35 lines
1.3 KiB
Python
35 lines
1.3 KiB
Python
"""Example script: summarize research papers referenced by URL.

Wires a two-node Haystack pipeline -- a ``LinkContentFetcher`` feeding a
``PromptNode`` configured for the "claude-instant-1" model -- and runs it once
for every URL in ``research_papers``.

The ANTHROPIC_API_KEY environment variable must be set; otherwise the script
raises ``ValueError`` before building any component.
"""
import os

from haystack import Pipeline
from haystack.nodes import LinkContentFetcher, PromptNode, PromptTemplate

# Fail early: nothing below is useful without an API key for the model.
anthropic_key = os.getenv("ANTHROPIC_API_KEY")
if not anthropic_key:
    raise ValueError("Please set the ANTHROPIC_API_KEY environment variable")

# User agent strings handed to the fetcher via its ``user_agents`` argument.
alt_user_agents = [
    "Mozilla/5.0 (Macintosh; Intel Mac OS X 13_4_1) AppleWebKit/605.1.15 (KHTML, like Gecko) Version/16.5 Safari/605.1.15",
]
retriever = LinkContentFetcher(user_agents=alt_user_agents)

# Summarization instructions; ``{documents}`` is the template placeholder
# (presumably filled with the fetched content -- confirm against PromptTemplate).
summary_prompt = (
    "Given the content below, create a summary consisting of three sections: Objectives, "
    "Implementation and Learnings/Conclusions.\n"
    "Each section should have at least three bullet points. \n"
    "In the content below disregard References section.\n\n: {documents}"
)
pt = PromptTemplate(summary_prompt)

# NOTE(review): ``stream`` is forwarded through ``model_kwargs``; it looks like
# the answer is emitted while it is generated, which would explain why the loop
# below never prints the return value of ``pipeline.run`` -- confirm.
prompt_node = PromptNode(
    "claude-instant-1",
    api_key=anthropic_key,
    max_length=512,
    default_prompt_template=pt,
    model_kwargs={"stream": True},
)

# Query -> Retriever (link fetcher) -> PromptNode (summarizer)
pipeline = Pipeline()
pipeline.add_node(component=retriever, name="Retriever", inputs=["Query"])
pipeline.add_node(component=prompt_node, name="PromptNode", inputs=["Retriever"])

research_papers = [
    "https://arxiv.org/pdf/2307.03172.pdf",
    "https://arxiv.org/pdf/1706.03762.pdf",
]

# Each URL is passed to the pipeline as its query; a banner line precedes every
# run and blank lines separate consecutive papers in the console output.
for research_paper in research_papers:
    print(f"Research paper summary: {research_paper}")
    pipeline.run(research_paper)
    print("\n\n\n")