48 lines
1.5 KiB
Python

#!/usr/bin/env python3
"""
Minimal examples for Firecrawl v2.
"""
import os
from dotenv import load_dotenv
from firecrawl import Firecrawl
load_dotenv()
def main():
api_key = os.getenv("FIRECRAWL_API_KEY")
if not api_key:
raise ValueError("FIRECRAWL_API_KEY is not set")
api_url = os.getenv("FIRECRAWL_API_URL")
if not api_url:
raise ValueError("FIRECRAWL_API_URL is not set")
firecrawl = Firecrawl(api_key=api_key, api_url=api_url)
# # Scrape
# doc = firecrawl.scrape("https://docs.firecrawl.dev", formats=["markdown"])
# print("scrape:", doc.markdown)
# # Crawl (waits until terminal state)
# crawl_job = firecrawl.crawl("https://docs.firecrawl.dev", limit=3, poll_interval=1, timeout=120)
# print("crawl:", crawl_job.status, crawl_job.completed, "/", crawl_job.total)
# # Batch scrape
# batch = firecrawl.batch_scrape([
# "https://docs.firecrawl.dev",
# "https://firecrawl.dev",
# ], formats=["markdown"], poll_interval=1, wait_timeout=120)
# print("batch:", batch.status, batch.completed, "/", batch.total)
# # Search
# search_response = firecrawl.search(query="What is the capital of France?", limit=5)
# print("search web results:", len(getattr(search_response, "web", []) or []))
# Map
map_response = firecrawl.map("https://firecrawl.dev")
print("map links:", len(getattr(map_response, "links", []) or []))
if __name__ == "__main__":
main()