# crawl4ai/docs/examples/docker_python_sdk.py

import asyncio
from crawl4ai.docker_client import Crawl4aiDockerClient
from crawl4ai import (
    BrowserConfig,
    CrawlerRunConfig
)

async def main():
    """Run the Docker client example end to end.

    Opens a ``Crawl4aiDockerClient`` against ``http://localhost:8000`` and,
    inside that session, performs three steps in order:

    1. Crawls two URLs with a default ``CrawlerRunConfig`` and prints the
       awaited return value as a whole.
    2. Crawls the same URLs with ``CrawlerRunConfig(stream=True)``, consumes
       the awaited return value with ``async for`` and prints every item.
    3. Calls ``get_schema()`` and prints what it returns.
    """
    target_urls = ("https://example.com", "https://python.org")

    docker_client = Crawl4aiDockerClient(
        base_url="http://localhost:8000",
        verbose=True,
    )
    async with docker_client as client:
        # If jwt is enabled, authenticate first
        # await client.authenticate("test@example.com")

        # --- Non-streaming: everything comes back from a single await ---
        results = await client.crawl(
            list(target_urls),
            browser_config=BrowserConfig(headless=True),
            crawler_config=CrawlerRunConfig(),
        )
        print(f"Non-streaming results: {results}")

        # --- Streaming: the awaited value is iterated asynchronously ---
        streaming_config = CrawlerRunConfig(stream=True)
        stream = await client.crawl(
            list(target_urls),
            browser_config=BrowserConfig(headless=True),
            crawler_config=streaming_config,
        )
        async for result in stream:
            print(f"Streamed result: {result}")

        # --- Schema lookup ---
        schema = await client.get_schema()
        print(f"Schema: {schema}")

# Script entry point: run the example only when this file is executed
# directly, driving the main() coroutine with asyncio.run().
if __name__ == "__main__":
    asyncio.run(main())
# feat(docker): add JWT authentication and improve server architecture
#
# Add JWT token-based authentication to Docker server and client.
# Refactor server architecture for better code organization and error handling.
# Move Dockerfile to root deploy directory and update configuration.
# Add comprehensive documentation and examples.
#
# BREAKING CHANGE: Docker server now requires authentication by default.
# Endpoints require JWT tokens when security.jwt_enabled is true in config.
#
# 2025-02-18 22:07:13 +08:00
			`import asyncio`
			`from crawl4ai.docker_client import Crawl4aiDockerClient`
			`from crawl4ai import (`
			`BrowserConfig,`
			`CrawlerRunConfig`
			`)`

			`async def main():`
			`async with Crawl4aiDockerClient(base_url="http://localhost:8000", verbose=True) as client:`
			`# If jwt is enabled, authenticate first`
			`# await client.authenticate("test@example.com")`

			`# Non-streaming crawl`
			`results = await client.crawl(`
			`["https://example.com", "https://python.org"],`
			`browser_config=BrowserConfig(headless=True),`
			`crawler_config=CrawlerRunConfig()`
			`)`
			`print(f"Non-streaming results: {results}")`

			`# Streaming crawl`
			`crawler_config = CrawlerRunConfig(stream=True)`
			`async for result in await client.crawl(`
			`["https://example.com", "https://python.org"],`
			`browser_config=BrowserConfig(headless=True),`
			`crawler_config=crawler_config`
			`):`
			`print(f"Streamed result: {result}")`

			`# Get schema`
			`schema = await client.get_schema()`
			`print(f"Schema: {schema}")`

			`if __name__ == "__main__":`
			`asyncio.run(main())`