crawl4ai/docs/examples/hello_world_docker.py

import asyncio
from crawl4ai import *

async def main():
    # Configure browser to use Docker
    browser_config = BrowserConfig(
        headless=True,
        verbose=True,
        use_docker=True  # Enable Docker browser
    )

    async with AsyncWebCrawler(config=browser_config) as crawler:
        crawler_config = CrawlerRunConfig(
            cache_mode=CacheMode.BYPASS,
            markdown_generator=DefaultMarkdownGenerator(
                content_filter=PruningContentFilter(
                    threshold=0.48,
                    threshold_type="fixed",
                    min_word_threshold=0
                )
            )
        )

        result = await crawler.arun(
            url="https://www.helloworld.org",
            config=crawler_config
        )
        print(result.markdown_v2.raw_markdown[:500])

if __name__ == "__main__":
    asyncio.run(main())