From 09fd3e152a3a5132c63ed196ca974a130571e756 Mon Sep 17 00:00:00 2001 From: UncleCode Date: Tue, 3 Jun 2025 23:34:11 +0800 Subject: [PATCH] fix: Import os and adjust file saving path in URL seeder demo --- docs/examples/url_seeder/url_seeder_quick_demo.py | 15 +++++++++------ 1 file changed, 9 insertions(+), 6 deletions(-) diff --git a/docs/examples/url_seeder/url_seeder_quick_demo.py b/docs/examples/url_seeder/url_seeder_quick_demo.py index 3dc58b98..2a05f636 100644 --- a/docs/examples/url_seeder/url_seeder_quick_demo.py +++ b/docs/examples/url_seeder/url_seeder_quick_demo.py @@ -2,10 +2,12 @@ 🚀 URL Seeder + AsyncWebCrawler = Magic! Quick demo showing discovery → filter → crawl pipeline """ -import asyncio +import asyncio, os from crawl4ai import AsyncUrlSeeder, AsyncWebCrawler, SeedingConfig, CrawlerRunConfig, AsyncLogger, DefaultMarkdownGenerator from crawl4ai.content_filter_strategy import PruningContentFilter +CURRENT_DIR = os.path.dirname(os.path.abspath(__file__)) + # 🔍 Example 1: Discover ALL → Filter → Crawl async def discover_and_crawl(): """Find Python module tutorials & extract them all!""" @@ -57,6 +59,7 @@ async def discover_and_crawl(): if result.success: # Save each tutorial (name from URL) name = result.url.split("/")[-2] + ".md" + name = os.path.join(CURRENT_DIR, name) with open(name, "w") as f: f.write(result.markdown.fit_markdown) saved += 1 @@ -117,11 +120,11 @@ async def smart_search_with_bm25(): # 🎬 Run the show! async def main(): - # print("=" * 60) - # await discover_and_crawl() - # print("\n" + "=" * 60 + "\n") - # await explore_beautifulsoup() - # print("\n" + "=" * 60 + "\n") + print("=" * 60) + await discover_and_crawl() + print("\n" + "=" * 60 + "\n") + await explore_beautifulsoup() + print("\n" + "=" * 60 + "\n") await smart_search_with_bm25() if __name__ == "__main__":