From 5ce1dc1622e2e17c7f16fef2edbd9fe1820dcd92 Mon Sep 17 00:00:00 2001 From: UncleCode Date: Thu, 16 May 2024 21:58:11 +0800 Subject: [PATCH] Update web_crawler.py Set all extraction strategies default to NoExtractionStrategy --- crawl4ai/web_crawler.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/crawl4ai/web_crawler.py b/crawl4ai/web_crawler.py index 7fa4304f..311ae351 100644 --- a/crawl4ai/web_crawler.py +++ b/crawl4ai/web_crawler.py @@ -63,7 +63,7 @@ class WebCrawler: extract_blocks_flag: bool = True, word_count_threshold=MIN_WORD_THRESHOLD, use_cached_html: bool = False, - extraction_strategy: ExtractionStrategy = LLMExtractionStrategy(), + extraction_strategy: ExtractionStrategy = NoExtractionStrategy(), chunking_strategy: ChunkingStrategy = RegexChunking(), **kwargs, ) -> CrawlResult: