fix: Added browser config and crawler run config from 0.4.22

This commit is contained in:
Aravind Karnam
2024-12-18 10:33:09 +05:30
parent 7c0fa269a6
commit 7a5f83b76f
2 changed files with 9 additions and 6 deletions

View File

@@ -14,7 +14,7 @@ from collections import defaultdict
from .models import CrawlResult
from .filters import FilterChain
from .scorers import URLScorer
from ..async_webcrawler import AsyncWebCrawler
from ..async_webcrawler import AsyncWebCrawler, CrawlerRunConfig
from .scraper_strategy import ScraperStrategy
@dataclass
@@ -116,7 +116,8 @@ class BFSScraperStrategy(ScraperStrategy):
) -> CrawlResult:
"""Crawl URL with retry logic"""
try:
return await asyncio.wait_for(crawler.arun(url), timeout=self.timeout)
crawler_config = CrawlerRunConfig(cache_mode="BYPASS")
return await asyncio.wait_for(crawler.arun(url, config=crawler_config), timeout=self.timeout)
except asyncio.TimeoutError:
self.logger.error(f"Timeout crawling {url}")
raise