Renames browser_config param to config in AsyncWebCrawler
Standardizes parameter naming convention across the codebase by renaming browser_config to the more concise config in AsyncWebCrawler constructor. Updates all documentation examples and internal usages to reflect the new parameter name for consistency. Also improves hook execution by adding url/response parameters to goto hooks and fixes parameter ordering in before_return_html hook.
This commit is contained in:
@@ -68,7 +68,7 @@ class AsyncWebCrawler:
|
||||
|
||||
New way (recommended):
|
||||
browser_config = BrowserConfig(browser_type="chromium", headless=True)
|
||||
crawler = AsyncWebCrawler(browser_config=browser_config)
|
||||
crawler = AsyncWebCrawler(config=browser_config)
|
||||
"""
|
||||
_domain_last_hit = {}
|
||||
|
||||
@@ -117,12 +117,19 @@ class AsyncWebCrawler:
|
||||
|
||||
|
||||
# Initialize crawler strategy
|
||||
params = {
|
||||
k:v for k, v in kwargs.items() if k in ['browser_congig', 'logger']
|
||||
}
|
||||
self.crawler_strategy = crawler_strategy or AsyncPlaywrightCrawlerStrategy(
|
||||
browser_config=browser_config,
|
||||
logger=self.logger,
|
||||
**kwargs # Pass remaining kwargs for backwards compatibility
|
||||
**params # Pass remaining kwargs for backwards compatibility
|
||||
)
|
||||
|
||||
# If craweler strategy doesnt have logger, use crawler logger
|
||||
if not self.crawler_strategy.logger:
|
||||
self.crawler_strategy.logger = self.logger
|
||||
|
||||
# Handle deprecated cache parameter
|
||||
if always_by_pass_cache is not None:
|
||||
if kwargs.get("warning", True):
|
||||
|
||||
Reference in New Issue
Block a user