Merge branch 'format-inline-tags'

This commit is contained in:
unclecode
2024-06-19 00:48:38 +08:00
5 changed files with 56 additions and 3 deletions

View File

@@ -176,7 +176,7 @@ class WebCrawler:
t = time.time()
# Extract content from HTML
try:
- result = get_content_of_website(url, html, word_count_threshold, css_selector=css_selector)
+ result = get_content_of_website(url, html, word_count_threshold, css_selector=css_selector, only_text=kwargs.get("only_text", False))
metadata = extract_metadata(html)
if result is None:
raise ValueError(f"Failed to extract content from the website: {url}")