From 45f1652d980359b38fd2e80d0d9b564f883a68f6 Mon Sep 17 00:00:00 2001 From: UncleCode Date: Sat, 17 May 2025 10:31:19 +0800 Subject: [PATCH] Fix merge_chunks splitter usage and remove incorrect return --- crawl4ai/utils.py | 4 +--- 1 file changed, 1 insertion(+), 3 deletions(-) diff --git a/crawl4ai/utils.py b/crawl4ai/utils.py index bfa8ce9d..7214a80d 100644 --- a/crawl4ai/utils.py +++ b/crawl4ai/utils.py @@ -150,7 +150,7 @@ def merge_chunks( total_tokens = 0 for doc in docs: - tokens = doc.split() + tokens = splitter(doc) count = int(len(tokens) * word_token_ratio) if count: # Skip empty docs token_counts.append(count) @@ -1196,8 +1196,6 @@ def get_content_of_website_optimized( return None except InvalidSchema: return None - finally: - return image_height = img.get("height") height_value, height_unit = parse_dimension(image_height)