From 0bba0e074f720a5d03027ee8fdf699f46ce8af82 Mon Sep 17 00:00:00 2001
From: bizrockman <d.gerst@bizrock.de>
Date: Mon, 4 Nov 2024 20:12:24 +0100
Subject: [PATCH 001/115] Preventing NoneType has no attribute get Errors

Some Tag elements in the image list do not have attrs set, so calling img.get('src') on them raises this error; such elements are now skipped.
---
 crawl4ai/utils.py | 9 ++++++---
 1 file changed, 6 insertions(+), 3 deletions(-)

diff --git a/crawl4ai/utils.py b/crawl4ai/utils.py
index baa08a0f..869c22d5 100644
--- a/crawl4ai/utils.py
+++ b/crawl4ai/utils.py
@@ -706,9 +706,12 @@ def get_content_of_website_optimized(url: str, html: str, word_count_threshold:
     body = flatten_nested_elements(body)
     base64_pattern = re.compile(r'data:image/[^;]+;base64,([^"]+)')
     for img in imgs:
-        src = img.get('src', '')
-        if base64_pattern.match(src):
-            img['src'] = base64_pattern.sub('', src)
+        try:
+            src = img.get('src', '')
+            if base64_pattern.match(src):
+                img['src'] = base64_pattern.sub('', src)
+        except:
+            pass        
 
     cleaned_html = str(body).replace('\n\n', '\n').replace('  ', ' ')
     cleaned_html = sanitize_html(cleaned_html)

From a28046c233059c3dc2c4ce442e5cda6f7f18645b Mon Sep 17 00:00:00 2001
From: bizrockman <d.gerst@bizrock.de>
Date: Mon, 4 Nov 2024 20:18:26 +0100
Subject: [PATCH 002/115] Rename
 episode_08_Media_Handling:_Images,_Videos,_and_Audio.md to
 episode_08_Media_Handling_Images_Videos_and_Audio.md

Use a file name that also works on Windows (colons are not allowed in Windows file names).
---
 ....md => episode_08_Media_Handling_Images_Videos_and_Audio.md} | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)
 rename docs/md_v2/tutorial/{episode_08_Media_Handling:_Images,_Videos,_and_Audio.md => episode_08_Media_Handling_Images_Videos_and_Audio.md} (99%)

diff --git a/docs/md_v2/tutorial/episode_08_Media_Handling:_Images,_Videos,_and_Audio.md b/docs/md_v2/tutorial/episode_08_Media_Handling_Images_Videos_and_Audio.md
similarity index 99%
rename from docs/md_v2/tutorial/episode_08_Media_Handling:_Images,_Videos,_and_Audio.md
rename to docs/md_v2/tutorial/episode_08_Media_Handling_Images_Videos_and_Audio.md
index c3a57009..c0daacad 100644
--- a/docs/md_v2/tutorial/episode_08_Media_Handling:_Images,_Videos,_and_Audio.md
+++ b/docs/md_v2/tutorial/episode_08_Media_Handling_Images_Videos_and_Audio.md
@@ -113,4 +113,4 @@ Here’s a clear and focused outline for the **Media Handling: Images, Videos, a
 
 ---
 
-This outline provides users with a complete guide to handling images, videos, and audio in Crawl4AI, using metadata to enhance relevance and precision in multimedia extraction.
\ No newline at end of file
+This outline provides users with a complete guide to handling images, videos, and audio in Crawl4AI, using metadata to enhance relevance and precision in multimedia extraction.

From 870296fa7ee43b221cdede34dbe22a8a2ea4ea4c Mon Sep 17 00:00:00 2001
From: bizrockman <d.gerst@bizrock.de>
Date: Mon, 4 Nov 2024 20:18:58 +0100
Subject: [PATCH 003/115] Rename
 episode_11_1_Extraction_Strategies:_JSON_CSS.md to
 episode_11_1_Extraction_Strategies_JSON_CSS.md

Use a file name that also works on Windows (colons are not allowed in Windows file names).
---
 ...ON_CSS.md => episode_11_1_Extraction_Strategies_JSON_CSS.md} | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)
 rename docs/md_v2/tutorial/{episode_11_1_Extraction_Strategies:_JSON_CSS.md => episode_11_1_Extraction_Strategies_JSON_CSS.md} (99%)

diff --git a/docs/md_v2/tutorial/episode_11_1_Extraction_Strategies:_JSON_CSS.md b/docs/md_v2/tutorial/episode_11_1_Extraction_Strategies_JSON_CSS.md
similarity index 99%
rename from docs/md_v2/tutorial/episode_11_1_Extraction_Strategies:_JSON_CSS.md
rename to docs/md_v2/tutorial/episode_11_1_Extraction_Strategies_JSON_CSS.md
index a8a357af..b460ff8c 100644
--- a/docs/md_v2/tutorial/episode_11_1_Extraction_Strategies:_JSON_CSS.md
+++ b/docs/md_v2/tutorial/episode_11_1_Extraction_Strategies_JSON_CSS.md
@@ -183,4 +183,4 @@ Here’s a detailed outline for the **JSON-CSS Extraction Strategy** video, cove
 
 ---
 
-This outline covers each JSON-CSS Extraction option in Crawl4AI, with practical examples and schema configurations, making it a thorough guide for users.
\ No newline at end of file
+This outline covers each JSON-CSS Extraction option in Crawl4AI, with practical examples and schema configurations, making it a thorough guide for users.

From 3a3c88a2d0d76141179d9284d43021083d1e663b Mon Sep 17 00:00:00 2001
From: bizrockman <d.gerst@bizrock.de>
Date: Mon, 4 Nov 2024 20:19:20 +0100
Subject: [PATCH 004/115] Rename episode_11_2_Extraction_Strategies:_LLM.md to
 episode_11_2_Extraction_Strategies_LLM.md

Use a file name that also works on Windows (colons are not allowed in Windows file names).
---
 ...tegies:_LLM.md => episode_11_2_Extraction_Strategies_LLM.md} | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)
 rename docs/md_v2/tutorial/{episode_11_2_Extraction_Strategies:_LLM.md => episode_11_2_Extraction_Strategies_LLM.md} (99%)

diff --git a/docs/md_v2/tutorial/episode_11_2_Extraction_Strategies:_LLM.md b/docs/md_v2/tutorial/episode_11_2_Extraction_Strategies_LLM.md
similarity index 99%
rename from docs/md_v2/tutorial/episode_11_2_Extraction_Strategies:_LLM.md
rename to docs/md_v2/tutorial/episode_11_2_Extraction_Strategies_LLM.md
index 900c32f2..3682425f 100644
--- a/docs/md_v2/tutorial/episode_11_2_Extraction_Strategies:_LLM.md
+++ b/docs/md_v2/tutorial/episode_11_2_Extraction_Strategies_LLM.md
@@ -150,4 +150,4 @@ Here’s a comprehensive outline for the **LLM Extraction Strategy** video, cove
 
 ---
 
-This outline explains LLM Extraction in Crawl4AI, with examples showing how to extract structured data using custom schemas and instructions. It demonstrates flexibility with multiple providers, ensuring practical application for different use cases.
\ No newline at end of file
+This outline explains LLM Extraction in Crawl4AI, with examples showing how to extract structured data using custom schemas and instructions. It demonstrates flexibility with multiple providers, ensuring practical application for different use cases.

From 796dbaf08c92efd606c5b82d00168c29702f6927 Mon Sep 17 00:00:00 2001
From: bizrockman <d.gerst@bizrock.de>
Date: Mon, 4 Nov 2024 20:19:43 +0100
Subject: [PATCH 005/115] Rename episode_11_3_Extraction_Strategies:_Cosine.md
 to episode_11_3_Extraction_Strategies_Cosine.md

Use a file name that also works on Windows (colons are not allowed in Windows file names).
---
 ...:_Cosine.md => episode_11_3_Extraction_Strategies_Cosine.md} | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)
 rename docs/md_v2/tutorial/{episode_11_3_Extraction_Strategies:_Cosine.md => episode_11_3_Extraction_Strategies_Cosine.md} (99%)

diff --git a/docs/md_v2/tutorial/episode_11_3_Extraction_Strategies:_Cosine.md b/docs/md_v2/tutorial/episode_11_3_Extraction_Strategies_Cosine.md
similarity index 99%
rename from docs/md_v2/tutorial/episode_11_3_Extraction_Strategies:_Cosine.md
rename to docs/md_v2/tutorial/episode_11_3_Extraction_Strategies_Cosine.md
index 61e210e4..9f1c00ea 100644
--- a/docs/md_v2/tutorial/episode_11_3_Extraction_Strategies:_Cosine.md
+++ b/docs/md_v2/tutorial/episode_11_3_Extraction_Strategies_Cosine.md
@@ -133,4 +133,4 @@ Here’s a structured outline for the **Cosine Similarity Strategy** video, cove
 
 ---
 
-This outline covers Cosine Similarity Strategy’s speed and effectiveness, providing examples that showcase its potential for clustering various content types efficiently.
\ No newline at end of file
+This outline covers Cosine Similarity Strategy’s speed and effectiveness, providing examples that showcase its potential for clustering various content types efficiently.

From 9f5eef1f3890094a4df707458fa611a83398429d Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Wed, 6 Nov 2024 21:50:09 +0800
Subject: [PATCH 006/115] Comment out the no-op branch for header tags (h1-h6)
 in the `CustomHTML2Text` class in `content_scrapping_strategy.py`, so these
 tags are now passed to `super().handle_tag()` instead of being ignored.

---
 crawl4ai/content_scrapping_strategy.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/crawl4ai/content_scrapping_strategy.py b/crawl4ai/content_scrapping_strategy.py
index 66b3ad91..caed7319 100644
--- a/crawl4ai/content_scrapping_strategy.py
+++ b/crawl4ai/content_scrapping_strategy.py
@@ -93,8 +93,8 @@ class CustomHTML2Text(HTML2Text):
             else:
                 self.o('\n```')
                 self.inside_pre = False
-        elif tag in ["h1", "h2", "h3", "h4", "h5", "h6"]:
-            pass
+        # elif tag in ["h1", "h2", "h3", "h4", "h5", "h6"]:
+        #     pass
         else:
             super().handle_tag(tag, attrs, start)
 

From 2879344d9ccc281054587c079a5d5d2a2245b60a Mon Sep 17 00:00:00 2001
From: devatnull <lateralus@criptext.com>
Date: Wed, 6 Nov 2024 17:36:46 +0300
Subject: [PATCH 007/115] Update README.md

---
 README.md | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/README.md b/README.md
index 28563762..a0e8b005 100644
--- a/README.md
+++ b/README.md
@@ -1,4 +1,4 @@
-# 🔥🕷️ Crawl4AI: LLM Friendly Web Crawler & Scrapper
+# 🔥🕷️ Crawl4AI: LLM Friendly Web Crawler & Scraper
 
 <a href="https://trendshift.io/repositories/11716" target="_blank"><img src="https://trendshift.io/api/badge/repositories/11716" alt="unclecode%2Fcrawl4ai | Trendshift" style="width: 250px; height: 55px;" width="250" height="55"/></a>
 
@@ -480,4 +480,4 @@ For a detailed exploration of our vision, challenges, and solutions, please see
 
 ## Star History
 
-[![Star History Chart](https://api.star-history.com/svg?repos=unclecode/crawl4ai&type=Date)](https://star-history.com/#unclecode/crawl4ai&Date)
\ No newline at end of file
+[![Star History Chart](https://api.star-history.com/svg?repos=unclecode/crawl4ai&type=Date)](https://star-history.com/#unclecode/crawl4ai&Date)

From f7574230a11278fef07f7dcaeb29a3b45752380f Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Thu, 7 Nov 2024 19:29:31 +0800
Subject: [PATCH 008/115] Update API server request object, test_docker file,
 and README

---
 README.md            | 2 +-
 main.py              | 3 ++-
 tests/test_docker.py | 7 ++++---
 3 files changed, 7 insertions(+), 5 deletions(-)

diff --git a/README.md b/README.md
index 28563762..1f36aca6 100644
--- a/README.md
+++ b/README.md
@@ -22,7 +22,7 @@ Use the [Crawl4AI GPT Assistant](https://tinyurl.com/crawl4ai-gpt) as your AI-po
 ## New in 0.3.73 ✨
 
 - 🐳 Docker Ready: Full API server with seamless deployment & scaling
-- 🎯 Smart Browser: Managed browser integration with CDP support
+- 🎯 Browser Takeover: Use your own browser with cookies & history intact (CDP support)
 - 📝 Mockdown+: Enhanced tag preservation & content extraction
 - ⚡️ Parallel Power: Supercharged multi-URL crawling performance
 - 🌟 And many more exciting updates...
diff --git a/main.py b/main.py
index 3e32fe9c..853cd0b7 100644
--- a/main.py
+++ b/main.py
@@ -62,6 +62,7 @@ class CrawlRequest(BaseModel):
     css_selector: Optional[str] = None
     screenshot: bool = False
     magic: bool = False
+    extra: Optional[Dict[str, Any]] = {}
 
 @dataclass
 class TaskInfo:
@@ -251,7 +252,7 @@ class CrawlerService:
         while True:
             try:
                 available_slots = await self.resource_monitor.get_available_slots()
-                if available_slots <= 0:
+                if False and available_slots <= 0:
                     await asyncio.sleep(1)
                     continue
 
diff --git a/tests/test_docker.py b/tests/test_docker.py
index 913450ca..c22acd55 100644
--- a/tests/test_docker.py
+++ b/tests/test_docker.py
@@ -7,7 +7,7 @@ import os
 from typing import Dict, Any
 
 class Crawl4AiTester:
-    def __init__(self, base_url: str = "http://localhost:8000"):
+    def __init__(self, base_url: str = "http://localhost:11235"):
         self.base_url = base_url
         
     def submit_and_wait(self, request_data: Dict[str, Any], timeout: int = 300) -> Dict[str, Any]:
@@ -54,8 +54,9 @@ def test_docker_deployment(version="basic"):
     
     # Test cases based on version
     test_basic_crawl(tester)
-    if version in ["full", "transformer"]:
-        test_cosine_extraction(tester)
+    
+    # if version in ["full", "transformer"]:
+    #     test_cosine_extraction(tester)
 
     # test_js_execution(tester)
     # test_css_selector(tester)

From b120965b6ac9773f599a854f214aa16c1a7426b9 Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Thu, 7 Nov 2024 20:15:03 +0800
Subject: [PATCH 009/115] Fix the managed browser, which could not connect to
 the user data directory and could not create new pages within the managed
 browser context.

---
 crawl4ai/async_crawler_strategy.py | 143 +++++++++++++++++++----------
 1 file changed, 93 insertions(+), 50 deletions(-)

diff --git a/crawl4ai/async_crawler_strategy.py b/crawl4ai/async_crawler_strategy.py
index e79c8268..fa50e7b5 100644
--- a/crawl4ai/async_crawler_strategy.py
+++ b/crawl4ai/async_crawler_strategy.py
@@ -187,6 +187,7 @@ class AsyncPlaywrightCrawlerStrategy(AsyncCrawlerStrategy):
         self.use_managed_browser = kwargs.get("use_managed_browser", False)
         self.user_data_dir = kwargs.get("user_data_dir", None)
         self.managed_browser = None
+        self.default_context = None
         self.hooks = {
             'on_browser_created': None,
             'on_user_agent_updated': None,
@@ -217,6 +218,25 @@ class AsyncPlaywrightCrawlerStrategy(AsyncCrawlerStrategy):
                 )
                 cdp_url = await self.managed_browser.start()
                 self.browser = await self.playwright.chromium.connect_over_cdp(cdp_url)
+                
+                # Get the default context that maintains the user profile
+                contexts = self.browser.contexts
+                if contexts:
+                    self.default_context = contexts[0]
+                else:
+                    # If no default context exists, create one
+                    self.default_context = await self.browser.new_context(
+                        viewport={"width": 1920, "height": 1080}
+                    )
+                
+                # Set up the default context
+                if self.default_context:
+                    await self.default_context.set_extra_http_headers(self.headers)
+                    
+                    if self.user_agent:
+                        await self.default_context.set_extra_http_headers({
+                            "User-Agent": self.user_agent
+                        })
             else:
                 browser_args = {
                     "headless": self.headless,
@@ -254,12 +274,20 @@ class AsyncPlaywrightCrawlerStrategy(AsyncCrawlerStrategy):
     async def close(self):
         if self.sleep_on_close:
             await asyncio.sleep(0.5)
+            
+        # Close all active sessions
+        session_ids = list(self.sessions.keys())
+        for session_id in session_ids:
+            await self.kill_session(session_id)
+            
         if self.browser:
             await self.browser.close()
             self.browser = None
+            
         if self.managed_browser:
             await self.managed_browser.cleanup()
             self.managed_browser = None
+            
         if self.playwright:
             await self.playwright.stop()
             self.playwright = None
@@ -293,7 +321,8 @@ class AsyncPlaywrightCrawlerStrategy(AsyncCrawlerStrategy):
         if session_id in self.sessions:
             context, page, _ = self.sessions[session_id]
             await page.close()
-            await context.close()
+            if not self.use_managed_browser:
+                await context.close()
             del self.sessions[session_id]
 
     def _cleanup_expired_sessions(self):
@@ -415,61 +444,75 @@ class AsyncPlaywrightCrawlerStrategy(AsyncCrawlerStrategy):
         
         self._cleanup_expired_sessions()
         session_id = kwargs.get("session_id")
-        if session_id:
-            context, page, _ = self.sessions.get(session_id, (None, None, None))
-            if not context:
+        
+        # Handle page creation differently for managed browser
+        if self.use_managed_browser:
+            if session_id:
+                # Reuse existing session if available
+                context, page, _ = self.sessions.get(session_id, (None, None, None))
+                if not page:
+                    # Create new page in default context if session doesn't exist
+                    page = await self.default_context.new_page()
+                    self.sessions[session_id] = (self.default_context, page, time.time())
+            else:
+                # Create new page in default context for non-session requests
+                page = await self.default_context.new_page()
+        else:
+            if session_id:
+                context, page, _ = self.sessions.get(session_id, (None, None, None))
+                if not context:
+                    context = await self.browser.new_context(
+                        user_agent=self.user_agent,
+                        viewport={"width": 1920, "height": 1080},
+                        proxy={"server": self.proxy} if self.proxy else None,
+                        accept_downloads=True,
+                        java_script_enabled=True
+                    )
+                    await context.add_cookies([{"name": "cookiesEnabled", "value": "true", "url": url}])
+                    await context.set_extra_http_headers(self.headers)
+                    page = await context.new_page()
+                    self.sessions[session_id] = (context, page, time.time())
+            else:
                 context = await self.browser.new_context(
                     user_agent=self.user_agent,
                     viewport={"width": 1920, "height": 1080},
-                    proxy={"server": self.proxy} if self.proxy else None,
-                    accept_downloads=True,
-                    java_script_enabled=True
+                    proxy={"server": self.proxy} if self.proxy else None
                 )
-                await context.add_cookies([{"name": "cookiesEnabled", "value": "true", "url": url}])
                 await context.set_extra_http_headers(self.headers)
+                
+                if kwargs.get("override_navigator", False) or kwargs.get("simulate_user", False) or kwargs.get("magic", False):
+                    # Inject scripts to override navigator properties
+                    await context.add_init_script("""
+                        // Pass the Permissions Test.
+                        const originalQuery = window.navigator.permissions.query;
+                        window.navigator.permissions.query = (parameters) => (
+                            parameters.name === 'notifications' ?
+                                Promise.resolve({ state: Notification.permission }) :
+                                originalQuery(parameters)
+                        );
+                        Object.defineProperty(navigator, 'webdriver', {
+                            get: () => undefined
+                        });
+                        window.navigator.chrome = {
+                            runtime: {},
+                            // Add other properties if necessary
+                        };
+                        Object.defineProperty(navigator, 'plugins', {
+                            get: () => [1, 2, 3, 4, 5],
+                        });
+                        Object.defineProperty(navigator, 'languages', {
+                            get: () => ['en-US', 'en'],
+                        });
+                        Object.defineProperty(document, 'hidden', {
+                            get: () => false
+                        });
+                        Object.defineProperty(document, 'visibilityState', {
+                            get: () => 'visible'
+                        });
+                    """)
+                
                 page = await context.new_page()
-                self.sessions[session_id] = (context, page, time.time())
-        else:
-            context = await self.browser.new_context(
-                user_agent=self.user_agent,
-                viewport={"width": 1920, "height": 1080},
-                proxy={"server": self.proxy} if self.proxy else None
-            )
-            await context.set_extra_http_headers(self.headers)
-            
-            if kwargs.get("override_navigator", False) or kwargs.get("simulate_user", False) or kwargs.get("magic", False):
-                # Inject scripts to override navigator properties
-                await context.add_init_script("""
-                    // Pass the Permissions Test.
-                    const originalQuery = window.navigator.permissions.query;
-                    window.navigator.permissions.query = (parameters) => (
-                        parameters.name === 'notifications' ?
-                            Promise.resolve({ state: Notification.permission }) :
-                            originalQuery(parameters)
-                    );
-                    Object.defineProperty(navigator, 'webdriver', {
-                        get: () => undefined
-                    });
-                    window.navigator.chrome = {
-                        runtime: {},
-                        // Add other properties if necessary
-                    };
-                    Object.defineProperty(navigator, 'plugins', {
-                        get: () => [1, 2, 3, 4, 5],
-                    });
-                    Object.defineProperty(navigator, 'languages', {
-                        get: () => ['en-US', 'en'],
-                    });
-                    Object.defineProperty(document, 'hidden', {
-                        get: () => false
-                    });
-                    Object.defineProperty(document, 'visibilityState', {
-                        get: () => 'visible'
-                    });
-                """)
-            
-            page = await context.new_page()
-            # await stealth_async(page) #, stealth_config)
+                # await stealth_async(page) #, stealth_config)
 
         # Add console message and error logging
         if kwargs.get("log_console", False):

From bcdd80911fff320b041921f3d25524aae103e79a Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Fri, 8 Nov 2024 19:08:58 +0800
Subject: [PATCH 010/115] Remove some old files.

---
 crawl4ai/train.py            | 146 --------------
 crawl4ai/web_crawler.back.py | 357 -----------------------------------
 2 files changed, 503 deletions(-)
 delete mode 100644 crawl4ai/train.py
 delete mode 100644 crawl4ai/web_crawler.back.py

diff --git a/crawl4ai/train.py b/crawl4ai/train.py
deleted file mode 100644
index f7e7c1a9..00000000
--- a/crawl4ai/train.py
+++ /dev/null
@@ -1,146 +0,0 @@
-import spacy
-from spacy.training import Example
-import random
-import nltk
-from nltk.corpus import reuters
-import torch
-
-def save_spacy_model_as_torch(nlp, model_dir="models/reuters"):
-    # Extract the TextCategorizer component
-    textcat = nlp.get_pipe("textcat_multilabel")
-
-    # Convert the weights to a PyTorch state dictionary
-    state_dict = {name: torch.tensor(param.data) for name, param in textcat.model.named_parameters()}
-
-    # Save the state dictionary
-    torch.save(state_dict, f"{model_dir}/model_weights.pth")
-
-    # Extract and save the vocabulary
-    vocab = extract_vocab(nlp)
-    with open(f"{model_dir}/vocab.txt", "w") as vocab_file:
-        for word, idx in vocab.items():
-            vocab_file.write(f"{word}\t{idx}\n")
-    
-    print(f"Model weights and vocabulary saved to: {model_dir}")
-
-def extract_vocab(nlp):
-    # Extract vocabulary from the SpaCy model
-    vocab = {word: i for i, word in enumerate(nlp.vocab.strings)}
-    return vocab
-
-nlp = spacy.load("models/reuters")
-save_spacy_model_as_torch(nlp, model_dir="models")
-
-def train_and_save_reuters_model(model_dir="models/reuters"):
-    # Ensure the Reuters corpus is downloaded
-    nltk.download('reuters')
-    nltk.download('punkt')
-    if not reuters.fileids():
-        print("Reuters corpus not found.")
-        return
-
-    # Load a blank English spaCy model
-    nlp = spacy.blank("en")
-
-    # Create a TextCategorizer with the ensemble model for multi-label classification
-    textcat = nlp.add_pipe("textcat_multilabel")
-
-    # Add labels to text classifier
-    for label in reuters.categories():
-        textcat.add_label(label)
-
-    # Prepare training data
-    train_examples = []
-    for fileid in reuters.fileids():
-        categories = reuters.categories(fileid)
-        text = reuters.raw(fileid)
-        cats = {label: label in categories for label in reuters.categories()}
-        # Prepare spacy Example objects
-        doc = nlp.make_doc(text)
-        example = Example.from_dict(doc, {'cats': cats})
-        train_examples.append(example)
-
-    # Initialize the text categorizer with the example objects
-    nlp.initialize(lambda: train_examples)
-
-    # Train the model
-    random.seed(1)
-    spacy.util.fix_random_seed(1)
-    for i in range(5):  # Adjust iterations for better accuracy
-        random.shuffle(train_examples)
-        losses = {}
-        # Create batches of data
-        batches = spacy.util.minibatch(train_examples, size=8)
-        for batch in batches:
-            nlp.update(batch, drop=0.2, losses=losses)
-        print(f"Losses at iteration {i}: {losses}")
-
-    # Save the trained model
-    nlp.to_disk(model_dir)
-    print(f"Model saved to: {model_dir}")
-
-def train_model(model_dir, additional_epochs=0):
-    # Load the model if it exists, otherwise start with a blank model
-    try:
-        nlp = spacy.load(model_dir)
-        print("Model loaded from disk.")
-    except IOError:
-        print("No existing model found. Starting with a new model.")
-        nlp = spacy.blank("en")
-        textcat = nlp.add_pipe("textcat_multilabel")
-        for label in reuters.categories():
-            textcat.add_label(label)
-
-    # Prepare training data
-    train_examples = []
-    for fileid in reuters.fileids():
-        categories = reuters.categories(fileid)
-        text = reuters.raw(fileid)
-        cats = {label: label in categories for label in reuters.categories()}
-        doc = nlp.make_doc(text)
-        example = Example.from_dict(doc, {'cats': cats})
-        train_examples.append(example)
-
-    # Initialize the model if it was newly created
-    if 'textcat_multilabel' not in nlp.pipe_names:
-        nlp.initialize(lambda: train_examples)
-    else:
-        print("Continuing training with existing model.")
-
-    # Train the model
-    random.seed(1)
-    spacy.util.fix_random_seed(1)
-    num_epochs = 5 + additional_epochs
-    for i in range(num_epochs):
-        random.shuffle(train_examples)
-        losses = {}
-        batches = spacy.util.minibatch(train_examples, size=8)
-        for batch in batches:
-            nlp.update(batch, drop=0.2, losses=losses)
-        print(f"Losses at iteration {i}: {losses}")
-
-    # Save the trained model
-    nlp.to_disk(model_dir)
-    print(f"Model saved to: {model_dir}")
-
-def load_model_and_predict(model_dir, text, tok_k = 3):
-    # Load the trained model from the specified directory
-    nlp = spacy.load(model_dir)
-    
-    # Process the text with the loaded model
-    doc = nlp(text)
-    
-    # gee top 3 categories
-    top_categories = sorted(doc.cats.items(), key=lambda x: x[1], reverse=True)[:tok_k]
-    print(f"Top {tok_k} categories:")
-    
-    return top_categories    
-
-if __name__ == "__main__":
-    train_and_save_reuters_model()
-    train_model("models/reuters", additional_epochs=5)
-    model_directory = "reuters_model_10"
-    print(reuters.categories())
-    example_text = "Apple Inc. is reportedly buying a startup for $1 billion"
-    r =load_model_and_predict(model_directory, example_text)
-    print(r)
\ No newline at end of file
diff --git a/crawl4ai/web_crawler.back.py b/crawl4ai/web_crawler.back.py
deleted file mode 100644
index af78f126..00000000
--- a/crawl4ai/web_crawler.back.py
+++ /dev/null
@@ -1,357 +0,0 @@
-import os, time
-os.environ["TOKENIZERS_PARALLELISM"] = "false"
-from pathlib import Path
-
-from .models import UrlModel, CrawlResult
-from .database import init_db, get_cached_url, cache_url, DB_PATH, flush_db
-from .utils import *
-from .chunking_strategy import *
-from .extraction_strategy import *
-from .crawler_strategy import *
-from typing import List
-from concurrent.futures import ThreadPoolExecutor
-from .config import *
-
-
-class WebCrawler:
-    def __init__(
-        self,
-        # db_path: str = None,
-        crawler_strategy: CrawlerStrategy = None,
-        always_by_pass_cache: bool = False,
-        verbose: bool = False,
-    ):
-        # self.db_path = db_path
-        self.crawler_strategy = crawler_strategy or LocalSeleniumCrawlerStrategy(verbose=verbose)
-        self.always_by_pass_cache = always_by_pass_cache
-
-        # Create the .crawl4ai folder in the user's home directory if it doesn't exist
-        self.crawl4ai_folder = os.path.join(Path.home(), ".crawl4ai")
-        os.makedirs(self.crawl4ai_folder, exist_ok=True)
-        os.makedirs(f"{self.crawl4ai_folder}/cache", exist_ok=True)
-
-        # If db_path is not provided, use the default path
-        # if not db_path:
-            # self.db_path = f"{self.crawl4ai_folder}/crawl4ai.db"
-        
-        # flush_db()
-        init_db()
-        
-        self.ready = False
-        
-    def warmup(self):
-        print("[LOG] 🌤️  Warming up the WebCrawler")
-        result = self.run(
-            url='https://crawl4ai.uccode.io/',
-            word_count_threshold=5,
-            extraction_strategy= NoExtractionStrategy(),
-            bypass_cache=False,
-            verbose = False
-        )
-        self.ready = True
-        print("[LOG] 🌞 WebCrawler is ready to crawl")
-        
-    def fetch_page(
-        self,
-        url_model: UrlModel,
-        provider: str = DEFAULT_PROVIDER,
-        api_token: str = None,
-        extract_blocks_flag: bool = True,
-        word_count_threshold=MIN_WORD_THRESHOLD,
-        css_selector: str = None,
-        screenshot: bool = False,
-        use_cached_html: bool = False,
-        extraction_strategy: ExtractionStrategy = None,
-        chunking_strategy: ChunkingStrategy = RegexChunking(),
-        **kwargs,
-    ) -> CrawlResult:
-        return self.run(
-            url_model.url,
-            word_count_threshold,
-            extraction_strategy or NoExtractionStrategy(),
-            chunking_strategy,
-            bypass_cache=url_model.forced,
-            css_selector=css_selector,
-            screenshot=screenshot,
-            **kwargs,
-        )
-        pass
-
-    def run_old(
-        self,
-        url: str,
-        word_count_threshold=MIN_WORD_THRESHOLD,
-        extraction_strategy: ExtractionStrategy = None,
-        chunking_strategy: ChunkingStrategy = RegexChunking(),
-        bypass_cache: bool = False,
-        css_selector: str = None,
-        screenshot: bool = False,
-        user_agent: str = None,
-        verbose=True,
-        **kwargs,
-    ) -> CrawlResult:
-        if user_agent:
-            self.crawler_strategy.update_user_agent(user_agent)
-        extraction_strategy = extraction_strategy or NoExtractionStrategy()
-        extraction_strategy.verbose = verbose
-        # Check if extraction strategy is an instance of ExtractionStrategy if not raise an error
-        if not isinstance(extraction_strategy, ExtractionStrategy):
-            raise ValueError("Unsupported extraction strategy")
-        if not isinstance(chunking_strategy, ChunkingStrategy):
-            raise ValueError("Unsupported chunking strategy")
-        
-        # make sure word_count_threshold is not lesser than MIN_WORD_THRESHOLD
-        if word_count_threshold < MIN_WORD_THRESHOLD:
-            word_count_threshold = MIN_WORD_THRESHOLD
-
-        # Check cache first
-        if not bypass_cache and not self.always_by_pass_cache:
-            cached = get_cached_url(url)
-            if cached:
-                return CrawlResult(
-                    **{
-                        "url": cached[0],
-                        "html": cached[1],
-                        "cleaned_html": cached[2],
-                        "markdown": cached[3],
-                        "extracted_content": cached[4],
-                        "success": cached[5],
-                        "media": json.loads(cached[6] or "{}"),
-                        "links": json.loads(cached[7] or "{}"),
-                        "metadata": json.loads(cached[8] or "{}"), # "metadata": "{}
-                        "screenshot": cached[9],
-                        "error_message": "",
-                    }
-                )
-
-        # Initialize WebDriver for crawling
-        t = time.time()
-        if kwargs.get("js", None):
-            self.crawler_strategy.js_code = kwargs.get("js")
-        html = self.crawler_strategy.crawl(url)
-        base64_image = None
-        if screenshot:
-            base64_image = self.crawler_strategy.take_screenshot()
-        success = True
-        error_message = ""
-        # Extract content from HTML
-        try:
-            result = get_content_of_website(url, html, word_count_threshold, css_selector=css_selector)
-            metadata = extract_metadata(html)
-            if result is None:
-                raise ValueError(f"Failed to extract content from the website: {url}")
-        except InvalidCSSSelectorError as e:
-            raise ValueError(str(e))
-        
-        cleaned_html = result.get("cleaned_html", "")
-        markdown = result.get("markdown", "")
-        media = result.get("media", [])
-        links = result.get("links", [])
-
-        # Print a profession LOG style message, show time taken and say crawling is done
-        if verbose:
-            print(
-                f"[LOG] 🚀 Crawling done for {url}, success: {success}, time taken: {time.time() - t} seconds"
-            )
-
-        extracted_content = []
-        if verbose:
-            print(f"[LOG] 🔥 Extracting semantic blocks for {url}, Strategy: {extraction_strategy.name}")
-        t = time.time()
-        # Split markdown into sections
-        sections = chunking_strategy.chunk(markdown)
-        # sections = merge_chunks_based_on_token_threshold(sections, CHUNK_TOKEN_THRESHOLD)
-
-        extracted_content = extraction_strategy.run(
-            url, sections,
-        )
-        extracted_content = json.dumps(extracted_content)
-
-        if verbose:
-            print(
-                f"[LOG] 🚀 Extraction done for {url}, time taken: {time.time() - t} seconds."
-            )
-
-        # Cache the result
-        cleaned_html = beautify_html(cleaned_html)
-        cache_url(
-            url,
-            html,
-            cleaned_html,
-            markdown,
-            extracted_content,
-            success,
-            json.dumps(media),
-            json.dumps(links),
-            json.dumps(metadata),
-            screenshot=base64_image,
-        )
-
-        return CrawlResult(
-            url=url,
-            html=html,
-            cleaned_html=cleaned_html,
-            markdown=markdown,
-            media=media,
-            links=links,
-            metadata=metadata,
-            screenshot=base64_image,
-            extracted_content=extracted_content,
-            success=success,
-            error_message=error_message,
-        )
-
-    def fetch_pages(
-        self,
-        url_models: List[UrlModel],
-        provider: str = DEFAULT_PROVIDER,
-        api_token: str = None,
-        extract_blocks_flag: bool = True,
-        word_count_threshold=MIN_WORD_THRESHOLD,
-        use_cached_html: bool = False,
-        css_selector: str = None,
-        screenshot: bool = False,
-        extraction_strategy: ExtractionStrategy = None,
-        chunking_strategy: ChunkingStrategy = RegexChunking(),
-        **kwargs,
-    ) -> List[CrawlResult]:
-        extraction_strategy = extraction_strategy or NoExtractionStrategy()
-        def fetch_page_wrapper(url_model, *args, **kwargs):
-            return self.fetch_page(url_model, *args, **kwargs)
-
-        with ThreadPoolExecutor() as executor:
-            results = list(
-                executor.map(
-                    fetch_page_wrapper,
-                    url_models,
-                    [provider] * len(url_models),
-                    [api_token] * len(url_models),
-                    [extract_blocks_flag] * len(url_models),
-                    [word_count_threshold] * len(url_models),
-                    [css_selector] * len(url_models),
-                    [screenshot] * len(url_models),
-                    [use_cached_html] * len(url_models),
-                    [extraction_strategy] * len(url_models),
-                    [chunking_strategy] * len(url_models),
-                    *[kwargs] * len(url_models),
-                )
-            )
-
-        return results
-
-    def run(
-            self,
-            url: str,
-            word_count_threshold=MIN_WORD_THRESHOLD,
-            extraction_strategy: ExtractionStrategy = None,
-            chunking_strategy: ChunkingStrategy = RegexChunking(),
-            bypass_cache: bool = False,
-            css_selector: str = None,
-            screenshot: bool = False,
-            user_agent: str = None,
-            verbose=True,
-            **kwargs,
-        ) -> CrawlResult:
-            extraction_strategy = extraction_strategy or NoExtractionStrategy()
-            extraction_strategy.verbose = verbose
-            if not isinstance(extraction_strategy, ExtractionStrategy):
-                raise ValueError("Unsupported extraction strategy")
-            if not isinstance(chunking_strategy, ChunkingStrategy):
-                raise ValueError("Unsupported chunking strategy")
-            
-            if word_count_threshold < MIN_WORD_THRESHOLD:
-                word_count_threshold = MIN_WORD_THRESHOLD
-
-            # Check cache first
-            cached = None
-            extracted_content = None
-            if not bypass_cache and not self.always_by_pass_cache:
-                cached = get_cached_url(url)
-            
-            if cached:
-                html = cached[1]
-                extracted_content = cached[2]
-                if screenshot:
-                    screenshot = cached[9]
-            
-            else:
-                if user_agent:
-                    self.crawler_strategy.update_user_agent(user_agent)
-                html = self.crawler_strategy.crawl(url)
-                if screenshot:
-                    screenshot = self.crawler_strategy.take_screenshot()
-            
-            return self.process_html(url, html, extracted_content, word_count_threshold, extraction_strategy, chunking_strategy, css_selector, screenshot, verbose, bool(cached), **kwargs)
-
-    def process_html(
-            self,
-            url: str,
-            html: str,
-            extracted_content: str,
-            word_count_threshold: int,
-            extraction_strategy: ExtractionStrategy,
-            chunking_strategy: ChunkingStrategy,
-            css_selector: str,
-            screenshot: bool,
-            verbose: bool,
-            is_cached: bool,
-            **kwargs,
-        ) -> CrawlResult:
-            t = time.time()
-            # Extract content from HTML
-            try:
-                result = get_content_of_website(url, html, word_count_threshold, css_selector=css_selector)
-                metadata = extract_metadata(html)
-                if result is None:
-                    raise ValueError(f"Failed to extract content from the website: {url}")
-            except InvalidCSSSelectorError as e:
-                raise ValueError(str(e))
-            
-            cleaned_html = result.get("cleaned_html", "")
-            markdown = result.get("markdown", "")
-            media = result.get("media", [])
-            links = result.get("links", [])
-
-            if verbose:
-                print(f"[LOG] 🚀 Crawling done for {url}, success: True, time taken: {time.time() - t} seconds")
-                        
-            if extracted_content is None:
-                if verbose:
-                    print(f"[LOG] 🔥 Extracting semantic blocks for {url}, Strategy: {extraction_strategy.name}")
-
-                sections = chunking_strategy.chunk(markdown)
-                extracted_content = extraction_strategy.run(url, sections)
-                extracted_content = json.dumps(extracted_content)
-
-                if verbose:
-                    print(f"[LOG] 🚀 Extraction done for {url}, time taken: {time.time() - t} seconds.")
-                
-            screenshot = None if not screenshot else screenshot
-            
-            if not is_cached:
-                cache_url(
-                    url,
-                    html,
-                    cleaned_html,
-                    markdown,
-                    extracted_content,
-                    True,
-                    json.dumps(media),
-                    json.dumps(links),
-                    json.dumps(metadata),
-                    screenshot=screenshot,
-                )                
-
-            return CrawlResult(
-                url=url,
-                html=html,
-                cleaned_html=cleaned_html,
-                markdown=markdown,
-                media=media,
-                links=links,
-                metadata=metadata,
-                screenshot=screenshot,
-                extracted_content=extracted_content,
-                success=True,
-                error_message="",
-            )
\ No newline at end of file

From f9a297e08deac1963a302f8e70d0fe284564ceca Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Fri, 8 Nov 2024 19:39:05 +0800
Subject: [PATCH 011/115] Add Docker example script for testing Crawl4AI
 functionality

---
 docs/examples/docker_example.py | 300 ++++++++++++++++++++++++++++++++
 1 file changed, 300 insertions(+)
 create mode 100644 docs/examples/docker_example.py

diff --git a/docs/examples/docker_example.py b/docs/examples/docker_example.py
new file mode 100644
index 00000000..c22acd55
--- /dev/null
+++ b/docs/examples/docker_example.py
@@ -0,0 +1,300 @@
+import requests
+import json
+import time
+import sys
+import base64
+import os
+from typing import Dict, Any
+
+class Crawl4AiTester:
+    def __init__(self, base_url: str = "http://localhost:11235"):
+        self.base_url = base_url
+        
+    def submit_and_wait(self, request_data: Dict[str, Any], timeout: int = 300) -> Dict[str, Any]:
+        # Submit crawl job
+        response = requests.post(f"{self.base_url}/crawl", json=request_data)
+        task_id = response.json()["task_id"]
+        print(f"Task ID: {task_id}")
+        
+        # Poll for result
+        start_time = time.time()
+        while True:
+            if time.time() - start_time > timeout:
+                raise TimeoutError(f"Task {task_id} did not complete within {timeout} seconds")
+                
+            result = requests.get(f"{self.base_url}/task/{task_id}")
+            status = result.json()
+            
+            if status["status"] == "failed":
+                print("Task failed:", status.get("error"))
+                raise Exception(f"Task failed: {status.get('error')}")
+                
+            if status["status"] == "completed":
+                return status
+                
+            time.sleep(2)
+
+def test_docker_deployment(version="basic"):
+    tester = Crawl4AiTester()
+    print(f"Testing Crawl4AI Docker {version} version")
+    
+    # Health check with timeout and retry
+    max_retries = 5
+    for i in range(max_retries):
+        try:
+            health = requests.get(f"{tester.base_url}/health", timeout=10)
+            print("Health check:", health.json())
+            break
+        except requests.exceptions.RequestException as e:
+            if i == max_retries - 1:
+                print(f"Failed to connect after {max_retries} attempts")
+                sys.exit(1)
+            print(f"Waiting for service to start (attempt {i+1}/{max_retries})...")
+            time.sleep(5)
+    
+    # Test cases based on version
+    test_basic_crawl(tester)
+    
+    # if version in ["full", "transformer"]:
+    #     test_cosine_extraction(tester)
+
+    # test_js_execution(tester)
+    # test_css_selector(tester)
+    # test_structured_extraction(tester)
+    # test_llm_extraction(tester)
+    # test_llm_with_ollama(tester)
+    # test_screenshot(tester)
+    
+
+def test_basic_crawl(tester: Crawl4AiTester):
+    print("\n=== Testing Basic Crawl ===")
+    request = {
+        "urls": "https://www.nbcnews.com/business",
+        "priority": 10
+    }
+    
+    result = tester.submit_and_wait(request)
+    print(f"Basic crawl result length: {len(result['result']['markdown'])}")
+    assert result["result"]["success"]
+    assert len(result["result"]["markdown"]) > 0
+
+def test_js_execution(tester: Crawl4AiTester):
+    print("\n=== Testing JS Execution ===")
+    request = {
+        "urls": "https://www.nbcnews.com/business",
+        "priority": 8,
+        "js_code": [
+            "const loadMoreButton = Array.from(document.querySelectorAll('button')).find(button => button.textContent.includes('Load More')); loadMoreButton && loadMoreButton.click();"
+        ],
+        "wait_for": "article.tease-card:nth-child(10)",
+        "crawler_params": {
+            "headless": True
+        }
+    }
+    
+    result = tester.submit_and_wait(request)
+    print(f"JS execution result length: {len(result['result']['markdown'])}")
+    assert result["result"]["success"]
+
+def test_css_selector(tester: Crawl4AiTester):
+    print("\n=== Testing CSS Selector ===")
+    request = {
+        "urls": "https://www.nbcnews.com/business",
+        "priority": 7,
+        "css_selector": ".wide-tease-item__description",
+        "crawler_params": {
+            "headless": True
+        },
+        "extra": {"word_count_threshold": 10}
+        
+    }
+    
+    result = tester.submit_and_wait(request)
+    print(f"CSS selector result length: {len(result['result']['markdown'])}")
+    assert result["result"]["success"]
+
+def test_structured_extraction(tester: Crawl4AiTester):
+    print("\n=== Testing Structured Extraction ===")
+    schema = {
+        "name": "Coinbase Crypto Prices",
+        "baseSelector": ".cds-tableRow-t45thuk",
+        "fields": [
+            {
+                "name": "crypto",
+                "selector": "td:nth-child(1) h2",
+                "type": "text",
+            },
+            {
+                "name": "symbol",
+                "selector": "td:nth-child(1) p",
+                "type": "text",
+            },
+            {
+                "name": "price",
+                "selector": "td:nth-child(2)",
+                "type": "text",
+            }
+        ],
+    }
+    
+    request = {
+        "urls": "https://www.coinbase.com/explore",
+        "priority": 9,
+        "extraction_config": {
+            "type": "json_css",
+            "params": {
+                "schema": schema
+            }
+        }
+    }
+    
+    result = tester.submit_and_wait(request)
+    extracted = json.loads(result["result"]["extracted_content"])
+    print(f"Extracted {len(extracted)} items")
+    print("Sample item:", json.dumps(extracted[0], indent=2))
+    assert result["result"]["success"]
+    assert len(extracted) > 0
+
+def test_llm_extraction(tester: Crawl4AiTester):
+    print("\n=== Testing LLM Extraction ===")
+    schema = {
+        "type": "object",
+        "properties": {
+            "model_name": {
+                "type": "string",
+                "description": "Name of the OpenAI model."
+            },
+            "input_fee": {
+                "type": "string",
+                "description": "Fee for input token for the OpenAI model."
+            },
+            "output_fee": {
+                "type": "string",
+                "description": "Fee for output token for the OpenAI model."
+            }
+        },
+        "required": ["model_name", "input_fee", "output_fee"]
+    }
+    
+    request = {
+        "urls": "https://openai.com/api/pricing",
+        "priority": 8,
+        "extraction_config": {
+            "type": "llm",
+            "params": {
+                "provider": "openai/gpt-4o-mini",
+                "api_token": os.getenv("OPENAI_API_KEY"),
+                "schema": schema,
+                "extraction_type": "schema",
+                "instruction": """From the crawled content, extract all mentioned model names along with their fees for input and output tokens."""
+            }
+        },
+        "crawler_params": {"word_count_threshold": 1}
+    }
+    
+    try:
+        result = tester.submit_and_wait(request)
+        extracted = json.loads(result["result"]["extracted_content"])
+        print(f"Extracted {len(extracted)} model pricing entries")
+        print("Sample entry:", json.dumps(extracted[0], indent=2))
+        assert result["result"]["success"]
+    except Exception as e:
+        print(f"LLM extraction test failed (might be due to missing API key): {str(e)}")
+
+def test_llm_with_ollama(tester: Crawl4AiTester):
+    print("\n=== Testing LLM with Ollama ===")
+    schema = {
+        "type": "object",
+        "properties": {
+            "article_title": {
+                "type": "string",
+                "description": "The main title of the news article"
+            },
+            "summary": {
+                "type": "string",
+                "description": "A brief summary of the article content"
+            },
+            "main_topics": {
+                "type": "array",
+                "items": {"type": "string"},
+                "description": "Main topics or themes discussed in the article"
+            }
+        }
+    }
+    
+    request = {
+        "urls": "https://www.nbcnews.com/business",
+        "priority": 8,
+        "extraction_config": {
+            "type": "llm",
+            "params": {
+                "provider": "ollama/llama2",
+                "schema": schema,
+                "extraction_type": "schema",
+                "instruction": "Extract the main article information including title, summary, and main topics."
+            }
+        },
+        "extra": {"word_count_threshold": 1},
+        "crawler_params": {"verbose": True}
+    }
+    
+    try:
+        result = tester.submit_and_wait(request)
+        extracted = json.loads(result["result"]["extracted_content"])
+        print("Extracted content:", json.dumps(extracted, indent=2))
+        assert result["result"]["success"]
+    except Exception as e:
+        print(f"Ollama extraction test failed: {str(e)}")
+
+def test_cosine_extraction(tester: Crawl4AiTester):
+    print("\n=== Testing Cosine Extraction ===")
+    request = {
+        "urls": "https://www.nbcnews.com/business",
+        "priority": 8,
+        "extraction_config": {
+            "type": "cosine",
+            "params": {
+                "semantic_filter": "business finance economy",
+                "word_count_threshold": 10,
+                "max_dist": 0.2,
+                "top_k": 3
+            }
+        }
+    }
+    
+    try:
+        result = tester.submit_and_wait(request)
+        extracted = json.loads(result["result"]["extracted_content"])
+        print(f"Extracted {len(extracted)} text clusters")
+        print("First cluster tags:", extracted[0]["tags"])
+        assert result["result"]["success"]
+    except Exception as e:
+        print(f"Cosine extraction test failed: {str(e)}")
+
+def test_screenshot(tester: Crawl4AiTester):
+    print("\n=== Testing Screenshot ===")
+    request = {
+        "urls": "https://www.nbcnews.com/business",
+        "priority": 5,
+        "screenshot": True,
+        "crawler_params": {
+            "headless": True
+        }
+    }
+    
+    result = tester.submit_and_wait(request)
+    print("Screenshot captured:", bool(result["result"]["screenshot"]))
+    
+    if result["result"]["screenshot"]:
+        # Save screenshot
+        screenshot_data = base64.b64decode(result["result"]["screenshot"])
+        with open("test_screenshot.jpg", "wb") as f:
+            f.write(screenshot_data)
+        print("Screenshot saved as test_screenshot.jpg")
+    
+    assert result["result"]["success"]
+
+if __name__ == "__main__":
+    version = sys.argv[1] if len(sys.argv) > 1 else "basic"
+    # version = "full"
+    test_docker_deployment(version)
\ No newline at end of file

From a098483cbbb26be3d3b6f8d678f8409d6b007789 Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Sat, 9 Nov 2024 20:40:30 +0800
Subject: [PATCH 012/115] Update Roadmap

---
 README.md  |  24 +++
 ROADMAP.md | 503 +++++++++++++++++++++++++++++++++++++++++++++++++++++
 2 files changed, 527 insertions(+)
 create mode 100644 ROADMAP.md

diff --git a/README.md b/README.md
index 1f36aca6..e1a64aa1 100644
--- a/README.md
+++ b/README.md
@@ -432,6 +432,30 @@ You can find the full comparison code in our repository at `docs/examples/crawl4
 
 For detailed documentation, including installation instructions, advanced features, and API reference, visit our [Documentation Website](https://crawl4ai.com/mkdocs/).
 
+## Crawl4AI Roadmap 🗺️
+
+For detailed information on our development plans and upcoming features, check out our [Roadmap](https://github.com/unclecode/crawl4ai/blob/main/ROADMAP.md).
+
+### Advanced Crawling Systems 🔧
+- [x] 0. Graph Crawler: Smart website traversal using graph search algorithms for comprehensive nested page extraction
+- [ ] 1. Question-Based Crawler: Natural language driven web discovery and content extraction
+- [ ] 2. Knowledge-Optimal Crawler: Smart crawling that maximizes knowledge while minimizing data extraction
+- [ ] 3. Agentic Crawler: Autonomous system for complex multi-step crawling operations
+
+### Specialized Features 🛠️
+- [ ] 4. Automated Schema Generator: Convert natural language to extraction schemas
+- [ ] 5. Domain-Specific Scrapers: Pre-configured extractors for common platforms (academic, e-commerce)
+- [ ] 6. Web Embedding Index: Semantic search infrastructure for crawled content
+
+### Development Tools 🔨
+- [ ] 7. Interactive Playground: Web UI for testing, comparing strategies with AI assistance
+- [ ] 8. Performance Monitor: Real-time insights into crawler operations
+- [ ] 9. Cloud Integration: One-click deployment solutions across cloud providers
+
+### Community & Growth 🌱
+- [ ] 10. Sponsorship Program: Structured support system with tiered benefits
+- [ ] 11. Educational Content: "How to Crawl" video series and interactive tutorials
+
 ## Contributing 🤝
 
 We welcome contributions from the open-source community. Check out our [contribution guidelines](https://github.com/unclecode/crawl4ai/blob/main/CONTRIBUTING.md) for more information.
diff --git a/ROADMAP.md b/ROADMAP.md
new file mode 100644
index 00000000..0fd784c1
--- /dev/null
+++ b/ROADMAP.md
@@ -0,0 +1,503 @@
+# Crawl4AI Strategic Roadmap
+
+```mermaid
+%%{init: {'themeVariables': { 'fontSize': '14px'}}}%%
+graph TD
+    subgraph A1[Advanced Crawling Systems 🔧]
+        A["`
+        • Graph Crawler ✓
+        • Question-Based Crawler
+        • Knowledge-Optimal Crawler
+        • Agentic Crawler
+        `"]
+    end
+
+    subgraph A2[Specialized Features 🛠️]
+        B["`
+        • Automated Schema Generator
+        • Domain-Specific Scrapers
+        • Web Embedding Index
+        • 
+        `"]
+    end
+
+    subgraph A3[Development Tools 🔨]
+        C["`
+        • Interactive Playground
+        • Performance Monitor
+        • Cloud Integration
+        • 
+        `"]
+    end
+
+    subgraph A4[Community & Growth 🌱]
+        D["`
+        • Sponsorship Program
+        • Educational Content
+        • 
+        • 
+        `"]
+    end
+
+    classDef default fill:#f9f9f9,stroke:#333,stroke-width:2px
+    classDef section fill:#f0f0f0,stroke:#333,stroke-width:4px,rx:10
+    class A1,A2,A3,A4 section
+
+    %% Layout hints
+    A1 --> A2[" "]
+    A3 --> A4[" "]
+    linkStyle 0,1 stroke:none
+```
+
+Crawl4AI is evolving to provide more intelligent, efficient, and versatile web crawling capabilities. This roadmap outlines the key developments and features planned for the project, organized into strategic sections that build upon our current foundation.
+
+## 1. Advanced Crawling Systems 🔧
+
+This section introduces three powerful crawling systems that extend Crawl4AI's capabilities from basic web crawling to intelligent, purpose-driven data extraction.
+
+### 1.1 Question-Based Crawler
+The Question-Based Crawler enhances our core engine by enabling automatic discovery and extraction of relevant web content based on natural language questions.
+
+Key Features:
+- SerpAPI integration for intelligent web search
+- Relevancy scoring for search results
+- Automatic URL discovery and prioritization
+- Cross-source validation
+
+```python
+from crawl4ai import AsyncWebCrawler
+from crawl4ai.discovery import QuestionBasedDiscovery
+
+async with AsyncWebCrawler() as crawler:
+    discovery = QuestionBasedDiscovery(crawler)
+    results = await discovery.arun(
+        question="What are the system requirements for major cloud providers' GPU instances?",
+        max_urls=5,
+        relevance_threshold=0.7
+    )
+    
+    for result in results:
+        print(f"Source: {result.url} (Relevance: {result.relevance_score})")
+        print(f"Content: {result.markdown}\n")
+```
+
+### 1.2 Knowledge-Optimal Crawler
+An intelligent crawling system that solves the optimization problem of minimizing data extraction while maximizing knowledge acquisition for specific objectives.
+
+Key Features:
+- Smart content prioritization
+- Minimal data extraction for maximum knowledge
+- Probabilistic relevance assessment
+- Objective-driven crawling paths
+
+```python
+from crawl4ai import AsyncWebCrawler
+from crawl4ai.optimization import KnowledgeOptimizer
+
+async with AsyncWebCrawler() as crawler:
+    optimizer = KnowledgeOptimizer(
+        objective="Understand GPU instance pricing and limitations across cloud providers",
+        required_knowledge=[
+            "pricing structure",
+            "GPU specifications",
+            "usage limits",
+            "availability zones"
+        ],
+        confidence_threshold=0.85
+    )
+    
+    result = await crawler.arun(
+        urls=[
+            "https://aws.amazon.com/ec2/pricing/",
+            "https://cloud.google.com/gpu",
+            "https://azure.microsoft.com/pricing/"
+        ],
+        optimizer=optimizer,
+        optimization_mode="minimal_extraction"
+    )
+    
+    print(f"Knowledge Coverage: {result.knowledge_coverage}")
+    print(f"Data Efficiency: {result.efficiency_ratio}")
+    print(f"Extracted Content: {result.optimal_content}")
+```
+
+### 1.3 Agentic Crawler
+An autonomous system capable of understanding complex goals and automatically planning and executing multi-step crawling operations.
+
+Key Features:
+- Autonomous goal interpretation
+- Dynamic step planning
+- Interactive navigation capabilities
+- Visual recognition and interaction
+- Automatic error recovery
+
+```python
+from crawl4ai import AsyncWebCrawler
+from crawl4ai.agents import CrawlerAgent
+
+async with AsyncWebCrawler() as crawler:
+    agent = CrawlerAgent(crawler)
+    
+    # Automatic planning and execution
+    result = await agent.arun(
+        goal="Find research papers about quantum computing published in 2023 with more than 50 citations",
+        auto_retry=True
+    )
+    print("Generated Plan:", result.executed_steps)
+    print("Extracted Data:", result.data)
+    
+    # Using custom steps with automatic execution
+    result = await agent.arun(
+        goal="Extract conference deadlines from ML conferences",
+        custom_plan=[
+            "Navigate to conference page",
+            "Find important dates section",
+            "Extract submission deadlines",
+            "Verify dates are for 2024"
+        ]
+    )
+    
+    # Monitoring execution
+    print("Step Completion:", result.step_status)
+    print("Execution Time:", result.execution_time)
+    print("Success Rate:", result.success_rate)
+```
+
+# Section 2: Specialized Features 🛠️
+
+This section introduces specialized tools and features that enhance Crawl4AI's capabilities for specific use cases and data extraction needs.
+
+### 2.1 Automated Schema Generator
+A system that automatically generates JsonCssExtractionStrategy schemas from natural language descriptions, making structured data extraction accessible to all users.
+
+Key Features:
+- Natural language schema generation
+- Automatic pattern detection
+- Predefined schema templates
+- Chrome extension for visual schema building
+
+```python
+from crawl4ai import AsyncWebCrawler
+from crawl4ai.schema import SchemaGenerator
+
+# Generate schema from natural language description
+generator = SchemaGenerator()
+schema = await generator.generate(
+    url="https://news-website.com",
+    description="For each news article on the page, I need the headline, publication date, and main image"
+)
+
+# Use generated schema with crawler
+async with AsyncWebCrawler() as crawler:
+    result = await crawler.arun(
+        url="https://news-website.com",
+        extraction_strategy=schema
+    )
+
+# Example of generated schema:
+"""
+{
+    "name": "News Article Extractor",
+    "baseSelector": "article.news-item",
+    "fields": [
+        {
+            "name": "headline",
+            "selector": "h2.article-title",
+            "type": "text"
+        },
+        {
+            "name": "date",
+            "selector": "span.publish-date",
+            "type": "text"
+        },
+        {
+            "name": "image",
+            "selector": "img.article-image",
+            "type": "attribute",
+            "attribute": "src"
+        }
+    ]
+}
+"""
+```
+
+### 2.2 Domain Specific Scrapers
+Specialized extraction strategies optimized for common website types and platforms, providing consistent and reliable data extraction without additional configuration.
+
+Key Features:
+- Pre-configured extractors for popular platforms
+- Academic site specialization (arXiv, NCBI)
+- E-commerce standardization
+- Documentation site handling
+
+```python
+from crawl4ai import AsyncWebCrawler
+from crawl4ai.extractors import AcademicExtractor, EcommerceExtractor
+
+async with AsyncWebCrawler() as crawler:
+    # Academic paper extraction
+    papers = await crawler.arun(
+        url="https://arxiv.org/list/cs.AI/recent",
+        extractor="academic",  # Built-in extractor type
+        site_type="arxiv",     # Specific site optimization
+        extract_fields=[
+            "title", 
+            "authors", 
+            "abstract", 
+            "citations"
+        ]
+    )
+    
+    # E-commerce product data
+    products = await crawler.arun(
+        url="https://store.example.com/products",
+        extractor="ecommerce",
+        extract_fields=[
+            "name",
+            "price",
+            "availability",
+            "reviews"
+        ]
+    )
+```
+
+### 2.3 Web Embedding Index
+Creates and maintains a semantic search infrastructure for crawled content, enabling efficient retrieval and querying of web content through vector embeddings.
+
+Key Features:
+- Automatic embedding generation
+- Intelligent content chunking
+- Efficient vector storage and indexing
+- Semantic search capabilities
+
+```python
+from crawl4ai import AsyncWebCrawler
+from crawl4ai.indexing import WebIndex
+
+# Initialize and build index
+index = WebIndex(model="efficient-mini")
+
+async with AsyncWebCrawler() as crawler:
+    # Crawl and index content
+    await index.build(
+        urls=["https://docs.example.com"],
+        crawler=crawler,
+        options={
+            "chunk_method": "semantic",
+            "update_policy": "incremental",
+            "embedding_batch_size": 100
+        }
+    )
+
+    # Search through indexed content
+    results = await index.search(
+        query="How to implement OAuth authentication?",
+        filters={
+            "content_type": "technical",
+            "recency": "6months"
+        },
+        top_k=5
+    )
+
+    # Get similar content
+    similar = await index.find_similar(
+        url="https://docs.example.com/auth/oauth",
+        threshold=0.85
+    )
+```
+
+Each of these specialized features builds upon Crawl4AI's core functionality while providing targeted solutions for specific use cases. They can be used independently or combined for more complex data extraction and processing needs.
+
+# Section 3: Development Tools 🔧
+
+This section covers tools designed to enhance the development experience, monitoring, and deployment of Crawl4AI applications.
+
+### 3.1 Crawl4AI Playground 🎮
+
+The Crawl4AI Playground is an interactive web-based development environment that simplifies web scraping experimentation, development, and deployment. With its intuitive interface and AI-powered assistance, users can quickly prototype, test, and deploy web scraping solutions.
+
+#### Key Features 🌟
+
+##### Visual Strategy Builder
+- Interactive point-and-click interface for building extraction strategies
+- Real-time preview of selected elements
+- Side-by-side comparison of different extraction approaches
+- Visual validation of CSS selectors and XPath queries
+
+##### AI Assistant Integration
+- Strategy recommendations based on target website analysis
+- Parameter optimization suggestions
+- Best practices guidance for specific use cases
+- Automated error detection and resolution
+- Performance optimization tips
+
+##### Real-Time Testing & Validation
+- Live preview of extraction results
+- Side-by-side comparison of multiple strategies
+- Performance metrics visualization
+- Automatic validation of extracted data
+- Error detection and debugging tools
+
+##### Project Management
+- Save and organize multiple scraping projects
+- Version control for configurations
+- Export/import project settings
+- Share configurations with team members
+- Project templates for common use cases
+
+##### Deployment Pipeline
+- One-click deployment to various environments
+- Docker container generation
+- Cloud deployment templates (AWS, GCP, Azure)
+- Scaling configuration management
+- Monitoring setup automation
+
+
+### 3.2 Performance Monitoring System
+A comprehensive monitoring solution providing real-time insights into crawler operations, resource usage, and system health through both command-line (CLI) and graphical (GUI) interfaces.
+
+Key Features:
+- Real-time resource tracking
+- Active crawl monitoring
+- Performance statistics
+- Customizable alerting system
+
+```python
+from crawl4ai import AsyncWebCrawler
+from crawl4ai.monitor import CrawlMonitor
+
+# Initialize monitoring
+monitor = CrawlMonitor()
+
+# Start monitoring with CLI interface
+await monitor.start(
+    mode="cli",  # or "gui"
+    refresh_rate="1s",
+    metrics={
+        "resources": ["cpu", "memory", "network"],
+        "crawls": ["active", "queued", "completed"],
+        "performance": ["success_rate", "response_times"]
+    }
+)
+
+# Example CLI output:
+"""
+Crawl4AI Monitor (Live) - Press Q to exit
+────────────────────────────────────────
+System Usage:
+ ├─ CPU: ███████░░░ 70%
+ └─ Memory: ███░░░░░░░ 2.1GB/8GB
+
+Active Crawls:
+ID    URL                   Status    Progress
+001   docs.example.com     🟢 Active   75%
+002   api.service.com      🟡 Queue    -
+
+Metrics (Last 5min):
+ ├─ Success Rate: 98%
+ ├─ Avg Response: 0.6s
+ └─ Pages/sec: 8.5
+"""
+```
+
+### 3.3 Cloud Integration
+Streamlined deployment tools for setting up Crawl4AI in various cloud environments, with support for scaling and monitoring.
+
+Key Features:
+- One-click deployment solutions
+- Auto-scaling configuration
+- Load balancing setup
+- Cloud-specific optimizations
+- Monitoring integration
+
+```python
+from crawl4ai import AsyncWebCrawler
+from crawl4ai.deploy import CloudDeployer
+
+# Initialize deployer
+deployer = CloudDeployer()
+
+# Deploy crawler service
+deployment = await deployer.deploy(
+    service_name="crawler-cluster",
+    platform="aws",  # or "gcp", "azure"
+    config={
+        "instance_type": "compute-optimized",
+        "auto_scaling": {
+            "min_instances": 2,
+            "max_instances": 10,
+            "scale_based_on": "cpu_usage"
+        },
+        "region": "us-east-1",
+        "monitoring": True
+    }
+)
+
+# Get deployment status and endpoints
+print(f"Service Status: {deployment.status}")
+print(f"API Endpoint: {deployment.endpoint}")
+print(f"Monitor URL: {deployment.monitor_url}")
+```
+
+These development tools work together to provide a comprehensive environment for developing, testing, monitoring, and deploying Crawl4AI applications. The Playground helps users experiment and generate optimal configurations, the Performance Monitor ensures smooth operation, and the Cloud Integration tools simplify deployment and scaling.
+
+# Section 4: Community & Growth 🌱
+
+This section outlines initiatives designed to build and support the Crawl4AI community, provide educational resources, and ensure sustainable project growth.
+
+### 4.1 Sponsorship Program
+A structured program to support ongoing development and maintenance of Crawl4AI while providing valuable benefits to sponsors.
+
+Key Features:
+- Multiple sponsorship tiers
+- Sponsor recognition system
+- Priority support for sponsors
+- Early access to new features
+- Custom feature development opportunities
+
+Program Structure (not yet finalized):
+```
+Sponsorship Tiers:
+
+🥉 Bronze Supporter
+- GitHub Sponsor badge
+- Priority issue response
+- Community Discord role
+
+🥈 Silver Supporter
+- All Bronze benefits
+- Technical support channel
+- Vote on roadmap priorities
+- Early access to beta features
+
+🥇 Gold Supporter
+- All Silver benefits
+- Custom feature requests
+- Direct developer access
+- Private support sessions
+
+💎 Diamond Partner
+- All Gold benefits
+- Custom development
+- On-demand consulting
+- Integration support
+```
+
+### 4.2 "How to Crawl" Video Series
+A comprehensive educational resource teaching users how to effectively use Crawl4AI for various web scraping and data extraction scenarios.
+
+Key Features:
+- Step-by-step tutorials
+- Real-world use cases
+- Best practices
+- Integration guides
+- Advanced feature deep-dives
+
+These community initiatives are designed to:
+- Provide comprehensive learning resources
+- Foster a supportive user community
+- Ensure sustainable project development
+- Share knowledge and best practices
+- Create opportunities for collaboration
+
+The combination of structured support through sponsorship, educational content through the video series, and interactive learning through the playground creates a robust ecosystem for both new and experienced users of Crawl4AI.

From b6d6631b125bde49b402ba30ae22fc3fb4661228 Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Tue, 12 Nov 2024 12:10:58 +0800
Subject: [PATCH 013/115] Enhance Async Crawler with Playwright support -
 Implemented new async crawler strategy using Playwright. - Introduced
 ManagedBrowser for better browser management. - Added support for persistent
 browser sessions and improved error handling. - Updated version from 0.3.73
 to 0.3.731. - Enhanced logic in main.py for conditional mounting of static
 files. - Updated requirements to replace playwright_stealth with
 tf-playwright-stealth.

---
 crawl4ai/_version.py                      |   2 +-
 crawl4ai/async_crawler_strategy.py        | 106 ++-
 crawl4ai/async_crawler_strategy_0.3.73.py | 965 ++++++++++++++++++++++
 main.py                                   |  12 +-
 requirements.txt                          |   2 +-
 5 files changed, 1057 insertions(+), 30 deletions(-)
 create mode 100644 crawl4ai/async_crawler_strategy_0.3.73.py

diff --git a/crawl4ai/_version.py b/crawl4ai/_version.py
index 85030f0e..7ab71c9b 100644
--- a/crawl4ai/_version.py
+++ b/crawl4ai/_version.py
@@ -1,2 +1,2 @@
 # crawl4ai/_version.py
-__version__ = "0.3.73"
\ No newline at end of file
+__version__ = "0.3.731"
\ No newline at end of file
diff --git a/crawl4ai/async_crawler_strategy.py b/crawl4ai/async_crawler_strategy.py
index fa50e7b5..896a0644 100644
--- a/crawl4ai/async_crawler_strategy.py
+++ b/crawl4ai/async_crawler_strategy.py
@@ -186,6 +186,8 @@ class AsyncPlaywrightCrawlerStrategy(AsyncCrawlerStrategy):
         self.sleep_on_close = kwargs.get("sleep_on_close", False)
         self.use_managed_browser = kwargs.get("use_managed_browser", False)
         self.user_data_dir = kwargs.get("user_data_dir", None)
+        self.use_persistent_context = kwargs.get("use_persistent_context", False)
+        self.chrome_channel = kwargs.get("chrome_channel", "chrome")
         self.managed_browser = None
         self.default_context = None
         self.hooks = {
@@ -197,6 +199,7 @@ class AsyncPlaywrightCrawlerStrategy(AsyncCrawlerStrategy):
             'before_return_html': None,
             'before_retrieve_html': None
         }
+        self.extra_args = kwargs.get("extra_args", [])
 
     async def __aenter__(self):
         await self.start()
@@ -238,36 +241,71 @@ class AsyncPlaywrightCrawlerStrategy(AsyncCrawlerStrategy):
                             "User-Agent": self.user_agent
                         })
             else:
+                # Base browser arguments
                 browser_args = {
                     "headless": self.headless,
                     "args": [
-                        "--disable-gpu",
                         "--no-sandbox",
                         "--disable-dev-shm-usage",
-                        "--disable-blink-features=AutomationControlled",
+                        "--no-first-run",
+                        "--no-default-browser-check",
                         "--disable-infobars",
                         "--window-position=0,0",
                         "--ignore-certificate-errors",
                         "--ignore-certificate-errors-spki-list",
-                        # "--headless=new",  # Use the new headless mode
                     ]
                 }
+
+                # Add channel if specified (try Chrome first)
+                if self.chrome_channel:
+                    browser_args["channel"] = self.chrome_channel
+                
+                # Add extra args if provided
+                if self.extra_args:
+                    browser_args["args"].extend(self.extra_args)
                 
                 # Add proxy settings if a proxy is specified
                 if self.proxy:
                     proxy_settings = ProxySettings(server=self.proxy)
                     browser_args["proxy"] = proxy_settings
                 elif self.proxy_config:
-                    proxy_settings = ProxySettings(server=self.proxy_config.get("server"), username=self.proxy_config.get("username"), password=self.proxy_config.get("password"))
+                    proxy_settings = ProxySettings(
+                        server=self.proxy_config.get("server"),
+                        username=self.proxy_config.get("username"),
+                        password=self.proxy_config.get("password")
+                    )
                     browser_args["proxy"] = proxy_settings
                     
-                # Select the appropriate browser based on the browser_type
-                if self.browser_type == "firefox":
-                    self.browser = await self.playwright.firefox.launch(**browser_args)
-                elif self.browser_type == "webkit":
-                    self.browser = await self.playwright.webkit.launch(**browser_args)
-                else:
-                    self.browser = await self.playwright.chromium.launch(**browser_args)
+                try:
+                    # Select the appropriate browser based on the browser_type
+                    if self.browser_type == "firefox":
+                        self.browser = await self.playwright.firefox.launch(**browser_args)
+                    elif self.browser_type == "webkit":
+                        self.browser = await self.playwright.webkit.launch(**browser_args)
+                    else:
+                        if self.use_persistent_context and self.user_data_dir:
+                            self.browser = await self.playwright.chromium.launch_persistent_context(
+                                user_data_dir=self.user_data_dir,
+                                **browser_args
+                            )
+                            self.default_context = self.browser
+                        else:
+                            self.browser = await self.playwright.chromium.launch(**browser_args)
+
+                except Exception as e:
+                    # Fallback to chromium if Chrome channel fails
+                    if "chrome" in str(e) and browser_args.get("channel") == "chrome":
+                        browser_args["channel"] = "chromium"
+                        if self.use_persistent_context and self.user_data_dir:
+                            self.browser = await self.playwright.chromium.launch_persistent_context(
+                                user_data_dir=self.user_data_dir,
+                                **browser_args
+                            )
+                            self.default_context = self.browser
+                        else:
+                            self.browser = await self.playwright.chromium.launch(**browser_args)
+                    else:
+                        raise
 
             await self.execute_hook('on_browser_created', self.browser)
 
@@ -461,24 +499,35 @@ class AsyncPlaywrightCrawlerStrategy(AsyncCrawlerStrategy):
             if session_id:
                 context, page, _ = self.sessions.get(session_id, (None, None, None))
                 if not context:
+                    if self.use_persistent_context and self.browser_type in ["chrome", "chromium"]:
+                        # In persistent context, browser is the context
+                        context = self.browser
+                        page = await context.new_page()
+                    else:
+                        # Normal context creation for non-persistent or non-Chrome browsers
+                        context = await self.browser.new_context(
+                            user_agent=self.user_agent,
+                            viewport={"width": 1920, "height": 1080},
+                            proxy={"server": self.proxy} if self.proxy else None,
+                            accept_downloads=True,
+                            java_script_enabled=True
+                        )
+                        await context.add_cookies([{"name": "cookiesEnabled", "value": "true", "url": url}])
+                        await context.set_extra_http_headers(self.headers)
+                        page = await context.new_page()
+                    self.sessions[session_id] = (context, page, time.time())
+            else:
+                if self.use_persistent_context and self.browser_type in ["chrome", "chromium"]:
+                    # In persistent context, browser is the context
+                    context = self.browser
+                else:
+                    # Normal context creation
                     context = await self.browser.new_context(
                         user_agent=self.user_agent,
                         viewport={"width": 1920, "height": 1080},
-                        proxy={"server": self.proxy} if self.proxy else None,
-                        accept_downloads=True,
-                        java_script_enabled=True
+                        proxy={"server": self.proxy} if self.proxy else None
                     )
-                    await context.add_cookies([{"name": "cookiesEnabled", "value": "true", "url": url}])
                     await context.set_extra_http_headers(self.headers)
-                    page = await context.new_page()
-                    self.sessions[session_id] = (context, page, time.time())
-            else:
-                context = await self.browser.new_context(
-                    user_agent=self.user_agent,
-                    viewport={"width": 1920, "height": 1080},
-                    proxy={"server": self.proxy} if self.proxy else None
-                )
-                await context.set_extra_http_headers(self.headers)
                 
                 if kwargs.get("override_navigator", False) or kwargs.get("simulate_user", False) or kwargs.get("magic", False):
                     # Inject scripts to override navigator properties
@@ -512,7 +561,8 @@ class AsyncPlaywrightCrawlerStrategy(AsyncCrawlerStrategy):
                     """)
                 
                 page = await context.new_page()
-                # await stealth_async(page) #, stealth_config)
+                if kwargs.get("magic", False):
+                    await stealth_async(page, stealth_config)
 
         # Add console message and error logging
         if kwargs.get("log_console", False):
@@ -544,8 +594,12 @@ class AsyncPlaywrightCrawlerStrategy(AsyncCrawlerStrategy):
             if not kwargs.get("js_only", False):
                 await self.execute_hook('before_goto', page)
                 
+
                 response = await page.goto(
-                    url, wait_until="domcontentloaded", timeout=kwargs.get("page_timeout", 60000)
+                    url,
+                    # wait_until=kwargs.get("wait_until", ["domcontentloaded", "networkidle"]),
+                    wait_until=kwargs.get("wait_until", "domcontentloaded"),
+                    timeout=kwargs.get("page_timeout", 60000)
                 )
                 
                 # response = await page.goto("about:blank")
diff --git a/crawl4ai/async_crawler_strategy_0.3.73.py b/crawl4ai/async_crawler_strategy_0.3.73.py
new file mode 100644
index 00000000..54835dad
--- /dev/null
+++ b/crawl4ai/async_crawler_strategy_0.3.73.py
@@ -0,0 +1,965 @@
+import asyncio
+import base64
+import time
+from abc import ABC, abstractmethod
+from typing import Callable, Dict, Any, List, Optional, Awaitable
+import os, sys, shutil
+import tempfile, subprocess
+from playwright.async_api import async_playwright, Page, Browser, Error
+from io import BytesIO
+from PIL import Image, ImageDraw, ImageFont
+from pathlib import Path
+from playwright.async_api import ProxySettings
+from pydantic import BaseModel
+import hashlib
+import json
+import uuid
+
+from playwright_stealth import StealthConfig, stealth_async
+
+stealth_config = StealthConfig(
+    webdriver=True,
+    chrome_app=True,
+    chrome_csi=True,
+    chrome_load_times=True,
+    chrome_runtime=True,
+    navigator_languages=True,
+    navigator_plugins=True,
+    navigator_permissions=True,
+    webgl_vendor=True,
+    outerdimensions=True,
+    navigator_hardware_concurrency=True,
+    media_codecs=True,
+)
+
+
+class ManagedBrowser:
+    def __init__(self, browser_type: str = "chromium", user_data_dir: Optional[str] = None, headless: bool = False):
+        self.browser_type = browser_type
+        self.user_data_dir = user_data_dir
+        self.headless = headless
+        self.browser_process = None
+        self.temp_dir = None
+        self.debugging_port = 9222
+
+    async def start(self) -> str:
+        """
+        Starts the browser process and returns the CDP endpoint URL.
+        If user_data_dir is not provided, creates a temporary directory.
+        """
+        
+        # Create temp dir if needed
+        if not self.user_data_dir:
+            self.temp_dir = tempfile.mkdtemp(prefix="browser-profile-")
+            self.user_data_dir = self.temp_dir
+
+        # Get browser path and args based on OS and browser type
+        browser_path = self._get_browser_path()
+        args = self._get_browser_args()
+
+        # Start browser process
+        try:
+            self.browser_process = subprocess.Popen(
+                args,
+                stdout=subprocess.PIPE,
+                stderr=subprocess.PIPE
+            )
+            await asyncio.sleep(2)  # Give browser time to start
+            return f"http://localhost:{self.debugging_port}"
+        except Exception as e:
+            await self.cleanup()
+            raise Exception(f"Failed to start browser: {e}")
+
+    def _get_browser_path(self) -> str:
+        """Returns the browser executable path based on OS and browser type"""
+        if sys.platform == "darwin":  # macOS
+            paths = {
+                "chromium": "/Applications/Google Chrome.app/Contents/MacOS/Google Chrome",
+                "firefox": "/Applications/Firefox.app/Contents/MacOS/firefox",
+                "webkit": "/Applications/Safari.app/Contents/MacOS/Safari"
+            }
+        elif sys.platform == "win32":  # Windows
+            paths = {
+                "chromium": "C:\\Program Files\\Google\\Chrome\\Application\\chrome.exe",
+                "firefox": "C:\\Program Files\\Mozilla Firefox\\firefox.exe",
+                "webkit": None  # WebKit not supported on Windows
+            }
+        else:  # Linux
+            paths = {
+                "chromium": "google-chrome",
+                "firefox": "firefox",
+                "webkit": None  # WebKit not supported on Linux
+            }
+        
+        return paths.get(self.browser_type)
+
+    def _get_browser_args(self) -> List[str]:
+        """Returns browser-specific command line arguments"""
+        base_args = [self._get_browser_path()]
+        
+        if self.browser_type == "chromium":
+            args = [
+                f"--remote-debugging-port={self.debugging_port}",
+                f"--user-data-dir={self.user_data_dir}",
+            ]
+            if self.headless:
+                args.append("--headless=new")
+        elif self.browser_type == "firefox":
+            args = [
+                "--remote-debugging-port", str(self.debugging_port),
+                "--profile", self.user_data_dir,
+            ]
+            if self.headless:
+                args.append("--headless")
+        else:
+            raise NotImplementedError(f"Browser type {self.browser_type} not supported")
+            
+        return base_args + args
+
+    async def cleanup(self):
+        """Cleanup browser process and temporary directory"""
+        if self.browser_process:
+            try:
+                self.browser_process.terminate()
+                await asyncio.sleep(1)
+                if self.browser_process.poll() is None:
+                    self.browser_process.kill()
+            except Exception as e:
+                print(f"Error terminating browser: {e}")
+
+        if self.temp_dir and os.path.exists(self.temp_dir):
+            try:
+                shutil.rmtree(self.temp_dir)
+            except Exception as e:
+                print(f"Error removing temporary directory: {e}")
+
+class AsyncCrawlResponse(BaseModel):
+    html: str
+    response_headers: Dict[str, str]
+    status_code: int
+    screenshot: Optional[str] = None
+    get_delayed_content: Optional[Callable[[Optional[float]], Awaitable[str]]] = None
+
+    class Config:
+        arbitrary_types_allowed = True
+
+class AsyncCrawlerStrategy(ABC):
+    @abstractmethod
+    async def crawl(self, url: str, **kwargs) -> AsyncCrawlResponse:
+        pass
+    
+    @abstractmethod
+    async def crawl_many(self, urls: List[str], **kwargs) -> List[AsyncCrawlResponse]:
+        pass
+    
+    @abstractmethod
+    async def take_screenshot(self, **kwargs) -> str:
+        pass
+    
+    @abstractmethod
+    def update_user_agent(self, user_agent: str):
+        pass
+    
+    @abstractmethod
+    def set_hook(self, hook_type: str, hook: Callable):
+        pass
+
+class AsyncPlaywrightCrawlerStrategy(AsyncCrawlerStrategy):
+    def __init__(self, use_cached_html=False, js_code=None, **kwargs):
+        self.use_cached_html = use_cached_html
+        self.user_agent = kwargs.get(
+            "user_agent",
+            "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 "
+            "(KHTML, like Gecko) Chrome/91.0.4472.124 Safari/537.36"
+        )
+        self.proxy = kwargs.get("proxy")
+        self.proxy_config = kwargs.get("proxy_config")
+        self.headless = kwargs.get("headless", True)
+        self.browser_type = kwargs.get("browser_type", "chromium")
+        self.headers = kwargs.get("headers", {})
+        self.sessions = {}
+        self.session_ttl = 1800 
+        self.js_code = js_code
+        self.verbose = kwargs.get("verbose", False)
+        self.playwright = None
+        self.browser = None
+        self.sleep_on_close = kwargs.get("sleep_on_close", False)
+        self.use_managed_browser = kwargs.get("use_managed_browser", False)
+        self.user_data_dir = kwargs.get("user_data_dir", None)
+        self.use_persistent_context = kwargs.get("use_persistent_context", False)
+        self.chrome_channel = kwargs.get("chrome_channel", "chrome")
+        self.managed_browser = None
+        self.default_context = None
+        self.hooks = {
+            'on_browser_created': None,
+            'on_user_agent_updated': None,
+            'on_execution_started': None,
+            'before_goto': None,
+            'after_goto': None,
+            'before_return_html': None,
+            'before_retrieve_html': None
+        }
+        self.extra_args = kwargs.get("extra_args", [])
+
+    async def __aenter__(self):
+        await self.start()
+        return self
+
+    async def __aexit__(self, exc_type, exc_val, exc_tb):
+        await self.close()
+
+    async def start(self):
+        if self.playwright is None:
+            self.playwright = await async_playwright().start()
+        if self.browser is None:
+            if self.use_managed_browser:
+                # Use managed browser approach
+                self.managed_browser = ManagedBrowser(
+                    browser_type=self.browser_type,
+                    user_data_dir=self.user_data_dir,
+                    headless=self.headless
+                )
+                cdp_url = await self.managed_browser.start()
+                self.browser = await self.playwright.chromium.connect_over_cdp(cdp_url)
+                
+                # Get the default context that maintains the user profile
+                contexts = self.browser.contexts
+                if contexts:
+                    self.default_context = contexts[0]
+                else:
+                    # If no default context exists, create one
+                    self.default_context = await self.browser.new_context(
+                        viewport={"width": 1920, "height": 1080}
+                    )
+                
+                # Set up the default context
+                if self.default_context:
+                    await self.default_context.set_extra_http_headers(self.headers)
+                    
+                    if self.user_agent:
+                        await self.default_context.set_extra_http_headers({
+                            "User-Agent": self.user_agent
+                        })
+            else:
+                browser_args = {
+                    "headless": self.headless,
+                    "args": [
+                        "--disable-gpu",
+                        "--no-sandbox",
+                        "--disable-dev-shm-usage",
+                        "--disable-blink-features=AutomationControlled",
+                        "--disable-infobars",
+                        "--window-position=0,0",
+                        "--ignore-certificate-errors",
+                        "--ignore-certificate-errors-spki-list",
+                        # "--disable-http2",
+                        # "--headless=new",  # Use the new headless mode
+                    ]
+                }
+                
+                # Add extra args if provided
+                if self.extra_args:
+                    browser_args["args"].extend(self.extra_args)
+                
+                # Add proxy settings if a proxy is specified
+                if self.proxy:
+                    proxy_settings = ProxySettings(server=self.proxy)
+                    browser_args["proxy"] = proxy_settings
+                elif self.proxy_config:
+                    proxy_settings = ProxySettings(server=self.proxy_config.get("server"), username=self.proxy_config.get("username"), password=self.proxy_config.get("password"))
+                    browser_args["proxy"] = proxy_settings
+                    
+                # Select the appropriate browser based on the browser_type
+                if self.browser_type == "firefox":
+                    self.browser = await self.playwright.firefox.launch(**browser_args)
+                elif self.browser_type == "webkit":
+                    self.browser = await self.playwright.webkit.launch(**browser_args)
+                else:
+                    self.browser = await self.playwright.chromium.launch(**browser_args)
+                    
+                # Update the headless configuration
+                if self.headless:
+                    # Use the new headless mode explicitly
+                    browser_args["args"].append("--headless=new")
+
+            await self.execute_hook('on_browser_created', self.browser)
+
+    async def close(self):
+        if self.sleep_on_close:
+            await asyncio.sleep(0.5)
+            
+        # Close all active sessions
+        session_ids = list(self.sessions.keys())
+        for session_id in session_ids:
+            await self.kill_session(session_id)
+            
+        if self.browser:
+            await self.browser.close()
+            self.browser = None
+            
+        if self.managed_browser:
+            await self.managed_browser.cleanup()
+            self.managed_browser = None
+            
+        if self.playwright:
+            await self.playwright.stop()
+            self.playwright = None
+
+    def __del__(self):
+        if self.browser or self.playwright:
+            asyncio.get_event_loop().run_until_complete(self.close())
+
+    def set_hook(self, hook_type: str, hook: Callable):
+        if hook_type in self.hooks:
+            self.hooks[hook_type] = hook
+        else:
+            raise ValueError(f"Invalid hook type: {hook_type}")
+
+    async def execute_hook(self, hook_type: str, *args):
+        hook = self.hooks.get(hook_type)
+        if hook:
+            if asyncio.iscoroutinefunction(hook):
+                return await hook(*args)
+            else:
+                return hook(*args)
+        return args[0] if args else None
+
+    def update_user_agent(self, user_agent: str):
+        self.user_agent = user_agent
+
+    def set_custom_headers(self, headers: Dict[str, str]):
+        self.headers = headers
+
+    async def kill_session(self, session_id: str):
+        if session_id in self.sessions:
+            context, page, _ = self.sessions[session_id]
+            await page.close()
+            if not self.use_managed_browser:
+                await context.close()
+            del self.sessions[session_id]
+
+    def _cleanup_expired_sessions(self):
+        current_time = time.time()
+        expired_sessions = [
+            sid for sid, (_, _, last_used) in self.sessions.items() 
+            if current_time - last_used > self.session_ttl
+        ]
+        for sid in expired_sessions:
+            asyncio.create_task(self.kill_session(sid))
+            
+    async def smart_wait(self, page: Page, wait_for: str, timeout: float = 30000):
+        wait_for = wait_for.strip()
+        
+        if wait_for.startswith('js:'):
+            # Explicitly specified JavaScript
+            js_code = wait_for[3:].strip()
+            return await self.csp_compliant_wait(page, js_code, timeout)
+        elif wait_for.startswith('css:'):
+            # Explicitly specified CSS selector
+            css_selector = wait_for[4:].strip()
+            try:
+                await page.wait_for_selector(css_selector, timeout=timeout)
+            except Error as e:
+                if 'Timeout' in str(e):
+                    raise TimeoutError(f"Timeout after {timeout}ms waiting for selector '{css_selector}'")
+                else:
+                    raise ValueError(f"Invalid CSS selector: '{css_selector}'")
+        else:
+            # Auto-detect based on content
+            if wait_for.startswith('()') or wait_for.startswith('function'):
+                # It's likely a JavaScript function
+                return await self.csp_compliant_wait(page, wait_for, timeout)
+            else:
+                # Assume it's a CSS selector first
+                try:
+                    await page.wait_for_selector(wait_for, timeout=timeout)
+                except Error as e:
+                    if 'Timeout' in str(e):
+                        raise TimeoutError(f"Timeout after {timeout}ms waiting for selector '{wait_for}'")
+                    else:
+                        # If it's not a timeout error, it might be an invalid selector
+                        # Let's try to evaluate it as a JavaScript function as a fallback
+                        try:
+                            return await self.csp_compliant_wait(page, f"() => {{{wait_for}}}", timeout)
+                        except Error:
+                            raise ValueError(f"Invalid wait_for parameter: '{wait_for}'. "
+                                             "It should be either a valid CSS selector, a JavaScript function, "
+                                             "or explicitly prefixed with 'js:' or 'css:'.")
+    
+    async def csp_compliant_wait(self, page: Page, user_wait_function: str, timeout: float = 30000):
+        wrapper_js = f"""
+        async () => {{
+            const userFunction = {user_wait_function};
+            const startTime = Date.now();
+            while (true) {{
+                if (await userFunction()) {{
+                    return true;
+                }}
+                if (Date.now() - startTime > {timeout}) {{
+                    throw new Error('Timeout waiting for condition');
+                }}
+                await new Promise(resolve => setTimeout(resolve, 100));
+            }}
+        }}
+        """
+        
+        try:
+            await page.evaluate(wrapper_js)
+        except TimeoutError:
+            raise TimeoutError(f"Timeout after {timeout}ms waiting for condition")
+        except Exception as e:
+            raise RuntimeError(f"Error in wait condition: {str(e)}")
+
+    async def process_iframes(self, page):
+        # Find all iframes
+        iframes = await page.query_selector_all('iframe')
+        
+        for i, iframe in enumerate(iframes):
+            try:
+                # Add a unique identifier to the iframe
+                await iframe.evaluate(f'(element) => element.id = "iframe-{i}"')
+                
+                # Get the frame associated with this iframe
+                frame = await iframe.content_frame()
+                
+                if frame:
+                    # Wait for the frame to load
+                    await frame.wait_for_load_state('load', timeout=30000)  # 30 seconds timeout
+                    
+                    # Extract the content of the iframe's body
+                    iframe_content = await frame.evaluate('() => document.body.innerHTML')
+                    
+                    # Generate a unique class name for this iframe
+                    class_name = f'extracted-iframe-content-{i}'
+                    
+                    # Replace the iframe with a div containing the extracted content
+                    _iframe = iframe_content.replace('`', '\\`')
+                    await page.evaluate(f"""
+                        () => {{
+                            const iframe = document.getElementById('iframe-{i}');
+                            const div = document.createElement('div');
+                            div.innerHTML = `{_iframe}`;
+                            div.className = '{class_name}';
+                            iframe.replaceWith(div);
+                        }}
+                    """)
+                else:
+                    print(f"Warning: Could not access content frame for iframe {i}")
+            except Exception as e:
+                print(f"Error processing iframe {i}: {str(e)}")
+
+        # Return the page object
+        return page  
+    
+    async def crawl(self, url: str, **kwargs) -> AsyncCrawlResponse:
+        response_headers = {}
+        status_code = None
+        
+        self._cleanup_expired_sessions()
+        session_id = kwargs.get("session_id")
+        
+        # Handle page creation differently for managed browser
+        if self.use_managed_browser:
+            if session_id:
+                # Reuse existing session if available
+                context, page, _ = self.sessions.get(session_id, (None, None, None))
+                if not page:
+                    # Create new page in default context if session doesn't exist
+                    page = await self.default_context.new_page()
+                    self.sessions[session_id] = (self.default_context, page, time.time())
+            else:
+                # Create new page in default context for non-session requests
+                page = await self.default_context.new_page()
+        else:
+            if session_id:
+                context, page, _ = self.sessions.get(session_id, (None, None, None))
+                if not context:
+                    context = await self.browser.new_context(
+                        user_agent=self.user_agent,
+                        viewport={"width": 1920, "height": 1080},
+                        proxy={"server": self.proxy} if self.proxy else None,
+                        accept_downloads=True,
+                        java_script_enabled=True
+                    )
+                    await context.add_cookies([{"name": "cookiesEnabled", "value": "true", "url": url}])
+                    await context.set_extra_http_headers(self.headers)
+                    page = await context.new_page()
+                    self.sessions[session_id] = (context, page, time.time())
+            else:
+                context = await self.browser.new_context(
+                    user_agent=self.user_agent,
+                    viewport={"width": 1920, "height": 1080},
+                    proxy={"server": self.proxy} if self.proxy else None
+                )
+                await context.set_extra_http_headers(self.headers)
+                
+                if kwargs.get("override_navigator", False) or kwargs.get("simulate_user", False) or kwargs.get("magic", False):
+                    # Inject scripts to override navigator properties
+                    await context.add_init_script("""
+                        // Pass the Permissions Test.
+                        const originalQuery = window.navigator.permissions.query;
+                        window.navigator.permissions.query = (parameters) => (
+                            parameters.name === 'notifications' ?
+                                Promise.resolve({ state: Notification.permission }) :
+                                originalQuery(parameters)
+                        );
+                        Object.defineProperty(navigator, 'webdriver', {
+                            get: () => undefined
+                        });
+                        window.navigator.chrome = {
+                            runtime: {},
+                            // Add other properties if necessary
+                        };
+                        Object.defineProperty(navigator, 'plugins', {
+                            get: () => [1, 2, 3, 4, 5],
+                        });
+                        Object.defineProperty(navigator, 'languages', {
+                            get: () => ['en-US', 'en'],
+                        });
+                        Object.defineProperty(document, 'hidden', {
+                            get: () => false
+                        });
+                        Object.defineProperty(document, 'visibilityState', {
+                            get: () => 'visible'
+                        });
+                    """)
+                
+                page = await context.new_page()
+                if kwargs.get("magic", False):
+                    await stealth_async(page, stealth_config)
+
+        # Add console message and error logging
+        if kwargs.get("log_console", False):
+            page.on("console", lambda msg: print(f"Console: {msg.text}"))
+            page.on("pageerror", lambda exc: print(f"Page Error: {exc}"))
+        
+        try:
+            if self.verbose:
+                print(f"[LOG] 🕸️ Crawling {url} using AsyncPlaywrightCrawlerStrategy...")
+
+            if self.use_cached_html:
+                cache_file_path = os.path.join(
+                    Path.home(), ".crawl4ai", "cache", hashlib.md5(url.encode()).hexdigest()
+                )
+                if os.path.exists(cache_file_path):
+                    html = ""
+                    with open(cache_file_path, "r") as f:
+                        html = f.read()
+                    # retrieve response headers and status code from cache
+                    with open(cache_file_path + ".meta", "r") as f:
+                        meta = json.load(f)
+                        response_headers = meta.get("response_headers", {})
+                        status_code = meta.get("status_code")
+                    response = AsyncCrawlResponse(
+                        html=html, response_headers=response_headers, status_code=status_code
+                    )
+                    return response
+
+            if not kwargs.get("js_only", False):
+                await self.execute_hook('before_goto', page)
+                
+                # response = await page.goto(
+                #     url, wait_until="domcontentloaded", timeout=kwargs.get("page_timeout", 60000)
+                # )
+                
+                # Add retry logic for HTTP2 errors
+                max_retries = kwargs.get("max_retries", 3)
+                current_try = 0
+                
+                while current_try < max_retries:
+                    try:
+                        response = await page.goto(
+                            url,
+                            # wait_until=kwargs.get("wait_until", ["domcontentloaded", "networkidle"]),
+                            wait_until=kwargs.get("wait_until", "networkidle"),
+                            timeout=kwargs.get("page_timeout", 60000)
+                        )
+                        break
+                    except Exception as e:
+                        current_try += 1
+                        if "ERR_HTTP2_PROTOCOL_ERROR" in str(e):
+                            if current_try < max_retries:
+                                # Add exponential backoff
+                                await asyncio.sleep(2 ** current_try)
+                                # Try with different protocol
+                                if 'args' not in kwargs:
+                                    kwargs['args'] = []
+                                kwargs['args'].extend(['--disable-http2'])
+                                continue
+                        if current_try == max_retries:
+                            raise
+                
+                # response = await page.goto("about:blank")
+                # await page.evaluate(f"window.location.href = '{url}'")
+                
+                await self.execute_hook('after_goto', page)
+                
+                # Get status code and headers
+                status_code = response.status
+                response_headers = response.headers
+            else:
+                status_code = 200
+                response_headers = {}
+
+            # Replace the current wait_for_selector line with this more robust check:
+            try:
+                # First wait for body to exist, regardless of visibility
+                await page.wait_for_selector('body', state='attached', timeout=30000)
+                
+                # Then wait for it to become visible by checking CSS
+                await page.wait_for_function("""
+                    () => {
+                        const body = document.body;
+                        const style = window.getComputedStyle(body);
+                        return style.display !== 'none' && 
+                            style.visibility !== 'hidden' && 
+                            style.opacity !== '0';
+                    }
+                """, timeout=30000)
+                
+            except Error as e:
+                # If waiting fails, let's try to diagnose the issue
+                visibility_info = await page.evaluate("""
+                    () => {
+                        const body = document.body;
+                        const style = window.getComputedStyle(body);
+                        return {
+                            display: style.display,
+                            visibility: style.visibility,
+                            opacity: style.opacity,
+                            hasContent: body.innerHTML.length,
+                            classList: Array.from(body.classList)
+                        }
+                    }
+                """)
+                
+                if self.verbose:
+                    print(f"Body visibility debug info: {visibility_info}")
+                
+                # Even if body is hidden, we might still want to proceed
+                if kwargs.get('ignore_body_visibility', True):
+                    if self.verbose:
+                        print("Proceeding despite hidden body...")
+                    pass
+                else:
+                    raise Error(f"Body element is hidden: {visibility_info}")
+            
+            await page.evaluate("window.scrollTo(0, document.body.scrollHeight)")
+
+            js_code = kwargs.get("js_code", kwargs.get("js", self.js_code))
+            if js_code:
+                if isinstance(js_code, str):
+                    await page.evaluate(js_code)
+                elif isinstance(js_code, list):
+                    for js in js_code:
+                        await page.evaluate(js)
+                
+                await page.wait_for_load_state('networkidle')
+                # Check for on execution event
+                await self.execute_hook('on_execution_started', page)
+                
+            if kwargs.get("simulate_user", False) or kwargs.get("magic", False):
+                # Simulate user interactions
+                await page.mouse.move(100, 100)
+                await page.mouse.down()
+                await page.mouse.up()
+                await page.keyboard.press('ArrowDown')
+
+            # Handle the wait_for parameter
+            wait_for = kwargs.get("wait_for")
+            if wait_for:
+                try:
+                    await self.smart_wait(page, wait_for, timeout=kwargs.get("page_timeout", 60000))
+                except Exception as e:
+                    raise RuntimeError(f"Wait condition failed: {str(e)}")
+
+            # Update image dimensions
+            update_image_dimensions_js = """
+            () => {
+                return new Promise((resolve) => {
+                    const filterImage = (img) => {
+                        // Filter out images that are too small
+                        if (img.width < 100 && img.height < 100) return false;
+                        
+                        // Filter out images that are not visible
+                        const rect = img.getBoundingClientRect();
+                        if (rect.width === 0 || rect.height === 0) return false;
+                        
+                        // Filter out images with certain class names (e.g., icons, thumbnails)
+                        if (img.classList.contains('icon') || img.classList.contains('thumbnail')) return false;
+                        
+                        // Filter out images with certain patterns in their src (e.g., placeholder images)
+                        if (img.src.includes('placeholder') || img.src.includes('icon')) return false;
+                        
+                        return true;
+                    };
+
+                    const images = Array.from(document.querySelectorAll('img')).filter(filterImage);
+                    let imagesLeft = images.length;
+                    
+                    if (imagesLeft === 0) {
+                        resolve();
+                        return;
+                    }
+
+                    const checkImage = (img) => {
+                        if (img.complete && img.naturalWidth !== 0) {
+                            img.setAttribute('width', img.naturalWidth);
+                            img.setAttribute('height', img.naturalHeight);
+                            imagesLeft--;
+                            if (imagesLeft === 0) resolve();
+                        }
+                    };
+
+                    images.forEach(img => {
+                        checkImage(img);
+                        if (!img.complete) {
+                            img.onload = () => {
+                                checkImage(img);
+                            };
+                            img.onerror = () => {
+                                imagesLeft--;
+                                if (imagesLeft === 0) resolve();
+                            };
+                        }
+                    });
+
+                    // Fallback timeout of 5 seconds
+                    // setTimeout(() => resolve(), 5000);
+                    resolve();
+                });
+            }
+            """
+            await page.evaluate(update_image_dimensions_js)
+
+            # Wait a bit for any onload events to complete
+            await page.wait_for_timeout(100)
+
+            # Process iframes
+            if kwargs.get("process_iframes", False):
+                page = await self.process_iframes(page)
+            
+            await self.execute_hook('before_retrieve_html', page)
+            # Check if delay_before_return_html is set then wait for that time
+            delay_before_return_html = kwargs.get("delay_before_return_html")
+            if delay_before_return_html:
+                await asyncio.sleep(delay_before_return_html)
+                
+            # Check for remove_overlay_elements parameter
+            if kwargs.get("remove_overlay_elements", False):
+                await self.remove_overlay_elements(page)
+            
+            html = await page.content()
+            await self.execute_hook('before_return_html', page, html)
+            
+            # Check if kwargs has screenshot=True then take screenshot
+            screenshot_data = None
+            if kwargs.get("screenshot"):
+                # Check we have screenshot_wait_for parameter, if we have simply wait for that time
+                screenshot_wait_for = kwargs.get("screenshot_wait_for")
+                if screenshot_wait_for:
+                    await asyncio.sleep(screenshot_wait_for)
+                screenshot_data = await self.take_screenshot(page)          
+
+            if self.verbose:
+                print(f"[LOG] ✅ Crawled {url} successfully!")
+
+            if self.use_cached_html:
+                cache_file_path = os.path.join(
+                    Path.home(), ".crawl4ai", "cache", hashlib.md5(url.encode()).hexdigest()
+                )
+                with open(cache_file_path, "w", encoding="utf-8") as f:
+                    f.write(html)
+                # store response headers and status code in cache
+                with open(cache_file_path + ".meta", "w", encoding="utf-8") as f:
+                    json.dump({
+                        "response_headers": response_headers,
+                        "status_code": status_code
+                    }, f)
+
+            async def get_delayed_content(delay: float = 5.0) -> str:
+                if self.verbose:
+                    print(f"[LOG] Waiting for {delay} seconds before retrieving content for {url}")
+                await asyncio.sleep(delay)
+                return await page.content()
+                
+            response = AsyncCrawlResponse(
+                html=html, 
+                response_headers=response_headers, 
+                status_code=status_code,
+                screenshot=screenshot_data,
+                get_delayed_content=get_delayed_content
+            )
+            return response
+        except Error as e:
+            raise Error(f"[ERROR] 🚫 crawl(): Failed to crawl {url}: {str(e)}")
+        # finally:
+        #     if not session_id:
+        #         await page.close()
+        #         await context.close()
+
+    async def crawl_many(self, urls: List[str], **kwargs) -> List[AsyncCrawlResponse]:
+        semaphore_count = kwargs.get('semaphore_count', 5)  # Adjust as needed
+        semaphore = asyncio.Semaphore(semaphore_count)
+
+        async def crawl_with_semaphore(url):
+            async with semaphore:
+                return await self.crawl(url, **kwargs)
+
+        tasks = [crawl_with_semaphore(url) for url in urls]
+        results = await asyncio.gather(*tasks, return_exceptions=True)
+        return [result if not isinstance(result, Exception) else str(result) for result in results]
+
+    async def remove_overlay_elements(self, page: Page) -> None:
+        """
+        Removes popup overlays, modals, cookie notices, and other intrusive elements from the page.
+        
+        Args:
+            page (Page): The Playwright page instance
+        """
+        remove_overlays_js = """
+        async () => {
+            // Function to check if element is visible
+            const isVisible = (elem) => {
+                const style = window.getComputedStyle(elem);
+                return style.display !== 'none' && 
+                       style.visibility !== 'hidden' && 
+                       style.opacity !== '0';
+            };
+
+            // Common selectors for popups and overlays
+            const commonSelectors = [
+                // Close buttons first
+                'button[class*="close" i]', 'button[class*="dismiss" i]', 
+                'button[aria-label*="close" i]', 'button[title*="close" i]',
+                'a[class*="close" i]', 'span[class*="close" i]',
+                
+                // Cookie notices
+                '[class*="cookie-banner" i]', '[id*="cookie-banner" i]',
+                '[class*="cookie-consent" i]', '[id*="cookie-consent" i]',
+                
+                // Newsletter/subscription dialogs
+                '[class*="newsletter" i]', '[class*="subscribe" i]',
+                
+                // Generic popups/modals
+                '[class*="popup" i]', '[class*="modal" i]', 
+                '[class*="overlay" i]', '[class*="dialog" i]',
+                '[role="dialog"]', '[role="alertdialog"]'
+            ];
+
+            // Try to click close buttons first
+            for (const selector of commonSelectors.slice(0, 6)) {
+                const closeButtons = document.querySelectorAll(selector);
+                for (const button of closeButtons) {
+                    if (isVisible(button)) {
+                        try {
+                            button.click();
+                            await new Promise(resolve => setTimeout(resolve, 100));
+                        } catch (e) {
+                            console.log('Error clicking button:', e);
+                        }
+                    }
+                }
+            }
+
+            // Remove remaining overlay elements
+            const removeOverlays = () => {
+                // Find elements with high z-index
+                const allElements = document.querySelectorAll('*');
+                for (const elem of allElements) {
+                    const style = window.getComputedStyle(elem);
+                    const zIndex = parseInt(style.zIndex);
+                    const position = style.position;
+                    
+                    if (
+                        isVisible(elem) && 
+                        (zIndex > 999 || position === 'fixed' || position === 'absolute') &&
+                        (
+                            elem.offsetWidth > window.innerWidth * 0.5 ||
+                            elem.offsetHeight > window.innerHeight * 0.5 ||
+                            style.backgroundColor.includes('rgba') ||
+                            parseFloat(style.opacity) < 1
+                        )
+                    ) {
+                        elem.remove();
+                    }
+                }
+
+                // Remove elements matching common selectors
+                for (const selector of commonSelectors) {
+                    const elements = document.querySelectorAll(selector);
+                    elements.forEach(elem => {
+                        if (isVisible(elem)) {
+                            elem.remove();
+                        }
+                    });
+                }
+            };
+
+            // Remove overlay elements
+            removeOverlays();
+
+            // Remove any fixed/sticky position elements at the top/bottom
+            const removeFixedElements = () => {
+                const elements = document.querySelectorAll('*');
+                elements.forEach(elem => {
+                    const style = window.getComputedStyle(elem);
+                    if (
+                        (style.position === 'fixed' || style.position === 'sticky') &&
+                        isVisible(elem)
+                    ) {
+                        elem.remove();
+                    }
+                });
+            };
+
+            removeFixedElements();
+            
+            // Remove empty block elements as: div, p, span, etc.
+            const removeEmptyBlockElements = () => {
+                const blockElements = document.querySelectorAll('div, p, span, section, article, header, footer, aside, nav, main, ul, ol, li, dl, dt, dd, h1, h2, h3, h4, h5, h6');
+                blockElements.forEach(elem => {
+                    if (elem.innerText.trim() === '') {
+                        elem.remove();
+                    }
+                });
+            };
+
+            // Remove margin-right and padding-right from body (often added by modal scripts)
+            document.body.style.marginRight = '0px';
+            document.body.style.paddingRight = '0px';
+            document.body.style.overflow = 'auto';
+
+            // Wait a bit for any animations to complete
+            await new Promise(resolve => setTimeout(resolve, 100));
+        }
+        """
+        
+        try:
+            await page.evaluate(remove_overlays_js)
+            await page.wait_for_timeout(500)  # Wait for any animations to complete
+        except Exception as e:
+            if self.verbose:
+                print(f"Warning: Failed to remove overlay elements: {str(e)}")
+
+    async def take_screenshot(self, page: Page) -> str:
+        try:
+            # The page is already loaded, just take the screenshot
+            screenshot = await page.screenshot(full_page=True)
+            return base64.b64encode(screenshot).decode('utf-8')
+        except Exception as e:
+            error_message = f"Failed to take screenshot: {str(e)}"
+            print(error_message)
+
+            # Generate an error image
+            img = Image.new('RGB', (800, 600), color='black')
+            draw = ImageDraw.Draw(img)
+            font = ImageFont.load_default()
+            draw.text((10, 10), error_message, fill=(255, 255, 255), font=font)
+            
+            buffered = BytesIO()
+            img.save(buffered, format="JPEG")
+            return base64.b64encode(buffered.getvalue()).decode('utf-8')
+        finally:
+            await page.close()
+
diff --git a/main.py b/main.py
index 853cd0b7..a5da029c 100644
--- a/main.py
+++ b/main.py
@@ -321,7 +321,12 @@ app.add_middleware(
 
 # Mount the pages directory as a static directory
 app.mount("/pages", StaticFiles(directory=__location__ + "/pages"), name="pages")
-app.mount("/mkdocs", StaticFiles(directory="site", html=True), name="mkdocs")
+
+# Check if site directory exists
+if os.path.exists(__location__ + "/site"):
+    # Mount the same directory the guard just checked (not the CWD-relative "site")
+    app.mount("/mkdocs", StaticFiles(directory=__location__ + "/site", html=True), name="mkdocs")
+
 site_templates = Jinja2Templates(directory=__location__ + "/site")
 templates = Jinja2Templates(directory=__location__ + "/pages")
 
@@ -337,7 +342,10 @@ async def shutdown_event():
 
 @app.get("/")
 def read_root():
-    return RedirectResponse(url="/mkdocs")
+    if os.path.exists(__location__ + "/site"):
+        return RedirectResponse(url="/mkdocs")
+    # Return a json response
+    return {"message": "Crawl4AI API service is running"}
 
 
 @app.post("/crawl")
diff --git a/requirements.txt b/requirements.txt
index 9a942958..e83643b3 100644
--- a/requirements.txt
+++ b/requirements.txt
@@ -8,4 +8,4 @@ playwright>=1.47,<1.48
 python-dotenv~=1.0
 requests~=2.26
 beautifulsoup4~=4.12
-playwright_stealth~=1.0
+tf-playwright-stealth~=1.0

From 00026b5f8b9aec4ef5f4aa1fde8594c8118de74f Mon Sep 17 00:00:00 2001
From: Mahesh <mahesh.a.subramanian@lendistry.com>
Date: Tue, 12 Nov 2024 14:52:51 -0700
Subject: [PATCH 014/115] feat(config): Adding a configurable way of setting
 the cache directory for constrained environments

---
 crawl4ai/async_crawler_strategy.py | 4 ++--
 crawl4ai/async_database.py         | 2 +-
 crawl4ai/async_webcrawler.py       | 4 ++--
 crawl4ai/crawler_strategy.py       | 6 +++---
 crawl4ai/database.py               | 2 +-
 crawl4ai/model_loader.py           | 2 +-
 crawl4ai/utils.py                  | 2 +-
 crawl4ai/web_crawler.py            | 2 +-
 docs/md_v2/api/async-webcrawler.md | 2 +-
 setup.py                           | 2 +-
 10 files changed, 14 insertions(+), 14 deletions(-)

diff --git a/crawl4ai/async_crawler_strategy.py b/crawl4ai/async_crawler_strategy.py
index fa50e7b5..9af9f826 100644
--- a/crawl4ai/async_crawler_strategy.py
+++ b/crawl4ai/async_crawler_strategy.py
@@ -525,7 +525,7 @@ class AsyncPlaywrightCrawlerStrategy(AsyncCrawlerStrategy):
 
             if self.use_cached_html:
                 cache_file_path = os.path.join(
-                    Path.home(), ".crawl4ai", "cache", hashlib.md5(url.encode()).hexdigest()
+                    os.getenv("CRAWL4_AI_BASE_DIRECTORY", Path.home()), ".crawl4ai", "cache", hashlib.md5(url.encode()).hexdigest()
                 )
                 if os.path.exists(cache_file_path):
                     html = ""
@@ -725,7 +725,7 @@ class AsyncPlaywrightCrawlerStrategy(AsyncCrawlerStrategy):
 
             if self.use_cached_html:
                 cache_file_path = os.path.join(
-                    Path.home(), ".crawl4ai", "cache", hashlib.md5(url.encode()).hexdigest()
+                    os.getenv("CRAWL4_AI_BASE_DIRECTORY", Path.home()), ".crawl4ai", "cache", hashlib.md5(url.encode()).hexdigest()
                 )
                 with open(cache_file_path, "w", encoding="utf-8") as f:
                     f.write(html)
diff --git a/crawl4ai/async_database.py b/crawl4ai/async_database.py
index 78931d28..249c4b31 100644
--- a/crawl4ai/async_database.py
+++ b/crawl4ai/async_database.py
@@ -10,7 +10,7 @@ import logging
 logging.basicConfig(level=logging.INFO)
 logger = logging.getLogger(__name__)
 
-DB_PATH = os.path.join(Path.home(), ".crawl4ai")
+DB_PATH = os.path.join(os.getenv("CRAWL4_AI_BASE_DIRECTORY", Path.home()), ".crawl4ai")
 os.makedirs(DB_PATH, exist_ok=True)
 DB_PATH = os.path.join(DB_PATH, "crawl4ai.db")
 
diff --git a/crawl4ai/async_webcrawler.py b/crawl4ai/async_webcrawler.py
index ceb9ad28..38e429ca 100644
--- a/crawl4ai/async_webcrawler.py
+++ b/crawl4ai/async_webcrawler.py
@@ -23,14 +23,14 @@ class AsyncWebCrawler:
         self,
         crawler_strategy: Optional[AsyncCrawlerStrategy] = None,
         always_by_pass_cache: bool = False,
-        base_directory: str = str(Path.home()),
+        base_directory: str = str(os.getenv("CRAWL4_AI_BASE_DIRECTORY", Path.home())),
         **kwargs,
     ):
         self.crawler_strategy = crawler_strategy or AsyncPlaywrightCrawlerStrategy(
             **kwargs
         )
         self.always_by_pass_cache = always_by_pass_cache
-        # self.crawl4ai_folder = os.path.join(Path.home(), ".crawl4ai")
+        # self.crawl4ai_folder = os.path.join(os.getenv("CRAWL4_AI_BASE_DIRECTORY", Path.home()), ".crawl4ai")
         self.crawl4ai_folder = os.path.join(base_directory, ".crawl4ai")
         os.makedirs(self.crawl4ai_folder, exist_ok=True)
         os.makedirs(f"{self.crawl4ai_folder}/cache", exist_ok=True)
diff --git a/crawl4ai/crawler_strategy.py b/crawl4ai/crawler_strategy.py
index 5d6864b5..ce802e49 100644
--- a/crawl4ai/crawler_strategy.py
+++ b/crawl4ai/crawler_strategy.py
@@ -132,7 +132,7 @@ class LocalSeleniumCrawlerStrategy(CrawlerStrategy):
 
         # chromedriver_autoinstaller.install()
         # import chromedriver_autoinstaller
-        # crawl4ai_folder = os.path.join(Path.home(), ".crawl4ai")
+        # crawl4ai_folder = os.path.join(os.getenv("CRAWL4_AI_BASE_DIRECTORY", Path.home()), ".crawl4ai")
         # driver = webdriver.Chrome(service=ChromeService(ChromeDriverManager().install()), options=self.options)
         # chromedriver_path = chromedriver_autoinstaller.install()
         # chromedriver_path = chromedriver_autoinstaller.utils.download_chromedriver()
@@ -205,7 +205,7 @@ class LocalSeleniumCrawlerStrategy(CrawlerStrategy):
         url_hash = hashlib.md5(url.encode()).hexdigest()
         
         if self.use_cached_html:
-            cache_file_path = os.path.join(Path.home(), ".crawl4ai", "cache", url_hash)
+            cache_file_path = os.path.join(os.getenv("CRAWL4_AI_BASE_DIRECTORY", Path.home()), ".crawl4ai", "cache", url_hash)
             if os.path.exists(cache_file_path):
                 with open(cache_file_path, "r") as f:
                     return sanitize_input_encode(f.read())
@@ -275,7 +275,7 @@ class LocalSeleniumCrawlerStrategy(CrawlerStrategy):
             self.driver = self.execute_hook('before_return_html', self.driver, html)
             
             # Store in cache
-            cache_file_path = os.path.join(Path.home(), ".crawl4ai", "cache", url_hash)
+            cache_file_path = os.path.join(os.getenv("CRAWL4_AI_BASE_DIRECTORY", Path.home()), ".crawl4ai", "cache", url_hash)
             with open(cache_file_path, "w", encoding="utf-8") as f:
                 f.write(html)
                 
diff --git a/crawl4ai/database.py b/crawl4ai/database.py
index 37d94463..42ad7017 100644
--- a/crawl4ai/database.py
+++ b/crawl4ai/database.py
@@ -3,7 +3,7 @@ from pathlib import Path
 import sqlite3
 from typing import Optional, Tuple
 
-DB_PATH = os.path.join(Path.home(), ".crawl4ai")
+DB_PATH = os.path.join(os.getenv("CRAWL4_AI_BASE_DIRECTORY", Path.home()), ".crawl4ai")
 os.makedirs(DB_PATH, exist_ok=True)
 DB_PATH = os.path.join(DB_PATH, "crawl4ai.db")
 
diff --git a/crawl4ai/model_loader.py b/crawl4ai/model_loader.py
index 7b3a2846..d1872d7e 100644
--- a/crawl4ai/model_loader.py
+++ b/crawl4ai/model_loader.py
@@ -56,7 +56,7 @@ def set_model_device(model):
 
 @lru_cache()
 def get_home_folder():
-    home_folder = os.path.join(Path.home(), ".crawl4ai")
+    home_folder = os.path.join(os.getenv("CRAWL4_AI_BASE_DIRECTORY", Path.home()), ".crawl4ai")
     os.makedirs(home_folder, exist_ok=True)
     os.makedirs(f"{home_folder}/cache", exist_ok=True)
     os.makedirs(f"{home_folder}/models", exist_ok=True)
diff --git a/crawl4ai/utils.py b/crawl4ai/utils.py
index d96f1ded..1f15dea1 100644
--- a/crawl4ai/utils.py
+++ b/crawl4ai/utils.py
@@ -60,7 +60,7 @@ def get_system_memory():
         raise OSError("Unsupported operating system")
 
 def get_home_folder():
-    home_folder = os.path.join(Path.home(), ".crawl4ai")
+    home_folder = os.path.join(os.getenv("CRAWL4_AI_BASE_DIRECTORY", Path.home()), ".crawl4ai")
     os.makedirs(home_folder, exist_ok=True)
     os.makedirs(f"{home_folder}/cache", exist_ok=True)
     os.makedirs(f"{home_folder}/models", exist_ok=True)
diff --git a/crawl4ai/web_crawler.py b/crawl4ai/web_crawler.py
index 20e9b04e..d44de183 100644
--- a/crawl4ai/web_crawler.py
+++ b/crawl4ai/web_crawler.py
@@ -20,7 +20,7 @@ class WebCrawler:
     def __init__(self, crawler_strategy: CrawlerStrategy = None, always_by_pass_cache: bool = False, verbose: bool = False):
         self.crawler_strategy = crawler_strategy or LocalSeleniumCrawlerStrategy(verbose=verbose)
         self.always_by_pass_cache = always_by_pass_cache
-        self.crawl4ai_folder = os.path.join(Path.home(), ".crawl4ai")
+        self.crawl4ai_folder = os.path.join(os.getenv("CRAWL4_AI_BASE_DIRECTORY", Path.home()), ".crawl4ai")
         os.makedirs(self.crawl4ai_folder, exist_ok=True)
         os.makedirs(f"{self.crawl4ai_folder}/cache", exist_ok=True)
         init_db()
diff --git a/docs/md_v2/api/async-webcrawler.md b/docs/md_v2/api/async-webcrawler.md
index 25164f6c..be956101 100644
--- a/docs/md_v2/api/async-webcrawler.md
+++ b/docs/md_v2/api/async-webcrawler.md
@@ -13,7 +13,7 @@ AsyncWebCrawler(
     
     # Cache Settings
     always_by_pass_cache: bool = False,     # Always bypass cache
-    base_directory: str = str(Path.home()), # Base directory for cache
+    base_directory: str = str(os.getenv("CRAWL4_AI_BASE_DIRECTORY", Path.home())), # Base directory for cache
     
     # Network Settings
     proxy: str = None,                      # Simple proxy URL
diff --git a/setup.py b/setup.py
index 93190291..90063212 100644
--- a/setup.py
+++ b/setup.py
@@ -8,7 +8,7 @@ import sys
 
 # Create the .crawl4ai folder in the user's home directory if it doesn't exist
 # If the folder already exists, remove the cache folder
-crawl4ai_folder = Path.home() / ".crawl4ai"
+crawl4ai_folder = Path(os.getenv("CRAWL4_AI_BASE_DIRECTORY", Path.home())) / ".crawl4ai"  # getenv yields str; Path() keeps "/" and .exists() working
 cache_folder = crawl4ai_folder / "cache"
 
 if cache_folder.exists():

From bf91adf3f84ade380b819f55c444ed87c80c032b Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Wed, 13 Nov 2024 15:37:16 +0800
Subject: [PATCH 015/115] fix: Resolve unexpected BrowserContext closure during
 crawl in Docker

- Removed __del__ method in AsyncPlaywrightCrawlerStrategy to ensure reliable browser lifecycle management by using explicit context managers.
- Added process monitoring in ManagedBrowser to detect and log unexpected terminations of the browser subprocess.
- Updated Docker configuration to expose port 9222 for remote debugging and allocate extra shared memory to prevent browser crashes.
- Improved error handling and resource cleanup for browser instances, particularly in Docker environments.

Resolves Issue #256
---
 .gitignore                         |  1 +
 Dockerfile                         |  7 ++++++-
 README.md                          |  5 ++++-
 crawl4ai/__init__.py               |  4 ++--
 crawl4ai/async_crawler_strategy.py | 22 +++++++++++++++++++---
 crawl4ai/async_webcrawler.py       | 14 +++++++-------
 crawl4ai/config.py                 |  2 ++
 crawl4ai/web_crawler.py            | 17 ++++++++++++++++-
 8 files changed, 57 insertions(+), 15 deletions(-)

diff --git a/.gitignore b/.gitignore
index 4c3e151e..aca02959 100644
--- a/.gitignore
+++ b/.gitignore
@@ -199,6 +199,7 @@ test_env/
 **/.DS_Store
 
 todo.md
+todo_executor.md
 git_changes.py
 git_changes.md
 pypi_build.sh
diff --git a/Dockerfile b/Dockerfile
index 9a921d03..125fb9b8 100644
--- a/Dockerfile
+++ b/Dockerfile
@@ -115,7 +115,12 @@ HEALTHCHECK --interval=30s --timeout=30s --start-period=5s --retries=3 \
     CMD curl -f http://localhost:8000/health || exit 1
 
 # Expose port
-EXPOSE 8000
+EXPOSE 8000 11235 9222 8080
+
+# Optional: Increase shared memory size to prevent browser crashes
+# when loading heavy pages
+RUN mkdir -p /dev/shm
+VOLUME /dev/shm
 
 # Start the FastAPI server
 CMD ["uvicorn", "main:app", "--host", "0.0.0.0", "--port", "11235"]
\ No newline at end of file
diff --git a/README.md b/README.md
index e1a64aa1..d250f936 100644
--- a/README.md
+++ b/README.md
@@ -1,4 +1,4 @@
-# 🔥🕷️ Crawl4AI: LLM Friendly Web Crawler & Scrapper
+# 🔥🕷️ Crawl4AI: LLM Friendly Web Crawler & Scraper
 
 <a href="https://trendshift.io/repositories/11716" target="_blank"><img src="https://trendshift.io/api/badge/repositories/11716" alt="unclecode%2Fcrawl4ai | Trendshift" style="width: 250px; height: 55px;" width="250" height="55"/></a>
 
@@ -127,6 +127,9 @@ docker pull unclecode/crawl4ai:gpu      # GPU-enabled version
 
 # Run the container
 docker run -p 11235:11235 unclecode/crawl4ai:basic  # Replace 'basic' with your chosen version
+
+# In case to allocate more shared memory for the container
+docker run --shm-size=2gb -p 11235:11235 unclecode/crawl4ai:basic
 ```
 
 #### Option 2: Build from Repository
diff --git a/crawl4ai/__init__.py b/crawl4ai/__init__.py
index 0c6a2db4..1bcc491c 100644
--- a/crawl4ai/__init__.py
+++ b/crawl4ai/__init__.py
@@ -26,5 +26,5 @@ if is_sync_version_installed():
         print("Warning: Failed to import WebCrawler even though selenium is installed. This might be due to other missing dependencies.")
 else:
     WebCrawler = None
-    import warnings
-    print("Warning: Synchronous WebCrawler is not available. Install crawl4ai[sync] for synchronous support. However, please note that the synchronous version will be deprecated soon.")
\ No newline at end of file
+    # import warnings
+    # print("Warning: Synchronous WebCrawler is not available. Install crawl4ai[sync] for synchronous support. However, please note that the synchronous version will be deprecated soon.")
\ No newline at end of file
diff --git a/crawl4ai/async_crawler_strategy.py b/crawl4ai/async_crawler_strategy.py
index 896a0644..57288b59 100644
--- a/crawl4ai/async_crawler_strategy.py
+++ b/crawl4ai/async_crawler_strategy.py
@@ -64,12 +64,27 @@ class ManagedBrowser:
                 stdout=subprocess.PIPE,
                 stderr=subprocess.PIPE
             )
+            # Monitor browser process output for errors
+            asyncio.create_task(self._monitor_browser_process())
             await asyncio.sleep(2)  # Give browser time to start
             return f"http://localhost:{self.debugging_port}"
         except Exception as e:
             await self.cleanup()
             raise Exception(f"Failed to start browser: {e}")
 
+    async def _monitor_browser_process(self):
+        """Monitor the browser process for unexpected termination."""
+        if self.browser_process:
+            stdout, stderr = await asyncio.gather(
+                asyncio.to_thread(self.browser_process.stdout.read),
+                asyncio.to_thread(self.browser_process.stderr.read)
+            )
+            if self.browser_process.poll() is not None:
+                print(f"Browser process terminated unexpectedly with code {self.browser_process.returncode}")
+                print(f"STDOUT: {stdout.decode()}")
+                print(f"STDERR: {stderr.decode()}")
+                await self.cleanup()
+    
     def _get_browser_path(self) -> str:
         """Returns the browser executable path based on OS and browser type"""
         if sys.platform == "darwin":  # macOS
@@ -330,9 +345,10 @@ class AsyncPlaywrightCrawlerStrategy(AsyncCrawlerStrategy):
             await self.playwright.stop()
             self.playwright = None
 
-    def __del__(self):
-        if self.browser or self.playwright:
-            asyncio.get_event_loop().run_until_complete(self.close())
+    # Issue #256: Remove __del__ method to avoid potential issues with async cleanup
+    # def __del__(self):
+    #     if self.browser or self.playwright:
+    #         asyncio.get_event_loop().run_until_complete(self.close())
 
     def set_hook(self, hook_type: str, hook: Callable):
         if hook_type in self.hooks:
diff --git a/crawl4ai/async_webcrawler.py b/crawl4ai/async_webcrawler.py
index ceb9ad28..f580776b 100644
--- a/crawl4ai/async_webcrawler.py
+++ b/crawl4ai/async_webcrawler.py
@@ -47,17 +47,17 @@ class AsyncWebCrawler:
 
     async def awarmup(self):
         # Print a message for crawl4ai and its version
-        print(f"[LOG] 🚀 Crawl4AI {crawl4ai_version}")
         if self.verbose:
+            print(f"[LOG] 🚀 Crawl4AI {crawl4ai_version}")
             print("[LOG] 🌤️  Warming up the AsyncWebCrawler")
         # await async_db_manager.ainit_db()
         await async_db_manager.initialize()
-        await self.arun(
-            url="https://google.com/",
-            word_count_threshold=5,
-            bypass_cache=False,
-            verbose=False,
-        )
+        # await self.arun(
+        #     url="https://google.com/",
+        #     word_count_threshold=5,
+        #     bypass_cache=False,
+        #     verbose=False,
+        # )
         self.ready = True
         if self.verbose:
             print("[LOG] 🌞 AsyncWebCrawler is ready to crawl")
diff --git a/crawl4ai/config.py b/crawl4ai/config.py
index a07ca977..16638b6d 100644
--- a/crawl4ai/config.py
+++ b/crawl4ai/config.py
@@ -51,3 +51,5 @@ SOCIAL_MEDIA_DOMAINS = [
 # If image format is in jpg, png or webp
 # If image is in the first half of the total images extracted from the page
 IMAGE_SCORE_THRESHOLD = 2
+
+MAX_METRICS_HISTORY = 1000
\ No newline at end of file
diff --git a/crawl4ai/web_crawler.py b/crawl4ai/web_crawler.py
index 20e9b04e..95af6c7a 100644
--- a/crawl4ai/web_crawler.py
+++ b/crawl4ai/web_crawler.py
@@ -10,6 +10,7 @@ from .extraction_strategy import *
 from .crawler_strategy import *
 from typing import List
 from concurrent.futures import ThreadPoolExecutor
+from .content_scrapping_strategy import WebScrappingStrategy
 from .config import *
 import warnings
 import json
@@ -181,7 +182,21 @@ class WebCrawler:
             # Extract content from HTML
             try:
                 t1 = time.time()
-                result = get_content_of_website_optimized(url, html, word_count_threshold, css_selector=css_selector, only_text=kwargs.get("only_text", False))
+                scrapping_strategy = WebScrappingStrategy()
+                extra_params = {k: v for k, v in kwargs.items() if k not in ["only_text", "image_description_min_word_threshold"]}
+                result = scrapping_strategy.scrap(
+                    url,
+                    html,
+                    word_count_threshold=word_count_threshold,
+                    css_selector=css_selector,
+                    only_text=kwargs.get("only_text", False),
+                    image_description_min_word_threshold=kwargs.get(
+                        "image_description_min_word_threshold", IMAGE_DESCRIPTION_MIN_WORD_THRESHOLD
+                    ),
+                    **extra_params,
+                )
+                
+                # result = get_content_of_website_optimized(url, html, word_count_threshold, css_selector=css_selector, only_text=kwargs.get("only_text", False))
                 if verbose:
                     print(f"[LOG] 🚀 Content extracted for {url}, success: True, time taken: {time.time() - t1:.2f} seconds")
                 

From 61b93ebf362205e2c96c5c2d74bc1b880ca59f51 Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Wed, 13 Nov 2024 15:38:30 +0800
Subject: [PATCH 016/115] Update change log

---
 CHANGELOG.md | 7 ++++++-
 1 file changed, 6 insertions(+), 1 deletion(-)

diff --git a/CHANGELOG.md b/CHANGELOG.md
index 583c7807..ff52e10e 100644
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -1,6 +1,11 @@
 # Changelog
 
-# CHANGELOG
+## [v0.3.731] - 2024-11-13 Changelog for Issue 256 Fix
+- Fixed: Browser context unexpectedly closing in Docker environment during crawl operations.
+- Removed: __del__ method from AsyncPlaywrightCrawlerStrategy to prevent unreliable asynchronous cleanup, ensuring - browser context is closed explicitly within context managers.
+- Added: Monitoring for ManagedBrowser subprocess to detect and log unexpected terminations.
+- Updated: Dockerfile configurations to expose debugging port (9222) and allocate additional shared memory for improved browser stability.
+- Improved: Error handling and resource cleanup processes for browser lifecycle management within the Docker environment.
 
 ## [v0.3.73] - 2024-11-05
 

From c38ac29edbcebcb2f3672145424e7af3193caa6e Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Wed, 13 Nov 2024 19:40:40 +0800
Subject: [PATCH 017/115] perf(crawler): major performance improvements & raw
 HTML support

- Switch to lxml parser (~4x speedup)
- Add raw HTML & local file crawling support
- Fix cache headers & async cleanup
- Add browser process monitoring
- Optimize BeautifulSoup operations
- Pre-compile regex patterns

Breaking: Raw HTML handling requires new URL prefixes
Fixes: #256, #253
---
 CHANGELOG.md                                 |   33 +-
 crawl4ai/async_crawler_strategy.py           |  114 +-
 crawl4ai/async_database.py                   |   67 +-
 crawl4ai/async_webcrawler.py                 |  127 +-
 crawl4ai/content_cleaning_strategy.py        |   10 +-
 crawl4ai/content_scrapping_strategy.py       |  102 +-
 crawl4ai/utils.py                            |   50 +-
 crawl4ai/web_crawler.py                      |    4 +-
 docs/md_v2/basic/prefix-based-input.md       |  235 ++
 tests/async/sample_wikipedia.html            | 2179 ++++++++++++++++++
 tests/async/test_content_scraper_strategy.py |  162 ++
 11 files changed, 2953 insertions(+), 130 deletions(-)
 create mode 100644 docs/md_v2/basic/prefix-based-input.md
 create mode 100644 tests/async/sample_wikipedia.html
 create mode 100644 tests/async/test_content_scraper_strategy.py

diff --git a/CHANGELOG.md b/CHANGELOG.md
index ff52e10e..33d09184 100644
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -1,5 +1,30 @@
 # Changelog
 
+# Changelog - November 13, 2024
+
+### Added
+- Support for raw HTML and local file crawling via URL prefixes ('raw:', 'file://')
+- Browser process monitoring for managed browser instances
+- Screenshot capability for raw HTML and local file content
+- Response headers storage in cache database
+- New `fit_markdown` flag for optional markdown generation
+
+### Changed
+- Switched HTML parser from 'html.parser' to 'lxml' for ~4x performance improvement 
+- Optimized BeautifulSoup text conversion and element selection
+- Pre-compiled regular expressions for better performance
+- Improved metadata extraction efficiency
+- Response headers now stored alongside HTML in cache
+
+### Removed
+- `__del__` method from AsyncPlaywrightCrawlerStrategy to prevent async cleanup issues
+
+### Fixed 
+- Issue #256: Added support for crawling raw HTML content
+- Issue #253: Implemented file:// protocol handling
+- Missing response headers in cached results
+- Memory leaks from improper async cleanup
+
 ## [v0.3.731] - 2024-11-13 Changelog for Issue 256 Fix
 - Fixed: Browser context unexpectedly closing in Docker environment during crawl operations.
 - Removed: __del__ method from AsyncPlaywrightCrawlerStrategy to prevent unreliable asynchronous cleanup, ensuring - browser context is closed explicitly within context managers.
@@ -185,7 +210,7 @@ This commit introduces several key enhancements, including improved error handli
 ## [v0.3.72] - 2024-10-20
 
 ### Fixed
-- Added support for parsing Base64 encoded images in WebScrappingStrategy
+- Added support for parsing Base64 encoded images in WebScrapingStrategy
 
 ### Added
 - Forked and integrated a customized version of the html2text library for more control over Markdown generation
@@ -208,7 +233,7 @@ This commit introduces several key enhancements, including improved error handli
 ### Developer Notes
 - The customized html2text library is now located within the crawl4ai package
 - New configuration options are available in the `config.py` file for external content handling
-- The `WebScrappingStrategy` class has been updated to accommodate new external content exclusion options
+- The `WebScrapingStrategy` class has been updated to accommodate new external content exclusion options
 
 ## [v0.3.71] - 2024-10-19
 
@@ -285,7 +310,7 @@ These updates aim to provide more flexibility in text processing, improve perfor
 
 ### Improvements
 1. **Better Error Handling**:
-   - Enhanced error reporting in WebScrappingStrategy with detailed error messages and suggestions.
+   - Enhanced error reporting in WebScrapingStrategy with detailed error messages and suggestions.
    - Added console message and error logging for better debugging.
 
 2. **Image Processing Enhancements**:
@@ -350,7 +375,7 @@ These updates aim to provide more flexibility in text processing, improve perfor
 - Allows for more customized setups.
 
 ### 2. Image Processing Optimization
-- Enhanced image handling in WebScrappingStrategy.
+- Enhanced image handling in WebScrapingStrategy.
 - Added filtering for small, invisible, or irrelevant images.
 - Improved image scoring system for better content relevance.
 - Implemented JavaScript-based image dimension updating for more accurate representation.
diff --git a/crawl4ai/async_crawler_strategy.py b/crawl4ai/async_crawler_strategy.py
index 57288b59..baa06e47 100644
--- a/crawl4ai/async_crawler_strategy.py
+++ b/crawl4ai/async_crawler_strategy.py
@@ -84,7 +84,7 @@ class ManagedBrowser:
                 print(f"STDOUT: {stdout.decode()}")
                 print(f"STDERR: {stderr.decode()}")
                 await self.cleanup()
-    
+
     def _get_browser_path(self) -> str:
         """Returns the browser executable path based on OS and browser type"""
         if sys.platform == "darwin":  # macOS
@@ -493,6 +493,75 @@ class AsyncPlaywrightCrawlerStrategy(AsyncCrawlerStrategy):
         return page  
     
     async def crawl(self, url: str, **kwargs) -> AsyncCrawlResponse:
+        """
+        Crawls a given URL or processes raw HTML/local file content based on the URL prefix.
+
+        Args:
+            url (str): The URL to crawl. Supported prefixes:
+                - 'http://' or 'https://': Web URL to crawl.
+                - 'file://': Local file path to process.
+                - 'raw:': Raw HTML content to process.
+            **kwargs: Additional parameters:
+                - 'screenshot' (bool): Whether to take a screenshot.
+                - ... [other existing parameters]
+
+        Returns:
+            AsyncCrawlResponse: The response containing HTML, headers, status code, and optional screenshot.
+        """
+        response_headers = {}
+        status_code = 200  # Default to 200 for local/raw HTML
+        screenshot_requested = kwargs.get('screenshot', False)
+        screenshot_data = None
+
+        if url.startswith(('http://', 'https://')):
+            # Proceed with standard web crawling
+            return await self._crawl_web(url, **kwargs)
+
+        elif url.startswith('file://'):
+            # Process local file
+            local_file_path = url[7:]  # Remove 'file://' prefix
+            if not os.path.exists(local_file_path):
+                raise FileNotFoundError(f"Local file not found: {local_file_path}")
+            with open(local_file_path, 'r', encoding='utf-8') as f:
+                html = f.read()
+            if screenshot_requested:
+                screenshot_data = await self._generate_screenshot_from_html(html)
+            return AsyncCrawlResponse(
+                html=html,
+                response_headers=response_headers,
+                status_code=status_code,
+                screenshot=screenshot_data,
+                get_delayed_content=None
+            )
+
+        elif url.startswith('raw:'):
+            # Process raw HTML content
+            raw_html = url[4:]  # Remove 'raw:' prefix
+            html = raw_html
+            if screenshot_requested:
+                screenshot_data = await self._generate_screenshot_from_html(html)
+            return AsyncCrawlResponse(
+                html=html,
+                response_headers=response_headers,
+                status_code=status_code,
+                screenshot=screenshot_data,
+                get_delayed_content=None
+            )
+        else:
+            raise ValueError("URL must start with 'http://', 'https://', 'file://', or 'raw:'")
+
+
+    async def _crawl_web(self, url: str, **kwargs) -> AsyncCrawlResponse:
+        """
+        Existing web crawling logic remains unchanged.
+
+        Args:
+            url (str): The web URL to crawl.
+            **kwargs: Additional parameters.
+
+        Returns:
+            AsyncCrawlResponse: The response containing HTML, headers, status code, and optional screenshot.
+        """
         response_headers = {}
         status_code = None
         
@@ -792,7 +861,7 @@ class AsyncPlaywrightCrawlerStrategy(AsyncCrawlerStrategy):
 
             if self.verbose:
                 print(f"[LOG] ✅ Crawled {url} successfully!")
-
+           
             if self.use_cached_html:
                 cache_file_path = os.path.join(
                     Path.home(), ".crawl4ai", "cache", hashlib.md5(url.encode()).hexdigest()
@@ -972,6 +1041,15 @@ class AsyncPlaywrightCrawlerStrategy(AsyncCrawlerStrategy):
                 print(f"Warning: Failed to remove overlay elements: {str(e)}")
 
     async def take_screenshot(self, page: Page) -> str:
+        """
+        Takes a screenshot of the current page.
+        
+        Args:
+            page (Page): The Playwright page instance
+            
+        Returns:
+            str: Base64-encoded screenshot image
+        """
         try:
             # The page is already loaded, just take the screenshot
             screenshot = await page.screenshot(full_page=True)
@@ -991,4 +1069,39 @@ class AsyncPlaywrightCrawlerStrategy(AsyncCrawlerStrategy):
             return base64.b64encode(buffered.getvalue()).decode('utf-8')
         finally:
             await page.close()
+            
+    async def _generate_screenshot_from_html(self, html: str) -> Optional[str]:
+        """
+        Generates a screenshot from raw HTML content.
+
+        Starts the browser if it is not running yet, renders the HTML in a
+        fresh page and captures a full-page screenshot. The page is always
+        closed, including when rendering or capturing fails.
+
+        Args:
+            html (str): The HTML content to render and capture.
+
+        Returns:
+            Optional[str]: Base64-encoded screenshot image or an error image if failed.
+        """
+        page = None  # stays None if the browser/page could not be created
+        try:
+            if not self.browser:
+                await self.start()
+            page = await self.browser.new_page()
+            await page.set_content(html, wait_until='networkidle')
+            screenshot = await page.screenshot(full_page=True)
+            return base64.b64encode(screenshot).decode('utf-8')
+        except Exception as e:
+            error_message = f"Failed to take screenshot: {str(e)}"
+            print(error_message)
+
+            # Generate an error image
+            img = Image.new('RGB', (800, 600), color='black')
+            draw = ImageDraw.Draw(img)
+            font = ImageFont.load_default()
+            draw.text((10, 10), error_message, fill=(255, 255, 255), font=font)
+
+            buffered = BytesIO()
+            img.save(buffered, format="JPEG")
+            return base64.b64encode(buffered.getvalue()).decode('utf-8')
+        finally:
+            # Close the page on every path so a failed render does not leak it
+            if page is not None:
+                await page.close()
 
diff --git a/crawl4ai/async_database.py b/crawl4ai/async_database.py
index 78931d28..273ca6c9 100644
--- a/crawl4ai/async_database.py
+++ b/crawl4ai/async_database.py
@@ -5,6 +5,7 @@ import asyncio
 from typing import Optional, Tuple, Dict
 from contextlib import asynccontextmanager
 import logging
+import json  # Added for serialization/deserialization
 
 # Set up logging
 logging.basicConfig(level=logging.INFO)
@@ -89,7 +90,8 @@ class AsyncDatabaseManager:
                     media TEXT DEFAULT "{}",
                     links TEXT DEFAULT "{}",
                     metadata TEXT DEFAULT "{}",
-                    screenshot TEXT DEFAULT ""
+                    screenshot TEXT DEFAULT "",
+                    response_headers TEXT DEFAULT "{}"  -- New column added
                 )
             ''')
         
@@ -105,26 +107,51 @@ class AsyncDatabaseManager:
 
         column_names = await self.execute_with_retry(_check_columns)
         
-        for column in ['media', 'links', 'metadata', 'screenshot']:
+        # List of new columns to add
+        new_columns = ['media', 'links', 'metadata', 'screenshot', 'response_headers']
+        
+        for column in new_columns:
             if column not in column_names:
                 await self.aalter_db_add_column(column)
 
     async def aalter_db_add_column(self, new_column: str):
         """Add new column to the database"""
         async def _alter(db):
-            await db.execute(f'ALTER TABLE crawled_data ADD COLUMN {new_column} TEXT DEFAULT ""')
+            if new_column == 'response_headers':  # this column's default is the text "{}" ("{{}}" is the f-string escape)
+                await db.execute(f'ALTER TABLE crawled_data ADD COLUMN {new_column} TEXT DEFAULT "{{}}"')
+            else:  # every other column defaults to an empty string
+                await db.execute(f'ALTER TABLE crawled_data ADD COLUMN {new_column} TEXT DEFAULT ""')
             logger.info(f"Added column '{new_column}' to the database.")
 
         await self.execute_with_retry(_alter)
 
-    async def aget_cached_url(self, url: str) -> Optional[Tuple[str, str, str, str, str, str, str, bool, str]]:
+    async def aget_cached_url(self, url: str) -> Optional[Tuple[str, str, str, str, str, bool, Dict, Dict, Dict, str, Dict]]:
         """Retrieve cached URL data"""
         async def _get(db):
             async with db.execute(
-                'SELECT url, html, cleaned_html, markdown, extracted_content, success, media, links, metadata, screenshot FROM crawled_data WHERE url = ?',
+                '''
+                SELECT url, html, cleaned_html, markdown, extracted_content, success, media, links, metadata, screenshot, response_headers
+                FROM crawled_data WHERE url = ?
+                ''',
                 (url,)
             ) as cursor:
-                return await cursor.fetchone()
+                row = await cursor.fetchone()
+                if row:
+                    # Deserialize the JSON text columns; NULL or empty values are parsed as '{}'
+                    return (
+                        row[0],  # url
+                        row[1],  # html
+                        row[2],  # cleaned_html
+                        row[3],  # markdown
+                        row[4],  # extracted_content
+                        row[5],  # success
+                        json.loads(row[6] or '{}'),  # media
+                        json.loads(row[7] or '{}'),  # links
+                        json.loads(row[8] or '{}'),  # metadata
+                        row[9],  # screenshot
+                        json.loads(row[10] or '{}')  # response_headers
+                    )
+                return None
 
         try:
             return await self.execute_with_retry(_get)
@@ -132,12 +159,27 @@ class AsyncDatabaseManager:
             logger.error(f"Error retrieving cached URL: {e}")
             return None
 
-    async def acache_url(self, url: str, html: str, cleaned_html: str, markdown: str, extracted_content: str, success: bool, media: str = "{}", links: str = "{}", metadata: str = "{}", screenshot: str = ""):
+    async def acache_url(
+        self,
+        url: str,
+        html: str,
+        cleaned_html: str,
+        markdown: str,
+        extracted_content: str,
+        success: bool,
+        media: str = "{}",
+        links: str = "{}",
+        metadata: str = "{}",
+        screenshot: str = "",
+        response_headers: str = "{}"  # New parameter added
+    ):
         """Cache URL data with retry logic"""
         async def _cache(db):
             await db.execute('''
-                INSERT INTO crawled_data (url, html, cleaned_html, markdown, extracted_content, success, media, links, metadata, screenshot)
-                VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?, ?)
+                INSERT INTO crawled_data (
+                    url, html, cleaned_html, markdown, extracted_content, success, media, links, metadata, screenshot, response_headers
+                )
+                VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?)
                 ON CONFLICT(url) DO UPDATE SET
                     html = excluded.html,
                     cleaned_html = excluded.cleaned_html,
@@ -147,8 +189,9 @@ class AsyncDatabaseManager:
                     media = excluded.media,      
                     links = excluded.links,    
                     metadata = excluded.metadata,      
-                    screenshot = excluded.screenshot
-            ''', (url, html, cleaned_html, markdown, extracted_content, success, media, links, metadata, screenshot))
+                    screenshot = excluded.screenshot,
+                    response_headers = excluded.response_headers  -- Update response_headers
+            ''', (url, html, cleaned_html, markdown, extracted_content, success, media, links, metadata, screenshot, response_headers))
 
         try:
             await self.execute_with_retry(_cache)
@@ -189,4 +232,4 @@ class AsyncDatabaseManager:
             logger.error(f"Error flushing database: {e}")
 
 # Create a singleton instance
-async_db_manager = AsyncDatabaseManager()
\ No newline at end of file
+async_db_manager = AsyncDatabaseManager()
diff --git a/crawl4ai/async_webcrawler.py b/crawl4ai/async_webcrawler.py
index f580776b..9d0340dc 100644
--- a/crawl4ai/async_webcrawler.py
+++ b/crawl4ai/async_webcrawler.py
@@ -9,7 +9,7 @@ from .async_database import async_db_manager
 from .chunking_strategy import *
 from .extraction_strategy import *
 from .async_crawler_strategy import AsyncCrawlerStrategy, AsyncPlaywrightCrawlerStrategy, AsyncCrawlResponse
-from .content_scrapping_strategy import WebScrappingStrategy
+from .content_scrapping_strategy import WebScrapingStrategy
 from .config import MIN_WORD_THRESHOLD, IMAGE_DESCRIPTION_MIN_WORD_THRESHOLD
 from .utils import (
     sanitize_input_encode,
@@ -47,17 +47,17 @@ class AsyncWebCrawler:
 
     async def awarmup(self):
         # Print a message for crawl4ai and its version
+        print(f"[LOG] 🚀 Crawl4AI {crawl4ai_version}")
         if self.verbose:
-            print(f"[LOG] 🚀 Crawl4AI {crawl4ai_version}")
             print("[LOG] 🌤️  Warming up the AsyncWebCrawler")
         # await async_db_manager.ainit_db()
         await async_db_manager.initialize()
-        # await self.arun(
-        #     url="https://google.com/",
-        #     word_count_threshold=5,
-        #     bypass_cache=False,
-        #     verbose=False,
-        # )
+        await self.arun(
+            url="https://google.com/",
+            word_count_threshold=5,
+            bypass_cache=False,
+            verbose=False,
+        )
         self.ready = True
         if self.verbose:
             print("[LOG] 🌞 AsyncWebCrawler is ready to crawl")
@@ -75,6 +75,19 @@ class AsyncWebCrawler:
         verbose=True,
         **kwargs,
     ) -> CrawlResult:
+        """
+        Runs the crawler for a single source: URL (web, local file, or raw HTML).
+
+        Args:
+            url (str): The URL to crawl. Supported prefixes:
+                - 'http://' or 'https://': Web URL to crawl.
+                - 'file://': Local file path to process.
+                - 'raw:': Raw HTML content to process.
+            ... [other existing parameters]
+
+        Returns:
+            CrawlResult: The result of the crawling and processing.
+        """
         try:
             extraction_strategy = extraction_strategy or NoExtractionStrategy()
             extraction_strategy.verbose = verbose
@@ -89,8 +102,13 @@ class AsyncWebCrawler:
             cached = None
             screenshot_data = None
             extracted_content = None
-            if not bypass_cache and not self.always_by_pass_cache:
+            
+            is_web_url = url.startswith(('http://', 'https://'))
+            if is_web_url and not bypass_cache and not self.always_by_pass_cache:
                 cached = await async_db_manager.aget_cached_url(url)
+                        
+            # if not bypass_cache and not self.always_by_pass_cache:
+            #     cached = await async_db_manager.aget_cached_url(url)
 
             if kwargs.get("warmup", True) and not self.ready:
                 return None
@@ -117,25 +135,32 @@ class AsyncWebCrawler:
                     )
 
             crawl_result = await self.aprocess_html(
-                url,
-                html,
-                extracted_content,
-                word_count_threshold,
-                extraction_strategy,
-                chunking_strategy,
-                css_selector,
-                screenshot_data,
-                verbose,
-                bool(cached),
+                url=url,
+                html=html,
+                extracted_content=extracted_content,
+                word_count_threshold=word_count_threshold,
+                extraction_strategy=extraction_strategy,
+                chunking_strategy=chunking_strategy,
+                css_selector=css_selector,
+                screenshot=screenshot_data,
+                verbose=verbose,
+                is_cached=bool(cached),
                 async_response=async_response,
                 bypass_cache=bypass_cache,
                 **kwargs,
             )
-            crawl_result.status_code = async_response.status_code if async_response else 200
-            crawl_result.response_headers = async_response.response_headers if async_response else {}
+            
+            if async_response:
+                crawl_result.status_code = async_response.status_code
+                crawl_result.response_headers = async_response.response_headers
+            else:
+                crawl_result.status_code = 200
+                crawl_result.response_headers = cached[10]
+
             crawl_result.success = bool(html)
             crawl_result.session_id = kwargs.get("session_id", None)
             return crawl_result
+        
         except Exception as e:
             if not hasattr(e, "msg"):
                 e.msg = str(e)
@@ -155,22 +180,40 @@ class AsyncWebCrawler:
         verbose=True,
         **kwargs,
     ) -> List[CrawlResult]:
-        tasks = [
-            self.arun(
-                url,
-                word_count_threshold,
-                extraction_strategy,
-                chunking_strategy,
-                bypass_cache,
-                css_selector,
-                screenshot,
-                user_agent,
-                verbose,
-                **kwargs
-            )
-            for url in urls
-        ]
-        return await asyncio.gather(*tasks)
+        """
+        Runs the crawler for multiple sources: URLs (web, local files, or raw HTML).
+
+        Args:
+            urls (List[str]): A list of URLs with supported prefixes:
+                - 'http://' or 'https://': Web URL to crawl.
+                - 'file://': Local file path to process.
+                - 'raw:': Raw HTML content to process.
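+            Remaining parameters are forwarded unchanged to `arun` for every URL; the optional 'semaphore_count' kwarg (default 5) caps how many crawls run concurrently.
+
+        Returns:
+            List[CrawlResult]: One entry per input URL, in order. A crawl that raised an Exception is represented by str(exception) rather than a CrawlResult.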
+        """
+        semaphore_count = kwargs.get('semaphore_count', 5)  # Adjust as needed
+        semaphore = asyncio.Semaphore(semaphore_count)
+
+        async def crawl_with_semaphore(url):
+            async with semaphore:
+                return await self.arun(
+                    url,
+                    word_count_threshold=word_count_threshold,
+                    extraction_strategy=extraction_strategy,
+                    chunking_strategy=chunking_strategy,
+                    bypass_cache=bypass_cache,
+                    css_selector=css_selector,
+                    screenshot=screenshot,
+                    user_agent=user_agent,
+                    verbose=verbose,
+                    **kwargs,
+                )
+
+        tasks = [crawl_with_semaphore(url) for url in urls]
+        results = await asyncio.gather(*tasks, return_exceptions=True)
+        return [result if not isinstance(result, Exception) else str(result) for result in results]
 
     async def aprocess_html(
         self,
@@ -184,13 +227,14 @@ class AsyncWebCrawler:
         screenshot: str,
         verbose: bool,
         is_cached: bool,
+        async_response: Optional[AsyncCrawlResponse],
         **kwargs,
     ) -> CrawlResult:
         t = time.time()
         # Extract content from HTML
         try:
             t1 = time.time()
-            scrapping_strategy = WebScrappingStrategy()
+            scrapping_strategy = WebScrapingStrategy()
             # result = await scrapping_strategy.ascrap(
             result = scrapping_strategy.scrap(
                 url,
@@ -245,6 +289,12 @@ class AsyncWebCrawler:
             )
 
         screenshot = None if not screenshot else screenshot
+        
+        response_headers = "{}"  # Default value
+        if async_response:
+            # Serialize response_headers dict to JSON string
+            response_headers = json.dumps(async_response.response_headers, ensure_ascii=False)
+
 
         if not is_cached or kwargs.get("bypass_cache", False) or self.always_by_pass_cache:
             await async_db_manager.acache_url(
@@ -258,6 +308,7 @@ class AsyncWebCrawler:
                 json.dumps(links),
                 json.dumps(metadata),
                 screenshot=screenshot,
+                response_headers=response_headers,
             )
 
         return CrawlResult(
diff --git a/crawl4ai/content_cleaning_strategy.py b/crawl4ai/content_cleaning_strategy.py
index 2f052f76..b8a5053d 100644
--- a/crawl4ai/content_cleaning_strategy.py
+++ b/crawl4ai/content_cleaning_strategy.py
@@ -15,7 +15,7 @@ class ContentCleaningStrategy:
         self.link_density_threshold = 0.2
         self.max_dom_depth = 10  # To prevent excessive DOM traversal
 
-    def clean(self, clean_html: str) -> str:
+    def clean(self, clean_html: str, soup = None) -> str:
         """
         Main function that takes cleaned HTML and returns super cleaned HTML.
 
@@ -28,18 +28,20 @@ class ContentCleaningStrategy:
         try:
             if not clean_html or not isinstance(clean_html, str):
                 return ''
-            soup = BeautifulSoup(clean_html, 'html.parser')
+            if not soup:
+                # soup = BeautifulSoup(clean_html, 'html.parser')
+                soup = BeautifulSoup(clean_html, 'lxml')
             main_content = self.extract_main_content(soup)
             if main_content:
                 super_clean_element = self.clean_element(main_content)
-                return str(super_clean_element)
+                return super_clean_element.encode_contents().decode('utf-8')
             else:
                 return ''
         except Exception:
             # Handle exceptions silently or log them as needed
             return ''
 
-    def extract_main_content(self, soup: BeautifulSoup) -> Optional[Tag]:
+    def extract_main_content(self, soup) -> Optional[Tag]:
         """
         Identifies and extracts the main content element from the HTML.
 
diff --git a/crawl4ai/content_scrapping_strategy.py b/crawl4ai/content_scrapping_strategy.py
index caed7319..a2dbbd96 100644
--- a/crawl4ai/content_scrapping_strategy.py
+++ b/crawl4ai/content_scrapping_strategy.py
@@ -1,3 +1,4 @@
+import re  # Used to pre-compile the regular expressions defined below
 from abc import ABC, abstractmethod
 from typing import Dict, Any
 from bs4 import BeautifulSoup
@@ -105,7 +106,39 @@ class CustomHTML2Text(HTML2Text):
             return
         super().handle_data(data, entity_char)
 
-class ContentScrappingStrategy(ABC):
+# Pre-compile regular expressions for Open Graph and Twitter metadata
+OG_REGEX = re.compile(r'^og:')
+TWITTER_REGEX = re.compile(r'^twitter:')
+DIMENSION_REGEX = re.compile(r"(\d+)(\D*)")
+
+# Function to parse image height/width value and units
+def parse_dimension(dimension):
+    """Split a value such as '100px' into (100, 'px'); return (None, None) if it cannot be parsed."""
+    if not dimension:
+        return None, None
+    parsed = DIMENSION_REGEX.match(dimension)
+    if parsed is None:
+        return None, None
+    digits, suffix = parsed.groups()
+    return int(digits), suffix or 'px'  # a bare number is treated as pixels
+
+# Fetch image file metadata to extract size and extension
+def fetch_image_file_size(img, base_url):
+    """Return the image's Content-Length header value from a HEAD request, or None."""
+    # If src is a relative path, construct the full URL; otherwise it may be a CDN URL
+    img_url = urljoin(base_url, img.get('src'))
+    try:
+        response = requests.head(img_url)
+        if response.status_code == 200:
+            return response.headers.get('Content-Length')
+        print(f"Failed to retrieve file size for {img_url}")
+        return None
+    except requests.RequestException:
+        # Best effort: covers InvalidSchema (unsupported URL schemes) and network failures.
+        # NOTE: the former `finally: return` discarded every value returned above.
+        return None
+
+class ContentScrapingStrategy(ABC):
     @abstractmethod
     def scrap(self, url: str, html: str, **kwargs) -> Dict[str, Any]:
         pass
@@ -114,7 +147,7 @@ class ContentScrappingStrategy(ABC):
     async def ascrap(self, url: str, html: str, **kwargs) -> Dict[str, Any]:
         pass
 
-class WebScrappingStrategy(ContentScrappingStrategy):
+class WebScrapingStrategy(ContentScrapingStrategy):
     def scrap(self, url: str, html: str, **kwargs) -> Dict[str, Any]:
         return self._get_content_of_website_optimized(url, html, is_async=False, **kwargs)
 
@@ -126,9 +159,16 @@ class WebScrappingStrategy(ContentScrappingStrategy):
         if not html:
             return None
 
-        soup = BeautifulSoup(html, 'html.parser')
+        # soup = BeautifulSoup(html, 'html.parser')
+        soup = BeautifulSoup(html, 'lxml')
         body = soup.body
         
+        try:
+            meta = extract_metadata("", soup)
+        except Exception as e:
+            print('Error extracting metadata:', str(e))
+            meta = {}
+        
         
         image_description_min_word_threshold = kwargs.get('image_description_min_word_threshold', IMAGE_DESCRIPTION_MIN_WORD_THRESHOLD)
 
@@ -187,31 +227,7 @@ class WebScrappingStrategy(ContentScrappingStrategy):
 
             #Score an image for it's usefulness
             def score_image_for_usefulness(img, base_url, index, images_count):
-                # Function to parse image height/width value and units
-                def parse_dimension(dimension):
-                    if dimension:
-                        match = re.match(r"(\d+)(\D*)", dimension)
-                        if match:
-                            number = int(match.group(1))
-                            unit = match.group(2) or 'px'  # Default unit is 'px' if not specified
-                            return number, unit
-                    return None, None
 
-                # Fetch image file metadata to extract size and extension
-                def fetch_image_file_size(img, base_url):
-                    #If src is relative path construct full URL, if not it may be CDN URL
-                    img_url = urljoin(base_url,img.get('src'))
-                    try:
-                        response = requests.head(img_url)
-                        if response.status_code == 200:
-                            return response.headers.get('Content-Length',None)
-                        else:
-                            print(f"Failed to retrieve file size for {img_url}")
-                            return None
-                    except InvalidSchema as e:
-                        return None
-                    finally:
-                        return
 
                 image_height = img.get('height')
                 height_value, height_unit = parse_dimension(image_height)
@@ -294,7 +310,6 @@ class WebScrappingStrategy(ContentScrappingStrategy):
                 
                 exclude_social_media_domains = SOCIAL_MEDIA_DOMAINS + kwargs.get('exclude_social_media_domains', [])
                 exclude_social_media_domains = list(set(exclude_social_media_domains))
-
                 
                 try:
                     if element.name == 'a' and element.get('href'):
@@ -439,15 +454,7 @@ class WebScrappingStrategy(ContentScrappingStrategy):
             except Exception as e:
                 print('Error processing element:', str(e))
                 return False
-
-        #process images by filtering and extracting contextual text from the page
-        # imgs = body.find_all('img')
-        # media['images'] = [
-        #     result for result in
-        #     (process_image(img, url, i, len(imgs)) for i, img in enumerate(imgs))
-        #     if result is not None
-        # ]
-        
+       
         process_element(body)
         
         # Update the links dictionary with unique links
@@ -478,8 +485,9 @@ class WebScrappingStrategy(ContentScrappingStrategy):
                 # Replace base64 data with empty string
                 img['src'] = base64_pattern.sub('', src)
                 
+        str_body = ""
         try:
-            str(body)
+            str_body = body.encode_contents().decode('utf-8')
         except Exception as e:
             # Reset body to the original HTML
             success = False
@@ -504,11 +512,12 @@ class WebScrappingStrategy(ContentScrappingStrategy):
             
             # Append the error div to the body
             body.body.append(error_div)
+            str_body = body.encode_contents().decode('utf-8')
             
             print(f"[LOG] 😧 Error: After processing the crawled HTML and removing irrelevant tags, nothing was left in the page. Check the markdown for further details.")
 
 
-        cleaned_html = str(body).replace('\n\n', '\n').replace('  ', ' ')
+        cleaned_html = str_body.replace('\n\n', '\n').replace('  ', ' ')
 
         try:
             h = CustomHTML2Text()
@@ -518,15 +527,14 @@ class WebScrappingStrategy(ContentScrappingStrategy):
             markdown = h.handle(sanitize_html(cleaned_html))
         markdown = markdown.replace('    ```', '```')
 
-        try:
-            meta = extract_metadata(html, soup)
-        except Exception as e:
-            print('Error extracting metadata:', str(e))
-            meta = {}
+        
             
-        cleaner = ContentCleaningStrategy()
-        fit_html = cleaner.clean(cleaned_html)
-        fit_markdown = h.handle(fit_html)
+        fit_markdown = "Set flag 'fit_markdown' to True to get cleaned HTML content."
+        fit_html = "Set flag 'fit_markdown' to True to get cleaned HTML content."
+        if kwargs.get('fit_markdown', False):
+            cleaner = ContentCleaningStrategy()
+            fit_html = cleaner.clean(cleaned_html)
+            fit_markdown = h.handle(fit_html)
 
         cleaned_html = sanitize_html(cleaned_html)
         return {
diff --git a/crawl4ai/utils.py b/crawl4ai/utils.py
index d96f1ded..d8bd6992 100644
--- a/crawl4ai/utils.py
+++ b/crawl4ai/utils.py
@@ -736,46 +736,54 @@ def get_content_of_website_optimized(url: str, html: str, word_count_threshold:
         'metadata': meta
     }
 
-def extract_metadata(html, soup = None):
+def extract_metadata(html, soup=None):
     metadata = {}
     
-    if not html:
+    if not html and not soup:
+        return {}
+    
+    if not soup:
+        soup = BeautifulSoup(html, 'lxml')
+    
+    head = soup.head
+    if not head:
         return metadata
     
-    # Parse HTML content with BeautifulSoup
-    if not soup:
-        soup = BeautifulSoup(html, 'html.parser')
-
     # Title
-    title_tag = soup.find('title')
-    metadata['title'] = title_tag.string if title_tag else None
+    title_tag = head.find('title')
+    metadata['title'] = title_tag.string.strip() if title_tag and title_tag.string else None
 
     # Meta description
-    description_tag = soup.find('meta', attrs={'name': 'description'})
-    metadata['description'] = description_tag['content'] if description_tag else None
+    description_tag = head.find('meta', attrs={'name': 'description'})
+    metadata['description'] = description_tag.get('content', '').strip() if description_tag else None
 
     # Meta keywords
-    keywords_tag = soup.find('meta', attrs={'name': 'keywords'})
-    metadata['keywords'] = keywords_tag['content'] if keywords_tag else None
+    keywords_tag = head.find('meta', attrs={'name': 'keywords'})
+    metadata['keywords'] = keywords_tag.get('content', '').strip() if keywords_tag else None
 
     # Meta author
-    author_tag = soup.find('meta', attrs={'name': 'author'})
-    metadata['author'] = author_tag['content'] if author_tag else None
+    author_tag = head.find('meta', attrs={'name': 'author'})
+    metadata['author'] = author_tag.get('content', '').strip() if author_tag else None
 
     # Open Graph metadata
-    og_tags = soup.find_all('meta', attrs={'property': lambda value: value and value.startswith('og:')})
+    og_tags = head.find_all('meta', attrs={'property': re.compile(r'^og:')})
     for tag in og_tags:
-        property_name = tag['property']
-        metadata[property_name] = tag['content']
+        property_name = tag.get('property', '').strip()
+        content = tag.get('content', '').strip()
+        if property_name and content:
+            metadata[property_name] = content
 
     # Twitter Card metadata
-    twitter_tags = soup.find_all('meta', attrs={'name': lambda value: value and value.startswith('twitter:')})
+    twitter_tags = head.find_all('meta', attrs={'name': re.compile(r'^twitter:')})
     for tag in twitter_tags:
-        property_name = tag['name']
-        metadata[property_name] = tag['content']
-
+        property_name = tag.get('name', '').strip()
+        content = tag.get('content', '').strip()
+        if property_name and content:
+            metadata[property_name] = content
+    
     return metadata
 
+
 def extract_xml_tags(string):
     tags = re.findall(r'<(\w+)>', string)
     return list(set(tags))
diff --git a/crawl4ai/web_crawler.py b/crawl4ai/web_crawler.py
index 95af6c7a..c97a9cf4 100644
--- a/crawl4ai/web_crawler.py
+++ b/crawl4ai/web_crawler.py
@@ -10,7 +10,7 @@ from .extraction_strategy import *
 from .crawler_strategy import *
 from typing import List
 from concurrent.futures import ThreadPoolExecutor
-from .content_scrapping_strategy import WebScrappingStrategy
+from .content_scrapping_strategy import WebScrapingStrategy
 from .config import *
 import warnings
 import json
@@ -182,7 +182,7 @@ class WebCrawler:
             # Extract content from HTML
             try:
                 t1 = time.time()
-                scrapping_strategy = WebScrappingStrategy()
+                scrapping_strategy = WebScrapingStrategy()
                 extra_params = {k: v for k, v in kwargs.items() if k not in ["only_text", "image_description_min_word_threshold"]}
                 result = scrapping_strategy.scrap(
                     url,
diff --git a/docs/md_v2/basic/prefix-based-input.md b/docs/md_v2/basic/prefix-based-input.md
new file mode 100644
index 00000000..42987a67
--- /dev/null
+++ b/docs/md_v2/basic/prefix-based-input.md
@@ -0,0 +1,235 @@
+# Prefix-Based Input Handling in Crawl4AI
+
+This guide will walk you through using the Crawl4AI library to crawl web pages, local HTML files, and raw HTML strings. We'll demonstrate these capabilities using a Wikipedia page as an example.
+
+## Table of Contents
+- [Prefix-Based Input Handling in Crawl4AI](#prefix-based-input-handling-in-crawl4ai)
+  - [Table of Contents](#table-of-contents)
+  - [Crawling a Web URL](#crawling-a-web-url)
+  - [Crawling a Local HTML File](#crawling-a-local-html-file)
+  - [Crawling Raw HTML Content](#crawling-raw-html-content)
+  - [Complete Example](#complete-example)
+    - [**How It Works**](#how-it-works)
+    - [**Running the Example**](#running-the-example)
+  - [Conclusion](#conclusion)
+
+---
+
+
+### Crawling a Web URL
+
+To crawl a live web page, provide the URL starting with `http://` or `https://`.
+
+```python
+import asyncio
+from crawl4ai import AsyncWebCrawler
+
+async def crawl_web():
+    async with AsyncWebCrawler(verbose=True) as crawler:
+        result = await crawler.arun(url="https://en.wikipedia.org/wiki/apple", bypass_cache=True)
+        if result.success:
+            print("Markdown Content:")
+            print(result.markdown)
+        else:
+            print(f"Failed to crawl: {result.error_message}")
+
+asyncio.run(crawl_web())
+```
+
+### Crawling a Local HTML File
+
+To crawl a local HTML file, prefix the file path with `file://`.
+
+```python
+import asyncio
+from crawl4ai import AsyncWebCrawler
+
+async def crawl_local_file():
+    local_file_path = "/path/to/apple.html"  # Replace with your file path
+    file_url = f"file://{local_file_path}"
+    
+    async with AsyncWebCrawler(verbose=True) as crawler:
+        result = await crawler.arun(url=file_url, bypass_cache=True)
+        if result.success:
+            print("Markdown Content from Local File:")
+            print(result.markdown)
+        else:
+            print(f"Failed to crawl local file: {result.error_message}")
+
+asyncio.run(crawl_local_file())
+```
+
+### Crawling Raw HTML Content
+
+To crawl raw HTML content, prefix the HTML string with `raw:`.
+
+```python
+import asyncio
+from crawl4ai import AsyncWebCrawler
+
+async def crawl_raw_html():
+    raw_html = "<html><body><h1>Hello, World!</h1></body></html>"
+    raw_html_url = f"raw:{raw_html}"
+    
+    async with AsyncWebCrawler(verbose=True) as crawler:
+        result = await crawler.arun(url=raw_html_url, bypass_cache=True)
+        if result.success:
+            print("Markdown Content from Raw HTML:")
+            print(result.markdown)
+        else:
+            print(f"Failed to crawl raw HTML: {result.error_message}")
+
+asyncio.run(crawl_raw_html())
+```
+
+---
+
+## Complete Example
+
+Below is a comprehensive script that:
+1. **Crawls the Wikipedia page for "Apple".**
+2. **Saves the HTML content to a local file (`apple.html`).**
+3. **Crawls the local HTML file and verifies the markdown length matches the original crawl.**
+4. **Crawls the raw HTML content from the saved file and verifies consistency.**
+
+```python
+import os
+import sys
+import asyncio
+from pathlib import Path
+
+# Adjust the parent directory to include the crawl4ai module
+parent_dir = os.path.dirname(os.path.dirname(os.path.abspath(__file__)))
+sys.path.append(parent_dir)
+
+from crawl4ai import AsyncWebCrawler
+
+async def main():
+    # Define the URL to crawl
+    wikipedia_url = "https://en.wikipedia.org/wiki/apple"
+    
+    # Define the path to save the HTML file
+    # Save the file in the same directory as the script
+    script_dir = Path(__file__).parent
+    html_file_path = script_dir / "apple.html"
+    
+    async with AsyncWebCrawler(verbose=True) as crawler:
+        print("\n=== Step 1: Crawling the Wikipedia URL ===")
+        # Crawl the Wikipedia URL
+        result = await crawler.arun(url=wikipedia_url, bypass_cache=True)
+        
+        # Check if crawling was successful
+        if not result.success:
+            print(f"Failed to crawl {wikipedia_url}: {result.error_message}")
+            return
+        
+        # Save the HTML content to a local file
+        with open(html_file_path, 'w', encoding='utf-8') as f:
+            f.write(result.html)
+        print(f"Saved HTML content to {html_file_path}")
+        
+        # Store the length of the generated markdown
+        web_crawl_length = len(result.markdown)
+        print(f"Length of markdown from web crawl: {web_crawl_length}\n")
+        
+        print("=== Step 2: Crawling from the Local HTML File ===")
+        # Construct the file URL with 'file://' prefix
+        file_url = f"file://{html_file_path.resolve()}"
+        
+        # Crawl the local HTML file
+        local_result = await crawler.arun(url=file_url, bypass_cache=True)
+        
+        # Check if crawling was successful
+        if not local_result.success:
+            print(f"Failed to crawl local file {file_url}: {local_result.error_message}")
+            return
+        
+        # Store the length of the generated markdown from local file
+        local_crawl_length = len(local_result.markdown)
+        print(f"Length of markdown from local file crawl: {local_crawl_length}")
+        
+        # Compare the lengths
+        assert web_crawl_length == local_crawl_length, (
+            f"Markdown length mismatch: Web crawl ({web_crawl_length}) != Local file crawl ({local_crawl_length})"
+        )
+        print("✅ Markdown length matches between web crawl and local file crawl.\n")
+        
+        print("=== Step 3: Crawling Using Raw HTML Content ===")
+        # Read the HTML content from the saved file
+        with open(html_file_path, 'r', encoding='utf-8') as f:
+            raw_html_content = f.read()
+        
+        # Prefix the raw HTML content with 'raw:'
+        raw_html_url = f"raw:{raw_html_content}"
+        
+        # Crawl using the raw HTML content
+        raw_result = await crawler.arun(url=raw_html_url, bypass_cache=True)
+        
+        # Check if crawling was successful
+        if not raw_result.success:
+            print(f"Failed to crawl raw HTML content: {raw_result.error_message}")
+            return
+        
+        # Store the length of the generated markdown from raw HTML
+        raw_crawl_length = len(raw_result.markdown)
+        print(f"Length of markdown from raw HTML crawl: {raw_crawl_length}")
+        
+        # Compare the lengths
+        assert web_crawl_length == raw_crawl_length, (
+            f"Markdown length mismatch: Web crawl ({web_crawl_length}) != Raw HTML crawl ({raw_crawl_length})"
+        )
+        print("✅ Markdown length matches between web crawl and raw HTML crawl.\n")
+        
+        print("All tests passed successfully!")
+        
+    # Clean up by removing the saved HTML file
+    if html_file_path.exists():
+        os.remove(html_file_path)
+        print(f"Removed the saved HTML file: {html_file_path}")
+
+# Run the main function
+if __name__ == "__main__":
+    asyncio.run(main())
+```
+
+### **How It Works**
+
+1. **Step 1: Crawl the Web URL**
+   - Crawls `https://en.wikipedia.org/wiki/apple`.
+   - Saves the HTML content to `apple.html`.
+   - Records the length of the generated markdown.
+
+2. **Step 2: Crawl from the Local HTML File**
+   - Uses the `file://` prefix to crawl `apple.html`.
+   - Ensures the markdown length matches the original web crawl.
+
+3. **Step 3: Crawl Using Raw HTML Content**
+   - Reads the HTML from `apple.html`.
+   - Prefixes it with `raw:` and crawls.
+   - Verifies the markdown length matches the length recorded from the original web crawl.
+
+4. **Cleanup**
+   - Deletes the `apple.html` file once all steps have passed (an early return or a failed assertion leaves the file in place).
+
+### **Running the Example**
+
+1. **Save the Script:**
+   - Save the above code as `test_crawl4ai.py` in your project directory.
+
+2. **Execute the Script:**
+   - Run the script using:
+     ```bash
+     python test_crawl4ai.py
+     ```
+
+3. **Observe the Output:**
+   - The script will print logs detailing each step.
+   - Assertions ensure consistency across different crawling methods.
+   - Upon success, it confirms that all markdown lengths match.
+
+---
+
+## Conclusion
+
+With the new prefix-based input handling in **Crawl4AI**, you can effortlessly crawl web URLs, local HTML files, and raw HTML strings using a unified `url` parameter. This enhancement simplifies the API usage and provides greater flexibility for diverse crawling scenarios.
+
diff --git a/tests/async/sample_wikipedia.html b/tests/async/sample_wikipedia.html
new file mode 100644
index 00000000..a22b3e3f
--- /dev/null
+++ b/tests/async/sample_wikipedia.html
@@ -0,0 +1,2179 @@
+<!DOCTYPE html><html class="client-js vector-feature-language-in-header-enabled vector-feature-language-in-main-page-header-disabled vector-feature-sticky-header-disabled vector-feature-page-tools-pinned-disabled vector-feature-toc-pinned-clientpref-1 vector-feature-main-menu-pinned-disabled vector-feature-limited-width-clientpref-1 vector-feature-limited-width-content-enabled vector-feature-custom-font-size-clientpref-1 vector-feature-appearance-pinned-clientpref-1 vector-feature-night-mode-enabled skin-theme-clientpref-day vector-toc-available vector-animations-ready ve-available" lang="en" dir="ltr"><head>
+<meta charset="UTF-8">
+<title>Apple - Wikipedia</title>
+<script>(function(){var className="client-js vector-feature-language-in-header-enabled vector-feature-language-in-main-page-header-disabled vector-feature-sticky-header-disabled vector-feature-page-tools-pinned-disabled vector-feature-toc-pinned-clientpref-1 vector-feature-main-menu-pinned-disabled vector-feature-limited-width-clientpref-1 vector-feature-limited-width-content-enabled vector-feature-custom-font-size-clientpref-1 vector-feature-appearance-pinned-clientpref-1 vector-feature-night-mode-enabled skin-theme-clientpref-day vector-toc-available";var cookie=document.cookie.match(/(?:^|; )enwikimwclientpreferences=([^;]+)/);if(cookie){cookie[1].split('%2C').forEach(function(pref){className=className.replace(new RegExp('(^| )'+pref.replace(/-clientpref-\w+$|[^\w-]+/g,'')+'-clientpref-\\w+( |$)'),'$1'+pref+'$2');});}document.documentElement.className=className;}());RLCONF={"wgBreakFrames":false,"wgSeparatorTransformTable":["",""],"wgDigitTransformTable":["",""],"wgDefaultDateFormat":"dmy",
+"wgMonthNames":["","January","February","March","April","May","June","July","August","September","October","November","December"],"wgRequestId":"6b8a48ac-4f28-463e-9ccd-c0249a8e617a","wgCanonicalNamespace":"","wgCanonicalSpecialPageName":false,"wgNamespaceNumber":0,"wgPageName":"Apple","wgTitle":"Apple","wgCurRevisionId":1256174424,"wgRevisionId":1256174424,"wgArticleId":18978754,"wgIsArticle":true,"wgIsRedirect":false,"wgAction":"view","wgUserName":null,"wgUserGroups":["*"],"wgCategories":["CS1: long volume value","CS1 Spanish-language sources (es)","CS1 maint: bot: original URL status unknown","CS1 German-language sources (de)","Articles with short description","Short description is different from Wikidata","Wikipedia indefinitely semi-protected pages","Wikipedia indefinitely move-protected pages","Use dmy dates from September 2019","Good articles","Articles with 'species' microformats","Articles containing Old English (ca. 450-1100)-language text",
+"Articles containing Proto-Germanic-language text","Articles containing Proto-Indo-European-language text","Articles containing Middle English (1100-1500)-language text","Articles with hAudio microformats","Commons category link is on Wikidata","Taxonbars desynced from Wikidata","Taxonbars on possible non-taxon pages","Taxonbars with multiple manual Wikidata items","Taxonbars with 25–29 taxon IDs","Taxonbars with 30–34 taxon IDs","Apples","Fruit","Fruits originating in Asia","Malus","Plants described in 1768"],"wgPageViewLanguage":"en","wgPageContentLanguage":"en","wgPageContentModel":"wikitext","wgRelevantPageName":"Apple","wgRelevantArticleId":18978754,"wgIsProbablyEditable":false,"wgRelevantPageIsProbablyEditable":false,"wgRestrictionEdit":["autoconfirmed"],"wgRestrictionMove":["sysop"],"wgNoticeProject":"wikipedia","wgCiteReferencePreviewsActive":false,"wgFlaggedRevsParams":{"tags":{"status":{"levels":1}}},"wgMediaViewerOnClick":true,"wgMediaViewerEnabledByDefault":true,
+"wgPopupsFlags":0,"wgVisualEditor":{"pageLanguageCode":"en","pageLanguageDir":"ltr","pageVariantFallbacks":"en"},"wgMFDisplayWikibaseDescriptions":{"search":true,"watchlist":true,"tagline":false,"nearby":true},"wgWMESchemaEditAttemptStepOversample":false,"wgWMEPageLength":100000,"wgRelatedArticlesCompat":[],"wgCentralAuthMobileDomain":false,"wgEditSubmitButtonLabelPublish":true,"wgULSPosition":"interlanguage","wgULSisCompactLinksEnabled":false,"wgVector2022LanguageInHeader":true,"wgULSisLanguageSelectorEmpty":false,"wgWikibaseItemId":"Q89","wgCheckUserClientHintsHeadersJsApi":["architecture","bitness","brands","fullVersionList","mobile","model","platform","platformVersion"],"GEHomepageSuggestedEditsEnableTopics":true,"wgGETopicsMatchModeEnabled":false,"wgGEStructuredTaskRejectionReasonTextInputEnabled":false,"wgGELevelingUpEnabledForUser":false};RLSTATE={"ext.globalCssJs.user.styles":"ready","site.styles":"ready","user.styles":"ready","ext.globalCssJs.user":"ready","user":"ready",
+"user.options":"loading","ext.cite.styles":"ready","mediawiki.page.gallery.styles":"ready","ext.tmh.player.styles":"ready","skins.vector.search.codex.styles":"ready","skins.vector.styles":"ready","skins.vector.icons":"ready","jquery.makeCollapsible.styles":"ready","ext.wikimediamessages.styles":"ready","ext.visualEditor.desktopArticleTarget.noscript":"ready","ext.uls.interlanguage":"ready","wikibase.client.init":"ready","ext.wikimediaBadges":"ready"};RLPAGEMODULES=["ext.cite.ux-enhancements","mediawiki.page.gallery","mediawiki.page.media","ext.tmh.player","site","mediawiki.page.ready","jquery.makeCollapsible","mediawiki.toc","skins.vector.js","ext.centralNotice.geoIP","ext.centralNotice.startUp","ext.gadget.ReferenceTooltips","ext.gadget.switcher","ext.urlShortener.toolbar","ext.centralauth.centralautologin","mmv.bootstrap","ext.popups","ext.visualEditor.desktopArticleTarget.init","ext.visualEditor.targetLoader","ext.echo.centralauth","ext.eventLogging","ext.wikimediaEvents",
+"ext.navigationTiming","ext.uls.interface","ext.cx.eventlogging.campaigns","ext.cx.uls.quick.actions","wikibase.client.vector-2022","ext.checkUser.clientHints","ext.growthExperiments.SuggestedEditSession","wikibase.sidebar.tracking"];</script>
+<script>(RLQ=window.RLQ||[]).push(function(){mw.loader.impl(function(){return["user.options@12s5i",function($,jQuery,require,module){mw.user.tokens.set({"patrolToken":"+\\","watchToken":"+\\","csrfToken":"+\\"});
+}];});});</script>
+<link rel="stylesheet" href="/w/load.php?lang=en&amp;modules=ext.cite.styles%7Cext.tmh.player.styles%7Cext.uls.interlanguage%7Cext.visualEditor.desktopArticleTarget.noscript%7Cext.wikimediaBadges%7Cext.wikimediamessages.styles%7Cjquery.makeCollapsible.styles%7Cmediawiki.page.gallery.styles%7Cskins.vector.icons%2Cstyles%7Cskins.vector.search.codex.styles%7Cwikibase.client.init&amp;only=styles&amp;skin=vector-2022">
+<script async="" src="/w/load.php?lang=en&amp;modules=startup&amp;only=scripts&amp;raw=1&amp;skin=vector-2022"></script>
+<style>
+.mw-editfont-monospace{font-family:monospace,monospace}.mw-editfont-sans-serif{font-family:sans-serif}.mw-editfont-serif{font-family:serif} .mw-editfont-monospace,.mw-editfont-sans-serif,.mw-editfont-serif{  font-size:13px; -moz-tab-size:4;tab-size:4; }.mw-editfont-monospace.oo-ui-textInputWidget,.mw-editfont-sans-serif.oo-ui-textInputWidget,.mw-editfont-serif.oo-ui-textInputWidget{font-size:inherit}.mw-editfont-monospace.oo-ui-textInputWidget > .oo-ui-inputWidget-input,.mw-editfont-sans-serif.oo-ui-textInputWidget > .oo-ui-inputWidget-input,.mw-editfont-serif.oo-ui-textInputWidget > .oo-ui-inputWidget-input{  font-size:13px}.mw-editfont-monospace.oo-ui-textInputWidget > input.oo-ui-inputWidget-input,.mw-editfont-sans-serif.oo-ui-textInputWidget > input.oo-ui-inputWidget-input,.mw-editfont-serif.oo-ui-textInputWidget > input.oo-ui-inputWidget-input{min-height:32px}
+.oo-ui-icon-add,.mw-ui-icon-add:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E add %3C/title%3E%3Cpath d=%22M11 9V4H9v5H4v2h5v5h2v-5h5V9z%22/%3E%3C/svg%3E")}.oo-ui-image-invert.oo-ui-icon-add,.mw-ui-icon-add-invert:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E add %3C/title%3E%3Cg fill=%22%23fff%22%3E%3Cpath d=%22M11 9V4H9v5H4v2h5v5h2v-5h5V9z%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-image-progressive.oo-ui-icon-add,.mw-ui-icon-add-progressive:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E add %3C/title%3E%3Cg fill=%22%2336c%22%3E%3Cpath d=%22M11 9V4H9v5H4v2h5v5h2v-5h5V9z%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-icon-browser,.mw-ui-icon-browser:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E browser %3C/title%3E%3Cpath d=%22M2 2a2 2 0 0 0-2 2v12a2 2 0 0 0 2 2h16a2 2 0 0 0 2-2V4a2 2 0 0 0-2-2zm2 1.5A1.5 1.5 0 1 1 2.5 5 1.5 1.5 0 0 1 4 3.5M18 16H2V8h16z%22/%3E%3C/svg%3E")}.oo-ui-image-invert.oo-ui-icon-browser,.mw-ui-icon-browser-invert:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E browser %3C/title%3E%3Cg fill=%22%23fff%22%3E%3Cpath d=%22M2 2a2 2 0 0 0-2 2v12a2 2 0 0 0 2 2h16a2 2 0 0 0 2-2V4a2 2 0 0 0-2-2zm2 1.5A1.5 1.5 0 1 1 2.5 5 1.5 1.5 0 0 1 4 3.5M18 16H2V8h16z%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-image-progressive.oo-ui-icon-browser,.mw-ui-icon-browser-progressive:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 
20%22%3E%3Ctitle%3E browser %3C/title%3E%3Cg fill=%22%2336c%22%3E%3Cpath d=%22M2 2a2 2 0 0 0-2 2v12a2 2 0 0 0 2 2h16a2 2 0 0 0 2-2V4a2 2 0 0 0-2-2zm2 1.5A1.5 1.5 0 1 1 2.5 5 1.5 1.5 0 0 1 4 3.5M18 16H2V8h16z%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-icon-cancel,.mw-ui-icon-cancel:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E cancel %3C/title%3E%3Cpath d=%22M10 0a10 10 0 1 0 10 10A10 10 0 0 0 10 0M2 10a8 8 0 0 1 1.69-4.9L14.9 16.31A8 8 0 0 1 2 10m14.31 4.9L5.1 3.69A8 8 0 0 1 16.31 14.9%22/%3E%3C/svg%3E")}.oo-ui-image-invert.oo-ui-icon-cancel,.mw-ui-icon-cancel-invert:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E cancel %3C/title%3E%3Cg fill=%22%23fff%22%3E%3Cpath d=%22M10 0a10 10 0 1 0 10 10A10 10 0 0 0 10 0M2 10a8 8 0 0 1 1.69-4.9L14.9 16.31A8 8 0 0 1 2 10m14.31 4.9L5.1 3.69A8 8 0 0 1 16.31 14.9%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-image-progressive.oo-ui-icon-cancel,.mw-ui-icon-cancel-progressive:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E cancel %3C/title%3E%3Cg fill=%22%2336c%22%3E%3Cpath d=%22M10 0a10 10 0 1 0 10 10A10 10 0 0 0 10 0M2 10a8 8 0 0 1 1.69-4.9L14.9 16.31A8 8 0 0 1 2 10m14.31 4.9L5.1 3.69A8 8 0 0 1 16.31 14.9%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-image-destructive.oo-ui-icon-cancel,.mw-ui-icon-cancel-destructive:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E cancel %3C/title%3E%3Cg fill=%22%23d73333%22%3E%3Cpath d=%22M10 0a10 10 0 1 0 10 10A10 10 0 0 0 10 0M2 10a8 8 0 0 1 1.69-4.9L14.9 16.31A8 8 0 0 1 2 10m14.31 4.9L5.1 3.69A8 8 0 0 1 16.31 
14.9%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-icon-check,.mw-ui-icon-check:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E check %3C/title%3E%3Cpath d=%22M7 14.2 2.8 10l-1.4 1.4L7 17 19 5l-1.4-1.4z%22/%3E%3C/svg%3E")}.oo-ui-image-invert.oo-ui-icon-check,.mw-ui-icon-check-invert:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E check %3C/title%3E%3Cg fill=%22%23fff%22%3E%3Cpath d=%22M7 14.2 2.8 10l-1.4 1.4L7 17 19 5l-1.4-1.4z%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-image-progressive.oo-ui-icon-check,.mw-ui-icon-check-progressive:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E check %3C/title%3E%3Cg fill=%22%2336c%22%3E%3Cpath d=%22M7 14.2 2.8 10l-1.4 1.4L7 17 19 5l-1.4-1.4z%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-image-destructive.oo-ui-icon-check,.mw-ui-icon-check-destructive:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E check %3C/title%3E%3Cg fill=%22%23d73333%22%3E%3Cpath d=%22M7 14.2 2.8 10l-1.4 1.4L7 17 19 5l-1.4-1.4z%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-image-success.oo-ui-icon-check,.mw-ui-icon-check-success:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E check %3C/title%3E%3Cg fill=%22%2314866d%22%3E%3Cpath d=%22M7 14.2 2.8 10l-1.4 1.4L7 17 19 5l-1.4-1.4z%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-icon-checkAll,.mw-ui-icon-checkAll:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E check all %3C/title%3E%3Cpath 
d=%22m.29 12.71 1.42-1.42 2.22 2.22 8.3-10.14 1.54 1.26-9.7 11.86zM12 10h5v2h-5zm-3 4h5v2H9zm6-8h5v2h-5z%22/%3E%3C/svg%3E")}.oo-ui-image-invert.oo-ui-icon-checkAll,.mw-ui-icon-checkAll-invert:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E check all %3C/title%3E%3Cg fill=%22%23fff%22%3E%3Cpath d=%22m.29 12.71 1.42-1.42 2.22 2.22 8.3-10.14 1.54 1.26-9.7 11.86zM12 10h5v2h-5zm-3 4h5v2H9zm6-8h5v2h-5z%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-image-progressive.oo-ui-icon-checkAll,.mw-ui-icon-checkAll-progressive:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E check all %3C/title%3E%3Cg fill=%22%2336c%22%3E%3Cpath d=%22m.29 12.71 1.42-1.42 2.22 2.22 8.3-10.14 1.54 1.26-9.7 11.86zM12 10h5v2h-5zm-3 4h5v2H9zm6-8h5v2h-5z%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-icon-clear,.mw-ui-icon-clear:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E clear %3C/title%3E%3Cpath d=%22M10 0a10 10 0 1 0 10 10A10 10 0 0 0 10 0m5.66 14.24-1.41 1.41L10 11.41l-4.24 4.25-1.42-1.42L8.59 10 4.34 5.76l1.42-1.42L10 8.59l4.24-4.24 1.41 1.41L11.41 10z%22/%3E%3C/svg%3E")}.oo-ui-image-invert.oo-ui-icon-clear,.mw-ui-icon-clear-invert:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E clear %3C/title%3E%3Cg fill=%22%23fff%22%3E%3Cpath d=%22M10 0a10 10 0 1 0 10 10A10 10 0 0 0 10 0m5.66 14.24-1.41 1.41L10 11.41l-4.24 4.25-1.42-1.42L8.59 10 4.34 5.76l1.42-1.42L10 8.59l4.24-4.24 1.41 1.41L11.41 10z%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-image-progressive.oo-ui-icon-clear,.mw-ui-icon-clear-progressive:before{background-image:url("data:image/svg+xml,%3Csvg 
xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E clear %3C/title%3E%3Cg fill=%22%2336c%22%3E%3Cpath d=%22M10 0a10 10 0 1 0 10 10A10 10 0 0 0 10 0m5.66 14.24-1.41 1.41L10 11.41l-4.24 4.25-1.42-1.42L8.59 10 4.34 5.76l1.42-1.42L10 8.59l4.24-4.24 1.41 1.41L11.41 10z%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-icon-clock,.mw-ui-icon-clock:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E clock %3C/title%3E%3Cpath d=%22M10 0a10 10 0 1 0 10 10A10 10 0 0 0 10 0m2.5 14.5L9 11V4h2v6l3 3z%22/%3E%3C/svg%3E")}.oo-ui-image-invert.oo-ui-icon-clock,.mw-ui-icon-clock-invert:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E clock %3C/title%3E%3Cg fill=%22%23fff%22%3E%3Cpath d=%22M10 0a10 10 0 1 0 10 10A10 10 0 0 0 10 0m2.5 14.5L9 11V4h2v6l3 3z%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-image-progressive.oo-ui-icon-clock,.mw-ui-icon-clock-progressive:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E clock %3C/title%3E%3Cg fill=%22%2336c%22%3E%3Cpath d=%22M10 0a10 10 0 1 0 10 10A10 10 0 0 0 10 0m2.5 14.5L9 11V4h2v6l3 3z%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-icon-close,.mw-ui-icon-close:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E close %3C/title%3E%3Cpath d=%22m4.3 2.9 12.8 12.8-1.4 1.4L2.9 4.3z%22/%3E%3Cpath d=%22M17.1 4.3 4.3 17.1l-1.4-1.4L15.7 2.9z%22/%3E%3C/svg%3E")}.oo-ui-image-invert.oo-ui-icon-close,.mw-ui-icon-close-invert:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E close 
%3C/title%3E%3Cg fill=%22%23fff%22%3E%3Cpath d=%22m4.3 2.9 12.8 12.8-1.4 1.4L2.9 4.3z%22/%3E%3Cpath d=%22M17.1 4.3 4.3 17.1l-1.4-1.4L15.7 2.9z%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-image-progressive.oo-ui-icon-close,.mw-ui-icon-close-progressive:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E close %3C/title%3E%3Cg fill=%22%2336c%22%3E%3Cpath d=%22m4.3 2.9 12.8 12.8-1.4 1.4L2.9 4.3z%22/%3E%3Cpath d=%22M17.1 4.3 4.3 17.1l-1.4-1.4L15.7 2.9z%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-icon-ellipsis,.mw-ui-icon-ellipsis:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E ellipsis %3C/title%3E%3Ccircle cx=%2210%22 cy=%2210%22 r=%222%22/%3E%3Ccircle cx=%223%22 cy=%2210%22 r=%222%22/%3E%3Ccircle cx=%2217%22 cy=%2210%22 r=%222%22/%3E%3C/svg%3E")}.oo-ui-image-invert.oo-ui-icon-ellipsis,.mw-ui-icon-ellipsis-invert:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E ellipsis %3C/title%3E%3Cg fill=%22%23fff%22%3E%3Ccircle cx=%2210%22 cy=%2210%22 r=%222%22/%3E%3Ccircle cx=%223%22 cy=%2210%22 r=%222%22/%3E%3Ccircle cx=%2217%22 cy=%2210%22 r=%222%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-image-progressive.oo-ui-icon-ellipsis,.mw-ui-icon-ellipsis-progressive:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E ellipsis %3C/title%3E%3Cg fill=%22%2336c%22%3E%3Ccircle cx=%2210%22 cy=%2210%22 r=%222%22/%3E%3Ccircle cx=%223%22 cy=%2210%22 r=%222%22/%3E%3Ccircle cx=%2217%22 cy=%2210%22 r=%222%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-icon-verticalEllipsis,.mw-ui-icon-verticalEllipsis:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 
width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E vertical ellipsis %3C/title%3E%3Ccircle cx=%2210%22 cy=%2210%22 r=%222%22/%3E%3Ccircle cx=%2210%22 cy=%223%22 r=%222%22/%3E%3Ccircle cx=%2210%22 cy=%2217%22 r=%222%22/%3E%3C/svg%3E")}.oo-ui-image-invert.oo-ui-icon-verticalEllipsis,.mw-ui-icon-verticalEllipsis-invert:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E vertical ellipsis %3C/title%3E%3Cg fill=%22%23fff%22%3E%3Ccircle cx=%2210%22 cy=%2210%22 r=%222%22/%3E%3Ccircle cx=%2210%22 cy=%223%22 r=%222%22/%3E%3Ccircle cx=%2210%22 cy=%2217%22 r=%222%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-image-progressive.oo-ui-icon-verticalEllipsis,.mw-ui-icon-verticalEllipsis-progressive:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E vertical ellipsis %3C/title%3E%3Cg fill=%22%2336c%22%3E%3Ccircle cx=%2210%22 cy=%2210%22 r=%222%22/%3E%3Ccircle cx=%2210%22 cy=%223%22 r=%222%22/%3E%3Ccircle cx=%2210%22 cy=%2217%22 r=%222%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-icon-feedback,.mw-ui-icon-feedback:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E feedback %3C/title%3E%3Cpath d=%22M19 16 2 12a3.83 3.83 0 0 1-1-2.5A3.83 3.83 0 0 1 2 7l17-4z%22/%3E%3Crect width=%224%22 height=%228%22 x=%224%22 y=%229%22 rx=%222%22/%3E%3C/svg%3E")}.oo-ui-image-invert.oo-ui-icon-feedback,.mw-ui-icon-feedback-invert:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E feedback %3C/title%3E%3Cg fill=%22%23fff%22%3E%3Cpath d=%22M19 16 2 12a3.83 3.83 0 0 1-1-2.5A3.83 3.83 0 0 1 2 7l17-4z%22/%3E%3Crect width=%224%22 height=%228%22 x=%224%22 y=%229%22 
rx=%222%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-image-progressive.oo-ui-icon-feedback,.mw-ui-icon-feedback-progressive:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E feedback %3C/title%3E%3Cg fill=%22%2336c%22%3E%3Cpath d=%22M19 16 2 12a3.83 3.83 0 0 1-1-2.5A3.83 3.83 0 0 1 2 7l17-4z%22/%3E%3Crect width=%224%22 height=%228%22 x=%224%22 y=%229%22 rx=%222%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-icon-funnel,.mw-ui-icon-funnel:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E funnel %3C/title%3E%3Cpath d=%22M10 13 1 1h18z%22/%3E%3Cpath d=%22M8 9v8l4 2V9z%22/%3E%3C/svg%3E")}.oo-ui-image-invert.oo-ui-icon-funnel,.mw-ui-icon-funnel-invert:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E funnel %3C/title%3E%3Cg fill=%22%23fff%22%3E%3Cpath d=%22M10 13 1 1h18z%22/%3E%3Cpath d=%22M8 9v8l4 2V9z%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-image-progressive.oo-ui-icon-funnel,.mw-ui-icon-funnel-progressive:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E funnel %3C/title%3E%3Cg fill=%22%2336c%22%3E%3Cpath d=%22M10 13 1 1h18z%22/%3E%3Cpath d=%22M8 9v8l4 2V9z%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-image-destructive.oo-ui-icon-funnel,.mw-ui-icon-funnel-destructive:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E funnel %3C/title%3E%3Cg fill=%22%23d73333%22%3E%3Cpath d=%22M10 13 1 1h18z%22/%3E%3Cpath d=%22M8 9v8l4 2V9z%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-icon-hand,.mw-ui-icon-hand:before{background-image:url("data:image/svg+xml,%3Csvg 
xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E hand %3C/title%3E%3Cpath d=%22M18 4.6V17c0 1.9-.5 3-2.4 3H9.5c-.9 0-1.8-.4-2.4-1l-4.6-5-.5-1c0-1 .5-1 .5-1 .3 0 .6 0 1 .2L7 14V3.3C7 2.6 7.3 2 8 2c.6 0 1 .7 1 1.4V9h1V1.2c0-.6.3-1.2 1-1.2s1 .6 1 1.3V9h1V2c0-.7.3-1.3 1-1.3s1 .6 1 1.3v7h1V4.6c0-.7.3-1.3 1-1.3s1 .6 1 1.3%22/%3E%3C/svg%3E")}.oo-ui-image-invert.oo-ui-icon-hand,.mw-ui-icon-hand-invert:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E hand %3C/title%3E%3Cg fill=%22%23fff%22%3E%3Cpath d=%22M18 4.6V17c0 1.9-.5 3-2.4 3H9.5c-.9 0-1.8-.4-2.4-1l-4.6-5-.5-1c0-1 .5-1 .5-1 .3 0 .6 0 1 .2L7 14V3.3C7 2.6 7.3 2 8 2c.6 0 1 .7 1 1.4V9h1V1.2c0-.6.3-1.2 1-1.2s1 .6 1 1.3V9h1V2c0-.7.3-1.3 1-1.3s1 .6 1 1.3v7h1V4.6c0-.7.3-1.3 1-1.3s1 .6 1 1.3%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-image-progressive.oo-ui-icon-hand,.mw-ui-icon-hand-progressive:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E hand %3C/title%3E%3Cg fill=%22%2336c%22%3E%3Cpath d=%22M18 4.6V17c0 1.9-.5 3-2.4 3H9.5c-.9 0-1.8-.4-2.4-1l-4.6-5-.5-1c0-1 .5-1 .5-1 .3 0 .6 0 1 .2L7 14V3.3C7 2.6 7.3 2 8 2c.6 0 1 .7 1 1.4V9h1V1.2c0-.6.3-1.2 1-1.2s1 .6 1 1.3V9h1V2c0-.7.3-1.3 1-1.3s1 .6 1 1.3v7h1V4.6c0-.7.3-1.3 1-1.3s1 .6 1 1.3%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-image-destructive.oo-ui-icon-hand,.mw-ui-icon-hand-destructive:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E hand %3C/title%3E%3Cg fill=%22%23d73333%22%3E%3Cpath d=%22M18 4.6V17c0 1.9-.5 3-2.4 3H9.5c-.9 0-1.8-.4-2.4-1l-4.6-5-.5-1c0-1 .5-1 .5-1 .3 0 .6 0 1 .2L7 14V3.3C7 2.6 7.3 2 8 2c.6 0 1 .7 1 1.4V9h1V1.2c0-.6.3-1.2 1-1.2s1 .6 1 1.3V9h1V2c0-.7.3-1.3 1-1.3s1 .6 1 
1.3v7h1V4.6c0-.7.3-1.3 1-1.3s1 .6 1 1.3%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-icon-heart,.mw-ui-icon-heart:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E heart %3C/title%3E%3Cpath d=%22M14.75 1A5.24 5.24 0 0 0 10 4 5.24 5.24 0 0 0 0 6.25C0 11.75 10 19 10 19s10-7.25 10-12.75A5.25 5.25 0 0 0 14.75 1%22/%3E%3C/svg%3E")}.oo-ui-image-invert.oo-ui-icon-heart,.mw-ui-icon-heart-invert:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E heart %3C/title%3E%3Cg fill=%22%23fff%22%3E%3Cpath d=%22M14.75 1A5.24 5.24 0 0 0 10 4 5.24 5.24 0 0 0 0 6.25C0 11.75 10 19 10 19s10-7.25 10-12.75A5.25 5.25 0 0 0 14.75 1%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-image-progressive.oo-ui-icon-heart,.mw-ui-icon-heart-progressive:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E heart %3C/title%3E%3Cg fill=%22%2336c%22%3E%3Cpath d=%22M14.75 1A5.24 5.24 0 0 0 10 4 5.24 5.24 0 0 0 0 6.25C0 11.75 10 19 10 19s10-7.25 10-12.75A5.25 5.25 0 0 0 14.75 1%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-icon-help,.mw-ui-icon-help:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E help %3C/title%3E%3Cpath d=%22M10.06 1C13 1 15 2.89 15 5.53a4.59 4.59 0 0 1-2.29 4.08c-1.42.92-1.82 1.53-1.82 2.71V13H8.38v-.81a3.84 3.84 0 0 1 2-3.84c1.34-.9 1.79-1.53 1.79-2.71a2.1 2.1 0 0 0-2.08-2.14h-.17a2.3 2.3 0 0 0-2.38 2.22v.17H5A4.71 4.71 0 0 1 9.51 1a5 5 0 0 1 .55 0%22/%3E%3Ccircle cx=%2210%22 cy=%2217%22 r=%222%22/%3E%3C/svg%3E")}.oo-ui-image-invert.oo-ui-icon-help,.mw-ui-icon-help-invert:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 
height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E help %3C/title%3E%3Cg fill=%22%23fff%22%3E%3Cpath d=%22M10.06 1C13 1 15 2.89 15 5.53a4.59 4.59 0 0 1-2.29 4.08c-1.42.92-1.82 1.53-1.82 2.71V13H8.38v-.81a3.84 3.84 0 0 1 2-3.84c1.34-.9 1.79-1.53 1.79-2.71a2.1 2.1 0 0 0-2.08-2.14h-.17a2.3 2.3 0 0 0-2.38 2.22v.17H5A4.71 4.71 0 0 1 9.51 1a5 5 0 0 1 .55 0%22/%3E%3Ccircle cx=%2210%22 cy=%2217%22 r=%222%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-image-progressive.oo-ui-icon-help,.mw-ui-icon-help-progressive:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E help %3C/title%3E%3Cg fill=%22%2336c%22%3E%3Cpath d=%22M10.06 1C13 1 15 2.89 15 5.53a4.59 4.59 0 0 1-2.29 4.08c-1.42.92-1.82 1.53-1.82 2.71V13H8.38v-.81a3.84 3.84 0 0 1 2-3.84c1.34-.9 1.79-1.53 1.79-2.71a2.1 2.1 0 0 0-2.08-2.14h-.17a2.3 2.3 0 0 0-2.38 2.22v.17H5A4.71 4.71 0 0 1 9.51 1a5 5 0 0 1 .55 0%22/%3E%3Ccircle cx=%2210%22 cy=%2217%22 r=%222%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-icon-helpNotice,.mw-ui-icon-helpNotice:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E help %3C/title%3E%3Cpath d=%22M10 0a10 10 0 1 0 10 10A10 10 0 0 0 10 0m1 16H9v-2h2zm2.71-7.6a2.6 2.6 0 0 1-.33.74 3.2 3.2 0 0 1-.48.55l-.54.48c-.21.18-.41.35-.58.52a2.5 2.5 0 0 0-.47.56A2.3 2.3 0 0 0 11 12a3.8 3.8 0 0 0-.11 1H9.08a9 9 0 0 1 .07-1.25 3.3 3.3 0 0 1 .25-.9 2.8 2.8 0 0 1 .41-.67 4 4 0 0 1 .58-.58c.17-.16.34-.3.51-.44a3 3 0 0 0 .43-.44 1.8 1.8 0 0 0 .3-.55 2 2 0 0 0 .11-.72 2.1 2.1 0 0 0-.17-.86 1.7 1.7 0 0 0-1-.9 1.7 1.7 0 0 0-.5-.1 1.77 1.77 0 0 0-1.53.68 3 3 0 0 0-.5 1.82H6.16a4.7 4.7 0 0 1 .28-1.68 3.6 3.6 0 0 1 .8-1.29 3.9 3.9 0 0 1 1.28-.83A4.6 4.6 0 0 1 10.18 4a4.4 4.4 0 0 1 1.44.23 3.5 3.5 0 0 1 1.15.65 3.1 3.1 0 0 1 .78 1.06 3.5 3.5 0 0 1 .29 1.45 3.4 3.4 0 0 1-.13 
1.01%22/%3E%3C/svg%3E")}.oo-ui-image-invert.oo-ui-icon-helpNotice,.mw-ui-icon-helpNotice-invert:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E help %3C/title%3E%3Cg fill=%22%23fff%22%3E%3Cpath d=%22M10 0a10 10 0 1 0 10 10A10 10 0 0 0 10 0m1 16H9v-2h2zm2.71-7.6a2.6 2.6 0 0 1-.33.74 3.2 3.2 0 0 1-.48.55l-.54.48c-.21.18-.41.35-.58.52a2.5 2.5 0 0 0-.47.56A2.3 2.3 0 0 0 11 12a3.8 3.8 0 0 0-.11 1H9.08a9 9 0 0 1 .07-1.25 3.3 3.3 0 0 1 .25-.9 2.8 2.8 0 0 1 .41-.67 4 4 0 0 1 .58-.58c.17-.16.34-.3.51-.44a3 3 0 0 0 .43-.44 1.8 1.8 0 0 0 .3-.55 2 2 0 0 0 .11-.72 2.1 2.1 0 0 0-.17-.86 1.7 1.7 0 0 0-1-.9 1.7 1.7 0 0 0-.5-.1 1.77 1.77 0 0 0-1.53.68 3 3 0 0 0-.5 1.82H6.16a4.7 4.7 0 0 1 .28-1.68 3.6 3.6 0 0 1 .8-1.29 3.9 3.9 0 0 1 1.28-.83A4.6 4.6 0 0 1 10.18 4a4.4 4.4 0 0 1 1.44.23 3.5 3.5 0 0 1 1.15.65 3.1 3.1 0 0 1 .78 1.06 3.5 3.5 0 0 1 .29 1.45 3.4 3.4 0 0 1-.13 1.01%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-image-progressive.oo-ui-icon-helpNotice,.mw-ui-icon-helpNotice-progressive:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E help %3C/title%3E%3Cg fill=%22%2336c%22%3E%3Cpath d=%22M10 0a10 10 0 1 0 10 10A10 10 0 0 0 10 0m1 16H9v-2h2zm2.71-7.6a2.6 2.6 0 0 1-.33.74 3.2 3.2 0 0 1-.48.55l-.54.48c-.21.18-.41.35-.58.52a2.5 2.5 0 0 0-.47.56A2.3 2.3 0 0 0 11 12a3.8 3.8 0 0 0-.11 1H9.08a9 9 0 0 1 .07-1.25 3.3 3.3 0 0 1 .25-.9 2.8 2.8 0 0 1 .41-.67 4 4 0 0 1 .58-.58c.17-.16.34-.3.51-.44a3 3 0 0 0 .43-.44 1.8 1.8 0 0 0 .3-.55 2 2 0 0 0 .11-.72 2.1 2.1 0 0 0-.17-.86 1.7 1.7 0 0 0-1-.9 1.7 1.7 0 0 0-.5-.1 1.77 1.77 0 0 0-1.53.68 3 3 0 0 0-.5 1.82H6.16a4.7 4.7 0 0 1 .28-1.68 3.6 3.6 0 0 1 .8-1.29 3.9 3.9 0 0 1 1.28-.83A4.6 4.6 0 0 1 10.18 4a4.4 4.4 0 0 1 1.44.23 3.5 3.5 0 0 1 1.15.65 3.1 3.1 0 0 1 .78 1.06 3.5 3.5 0 0 1 .29 1.45 3.4 3.4 0 0 1-.13 
1.01%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-icon-home,.mw-ui-icon-home:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E home %3C/title%3E%3Cpath d=%22M10 1 0 10h3v9h4v-4.6c0-1.47 1.31-2.66 3-2.66s3 1.19 3 2.66V19h4v-9h3z%22/%3E%3C/svg%3E")}.oo-ui-image-invert.oo-ui-icon-home,.mw-ui-icon-home-invert:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E home %3C/title%3E%3Cg fill=%22%23fff%22%3E%3Cpath d=%22M10 1 0 10h3v9h4v-4.6c0-1.47 1.31-2.66 3-2.66s3 1.19 3 2.66V19h4v-9h3z%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-image-progressive.oo-ui-icon-home,.mw-ui-icon-home-progressive:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E home %3C/title%3E%3Cg fill=%22%2336c%22%3E%3Cpath d=%22M10 1 0 10h3v9h4v-4.6c0-1.47 1.31-2.66 3-2.66s3 1.19 3 2.66V19h4v-9h3z%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-icon-key,.mw-ui-icon-key:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E key %3C/title%3E%3Cpath d=%22M15 6a1.54 1.54 0 0 1-1.5-1.5 1.5 1.5 0 0 1 3 0A1.54 1.54 0 0 1 15 6m-1.5-5A5.55 5.55 0 0 0 8 6.5a6.8 6.8 0 0 0 .7 2.8L1 17v2h4v-2h2v-2h2l3.2-3.2a6 6 0 0 0 1.3.2A5.55 5.55 0 0 0 19 6.5 5.55 5.55 0 0 0 13.5 1%22/%3E%3C/svg%3E")}.oo-ui-image-invert.oo-ui-icon-key,.mw-ui-icon-key-invert:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E key %3C/title%3E%3Cg fill=%22%23fff%22%3E%3Cpath d=%22M15 6a1.54 1.54 0 0 1-1.5-1.5 1.5 1.5 0 0 1 3 0A1.54 1.54 0 0 1 15 6m-1.5-5A5.55 5.55 0 0 0 8 6.5a6.8 6.8 0 0 0 .7 2.8L1 17v2h4v-2h2v-2h2l3.2-3.2a6 6 0 0 0 
1.3.2A5.55 5.55 0 0 0 19 6.5 5.55 5.55 0 0 0 13.5 1%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-image-progressive.oo-ui-icon-key,.mw-ui-icon-key-progressive:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E key %3C/title%3E%3Cg fill=%22%2336c%22%3E%3Cpath d=%22M15 6a1.54 1.54 0 0 1-1.5-1.5 1.5 1.5 0 0 1 3 0A1.54 1.54 0 0 1 15 6m-1.5-5A5.55 5.55 0 0 0 8 6.5a6.8 6.8 0 0 0 .7 2.8L1 17v2h4v-2h2v-2h2l3.2-3.2a6 6 0 0 0 1.3.2A5.55 5.55 0 0 0 19 6.5 5.55 5.55 0 0 0 13.5 1%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-icon-keyboard,.mw-ui-icon-keyboard:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E keyboard %3C/title%3E%3Cpath d=%22M0 15a2 2 0 0 0 2 2h16a2 2 0 0 0 2-2V5a2 2 0 0 0-2-2H2a2 2 0 0 0-2 2zm9-9h2v2H9zm0 3h2v2H9zM6 6h2v2H6zm0 3h2v2H6zm-1 5H3v-2h2zm0-3H3V9h2zm0-3H3V6h2zm9 6H6v-2h8zm0-3h-2V9h2zm0-3h-2V6h2zm3 6h-2v-2h2zm0-3h-2V9h2zm0-3h-2V6h2z%22/%3E%3C/svg%3E")}.oo-ui-image-invert.oo-ui-icon-keyboard,.mw-ui-icon-keyboard-invert:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E keyboard %3C/title%3E%3Cg fill=%22%23fff%22%3E%3Cpath d=%22M0 15a2 2 0 0 0 2 2h16a2 2 0 0 0 2-2V5a2 2 0 0 0-2-2H2a2 2 0 0 0-2 2zm9-9h2v2H9zm0 3h2v2H9zM6 6h2v2H6zm0 3h2v2H6zm-1 5H3v-2h2zm0-3H3V9h2zm0-3H3V6h2zm9 6H6v-2h8zm0-3h-2V9h2zm0-3h-2V6h2zm3 6h-2v-2h2zm0-3h-2V9h2zm0-3h-2V6h2z%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-image-progressive.oo-ui-icon-keyboard,.mw-ui-icon-keyboard-progressive:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E keyboard %3C/title%3E%3Cg fill=%22%2336c%22%3E%3Cpath d=%22M0 15a2 2 0 0 0 2 2h16a2 2 0 0 0 2-2V5a2 2 0 0 0-2-2H2a2 2 0 0 0-2 
2zm9-9h2v2H9zm0 3h2v2H9zM6 6h2v2H6zm0 3h2v2H6zm-1 5H3v-2h2zm0-3H3V9h2zm0-3H3V6h2zm9 6H6v-2h8zm0-3h-2V9h2zm0-3h-2V6h2zm3 6h-2v-2h2zm0-3h-2V9h2zm0-3h-2V6h2z%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-icon-lightbulb,.mw-ui-icon-lightbulb:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E lightbulb %3C/title%3E%3Cpath d=%22M8 19a1 1 0 0 0 1 1h2a1 1 0 0 0 1-1v-1H8zm9-12a7 7 0 1 0-12 4.9S7 14 7 15v1a1 1 0 0 0 1 1h4a1 1 0 0 0 1-1v-1c0-1 2-3.1 2-3.1A7 7 0 0 0 17 7%22/%3E%3C/svg%3E")}.oo-ui-image-invert.oo-ui-icon-lightbulb,.mw-ui-icon-lightbulb-invert:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E lightbulb %3C/title%3E%3Cg fill=%22%23fff%22%3E%3Cpath d=%22M8 19a1 1 0 0 0 1 1h2a1 1 0 0 0 1-1v-1H8zm9-12a7 7 0 1 0-12 4.9S7 14 7 15v1a1 1 0 0 0 1 1h4a1 1 0 0 0 1-1v-1c0-1 2-3.1 2-3.1A7 7 0 0 0 17 7%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-image-progressive.oo-ui-icon-lightbulb,.mw-ui-icon-lightbulb-progressive:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E lightbulb %3C/title%3E%3Cg fill=%22%2336c%22%3E%3Cpath d=%22M8 19a1 1 0 0 0 1 1h2a1 1 0 0 0 1-1v-1H8zm9-12a7 7 0 1 0-12 4.9S7 14 7 15v1a1 1 0 0 0 1 1h4a1 1 0 0 0 1-1v-1c0-1 2-3.1 2-3.1A7 7 0 0 0 17 7%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-icon-logIn,.mw-ui-icon-logIn:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E log in %3C/title%3E%3Cpath d=%22M1 11v6c0 1.1.9 2 2 2h14c1.1 0 2-.9 2-2V3c0-1.1-.9-2-2-2H3c-1.1 0-2 .9-2 2v6h8V5l4.75 5L9 15v-4z%22/%3E%3C/svg%3E")}.oo-ui-image-invert.oo-ui-icon-logIn,.mw-ui-icon-logIn-invert:before{background-image:url("data:image/svg+xml,%3Csvg 
xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E log in %3C/title%3E%3Cg fill=%22%23fff%22%3E%3Cpath d=%22M1 11v6c0 1.1.9 2 2 2h14c1.1 0 2-.9 2-2V3c0-1.1-.9-2-2-2H3c-1.1 0-2 .9-2 2v6h8V5l4.75 5L9 15v-4z%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-image-progressive.oo-ui-icon-logIn,.mw-ui-icon-logIn-progressive:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E log in %3C/title%3E%3Cg fill=%22%2336c%22%3E%3Cpath d=%22M1 11v6c0 1.1.9 2 2 2h14c1.1 0 2-.9 2-2V3c0-1.1-.9-2-2-2H3c-1.1 0-2 .9-2 2v6h8V5l4.75 5L9 15v-4z%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-icon-logOut,.mw-ui-icon-logOut:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E log out %3C/title%3E%3Cpath d=%22M3 3h8V1H3a2 2 0 0 0-2 2v14a2 2 0 0 0 2 2h8v-2H3z%22/%3E%3Cpath d=%22M13 5v4H5v2h8v4l6-5z%22/%3E%3C/svg%3E")}.oo-ui-image-invert.oo-ui-icon-logOut,.mw-ui-icon-logOut-invert:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E log out %3C/title%3E%3Cg fill=%22%23fff%22%3E%3Cpath d=%22M3 3h8V1H3a2 2 0 0 0-2 2v14a2 2 0 0 0 2 2h8v-2H3z%22/%3E%3Cpath d=%22M13 5v4H5v2h8v4l6-5z%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-image-progressive.oo-ui-icon-logOut,.mw-ui-icon-logOut-progressive:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E log out %3C/title%3E%3Cg fill=%22%2336c%22%3E%3Cpath d=%22M3 3h8V1H3a2 2 0 0 0-2 2v14a2 2 0 0 0 2 2h8v-2H3z%22/%3E%3Cpath d=%22M13 5v4H5v2h8v4l6-5z%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-icon-network,.mw-ui-icon-network:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 
width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E network %3C/title%3E%3Ccircle cx=%2210%22 cy=%2215%22 r=%222%22/%3E%3Cpath d=%22M1 7.4a12 13 0 0 1 18 0l-1.5 1.4a10 11.1 0 0 0-15 0zm3.7 3.2a7 7.3 0 0 1 10.7 0L14 12a5 5.3 0 0 0-7.8 0z%22/%3E%3C/svg%3E")}.oo-ui-image-invert.oo-ui-icon-network,.mw-ui-icon-network-invert:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E network %3C/title%3E%3Cg fill=%22%23fff%22%3E%3Ccircle cx=%2210%22 cy=%2215%22 r=%222%22/%3E%3Cpath d=%22M1 7.4a12 13 0 0 1 18 0l-1.5 1.4a10 11.1 0 0 0-15 0zm3.7 3.2a7 7.3 0 0 1 10.7 0L14 12a5 5.3 0 0 0-7.8 0z%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-image-progressive.oo-ui-icon-network,.mw-ui-icon-network-progressive:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E network %3C/title%3E%3Cg fill=%22%2336c%22%3E%3Ccircle cx=%2210%22 cy=%2215%22 r=%222%22/%3E%3Cpath d=%22M1 7.4a12 13 0 0 1 18 0l-1.5 1.4a10 11.1 0 0 0-15 0zm3.7 3.2a7 7.3 0 0 1 10.7 0L14 12a5 5.3 0 0 0-7.8 0z%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-icon-networkOff,.mw-ui-icon-networkOff:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E network off %3C/title%3E%3Ccircle cx=%2210%22 cy=%2216%22 r=%222%22/%3E%3Cpath d=%22M16.4 11.6A7.1 7.1 0 0 0 12 9.1l3.4 3.4zM19 8.4A12.2 14 0 0 0 8.2 4.2L10 6a9.9 9.9 0 0 1 7.4 3.7zM3.5 2 2 3.4l2.2 2.2A13.1 13.1 0 0 0 1 8.4l1.5 1.3a10.7 10.7 0 0 1 3.2-2.6L8 9.3a7.3 7.3 0 0 0-3.3 2.3L6.1 13a5.2 5.2 0 0 1 3.6-2l6.8 7 1.5-1.5z%22/%3E%3C/svg%3E")}.oo-ui-image-invert.oo-ui-icon-networkOff,.mw-ui-icon-networkOff-invert:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 
20%22%3E%3Ctitle%3E network off %3C/title%3E%3Cg fill=%22%23fff%22%3E%3Ccircle cx=%2210%22 cy=%2216%22 r=%222%22/%3E%3Cpath d=%22M16.4 11.6A7.1 7.1 0 0 0 12 9.1l3.4 3.4zM19 8.4A12.2 14 0 0 0 8.2 4.2L10 6a9.9 9.9 0 0 1 7.4 3.7zM3.5 2 2 3.4l2.2 2.2A13.1 13.1 0 0 0 1 8.4l1.5 1.3a10.7 10.7 0 0 1 3.2-2.6L8 9.3a7.3 7.3 0 0 0-3.3 2.3L6.1 13a5.2 5.2 0 0 1 3.6-2l6.8 7 1.5-1.5z%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-image-progressive.oo-ui-icon-networkOff,.mw-ui-icon-networkOff-progressive:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E network off %3C/title%3E%3Cg fill=%22%2336c%22%3E%3Ccircle cx=%2210%22 cy=%2216%22 r=%222%22/%3E%3Cpath d=%22M16.4 11.6A7.1 7.1 0 0 0 12 9.1l3.4 3.4zM19 8.4A12.2 14 0 0 0 8.2 4.2L10 6a9.9 9.9 0 0 1 7.4 3.7zM3.5 2 2 3.4l2.2 2.2A13.1 13.1 0 0 0 1 8.4l1.5 1.3a10.7 10.7 0 0 1 3.2-2.6L8 9.3a7.3 7.3 0 0 0-3.3 2.3L6.1 13a5.2 5.2 0 0 1 3.6-2l6.8 7 1.5-1.5z%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-icon-newWindow,.mw-ui-icon-newWindow:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E new window %3C/title%3E%3Cpath d=%22M17 17H3V3h5V1H3a2 2 0 0 0-2 2v14a2 2 0 0 0 2 2h14a2 2 0 0 0 2-2v-5h-2z%22/%3E%3Cpath d=%22m11 1 3.3 3.3L8.6 10l1.4 1.4 5.7-5.7L19 9V1z%22/%3E%3C/svg%3E")}.oo-ui-image-invert.oo-ui-icon-newWindow,.mw-ui-icon-newWindow-invert:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E new window %3C/title%3E%3Cg fill=%22%23fff%22%3E%3Cpath d=%22M17 17H3V3h5V1H3a2 2 0 0 0-2 2v14a2 2 0 0 0 2 2h14a2 2 0 0 0 2-2v-5h-2z%22/%3E%3Cpath d=%22m11 1 3.3 3.3L8.6 10l1.4 1.4 5.7-5.7L19 
9V1z%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-image-progressive.oo-ui-icon-newWindow,.mw-ui-icon-newWindow-progressive:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E new window %3C/title%3E%3Cg fill=%22%2336c%22%3E%3Cpath d=%22M17 17H3V3h5V1H3a2 2 0 0 0-2 2v14a2 2 0 0 0 2 2h14a2 2 0 0 0 2-2v-5h-2z%22/%3E%3Cpath d=%22m11 1 3.3 3.3L8.6 10l1.4 1.4 5.7-5.7L19 9V1z%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-icon-pageSettings,.mw-ui-icon-pageSettings:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E page settings %3C/title%3E%3Ccircle cx=%2210%22 cy=%2210%22 r=%221.75%22/%3E%3Cpath d=%22M15 1H5a2 2 0 0 0-2 2v14a2 2 0 0 0 2 2h10a2 2 0 0 0 2-2V3a2 2 0 0 0-2-2m0 9.75-1.37.25a3.7 3.7 0 0 1-.38.93l.82 1.07L13 14.07l-1.12-.82a3.7 3.7 0 0 1-.93.38l-.2 1.37h-1.5L9 13.63a3.7 3.7 0 0 1-.93-.38L7 14.07 5.93 13l.82-1.12a3.7 3.7 0 0 1-.38-.88L5 10.75v-1.5L6.37 9a3.7 3.7 0 0 1 .38-.93L5.93 7 7 5.93l1.12.82A3.7 3.7 0 0 1 9 6.37L9.25 5h1.5L11 6.37a3.7 3.7 0 0 1 .93.38L13 5.93 14.07 7l-.82 1.12a3.7 3.7 0 0 1 .38.93l1.37.2z%22/%3E%3C/svg%3E")}.oo-ui-image-invert.oo-ui-icon-pageSettings,.mw-ui-icon-pageSettings-invert:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E page settings %3C/title%3E%3Cg fill=%22%23fff%22%3E%3Ccircle cx=%2210%22 cy=%2210%22 r=%221.75%22/%3E%3Cpath d=%22M15 1H5a2 2 0 0 0-2 2v14a2 2 0 0 0 2 2h10a2 2 0 0 0 2-2V3a2 2 0 0 0-2-2m0 9.75-1.37.25a3.7 3.7 0 0 1-.38.93l.82 1.07L13 14.07l-1.12-.82a3.7 3.7 0 0 1-.93.38l-.2 1.37h-1.5L9 13.63a3.7 3.7 0 0 1-.93-.38L7 14.07 5.93 13l.82-1.12a3.7 3.7 0 0 1-.38-.88L5 10.75v-1.5L6.37 9a3.7 3.7 0 0 1 .38-.93L5.93 7 7 5.93l1.12.82A3.7 3.7 0 0 1 9 6.37L9.25 5h1.5L11 6.37a3.7 3.7 0 0 1 .93.38L13 5.93 14.07 7l-.82 
1.12a3.7 3.7 0 0 1 .38.93l1.37.2z%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-image-progressive.oo-ui-icon-pageSettings,.mw-ui-icon-pageSettings-progressive:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E page settings %3C/title%3E%3Cg fill=%22%2336c%22%3E%3Ccircle cx=%2210%22 cy=%2210%22 r=%221.75%22/%3E%3Cpath d=%22M15 1H5a2 2 0 0 0-2 2v14a2 2 0 0 0 2 2h10a2 2 0 0 0 2-2V3a2 2 0 0 0-2-2m0 9.75-1.37.25a3.7 3.7 0 0 1-.38.93l.82 1.07L13 14.07l-1.12-.82a3.7 3.7 0 0 1-.93.38l-.2 1.37h-1.5L9 13.63a3.7 3.7 0 0 1-.93-.38L7 14.07 5.93 13l.82-1.12a3.7 3.7 0 0 1-.38-.88L5 10.75v-1.5L6.37 9a3.7 3.7 0 0 1 .38-.93L5.93 7 7 5.93l1.12.82A3.7 3.7 0 0 1 9 6.37L9.25 5h1.5L11 6.37a3.7 3.7 0 0 1 .93.38L13 5.93 14.07 7l-.82 1.12a3.7 3.7 0 0 1 .38.93l1.37.2z%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-icon-printer,.mw-ui-icon-printer:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E printer %3C/title%3E%3Cpath d=%22M5 1h10v4H5zM3 6a2 2 0 0 0-2 2v7h4v4h10v-4h4V8a2 2 0 0 0-2-2zm11 12H6v-6h8zm2-8a1 1 0 1 1 1-1 1 1 0 0 1-1 1%22/%3E%3C/svg%3E")}.oo-ui-image-invert.oo-ui-icon-printer,.mw-ui-icon-printer-invert:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E printer %3C/title%3E%3Cg fill=%22%23fff%22%3E%3Cpath d=%22M5 1h10v4H5zM3 6a2 2 0 0 0-2 2v7h4v4h10v-4h4V8a2 2 0 0 0-2-2zm11 12H6v-6h8zm2-8a1 1 0 1 1 1-1 1 1 0 0 1-1 1%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-image-progressive.oo-ui-icon-printer,.mw-ui-icon-printer-progressive:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E printer %3C/title%3E%3Cg fill=%22%2336c%22%3E%3Cpath d=%22M5 1h10v4H5zM3 6a2 2 0 0 0-2 
2v7h4v4h10v-4h4V8a2 2 0 0 0-2-2zm11 12H6v-6h8zm2-8a1 1 0 1 1 1-1 1 1 0 0 1-1 1%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-icon-reload,.mw-ui-icon-reload:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E reload %3C/title%3E%3Cpath d=%22M15.65 4.35A8 8 0 1 0 17.4 13h-2.22a6 6 0 1 1-1-7.22L11 9h7V2z%22/%3E%3C/svg%3E")}.oo-ui-image-invert.oo-ui-icon-reload,.mw-ui-icon-reload-invert:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E reload %3C/title%3E%3Cg fill=%22%23fff%22%3E%3Cpath d=%22M15.65 4.35A8 8 0 1 0 17.4 13h-2.22a6 6 0 1 1-1-7.22L11 9h7V2z%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-image-progressive.oo-ui-icon-reload,.mw-ui-icon-reload-progressive:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E reload %3C/title%3E%3Cg fill=%22%2336c%22%3E%3Cpath d=%22M15.65 4.35A8 8 0 1 0 17.4 13h-2.22a6 6 0 1 1-1-7.22L11 9h7V2z%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-icon-search,.mw-ui-icon-search:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E search %3C/title%3E%3Cpath d=%22M12.2 13.6a7 7 0 1 1 1.4-1.4l5.4 5.4-1.4 1.4zM3 8a5 5 0 1 0 10 0A5 5 0 0 0 3 8%22/%3E%3C/svg%3E")}.oo-ui-image-invert.oo-ui-icon-search,.mw-ui-icon-search-invert:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E search %3C/title%3E%3Cg fill=%22%23fff%22%3E%3Cpath d=%22M12.2 13.6a7 7 0 1 1 1.4-1.4l5.4 5.4-1.4 1.4zM3 8a5 5 0 1 0 10 0A5 5 0 0 0 3 
8%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-image-progressive.oo-ui-icon-search,.mw-ui-icon-search-progressive:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E search %3C/title%3E%3Cg fill=%22%2336c%22%3E%3Cpath d=%22M12.2 13.6a7 7 0 1 1 1.4-1.4l5.4 5.4-1.4 1.4zM3 8a5 5 0 1 0 10 0A5 5 0 0 0 3 8%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-icon-settings,.mw-ui-icon-settings:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 xmlns:xlink=%22http://www.w3.org/1999/xlink%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E settings %3C/title%3E%3Cg transform=%22translate%2810 10%29%22%3E%3Cpath id=%22a%22 d=%22M1.5-10h-3l-1 6.5h5m0 7h-5l1 6.5h3%22/%3E%3Cuse xlink:href=%22%23a%22 transform=%22rotate%2845%29%22/%3E%3Cuse xlink:href=%22%23a%22 transform=%22rotate%2890%29%22/%3E%3Cuse xlink:href=%22%23a%22 transform=%22rotate%28135%29%22/%3E%3C/g%3E%3Cpath d=%22M10 2.5a7.5 7.5 0 0 0 0 15 7.5 7.5 0 0 0 0-15v4a3.5 3.5 0 0 1 0 7 3.5 3.5 0 0 1 0-7%22/%3E%3C/svg%3E")}.oo-ui-image-invert.oo-ui-icon-settings,.mw-ui-icon-settings-invert:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 xmlns:xlink=%22http://www.w3.org/1999/xlink%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E settings %3C/title%3E%3Cg fill=%22%23fff%22%3E%3Cg xmlns:xlink=%22http://www.w3.org/1999/xlink%22 transform=%22translate%2810 10%29%22%3E%3Cpath id=%22a%22 d=%22M1.5-10h-3l-1 6.5h5m0 7h-5l1 6.5h3%22/%3E%3Cuse xlink:href=%22%23a%22 transform=%22rotate%2845%29%22/%3E%3Cuse xlink:href=%22%23a%22 transform=%22rotate%2890%29%22/%3E%3Cuse xlink:href=%22%23a%22 transform=%22rotate%28135%29%22/%3E%3C/g%3E%3Cpath d=%22M10 2.5a7.5 7.5 0 0 0 0 15 7.5 7.5 0 0 0 0-15v4a3.5 3.5 0 0 1 0 7 3.5 3.5 0 0 1 
0-7%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-image-progressive.oo-ui-icon-settings,.mw-ui-icon-settings-progressive:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 xmlns:xlink=%22http://www.w3.org/1999/xlink%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E settings %3C/title%3E%3Cg fill=%22%2336c%22%3E%3Cg xmlns:xlink=%22http://www.w3.org/1999/xlink%22 transform=%22translate%2810 10%29%22%3E%3Cpath id=%22a%22 d=%22M1.5-10h-3l-1 6.5h5m0 7h-5l1 6.5h3%22/%3E%3Cuse xlink:href=%22%23a%22 transform=%22rotate%2845%29%22/%3E%3Cuse xlink:href=%22%23a%22 transform=%22rotate%2890%29%22/%3E%3Cuse xlink:href=%22%23a%22 transform=%22rotate%28135%29%22/%3E%3C/g%3E%3Cpath d=%22M10 2.5a7.5 7.5 0 0 0 0 15 7.5 7.5 0 0 0 0-15v4a3.5 3.5 0 0 1 0 7 3.5 3.5 0 0 1 0-7%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-icon-subtract,.mw-ui-icon-subtract:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E subtract %3C/title%3E%3Cpath d=%22M4 9h12v2H4z%22/%3E%3C/svg%3E")}.oo-ui-image-invert.oo-ui-icon-subtract,.mw-ui-icon-subtract-invert:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E subtract %3C/title%3E%3Cg fill=%22%23fff%22%3E%3Cpath d=%22M4 9h12v2H4z%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-image-progressive.oo-ui-icon-subtract,.mw-ui-icon-subtract-progressive:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E subtract %3C/title%3E%3Cg fill=%22%2336c%22%3E%3Cpath d=%22M4 9h12v2H4z%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-image-destructive.oo-ui-icon-subtract,.mw-ui-icon-subtract-destructive:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 
0 20 20%22%3E%3Ctitle%3E subtract %3C/title%3E%3Cg fill=%22%23d73333%22%3E%3Cpath d=%22M4 9h12v2H4z%22/%3E%3C/g%3E%3C/svg%3E")}
+.vector-icon.mw-ui-icon-wikimedia-appearance{-webkit-mask-image:url(https://en.wikipedia.org/w/load.php?modules=skins.vector.icons.js&image=appearance&format=original&lang=en&skin=vector-2022&version=ar2nc);mask-image:url(https://en.wikipedia.org/w/load.php?modules=skins.vector.icons.js&image=appearance&format=original&lang=en&skin=vector-2022&version=ar2nc)}.vector-icon.mw-ui-icon-wikimedia-appearance-invert{-webkit-mask-image:url(https://en.wikipedia.org/w/load.php?modules=skins.vector.icons.js&image=appearance&variant=invert&format=original&lang=en&skin=vector-2022&version=ar2nc);mask-image:url(https://en.wikipedia.org/w/load.php?modules=skins.vector.icons.js&image=appearance&variant=invert&format=original&lang=en&skin=vector-2022&version=ar2nc)}.vector-icon.mw-ui-icon-wikimedia-appearance-progressive{-webkit-mask-image:url(https://en.wikipedia.org/w/load.php?modules=skins.vector.icons.js&image=appearance&variant=progressive&format=original&lang=en&skin=vector-2022&version=ar2nc);mask-image:url(https://en.wikipedia.org/w/load.php?modules=skins.vector.icons.js&image=appearance&variant=progressive&format=original&lang=en&skin=vector-2022&version=ar2nc)}.vector-icon.mw-ui-icon-wikimedia-speechBubbleAdd{-webkit-mask-image:url(https://en.wikipedia.org/w/load.php?modules=skins.vector.icons.js&image=speechBubbleAdd&format=original&lang=en&skin=vector-2022&version=ar2nc);mask-image:url(https://en.wikipedia.org/w/load.php?modules=skins.vector.icons.js&image=speechBubbleAdd&format=original&lang=en&skin=vector-2022&version=ar2nc)}.vector-icon.mw-ui-icon-wikimedia-speechBubbleAdd-invert{-webkit-mask-image:url(https://en.wikipedia.org/w/load.php?modules=skins.vector.icons.js&image=speechBubbleAdd&variant=invert&format=original&lang=en&skin=vector-2022&version=ar2nc);mask-image:url(https://en.wikipedia.org/w/load.php?modules=skins.vector.icons.js&image=speechBubbleAdd&variant=invert&format=original&lang=en&skin=vector-2022&version=ar2nc)}.vector-icon.mw-ui-icon-wikimedia-spee
chBubbleAdd-progressive{-webkit-mask-image:url(https://en.wikipedia.org/w/load.php?modules=skins.vector.icons.js&image=speechBubbleAdd&variant=progressive&format=original&lang=en&skin=vector-2022&version=ar2nc);mask-image:url(https://en.wikipedia.org/w/load.php?modules=skins.vector.icons.js&image=speechBubbleAdd&variant=progressive&format=original&lang=en&skin=vector-2022&version=ar2nc)}.vector-icon.mw-ui-icon-wikimedia-speechBubbles{-webkit-mask-image:url(https://en.wikipedia.org/w/load.php?modules=skins.vector.icons.js&image=speechBubbles&format=original&lang=en&skin=vector-2022&version=ar2nc);mask-image:url(https://en.wikipedia.org/w/load.php?modules=skins.vector.icons.js&image=speechBubbles&format=original&lang=en&skin=vector-2022&version=ar2nc)}.vector-icon.mw-ui-icon-wikimedia-speechBubbles-invert{-webkit-mask-image:url(https://en.wikipedia.org/w/load.php?modules=skins.vector.icons.js&image=speechBubbles&variant=invert&format=original&lang=en&skin=vector-2022&version=ar2nc);mask-image:url(https://en.wikipedia.org/w/load.php?modules=skins.vector.icons.js&image=speechBubbles&variant=invert&format=original&lang=en&skin=vector-2022&version=ar2nc)}.vector-icon.mw-ui-icon-wikimedia-speechBubbles-progressive{-webkit-mask-image:url(https://en.wikipedia.org/w/load.php?modules=skins.vector.icons.js&image=speechBubbles&variant=progressive&format=original&lang=en&skin=vector-2022&version=ar2nc);mask-image:url(https://en.wikipedia.org/w/load.php?modules=skins.vector.icons.js&image=speechBubbles&variant=progressive&format=original&lang=en&skin=vector-2022&version=ar2nc)}.vector-icon.mw-ui-icon-wikimedia-article{-webkit-mask-image:url(https://en.wikipedia.org/w/load.php?modules=skins.vector.icons.js&image=article&format=original&lang=en&skin=vector-2022&version=ar2nc);mask-image:url(https://en.wikipedia.org/w/load.php?modules=skins.vector.icons.js&image=article&format=original&lang=en&skin=vector-2022&version=ar2nc)}.vector-icon.mw-ui-icon-wikimedia-article-invert{-webkit-ma
sk-image:url(https://en.wikipedia.org/w/load.php?modules=skins.vector.icons.js&image=article&variant=invert&format=original&lang=en&skin=vector-2022&version=ar2nc);mask-image:url(https://en.wikipedia.org/w/load.php?modules=skins.vector.icons.js&image=article&variant=invert&format=original&lang=en&skin=vector-2022&version=ar2nc)}.vector-icon.mw-ui-icon-wikimedia-article-progressive{-webkit-mask-image:url(https://en.wikipedia.org/w/load.php?modules=skins.vector.icons.js&image=article&variant=progressive&format=original&lang=en&skin=vector-2022&version=ar2nc);mask-image:url(https://en.wikipedia.org/w/load.php?modules=skins.vector.icons.js&image=article&variant=progressive&format=original&lang=en&skin=vector-2022&version=ar2nc)}.vector-icon.mw-ui-icon-wikimedia-history{-webkit-mask-image:url(https://en.wikipedia.org/w/load.php?modules=skins.vector.icons.js&image=history&format=original&lang=en&skin=vector-2022&version=ar2nc);mask-image:url(https://en.wikipedia.org/w/load.php?modules=skins.vector.icons.js&image=history&format=original&lang=en&skin=vector-2022&version=ar2nc)}.vector-icon.mw-ui-icon-wikimedia-history-invert{-webkit-mask-image:url(https://en.wikipedia.org/w/load.php?modules=skins.vector.icons.js&image=history&variant=invert&format=original&lang=en&skin=vector-2022&version=ar2nc);mask-image:url(https://en.wikipedia.org/w/load.php?modules=skins.vector.icons.js&image=history&variant=invert&format=original&lang=en&skin=vector-2022&version=ar2nc)}.vector-icon.mw-ui-icon-wikimedia-history-progressive{-webkit-mask-image:url(https://en.wikipedia.org/w/load.php?modules=skins.vector.icons.js&image=history&variant=progressive&format=original&lang=en&skin=vector-2022&version=ar2nc);mask-image:url(https://en.wikipedia.org/w/load.php?modules=skins.vector.icons.js&image=history&variant=progressive&format=original&lang=en&skin=vector-2022&version=ar2nc)}.vector-icon.mw-ui-icon-wikimedia-wikiText{-webkit-mask-image:url(https://en.wikipedia.org/w/load.php?modules=skins.vecto
r.icons.js&image=wikiText&format=original&lang=en&skin=vector-2022&version=ar2nc);mask-image:url(https://en.wikipedia.org/w/load.php?modules=skins.vector.icons.js&image=wikiText&format=original&lang=en&skin=vector-2022&version=ar2nc)}.vector-icon.mw-ui-icon-wikimedia-wikiText-invert{-webkit-mask-image:url(https://en.wikipedia.org/w/load.php?modules=skins.vector.icons.js&image=wikiText&variant=invert&format=original&lang=en&skin=vector-2022&version=ar2nc);mask-image:url(https://en.wikipedia.org/w/load.php?modules=skins.vector.icons.js&image=wikiText&variant=invert&format=original&lang=en&skin=vector-2022&version=ar2nc)}.vector-icon.mw-ui-icon-wikimedia-wikiText-progressive{-webkit-mask-image:url(https://en.wikipedia.org/w/load.php?modules=skins.vector.icons.js&image=wikiText&variant=progressive&format=original&lang=en&skin=vector-2022&version=ar2nc);mask-image:url(https://en.wikipedia.org/w/load.php?modules=skins.vector.icons.js&image=wikiText&variant=progressive&format=original&lang=en&skin=vector-2022&version=ar2nc)}.vector-icon.mw-ui-icon-wikimedia-edit{-webkit-mask-image:url(https://en.wikipedia.org/w/load.php?modules=skins.vector.icons.js&image=edit&format=original&lang=en&skin=vector-2022&version=ar2nc);mask-image:url(https://en.wikipedia.org/w/load.php?modules=skins.vector.icons.js&image=edit&format=original&lang=en&skin=vector-2022&version=ar2nc)}.vector-icon.mw-ui-icon-wikimedia-edit-invert{-webkit-mask-image:url(https://en.wikipedia.org/w/load.php?modules=skins.vector.icons.js&image=edit&variant=invert&format=original&lang=en&skin=vector-2022&version=ar2nc);mask-image:url(https://en.wikipedia.org/w/load.php?modules=skins.vector.icons.js&image=edit&variant=invert&format=original&lang=en&skin=vector-2022&version=ar2nc)}.vector-icon.mw-ui-icon-wikimedia-edit-progressive{-webkit-mask-image:url(https://en.wikipedia.org/w/load.php?modules=skins.vector.icons.js&image=edit&variant=progressive&format=original&lang=en&skin=vector-2022&version=ar2nc);mask-image:url(ht
tps://en.wikipedia.org/w/load.php?modules=skins.vector.icons.js&image=edit&variant=progressive&format=original&lang=en&skin=vector-2022&version=ar2nc)}.vector-icon.mw-ui-icon-wikimedia-editLock{-webkit-mask-image:url(https://en.wikipedia.org/w/load.php?modules=skins.vector.icons.js&image=editLock&format=original&lang=en&skin=vector-2022&version=ar2nc);mask-image:url(https://en.wikipedia.org/w/load.php?modules=skins.vector.icons.js&image=editLock&format=original&lang=en&skin=vector-2022&version=ar2nc)}.vector-icon.mw-ui-icon-wikimedia-editLock-invert{-webkit-mask-image:url(https://en.wikipedia.org/w/load.php?modules=skins.vector.icons.js&image=editLock&variant=invert&format=original&lang=en&skin=vector-2022&version=ar2nc);mask-image:url(https://en.wikipedia.org/w/load.php?modules=skins.vector.icons.js&image=editLock&variant=invert&format=original&lang=en&skin=vector-2022&version=ar2nc)}.vector-icon.mw-ui-icon-wikimedia-editLock-progressive{-webkit-mask-image:url(https://en.wikipedia.org/w/load.php?modules=skins.vector.icons.js&image=editLock&variant=progressive&format=original&lang=en&skin=vector-2022&version=ar2nc);mask-image:url(https://en.wikipedia.org/w/load.php?modules=skins.vector.icons.js&image=editLock&variant=progressive&format=original&lang=en&skin=vector-2022&version=ar2nc)}.vector-icon.mw-ui-icon-wikimedia-exitFullscreen{-webkit-mask-image:url(https://en.wikipedia.org/w/load.php?modules=skins.vector.icons.js&image=exitFullscreen&format=original&lang=en&skin=vector-2022&version=ar2nc);mask-image:url(https://en.wikipedia.org/w/load.php?modules=skins.vector.icons.js&image=exitFullscreen&format=original&lang=en&skin=vector-2022&version=ar2nc)}.vector-icon.mw-ui-icon-wikimedia-exitFullscreen-invert{-webkit-mask-image:url(https://en.wikipedia.org/w/load.php?modules=skins.vector.icons.js&image=exitFullscreen&variant=invert&format=original&lang=en&skin=vector-2022&version=ar2nc);mask-image:url(https://en.wikipedia.org/w/load.php?modules=skins.vector.icons.js&imag
e=exitFullscreen&variant=invert&format=original&lang=en&skin=vector-2022&version=ar2nc)}.vector-icon.mw-ui-icon-wikimedia-exitFullscreen-progressive{-webkit-mask-image:url(https://en.wikipedia.org/w/load.php?modules=skins.vector.icons.js&image=exitFullscreen&variant=progressive&format=original&lang=en&skin=vector-2022&version=ar2nc);mask-image:url(https://en.wikipedia.org/w/load.php?modules=skins.vector.icons.js&image=exitFullscreen&variant=progressive&format=original&lang=en&skin=vector-2022&version=ar2nc)}.vector-icon.mw-ui-icon-wikimedia-fullScreen{-webkit-mask-image:url(https://en.wikipedia.org/w/load.php?modules=skins.vector.icons.js&image=fullScreen&format=original&lang=en&skin=vector-2022&version=ar2nc);mask-image:url(https://en.wikipedia.org/w/load.php?modules=skins.vector.icons.js&image=fullScreen&format=original&lang=en&skin=vector-2022&version=ar2nc)}.vector-icon.mw-ui-icon-wikimedia-fullScreen-invert{-webkit-mask-image:url(https://en.wikipedia.org/w/load.php?modules=skins.vector.icons.js&image=fullScreen&variant=invert&format=original&lang=en&skin=vector-2022&version=ar2nc);mask-image:url(https://en.wikipedia.org/w/load.php?modules=skins.vector.icons.js&image=fullScreen&variant=invert&format=original&lang=en&skin=vector-2022&version=ar2nc)}.vector-icon.mw-ui-icon-wikimedia-fullScreen-progressive{-webkit-mask-image:url(https://en.wikipedia.org/w/load.php?modules=skins.vector.icons.js&image=fullScreen&variant=progressive&format=original&lang=en&skin=vector-2022&version=ar2nc);mask-image:url(https://en.wikipedia.org/w/load.php?modules=skins.vector.icons.js&image=fullScreen&variant=progressive&format=original&lang=en&skin=vector-2022&version=ar2nc)}
+.cite-accessibility-label{ top:-99999px;clip:rect(1px,1px,1px,1px); position:absolute !important;padding:0 !important;border:0 !important;height:1px !important;width:1px !important; overflow:hidden}:target .mw-cite-targeted-backlink{font-weight:bold}.mw-cite-up-arrow-backlink{display:none}:target .mw-cite-up-arrow-backlink{display:inline}:target .mw-cite-up-arrow{display:none}
+.ext-urlshortener-result-dialog{font-size:0.90909em}.ext-urlshortener-result-dialog a{word-wrap:break-word}
+.cdx-button{display:inline-flex;align-items:center;justify-content:center;gap:4px;box-sizing:border-box;min-height:32px;max-width:28rem;margin:0;border-width:1px;border-style:solid;border-radius:2px;padding-right:11px;padding-left:11px;font-family:inherit;font-size:inherit;font-weight:700;overflow:hidden;text-overflow:ellipsis;white-space:nowrap;text-transform:none;transition-property:background-color,color,border-color,box-shadow;transition-duration:.1s}.cdx-button--size-large{min-height:44px;padding-right:15px;padding-left:15px}.cdx-button--icon-only{min-width:32px;padding-right:5px;padding-left:5px}.cdx-button--icon-only.cdx-button--size-large{min-width:44px;padding-right:11px;padding-left:11px}.cdx-button::-moz-focus-inner{border:0;padding:0}.cdx-button .cdx-button__icon,.cdx-button .cdx-icon{vertical-align:middle}.cdx-button .cdx-icon{color:inherit}.cdx-button--fake-button,.cdx-button--fake-button:hover,.cdx-button--fake-button:focus{text-decoration:none}.cdx-button:enabled,.cdx-button.cdx-button--fake-button--enabled{background-color:var(--background-color-interactive-subtle,#f8f9fa);color:var(--color-base,#202122);border-color:var(--border-color-base,#a2a9b1)}@supports ((-webkit-mask-image:none) or (mask-image:none)){.cdx-button:enabled .cdx-button__icon,.cdx-button.cdx-button--fake-button--enabled .cdx-button__icon{background-color:var(--color-base,#202122)}}.cdx-button:enabled:hover,.cdx-button.cdx-button--fake-button--enabled:hover{background-color:var(--background-color-base,#fff);color:var(--color-base--hover,#404244);cursor:pointer}@supports ((-webkit-mask-image:none) or (mask-image:none)){.cdx-button:enabled:hover .cdx-button__icon,.cdx-button.cdx-button--fake-button--enabled:hover 
.cdx-button__icon{background-color:var(--color-base--hover,#404244)}}.cdx-button:enabled:active,.cdx-button.cdx-button--fake-button--enabled:active,.cdx-button:enabled.cdx-button--is-active,.cdx-button.cdx-button--fake-button--enabled.cdx-button--is-active{background-color:var(--background-color-interactive,#eaecf0);color:var(--color-emphasized,#101418);border-color:var(--border-color-interactive,#72777d)}@supports ((-webkit-mask-image:none) or (mask-image:none)){.cdx-button:enabled:active .cdx-button__icon,.cdx-button.cdx-button--fake-button--enabled:active .cdx-button__icon,.cdx-button:enabled.cdx-button--is-active .cdx-button__icon,.cdx-button.cdx-button--fake-button--enabled.cdx-button--is-active .cdx-button__icon{background-color:var(--color-emphasized,#101418)}}.cdx-button:enabled:focus,.cdx-button.cdx-button--fake-button--enabled:focus{outline:1px solid transparent}.cdx-button:enabled:focus:not(:active):not(.cdx-button--is-active),.cdx-button.cdx-button--fake-button--enabled:focus:not(:active):not(.cdx-button--is-active){border-color:var(--border-color-progressive--focus,#36c);box-shadow:inset 0 0 0 1px var(--box-shadow-color-progressive--focus,#36c)}.cdx-button:enabled.cdx-button--action-progressive,.cdx-button.cdx-button--fake-button--enabled.cdx-button--action-progressive{color:var(--color-progressive,#36c)}@supports ((-webkit-mask-image:none) or (mask-image:none)){.cdx-button:enabled.cdx-button--action-progressive .cdx-button__icon,.cdx-button.cdx-button--fake-button--enabled.cdx-button--action-progressive .cdx-button__icon{background-color:var(--color-progressive,#36c)}}.cdx-button:enabled.cdx-button--action-progressive:hover,.cdx-button.cdx-button--fake-button--enabled.cdx-button--action-progressive:hover{color:var(--color-progressive--hover,#4b77d6);border-color:var(--border-color-progressive--hover,#4b77d6)}@supports ((-webkit-mask-image:none) or (mask-image:none)){.cdx-button:enabled.cdx-button--action-progressive:hover 
.cdx-button__icon,.cdx-button.cdx-button--fake-button--enabled.cdx-button--action-progressive:hover .cdx-button__icon{background-color:var(--color-progressive--hover,#4b77d6)}}.cdx-button:enabled.cdx-button--action-progressive:active,.cdx-button.cdx-button--fake-button--enabled.cdx-button--action-progressive:active,.cdx-button:enabled.cdx-button--action-progressive.cdx-button--is-active,.cdx-button.cdx-button--fake-button--enabled.cdx-button--action-progressive.cdx-button--is-active{background-color:var(--background-color-progressive-subtle,#f1f4fd);color:var(--color-progressive--active,#233566);border-color:var(--border-color-progressive--active,#233566)}@supports ((-webkit-mask-image:none) or (mask-image:none)){.cdx-button:enabled.cdx-button--action-progressive:active .cdx-button__icon,.cdx-button.cdx-button--fake-button--enabled.cdx-button--action-progressive:active .cdx-button__icon,.cdx-button:enabled.cdx-button--action-progressive.cdx-button--is-active .cdx-button__icon,.cdx-button.cdx-button--fake-button--enabled.cdx-button--action-progressive.cdx-button--is-active .cdx-button__icon{background-color:var(--color-progressive--active,#233566)}}.cdx-button:enabled.cdx-button--action-destructive,.cdx-button.cdx-button--fake-button--enabled.cdx-button--action-destructive{color:var(--color-destructive,#bf3c2c)}@supports ((-webkit-mask-image:none) or (mask-image:none)){.cdx-button:enabled.cdx-button--action-destructive .cdx-button__icon,.cdx-button.cdx-button--fake-button--enabled.cdx-button--action-destructive .cdx-button__icon{background-color:var(--color-destructive,#bf3c2c)}}.cdx-button:enabled.cdx-button--action-destructive:hover,.cdx-button.cdx-button--fake-button--enabled.cdx-button--action-destructive:hover{color:var(--color-destructive--hover,#f54739);border-color:var(--border-color-destructive--hover,#f54739)}@supports ((-webkit-mask-image:none) or (mask-image:none)){.cdx-button:enabled.cdx-button--action-destructive:hover 
.cdx-button__icon,.cdx-button.cdx-button--fake-button--enabled.cdx-button--action-destructive:hover .cdx-button__icon{background-color:var(--color-destructive--hover,#f54739)}}.cdx-button:enabled.cdx-button--action-destructive:active,.cdx-button.cdx-button--fake-button--enabled.cdx-button--action-destructive:active,.cdx-button:enabled.cdx-button--action-destructive.cdx-button--is-active,.cdx-button.cdx-button--fake-button--enabled.cdx-button--action-destructive.cdx-button--is-active{background-color:var(--background-color-destructive-subtle,#ffe9e5);color:var(--color-destructive--active,#9f3526);border-color:var(--border-color-destructive--active,#9f3526)}@supports ((-webkit-mask-image:none) or (mask-image:none)){.cdx-button:enabled.cdx-button--action-destructive:active .cdx-button__icon,.cdx-button.cdx-button--fake-button--enabled.cdx-button--action-destructive:active .cdx-button__icon,.cdx-button:enabled.cdx-button--action-destructive.cdx-button--is-active .cdx-button__icon,.cdx-button.cdx-button--fake-button--enabled.cdx-button--action-destructive.cdx-button--is-active .cdx-button__icon{background-color:var(--color-destructive--active,#9f3526)}}.cdx-button:enabled.cdx-button--action-destructive:focus:not(:active):not(.cdx-button--is-active),.cdx-button.cdx-button--fake-button--enabled.cdx-button--action-destructive:focus:not(:active):not(.cdx-button--is-active){border-color:var(--border-color-destructive--focus,#36c);box-shadow:inset 0 0 0 1px var(--box-shadow-color-destructive--focus,#36c)}.cdx-button:enabled.cdx-button--weight-primary.cdx-button--action-progressive,.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-primary.cdx-button--action-progressive{background-color:var(--background-color-progressive,#36c);color:var(--color-inverted-fixed,#fff);border-color:var(--border-color-progressive,#36c)}@supports ((-webkit-mask-image:none) or (mask-image:none)){.cdx-button:enabled.cdx-button--weight-primary.cdx-button--action-progressive 
.cdx-button__icon,.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-primary.cdx-button--action-progressive .cdx-button__icon{background-color:var(--color-inverted-fixed,#fff)}}.cdx-button:enabled.cdx-button--weight-primary.cdx-button--action-progressive:hover,.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-primary.cdx-button--action-progressive:hover{background-color:var(--background-color-progressive--hover,#4b77d6);border-color:var(--border-color-progressive--hover,#4b77d6)}@supports ((-webkit-mask-image:none) or (mask-image:none)){.cdx-button:enabled.cdx-button--weight-primary.cdx-button--action-progressive:hover .cdx-button__icon,.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-primary.cdx-button--action-progressive:hover .cdx-button__icon{background-color:var(--color-inverted-fixed,#fff)}}.cdx-button:enabled.cdx-button--weight-primary.cdx-button--action-progressive:active,.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-primary.cdx-button--action-progressive:active,.cdx-button:enabled.cdx-button--weight-primary.cdx-button--action-progressive.cdx-button--is-active,.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-primary.cdx-button--action-progressive.cdx-button--is-active{background-color:var(--background-color-progressive--active,#233566);border-color:var(--border-color-progressive--active,#233566)}@supports ((-webkit-mask-image:none) or (mask-image:none)){.cdx-button:enabled.cdx-button--weight-primary.cdx-button--action-progressive:active .cdx-button__icon,.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-primary.cdx-button--action-progressive:active .cdx-button__icon,.cdx-button:enabled.cdx-button--weight-primary.cdx-button--action-progressive.cdx-button--is-active .cdx-button__icon,.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-primary.cdx-button--action-progressive.cdx-button--is-active 
.cdx-button__icon{background-color:var(--color-inverted-fixed,#fff)}}.cdx-button:enabled.cdx-button--weight-primary.cdx-button--action-progressive:focus:not(:active):not(.cdx-button--is-active),.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-primary.cdx-button--action-progressive:focus:not(:active):not(.cdx-button--is-active){border-color:var(--border-color-progressive--focus,#36c);box-shadow:inset 0 0 0 1px var(--box-shadow-color-progressive--focus,#36c),inset 0 0 0 2px var(--box-shadow-color-inverted,#fff)}.cdx-button:enabled.cdx-button--weight-primary.cdx-button--action-destructive,.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-primary.cdx-button--action-destructive{background-color:var(--background-color-destructive,#bf3c2c);color:var(--color-inverted-fixed,#fff);border-color:var(--border-color-destructive,#bf3c2c)}@supports ((-webkit-mask-image:none) or (mask-image:none)){.cdx-button:enabled.cdx-button--weight-primary.cdx-button--action-destructive .cdx-button__icon,.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-primary.cdx-button--action-destructive .cdx-button__icon{background-color:var(--color-inverted-fixed,#fff)}}.cdx-button:enabled.cdx-button--weight-primary.cdx-button--action-destructive:hover,.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-primary.cdx-button--action-destructive:hover{background-color:var(--background-color-destructive--hover,#f54739);border-color:var(--border-color-destructive--hover,#f54739)}@supports ((-webkit-mask-image:none) or (mask-image:none)){.cdx-button:enabled.cdx-button--weight-primary.cdx-button--action-destructive:hover .cdx-button__icon,.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-primary.cdx-button--action-destructive:hover 
.cdx-button__icon{background-color:var(--color-inverted-fixed,#fff)}}.cdx-button:enabled.cdx-button--weight-primary.cdx-button--action-destructive:active,.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-primary.cdx-button--action-destructive:active,.cdx-button:enabled.cdx-button--weight-primary.cdx-button--action-destructive.cdx-button--is-active,.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-primary.cdx-button--action-destructive.cdx-button--is-active{background-color:var(--background-color-destructive--active,#9f3526);border-color:var(--border-color-destructive--active,#9f3526)}@supports ((-webkit-mask-image:none) or (mask-image:none)){.cdx-button:enabled.cdx-button--weight-primary.cdx-button--action-destructive:active .cdx-button__icon,.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-primary.cdx-button--action-destructive:active .cdx-button__icon,.cdx-button:enabled.cdx-button--weight-primary.cdx-button--action-destructive.cdx-button--is-active .cdx-button__icon,.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-primary.cdx-button--action-destructive.cdx-button--is-active .cdx-button__icon{background-color:var(--color-inverted-fixed,#fff)}}.cdx-button:enabled.cdx-button--weight-primary.cdx-button--action-destructive:focus:not(:active):not(.cdx-button--is-active),.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-primary.cdx-button--action-destructive:focus:not(:active):not(.cdx-button--is-active){border-color:var(--border-color-destructive--focus,#36c);box-shadow:inset 0 0 0 1px var(--box-shadow-color-destructive--focus,#36c),inset 0 0 0 2px 
var(--box-shadow-color-inverted,#fff)}.cdx-button:enabled.cdx-button--weight-quiet,.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-quiet{background-color:var(--background-color-transparent,transparent);border-color:var(--border-color-transparent,transparent)}.cdx-button:enabled.cdx-button--weight-quiet:hover,.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-quiet:hover{background-color:var(--background-color-button-quiet--hover,rgba(0,24,73,.027))}.cdx-button:enabled.cdx-button--weight-quiet:active,.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-quiet:active,.cdx-button:enabled.cdx-button--weight-quiet.cdx-button--is-active,.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-quiet.cdx-button--is-active{background-color:var(--background-color-button-quiet--active,rgba(0,24,73,.082));color:var(--color-emphasized,#101418);border-color:var(--border-color-interactive,#72777d)}@supports ((-webkit-mask-image:none) or (mask-image:none)){.cdx-button:enabled.cdx-button--weight-quiet:active .cdx-button__icon,.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-quiet:active .cdx-button__icon,.cdx-button:enabled.cdx-button--weight-quiet.cdx-button--is-active .cdx-button__icon,.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-quiet.cdx-button--is-active .cdx-button__icon{background-color:var(--color-emphasized,#101418)}}.cdx-button:enabled.cdx-button--weight-quiet.cdx-button--action-progressive,.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-quiet.cdx-button--action-progressive{color:var(--color-progressive,#36c)}@supports ((-webkit-mask-image:none) or (mask-image:none)){.cdx-button:enabled.cdx-button--weight-quiet.cdx-button--action-progressive .cdx-button__icon,.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-quiet.cdx-button--action-progressive 
.cdx-button__icon{background-color:var(--color-progressive,#36c)}}.cdx-button:enabled.cdx-button--weight-quiet.cdx-button--action-progressive:hover,.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-quiet.cdx-button--action-progressive:hover{background-color:var(--background-color-progressive-subtle,#f1f4fd);color:var(--color-progressive--hover,#4b77d6)}@supports ((-webkit-mask-image:none) or (mask-image:none)){.cdx-button:enabled.cdx-button--weight-quiet.cdx-button--action-progressive:hover .cdx-button__icon,.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-quiet.cdx-button--action-progressive:hover .cdx-button__icon{background-color:var(--color-progressive--hover,#4b77d6)}}.cdx-button:enabled.cdx-button--weight-quiet.cdx-button--action-progressive:active,.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-quiet.cdx-button--action-progressive:active,.cdx-button:enabled.cdx-button--weight-quiet.cdx-button--action-progressive.cdx-button--is-active,.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-quiet.cdx-button--action-progressive.cdx-button--is-active{background-color:var(--background-color-progressive--active,#233566);color:var(--color-inverted-fixed,#fff);border-color:var(--border-color-progressive--active,#233566)}@supports ((-webkit-mask-image:none) or (mask-image:none)){.cdx-button:enabled.cdx-button--weight-quiet.cdx-button--action-progressive:active .cdx-button__icon,.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-quiet.cdx-button--action-progressive:active .cdx-button__icon,.cdx-button:enabled.cdx-button--weight-quiet.cdx-button--action-progressive.cdx-button--is-active .cdx-button__icon,.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-quiet.cdx-button--action-progressive.cdx-button--is-active 
.cdx-button__icon{background-color:var(--color-inverted,#fff)}}.cdx-button:enabled.cdx-button--weight-quiet.cdx-button--action-destructive,.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-quiet.cdx-button--action-destructive{color:var(--color-destructive,#bf3c2c)}@supports ((-webkit-mask-image:none) or (mask-image:none)){.cdx-button:enabled.cdx-button--weight-quiet.cdx-button--action-destructive .cdx-button__icon,.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-quiet.cdx-button--action-destructive .cdx-button__icon{background-color:var(--color-destructive,#bf3c2c)}}.cdx-button:enabled.cdx-button--weight-quiet.cdx-button--action-destructive:hover,.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-quiet.cdx-button--action-destructive:hover{background-color:var(--background-color-destructive-subtle,#ffe9e5);color:var(--color-destructive--hover,#f54739)}@supports ((-webkit-mask-image:none) or (mask-image:none)){.cdx-button:enabled.cdx-button--weight-quiet.cdx-button--action-destructive:hover .cdx-button__icon,.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-quiet.cdx-button--action-destructive:hover .cdx-button__icon{background-color:var(--color-destructive--hover,#f54739)}}.cdx-button:enabled.cdx-button--weight-quiet.cdx-button--action-destructive:active,.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-quiet.cdx-button--action-destructive:active,.cdx-button:enabled.cdx-button--weight-quiet.cdx-button--action-destructive.cdx-button--is-active,.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-quiet.cdx-button--action-destructive.cdx-button--is-active{background-color:var(--background-color-destructive--active,#9f3526);color:var(--color-inverted-fixed,#fff);border-color:var(--border-color-destructive--active,#9f3526)}@supports ((-webkit-mask-image:none) or (mask-image:none)){.cdx-button:enabled.cdx-button--weight-quiet.cdx-button--action-destructive:active 
.cdx-button__icon,.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-quiet.cdx-button--action-destructive:active .cdx-button__icon,.cdx-button:enabled.cdx-button--weight-quiet.cdx-button--action-destructive.cdx-button--is-active .cdx-button__icon,.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-quiet.cdx-button--action-destructive.cdx-button--is-active .cdx-button__icon{background-color:var(--color-inverted,#fff)}}.cdx-button:enabled.cdx-button--weight-quiet.cdx-button--action-destructive:focus:not(:active):not(.cdx-button--is-active),.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-quiet.cdx-button--action-destructive:focus:not(:active):not(.cdx-button--is-active){border-color:var(--border-color-destructive--focus,#36c);box-shadow:inset 0 0 0 1px var(--box-shadow-color-destructive--focus,#36c)}.cdx-button:disabled,.cdx-button.cdx-button--fake-button--disabled{background-color:var(--background-color-disabled,#dadde3);color:var(--color-disabled-emphasized,#a2a9b1);border-color:var(--border-color-transparent,transparent)}@supports ((-webkit-mask-image:none) or (mask-image:none)){.cdx-button:disabled .cdx-button__icon,.cdx-button.cdx-button--fake-button--disabled .cdx-button__icon{background-color:var(--color-inverted,#fff)}}.cdx-button:disabled.cdx-button--weight-quiet,.cdx-button.cdx-button--fake-button--disabled.cdx-button--weight-quiet{background-color:var(--background-color-transparent,transparent);color:var(--color-disabled,#a2a9b1)}@supports ((-webkit-mask-image:none) or (mask-image:none)){.cdx-button:disabled.cdx-button--weight-quiet .cdx-button__icon,.cdx-button.cdx-button--fake-button--disabled.cdx-button--weight-quiet .cdx-button__icon{background-color:var(--color-disabled,#a2a9b1)}}.cdx-icon{color:var(--color-base,#202122);display:inline-flex;align-items:center;justify-content:center;vertical-align:text-bottom}.cdx-icon 
svg{fill:currentcolor;width:100%;height:100%}.cdx-icon--x-small{min-width:12px;min-height:12px;width:.75rem;height:.75rem}.cdx-icon--small{min-width:16px;min-height:16px;width:1rem;height:1rem}.cdx-icon--medium{min-width:20px;min-height:20px;width:1.25rem;height:1.25rem}.cdx-icon--flipped svg{transform:scaleX(-1)}.cdx-dialog-backdrop{background-color:var(--background-color-backdrop-light,rgba(255,255,255,.65));display:flex;align-items:center;justify-content:center;position:fixed;top:0;left:0;z-index:400;min-height:100%;width:100vw;height:100vh;height:-webkit-fill-available}.cdx-dialog{background-color:var(--background-color-base,#fff);display:flex;flex-direction:column;box-sizing:border-box;width:calc(100% - 2rem);max-width:32rem;max-height:calc(100vh - 2.5rem);border:1px solid var(--border-color-base,#a2a9b1);border-radius:2px;box-shadow:0 2px 2px rgba(0,0,0,.2)}.cdx-dialog__header{padding:16px 24px}.cdx-dialog__header--default{display:flex;align-items:baseline;justify-content:flex-end;box-sizing:border-box;width:100%}.cdx-dialog__header__title-group{display:flex;flex-grow:1;flex-direction:column;gap:6px}.cdx-dialog__header .cdx-dialog__header__title{margin:0;border:0;padding:0;font-family:inherit;font-size:1.125rem;font-weight:700;line-height:1.25}.cdx-dialog__header .cdx-dialog__header__subtitle{color:var(--color-subtle,#54595d);margin:0;padding:0;font-size:1rem;line-height:1.375}.cdx-dialog__header__close-button.cdx-button{margin-right:-8px}.cdx-dialog--dividers .cdx-dialog__header{border-bottom:1px solid var(--border-color-subtle,#c8ccd1)}.cdx-dialog__body{flex-grow:1;padding:16px 24px;overflow-y:auto}.cdx-dialog__body--no-header{padding-top:24px}.cdx-dialog__body--no-footer{padding-bottom:24px}.cdx-dialog__body>*:first-child{margin-top:0;padding-top:0}.cdx-dialog__body>*:last-child{margin-bottom:0;padding-bottom:0}.cdx-dialog__footer{padding:16px 24px 
24px}.cdx-dialog__footer--default{display:flex;align-items:baseline;flex-wrap:wrap;justify-content:space-between;gap:12px}.cdx-dialog__footer .cdx-dialog__footer__text{color:var(--color-subtle,#54595d);flex:1 0 auto;width:100%;margin:0;font-size:.875rem;line-height:1.5714285}.cdx-dialog__footer__actions{display:flex;flex-grow:1;gap:12px}.cdx-dialog--dividers .cdx-dialog__footer{border-top:1px solid var(--border-color-subtle,#c8ccd1)}.cdx-dialog--horizontal-actions .cdx-dialog__footer__actions{flex-direction:row-reverse}.cdx-dialog--vertical-actions .cdx-dialog__footer__actions{flex-direction:column;width:100%}.cdx-dialog--vertical-actions .cdx-dialog__footer .cdx-dialog__footer__primary-action.cdx-button,.cdx-dialog--vertical-actions .cdx-dialog__footer .cdx-dialog__footer__default-action.cdx-button{max-width:none}.cdx-dialog-focus-trap{position:absolute}.cdx-dialog-focus-trap:focus{outline:0}.cdx-dialog-fade-enter-active,.cdx-dialog-fade-leave-active{transition-property:opacity;transition-duration:.25s;transition-timing-function:ease}.cdx-dialog-fade-enter-from,.cdx-dialog-fade-leave-to{opacity:0}body.cdx-dialog-open{overflow:hidden}.cdx-progress-bar{box-sizing:border-box;overflow-x:hidden}.cdx-progress-bar__bar{width:33.33%;height:100%}.cdx-progress-bar:not(.cdx-progress-bar--inline){position:relative;z-index:1;height:1rem;max-width:none;border:1px solid var(--border-color-base,#a2a9b1);border-radius:9999px;box-shadow:0 2px 2px rgba(0,0,0,.2)}.cdx-progress-bar--inline{width:100%;height:.25rem}.cdx-progress-bar:not(.cdx-progress-bar--disabled) .cdx-progress-bar__bar{background-color:var(--background-color-progressive,#36c);animation-name:cdx-animation-progress-bar__bar;animation-duration:1.6s;animation-timing-function:linear;animation-iteration-count:infinite}.cdx-progress-bar:not(.cdx-progress-bar--disabled).cdx-progress-bar--block{background-color:var(--background-color-base,#fff)}.cdx-progress-bar--disabled 
.cdx-progress-bar__bar{background-color:var(--background-color-disabled,#dadde3)}.cdx-progress-bar--disabled:not(.cdx-progress-bar--inline){background-color:var(--background-color-disabled-subtle,#eaecf0)}@keyframes cdx-animation-progress-bar__bar{0%{transform:translate(-100%)}to{transform:translate(300%)}}.cdx-thumbnail{display:inline-flex}.cdx-thumbnail__placeholder,.cdx-thumbnail__image{background-position:center;background-repeat:no-repeat;background-size:cover;flex-shrink:0;box-sizing:border-box;min-width:40px;min-height:40px;width:2.5rem;height:2.5rem;border:1px solid var(--border-color-subtle,#c8ccd1);border-radius:2px}.cdx-thumbnail__image{background-color:var(--background-color-base-fixed,#fff);display:inline-block}.cdx-thumbnail__image-enter-active{transition-property:opacity;transition-duration:.1s}.cdx-thumbnail__image-enter-from{opacity:0}.cdx-thumbnail__placeholder{background-color:var(--background-color-interactive-subtle,#f8f9fa);display:inline-flex;align-items:center;justify-content:center}.cdx-thumbnail__placeholder__icon{min-width:20px;min-height:20px;width:1.25rem;height:1.25rem;display:inline-block;vertical-align:text-bottom}@supports not (((-webkit-mask-image:none) or (mask-image:none))){.cdx-thumbnail__placeholder__icon{background-position:center;background-repeat:no-repeat;background-size:max(1.25rem,20px)}}@supports ((-webkit-mask-image:none) or (mask-image:none)){.cdx-thumbnail__placeholder__icon{-webkit-mask-size:max(1.25rem,20px);mask-size:max(1.25rem,20px);-webkit-mask-repeat:no-repeat;mask-repeat:no-repeat;-webkit-mask-position:center;mask-position:center}}@supports not (((-webkit-mask-image:none) or (mask-image:none))){.cdx-thumbnail__placeholder__icon{background-image:url('data:image/svg+xml;utf8,<svg xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" width="20" height="20" viewBox="0 0 20 20" fill="%23000000"><path d="M19 3H1v14h18zM3 14l3.5-4.5 2.5 3L12.5 8l4.5 6z"/><path d="M19 5H1V3h18zm0 
12H1v-2h18z"/></svg>');filter:invert(var(--filter-invert-icon,0));opacity:var(--opacity-icon-base,.87)}.cdx-button:not(.cdx-button--weight-quiet):disabled .cdx-thumbnail__placeholder__icon,.cdx-button--weight-primary.cdx-button--action-progressive .cdx-thumbnail__placeholder__icon,.cdx-button--weight-primary.cdx-button--action-destructive .cdx-thumbnail__placeholder__icon{filter:invert(var(--filter-invert-primary-button-icon,1))}}@supports ((-webkit-mask-image:none) or (mask-image:none)){.cdx-thumbnail__placeholder__icon{-webkit-mask-image:url('data:image/svg+xml;utf8,<svg xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" width="20" height="20" viewBox="0 0 20 20" fill="%23000000"><path d="M19 3H1v14h18zM3 14l3.5-4.5 2.5 3L12.5 8l4.5 6z"/><path d="M19 5H1V3h18zm0 12H1v-2h18z"/></svg>');mask-image:url('data:image/svg+xml;utf8,<svg xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" width="20" height="20" viewBox="0 0 20 20" fill="%23000000"><path d="M19 3H1v14h18zM3 14l3.5-4.5 2.5 3L12.5 8l4.5 6z"/><path d="M19 5H1V3h18zm0 12H1v-2h18z"/></svg>');background-color:var(--color-placeholder,#72777d)}}.cdx-thumbnail__placeholder__icon--vue.cdx-icon{color:var(--color-placeholder,#72777d)}.cdx-search-result-title{display:inline-block;max-width:100%;font-weight:700}.cdx-search-result-title__match{font-weight:400}.cdx-menu-item{list-style:none;position:relative;padding:8px 12px;line-height:1.6;transition-property:background-color,color,border-color,box-shadow;transition-duration:.1s}.cdx-menu-item__content{display:flex;align-items:center;line-height:1.4285714;word-wrap:break-word;-webkit-hyphens:auto;-ms-hyphens:auto;hyphens:auto}.cdx-menu-item__content,.cdx-menu-item__content:hover{text-decoration:none}.cdx-menu-item--has-description 
.cdx-menu-item__content{align-items:flex-start}.cdx-menu-item__text{max-width:100%}.cdx-menu-item__text__description{display:block}.cdx-menu-item__thumbnail.cdx-thumbnail,.cdx-menu-item__icon{margin-right:8px}.cdx-menu-item__selected-icon{height:1.4285714em;margin-left:auto}.cdx-menu-item__icon.cdx-icon,.cdx-menu-item__selected-icon.cdx-icon{color:inherit}.cdx-menu-item--bold-label .cdx-menu-item__text__label{font-weight:700}.cdx-menu-item--hide-description-overflow .cdx-menu-item__text{overflow:hidden}.cdx-menu-item--hide-description-overflow .cdx-menu-item__text__description{overflow:hidden;text-overflow:ellipsis;white-space:nowrap}.cdx-menu-item--enabled,.cdx-menu-item--enabled .cdx-menu-item__content{color:var(--color-base,#202122)}.cdx-menu-item--enabled .cdx-menu-item__text__supporting-text,.cdx-menu-item--enabled .cdx-menu-item__text__description{color:var(--color-subtle,#54595d)}.cdx-menu-item--enabled.cdx-menu-item--highlighted{background-color:var(--background-color-interactive-subtle,#f8f9fa);color:var(--color-base--hover,#404244);cursor:pointer}.cdx-menu-item--enabled.cdx-menu-item--highlighted .cdx-menu-item__content,.cdx-menu-item--enabled.cdx-menu-item--highlighted .cdx-menu-item__text__description{color:var(--color-base--hover,#404244)}.cdx-menu-item--enabled.cdx-menu-item--active{background-color:var(--background-color-interactive,#eaecf0);color:var(--color-emphasized,#101418)}.cdx-menu-item--enabled.cdx-menu-item--active .cdx-menu-item__content,.cdx-menu-item--enabled.cdx-menu-item--active .cdx-menu-item__text__description{color:var(--color-emphasized,#101418)}.cdx-menu-item--enabled.cdx-menu-item--selected{background-color:var(--background-color-progressive-subtle,#f1f4fd)}.cdx-menu-item--enabled.cdx-menu-item--selected .cdx-menu-item__content{color:var(--color-progressive,#36c)}.cdx-menu-item--enabled.cdx-menu-item--selected.cdx-menu-item--highlighted 
.cdx-menu-item__content{color:var(--color-progressive--hover,#4b77d6)}.cdx-menu-item--enabled.cdx-menu-item--selected.cdx-menu-item--highlighted .cdx-menu-item__text__description{color:var(--color-subtle,#54595d)}.cdx-menu-item--enabled.cdx-menu-item--selected.cdx-menu-item--active .cdx-menu-item__content{color:var(--color-progressive--active,#233566)}.cdx-menu-item--enabled.cdx-menu-item--selected.cdx-menu-item--active .cdx-menu-item__text__description{color:var(--color-subtle,#54595d)}.cdx-menu-item--disabled{color:var(--color-disabled,#a2a9b1);cursor:default}.cdx-menu-item--disabled .cdx-menu-item__text__description{color:var(--color-disabled,#a2a9b1)}.cdx-menu-item--destructive .cdx-menu-item__content{color:var(--color-destructive,#bf3c2c)}.cdx-menu-item--destructive.cdx-menu-item--highlighted .cdx-menu-item__content{color:var(--color-destructive--hover,#f54739)}.cdx-menu-item--destructive.cdx-menu-item--active .cdx-menu-item__content{color:var(--color-destructive--active,#9f3526)}.cdx-menu-item--destructive.cdx-menu-item--selected.cdx-menu-item--highlighted .cdx-menu-item__content,.cdx-menu-item--destructive.cdx-menu-item--selected.cdx-menu-item--highlighted .cdx-menu-item__text__description{color:var(--color-destructive--hover,#f54739)}.cdx-menu{background-color:var(--background-color-base,#fff);display:flex;flex-direction:column;position:absolute;left:0;z-index:50;box-sizing:border-box;width:100%;border:1px solid var(--border-color-base,#a2a9b1);border-radius:2px;box-shadow:0 2px 2px rgba(0,0,0,.2)}.cdx-menu__progress-bar.cdx-progress-bar{position:absolute;top:0}.cdx-menu__listbox,.cdx-menu__group{margin:0;padding:0}.cdx-menu__listbox{overflow-y:auto}.cdx-menu__group{display:flex;flex-direction:column}.cdx-menu__group__meta{display:flex;gap:8px;padding:8px 12px 
6px}.cdx-menu__group__meta__text{display:flex;flex-direction:column;line-height:1.6}.cdx-menu__group__icon{height:1.6em}.cdx-menu__group__label{font-weight:700}.cdx-menu__group__description{color:var(--color-subtle,#54595d);font-size:.875rem}.cdx-menu__group-wrapper--hide-label .cdx-menu__group__meta{display:block;clip:rect(1px,1px,1px,1px);position:absolute!important;width:1px;height:1px;margin:-1px;border:0;padding:0;overflow:hidden}.cdx-menu__group-wrapper+.cdx-menu-item,.cdx-menu-item+.cdx-menu__group-wrapper,.cdx-menu__group-wrapper--hide-label,.cdx-menu__group-wrapper--hide-label+.cdx-menu__group-wrapper{border-top:1px solid var(--border-color-muted,#dadde3)}.cdx-menu--has-footer .cdx-menu__listbox>.cdx-menu-item:last-of-type{position:absolute;bottom:0;box-sizing:border-box;width:100%}.cdx-menu--has-footer .cdx-menu__listbox>.cdx-menu-item:last-of-type:not(:first-of-type){border-top:1px solid var(--border-color-subtle,#c8ccd1)}.cdx-select{box-sizing:border-box;min-width:256px;min-height:32px;border-width:1px;border-style:solid;border-radius:2px;padding-top:4px;padding-bottom:4px;padding-left:12px;padding-right:calc(16px + 1.25rem);font-size:inherit;line-height:1.375;-webkit-appearance:none;appearance:none;background-position:center right 12px;background-repeat:no-repeat;background-size:max(.75rem,12px)}.cdx-select:disabled{background-color:var(--background-color-disabled-subtle,#eaecf0);color:var(--color-disabled,#a2a9b1);border-color:var(--border-color-disabled,#c8ccd1);background-image:url('data:image/svg+xml;utf8,<svg xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" width="20" height="20" viewBox="0 0 20 20" fill="%2372777d"><path d="m17.5 4.75-7.5 7.5-7.5-7.5L1 6.25l9 9 
9-9z"/></svg>');opacity:1}.cdx-select:enabled{background-color:var(--background-color-interactive-subtle,#f8f9fa);color:var(--color-base,#202122);border-color:var(--border-color-base,#a2a9b1);transition-property:background-color,color,border-color,box-shadow;transition-duration:.1s;background-image:url('data:image/svg+xml;utf8,<svg xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" width="20" height="20" viewBox="0 0 20 20" fill="%23202122"><path d="m17.5 4.75-7.5 7.5-7.5-7.5L1 6.25l9 9 9-9z"/></svg>')}.cdx-select:enabled:hover{background-color:var(--background-color-base,#fff);color:var(--color-base--hover,#404244);border-color:var(--border-color-base,#a2a9b1);cursor:pointer}.cdx-select:enabled:focus{border-color:var(--border-color-progressive--focus,#36c);box-shadow:inset 0 0 0 1px var(--box-shadow-color-progressive--focus,#36c);outline:1px solid transparent}.cdx-select:enabled:active{color:var(--color-emphasized,#101418);border-color:var(--border-color-interactive,#72777d)}.cdx-select-vue{display:inline-block;position:relative}.cdx-select-vue__handle{box-sizing:border-box;min-width:256px;min-height:32px;border-width:1px;border-style:solid;border-radius:2px;padding-top:4px;padding-bottom:4px;padding-left:12px;padding-right:calc(16px + 1.25rem);font-size:inherit;line-height:1.375;position:relative;width:100%}.cdx-select-vue--has-start-icon .cdx-select-vue__handle{padding-left:calc(20px + 1.25rem)}.cdx-select-vue__start-icon.cdx-icon{position:absolute;top:50%;min-width:20px;min-height:20px;width:1.25rem;height:1.25rem;transition-property:color;transition-duration:.1s;left:12px;transform:translateY(-50%)}.cdx-select-vue__indicator.cdx-icon{color:var(--color-base,#202122);position:absolute;top:50%;min-width:12px;min-height:12px;width:.75rem;height:.75rem;transition-property:color;transition-duration:.1s;right:12px;transform:translateY(-50%)}.cdx-select-vue--enabled 
.cdx-select-vue__handle{background-color:var(--background-color-interactive-subtle,#f8f9fa);color:var(--color-base,#202122);border-color:var(--border-color-base,#a2a9b1);transition-property:background-color,color,border-color,box-shadow;transition-duration:.1s}.cdx-select-vue--enabled .cdx-select-vue__handle:hover{background-color:var(--background-color-base,#fff);color:var(--color-base--hover,#404244);border-color:var(--border-color-base,#a2a9b1);cursor:pointer}.cdx-select-vue--enabled .cdx-select-vue__handle:focus{border-color:var(--border-color-progressive--focus,#36c);box-shadow:inset 0 0 0 1px var(--box-shadow-color-progressive--focus,#36c);outline:1px solid transparent}.cdx-select-vue--enabled .cdx-select-vue__handle:active{color:var(--color-emphasized,#101418);border-color:var(--border-color-interactive,#72777d)}.cdx-select-vue--enabled .cdx-select-vue__handle:hover .cdx-select-vue__indicator{color:var(--color-base--hover,#404244)}.cdx-select-vue--enabled.cdx-select-vue--expanded .cdx-select-vue__handle{background-color:var(--background-color-base,#fff)}.cdx-select-vue--enabled.cdx-select-vue--expanded .cdx-select-vue__handle .cdx-select-vue__indicator{color:var(--color-base,#202122)}.cdx-select-vue--disabled .cdx-select-vue__handle{background-color:var(--background-color-disabled-subtle,#eaecf0);color:var(--color-disabled,#a2a9b1);border-color:var(--border-color-disabled,#c8ccd1);cursor:default}.cdx-select-vue--disabled .cdx-select-vue__indicator,.cdx-select-vue--disabled .cdx-select-vue__start-icon{color:var(--color-disabled,#a2a9b1)}.cdx-select-vue--status-error.cdx-select-vue--enabled .cdx-select-vue__handle{border-color:var(--border-color-error,#f54739)}.cdx-select-vue--status-error.cdx-select-vue--enabled .cdx-select-vue__handle:hover{border-color:var(--border-color-error--hover,#d74032)}.cdx-select-vue--status-error.cdx-select-vue--enabled .cdx-select-vue__handle:focus{border-color:var(--border-color-progressive--focus,#36c)}.cdx-dialog 
.cdx-select-vue{position:static}.cdx-tab[aria-hidden=true]{display:none}.cdx-tab:focus{outline:1px solid transparent}.cdx-tabs__header{display:flex;align-items:flex-end;position:relative}.cdx-tabs__prev-scroller,.cdx-tabs__next-scroller{background-color:inherit;position:absolute;top:0;bottom:0}.cdx-tabs__prev-scroller{left:0}.cdx-tabs__next-scroller{right:0}.cdx-tabs__prev-scroller:after,.cdx-tabs__next-scroller:before{content:"";position:absolute;top:0;z-index:1;width:1.5rem;height:100%;pointer-events:none}.cdx-tabs__prev-scroller:after{left:100%}.cdx-tabs__next-scroller:before{right:100%}.cdx-tabs__scroll-button.cdx-button{height:100%}.cdx-tabs__list{display:flex;overflow-x:auto;scrollbar-width:none;-webkit-overflow-scrolling:touch}.cdx-tabs__list::-webkit-scrollbar{-webkit-appearance:none;display:none}.cdx-tabs__list__item{background-color:var(--background-color-transparent,transparent);display:block;flex:0 0 auto;max-width:16rem;border-width:0;border-top-left-radius:2px;border-top-right-radius:2px;padding:4px 12px;font-size:1rem;font-weight:700;line-height:1.4285714;text-decoration:none;overflow:hidden;text-overflow:ellipsis;white-space:nowrap;transition-property:background-color,color,border-color,box-shadow;transition-duration:.1s}.cdx-tabs__list__item:hover{cursor:pointer}.cdx-tabs__list__item[aria-selected=true]{cursor:default}.cdx-tabs>.cdx-tabs__header .cdx-tabs__list__item+.cdx-tabs__list__item{margin-left:0}.cdx-tabs--framed>.cdx-tabs__header{background-color:var(--background-color-interactive,#eaecf0)}.cdx-tabs--framed>.cdx-tabs__header .cdx-tabs__prev-scroller:after{background-image:linear-gradient(to right,var(--background-color-interactive,#eaecf0) 0,var(--background-color-transparent,transparent) 100%)}.cdx-tabs--framed>.cdx-tabs__header .cdx-tabs__next-scroller:before{background-image:linear-gradient(to left,var(--background-color-interactive,#eaecf0) 0,var(--background-color-transparent,transparent) 100%)}.cdx-tabs--framed>.cdx-tabs__header 
.cdx-tabs__list__item{color:var(--color-base,#202122);margin:8px 4px 0 8px}.cdx-tabs--framed>.cdx-tabs__header .cdx-tabs__list__item:enabled{overflow:hidden}.cdx-tabs--framed>.cdx-tabs__header .cdx-tabs__list__item:enabled:hover{background-color:var(--background-color-tab-list-item-framed--hover,rgba(255,255,255,.3));color:var(--color-base,#202122)}.cdx-tabs--framed>.cdx-tabs__header .cdx-tabs__list__item:enabled:active{background-color:var(--background-color-tab-list-item-framed--active,rgba(255,255,255,.65));color:var(--color-base,#202122)}.cdx-tabs--framed>.cdx-tabs__header .cdx-tabs__list__item[aria-selected=true],.cdx-tabs--framed>.cdx-tabs__header .cdx-tabs__list__item[aria-selected=true]:hover{background-color:var(--background-color-base,#fff);color:var(--color-base,#202122)}.cdx-tabs--framed>.cdx-tabs__header .cdx-tabs__list__item:disabled{background-color:var(--background-color-interactive,#eaecf0);color:var(--color-disabled,#a2a9b1);cursor:default}.cdx-tabs--framed>.cdx-tabs__header .cdx-tabs__list__item:last-child{margin-right:8px}.cdx-tabs:not(.cdx-tabs--framed)>.cdx-tabs__header{background-color:var(--background-color-base,#fff);margin:0 4px;border-bottom:1px solid var(--border-color-base,#a2a9b1)}.cdx-tabs:not(.cdx-tabs--framed)>.cdx-tabs__header .cdx-tabs__prev-scroller:after{background-image:linear-gradient(to right,var(--background-color-base,#fff) 0,var(--background-color-transparent,transparent) 100%)}.cdx-tabs:not(.cdx-tabs--framed)>.cdx-tabs__header .cdx-tabs__next-scroller:before{background-image:linear-gradient(to left,var(--background-color-base,#fff) 0,var(--background-color-transparent,transparent) 100%)}.cdx-tabs:not(.cdx-tabs--framed)>.cdx-tabs__header .cdx-tabs__list__item{margin:0 2px}.cdx-tabs:not(.cdx-tabs--framed)>.cdx-tabs__header .cdx-tabs__list__item:enabled{color:var(--color-base,#202122)}.cdx-tabs:not(.cdx-tabs--framed)>.cdx-tabs__header 
.cdx-tabs__list__item:enabled:hover:not([aria-selected="true"]){color:var(--color-progressive--hover,#4b77d6);box-shadow:inset 0 -2px 0 0 var(--box-shadow-color-progressive-selected--hover,#4b77d6)}.cdx-tabs:not(.cdx-tabs--framed)>.cdx-tabs__header .cdx-tabs__list__item:enabled:active:not([aria-selected="true"]){color:var(--color-progressive--active,#233566);box-shadow:inset 0 -2px 0 0 var(--box-shadow-color-progressive-selected--active,#233566)}.cdx-tabs:not(.cdx-tabs--framed)>.cdx-tabs__header .cdx-tabs__list__item[aria-selected=true]{color:var(--color-progressive,#36c);box-shadow:inset 0 -2px 0 0 var(--box-shadow-color-progressive-selected,#36c)}.cdx-tabs:not(.cdx-tabs--framed)>.cdx-tabs__header .cdx-tabs__list__item[aria-selected=true]:hover{color:var(--color-progressive,#36c)}.cdx-tabs:not(.cdx-tabs--framed)>.cdx-tabs__header .cdx-tabs__list__item:disabled{color:var(--color-disabled,#a2a9b1);cursor:default}.cdx-tabs:not(.cdx-tabs--framed)>.cdx-tabs__header .cdx-tabs__list__item:first-child{margin-left:0}.cdx-tabs:not(.cdx-tabs--framed)>.cdx-tabs__header .cdx-tabs__list__item:last-child{margin-right:0}.cdx-tabs--framed>.cdx-tabs__header .cdx-tabs__list__item:focus-visible,.cdx-tabs:not(.cdx-tabs--framed)>.cdx-tabs__header .cdx-tabs__list__item:focus-visible{box-shadow:inset 0 0 0 2px var(--border-color-progressive,#36c);outline:1px solid transparent;overflow:hidden}.cdx-text-input{position:relative;box-sizing:border-box;min-width:256px;border-radius:2px;overflow:hidden}.cdx-text-input .cdx-text-input__start-icon{position:absolute;top:50%;min-width:20px;min-height:20px;width:1.25rem;height:1.25rem;transition-property:color;transition-duration:.1s;left:9px;transform:translateY(-50%)}.cdx-text-input__icon.cdx-text-input__end-icon{min-width:16px;min-height:16px;width:1rem;height:1rem}@supports not (((-webkit-mask-image:none) or 
(mask-image:none))){.cdx-text-input__icon.cdx-text-input__end-icon{background-position:center;background-repeat:no-repeat;background-size:max(1rem,16px)}}@supports ((-webkit-mask-image:none) or (mask-image:none)){.cdx-text-input__icon.cdx-text-input__end-icon{-webkit-mask-size:max(1rem,16px);mask-size:max(1rem,16px);-webkit-mask-repeat:no-repeat;mask-repeat:no-repeat;-webkit-mask-position:center;mask-position:center}}.cdx-text-input__clear-icon.cdx-icon,.cdx-text-input .cdx-text-input__end-icon{position:absolute;top:50%;min-width:16px;min-height:16px;width:1rem;height:1rem;transition-property:color;transition-duration:.1s;right:9px;transform:translateY(-50%)}.cdx-text-input__clear-icon.cdx-icon:hover{cursor:pointer}.cdx-text-input__end-icon.cdx-icon+.cdx-text-input__clear-icon.cdx-icon{right:calc(17px + 1rem)}.cdx-text-input__input{display:block;box-sizing:border-box;min-height:32px;width:100%;margin:0;border-width:1px;border-style:solid;border-radius:0;padding:4px 8px;font-family:inherit;font-size:inherit;line-height:1.375}.cdx-text-input__input:enabled{background-color:var(--background-color-base,#fff);color:var(--color-base,#202122);border-color:var(--border-color-base,#a2a9b1);box-shadow:inset 0 0 0 1px 
var(--box-shadow-color-transparent,transparent);transition-property:background-color,color,border-color,box-shadow;transition-duration:.25s}.cdx-text-input__input:enabled~.cdx-text-input__icon-vue{color:var(--color-placeholder,#72777d)}.cdx-text-input__input:enabled~.cdx-text-input__icon{opacity:var(--opacity-icon-placeholder,.51)}.cdx-text-input__input:enabled:hover{border-color:var(--border-color-interactive,#72777d)}.cdx-text-input__input:enabled:focus~.cdx-text-input__icon-vue,.cdx-text-input__input:enabled.cdx-text-input__input--has-value~.cdx-text-input__icon-vue{color:var(--color-base,#202122)}.cdx-text-input__input:enabled:focus~.cdx-text-input__icon,.cdx-text-input__input:enabled.cdx-text-input__input--has-value~.cdx-text-input__icon{opacity:1}.cdx-text-input__input:enabled:focus{border-color:var(--border-color-progressive--focus,#36c);box-shadow:inset 0 0 0 1px var(--box-shadow-color-progressive--focus,#36c);outline:1px solid transparent}.cdx-text-input__input:enabled:read-only{background-color:var(--background-color-interactive-subtle,#f8f9fa)}.cdx-text-input__input:disabled{background-color:var(--background-color-disabled-subtle,#eaecf0);color:var(--color-disabled,#a2a9b1);-webkit-text-fill-color:var(--color-disabled,#a2a9b1);border-color:var(--border-color-disabled,#c8ccd1)}.cdx-text-input__input:disabled~.cdx-text-input__icon-vue{color:var(--color-disabled,#a2a9b1);pointer-events:none}.cdx-text-input__input:disabled~.cdx-text-input__icon{opacity:var(--opacity-icon-base--disabled,.51)}.cdx-text-input__input::placeholder{color:var(--color-placeholder,#72777d);opacity:1}.cdx-text-input__input::-ms-clear{display:none}.cdx-text-input__input[type=search]{-webkit-appearance:none;-moz-appearance:textfield}.cdx-text-input__input[type=search]::-webkit-search-decoration,.cdx-text-input__input[type=search]::-webkit-search-cancel-button{display:none}.cdx-text-input--has-start-icon .cdx-text-input__input{padding-left:calc(16px + 
1.25rem)}.cdx-text-input--has-end-icon .cdx-text-input__input,.cdx-text-input--clearable .cdx-text-input__input{padding-right:calc(16px + 1rem)}.cdx-text-input--has-end-icon.cdx-text-input--clearable .cdx-text-input__input{padding-right:calc(24px + 2rem)}.cdx-text-input--status-error .cdx-text-input__input:enabled{border-color:var(--border-color-error,#f54739)}.cdx-text-input--status-error .cdx-text-input__input:enabled:hover{border-color:var(--border-color-error--hover,#d74032)}.cdx-text-input--status-error .cdx-text-input__input:enabled:focus{border-color:var(--border-color-progressive--focus,#36c)}
+.ve-init-mw-progressBarWidget{height:1em;overflow:hidden;margin:0 25%}.ve-init-mw-progressBarWidget-bar{height:1em;width:0} .ve-init-mw-progressBarWidget{background-color:#fff;box-sizing:border-box;height:0.875em;border:1px solid #36c;border-radius:0.875em;box-shadow:0 1px 1px rgba(0,0,0,0.15)}.ve-init-mw-progressBarWidget-bar{background-color:#36c;height:0.875em}
+.rt-overlay{position:absolute;width:100%;font-size:calc(var(--font-size-medium,1rem) * (13 / 14));line-height:1.5em; z-index:800; top:0} .skin-vector-legacy .rt-overlay{font-size:13px}.skin-monobook .rt-overlay{font-size:12.7px}.rt-tooltip{position:absolute;max-width:27em;background:var(--background-color-base,#fff);color:var(--color-base,#202122);border:1px solid var(--border-color-subtle,#c8ccd1);border-radius:2px;box-shadow:0 20px 48px 0 rgba(0,0,0,0.2)}html.skin-theme-clientpref-night .rt-tooltip{box-shadow:0 20px 48px 0 rgba(0,0,0,1)} .rt-tooltip-above .rt-hoverArea{margin-bottom:-0.6em;padding-bottom:0.6em}.rt-tooltip-below .rt-hoverArea{margin-top:-0.7em;padding-top:0.7em}.rt-scroll{overflow-x:auto}.rt-content{padding:0.7em 0.9em;overflow-wrap:break-word}.rt-tail{ background:linear-gradient(to top right,var(--border-color-subtle,#c8ccd1) 48%,rgba(0,0,0,0) 48%);--tail-left:19px;--tail-side-width:13px}.rt-tail,.rt-tail:after{position:absolute; z-index:-1;width:var(--tail-side-width);height:var(--tail-side-width)}.rt-tail:after{content:'';background:var(--background-color-base,#fff);bottom:1px;left:1px}.rt-tooltip-above .rt-tail{transform:rotate(-45deg);transform-origin:100% 100%;bottom:0;left:var(--tail-left)}.rt-tooltip-below .rt-tail{transform:rotate(135deg);transform-origin:0 0;top:0;left:calc(var(--tail-left) + 
var(--tail-side-width))}.rt-settingsLink{background-image:url(data:image/svg+xml,%3Csvg%20xmlns%3D%22http%3A%2F%2Fwww.w3.org%2F2000%2Fsvg%22%20viewBox%3D%220%200%2024%2024%22%3E%0D%0A%20%20%20%20%3Cpath%20fill%3D%22%2354595d%22%20d%3D%22M20%2014.5v-2.9l-1.8-.3c-.1-.4-.3-.8-.6-1.4l1.1-1.5-2.1-2.1-1.5%201.1c-.5-.3-1-.5-1.4-.6L13.5%205h-2.9l-.3%201.8c-.5.1-.9.3-1.4.6L7.4%206.3%205.3%208.4l1%201.5c-.3.5-.4.9-.6%201.4l-1.7.2v2.9l1.8.3c.1.5.3.9.6%201.4l-1%201.5%202.1%202.1%201.5-1c.4.2.9.4%201.4.6l.3%201.8h3l.3-1.8c.5-.1.9-.3%201.4-.6l1.5%201.1%202.1-2.1-1.1-1.5c.3-.5.5-1%20.6-1.4l1.5-.3zM12%2016c-1.7%200-3-1.3-3-3s1.3-3%203-3%203%201.3%203%203-1.3%203-3%203z%22%2F%3E%0D%0A%3C%2Fsvg%3E);float:right;margin:-0.5em -0.5em 0 0.5em;box-sizing:border-box;height:32px;width:32px;border:1px solid transparent;border-radius:2px;background-position:center center;background-repeat:no-repeat;background-size:24px 24px}html.skin-theme-clientpref-night .rt-settingsLink{background-image:url(data:image/svg+xml,%3Csvg%20xmlns%3D%22http%3A%2F%2Fwww.w3.org%2F2000%2Fsvg%22%20viewBox%3D%220%200%2024%2024%22%3E%0D%0A%20%20%20%20%3Cpath%20fill%3D%22%23c8ccd1%22%20d%3D%22M20%2014.5v-2.9l-1.8-.3c-.1-.4-.3-.8-.6-1.4l1.1-1.5-2.1-2.1-1.5%201.1c-.5-.3-1-.5-1.4-.6L13.5%205h-2.9l-.3%201.8c-.5.1-.9.3-1.4.6L7.4%206.3%205.3%208.4l1%201.5c-.3.5-.4.9-.6%201.4l-1.7.2v2.9l1.8.3c.1.5.3.9.6%201.4l-1%201.5%202.1%202.1%201.5-1c.4.2.9.4%201.4.6l.3%201.8h3l.3-1.8c.5-.1.9-.3%201.4-.6l1.5%201.1%202.1-2.1-1.1-1.5c.3-.5.5-1%20.6-1.4l1.5-.3zM12%2016c-1.7%200-3-1.3-3-3s1.3-3%203-3%203%201.3%203%203-1.3%203-3%203z%22%2F%3E%0D%0A%3C%2Fsvg%3E)}.rt-settingsLink:hover,.rt-settingsLink:active{background-color:var(--background-color-interactive,#eaecf0)}.rt-settingsLink:active{border-color:var(--border-color-interactive,#72777d)}.rt-settingsLink:focus{outline:1px solid transparent}.rt-settingsLink:focus:not(:active){border-color:var(--border-color-progressive--focus,#36c);box-shadow:inset 0 0 0 1px 
var(--box-shadow-color-progressive--focus,#36c)}.rt-target{background-color:var(--background-color-progressive-subtle,#eaf3ff)}.rt-enableField{font-weight:bold;margin-bottom:1.25em}.rt-numberInput.rt-numberInput{width:10em}.rt-tooltipsForCommentsField.rt-tooltipsForCommentsField.rt-tooltipsForCommentsField{margin-top:1.25em}.rt-disabledHelp{border-collapse:collapse}.rt-disabledHelp td{padding:0}.rt-disabledNote.rt-disabledNote{vertical-align:bottom;padding-left:0.36em;font-weight:bold}@keyframes rt-fade-in-up{0%{opacity:0;transform:translate(0,20px)}100%{opacity:1;transform:translate(0,0)}}@keyframes rt-fade-in-down{0%{opacity:0;transform:translate(0,-20px)}100%{opacity:1;transform:translate(0,0)}}@keyframes rt-fade-out-down{0%{opacity:1;transform:translate(0,0)}100%{opacity:0;transform:translate(0,20px)}}@keyframes rt-fade-out-up{0%{opacity:1;transform:translate(0,0)}100%{opacity:0;transform:translate(0,-20px)}}.rt-fade-in-up{animation:rt-fade-in-up 0.2s ease forwards}.rt-fade-in-down{animation:rt-fade-in-down 0.2s ease forwards}.rt-fade-out-down{animation:rt-fade-out-down 0.2s ease forwards}.rt-fade-out-up{animation:rt-fade-out-up 0.2s ease forwards}
+.mw-collapsible-toggle{float:right;-webkit-user-select:none;-moz-user-select:none;user-select:none}.mw-collapsible-toggle-default{-webkit-appearance:none;-moz-appearance:none;appearance:none;background:none;margin:0;padding:0;border:0;font:inherit}.mw-collapsible-toggle-default .mw-collapsible-text{color:var(--color-progressive,#36c);border-radius:2px;text-decoration:none}.mw-collapsible-toggle-default .mw-collapsible-text:visited{color:var(--color-visited,#6a60b0)}.mw-collapsible-toggle-default .mw-collapsible-text:visited:hover{color:var(--color-visited,#6a60b0)}.mw-collapsible-toggle-default .mw-collapsible-text:hover{color:var(--color-progressive--hover,#4b77d6);text-decoration:underline}.mw-collapsible-toggle-default .mw-collapsible-text:active{color:var(--color-progressive--active,#233566);text-decoration:underline}.mw-collapsible-toggle-default .mw-collapsible-text:focus-visible{outline:solid 2px var(--outline-color-progressive--focus,#36c)}@supports not selector(:focus-visible){.mw-collapsible-toggle-default .mw-collapsible-text:focus{outline:solid 2px var(--outline-color-progressive--focus,#36c)}}.mw-collapsible-toggle-default .mw-collapsible-text .cdx-icon:not(.cdx-thumbnail__placeholder__icon--vue):last-child{min-width:12px;min-height:12px;width:1rem;height:1rem;padding-left:4px;vertical-align:middle}.mw-underline-always .mw-collapsible-toggle-default .mw-collapsible-text{text-decoration:underline}.mw-underline-never .mw-collapsible-toggle-default .mw-collapsible-text{text-decoration:none}.mw-collapsible-toggle-default::before{content:'['}.mw-collapsible-toggle-default::after{content:']'}.mw-customtoggle,.mw-collapsible-toggle{cursor:pointer} caption .mw-collapsible-toggle,.mw-content-ltr caption .mw-collapsible-toggle,.mw-content-rtl caption .mw-collapsible-toggle,.mw-content-rtl .mw-content-ltr caption .mw-collapsible-toggle,.mw-content-ltr .mw-content-rtl caption .mw-collapsible-toggle{float:none}
+@media screen {
+	.toctoggle{-webkit-user-select:none;-moz-user-select:none;user-select:none;font-size:94%}}
+@keyframes centralAuthPPersonalAnimation{0%{opacity:0;transform:translateY(-20px)}100%{opacity:1;transform:translateY(0)}}.centralAuthPPersonalAnimation{animation-duration:1s;animation-fill-mode:both;animation-name:centralAuthPPersonalAnimation}
+#mw-teleport-target{position:absolute;z-index:450}   #mw-teleport-target{font-size:0.875rem}
+#vector-appearance form{font-size:0.875rem;padding:6px 0}#vector-appearance a.skin-theme-beta-notice-success{color:var(--color-success,#177860);pointer-events:none}#vector-appearance .vector-icon.vector-icon--heart{ min-width:16px;min-height:16px;width:1rem;height:1rem;display:inline-block;vertical-align:text-bottom}@supports not ((-webkit-mask-image:none) or (mask-image:none)){#vector-appearance .vector-icon.vector-icon--heart{background-position:center;background-repeat:no-repeat;background-size:calc(max(1rem,16px))}}@supports (-webkit-mask-image:none) or (mask-image:none){#vector-appearance .vector-icon.vector-icon--heart{ -webkit-mask-size:calc(max(1rem,16px));mask-size:calc(max(1rem,16px));-webkit-mask-repeat:no-repeat;mask-repeat:no-repeat;-webkit-mask-position:center;mask-position:center; }}@supports not ((-webkit-mask-image:none) or (mask-image:none)){#vector-appearance .vector-icon.vector-icon--heart{background-image:url("data:image/svg+xml;utf8,<svg xmlns=\"http://www.w3.org/2000/svg\" xmlns:xlink=\"http://www.w3.org/1999/xlink\" width=\"20\" height=\"20\" viewBox=\"0 0 20 20\" fill=\"%23000000\"><path d=\"M14.75 1A5.24 5.24 0 0010 4 5.24 5.24 0 000 6.25C0 11.75 10 19 10 19s10-7.25 10-12.75A5.25 5.25 0 0014.75 1\"/></svg>");filter:invert(var(--filter-invert-icon,0));opacity:var(--opacity-icon-base,0.87)}.cdx-button:not(.cdx-button--weight-quiet):disabled #vector-appearance .vector-icon.vector-icon--heart,.cdx-button--weight-primary.cdx-button--action-progressive #vector-appearance .vector-icon.vector-icon--heart,.cdx-button--weight-primary.cdx-button--action-destructive #vector-appearance .vector-icon.vector-icon--heart{filter:invert(var(--filter-invert-primary-button-icon,1))}}@supports (-webkit-mask-image:none) or (mask-image:none){#vector-appearance .vector-icon.vector-icon--heart{ -webkit-mask-image:url("data:image/svg+xml;utf8,<svg xmlns=\"http://www.w3.org/2000/svg\" xmlns:xlink=\"http://www.w3.org/1999/xlink\" width=\"20\" height=\"20\" 
viewBox=\"0 0 20 20\" fill=\"%23000000\"><path d=\"M14.75 1A5.24 5.24 0 0010 4 5.24 5.24 0 000 6.25C0 11.75 10 19 10 19s10-7.25 10-12.75A5.25 5.25 0 0014.75 1\"/></svg>"); mask-image:url("data:image/svg+xml;utf8,<svg xmlns=\"http://www.w3.org/2000/svg\" xmlns:xlink=\"http://www.w3.org/1999/xlink\" width=\"20\" height=\"20\" viewBox=\"0 0 20 20\" fill=\"%23000000\"><path d=\"M14.75 1A5.24 5.24 0 0010 4 5.24 5.24 0 000 6.25C0 11.75 10 19 10 19s10-7.25 10-12.75A5.25 5.25 0 0014.75 1\"/></svg>");background-color:var(--color-success,#177860)}}#skin-theme-beta-notice{display:none}@media screen and (prefers-color-scheme:dark){html.skin-theme-clientpref-os #skin-theme-beta-notice{display:block}}html.skin-theme-clientpref-night #skin-theme-beta-notice{display:block}
+.uls-menu{border-radius:2px; font-size:medium}.uls-search,.uls-language-settings-close-block{border-top-right-radius:2px;border-top-left-radius:2px}.uls-language-list{border-bottom-right-radius:2px;border-bottom-left-radius:2px}.uls-menu.callout::before,.uls-menu.callout::after{border-top:10px solid transparent;border-bottom:10px solid transparent;display:inline-block; top:17px;position:absolute;content:''}.uls-menu.callout.selector-right::before{ border-left:10px solid #c8ccd1; right:-11px}.uls-menu.callout.selector-right::after{ border-left:10px solid #fff; right:-10px}.uls-menu.callout.selector-left::before{ border-right:10px solid #c8ccd1; left:-11px}.uls-menu.callout.selector-left::after{ border-right:10px solid #fff; left:-10px}.uls-ui-languages button{margin:5px 15px 5px 0;white-space:nowrap;overflow:hidden}.uls-search-wrapper-wrapper{position:relative;padding-left:40px;margin-top:5px;margin-bottom:5px}.uls-icon-back{background:transparent url(/w/extensions/UniversalLanguageSelector/resources/images/back-grey-ltr.svg?c9c25) no-repeat scroll center center;background-size:28px;height:32px;width:40px;display:block;position:absolute;left:0;border-right:1px solid #c8ccd1;opacity:0.87}.uls-icon-back:hover{opacity:1;cursor:pointer}.uls-menu .uls-no-results-view .uls-no-found-more{background-color:#fff}.uls-menu .uls-no-results-view h3{padding:0 28px;margin:0;color:#54595d;font-size:1em;font-weight:normal}   .skin-vector .uls-menu{border-color:#c8ccd1;box-shadow:0 2px 2px 0 rgba(0,0,0,0.2);font-size:0.875em;z-index:50}.skin-vector .uls-search{border-bottom-color:#c8ccd1}.skin-vector .uls-search-label{opacity:0.51;transition:opacity 250ms}.skin-vector .uls-search-wrapper:hover .uls-search-label{opacity:0.87}.skin-vector .uls-languagefilter,.skin-vector .uls-lcd-region-title{color:#54595d}.skin-vector .uls-filtersuggestion{color:#72777d}
+@media print{#centralNotice{display:none}}.cn-closeButton{display:inline-block;background:url(data:image/png;base64,iVBORw0KGgoAAAANSUhEUgAAABQAAAAUBAMAAAB/pwA+AAAAElBMVEUAAAAQEBDPz88AAABAQEDv7+9oe1vvAAAABnRSTlMA3rLe3rJS22KzAAAARElEQVQI12PAAUIUQCSTK5BwFgIxFU1AhKECUFAYKAAioXwwBeZChMGCEGGQIFQYJohgIhQgtCEMQ7ECYTHCOciOxA4AADgJTXIb9s8AAAAASUVORK5CYII=) no-repeat;width:20px;height:20px;text-indent:20px;white-space:nowrap;overflow:hidden}
+#uls-settings-block{background-color:#fcfcfc}#uls-settings-block.uls-settings-block--vector-2022{display:flex;justify-content:space-between;padding:8px 12px}#uls-settings-block.uls-settings-block--vector-2022.row::before,#uls-settings-block.uls-settings-block--vector-2022.row::after{content:none}#uls-settings-block.uls-settings-block--vector-2022.uls-settings-block--with-add-languages{background-color:#f8f9fa;border-top:1px solid #c8ccd1}#uls-settings-block.uls-settings-block--vector-2022 > button.uls-add-languages-button{background:transparent url(/w/extensions/UniversalLanguageSelector/resources/images/add.svg?3165e) no-repeat left center;margin-right:32px;padding-left:32px}#uls-settings-block.uls-settings-block--vector-2022 > button.uls-language-settings-button{background:transparent url(/w/extensions/UniversalLanguageSelector/resources/images/cog.svg?ce0b4) no-repeat center;margin-left:auto;border:0;min-height:20px;min-width:20px}#uls-settings-block:not(.uls-settings-block--vector-2022){background-color:#f8f9fa;border-top:1px solid #c8ccd1;padding-left:10px;line-height:1.2em;border-radius:0 0 2px 2px}#uls-settings-block:not(.uls-settings-block--vector-2022) > button{background:left top transparent no-repeat;background-size:20px auto;color:#54595d;display:inline-block;margin:8px 15px;border:0;padding:0 0 0 26px;font-size:medium;cursor:pointer}#uls-settings-block:not(.uls-settings-block--vector-2022) > button:hover{color:#202122}#uls-settings-block:not(.uls-settings-block--vector-2022) > button.display-settings-block{background-image:url(/w/extensions/UniversalLanguageSelector/resources/images/display.svg?9fd85)}#uls-settings-block:not(.uls-settings-block--vector-2022) > button.input-settings-block{background-image:url(/w/extensions/UniversalLanguageSelector/resources/images/input.svg?60384)}.uls-tipsy.uls-tipsy{z-index:1000}.uls-empty-state{padding:28px}.uls-empty-state .uls-empty-state__header,.uls-empty-state 
.uls-empty-state__desc{color:#54595d}.uls-empty-state .uls-language-action-items{list-style:none;margin:1em 0}.empty-language-selector__language-settings-button{margin:12px}.uls-menu.uls-language-actions-dialog{min-width:248px}.uls-menu.uls-language-actions-dialog .uls-language-actions-title{border-bottom:1px solid #c8ccd1;display:flex;align-items:center;height:32px;padding:5px 0}.uls-menu.uls-language-actions-dialog .uls-language-actions-title .uls-language-actions-close{min-width:unset;width:44px;background:transparent url(/w/extensions/UniversalLanguageSelector/resources/images/arrow-previous-ltr.svg?279af) no-repeat center}.uls-menu.uls-language-actions-dialog .uls-language-action-items .uls-language-action.oo-ui-widget{margin:0;padding:12px 8px;display:block}.uls-menu.uls-language-actions-dialog .uls-language-action-items .uls-language-action.oo-ui-widget .oo-ui-buttonElement-button{padding-left:36px}.mw-interlanguage-selector-disabled #p-lang-btn-sticky-header{display:none}</style><style>
+.firstHeading::before{content:url(/static/images/mobile/copyright/wikipedia-wordmark-en.svg);display:block;height:18px;left:-9999px;line-height:0;margin-bottom:20px;position:absolute;width:120px}
+.mw-wiki-logo{background-image:url(/static/images/project-logos/enwiki.png)}
+@media print{ .firstHeading::before{left:auto;position:relative}}
+@media (-webkit-min-device-pixel-ratio:1.5),(min-resolution:1.5dppx),(min-resolution:144dpi){.mw-wiki-logo{background-image:url(/static/images/project-logos/enwiki-1.5x.png);background-size:135px auto}}
+@media (-webkit-min-device-pixel-ratio:2),(min-resolution:2dppx),(min-resolution:192dpi){.mw-wiki-logo{background-image:url(/static/images/project-logos/enwiki-2x.png);background-size:135px auto}}
+.mw-ui-icon-wikimedia-expand{ min-width:20px;min-height:20px;width:1.25rem;height:1.25rem;min-width:12px;min-height:12px;width:0.75rem;height:0.75rem;display:inline-block;vertical-align:text-bottom}@supports not ((-webkit-mask-image:none) or (mask-image:none)){.mw-ui-icon-wikimedia-expand{background-position:center;background-repeat:no-repeat;background-size:calc(max(1.25rem,20px))}}@supports (-webkit-mask-image:none) or (mask-image:none){.mw-ui-icon-wikimedia-expand{ -webkit-mask-size:calc(max(1.25rem,20px));mask-size:calc(max(1.25rem,20px));-webkit-mask-repeat:no-repeat;mask-repeat:no-repeat;-webkit-mask-position:center;mask-position:center; }}@supports not ((-webkit-mask-image:none) or (mask-image:none)){.mw-ui-icon-wikimedia-expand{background-image:url("data:image/svg+xml;utf8,<svg xmlns=\"http://www.w3.org/2000/svg\" xmlns:xlink=\"http://www.w3.org/1999/xlink\" width=\"20\" height=\"20\" viewBox=\"0 0 20 20\" fill=\"%23000000\"><path d=\"m17.5 4.75-7.5 7.5-7.5-7.5L1 6.25l9 9 9-9z\"/></svg>");filter:invert(var(--filter-invert-icon,0));opacity:var(--opacity-icon-base,0.87)}.cdx-button:not(.cdx-button--weight-quiet):disabled .mw-ui-icon-wikimedia-expand,.cdx-button--weight-primary.cdx-button--action-progressive .mw-ui-icon-wikimedia-expand,.cdx-button--weight-primary.cdx-button--action-destructive .mw-ui-icon-wikimedia-expand{filter:invert(var(--filter-invert-primary-button-icon,1))}}@supports (-webkit-mask-image:none) or (mask-image:none){.mw-ui-icon-wikimedia-expand{ -webkit-mask-image:url("data:image/svg+xml;utf8,<svg xmlns=\"http://www.w3.org/2000/svg\" xmlns:xlink=\"http://www.w3.org/1999/xlink\" width=\"20\" height=\"20\" viewBox=\"0 0 20 20\" fill=\"%23000000\"><path d=\"m17.5 4.75-7.5 7.5-7.5-7.5L1 6.25l9 9 9-9z\"/></svg>"); mask-image:url("data:image/svg+xml;utf8,<svg xmlns=\"http://www.w3.org/2000/svg\" xmlns:xlink=\"http://www.w3.org/1999/xlink\" width=\"20\" height=\"20\" viewBox=\"0 0 20 20\" fill=\"%23000000\"><path d=\"m17.5 4.75-7.5 7.5-7.5-7.5L1 
6.25l9 9 9-9z\"/></svg>");background-color:var(--color-base,#202122)}}@supports not ((-webkit-mask-image:none) or (mask-image:none)){.mw-ui-icon-wikimedia-expand{background-position:center;background-repeat:no-repeat;background-size:calc(max(0.75rem,12px))}}@supports (-webkit-mask-image:none) or (mask-image:none){.mw-ui-icon-wikimedia-expand{ -webkit-mask-size:calc(max(0.75rem,12px));mask-size:calc(max(0.75rem,12px));-webkit-mask-repeat:no-repeat;mask-repeat:no-repeat;-webkit-mask-position:center;mask-position:center; }}.vector-popup-notification{font-size:0.875rem}.vector-popup-notification p{margin:0}.vector-popup-notification p:last-child{padding-bottom:0} .vector-sticky-header-container{position:fixed;top:0;left:0;right:0;z-index:3;transition:transform 250ms linear;display:none;transform:translateY(-100%);opacity:0}.vector-sticky-header{display:flex;align-items:center;justify-content:space-between;border-bottom:1px solid var(--background-color-interactive,#eaecf0)}.vector-sticky-header-start,.vector-sticky-header-end,.vector-sticky-header-icons,.vector-sticky-header-buttons,.vector-sticky-header-context-bar{display:flex;align-items:center}.vector-sticky-header-start{flex-grow:1;min-width:0}.vector-sticky-header-context-bar-primary,.vector-sticky-header-end{white-space:nowrap}.vector-sticky-header-context-bar{border-left:1px solid #c8c8c8;padding-left:30px;min-width:0;margin-left:30px}.vector-sticky-header-context-bar-primary{overflow:hidden;font-family:'Linux Libertine','Georgia','Times','Source Serif Pro',serif;font-size:1.5em;text-overflow:ellipsis}.vector-sticky-header-context-bar-primary wbr{display:none}.vector-sticky-header-buttons{font-size:0.875em}.vector-sticky-header-icons,.vector-sticky-header-buttons{column-gap:8px}.vector-sticky-header .vector-search-box{display:none}.vector-sticky-header.vector-header-search-toggled .vector-sticky-header-search-toggle,.vector-sticky-header.vector-header-search-toggled 
.vector-sticky-header-context-bar{display:none}.vector-sticky-header.vector-header-search-toggled .vector-search-box{display:block;margin-left:4px}.vector-sticky-header.vector-header-search-toggled .vector-search-box-show-thumbnail{margin-left:-9px}.vector-sticky-header.vector-header-search-toggled .vector-search-box-show-thumbnail .cdx-text-input__start-icon{color:var(--color-base,#202122)}@media (min-width:1120px){.client-js.vector-sticky-header-enabled{scroll-padding-top:calc(3.125rem + 75px)}.client-js.vector-sticky-header-enabled .vector-sticky-header-container{display:flex}.client-js.vector-sticky-header-enabled .vector-sticky-header-visible .vector-sticky-header-container{opacity:1;transform:translateY(0)}.client-js.vector-sticky-header-enabled .vector-sticky-pinned-container{top:calc(3.125rem + 24px);max-height:calc(100vh - 3.125rem - (24px * 2))}.client-js.vector-sticky-header-enabled .mw-sticky-header-element,.client-js.vector-sticky-header-enabled .charts-stickyhead th{ top:3.125rem !important}}.client-js .vector-settings{display:block;position:fixed;bottom:8px;right:8px;z-index:1}.client-js .vector-settings ul{padding:0;list-style:none;display:flex;flex-direction:column-reverse;align-items:center;gap:8px 8px}
+.mw-mmv-overlay{position:fixed;top:0;left:0;right:0;bottom:0;z-index:1000;background-color:#000;display:flex;justify-items:center;align-items:center;align-content:center;justify-content:center}.mw-mmv-overlay .cdx-progress-bar{max-width:80vw;min-width:20vw;width:20rem}body.mw-mmv-lightbox-open{overflow-y:auto;background-color:#000}body.mw-mmv-lightbox-open > *:not(.mw-notification-area-overlay){display:none}body.mw-mmv-lightbox-open > .mw-mmv-overlay{display:flex}body.mw-mmv-lightbox-open > .mw-mmv-wrapper{display:block}.mw-mmv-view-expanded .cdx-button__icon{ min-width:16px;min-height:16px;width:1rem;height:1rem;display:inline-block;vertical-align:text-bottom}@supports not ((-webkit-mask-image:none) or (mask-image:none)){.mw-mmv-view-expanded .cdx-button__icon{background-position:center;background-repeat:no-repeat;background-size:calc(max(1rem,16px))}}@supports (-webkit-mask-image:none) or (mask-image:none){.mw-mmv-view-expanded .cdx-button__icon{ -webkit-mask-size:calc(max(1rem,16px));mask-size:calc(max(1rem,16px));-webkit-mask-repeat:no-repeat;mask-repeat:no-repeat;-webkit-mask-position:center;mask-position:center; }}@supports not ((-webkit-mask-image:none) or (mask-image:none)){.mw-mmv-view-expanded .cdx-button__icon{background-image:url("data:image/svg+xml;utf8,<svg xmlns=\"http://www.w3.org/2000/svg\" xmlns:xlink=\"http://www.w3.org/1999/xlink\" width=\"20\" height=\"20\" viewBox=\"0 0 20 20\" fill=\"%23000000\"><path d=\"M3 5a2 2 0 00-2 2v10a2 2 0 002 2h14a2 2 0 002-2V7a2 2 0 00-2-2zm0 11 3.5-4.5 2.5 3 3.5-4.5 4.5 6zM16 2a2 2 0 012 2H2a2 2 0 012-2z\"/></svg>");filter:invert(var(--filter-invert-icon,0));opacity:var(--opacity-icon-base,0.87)}.cdx-button:not(.cdx-button--weight-quiet):disabled .mw-mmv-view-expanded .cdx-button__icon,.cdx-button--weight-primary.cdx-button--action-progressive .mw-mmv-view-expanded .cdx-button__icon,.cdx-button--weight-primary.cdx-button--action-destructive .mw-mmv-view-expanded 
.cdx-button__icon{filter:invert(var(--filter-invert-primary-button-icon,1))}}@supports (-webkit-mask-image:none) or (mask-image:none){.mw-mmv-view-expanded .cdx-button__icon{ -webkit-mask-image:url("data:image/svg+xml;utf8,<svg xmlns=\"http://www.w3.org/2000/svg\" xmlns:xlink=\"http://www.w3.org/1999/xlink\" width=\"20\" height=\"20\" viewBox=\"0 0 20 20\" fill=\"%23000000\"><path d=\"M3 5a2 2 0 00-2 2v10a2 2 0 002 2h14a2 2 0 002-2V7a2 2 0 00-2-2zm0 11 3.5-4.5 2.5 3 3.5-4.5 4.5 6zM16 2a2 2 0 012 2H2a2 2 0 012-2z\"/></svg>"); mask-image:url("data:image/svg+xml;utf8,<svg xmlns=\"http://www.w3.org/2000/svg\" xmlns:xlink=\"http://www.w3.org/1999/xlink\" width=\"20\" height=\"20\" viewBox=\"0 0 20 20\" fill=\"%23000000\"><path d=\"M3 5a2 2 0 00-2 2v10a2 2 0 002 2h14a2 2 0 002-2V7a2 2 0 00-2-2zm0 11 3.5-4.5 2.5 3 3.5-4.5 4.5 6zM16 2a2 2 0 012 2H2a2 2 0 012-2z\"/></svg>");transition-property:background-color;transition-duration:100ms}}
+.ve-init-mw-tempWikitextEditorWidget{border:0;padding:0;color:inherit;line-height:1.5em;width:100%;-moz-tab-size:4;tab-size:4;  }.ve-init-mw-tempWikitextEditorWidget:focus{outline:0;padding:0}.ve-init-mw-tempWikitextEditorWidget::selection{background:rgba(109,169,247,0.5); }
+.oo-ui-icon-edit,.mw-ui-icon-edit:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E edit %3C/title%3E%3Cpath d=%22m16.77 8 1.94-2a1 1 0 0 0 0-1.41l-3.34-3.3a1 1 0 0 0-1.41 0L12 3.23zM1 14.25V19h4.75l9.96-9.96-4.75-4.75z%22/%3E%3C/svg%3E")}.oo-ui-image-invert.oo-ui-icon-edit,.mw-ui-icon-edit-invert:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E edit %3C/title%3E%3Cg fill=%22%23fff%22%3E%3Cpath d=%22m16.77 8 1.94-2a1 1 0 0 0 0-1.41l-3.34-3.3a1 1 0 0 0-1.41 0L12 3.23zM1 14.25V19h4.75l9.96-9.96-4.75-4.75z%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-image-progressive.oo-ui-icon-edit,.mw-ui-icon-edit-progressive:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E edit %3C/title%3E%3Cg fill=%22%2336c%22%3E%3Cpath d=%22m16.77 8 1.94-2a1 1 0 0 0 0-1.41l-3.34-3.3a1 1 0 0 0-1.41 0L12 3.23zM1 14.25V19h4.75l9.96-9.96-4.75-4.75z%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-icon-editLock,.mw-ui-icon-editLock:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E edit lock %3C/title%3E%3Cpath d=%22M12 12a2 2 0 0 1-2-2V5.25l-9 9V19h4.75l7-7zm7-8h-.5V2.5a2.5 2.5 0 0 0-5 0V4H13a1 1 0 0 0-1 1v4a1 1 0 0 0 1 1h6a1 1 0 0 0 1-1V5a1 1 0 0 0-1-1m-3 4a1 1 0 1 1 1-1 1 1 0 0 1-1 1m1.5-4h-3V2.75C14.5 2 14.5 1 16 1s1.5 1 1.5 1.75z%22/%3E%3C/svg%3E")}.oo-ui-image-invert.oo-ui-icon-editLock,.mw-ui-icon-editLock-invert:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E edit lock %3C/title%3E%3Cg fill=%22%23fff%22%3E%3Cpath d=%22M12 12a2 2 0 0 1-2-2V5.25l-9 
9V19h4.75l7-7zm7-8h-.5V2.5a2.5 2.5 0 0 0-5 0V4H13a1 1 0 0 0-1 1v4a1 1 0 0 0 1 1h6a1 1 0 0 0 1-1V5a1 1 0 0 0-1-1m-3 4a1 1 0 1 1 1-1 1 1 0 0 1-1 1m1.5-4h-3V2.75C14.5 2 14.5 1 16 1s1.5 1 1.5 1.75z%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-image-progressive.oo-ui-icon-editLock,.mw-ui-icon-editLock-progressive:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E edit lock %3C/title%3E%3Cg fill=%22%2336c%22%3E%3Cpath d=%22M12 12a2 2 0 0 1-2-2V5.25l-9 9V19h4.75l7-7zm7-8h-.5V2.5a2.5 2.5 0 0 0-5 0V4H13a1 1 0 0 0-1 1v4a1 1 0 0 0 1 1h6a1 1 0 0 0 1-1V5a1 1 0 0 0-1-1m-3 4a1 1 0 1 1 1-1 1 1 0 0 1-1 1m1.5-4h-3V2.75C14.5 2 14.5 1 16 1s1.5 1 1.5 1.75z%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-icon-editUndo,.mw-ui-icon-editUndo:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E undo edit %3C/title%3E%3Cpath d=%22M1 14.25V19h4.75l8.33-8.33-5.27-4.23zM13 2.86V0L8 4l5 4V5h.86c2.29 0 4 1.43 4 4.29H20a6.51 6.51 0 0 0-6.14-6.43z%22/%3E%3C/svg%3E")}.oo-ui-image-invert.oo-ui-icon-editUndo,.mw-ui-icon-editUndo-invert:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E undo edit %3C/title%3E%3Cg fill=%22%23fff%22%3E%3Cpath d=%22M1 14.25V19h4.75l8.33-8.33-5.27-4.23zM13 2.86V0L8 4l5 4V5h.86c2.29 0 4 1.43 4 4.29H20a6.51 6.51 0 0 0-6.14-6.43z%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-image-progressive.oo-ui-icon-editUndo,.mw-ui-icon-editUndo-progressive:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E undo edit %3C/title%3E%3Cg fill=%22%2336c%22%3E%3Cpath d=%22M1 14.25V19h4.75l8.33-8.33-5.27-4.23zM13 2.86V0L8 4l5 4V5h.86c2.29 0 4 1.43 4 4.29H20a6.51 6.51 0 0 
0-6.14-6.43z%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-icon-link,.mw-ui-icon-link:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E link %3C/title%3E%3Cpath d=%22M4.83 15h2.91a4.9 4.9 0 0 1-1.55-2H5a3 3 0 1 1 0-6h3a3 3 0 0 1 2.82 4h2.1a5 5 0 0 0 .08-.83v-.34A4.83 4.83 0 0 0 8.17 5H4.83A4.83 4.83 0 0 0 0 9.83v.34A4.83 4.83 0 0 0 4.83 15%22/%3E%3Cpath d=%22M15.17 5h-2.91a4.9 4.9 0 0 1 1.55 2H15a3 3 0 1 1 0 6h-3a3 3 0 0 1-2.82-4h-2.1a5 5 0 0 0-.08.83v.34A4.83 4.83 0 0 0 11.83 15h3.34A4.83 4.83 0 0 0 20 10.17v-.34A4.83 4.83 0 0 0 15.17 5%22/%3E%3C/svg%3E")}.oo-ui-image-invert.oo-ui-icon-link,.mw-ui-icon-link-invert:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E link %3C/title%3E%3Cg fill=%22%23fff%22%3E%3Cpath d=%22M4.83 15h2.91a4.9 4.9 0 0 1-1.55-2H5a3 3 0 1 1 0-6h3a3 3 0 0 1 2.82 4h2.1a5 5 0 0 0 .08-.83v-.34A4.83 4.83 0 0 0 8.17 5H4.83A4.83 4.83 0 0 0 0 9.83v.34A4.83 4.83 0 0 0 4.83 15%22/%3E%3Cpath d=%22M15.17 5h-2.91a4.9 4.9 0 0 1 1.55 2H15a3 3 0 1 1 0 6h-3a3 3 0 0 1-2.82-4h-2.1a5 5 0 0 0-.08.83v.34A4.83 4.83 0 0 0 11.83 15h3.34A4.83 4.83 0 0 0 20 10.17v-.34A4.83 4.83 0 0 0 15.17 5%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-image-progressive.oo-ui-icon-link,.mw-ui-icon-link-progressive:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E link %3C/title%3E%3Cg fill=%22%2336c%22%3E%3Cpath d=%22M4.83 15h2.91a4.9 4.9 0 0 1-1.55-2H5a3 3 0 1 1 0-6h3a3 3 0 0 1 2.82 4h2.1a5 5 0 0 0 .08-.83v-.34A4.83 4.83 0 0 0 8.17 5H4.83A4.83 4.83 0 0 0 0 9.83v.34A4.83 4.83 0 0 0 4.83 15%22/%3E%3Cpath d=%22M15.17 5h-2.91a4.9 4.9 0 0 1 1.55 2H15a3 3 0 1 1 0 6h-3a3 3 0 0 1-2.82-4h-2.1a5 5 0 0 0-.08.83v.34A4.83 4.83 0 0 0 11.83 15h3.34A4.83 4.83 0 0 0 20 10.17v-.34A4.83 4.83 
0 0 0 15.17 5%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-icon-unLink,.mw-ui-icon-unLink:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E unlink %3C/title%3E%3Cpath d=%22M4.83 5A4.83 4.83 0 0 0 0 9.83v.34A4.83 4.83 0 0 0 4.83 15h2.91a4.9 4.9 0 0 1-1.55-2H5c-4 0-4-6 0-6h3q.113.002.225.012L6.215 5zm7.43 0a4.9 4.9 0 0 1 1.55 2H15c3.179.003 4.17 4.3 1.314 5.695l1.508 1.508A4.83 4.83 0 0 0 20 10.17v-.34A4.83 4.83 0 0 0 15.17 5zm-3.612.03 4.329 4.327A4.83 4.83 0 0 0 8.648 5.03M7.227 8.411C7.17 8.595 7.08 9 7.08 9c-.045.273-.08.584-.08.83v.34A4.83 4.83 0 0 0 11.83 15h3.34q.475 0 .941-.094L14.205 13H12c-2.067-.006-3.51-2.051-2.82-4zm3.755 1.36A3 3 0 0 1 10.82 11h1.389z%22/%3E%3Cpath d=%22M1.22 0 0 1.22 18.8 20l1.2-1.22z%22/%3E%3C/svg%3E")}.oo-ui-image-invert.oo-ui-icon-unLink,.mw-ui-icon-unLink-invert:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E unlink %3C/title%3E%3Cg fill=%22%23fff%22%3E%3Cpath d=%22M4.83 5A4.83 4.83 0 0 0 0 9.83v.34A4.83 4.83 0 0 0 4.83 15h2.91a4.9 4.9 0 0 1-1.55-2H5c-4 0-4-6 0-6h3q.113.002.225.012L6.215 5zm7.43 0a4.9 4.9 0 0 1 1.55 2H15c3.179.003 4.17 4.3 1.314 5.695l1.508 1.508A4.83 4.83 0 0 0 20 10.17v-.34A4.83 4.83 0 0 0 15.17 5zm-3.612.03 4.329 4.327A4.83 4.83 0 0 0 8.648 5.03M7.227 8.411C7.17 8.595 7.08 9 7.08 9c-.045.273-.08.584-.08.83v.34A4.83 4.83 0 0 0 11.83 15h3.34q.475 0 .941-.094L14.205 13H12c-2.067-.006-3.51-2.051-2.82-4zm3.755 1.36A3 3 0 0 1 10.82 11h1.389z%22/%3E%3Cpath d=%22M1.22 0 0 1.22 18.8 20l1.2-1.22z%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-image-progressive.oo-ui-icon-unLink,.mw-ui-icon-unLink-progressive:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E unlink %3C/title%3E%3Cg fill=%22%2336c%22%3E%3Cpath 
d=%22M4.83 5A4.83 4.83 0 0 0 0 9.83v.34A4.83 4.83 0 0 0 4.83 15h2.91a4.9 4.9 0 0 1-1.55-2H5c-4 0-4-6 0-6h3q.113.002.225.012L6.215 5zm7.43 0a4.9 4.9 0 0 1 1.55 2H15c3.179.003 4.17 4.3 1.314 5.695l1.508 1.508A4.83 4.83 0 0 0 20 10.17v-.34A4.83 4.83 0 0 0 15.17 5zm-3.612.03 4.329 4.327A4.83 4.83 0 0 0 8.648 5.03M7.227 8.411C7.17 8.595 7.08 9 7.08 9c-.045.273-.08.584-.08.83v.34A4.83 4.83 0 0 0 11.83 15h3.34q.475 0 .941-.094L14.205 13H12c-2.067-.006-3.51-2.051-2.82-4zm3.755 1.36A3 3 0 0 1 10.82 11h1.389z%22/%3E%3Cpath d=%22M1.22 0 0 1.22 18.8 20l1.2-1.22z%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-image-destructive.oo-ui-icon-unLink,.mw-ui-icon-unLink-destructive:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E unlink %3C/title%3E%3Cg fill=%22%23d73333%22%3E%3Cpath d=%22M4.83 5A4.83 4.83 0 0 0 0 9.83v.34A4.83 4.83 0 0 0 4.83 15h2.91a4.9 4.9 0 0 1-1.55-2H5c-4 0-4-6 0-6h3q.113.002.225.012L6.215 5zm7.43 0a4.9 4.9 0 0 1 1.55 2H15c3.179.003 4.17 4.3 1.314 5.695l1.508 1.508A4.83 4.83 0 0 0 20 10.17v-.34A4.83 4.83 0 0 0 15.17 5zm-3.612.03 4.329 4.327A4.83 4.83 0 0 0 8.648 5.03M7.227 8.411C7.17 8.595 7.08 9 7.08 9c-.045.273-.08.584-.08.83v.34A4.83 4.83 0 0 0 11.83 15h3.34q.475 0 .941-.094L14.205 13H12c-2.067-.006-3.51-2.051-2.82-4zm3.755 1.36A3 3 0 0 1 10.82 11h1.389z%22/%3E%3Cpath d=%22M1.22 0 0 1.22 18.8 20l1.2-1.22z%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-icon-linkExternal,.mw-ui-icon-linkExternal:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E external link %3C/title%3E%3Cpath d=%22M17 17H3V3h5V1H3a2 2 0 0 0-2 2v14a2 2 0 0 0 2 2h14a2 2 0 0 0 2-2v-5h-2z%22/%3E%3Cpath d=%22m11 1 3.29 3.29-5.73 5.73 1.42 1.42 5.73-5.73L19 
9V1z%22/%3E%3C/svg%3E")}.oo-ui-image-invert.oo-ui-icon-linkExternal,.mw-ui-icon-linkExternal-invert:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E external link %3C/title%3E%3Cg fill=%22%23fff%22%3E%3Cpath d=%22M17 17H3V3h5V1H3a2 2 0 0 0-2 2v14a2 2 0 0 0 2 2h14a2 2 0 0 0 2-2v-5h-2z%22/%3E%3Cpath d=%22m11 1 3.29 3.29-5.73 5.73 1.42 1.42 5.73-5.73L19 9V1z%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-image-progressive.oo-ui-icon-linkExternal,.mw-ui-icon-linkExternal-progressive:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E external link %3C/title%3E%3Cg fill=%22%2336c%22%3E%3Cpath d=%22M17 17H3V3h5V1H3a2 2 0 0 0-2 2v14a2 2 0 0 0 2 2h14a2 2 0 0 0 2-2v-5h-2z%22/%3E%3Cpath d=%22m11 1 3.29 3.29-5.73 5.73 1.42 1.42 5.73-5.73L19 9V1z%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-icon-linkSecure,.mw-ui-icon-linkSecure:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E secure link %3C/title%3E%3Cpath d=%22M16.07 8H15V5s0-5-5-5-5 5-5 5v3H3.93A1.93 1.93 0 0 0 2 9.93v8.15A1.93 1.93 0 0 0 3.93 20h12.14A1.93 1.93 0 0 0 18 18.07V9.93A1.93 1.93 0 0 0 16.07 8M7 5.5C7 4 7 2 10 2s3 2 3 3.5V8H7zM10 16a2 2 0 1 1 2-2 2 2 0 0 1-2 2%22/%3E%3C/svg%3E")}.oo-ui-image-invert.oo-ui-icon-linkSecure,.mw-ui-icon-linkSecure-invert:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E secure link %3C/title%3E%3Cg fill=%22%23fff%22%3E%3Cpath d=%22M16.07 8H15V5s0-5-5-5-5 5-5 5v3H3.93A1.93 1.93 0 0 0 2 9.93v8.15A1.93 1.93 0 0 0 3.93 20h12.14A1.93 1.93 0 0 0 18 18.07V9.93A1.93 1.93 0 0 0 16.07 8M7 5.5C7 4 7 2 10 2s3 2 3 3.5V8H7zM10 16a2 2 0 1 1 2-2 2 2 0 0 1-2 
2%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-image-progressive.oo-ui-icon-linkSecure,.mw-ui-icon-linkSecure-progressive:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E secure link %3C/title%3E%3Cg fill=%22%2336c%22%3E%3Cpath d=%22M16.07 8H15V5s0-5-5-5-5 5-5 5v3H3.93A1.93 1.93 0 0 0 2 9.93v8.15A1.93 1.93 0 0 0 3.93 20h12.14A1.93 1.93 0 0 0 18 18.07V9.93A1.93 1.93 0 0 0 16.07 8M7 5.5C7 4 7 2 10 2s3 2 3 3.5V8H7zM10 16a2 2 0 1 1 2-2 2 2 0 0 1-2 2%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-icon-redo,.mw-ui-icon-redo:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E redo %3C/title%3E%3Cpath d=%22M19 8.5 12 3v11zM12 7v3h-1c-4 0-7 2-7 6v1H1v-1c0-6 5-9 10-9z%22/%3E%3C/svg%3E")}.oo-ui-image-invert.oo-ui-icon-redo,.mw-ui-icon-redo-invert:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E redo %3C/title%3E%3Cg fill=%22%23fff%22%3E%3Cpath d=%22M19 8.5 12 3v11zM12 7v3h-1c-4 0-7 2-7 6v1H1v-1c0-6 5-9 10-9z%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-image-progressive.oo-ui-icon-redo,.mw-ui-icon-redo-progressive:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E redo %3C/title%3E%3Cg fill=%22%2336c%22%3E%3Cpath d=%22M19 8.5 12 3v11zM12 7v3h-1c-4 0-7 2-7 6v1H1v-1c0-6 5-9 10-9z%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-icon-undo,.mw-ui-icon-undo:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E undo %3C/title%3E%3Cpath d=%22M1 8.5 8 14v-4h1c4 0 7 2 7 
6v1h3v-1c0-6-5-9-10-9H8V3z%22/%3E%3C/svg%3E")}.oo-ui-image-invert.oo-ui-icon-undo,.mw-ui-icon-undo-invert:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E undo %3C/title%3E%3Cg fill=%22%23fff%22%3E%3Cpath d=%22M1 8.5 8 14v-4h1c4 0 7 2 7 6v1h3v-1c0-6-5-9-10-9H8V3z%22/%3E%3C/g%3E%3C/svg%3E")}.oo-ui-image-progressive.oo-ui-icon-undo,.mw-ui-icon-undo-progressive:before{background-image:url("data:image/svg+xml,%3Csvg xmlns=%22http://www.w3.org/2000/svg%22 width=%2220%22 height=%2220%22 viewBox=%220 0 20 20%22%3E%3Ctitle%3E undo %3C/title%3E%3Cg fill=%22%2336c%22%3E%3Cpath d=%22M1 8.5 8 14v-4h1c4 0 7 2 7 6v1h3v-1c0-6-5-9-10-9H8V3z%22/%3E%3C/g%3E%3C/svg%3E")}
+@keyframes mwe-popups-fade-in-up{0%{opacity:0;transform:translate(0,20px)}100%{opacity:1;transform:translate(0,0)}}@keyframes mwe-popups-fade-in-down{0%{opacity:0;transform:translate(0,-20px)}100%{opacity:1;transform:translate(0,0)}}@keyframes mwe-popups-fade-out-down{0%{opacity:1;transform:translate(0,0)}100%{opacity:0;transform:translate(0,20px)}}@keyframes mwe-popups-fade-out-up{0%{opacity:1;transform:translate(0,0)}100%{opacity:0;transform:translate(0,-20px)}}.mwe-popups-fade-in-up{animation:mwe-popups-fade-in-up 0.2s ease forwards}.mwe-popups-fade-in-down{animation:mwe-popups-fade-in-down 0.2s ease forwards}.mwe-popups-fade-out-down{animation:mwe-popups-fade-out-down 0.2s ease forwards}.mwe-popups-fade-out-up{animation:mwe-popups-fade-out-up 0.2s ease forwards}.popups-icon--settings{ min-width:20px;min-height:20px;width:1.25rem;height:1.25rem;display:inline-block;vertical-align:text-bottom}@supports not ((-webkit-mask-image:none) or (mask-image:none)){.popups-icon--settings{background-position:center;background-repeat:no-repeat;background-size:calc(max(1.25rem,20px))}}@supports (-webkit-mask-image:none) or (mask-image:none){.popups-icon--settings{ -webkit-mask-size:calc(max(1.25rem,20px));mask-size:calc(max(1.25rem,20px));-webkit-mask-repeat:no-repeat;mask-repeat:no-repeat;-webkit-mask-position:center;mask-position:center; }}@supports not ((-webkit-mask-image:none) or (mask-image:none)){.popups-icon--settings{background-image:url("data:image/svg+xml;utf8,<svg xmlns=\"http://www.w3.org/2000/svg\" xmlns:xlink=\"http://www.w3.org/1999/xlink\" width=\"20\" height=\"20\" viewBox=\"0 0 20 20\" fill=\"%23000000\"><g transform=\"translate(10 10)\"><path id=\"cdx-icon-settings-a\" d=\"M1.5-10h-3l-1 6.5h5m0 7h-5l1 6.5h3\"/><use xlink:href=\"%23cdx-icon-settings-a\" transform=\"rotate(45)\"/><use xlink:href=\"%23cdx-icon-settings-a\" transform=\"rotate(90)\"/><use xlink:href=\"%23cdx-icon-settings-a\" transform=\"rotate(135)\"/></g><path d=\"M10 2.5a7.5 7.5 0 000 15 7.5 
7.5 0 000-15v4a3.5 3.5 0 010 7 3.5 3.5 0 010-7\"/></svg>");filter:invert(var(--filter-invert-icon,0));opacity:var(--opacity-icon-base,0.87)}.cdx-button:not(.cdx-button--weight-quiet):disabled .popups-icon--settings,.cdx-button--weight-primary.cdx-button--action-progressive .popups-icon--settings,.cdx-button--weight-primary.cdx-button--action-destructive .popups-icon--settings{filter:invert(var(--filter-invert-primary-button-icon,1))}}@supports (-webkit-mask-image:none) or (mask-image:none){.popups-icon--settings{ -webkit-mask-image:url("data:image/svg+xml;utf8,<svg xmlns=\"http://www.w3.org/2000/svg\" xmlns:xlink=\"http://www.w3.org/1999/xlink\" width=\"20\" height=\"20\" viewBox=\"0 0 20 20\" fill=\"%23000000\"><g transform=\"translate(10 10)\"><path id=\"cdx-icon-settings-a\" d=\"M1.5-10h-3l-1 6.5h5m0 7h-5l1 6.5h3\"/><use xlink:href=\"%23cdx-icon-settings-a\" transform=\"rotate(45)\"/><use xlink:href=\"%23cdx-icon-settings-a\" transform=\"rotate(90)\"/><use xlink:href=\"%23cdx-icon-settings-a\" transform=\"rotate(135)\"/></g><path d=\"M10 2.5a7.5 7.5 0 000 15 7.5 7.5 0 000-15v4a3.5 3.5 0 010 7 3.5 3.5 0 010-7\"/></svg>"); mask-image:url("data:image/svg+xml;utf8,<svg xmlns=\"http://www.w3.org/2000/svg\" xmlns:xlink=\"http://www.w3.org/1999/xlink\" width=\"20\" height=\"20\" viewBox=\"0 0 20 20\" fill=\"%23000000\"><g transform=\"translate(10 10)\"><path id=\"cdx-icon-settings-a\" d=\"M1.5-10h-3l-1 6.5h5m0 7h-5l1 6.5h3\"/><use xlink:href=\"%23cdx-icon-settings-a\" transform=\"rotate(45)\"/><use xlink:href=\"%23cdx-icon-settings-a\" transform=\"rotate(90)\"/><use xlink:href=\"%23cdx-icon-settings-a\" transform=\"rotate(135)\"/></g><path d=\"M10 2.5a7.5 7.5 0 000 15 7.5 7.5 0 000-15v4a3.5 3.5 0 010 7 3.5 3.5 0 010-7\"/></svg>");background-color:var(--color-base,#202122)}}.popups-icon--infoFilled{ min-width:20px;min-height:20px;width:1.25rem;height:1.25rem;display:inline-block;vertical-align:text-bottom}@supports not ((-webkit-mask-image:none) or 
(mask-image:none)){.popups-icon--infoFilled{background-position:center;background-repeat:no-repeat;background-size:calc(max(1.25rem,20px))}}@supports (-webkit-mask-image:none) or (mask-image:none){.popups-icon--infoFilled{ -webkit-mask-size:calc(max(1.25rem,20px));mask-size:calc(max(1.25rem,20px));-webkit-mask-repeat:no-repeat;mask-repeat:no-repeat;-webkit-mask-position:center;mask-position:center; }}@supports not ((-webkit-mask-image:none) or (mask-image:none)){.popups-icon--infoFilled{background-image:url("data:image/svg+xml;utf8,<svg xmlns=\"http://www.w3.org/2000/svg\" xmlns:xlink=\"http://www.w3.org/1999/xlink\" width=\"20\" height=\"20\" viewBox=\"0 0 20 20\" fill=\"%23000000\"><path d=\"M10 0C4.477 0 0 4.477 0 10s4.477 10 10 10 10-4.477 10-10S15.523 0 10 0M9 5h2v2H9zm0 4h2v6H9z\"/></svg>");filter:invert(var(--filter-invert-icon,0));opacity:var(--opacity-icon-base,0.87)}.cdx-button:not(.cdx-button--weight-quiet):disabled .popups-icon--infoFilled,.cdx-button--weight-primary.cdx-button--action-progressive .popups-icon--infoFilled,.cdx-button--weight-primary.cdx-button--action-destructive .popups-icon--infoFilled{filter:invert(var(--filter-invert-primary-button-icon,1))}}@supports (-webkit-mask-image:none) or (mask-image:none){.popups-icon--infoFilled{ -webkit-mask-image:url("data:image/svg+xml;utf8,<svg xmlns=\"http://www.w3.org/2000/svg\" xmlns:xlink=\"http://www.w3.org/1999/xlink\" width=\"20\" height=\"20\" viewBox=\"0 0 20 20\" fill=\"%23000000\"><path d=\"M10 0C4.477 0 0 4.477 0 10s4.477 10 10 10 10-4.477 10-10S15.523 0 10 0M9 5h2v2H9zm0 4h2v6H9z\"/></svg>"); mask-image:url("data:image/svg+xml;utf8,<svg xmlns=\"http://www.w3.org/2000/svg\" xmlns:xlink=\"http://www.w3.org/1999/xlink\" width=\"20\" height=\"20\" viewBox=\"0 0 20 20\" fill=\"%23000000\"><path d=\"M10 0C4.477 0 0 4.477 0 10s4.477 10 10 10 10-4.477 10-10S15.523 0 10 0M9 5h2v2H9zm0 4h2v6H9z\"/></svg>");background-color:var(--color-base,#202122)}}@supports not ((-webkit-mask-image:none) or 
(mask-image:none)){.popups-icon--infoFilled:lang(ar){background-image:url("data:image/svg+xml;utf8,<svg xmlns=\"http://www.w3.org/2000/svg\" xmlns:xlink=\"http://www.w3.org/1999/xlink\" width=\"20\" height=\"20\" viewBox=\"0 0 20 20\" fill=\"%23000000\"><path d=\"M8 19a1 1 0 001 1h2a1 1 0 001-1v-1H8zm9-12a7 7 0 10-12 4.9S7 14 7 15v1a1 1 0 001 1h4a1 1 0 001-1v-1c0-1 2-3.1 2-3.1A7 7 0 0017 7\"/></svg>");filter:invert(var(--filter-invert-icon,0));opacity:var(--opacity-icon-base,0.87)}.cdx-button:not(.cdx-button--weight-quiet):disabled .popups-icon--infoFilled:lang(ar),.cdx-button--weight-primary.cdx-button--action-progressive .popups-icon--infoFilled:lang(ar),.cdx-button--weight-primary.cdx-button--action-destructive .popups-icon--infoFilled:lang(ar){filter:invert(var(--filter-invert-primary-button-icon,1))}}@supports (-webkit-mask-image:none) or (mask-image:none){.popups-icon--infoFilled:lang(ar){ -webkit-mask-image:url("data:image/svg+xml;utf8,<svg xmlns=\"http://www.w3.org/2000/svg\" xmlns:xlink=\"http://www.w3.org/1999/xlink\" width=\"20\" height=\"20\" viewBox=\"0 0 20 20\" fill=\"%23000000\"><path d=\"M8 19a1 1 0 001 1h2a1 1 0 001-1v-1H8zm9-12a7 7 0 10-12 4.9S7 14 7 15v1a1 1 0 001 1h4a1 1 0 001-1v-1c0-1 2-3.1 2-3.1A7 7 0 0017 7\"/></svg>"); mask-image:url("data:image/svg+xml;utf8,<svg xmlns=\"http://www.w3.org/2000/svg\" xmlns:xlink=\"http://www.w3.org/1999/xlink\" width=\"20\" height=\"20\" viewBox=\"0 0 20 20\" fill=\"%23000000\"><path d=\"M8 19a1 1 0 001 1h2a1 1 0 001-1v-1H8zm9-12a7 7 0 10-12 4.9S7 14 7 15v1a1 1 0 001 1h4a1 1 0 001-1v-1c0-1 2-3.1 2-3.1A7 7 0 0017 7\"/></svg>");background-color:var(--color-base,#202122)}}.popups-icon--close{ min-width:20px;min-height:20px;width:1.25rem;height:1.25rem;display:inline-block;vertical-align:text-bottom}@supports not ((-webkit-mask-image:none) or (mask-image:none)){.popups-icon--close{background-position:center;background-repeat:no-repeat;background-size:calc(max(1.25rem,20px))}}@supports (-webkit-mask-image:none) 
or (mask-image:none){.popups-icon--close{ -webkit-mask-size:calc(max(1.25rem,20px));mask-size:calc(max(1.25rem,20px));-webkit-mask-repeat:no-repeat;mask-repeat:no-repeat;-webkit-mask-position:center;mask-position:center; }}@supports not ((-webkit-mask-image:none) or (mask-image:none)){.popups-icon--close{background-image:url("data:image/svg+xml;utf8,<svg xmlns=\"http://www.w3.org/2000/svg\" xmlns:xlink=\"http://www.w3.org/1999/xlink\" width=\"20\" height=\"20\" viewBox=\"0 0 20 20\" fill=\"%23000000\"><path d=\"m4.34 2.93 12.73 12.73-1.41 1.41L2.93 4.35z\"/><path d=\"M17.07 4.34 4.34 17.07l-1.41-1.41L15.66 2.93z\"/></svg>");filter:invert(var(--filter-invert-icon,0));opacity:var(--opacity-icon-base,0.87)}.cdx-button:not(.cdx-button--weight-quiet):disabled .popups-icon--close,.cdx-button--weight-primary.cdx-button--action-progressive .popups-icon--close,.cdx-button--weight-primary.cdx-button--action-destructive .popups-icon--close{filter:invert(var(--filter-invert-primary-button-icon,1))}}@supports (-webkit-mask-image:none) or (mask-image:none){.popups-icon--close{ -webkit-mask-image:url("data:image/svg+xml;utf8,<svg xmlns=\"http://www.w3.org/2000/svg\" xmlns:xlink=\"http://www.w3.org/1999/xlink\" width=\"20\" height=\"20\" viewBox=\"0 0 20 20\" fill=\"%23000000\"><path d=\"m4.34 2.93 12.73 12.73-1.41 1.41L2.93 4.35z\"/><path d=\"M17.07 4.34 4.34 17.07l-1.41-1.41L15.66 2.93z\"/></svg>"); mask-image:url("data:image/svg+xml;utf8,<svg xmlns=\"http://www.w3.org/2000/svg\" xmlns:xlink=\"http://www.w3.org/1999/xlink\" width=\"20\" height=\"20\" viewBox=\"0 0 20 20\" fill=\"%23000000\"><path d=\"m4.34 2.93 12.73 12.73-1.41 1.41L2.93 4.35z\"/><path d=\"M17.07 4.34 4.34 17.07l-1.41-1.41L15.66 
2.93z\"/></svg>");background-color:var(--color-base,#202122)}}.popups-icon--footer{background-image:url(/w/extensions/Popups/src/ui/icons/footer-ltr.svg?9d590)}.popups-icon--preview-generic{mask-image:url(/w/extensions/Popups/src/ui/icons/sad-face-ltr.svg?d9aab);background-color:var(--color-base,#202122)}#mwe-popups-settings{z-index:1000;background-color:var(--background-color-base,#fff);width:420px;border:1px solid var(--border-color-base,#a2a9b1);box-shadow:0 2px 2px 0 rgba(0,0,0,0.2);border-radius:2px;font-size:14px}#mwe-popups-settings header{box-sizing:border-box;border-bottom:1px solid var(--border-color-subtle,#c8ccd1);position:relative;display:table;width:100%;padding:5px 7px}#mwe-popups-settings header > div{display:table-cell;width:3.25rem;vertical-align:middle;cursor:pointer}#mwe-popups-settings header h1{margin-bottom:0.6em;padding-top:0.5em;border:0;width:100%;font-family:sans-serif;font-size:18px;font-weight:bold;text-align:center}#mwe-popups-settings main#mwe-popups-settings-form{display:block;width:350px;padding:32px 0 24px;margin:0 auto}#mwe-popups-settings main#mwe-popups-settings-form p{color:var(--color-subtle,#54595d);font-size:14px;margin:16px 0 0}#mwe-popups-settings main#mwe-popups-settings-form p:first-child{margin-top:0}#mwe-popups-settings main#mwe-popups-settings-form form img{margin-right:60px}#mwe-popups-settings main#mwe-popups-settings-form form label{font-size:13px;line-height:16px;width:300px;margin-left:10px;flex-direction:column}#mwe-popups-settings main#mwe-popups-settings-form form label > span{color:var(--color-emphasized,#101418);font-size:14px;font-weight:bold;display:block;margin-bottom:5px}#mwe-popups-settings main#mwe-popups-settings-form form label::before{top:0.78125em !important}.mwe-popups-settings-help{font-size:13px;font-weight:800;margin:40px;position:relative}.mwe-popups-settings-help .popups-icon{background-size:contain;width:180px;max-width:none;height:140px;margin:0;padding:0}.mwe-popups-settings-help 
p{left:180px;bottom:20px;position:absolute}.mwe-popups{background:var(--background-color-base,#fff);position:absolute;z-index:110;box-shadow:0 30px 90px -20px rgba(0,0,0,0.3),0 0 0 1px var(--background-color-neutral,#eaecf0);padding:0;display:none;font-size:14px;line-height:20px;min-width:300px;border-radius:2px; }.mwe-popups .mwe-popups-container{color:var(--color-base,#202122);text-decoration:none}.mwe-popups .mwe-popups-container footer{padding:0 16px 16px;margin:0;position:absolute;bottom:0;pointer-events:none}.mwe-popups .mwe-popups-container footer a{pointer-events:auto}.mwe-popups .mwe-popups-settings-button{float:right;pointer-events:auto;min-width:32px !important; min-height:32px !important; }.mwe-popups .mwe-popups-extract{margin:16px;display:block;color:var(--color-base,#202122);text-decoration:none;position:relative;padding-bottom:4px}.mwe-popups .mwe-popups-extract:hover{text-decoration:none}.mwe-popups .mwe-popups-extract::after{content:' ';position:absolute;bottom:0;width:25%;height:20px;background-color:transparent;pointer-events:none}.mwe-popups .mwe-popups-extract[dir='ltr']::after{ right:0; background-image:linear-gradient(to right,rgba(255,255,255,0),#ffffff 50%)}.mwe-popups .mwe-popups-extract[dir='rtl']::after{ left:0; background-image:linear-gradient(to left,rgba(255,255,255,0),#ffffff 50%)}.mwe-popups .mwe-popups-extract p{margin:0}.mwe-popups .mwe-popups-extract ul,.mwe-popups .mwe-popups-extract ol,.mwe-popups .mwe-popups-extract li,.mwe-popups .mwe-popups-extract dl,.mwe-popups .mwe-popups-extract dd,.mwe-popups .mwe-popups-extract dt{margin-top:0;margin-bottom:0}.mwe-popups .mwe-popups-extract blockquote{margin:0;padding:0 20px}.mwe-popups svg{overflow:hidden}.mwe-popups.mwe-popups-is-tall{width:450px}.mwe-popups.mwe-popups-is-tall > div > a > svg{vertical-align:middle}.mwe-popups.mwe-popups-is-tall .mwe-popups-extract{width:215px;height:176px;overflow:hidden;float:left}.mwe-popups.mwe-popups-is-tall 
footer{left:0;right:203px}.mwe-popups.mwe-popups-is-not-tall{width:320px}.mwe-popups.mwe-popups-is-not-tall .mwe-popups-extract{min-height:50px;max-height:136px;overflow:hidden;margin-bottom:50px}.mwe-popups.mwe-popups-is-not-tall footer{left:0;right:0}.mwe-popups.mwe-popups-no-image-pointer::before{content:'';position:absolute;border:8px solid var(--border-color-transparent,transparent);border-top:0;border-bottom:8px solid rgba(0,0,0,0.07000000000000001);top:-8px;left:10px}.mwe-popups.mwe-popups-no-image-pointer::after{content:'';position:absolute;border:11px solid var(--border-color-transparent,transparent);border-top:0;border-bottom:11px solid var(--background-color-base,#fff);top:-7px;left:7px}.mwe-popups.flipped-x.mwe-popups-no-image-pointer::before{left:auto;right:10px}.mwe-popups.flipped-x.mwe-popups-no-image-pointer::after{left:auto;right:7px}.mwe-popups.mwe-popups-image-pointer::before{content:'';position:absolute;border:9px solid var(--border-color-transparent,transparent);border-top:0;border-bottom:9px solid var(--border-color-base,#a2a9b1);top:-9px;left:9px;z-index:111}.mwe-popups.mwe-popups-image-pointer::after{content:'';position:absolute;border:12px solid var(--border-color-transparent,transparent);border-top:0;border-bottom:12px solid var(--background-color-base,#fff);top:-8px;left:6px;z-index:112}.mwe-popups.mwe-popups-image-pointer.flipped-x::before{content:'';position:absolute;border:9px solid var(--border-color-transparent,transparent);border-top:0;border-bottom:9px solid var(--border-color-base,#a2a9b1);top:-9px;left:293px}.mwe-popups.mwe-popups-image-pointer.flipped-x::after{content:'';position:absolute;border:12px solid var(--border-color-transparent,transparent);border-top:0;border-bottom:12px solid var(--background-color-base,#fff);top:-8px;left:290px}.mwe-popups.mwe-popups-image-pointer > div > a > 
svg{margin-top:-8px;position:absolute;z-index:113;left:0}.mwe-popups.flipped-x.mwe-popups-is-tall{min-height:242px}.mwe-popups.flipped-x.mwe-popups-is-tall::before{content:'';position:absolute;border:9px solid var(--border-color-transparent,transparent);border-top:0;border-bottom:9px solid var(--border-color-base,#a2a9b1);top:-9px;left:420px;z-index:111}.mwe-popups.flipped-x.mwe-popups-is-tall > div > a > svg{margin:0;margin-top:-8px;margin-bottom:-7px;position:absolute;z-index:113;right:0}.mwe-popups.flipped-x-y::before{content:'';position:absolute;border:9px solid var(--border-color-transparent,transparent);border-bottom:0;border-top:9px solid var(--border-color-base,#a2a9b1);bottom:-9px;left:293px;z-index:111}.mwe-popups.flipped-x-y::after{content:'';position:absolute;border:12px solid var(--border-color-transparent,transparent);border-bottom:0;border-top:12px solid var(--background-color-base,#fff);bottom:-8px;left:290px;z-index:112}.mwe-popups.flipped-x-y.mwe-popups-is-tall{min-height:242px}.mwe-popups.flipped-x-y.mwe-popups-is-tall::before{content:'';position:absolute;border:9px solid var(--border-color-transparent,transparent);border-bottom:0;border-top:9px solid var(--border-color-base,#a2a9b1);bottom:-9px;left:420px}.mwe-popups.flipped-x-y.mwe-popups-is-tall::after{content:'';position:absolute;border:12px solid var(--border-color-transparent,transparent);border-bottom:0;border-top:12px solid var(--background-color-base,#fff);bottom:-8px;left:417px}.mwe-popups.flipped-x-y.mwe-popups-is-tall > div > a > svg{margin:0;margin-bottom:-9px;position:absolute;z-index:113;right:0}.mwe-popups.flipped-y::before{content:'';position:absolute;border:8px solid var(--border-color-transparent,transparent);border-bottom:0;border-top:8px solid var(--border-color-base,#a2a9b1);bottom:-8px;left:10px}.mwe-popups.flipped-y::after{content:'';position:absolute;border:11px solid var(--border-color-transparent,transparent);border-bottom:0;border-top:11px solid 
var(--background-color-base,#fff);bottom:-7px;left:7px}.mwe-popups-is-tall polyline{transform:translate(0,0)}.mwe-popups-is-tall.flipped-x-y polyline{transform:translate(0,-8px)}.mwe-popups-is-tall.flipped-x polyline{transform:translate(0,8px)}.rtl .mwe-popups-is-tall polyline{transform:translate(-100%,0)}.rtl .mwe-popups-is-tall.flipped-x-y polyline{transform:translate(-100%,-8px)}.rtl .mwe-popups-is-tall.flipped-x polyline{transform:translate(-100%,8px)}@supports (clip-path:polygon(1px 1px)){.mwe-popups .mwe-popups-thumbnail{display:block;object-fit:cover;outline:1px solid rgba(0,0,0,0.1)}.mwe-popups.flipped-y .mwe-popups-container,.mwe-popups.flipped-x-y .mwe-popups-container{--y1:100%;--y2:calc(100% - var(--pointer-height));--y3:calc(100% - var(--pointer-height) - var(--pseudo-radius));--y4:var(--pseudo-radius);--y5:0;margin-bottom:calc(var(--pointer-height) * -1);padding-bottom:var(--pointer-height)}.mwe-popups:not(.flipped-y):not(.flipped-x-y) .mwe-popups-container{margin-top:calc(var(--pointer-height) * -1);padding-top:var(--pointer-height)}.mwe-popups .mwe-popups-discreet{margin-top:calc(var(--pointer-height) * -1)}.mwe-popups.mwe-popups-is-tall.flipped-y .mwe-popups-discreet,.mwe-popups.mwe-popups-is-tall.flipped-x-y .mwe-popups-discreet{margin-top:0;margin-bottom:calc(var(--pointer-height) * -1)}.mwe-popups .mwe-popups-container{--x1:0;--x2:var(--pseudo-radius);--x3:calc(var(--pointer-offset) - (var(--pointer-width) / 2));--x4:var(--pointer-offset);--x5:calc(var(--pointer-offset) + (var(--pointer-width) / 2));--x6:calc(100% - var(--pseudo-radius));--x7:100%;--y1:0;--y2:var(--pointer-height);--y3:calc(var(--pointer-height) + var(--pseudo-radius));--y4:calc(100% - var(--pseudo-radius));--y5:100%;padding-top:0;display:flex;background:var(--background-color-base,#fff);--pseudo-radius:2px;--pointer-height:8px;--pointer-width:16px;--pointer-offset:26px;clip-path:polygon(var(--x2) var(--y2),var(--x3) var(--y2),var(--x4) var(--y1),var(--x5) var(--y2),var(--x6) 
var(--y2),var(--x7) var(--y3),var(--x7) var(--y4),var(--x6) var(--y5),var(--x2) var(--y5),var(--x1) var(--y4),var(--x1) var(--y3))}.mwe-popups.mwe-popups-is-tall{flex-direction:row}.mwe-popups.mwe-popups-is-tall .mwe-popups-discreet{order:1}.mwe-popups.mwe-popups-is-tall .mwe-popups-discreet .mwe-popups-thumbnail{width:203px;box-sizing:border-box;height:250px}.mwe-popups.mwe-popups-is-not-tall .mwe-popups-thumbnail{width:320px;height:192px}.mwe-popups.mwe-popups-is-not-tall .mwe-popups-container{flex-direction:column}.mwe-popups::before{display:none}.mwe-popups::after{display:none}body.ltr .mwe-popups.flipped-x .mwe-popups-container,body.ltr .mwe-popups.flipped-x-y .mwe-popups-container,body.rtl .mwe-popups:not(.flipped-x):not(.flipped-x-y) .mwe-popups-container{--x3:calc(100% - var(--pointer-offset) - (var(--pointer-width) / 2));--x4:calc(100% - var(--pointer-offset));--x5:calc(100% - var(--pointer-offset) + (var(--pointer-width) / 2))}}@media screen{html.skin-theme-clientpref-night .mwe-popups.mwe-popups-no-image-pointer::before{content:'';position:absolute;border:8px solid var(--border-color-transparent,transparent);border-top:0;border-bottom:8px solid rgba(255,255,255,0.07000000000000001);top:-8px;left:10px}html.skin-theme-clientpref-night .mwe-popups-extract[dir='ltr']::after{ background-image:linear-gradient(to right,transparent,var(--background-color-base,#fff) 50%)}html.skin-theme-clientpref-night .mwe-popups-extract[dir='rtl']::after{ background-image:linear-gradient(to left,transparent,var(--background-color-base,#fff) 50%)}@supports (clip-path:polygon(1px 1px)){html.skin-theme-clientpref-night .mwe-popups .mwe-popups-thumbnail{background-color:#c8ccd1}}}@media screen and (prefers-color-scheme:dark){html.skin-theme-clientpref-os .mwe-popups.mwe-popups-no-image-pointer::before{content:'';position:absolute;border:8px solid var(--border-color-transparent,transparent);border-top:0;border-bottom:8px solid 
rgba(255,255,255,0.07000000000000001);top:-8px;left:10px}html.skin-theme-clientpref-os .mwe-popups-extract[dir='ltr']::after{ background-image:linear-gradient(to right,transparent,var(--background-color-base,#fff) 50%)}html.skin-theme-clientpref-os .mwe-popups-extract[dir='rtl']::after{ background-image:linear-gradient(to left,transparent,var(--background-color-base,#fff) 50%)}@supports (clip-path:polygon(1px 1px)){html.skin-theme-clientpref-os .mwe-popups .mwe-popups-thumbnail{background-color:#c8ccd1}}}.mwe-popups .mwe-popups-title{display:block;margin-bottom:12px}.mwe-popups-type-generic.mwe-popups .mwe-popups-title{font-weight:normal;margin:0}.mwe-popups .mwe-popups-title .popups-icon,.mwe-popups .mw-parser-output .popups-icon{margin:0 8px 0 0}.mwe-popups.mwe-popups-type-generic .mwe-popups-extract,.mwe-popups.mwe-popups-type-disambiguation .mwe-popups-extract{min-height:auto}.mwe-popups.mwe-popups-type-generic .mwe-popups-read-link,.mwe-popups.mwe-popups-type-disambiguation .mwe-popups-read-link{font-weight:bold;font-size:12px;text-decoration:none}.mwe-popups.mwe-popups-type-generic .mwe-popups-extract:hover + footer .mwe-popups-read-link,.mwe-popups.mwe-popups-type-disambiguation .mwe-popups-extract:hover + footer .mwe-popups-read-link,.mwe-popups.mwe-popups-type-generic .mwe-popups-read-link:hover,.mwe-popups.mwe-popups-type-disambiguation .mwe-popups-read-link:hover{text-decoration:underline}.mwe-popups-overlay{background-color:rgba(255,255,255,0.9);z-index:999;position:fixed;height:100%;width:100%;top:0;bottom:0;left:0;right:0;display:flex;justify-content:center;align-items:center}#mwe-popups-svg{position:absolute;top:-1000px}.popups-icon{min-width:20px;min-height:20px;width:1.25rem;height:1.25rem;display:inline-block;vertical-align:text-bottom}@supports not ((-webkit-mask-image:none) or (mask-image:none)){.popups-icon{background-position:center;background-repeat:no-repeat;background-size:calc(max(1.25rem,20px))}}@supports (-webkit-mask-image:none) or 
(mask-image:none){.popups-icon{ -webkit-mask-size:calc(max(1.25rem,20px));mask-size:calc(max(1.25rem,20px));-webkit-mask-repeat:no-repeat;mask-repeat:no-repeat;-webkit-mask-position:center;mask-position:center; }}.popups-icon--size-small{min-width:16px;min-height:16px;width:1rem;height:1rem}@supports not ((-webkit-mask-image:none) or (mask-image:none)){.popups-icon--size-small{background-position:center;background-repeat:no-repeat;background-size:calc(max(1rem,16px))}}@supports (-webkit-mask-image:none) or (mask-image:none){.popups-icon--size-small{ -webkit-mask-size:calc(max(1rem,16px));mask-size:calc(max(1rem,16px));-webkit-mask-repeat:no-repeat;mask-repeat:no-repeat;-webkit-mask-position:center;mask-position:center; }}.mwe-popups-overlay .cdx-button.cdx-button--icon-only span + span,.mwe-popups .cdx-button.cdx-button--icon-only span + span{display:block;position:absolute !important; clip:rect(1px,1px,1px,1px);width:1px;height:1px;margin:-1px;border:0;padding:0;overflow:hidden}.cdx-button{display:inline-flex;align-items:center;justify-content:center;gap:4px;box-sizing:border-box;min-height:32px;max-width:28rem;margin:0;border-width:1px;border-style:solid;border-radius:2px;padding-right:11px;padding-left:11px;font-family:inherit;font-size:inherit;font-weight:700;overflow:hidden;text-overflow:ellipsis;white-space:nowrap;text-transform:none;transition-property:background-color,color,border-color,box-shadow;transition-duration:.1s}.cdx-button--size-large{min-height:44px;padding-right:15px;padding-left:15px}.cdx-button--icon-only{min-width:32px;padding-right:5px;padding-left:5px}.cdx-button--icon-only.cdx-button--size-large{min-width:44px;padding-right:11px;padding-left:11px}.cdx-button::-moz-focus-inner{border:0;padding:0}.cdx-button .cdx-button__icon,.cdx-button .cdx-icon{vertical-align:middle}.cdx-button 
.cdx-icon{color:inherit}.cdx-button--fake-button,.cdx-button--fake-button:hover,.cdx-button--fake-button:focus{text-decoration:none}.cdx-button:enabled,.cdx-button.cdx-button--fake-button--enabled{background-color:var(--background-color-interactive-subtle,#f8f9fa);color:var(--color-base,#202122);border-color:var(--border-color-base,#a2a9b1)}@supports ((-webkit-mask-image:none) or (mask-image:none)){.cdx-button:enabled .cdx-button__icon,.cdx-button.cdx-button--fake-button--enabled .cdx-button__icon{background-color:var(--color-base,#202122)}}.cdx-button:enabled:hover,.cdx-button.cdx-button--fake-button--enabled:hover{background-color:var(--background-color-base,#fff);color:var(--color-base--hover,#404244);cursor:pointer}@supports ((-webkit-mask-image:none) or (mask-image:none)){.cdx-button:enabled:hover .cdx-button__icon,.cdx-button.cdx-button--fake-button--enabled:hover .cdx-button__icon{background-color:var(--color-base--hover,#404244)}}.cdx-button:enabled:active,.cdx-button.cdx-button--fake-button--enabled:active,.cdx-button:enabled.cdx-button--is-active,.cdx-button.cdx-button--fake-button--enabled.cdx-button--is-active{background-color:var(--background-color-interactive,#eaecf0);color:var(--color-emphasized,#101418);border-color:var(--border-color-interactive,#72777d)}@supports ((-webkit-mask-image:none) or (mask-image:none)){.cdx-button:enabled:active .cdx-button__icon,.cdx-button.cdx-button--fake-button--enabled:active .cdx-button__icon,.cdx-button:enabled.cdx-button--is-active .cdx-button__icon,.cdx-button.cdx-button--fake-button--enabled.cdx-button--is-active .cdx-button__icon{background-color:var(--color-emphasized,#101418)}}.cdx-button:enabled:focus,.cdx-button.cdx-button--fake-button--enabled:focus{outline:1px solid 
transparent}.cdx-button:enabled:focus:not(:active):not(.cdx-button--is-active),.cdx-button.cdx-button--fake-button--enabled:focus:not(:active):not(.cdx-button--is-active){border-color:var(--border-color-progressive--focus,#36c);box-shadow:inset 0 0 0 1px var(--box-shadow-color-progressive--focus,#36c)}.cdx-button:enabled.cdx-button--action-progressive,.cdx-button.cdx-button--fake-button--enabled.cdx-button--action-progressive{color:var(--color-progressive,#36c)}@supports ((-webkit-mask-image:none) or (mask-image:none)){.cdx-button:enabled.cdx-button--action-progressive .cdx-button__icon,.cdx-button.cdx-button--fake-button--enabled.cdx-button--action-progressive .cdx-button__icon{background-color:var(--color-progressive,#36c)}}.cdx-button:enabled.cdx-button--action-progressive:hover,.cdx-button.cdx-button--fake-button--enabled.cdx-button--action-progressive:hover{color:var(--color-progressive--hover,#4b77d6);border-color:var(--border-color-progressive--hover,#4b77d6)}@supports ((-webkit-mask-image:none) or (mask-image:none)){.cdx-button:enabled.cdx-button--action-progressive:hover .cdx-button__icon,.cdx-button.cdx-button--fake-button--enabled.cdx-button--action-progressive:hover .cdx-button__icon{background-color:var(--color-progressive--hover,#4b77d6)}}.cdx-button:enabled.cdx-button--action-progressive:active,.cdx-button.cdx-button--fake-button--enabled.cdx-button--action-progressive:active,.cdx-button:enabled.cdx-button--action-progressive.cdx-button--is-active,.cdx-button.cdx-button--fake-button--enabled.cdx-button--action-progressive.cdx-button--is-active{background-color:var(--background-color-progressive-subtle,#f1f4fd);color:var(--color-progressive--active,#233566);border-color:var(--border-color-progressive--active,#233566)}@supports ((-webkit-mask-image:none) or (mask-image:none)){.cdx-button:enabled.cdx-button--action-progressive:active .cdx-button__icon,.cdx-button.cdx-button--fake-button--enabled.cdx-button--action-progressive:active 
.cdx-button__icon,.cdx-button:enabled.cdx-button--action-progressive.cdx-button--is-active .cdx-button__icon,.cdx-button.cdx-button--fake-button--enabled.cdx-button--action-progressive.cdx-button--is-active .cdx-button__icon{background-color:var(--color-progressive--active,#233566)}}.cdx-button:enabled.cdx-button--action-destructive,.cdx-button.cdx-button--fake-button--enabled.cdx-button--action-destructive{color:var(--color-destructive,#bf3c2c)}@supports ((-webkit-mask-image:none) or (mask-image:none)){.cdx-button:enabled.cdx-button--action-destructive .cdx-button__icon,.cdx-button.cdx-button--fake-button--enabled.cdx-button--action-destructive .cdx-button__icon{background-color:var(--color-destructive,#bf3c2c)}}.cdx-button:enabled.cdx-button--action-destructive:hover,.cdx-button.cdx-button--fake-button--enabled.cdx-button--action-destructive:hover{color:var(--color-destructive--hover,#f54739);border-color:var(--border-color-destructive--hover,#f54739)}@supports ((-webkit-mask-image:none) or (mask-image:none)){.cdx-button:enabled.cdx-button--action-destructive:hover .cdx-button__icon,.cdx-button.cdx-button--fake-button--enabled.cdx-button--action-destructive:hover .cdx-button__icon{background-color:var(--color-destructive--hover,#f54739)}}.cdx-button:enabled.cdx-button--action-destructive:active,.cdx-button.cdx-button--fake-button--enabled.cdx-button--action-destructive:active,.cdx-button:enabled.cdx-button--action-destructive.cdx-button--is-active,.cdx-button.cdx-button--fake-button--enabled.cdx-button--action-destructive.cdx-button--is-active{background-color:var(--background-color-destructive-subtle,#ffe9e5);color:var(--color-destructive--active,#9f3526);border-color:var(--border-color-destructive--active,#9f3526)}@supports ((-webkit-mask-image:none) or (mask-image:none)){.cdx-button:enabled.cdx-button--action-destructive:active .cdx-button__icon,.cdx-button.cdx-button--fake-button--enabled.cdx-button--action-destructive:active 
.cdx-button__icon,.cdx-button:enabled.cdx-button--action-destructive.cdx-button--is-active .cdx-button__icon,.cdx-button.cdx-button--fake-button--enabled.cdx-button--action-destructive.cdx-button--is-active .cdx-button__icon{background-color:var(--color-destructive--active,#9f3526)}}.cdx-button:enabled.cdx-button--action-destructive:focus:not(:active):not(.cdx-button--is-active),.cdx-button.cdx-button--fake-button--enabled.cdx-button--action-destructive:focus:not(:active):not(.cdx-button--is-active){border-color:var(--border-color-destructive--focus,#36c);box-shadow:inset 0 0 0 1px var(--box-shadow-color-destructive--focus,#36c)}.cdx-button:enabled.cdx-button--weight-primary.cdx-button--action-progressive,.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-primary.cdx-button--action-progressive{background-color:var(--background-color-progressive,#36c);color:var(--color-inverted-fixed,#fff);border-color:var(--border-color-progressive,#36c)}@supports ((-webkit-mask-image:none) or (mask-image:none)){.cdx-button:enabled.cdx-button--weight-primary.cdx-button--action-progressive .cdx-button__icon,.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-primary.cdx-button--action-progressive .cdx-button__icon{background-color:var(--color-inverted-fixed,#fff)}}.cdx-button:enabled.cdx-button--weight-primary.cdx-button--action-progressive:hover,.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-primary.cdx-button--action-progressive:hover{background-color:var(--background-color-progressive--hover,#4b77d6);border-color:var(--border-color-progressive--hover,#4b77d6)}@supports ((-webkit-mask-image:none) or (mask-image:none)){.cdx-button:enabled.cdx-button--weight-primary.cdx-button--action-progressive:hover .cdx-button__icon,.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-primary.cdx-button--action-progressive:hover 
.cdx-button__icon{background-color:var(--color-inverted-fixed,#fff)}}.cdx-button:enabled.cdx-button--weight-primary.cdx-button--action-progressive:active,.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-primary.cdx-button--action-progressive:active,.cdx-button:enabled.cdx-button--weight-primary.cdx-button--action-progressive.cdx-button--is-active,.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-primary.cdx-button--action-progressive.cdx-button--is-active{background-color:var(--background-color-progressive--active,#233566);border-color:var(--border-color-progressive--active,#233566)}@supports ((-webkit-mask-image:none) or (mask-image:none)){.cdx-button:enabled.cdx-button--weight-primary.cdx-button--action-progressive:active .cdx-button__icon,.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-primary.cdx-button--action-progressive:active .cdx-button__icon,.cdx-button:enabled.cdx-button--weight-primary.cdx-button--action-progressive.cdx-button--is-active .cdx-button__icon,.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-primary.cdx-button--action-progressive.cdx-button--is-active .cdx-button__icon{background-color:var(--color-inverted-fixed,#fff)}}.cdx-button:enabled.cdx-button--weight-primary.cdx-button--action-progressive:focus:not(:active):not(.cdx-button--is-active),.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-primary.cdx-button--action-progressive:focus:not(:active):not(.cdx-button--is-active){border-color:var(--border-color-progressive--focus,#36c);box-shadow:inset 0 0 0 1px var(--box-shadow-color-progressive--focus,#36c),inset 0 0 0 2px 
var(--box-shadow-color-inverted,#fff)}.cdx-button:enabled.cdx-button--weight-primary.cdx-button--action-destructive,.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-primary.cdx-button--action-destructive{background-color:var(--background-color-destructive,#bf3c2c);color:var(--color-inverted-fixed,#fff);border-color:var(--border-color-destructive,#bf3c2c)}@supports ((-webkit-mask-image:none) or (mask-image:none)){.cdx-button:enabled.cdx-button--weight-primary.cdx-button--action-destructive .cdx-button__icon,.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-primary.cdx-button--action-destructive .cdx-button__icon{background-color:var(--color-inverted-fixed,#fff)}}.cdx-button:enabled.cdx-button--weight-primary.cdx-button--action-destructive:hover,.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-primary.cdx-button--action-destructive:hover{background-color:var(--background-color-destructive--hover,#f54739);border-color:var(--border-color-destructive--hover,#f54739)}@supports ((-webkit-mask-image:none) or (mask-image:none)){.cdx-button:enabled.cdx-button--weight-primary.cdx-button--action-destructive:hover .cdx-button__icon,.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-primary.cdx-button--action-destructive:hover .cdx-button__icon{background-color:var(--color-inverted-fixed,#fff)}}.cdx-button:enabled.cdx-button--weight-primary.cdx-button--action-destructive:active,.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-primary.cdx-button--action-destructive:active,.cdx-button:enabled.cdx-button--weight-primary.cdx-button--action-destructive.cdx-button--is-active,.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-primary.cdx-button--action-destructive.cdx-button--is-active{background-color:var(--background-color-destructive--active,#9f3526);border-color:var(--border-color-destructive--active,#9f3526)}@supports ((-webkit-mask-image:none) or 
(mask-image:none)){.cdx-button:enabled.cdx-button--weight-primary.cdx-button--action-destructive:active .cdx-button__icon,.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-primary.cdx-button--action-destructive:active .cdx-button__icon,.cdx-button:enabled.cdx-button--weight-primary.cdx-button--action-destructive.cdx-button--is-active .cdx-button__icon,.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-primary.cdx-button--action-destructive.cdx-button--is-active .cdx-button__icon{background-color:var(--color-inverted-fixed,#fff)}}.cdx-button:enabled.cdx-button--weight-primary.cdx-button--action-destructive:focus:not(:active):not(.cdx-button--is-active),.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-primary.cdx-button--action-destructive:focus:not(:active):not(.cdx-button--is-active){border-color:var(--border-color-destructive--focus,#36c);box-shadow:inset 0 0 0 1px var(--box-shadow-color-destructive--focus,#36c),inset 0 0 0 2px var(--box-shadow-color-inverted,#fff)}.cdx-button:enabled.cdx-button--weight-quiet,.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-quiet{background-color:var(--background-color-transparent,transparent);border-color:var(--border-color-transparent,transparent)}.cdx-button:enabled.cdx-button--weight-quiet:hover,.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-quiet:hover{background-color:var(--background-color-button-quiet--hover,rgba(0,24,73,.027))}.cdx-button:enabled.cdx-button--weight-quiet:active,.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-quiet:active,.cdx-button:enabled.cdx-button--weight-quiet.cdx-button--is-active,.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-quiet.cdx-button--is-active{background-color:var(--background-color-button-quiet--active,rgba(0,24,73,.082));color:var(--color-emphasized,#101418);border-color:var(--border-color-interactive,#72777d)}@supports ((-webkit-mask-image:none) or 
(mask-image:none)){.cdx-button:enabled.cdx-button--weight-quiet:active .cdx-button__icon,.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-quiet:active .cdx-button__icon,.cdx-button:enabled.cdx-button--weight-quiet.cdx-button--is-active .cdx-button__icon,.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-quiet.cdx-button--is-active .cdx-button__icon{background-color:var(--color-emphasized,#101418)}}.cdx-button:enabled.cdx-button--weight-quiet.cdx-button--action-progressive,.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-quiet.cdx-button--action-progressive{color:var(--color-progressive,#36c)}@supports ((-webkit-mask-image:none) or (mask-image:none)){.cdx-button:enabled.cdx-button--weight-quiet.cdx-button--action-progressive .cdx-button__icon,.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-quiet.cdx-button--action-progressive .cdx-button__icon{background-color:var(--color-progressive,#36c)}}.cdx-button:enabled.cdx-button--weight-quiet.cdx-button--action-progressive:hover,.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-quiet.cdx-button--action-progressive:hover{background-color:var(--background-color-progressive-subtle,#f1f4fd);color:var(--color-progressive--hover,#4b77d6)}@supports ((-webkit-mask-image:none) or (mask-image:none)){.cdx-button:enabled.cdx-button--weight-quiet.cdx-button--action-progressive:hover .cdx-button__icon,.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-quiet.cdx-button--action-progressive:hover 
.cdx-button__icon{background-color:var(--color-progressive--hover,#4b77d6)}}.cdx-button:enabled.cdx-button--weight-quiet.cdx-button--action-progressive:active,.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-quiet.cdx-button--action-progressive:active,.cdx-button:enabled.cdx-button--weight-quiet.cdx-button--action-progressive.cdx-button--is-active,.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-quiet.cdx-button--action-progressive.cdx-button--is-active{background-color:var(--background-color-progressive--active,#233566);color:var(--color-inverted-fixed,#fff);border-color:var(--border-color-progressive--active,#233566)}@supports ((-webkit-mask-image:none) or (mask-image:none)){.cdx-button:enabled.cdx-button--weight-quiet.cdx-button--action-progressive:active .cdx-button__icon,.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-quiet.cdx-button--action-progressive:active .cdx-button__icon,.cdx-button:enabled.cdx-button--weight-quiet.cdx-button--action-progressive.cdx-button--is-active .cdx-button__icon,.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-quiet.cdx-button--action-progressive.cdx-button--is-active .cdx-button__icon{background-color:var(--color-inverted,#fff)}}.cdx-button:enabled.cdx-button--weight-quiet.cdx-button--action-destructive,.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-quiet.cdx-button--action-destructive{color:var(--color-destructive,#bf3c2c)}@supports ((-webkit-mask-image:none) or (mask-image:none)){.cdx-button:enabled.cdx-button--weight-quiet.cdx-button--action-destructive .cdx-button__icon,.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-quiet.cdx-button--action-destructive 
.cdx-button__icon{background-color:var(--color-destructive,#bf3c2c)}}.cdx-button:enabled.cdx-button--weight-quiet.cdx-button--action-destructive:hover,.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-quiet.cdx-button--action-destructive:hover{background-color:var(--background-color-destructive-subtle,#ffe9e5);color:var(--color-destructive--hover,#f54739)}@supports ((-webkit-mask-image:none) or (mask-image:none)){.cdx-button:enabled.cdx-button--weight-quiet.cdx-button--action-destructive:hover .cdx-button__icon,.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-quiet.cdx-button--action-destructive:hover .cdx-button__icon{background-color:var(--color-destructive--hover,#f54739)}}.cdx-button:enabled.cdx-button--weight-quiet.cdx-button--action-destructive:active,.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-quiet.cdx-button--action-destructive:active,.cdx-button:enabled.cdx-button--weight-quiet.cdx-button--action-destructive.cdx-button--is-active,.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-quiet.cdx-button--action-destructive.cdx-button--is-active{background-color:var(--background-color-destructive--active,#9f3526);color:var(--color-inverted-fixed,#fff);border-color:var(--border-color-destructive--active,#9f3526)}@supports ((-webkit-mask-image:none) or (mask-image:none)){.cdx-button:enabled.cdx-button--weight-quiet.cdx-button--action-destructive:active .cdx-button__icon,.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-quiet.cdx-button--action-destructive:active .cdx-button__icon,.cdx-button:enabled.cdx-button--weight-quiet.cdx-button--action-destructive.cdx-button--is-active .cdx-button__icon,.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-quiet.cdx-button--action-destructive.cdx-button--is-active 
.cdx-button__icon{background-color:var(--color-inverted,#fff)}}.cdx-button:enabled.cdx-button--weight-quiet.cdx-button--action-destructive:focus:not(:active):not(.cdx-button--is-active),.cdx-button.cdx-button--fake-button--enabled.cdx-button--weight-quiet.cdx-button--action-destructive:focus:not(:active):not(.cdx-button--is-active){border-color:var(--border-color-destructive--focus,#36c);box-shadow:inset 0 0 0 1px var(--box-shadow-color-destructive--focus,#36c)}.cdx-button:disabled,.cdx-button.cdx-button--fake-button--disabled{background-color:var(--background-color-disabled,#dadde3);color:var(--color-disabled-emphasized,#a2a9b1);border-color:var(--border-color-transparent,transparent)}@supports ((-webkit-mask-image:none) or (mask-image:none)){.cdx-button:disabled .cdx-button__icon,.cdx-button.cdx-button--fake-button--disabled .cdx-button__icon{background-color:var(--color-inverted,#fff)}}.cdx-button:disabled.cdx-button--weight-quiet,.cdx-button.cdx-button--fake-button--disabled.cdx-button--weight-quiet{background-color:var(--background-color-transparent,transparent);color:var(--color-disabled,#a2a9b1)}@supports ((-webkit-mask-image:none) or (mask-image:none)){.cdx-button:disabled.cdx-button--weight-quiet .cdx-button__icon,.cdx-button.cdx-button--fake-button--disabled.cdx-button--weight-quiet .cdx-button__icon{background-color:var(--color-disabled,#a2a9b1)}}.cdx-icon{color:var(--color-base,#202122);display:inline-flex;align-items:center;justify-content:center;vertical-align:text-bottom}.cdx-icon svg{fill:currentcolor;width:100%;height:100%}.cdx-icon--x-small{min-width:12px;min-height:12px;width:.75rem;height:.75rem}.cdx-icon--small{min-width:16px;min-height:16px;width:1rem;height:1rem}.cdx-icon--medium{min-width:20px;min-height:20px;width:1.25rem;height:1.25rem}.cdx-icon--flipped 
svg{transform:scaleX(-1)}.cdx-label{display:flex;flex-direction:column;line-height:1.375}.cdx-label__label__icon.cdx-icon{margin-right:4px}.cdx-label__label__text{font-weight:700}legend.cdx-label{padding:0}fieldset label.cdx-label__label .cdx-label__label__text{font-weight:400}.cdx-label:not(.cdx-label--disabled) .cdx-label__label__optional-flag,.cdx-label:not(.cdx-label--disabled) .cdx-label__description{color:var(--color-subtle,#54595d)}.cdx-label--disabled,.cdx-label--disabled .cdx-label__label__icon{color:var(--color-disabled,#a2a9b1)}.cdx-label--visually-hidden{display:block;clip:rect(1px,1px,1px,1px);position:absolute!important;width:1px;height:1px;margin:-1px;border:0;padding:0;overflow:hidden}.cdx-label:not(.cdx-label--visually-hidden){padding-bottom:8px}@media screen and (min-width:640px){.cdx-label:not(.cdx-label--visually-hidden){padding-bottom:4px}}.cdx-checkbox{position:relative;min-width:20px;min-height:20px}.cdx-checkbox__wrapper{display:flex}.cdx-checkbox:not(.cdx-checkbox--inline){display:flex;flex-direction:column;margin-bottom:12px}.cdx-checkbox:not(.cdx-checkbox--inline):last-child{margin-bottom:0}.cdx-checkbox--inline{display:inline-flex;margin-right:16px;white-space:nowrap}.cdx-checkbox--inline:last-child{margin-right:0}.cdx-checkbox__label,.cdx-checkbox__label.cdx-label{display:inline-flex;position:relative;z-index:0;padding-left:calc(1.25rem + 8px);line-height:1.4285714}.cdx-checkbox__label.cdx-label{padding-bottom:0}.cdx-checkbox__label.cdx-label .cdx-label__label__text{font-weight:400}.cdx-checkbox--inline 
.cdx-checkbox__label{display:inline}.cdx-checkbox__icon{background-color:var(--background-color-base-fixed,#fff);position:absolute;left:0;box-sizing:border-box;min-width:20px;min-height:20px;width:1.25rem;height:1.25rem;border-width:1px;border-style:solid;transition-property:background-color,color,border-color,box-shadow;transition-duration:.1s}.cdx-checkbox__input{opacity:0;position:absolute;left:0;z-index:1;min-width:20px;min-height:20px;width:1.25rem;height:1.25rem;margin:0;font-size:inherit;cursor:inherit}.cdx-checkbox:hover>.cdx-checkbox__input:enabled,.cdx-checkbox:hover>.cdx-checkbox__input:enabled~.cdx-label .cdx-label__label,.cdx-checkbox:hover>.cdx-checkbox__input:enabled~.cdx-checkbox__label:not(.cdx-label){cursor:pointer}.cdx-checkbox__custom-input:not(.cdx-checkbox__custom-input--inline){padding-top:6px;padding-left:calc(1.25rem + 8px)}.cdx-checkbox__icon{background-size:0 0;border-radius:2px}.cdx-checkbox__input:indeterminate+.cdx-checkbox__icon:before{content:" ";background-color:var(--background-color-base-fixed,#fff);position:absolute;top:calc(50% - .5px);right:3px;left:3px;height:2px}.cdx-checkbox__input:checked:not(:indeterminate)+.cdx-checkbox__icon:before{content:" ";background-image:url('data:image/svg+xml;utf8,<svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 20 20"><path fill="%23fff" d="M7 14.17L2.83 10l-1.41 1.41L7 17 19 5l-1.41-1.42z"/></svg>');background-position:center;background-repeat:no-repeat;background-size:1rem 
1rem;position:absolute;width:100%;height:100%}.cdx-checkbox__input:enabled+.cdx-checkbox__icon{border-color:var(--border-color-interactive,#72777d)}.cdx-checkbox__input:enabled:hover+.cdx-checkbox__icon{border-color:var(--border-color-progressive--hover,#4b77d6)}.cdx-checkbox__input:enabled:active+.cdx-checkbox__icon{background-color:var(--background-color-progressive--active,#233566);border-color:var(--border-color-progressive--active,#233566)}.cdx-checkbox__input:enabled:focus:not(:active)+.cdx-checkbox__icon{border-color:var(--border-color-progressive--focus,#36c);box-shadow:inset 0 0 0 1px var(--box-shadow-color-progressive--focus,#36c);outline:1px solid transparent}.cdx-checkbox__input:enabled:checked+.cdx-checkbox__icon,.cdx-checkbox__input:enabled:indeterminate+.cdx-checkbox__icon{background-color:var(--background-color-input-binary--checked,#36c);border-color:var(--border-color-progressive,#36c)}.cdx-checkbox__input:enabled:checked:hover+.cdx-checkbox__icon,.cdx-checkbox__input:enabled:indeterminate:hover+.cdx-checkbox__icon{background-color:var(--background-color-progressive--hover,#4b77d6);border-color:var(--border-color-progressive--hover,#4b77d6)}.cdx-checkbox__input:enabled:checked:active+.cdx-checkbox__icon,.cdx-checkbox__input:enabled:indeterminate:active+.cdx-checkbox__icon{background-color:var(--background-color-progressive--active,#233566);border-color:var(--border-color-progressive--active,#233566)}.cdx-checkbox__input:enabled:checked:focus:not(:active):not(:hover)+.cdx-checkbox__icon,.cdx-checkbox__input:enabled:indeterminate:focus:not(:active):not(:hover)+.cdx-checkbox__icon{background-color:var(--background-color-input-binary--checked,#36c);border-color:var(--border-color-progressive,#36c)}.cdx-checkbox__input:enabled:checked:focus:not(:active)+.cdx-checkbox__icon,.cdx-checkbox__input:enabled:indeterminate:focus:not(:active)+.cdx-checkbox__icon{box-shadow:inset 0 0 0 1px var(--box-shadow-color-progressive--focus,#36c),inset 0 0 0 2px 
var(--box-shadow-color-inverted,#fff)}.cdx-checkbox--status-error .cdx-checkbox__input:enabled+.cdx-checkbox__icon{border-color:var(--border-color-error,#f54739)}.cdx-checkbox--status-error .cdx-checkbox__input:enabled:hover+.cdx-checkbox__icon{border-color:var(--border-color-error--hover,#d74032)}.cdx-checkbox--status-error .cdx-checkbox__input:enabled:active+.cdx-checkbox__icon{background-color:var(--background-color-error--active,#bf3c2c);border-color:var(--border-color-transparent,transparent)}.cdx-checkbox--status-error .cdx-checkbox__input:enabled:focus+.cdx-checkbox__icon{border-color:var(--border-color-progressive--focus,#36c)}.cdx-checkbox--status-error .cdx-checkbox__input:enabled:checked+.cdx-checkbox__icon,.cdx-checkbox--status-error .cdx-checkbox__input:enabled:indeterminate+.cdx-checkbox__icon{background-color:var(--background-color-error,#f54739);border-color:var(--border-color-transparent,transparent)}.cdx-checkbox--status-error .cdx-checkbox__input:enabled:checked:hover+.cdx-checkbox__icon,.cdx-checkbox--status-error .cdx-checkbox__input:enabled:indeterminate:hover+.cdx-checkbox__icon{background-color:var(--background-color-error--hover,#d74032);border-color:var(--border-color-error--hover,#d74032)}.cdx-checkbox--status-error .cdx-checkbox__input:enabled:checked:active+.cdx-checkbox__icon,.cdx-checkbox--status-error .cdx-checkbox__input:enabled:indeterminate:active+.cdx-checkbox__icon{background-color:var(--background-color-error--active,#bf3c2c);border-color:var(--border-color-transparent,transparent)}.cdx-checkbox--status-error .cdx-checkbox__input:enabled:checked:focus:not(:active)+.cdx-checkbox__icon,.cdx-checkbox--status-error 
.cdx-checkbox__input:enabled:indeterminate:focus:not(:active)+.cdx-checkbox__icon{background-color:var(--background-color-error,#f54739);border-color:var(--border-color-progressive--focus,#36c)}.cdx-checkbox__input:disabled+.cdx-checkbox__icon{background-color:var(--background-color-disabled-subtle,#eaecf0);border-color:var(--border-color-disabled,#c8ccd1)}.cdx-checkbox__input:disabled:checked+.cdx-checkbox__icon,.cdx-checkbox__input:disabled:indeterminate+.cdx-checkbox__icon{background-color:var(--background-color-disabled,#dadde3);border-color:var(--border-color-transparent,transparent)}.cdx-checkbox__input:disabled:indeterminate+.cdx-checkbox__icon:before{background-color:var(--color-disabled-emphasized,#a2a9b1)}.cdx-checkbox__input:disabled~.cdx-checkbox__label,.cdx-checkbox__input:disabled~.cdx-checkbox__label.cdx-label{color:var(--color-disabled,#a2a9b1)}</style><style>
+.ve-active .ve-init-mw-desktopArticleTarget-targetContainer #siteNotice,.ve-active .mw-indicators,.ve-active #t-print,.ve-active #t-permalink,.ve-active #p-coll-print_export,.ve-active #t-cite,.ve-active .ve-init-mw-desktopArticleTarget-editableContent,.ve-active .ve-init-mw-tempWikitextEditorWidget{display:none}.ve-deactivating .ve-ui-surface{display:none}.ve-activating{ }.ve-activating .ve-ui-surface{height:0;padding:0 !important; overflow:hidden} .ve-loading .ve-init-mw-desktopArticleTarget-targetContainer > :not(.ve-init-mw-desktopArticleTarget-toolbarPlaceholder):not(.ve-init-mw-desktopArticleTarget),.ve-loading .ve-init-mw-desktopArticleTarget-originalContent,.ve-activated:not(.ve-loading) .ve-init-mw-desktopArticleTarget-uneditableContent{pointer-events:none;-webkit-user-select:none;-moz-user-select:none;-ms-user-select:none;user-select:none;opacity:0.5}.ve-activated .ve-init-mw-desktopArticleTarget-targetContainer #firstHeading{ -webkit-user-select:text;-moz-user-select:text;-ms-user-select:text;user-select:text;pointer-events:auto;cursor:text}.ve-activated .ve-init-mw-desktopArticleTarget-targetContainer #firstHeading a{ pointer-events:none}.ve-activated .ve-init-mw-desktopArticleTarget-originalContent #catlinks{cursor:pointer}.ve-activated .ve-init-mw-desktopArticleTarget-originalContent #catlinks:hover{ background:#e9f2fd}.ve-activated .ve-init-mw-desktopArticleTarget-originalContent #catlinks a{opacity:1} .ve-init-mw-desktopArticleTarget-loading-overlay{z-index:2;position:absolute;width:100%;top:1em}.ve-init-mw-desktopArticleTarget-toolbarPlaceholder{overflow:hidden;transition:height 250ms ease;height:0;padding-bottom:2px; }.ve-init-mw-desktopArticleTarget-toolbarPlaceholder-bar{transform:translateY(-100%);transition:transform 250ms ease}.ve-init-mw-desktopArticleTarget-toolbarPlaceholder-open 
.ve-init-mw-desktopArticleTarget-toolbarPlaceholder-bar{transform:translateY(0)}.ve-init-mw-desktopArticleTarget-toolbarPlaceholder-floating{transition:none}.ve-init-mw-desktopArticleTarget-toolbarPlaceholder-floating .ve-init-mw-desktopArticleTarget-toolbarPlaceholder-bar{position:fixed;top:0;z-index:1;background:var(--background-color-base,#fff)} .oo-ui-element-hidden{display:none !important; } .mw-editsection::before{content:'\200B'}.mw-editsection a{white-space:nowrap} .ve-init-mw-desktopArticleTarget-toolbarPlaceholder-bar{height:42px;border-bottom:1px solid #c8ccd1;box-shadow:0 1px 1px 0 rgba(0,0,0,0.1)}.ve-init-mw-desktopArticleTarget-toolbarPlaceholder-floating,.ve-init-mw-desktopArticleTarget-toolbarPlaceholder-open{height:42px} .ve-init-mw-desktopArticleTarget-toolbar,.ve-init-mw-desktopArticleTarget-toolbarPlaceholder,.ve-ui-overlay-local,.ve-ui-overlay-global{font-size:0.875rem}.ve-init-mw-desktopArticleTarget-toolbarPlaceholder-bar,.ve-init-mw-desktopArticleTarget-toolbar.ve-ui-toolbar > .oo-ui-toolbar-bar{box-shadow:0 2px 1px -1px rgba(0,0,0,0.1)}.ve-ui-mwSaveDialog-preview .mw-body{ }.ve-ui-mwSaveDialog-preview .mw-body .firstHeading{grid-area:titlebar}.ve-ui-mwSaveDialog-preview .mw-body .mw-body-content{grid-area:content}.ve-ui-mwSaveDialog-preview .mw-content-container{max-width:960px;margin:0 auto}.ve-init-mw-desktopArticleTarget .ve-init-mw-target-surface > .ve-ce-surface .ve-ce-attachedRootNode{min-height:15em}.ve-init-mw-desktopArticleTarget-toolbar .ve-ui-toolbarDialog-position-above.ve-ui-toolbarDialog-padded .oo-ui-window-body,.ve-init-mw-desktopArticleTarget-toolbar .ve-ui-toolbarDialog-position-below.ve-ui-toolbarDialog-padded .oo-ui-window-body{padding-left:0;padding-right:0}.ve-init-mw-desktopArticleTarget-toolbar .ve-ui-toolbarDialog-position-side.ve-ui-toolbarDialog-padded .oo-ui-window-body{padding-right:0}
+.popups-icon--reference-generic{ min-width:20px;min-height:20px;width:1.25rem;height:1.25rem;display:inline-block;vertical-align:text-bottom}@supports not ((-webkit-mask-image:none) or (mask-image:none)){.popups-icon--reference-generic{background-position:center;background-repeat:no-repeat;background-size:calc(max(1.25rem,20px))}}@supports (-webkit-mask-image:none) or (mask-image:none){.popups-icon--reference-generic{ -webkit-mask-size:calc(max(1.25rem,20px));mask-size:calc(max(1.25rem,20px));-webkit-mask-repeat:no-repeat;mask-repeat:no-repeat;-webkit-mask-position:center;mask-position:center; }}@supports not ((-webkit-mask-image:none) or (mask-image:none)){.popups-icon--reference-generic{background-image:url("data:image/svg+xml;utf8,<svg xmlns=\"http://www.w3.org/2000/svg\" xmlns:xlink=\"http://www.w3.org/1999/xlink\" width=\"20\" height=\"20\" viewBox=\"0 0 20 20\" fill=\"%23000000\"><path d=\"m15 10-2.78-2.78L9.44 10V1H5a2 2 0 00-2 2v14a2 2 0 002 2h10a2 2 0 002-2V3a2 2 0 00-2-2z\"/></svg>");filter:invert(var(--filter-invert-icon,0));opacity:var(--opacity-icon-base,0.87)}.cdx-button:not(.cdx-button--weight-quiet):disabled .popups-icon--reference-generic,.cdx-button--weight-primary.cdx-button--action-progressive .popups-icon--reference-generic,.cdx-button--weight-primary.cdx-button--action-destructive .popups-icon--reference-generic{filter:invert(var(--filter-invert-primary-button-icon,1))}}@supports (-webkit-mask-image:none) or (mask-image:none){.popups-icon--reference-generic{ -webkit-mask-image:url("data:image/svg+xml;utf8,<svg xmlns=\"http://www.w3.org/2000/svg\" xmlns:xlink=\"http://www.w3.org/1999/xlink\" width=\"20\" height=\"20\" viewBox=\"0 0 20 20\" fill=\"%23000000\"><path d=\"m15 10-2.78-2.78L9.44 10V1H5a2 2 0 00-2 2v14a2 2 0 002 2h10a2 2 0 002-2V3a2 2 0 00-2-2z\"/></svg>"); mask-image:url("data:image/svg+xml;utf8,<svg xmlns=\"http://www.w3.org/2000/svg\" xmlns:xlink=\"http://www.w3.org/1999/xlink\" width=\"20\" height=\"20\" viewBox=\"0 0 20 20\" 
fill=\"%23000000\"><path d=\"m15 10-2.78-2.78L9.44 10V1H5a2 2 0 00-2 2v14a2 2 0 002 2h10a2 2 0 002-2V3a2 2 0 00-2-2z\"/></svg>");background-color:var(--color-base,#202122)}}.popups-icon--reference-book{ min-width:20px;min-height:20px;width:1.25rem;height:1.25rem;display:inline-block;vertical-align:text-bottom}@supports not ((-webkit-mask-image:none) or (mask-image:none)){.popups-icon--reference-book{background-position:center;background-repeat:no-repeat;background-size:calc(max(1.25rem,20px))}}@supports (-webkit-mask-image:none) or (mask-image:none){.popups-icon--reference-book{ -webkit-mask-size:calc(max(1.25rem,20px));mask-size:calc(max(1.25rem,20px));-webkit-mask-repeat:no-repeat;mask-repeat:no-repeat;-webkit-mask-position:center;mask-position:center; }}@supports not ((-webkit-mask-image:none) or (mask-image:none)){.popups-icon--reference-book{background-image:url("data:image/svg+xml;utf8,<svg xmlns=\"http://www.w3.org/2000/svg\" xmlns:xlink=\"http://www.w3.org/1999/xlink\" width=\"20\" height=\"20\" viewBox=\"0 0 20 20\" fill=\"%23000000\"><path d=\"M15 2a7.65 7.65 0 00-5 2 7.65 7.65 0 00-5-2H1v15h4a7.65 7.65 0 015 2 7.65 7.65 0 015-2h4V2zm2.5 13.5H14a4.38 4.38 0 00-3 1V5s1-1.5 4-1.5h2.5z\"/><path d=\"M9 3.5h2v1H9z\"/></svg>");filter:invert(var(--filter-invert-icon,0));opacity:var(--opacity-icon-base,0.87)}.cdx-button:not(.cdx-button--weight-quiet):disabled .popups-icon--reference-book,.cdx-button--weight-primary.cdx-button--action-progressive .popups-icon--reference-book,.cdx-button--weight-primary.cdx-button--action-destructive .popups-icon--reference-book{filter:invert(var(--filter-invert-primary-button-icon,1))}}@supports (-webkit-mask-image:none) or (mask-image:none){.popups-icon--reference-book{ -webkit-mask-image:url("data:image/svg+xml;utf8,<svg xmlns=\"http://www.w3.org/2000/svg\" xmlns:xlink=\"http://www.w3.org/1999/xlink\" width=\"20\" height=\"20\" viewBox=\"0 0 20 20\" fill=\"%23000000\"><path d=\"M15 2a7.65 7.65 0 00-5 2 7.65 7.65 0 
00-5-2H1v15h4a7.65 7.65 0 015 2 7.65 7.65 0 015-2h4V2zm2.5 13.5H14a4.38 4.38 0 00-3 1V5s1-1.5 4-1.5h2.5z\"/><path d=\"M9 3.5h2v1H9z\"/></svg>"); mask-image:url("data:image/svg+xml;utf8,<svg xmlns=\"http://www.w3.org/2000/svg\" xmlns:xlink=\"http://www.w3.org/1999/xlink\" width=\"20\" height=\"20\" viewBox=\"0 0 20 20\" fill=\"%23000000\"><path d=\"M15 2a7.65 7.65 0 00-5 2 7.65 7.65 0 00-5-2H1v15h4a7.65 7.65 0 015 2 7.65 7.65 0 015-2h4V2zm2.5 13.5H14a4.38 4.38 0 00-3 1V5s1-1.5 4-1.5h2.5z\"/><path d=\"M9 3.5h2v1H9z\"/></svg>");background-color:var(--color-base,#202122)}}.popups-icon--reference-book[dir='rtl'],html[dir='rtl'] .popups-icon--reference-book:not([dir='ltr']){transform:scaleX(-1)}.popups-icon--reference-journal{ min-width:20px;min-height:20px;width:1.25rem;height:1.25rem;display:inline-block;vertical-align:text-bottom}@supports not ((-webkit-mask-image:none) or (mask-image:none)){.popups-icon--reference-journal{background-position:center;background-repeat:no-repeat;background-size:calc(max(1.25rem,20px))}}@supports (-webkit-mask-image:none) or (mask-image:none){.popups-icon--reference-journal{ -webkit-mask-size:calc(max(1.25rem,20px));mask-size:calc(max(1.25rem,20px));-webkit-mask-repeat:no-repeat;mask-repeat:no-repeat;-webkit-mask-position:center;mask-position:center; }}@supports not ((-webkit-mask-image:none) or (mask-image:none)){.popups-icon--reference-journal{background-image:url("data:image/svg+xml;utf8,<svg xmlns=\"http://www.w3.org/2000/svg\" xmlns:xlink=\"http://www.w3.org/1999/xlink\" width=\"20\" height=\"20\" viewBox=\"0 0 20 20\" fill=\"%23000000\"><path d=\"M2 18.5A1.5 1.5 0 003.5 20H5V0H3.5A1.5 1.5 0 002 1.5zM6 0v20h10a2 2 0 002-2V2a2 2 0 00-2-2zm7 8H8V7h5zm3-2H8V5h8z\"/></svg>");filter:invert(var(--filter-invert-icon,0));opacity:var(--opacity-icon-base,0.87)}.cdx-button:not(.cdx-button--weight-quiet):disabled .popups-icon--reference-journal,.cdx-button--weight-primary.cdx-button--action-progressive 
.popups-icon--reference-journal,.cdx-button--weight-primary.cdx-button--action-destructive .popups-icon--reference-journal{filter:invert(var(--filter-invert-primary-button-icon,1))}}@supports (-webkit-mask-image:none) or (mask-image:none){.popups-icon--reference-journal{ -webkit-mask-image:url("data:image/svg+xml;utf8,<svg xmlns=\"http://www.w3.org/2000/svg\" xmlns:xlink=\"http://www.w3.org/1999/xlink\" width=\"20\" height=\"20\" viewBox=\"0 0 20 20\" fill=\"%23000000\"><path d=\"M2 18.5A1.5 1.5 0 003.5 20H5V0H3.5A1.5 1.5 0 002 1.5zM6 0v20h10a2 2 0 002-2V2a2 2 0 00-2-2zm7 8H8V7h5zm3-2H8V5h8z\"/></svg>"); mask-image:url("data:image/svg+xml;utf8,<svg xmlns=\"http://www.w3.org/2000/svg\" xmlns:xlink=\"http://www.w3.org/1999/xlink\" width=\"20\" height=\"20\" viewBox=\"0 0 20 20\" fill=\"%23000000\"><path d=\"M2 18.5A1.5 1.5 0 003.5 20H5V0H3.5A1.5 1.5 0 002 1.5zM6 0v20h10a2 2 0 002-2V2a2 2 0 00-2-2zm7 8H8V7h5zm3-2H8V5h8z\"/></svg>");background-color:var(--color-base,#202122)}}.popups-icon--reference-journal[dir='rtl'],html[dir='rtl'] .popups-icon--reference-journal:not([dir='ltr']){transform:scaleX(-1)}.popups-icon--reference-news{ min-width:20px;min-height:20px;width:1.25rem;height:1.25rem;display:inline-block;vertical-align:text-bottom}@supports not ((-webkit-mask-image:none) or (mask-image:none)){.popups-icon--reference-news{background-position:center;background-repeat:no-repeat;background-size:calc(max(1.25rem,20px))}}@supports (-webkit-mask-image:none) or (mask-image:none){.popups-icon--reference-news{ -webkit-mask-size:calc(max(1.25rem,20px));mask-size:calc(max(1.25rem,20px));-webkit-mask-repeat:no-repeat;mask-repeat:no-repeat;-webkit-mask-position:center;mask-position:center; }}@supports not ((-webkit-mask-image:none) or (mask-image:none)){.popups-icon--reference-news{background-image:url("data:image/svg+xml;utf8,<svg xmlns=\"http://www.w3.org/2000/svg\" xmlns:xlink=\"http://www.w3.org/1999/xlink\" width=\"20\" height=\"20\" viewBox=\"0 0 20 20\" 
fill=\"%23000000\"><path d=\"M5 2a2 2 0 00-2 2v12a1 1 0 01-1-1V5h-.5A1.5 1.5 0 000 6.5v10A1.5 1.5 0 001.5 18H18a2 2 0 002-2V4a2 2 0 00-2-2zm1 2h11v4H6zm0 6h6v1H6zm0 2h6v1H6zm0 2h6v1H6zm7-4h4v5h-4z\"/></svg>");filter:invert(var(--filter-invert-icon,0));opacity:var(--opacity-icon-base,0.87)}.cdx-button:not(.cdx-button--weight-quiet):disabled .popups-icon--reference-news,.cdx-button--weight-primary.cdx-button--action-progressive .popups-icon--reference-news,.cdx-button--weight-primary.cdx-button--action-destructive .popups-icon--reference-news{filter:invert(var(--filter-invert-primary-button-icon,1))}}@supports (-webkit-mask-image:none) or (mask-image:none){.popups-icon--reference-news{ -webkit-mask-image:url("data:image/svg+xml;utf8,<svg xmlns=\"http://www.w3.org/2000/svg\" xmlns:xlink=\"http://www.w3.org/1999/xlink\" width=\"20\" height=\"20\" viewBox=\"0 0 20 20\" fill=\"%23000000\"><path d=\"M5 2a2 2 0 00-2 2v12a1 1 0 01-1-1V5h-.5A1.5 1.5 0 000 6.5v10A1.5 1.5 0 001.5 18H18a2 2 0 002-2V4a2 2 0 00-2-2zm1 2h11v4H6zm0 6h6v1H6zm0 2h6v1H6zm0 2h6v1H6zm7-4h4v5h-4z\"/></svg>"); mask-image:url("data:image/svg+xml;utf8,<svg xmlns=\"http://www.w3.org/2000/svg\" xmlns:xlink=\"http://www.w3.org/1999/xlink\" width=\"20\" height=\"20\" viewBox=\"0 0 20 20\" fill=\"%23000000\"><path d=\"M5 2a2 2 0 00-2 2v12a1 1 0 01-1-1V5h-.5A1.5 1.5 0 000 6.5v10A1.5 1.5 0 001.5 18H18a2 2 0 002-2V4a2 2 0 00-2-2zm1 2h11v4H6zm0 6h6v1H6zm0 2h6v1H6zm0 2h6v1H6zm7-4h4v5h-4z\"/></svg>");background-color:var(--color-base,#202122)}}.popups-icon--reference-news[dir='rtl'],html[dir='rtl'] .popups-icon--reference-news:not([dir='ltr']){transform:scaleX(-1)}.popups-icon--reference-web{ min-width:20px;min-height:20px;width:1.25rem;height:1.25rem;display:inline-block;vertical-align:text-bottom}@supports not ((-webkit-mask-image:none) or (mask-image:none)){.popups-icon--reference-web{background-position:center;background-repeat:no-repeat;background-size:calc(max(1.25rem,20px))}}@supports (-webkit-mask-image:none) 
or (mask-image:none){.popups-icon--reference-web{ -webkit-mask-size:calc(max(1.25rem,20px));mask-size:calc(max(1.25rem,20px));-webkit-mask-repeat:no-repeat;mask-repeat:no-repeat;-webkit-mask-position:center;mask-position:center; }}@supports not ((-webkit-mask-image:none) or (mask-image:none)){.popups-icon--reference-web{background-image:url("data:image/svg+xml;utf8,<svg xmlns=\"http://www.w3.org/2000/svg\" xmlns:xlink=\"http://www.w3.org/1999/xlink\" width=\"20\" height=\"20\" viewBox=\"0 0 20 20\" fill=\"%23000000\"><path d=\"M2 2a2 2 0 00-2 2v12a2 2 0 002 2h16a2 2 0 002-2V4a2 2 0 00-2-2zm2 1.5A1.5 1.5 0 112.5 5 1.5 1.5 0 014 3.5M18 16H2V8h16z\"/></svg>");filter:invert(var(--filter-invert-icon,0));opacity:var(--opacity-icon-base,0.87)}.cdx-button:not(.cdx-button--weight-quiet):disabled .popups-icon--reference-web,.cdx-button--weight-primary.cdx-button--action-progressive .popups-icon--reference-web,.cdx-button--weight-primary.cdx-button--action-destructive .popups-icon--reference-web{filter:invert(var(--filter-invert-primary-button-icon,1))}}@supports (-webkit-mask-image:none) or (mask-image:none){.popups-icon--reference-web{ -webkit-mask-image:url("data:image/svg+xml;utf8,<svg xmlns=\"http://www.w3.org/2000/svg\" xmlns:xlink=\"http://www.w3.org/1999/xlink\" width=\"20\" height=\"20\" viewBox=\"0 0 20 20\" fill=\"%23000000\"><path d=\"M2 2a2 2 0 00-2 2v12a2 2 0 002 2h16a2 2 0 002-2V4a2 2 0 00-2-2zm2 1.5A1.5 1.5 0 112.5 5 1.5 1.5 0 014 3.5M18 16H2V8h16z\"/></svg>"); mask-image:url("data:image/svg+xml;utf8,<svg xmlns=\"http://www.w3.org/2000/svg\" xmlns:xlink=\"http://www.w3.org/1999/xlink\" width=\"20\" height=\"20\" viewBox=\"0 0 20 20\" fill=\"%23000000\"><path d=\"M2 2a2 2 0 00-2 2v12a2 2 0 002 2h16a2 2 0 002-2V4a2 2 0 00-2-2zm2 1.5A1.5 1.5 0 112.5 5 1.5 1.5 0 014 3.5M18 16H2V8h16z\"/></svg>");background-color:var(--color-base,#202122)}}.popups-icon--reference-web[dir='rtl'],html[dir='rtl'] 
.popups-icon--reference-web:not([dir='ltr']){transform:scaleX(-1)}.popups-icon--preview-disambiguation{ min-width:20px;min-height:20px;width:1.25rem;height:1.25rem;display:inline-block;vertical-align:text-bottom}@supports not ((-webkit-mask-image:none) or (mask-image:none)){.popups-icon--preview-disambiguation{background-position:center;background-repeat:no-repeat;background-size:calc(max(1.25rem,20px))}}@supports (-webkit-mask-image:none) or (mask-image:none){.popups-icon--preview-disambiguation{ -webkit-mask-size:calc(max(1.25rem,20px));mask-size:calc(max(1.25rem,20px));-webkit-mask-repeat:no-repeat;mask-repeat:no-repeat;-webkit-mask-position:center;mask-position:center; }}@supports not ((-webkit-mask-image:none) or (mask-image:none)){.popups-icon--preview-disambiguation{background-image:url("data:image/svg+xml;utf8,<svg xmlns=\"http://www.w3.org/2000/svg\" xmlns:xlink=\"http://www.w3.org/1999/xlink\" width=\"20\" height=\"20\" viewBox=\"0 0 20 20\" fill=\"%23000000\"><path d=\"M7 0a2 2 0 00-2 2h9a2 2 0 012 2v12a2 2 0 002-2V2a2 2 0 00-2-2z\"/><path d=\"M13 20a2 2 0 002-2V5a2 2 0 00-2-2H4a2 2 0 00-2 2v13a2 2 0 002 2zM9 5h4v5H9zM4 5h4v1H4zm0 2h4v1H4zm0 2h4v1H4zm0 2h9v1H4zm0 2h9v1H4zm0 2h9v1H4z\"/></svg>");filter:invert(var(--filter-invert-icon,0));opacity:var(--opacity-icon-base,0.87)}.cdx-button:not(.cdx-button--weight-quiet):disabled .popups-icon--preview-disambiguation,.cdx-button--weight-primary.cdx-button--action-progressive .popups-icon--preview-disambiguation,.cdx-button--weight-primary.cdx-button--action-destructive .popups-icon--preview-disambiguation{filter:invert(var(--filter-invert-primary-button-icon,1))}}@supports (-webkit-mask-image:none) or (mask-image:none){.popups-icon--preview-disambiguation{ -webkit-mask-image:url("data:image/svg+xml;utf8,<svg xmlns=\"http://www.w3.org/2000/svg\" xmlns:xlink=\"http://www.w3.org/1999/xlink\" width=\"20\" height=\"20\" viewBox=\"0 0 20 20\" fill=\"%23000000\"><path d=\"M7 0a2 2 0 00-2 2h9a2 2 0 012 2v12a2 2 0 
002-2V2a2 2 0 00-2-2z\"/><path d=\"M13 20a2 2 0 002-2V5a2 2 0 00-2-2H4a2 2 0 00-2 2v13a2 2 0 002 2zM9 5h4v5H9zM4 5h4v1H4zm0 2h4v1H4zm0 2h4v1H4zm0 2h9v1H4zm0 2h9v1H4zm0 2h9v1H4z\"/></svg>"); mask-image:url("data:image/svg+xml;utf8,<svg xmlns=\"http://www.w3.org/2000/svg\" xmlns:xlink=\"http://www.w3.org/1999/xlink\" width=\"20\" height=\"20\" viewBox=\"0 0 20 20\" fill=\"%23000000\"><path d=\"M7 0a2 2 0 00-2 2h9a2 2 0 012 2v12a2 2 0 002-2V2a2 2 0 00-2-2z\"/><path d=\"M13 20a2 2 0 002-2V5a2 2 0 00-2-2H4a2 2 0 00-2 2v13a2 2 0 002 2zM9 5h4v5H9zM4 5h4v1H4zm0 2h4v1H4zm0 2h4v1H4zm0 2h9v1H4zm0 2h9v1H4zm0 2h9v1H4z\"/></svg>");background-color:var(--color-base,#202122)}}.popups-icon--preview-disambiguation[dir='rtl'],html[dir='rtl'] .popups-icon--preview-disambiguation:not([dir='ltr']){transform:scaleX(-1)} #mw-content-text .reference a[href*='#'] *{pointer-events:none}.mwe-popups.mwe-popups-type-reference .mwe-popups-container .mwe-popups-title .popups-icon--reference-note{display:none}.mwe-popups.mwe-popups-type-reference .mwe-popups-container .mwe-popups-extract{margin-right:0;max-height:inherit}.mwe-popups.mwe-popups-type-reference .mwe-popups-container .mwe-popups-extract .mwe-popups-scroll{max-height:343px;overflow:auto;padding-right:16px}.mwe-popups.mwe-popups-type-reference .mwe-popups-container .mwe-popups-extract .mw-parser-output{overflow-wrap:break-word}.mwe-popups.mwe-popups-type-reference .mwe-popups-container .mwe-popups-extract::after{display:none}.mwe-popups.mwe-popups-type-reference .mwe-popups-container .mwe-popups-extract .mwe-popups-fade{position:absolute;width:100%;height:20px;background-color:transparent;background-image:linear-gradient(rgba(255,255,255,0),#ffffff);opacity:0;pointer-events:none;transition:opacity 250ms ease}.mwe-popups.mwe-popups-type-reference .mwe-popups-container .mwe-popups-extract.mwe-popups-fade-out .mwe-popups-fade{opacity:1}.mwe-popups.mwe-popups-type-reference .mwe-popups-container 
.mwe-collapsible-placeholder{font-weight:bold;margin:1em 0;position:relative}.mwe-popups.mwe-popups-type-reference .mwe-popups-container .mw-reference-previews-parent{margin-bottom:1em}</style><meta name="ResourceLoaderDynamicStyles" content="">
+<link rel="stylesheet" href="/w/load.php?lang=en&amp;modules=site.styles&amp;only=styles&amp;skin=vector-2022">
+<meta name="generator" content="MediaWiki 1.44.0-wmf.2">
+<meta name="referrer" content="origin">
+<meta name="referrer" content="origin-when-cross-origin">
+<meta name="robots" content="max-image-preview:standard">
+<meta name="format-detection" content="telephone=no">
+<meta property="og:image" content="https://upload.wikimedia.org/wikipedia/commons/thumb/a/a6/Pink_lady_and_cross_section.jpg/1200px-Pink_lady_and_cross_section.jpg">
+<meta property="og:image:width" content="1200">
+<meta property="og:image:height" content="407">
+<meta property="og:image" content="https://upload.wikimedia.org/wikipedia/commons/thumb/a/a6/Pink_lady_and_cross_section.jpg/800px-Pink_lady_and_cross_section.jpg">
+<meta property="og:image:width" content="800">
+<meta property="og:image:height" content="271">
+<meta property="og:image" content="https://upload.wikimedia.org/wikipedia/commons/thumb/a/a6/Pink_lady_and_cross_section.jpg/640px-Pink_lady_and_cross_section.jpg">
+<meta property="og:image:width" content="640">
+<meta property="og:image:height" content="217">
+<meta name="viewport" content="width=1120">
+<meta property="og:title" content="Apple - Wikipedia">
+<meta property="og:type" content="website">
+<link rel="preconnect" href="//upload.wikimedia.org">
+<link rel="alternate" media="only screen and (max-width: 640px)" href="//en.m.wikipedia.org/wiki/Apple">
+<link rel="apple-touch-icon" href="/static/apple-touch/wikipedia.png">
+<link rel="icon" href="/static/favicon/wikipedia.ico">
+<link rel="search" type="application/opensearchdescription+xml" href="/w/rest.php/v1/search" title="Wikipedia (en)">
+<link rel="EditURI" type="application/rsd+xml" href="//en.wikipedia.org/w/api.php?action=rsd">
+<link rel="canonical" href="https://en.wikipedia.org/wiki/Apple">
+<link rel="license" href="https://creativecommons.org/licenses/by-sa/4.0/deed.en">
+<link rel="alternate" type="application/atom+xml" title="Wikipedia Atom feed" href="/w/index.php?title=Special:RecentChanges&amp;feed=atom">
+<link rel="dns-prefetch" href="//meta.wikimedia.org">
+<link rel="dns-prefetch" href="//login.wikimedia.org">
+</head>
+<body class="skin--responsive skin-vector skin-vector-search-vue mediawiki ltr sitedir-ltr mw-hide-empty-elt ns-0 ns-subject page-Apple rootpage-Apple skin-vector-2022 action-view uls-dialog-sticky-hide vector-below-page-title"><a class="mw-jump-link" href="#bodyContent">Jump to content</a>
+<div class="vector-header-container">
+	<header class="vector-header mw-header">
+		<div class="vector-header-start">
+			<nav class="vector-main-menu-landmark" aria-label="Site">
+				
+<div id="vector-main-menu-dropdown" class="vector-dropdown vector-main-menu-dropdown vector-button-flush-left vector-button-flush-right">
+	<input type="checkbox" id="vector-main-menu-dropdown-checkbox" role="button" aria-haspopup="true" data-event-name="ui.dropdown-vector-main-menu-dropdown" class="vector-dropdown-checkbox " aria-label="Main menu">
+	<label id="vector-main-menu-dropdown-label" for="vector-main-menu-dropdown-checkbox" class="vector-dropdown-label cdx-button cdx-button--fake-button cdx-button--fake-button--enabled cdx-button--weight-quiet cdx-button--icon-only " aria-hidden="true"><span class="vector-icon mw-ui-icon-menu mw-ui-icon-wikimedia-menu"></span>
+
+<span class="vector-dropdown-label-text">Main menu</span>
+	</label>
+	<div class="vector-dropdown-content">
+
+
+				<div id="vector-main-menu-unpinned-container" class="vector-unpinned-container">
+		
+<div id="vector-main-menu" class="vector-main-menu vector-pinnable-element">
+	<div class="vector-pinnable-header vector-main-menu-pinnable-header vector-pinnable-header-unpinned" data-feature-name="main-menu-pinned" data-pinnable-element-id="vector-main-menu" data-pinned-container-id="vector-main-menu-pinned-container" data-unpinned-container-id="vector-main-menu-unpinned-container" data-saved-pinned-state="false">
+	<div class="vector-pinnable-header-label">Main menu</div>
+	<button class="vector-pinnable-header-toggle-button vector-pinnable-header-pin-button" data-event-name="pinnable-header.vector-main-menu.pin">move to sidebar</button>
+	<button class="vector-pinnable-header-toggle-button vector-pinnable-header-unpin-button" data-event-name="pinnable-header.vector-main-menu.unpin">hide</button>
+</div>
+
+	
+<div id="p-navigation" class="vector-menu mw-portlet mw-portlet-navigation">
+	<div class="vector-menu-heading">
+		Navigation
+	</div>
+	<div class="vector-menu-content">
+		
+		<ul class="vector-menu-content-list">
+			
+			<li id="n-mainpage-description" class="mw-list-item"><a href="/wiki/Main_Page" title="Visit the main page [ctrl-option-z]" accesskey="z"><span>Main page</span></a></li><li id="n-contents" class="mw-list-item"><a href="/wiki/Wikipedia:Contents" title="Guides to browsing Wikipedia"><span>Contents</span></a></li><li id="n-currentevents" class="mw-list-item"><a href="/wiki/Portal:Current_events" title="Articles related to current events"><span>Current events</span></a></li><li id="n-randompage" class="mw-list-item"><a href="/wiki/Special:Random" title="Visit a randomly selected article [ctrl-option-x]" accesskey="x"><span>Random article</span></a></li><li id="n-aboutsite" class="mw-list-item"><a href="/wiki/Wikipedia:About" title="Learn about Wikipedia and how it works"><span>About Wikipedia</span></a></li><li id="n-contactpage" class="mw-list-item"><a href="//en.wikipedia.org/wiki/Wikipedia:Contact_us" title="How to contact Wikipedia"><span>Contact us</span></a></li>
+		</ul>
+		
+	</div>
+</div>
+
+	
+	
+<div id="p-interaction" class="vector-menu mw-portlet mw-portlet-interaction">
+	<div class="vector-menu-heading">
+		Contribute
+	</div>
+	<div class="vector-menu-content">
+		
+		<ul class="vector-menu-content-list">
+			
+			<li id="n-help" class="mw-list-item"><a href="/wiki/Help:Contents" title="Guidance on how to use and edit Wikipedia"><span>Help</span></a></li><li id="n-introduction" class="mw-list-item"><a href="/wiki/Help:Introduction" title="Learn how to edit Wikipedia"><span>Learn to edit</span></a></li><li id="n-portal" class="mw-list-item"><a href="/wiki/Wikipedia:Community_portal" title="The hub for editors"><span>Community portal</span></a></li><li id="n-recentchanges" class="mw-list-item"><a href="/wiki/Special:RecentChanges" title="A list of recent changes to Wikipedia [ctrl-option-r]" accesskey="r"><span>Recent changes</span></a></li><li id="n-upload" class="mw-list-item"><a href="/wiki/Wikipedia:File_upload_wizard" title="Add images or other media for use on Wikipedia"><span>Upload file</span></a></li>
+		</ul>
+		
+	</div>
+</div>
+
+</div>
+
+				</div>
+
+	</div>
+</div>
+
+		</nav>
+			
+<a href="/wiki/Main_Page" class="mw-logo">
+	<img class="mw-logo-icon" src="/static/images/icons/wikipedia.png" alt="" aria-hidden="true" height="50" width="50">
+	<span class="mw-logo-container skin-invert">
+		<img class="mw-logo-wordmark" alt="Wikipedia" src="/static/images/mobile/copyright/wikipedia-wordmark-en.svg" style="width: 7.5em; height: 1.125em;" width="300" height="45">
+		<img class="mw-logo-tagline" alt="The Free Encyclopedia" src="/static/images/mobile/copyright/wikipedia-tagline-en.svg" width="300" height="33" style="width: 7.3125em; height: 0.8125em;">
+	</span>
+</a>
+
+		</div>
+		<div class="vector-header-end">
+			
+<div id="p-search" role="search" class="vector-search-box-vue  vector-search-box-collapses vector-search-box-show-thumbnail vector-search-box-auto-expand-width vector-search-box">
+	<a href="/wiki/Special:Search" class="cdx-button cdx-button--fake-button cdx-button--fake-button--enabled cdx-button--weight-quiet cdx-button--icon-only search-toggle" title="Search Wikipedia [ctrl-option-f]" accesskey="f"><span class="vector-icon mw-ui-icon-search mw-ui-icon-wikimedia-search"></span>
+
+<span>Search</span>
+	</a>
+	<div class="vector-typeahead-search-container">
+		<div class="cdx-typeahead-search cdx-typeahead-search--show-thumbnail cdx-typeahead-search--auto-expand-width">
+			<form action="/w/index.php" id="searchform" class="cdx-search-input cdx-search-input--has-end-button">
+				<div id="simpleSearch" class="cdx-search-input__input-wrapper" data-search-loc="header-moved">
+					<div class="cdx-text-input cdx-text-input--has-start-icon">
+						<input class="cdx-text-input__input" type="search" name="search" placeholder="Search Wikipedia" aria-label="Search Wikipedia" autocapitalize="sentences" title="Search Wikipedia [ctrl-option-f]" accesskey="f" id="searchInput" autocomplete="off">
+						<span class="cdx-text-input__icon cdx-text-input__start-icon"></span>
+					</div>
+					<input type="hidden" name="title" value="Special:Search">
+				</div>
+				<button class="cdx-button cdx-search-input__end-button">Search</button>
+			</form>
+		</div>
+	</div>
+</div>
+
+			<nav class="vector-user-links vector-user-links-wide" aria-label="Personal tools">
+	<div class="vector-user-links-main">
+	
+<div id="p-vector-user-menu-preferences" class="vector-menu mw-portlet emptyPortlet">
+	<div class="vector-menu-content">
+		
+		<ul class="vector-menu-content-list">
+			
+			
+		</ul>
+		
+	</div>
+</div>
+
+	
+<div id="p-vector-user-menu-userpage" class="vector-menu mw-portlet emptyPortlet">
+	<div class="vector-menu-content">
+		
+		<ul class="vector-menu-content-list">
+			
+			
+		</ul>
+		
+	</div>
+</div>
+
+	<nav class="vector-appearance-landmark" aria-label="Appearance">
+		
+<div id="vector-appearance-dropdown" class="vector-dropdown " title="Change the appearance of the page's font size, width, and color">
+	<input type="checkbox" id="vector-appearance-dropdown-checkbox" role="button" aria-haspopup="true" data-event-name="ui.dropdown-vector-appearance-dropdown" class="vector-dropdown-checkbox " aria-label="Appearance">
+	<label id="vector-appearance-dropdown-label" for="vector-appearance-dropdown-checkbox" class="vector-dropdown-label cdx-button cdx-button--fake-button cdx-button--fake-button--enabled cdx-button--weight-quiet cdx-button--icon-only " aria-hidden="true"><span class="vector-icon mw-ui-icon-appearance mw-ui-icon-wikimedia-appearance"></span>
+
+<span class="vector-dropdown-label-text">Appearance</span>
+	</label>
+	<div class="vector-dropdown-content">
+
+
+			<div id="vector-appearance-unpinned-container" class="vector-unpinned-container">
+				
+			</div>
+		
+	</div>
+</div>
+
+	</nav>
+	
+<div id="p-vector-user-menu-notifications" class="vector-menu mw-portlet emptyPortlet">
+	<div class="vector-menu-content">
+		
+		<ul class="vector-menu-content-list">
+			
+			
+		</ul>
+		
+	</div>
+</div>
+
+	
+<div id="p-vector-user-menu-overflow" class="vector-menu mw-portlet">
+	<div class="vector-menu-content">
+		
+		<ul class="vector-menu-content-list">
+			<li id="pt-sitesupport-2" class="user-links-collapsible-item mw-list-item user-links-collapsible-item"><a data-mw="interface" href="https://donate.wikimedia.org/wiki/Special:FundraiserRedirector?utm_source=donate&amp;utm_medium=sidebar&amp;utm_campaign=C13_en.wikipedia.org&amp;uselang=en" class=""><span>Donate</span></a>
+</li>
+<li id="pt-createaccount-2" class="user-links-collapsible-item mw-list-item user-links-collapsible-item"><a data-mw="interface" href="/w/index.php?title=Special:CreateAccount&amp;returnto=Apple" title="You are encouraged to create an account and log in; however, it is not mandatory" class=""><span>Create account</span></a>
+</li>
+<li id="pt-login-2" class="user-links-collapsible-item mw-list-item user-links-collapsible-item"><a data-mw="interface" href="/w/index.php?title=Special:UserLogin&amp;returnto=Apple" title="You're encouraged to log in; however, it's not mandatory. [ctrl-option-o]" accesskey="o" class=""><span>Log in</span></a>
+</li>
+
+			
+		</ul>
+		
+	</div>
+</div>
+
+	</div>
+	
+<div id="vector-user-links-dropdown" class="vector-dropdown vector-user-menu vector-button-flush-right vector-user-menu-logged-out" title="Log in and more options">
+	<input type="checkbox" id="vector-user-links-dropdown-checkbox" role="button" aria-haspopup="true" data-event-name="ui.dropdown-vector-user-links-dropdown" class="vector-dropdown-checkbox " aria-label="Personal tools">
+	<label id="vector-user-links-dropdown-label" for="vector-user-links-dropdown-checkbox" class="vector-dropdown-label cdx-button cdx-button--fake-button cdx-button--fake-button--enabled cdx-button--weight-quiet cdx-button--icon-only " aria-hidden="true"><span class="vector-icon mw-ui-icon-ellipsis mw-ui-icon-wikimedia-ellipsis"></span>
+
+<span class="vector-dropdown-label-text">Personal tools</span>
+	</label>
+	<div class="vector-dropdown-content">
+
+
+		
+<div id="p-personal" class="vector-menu mw-portlet mw-portlet-personal user-links-collapsible-item" title="User menu">
+	<div class="vector-menu-content">
+		
+		<ul class="vector-menu-content-list">
+			
+			<li id="pt-sitesupport" class="user-links-collapsible-item mw-list-item"><a href="https://donate.wikimedia.org/wiki/Special:FundraiserRedirector?utm_source=donate&amp;utm_medium=sidebar&amp;utm_campaign=C13_en.wikipedia.org&amp;uselang=en"><span>Donate</span></a></li><li id="pt-createaccount" class="user-links-collapsible-item mw-list-item"><a href="/w/index.php?title=Special:CreateAccount&amp;returnto=Apple" title="You are encouraged to create an account and log in; however, it is not mandatory"><span class="vector-icon mw-ui-icon-userAdd mw-ui-icon-wikimedia-userAdd"></span> <span>Create account</span></a></li><li id="pt-login" class="user-links-collapsible-item mw-list-item"><a href="/w/index.php?title=Special:UserLogin&amp;returnto=Apple" title="You're encouraged to log in; however, it's not mandatory. [ctrl-option-o]" accesskey="o"><span class="vector-icon mw-ui-icon-logIn mw-ui-icon-wikimedia-logIn"></span> <span>Log in</span></a></li>
+		</ul>
+		
+	</div>
+</div>
+
+<div id="p-user-menu-anon-editor" class="vector-menu mw-portlet mw-portlet-user-menu-anon-editor">
+	<div class="vector-menu-heading">
+		Pages for logged out editors <a href="/wiki/Help:Introduction" aria-label="Learn more about editing"><span>learn more</span></a>
+	</div>
+	<div class="vector-menu-content">
+		
+		<ul class="vector-menu-content-list">
+			
+			<li id="pt-anoncontribs" class="mw-list-item"><a href="/wiki/Special:MyContributions" title="A list of edits made from this IP address [ctrl-option-y]" accesskey="y"><span>Contributions</span></a></li><li id="pt-anontalk" class="mw-list-item"><a href="/wiki/Special:MyTalk" title="Discussion about edits from this IP address [ctrl-option-n]" accesskey="n"><span>Talk</span></a></li>
+		</ul>
+		
+	</div>
+</div>
+
+	
+	</div>
+</div>
+
+</nav>
+
+		</div>
+	</header>
+</div>
+<div class="mw-page-container">
+	<div class="mw-page-container-inner">
+		<div class="vector-sitenotice-container">
+			<div id="siteNotice"><div id="centralNotice"></div><!-- CentralNotice --></div>
+		</div>
+		<div class="vector-column-start">
+			<div class="vector-main-menu-container">
+		<div id="mw-navigation">
+			<nav id="mw-panel" class="vector-main-menu-landmark" aria-label="Site">
+				<div id="vector-main-menu-pinned-container" class="vector-pinned-container">
+				
+				</div>
+		</nav>
+		</div>
+	</div>
+	<div class="vector-sticky-pinned-container">
+				<nav id="mw-panel-toc" aria-label="Contents" data-event-name="ui.sidebar-toc" class="mw-table-of-contents-container vector-toc-landmark">
+					<div id="vector-toc-pinned-container" class="vector-pinned-container">
+					<div id="vector-toc" class="vector-toc vector-pinnable-element">
+	<div class="vector-pinnable-header vector-toc-pinnable-header vector-pinnable-header-pinned" data-feature-name="toc-pinned" data-pinnable-element-id="vector-toc">
+	<h2 class="vector-pinnable-header-label">Contents</h2>
+	<button class="vector-pinnable-header-toggle-button vector-pinnable-header-pin-button" data-event-name="pinnable-header.vector-toc.pin">move to sidebar</button>
+	<button class="vector-pinnable-header-toggle-button vector-pinnable-header-unpin-button" data-event-name="pinnable-header.vector-toc.unpin">hide</button>
+</div>
+
+
+	<ul class="vector-toc-contents" id="mw-panel-toc-list">
+		<li id="toc-mw-content-text" class="vector-toc-list-item vector-toc-level-1 vector-toc-level-1-active vector-toc-list-item-active">
+			<a href="#" class="vector-toc-link">
+				<div class="vector-toc-text">(Top)</div>
+			</a>
+		</li>
+		<li id="toc-Etymology" class="vector-toc-list-item vector-toc-level-1">
+		<a class="vector-toc-link" href="#Etymology">
+			<div class="vector-toc-text">
+				<span class="vector-toc-numb">1</span>
+				<span>Etymology</span>
+			</div>
+		</a>
+		
+		<ul id="toc-Etymology-sublist" class="vector-toc-list">
+		</ul>
+	</li>
+	<li id="toc-Description" class="vector-toc-list-item vector-toc-level-1">
+		<a class="vector-toc-link" href="#Description">
+			<div class="vector-toc-text">
+				<span class="vector-toc-numb">2</span>
+				<span>Description</span>
+			</div>
+		</a>
+		
+			<button aria-controls="toc-Description-sublist" class="cdx-button cdx-button--weight-quiet cdx-button--icon-only vector-toc-toggle" aria-expanded="false">
+				<span class="vector-icon mw-ui-icon-wikimedia-expand"></span>
+				<span>Toggle Description subsection</span>
+			</button>
+		
+		<ul id="toc-Description-sublist" class="vector-toc-list">
+			<li id="toc-Fruit" class="vector-toc-list-item vector-toc-level-2">
+			<a class="vector-toc-link" href="#Fruit">
+				<div class="vector-toc-text">
+					<span class="vector-toc-numb">2.1</span>
+					<span>Fruit</span>
+				</div>
+			</a>
+			
+			<ul id="toc-Fruit-sublist" class="vector-toc-list">
+			</ul>
+		</li>
+		<li id="toc-Chemistry" class="vector-toc-list-item vector-toc-level-2">
+			<a class="vector-toc-link" href="#Chemistry">
+				<div class="vector-toc-text">
+					<span class="vector-toc-numb">2.2</span>
+					<span>Chemistry</span>
+				</div>
+			</a>
+			
+			<ul id="toc-Chemistry-sublist" class="vector-toc-list">
+			</ul>
+		</li>
+	</ul>
+	</li>
+	<li id="toc-Taxonomy" class="vector-toc-list-item vector-toc-level-1">
+		<a class="vector-toc-link" href="#Taxonomy">
+			<div class="vector-toc-text">
+				<span class="vector-toc-numb">3</span>
+				<span>Taxonomy</span>
+			</div>
+		</a>
+		
+			<button aria-controls="toc-Taxonomy-sublist" class="cdx-button cdx-button--weight-quiet cdx-button--icon-only vector-toc-toggle" aria-expanded="false">
+				<span class="vector-icon mw-ui-icon-wikimedia-expand"></span>
+				<span>Toggle Taxonomy subsection</span>
+			</button>
+		
+		<ul id="toc-Taxonomy-sublist" class="vector-toc-list">
+			<li id="toc-Genome" class="vector-toc-list-item vector-toc-level-2">
+			<a class="vector-toc-link" href="#Genome">
+				<div class="vector-toc-text">
+					<span class="vector-toc-numb">3.1</span>
+					<span>Genome</span>
+				</div>
+			</a>
+			
+			<ul id="toc-Genome-sublist" class="vector-toc-list">
+			</ul>
+		</li>
+	</ul>
+	</li>
+	<li id="toc-Cultivation" class="vector-toc-list-item vector-toc-level-1">
+		<a class="vector-toc-link" href="#Cultivation">
+			<div class="vector-toc-text">
+				<span class="vector-toc-numb">4</span>
+				<span>Cultivation</span>
+			</div>
+		</a>
+		
+			<button aria-controls="toc-Cultivation-sublist" class="cdx-button cdx-button--weight-quiet cdx-button--icon-only vector-toc-toggle" aria-expanded="false">
+				<span class="vector-icon mw-ui-icon-wikimedia-expand"></span>
+				<span>Toggle Cultivation subsection</span>
+			</button>
+		
+		<ul id="toc-Cultivation-sublist" class="vector-toc-list">
+			<li id="toc-History" class="vector-toc-list-item vector-toc-level-2">
+			<a class="vector-toc-link" href="#History">
+				<div class="vector-toc-text">
+					<span class="vector-toc-numb">4.1</span>
+					<span>History</span>
+				</div>
+			</a>
+			
+			<ul id="toc-History-sublist" class="vector-toc-list">
+			</ul>
+		</li>
+		<li id="toc-Breeding" class="vector-toc-list-item vector-toc-level-2">
+			<a class="vector-toc-link" href="#Breeding">
+				<div class="vector-toc-text">
+					<span class="vector-toc-numb">4.2</span>
+					<span>Breeding</span>
+				</div>
+			</a>
+			
+			<ul id="toc-Breeding-sublist" class="vector-toc-list">
+			</ul>
+		</li>
+		<li id="toc-Pollination" class="vector-toc-list-item vector-toc-level-2">
+			<a class="vector-toc-link" href="#Pollination">
+				<div class="vector-toc-text">
+					<span class="vector-toc-numb">4.3</span>
+					<span>Pollination</span>
+				</div>
+			</a>
+			
+			<ul id="toc-Pollination-sublist" class="vector-toc-list">
+			</ul>
+		</li>
+		<li id="toc-Maturation_and_harvest" class="vector-toc-list-item vector-toc-level-2">
+			<a class="vector-toc-link" href="#Maturation_and_harvest">
+				<div class="vector-toc-text">
+					<span class="vector-toc-numb">4.4</span>
+					<span>Maturation and harvest</span>
+				</div>
+			</a>
+			
+			<ul id="toc-Maturation_and_harvest-sublist" class="vector-toc-list">
+			</ul>
+		</li>
+		<li id="toc-Storage" class="vector-toc-list-item vector-toc-level-2">
+			<a class="vector-toc-link" href="#Storage">
+				<div class="vector-toc-text">
+					<span class="vector-toc-numb">4.5</span>
+					<span>Storage</span>
+				</div>
+			</a>
+			
+			<ul id="toc-Storage-sublist" class="vector-toc-list">
+			</ul>
+		</li>
+		<li id="toc-Pests_and_diseases" class="vector-toc-list-item vector-toc-level-2">
+			<a class="vector-toc-link" href="#Pests_and_diseases">
+				<div class="vector-toc-text">
+					<span class="vector-toc-numb">4.6</span>
+					<span>Pests and diseases</span>
+				</div>
+			</a>
+			
+			<ul id="toc-Pests_and_diseases-sublist" class="vector-toc-list">
+			</ul>
+		</li>
+		<li id="toc-Cultivars" class="vector-toc-list-item vector-toc-level-2">
+			<a class="vector-toc-link" href="#Cultivars">
+				<div class="vector-toc-text">
+					<span class="vector-toc-numb">4.7</span>
+					<span>Cultivars</span>
+				</div>
+			</a>
+			
+			<ul id="toc-Cultivars-sublist" class="vector-toc-list">
+			</ul>
+		</li>
+		<li id="toc-Production" class="vector-toc-list-item vector-toc-level-2">
+			<a class="vector-toc-link" href="#Production">
+				<div class="vector-toc-text">
+					<span class="vector-toc-numb">4.8</span>
+					<span>Production</span>
+				</div>
+			</a>
+			
+			<ul id="toc-Production-sublist" class="vector-toc-list">
+			</ul>
+		</li>
+	</ul>
+	</li>
+	<li id="toc-Toxicity" class="vector-toc-list-item vector-toc-level-1">
+		<a class="vector-toc-link" href="#Toxicity">
+			<div class="vector-toc-text">
+				<span class="vector-toc-numb">5</span>
+				<span>Toxicity</span>
+			</div>
+		</a>
+		
+			<button aria-controls="toc-Toxicity-sublist" class="cdx-button cdx-button--weight-quiet cdx-button--icon-only vector-toc-toggle" aria-expanded="false">
+				<span class="vector-icon mw-ui-icon-wikimedia-expand"></span>
+				<span>Toggle Toxicity subsection</span>
+			</button>
+		
+		<ul id="toc-Toxicity-sublist" class="vector-toc-list">
+			<li id="toc-Amygdalin" class="vector-toc-list-item vector-toc-level-2">
+			<a class="vector-toc-link" href="#Amygdalin">
+				<div class="vector-toc-text">
+					<span class="vector-toc-numb">5.1</span>
+					<span>Amygdalin</span>
+				</div>
+			</a>
+			
+			<ul id="toc-Amygdalin-sublist" class="vector-toc-list">
+			</ul>
+		</li>
+		<li id="toc-Allergy" class="vector-toc-list-item vector-toc-level-2">
+			<a class="vector-toc-link" href="#Allergy">
+				<div class="vector-toc-text">
+					<span class="vector-toc-numb">5.2</span>
+					<span>Allergy</span>
+				</div>
+			</a>
+			
+			<ul id="toc-Allergy-sublist" class="vector-toc-list">
+			</ul>
+		</li>
+	</ul>
+	</li>
+	<li id="toc-Uses" class="vector-toc-list-item vector-toc-level-1">
+		<a class="vector-toc-link" href="#Uses">
+			<div class="vector-toc-text">
+				<span class="vector-toc-numb">6</span>
+				<span>Uses</span>
+			</div>
+		</a>
+		
+			<button aria-controls="toc-Uses-sublist" class="cdx-button cdx-button--weight-quiet cdx-button--icon-only vector-toc-toggle" aria-expanded="false">
+				<span class="vector-icon mw-ui-icon-wikimedia-expand"></span>
+				<span>Toggle Uses subsection</span>
+			</button>
+		
+		<ul id="toc-Uses-sublist" class="vector-toc-list">
+			<li id="toc-Nutrition" class="vector-toc-list-item vector-toc-level-2">
+			<a class="vector-toc-link" href="#Nutrition">
+				<div class="vector-toc-text">
+					<span class="vector-toc-numb">6.1</span>
+					<span>Nutrition</span>
+				</div>
+			</a>
+			
+			<ul id="toc-Nutrition-sublist" class="vector-toc-list">
+			</ul>
+		</li>
+		<li id="toc-Culinary" class="vector-toc-list-item vector-toc-level-2">
+			<a class="vector-toc-link" href="#Culinary">
+				<div class="vector-toc-text">
+					<span class="vector-toc-numb">6.2</span>
+					<span>Culinary</span>
+				</div>
+			</a>
+			
+			<ul id="toc-Culinary-sublist" class="vector-toc-list">
+			</ul>
+		</li>
+		<li id="toc-Organic_production" class="vector-toc-list-item vector-toc-level-2">
+			<a class="vector-toc-link" href="#Organic_production">
+				<div class="vector-toc-text">
+					<span class="vector-toc-numb">6.3</span>
+					<span>Organic production</span>
+				</div>
+			</a>
+			
+			<ul id="toc-Organic_production-sublist" class="vector-toc-list">
+			</ul>
+		</li>
+		<li id="toc-Non-browning_apples" class="vector-toc-list-item vector-toc-level-2">
+			<a class="vector-toc-link" href="#Non-browning_apples">
+				<div class="vector-toc-text">
+					<span class="vector-toc-numb">6.4</span>
+					<span>Non-browning apples</span>
+				</div>
+			</a>
+			
+			<ul id="toc-Non-browning_apples-sublist" class="vector-toc-list">
+			</ul>
+		</li>
+		<li id="toc-Other_products" class="vector-toc-list-item vector-toc-level-2">
+			<a class="vector-toc-link" href="#Other_products">
+				<div class="vector-toc-text">
+					<span class="vector-toc-numb">6.5</span>
+					<span>Other products</span>
+				</div>
+			</a>
+			
+			<ul id="toc-Other_products-sublist" class="vector-toc-list">
+			</ul>
+		</li>
+	</ul>
+	</li>
+	<li id="toc-In_culture" class="vector-toc-list-item vector-toc-level-1">
+		<a class="vector-toc-link" href="#In_culture">
+			<div class="vector-toc-text">
+				<span class="vector-toc-numb">7</span>
+				<span>In culture</span>
+			</div>
+		</a>
+		
+			<button aria-controls="toc-In_culture-sublist" class="cdx-button cdx-button--weight-quiet cdx-button--icon-only vector-toc-toggle" aria-expanded="false">
+				<span class="vector-icon mw-ui-icon-wikimedia-expand"></span>
+				<span>Toggle In culture subsection</span>
+			</button>
+		
+		<ul id="toc-In_culture-sublist" class="vector-toc-list">
+			<li id="toc-Germanic_paganism" class="vector-toc-list-item vector-toc-level-2">
+			<a class="vector-toc-link" href="#Germanic_paganism">
+				<div class="vector-toc-text">
+					<span class="vector-toc-numb">7.1</span>
+					<span>Germanic paganism</span>
+				</div>
+			</a>
+			
+			<ul id="toc-Germanic_paganism-sublist" class="vector-toc-list">
+			</ul>
+		</li>
+		<li id="toc-Greek_mythology" class="vector-toc-list-item vector-toc-level-2">
+			<a class="vector-toc-link" href="#Greek_mythology">
+				<div class="vector-toc-text">
+					<span class="vector-toc-numb">7.2</span>
+					<span>Greek mythology</span>
+				</div>
+			</a>
+			
+			<ul id="toc-Greek_mythology-sublist" class="vector-toc-list">
+			</ul>
+		</li>
+		<li id="toc-Celtic_mythology" class="vector-toc-list-item vector-toc-level-2">
+			<a class="vector-toc-link" href="#Celtic_mythology">
+				<div class="vector-toc-text">
+					<span class="vector-toc-numb">7.3</span>
+					<span>Celtic mythology</span>
+				</div>
+			</a>
+			
+			<ul id="toc-Celtic_mythology-sublist" class="vector-toc-list">
+			</ul>
+		</li>
+		<li id="toc-China" class="vector-toc-list-item vector-toc-level-2">
+			<a class="vector-toc-link" href="#China">
+				<div class="vector-toc-text">
+					<span class="vector-toc-numb">7.4</span>
+					<span>China</span>
+				</div>
+			</a>
+			
+			<ul id="toc-China-sublist" class="vector-toc-list">
+			</ul>
+		</li>
+		<li id="toc-Christian_art" class="vector-toc-list-item vector-toc-level-2">
+			<a class="vector-toc-link" href="#Christian_art">
+				<div class="vector-toc-text">
+					<span class="vector-toc-numb">7.5</span>
+					<span>Christian art</span>
+				</div>
+			</a>
+			
+			<ul id="toc-Christian_art-sublist" class="vector-toc-list">
+			</ul>
+		</li>
+		<li id="toc-Proverb" class="vector-toc-list-item vector-toc-level-2">
+			<a class="vector-toc-link" href="#Proverb">
+				<div class="vector-toc-text">
+					<span class="vector-toc-numb">7.6</span>
+					<span>Proverb</span>
+				</div>
+			</a>
+			
+			<ul id="toc-Proverb-sublist" class="vector-toc-list">
+			</ul>
+		</li>
+	</ul>
+	</li>
+	<li id="toc-See_also" class="vector-toc-list-item vector-toc-level-1">
+		<a class="vector-toc-link" href="#See_also">
+			<div class="vector-toc-text">
+				<span class="vector-toc-numb">8</span>
+				<span>See also</span>
+			</div>
+		</a>
+		
+		<ul id="toc-See_also-sublist" class="vector-toc-list">
+		</ul>
+	</li>
+	<li id="toc-References" class="vector-toc-list-item vector-toc-level-1">
+		<a class="vector-toc-link" href="#References">
+			<div class="vector-toc-text">
+				<span class="vector-toc-numb">9</span>
+				<span>References</span>
+			</div>
+		</a>
+		
+		<ul id="toc-References-sublist" class="vector-toc-list">
+		</ul>
+	</li>
+	<li id="toc-Further_reading" class="vector-toc-list-item vector-toc-level-1">
+		<a class="vector-toc-link" href="#Further_reading">
+			<div class="vector-toc-text">
+				<span class="vector-toc-numb">10</span>
+				<span>Further reading</span>
+			</div>
+		</a>
+		
+		<ul id="toc-Further_reading-sublist" class="vector-toc-list">
+		</ul>
+	</li>
+	<li id="toc-External_links" class="vector-toc-list-item vector-toc-level-1">
+		<a class="vector-toc-link" href="#External_links">
+			<div class="vector-toc-text">
+				<span class="vector-toc-numb">11</span>
+				<span>External links</span>
+			</div>
+		</a>
+		
+		<ul id="toc-External_links-sublist" class="vector-toc-list">
+		</ul>
+	</li>
+</ul>
+</div>
+
+					</div>
+		</nav>
+			</div>
+		</div>
+		<div class="mw-content-container">
+			<main id="content" class="mw-body">
+				<header class="mw-body-header vector-page-titlebar">
+					<nav aria-label="Contents" class="vector-toc-landmark">
+						
+<div id="vector-page-titlebar-toc" class="vector-dropdown vector-page-titlebar-toc vector-button-flush-left">
+	<input type="checkbox" id="vector-page-titlebar-toc-checkbox" role="button" aria-haspopup="true" data-event-name="ui.dropdown-vector-page-titlebar-toc" class="vector-dropdown-checkbox " aria-label="Toggle the table of contents">
+	<label id="vector-page-titlebar-toc-label" for="vector-page-titlebar-toc-checkbox" class="vector-dropdown-label cdx-button cdx-button--fake-button cdx-button--fake-button--enabled cdx-button--icon-only" aria-hidden="true"><span class="vector-icon mw-ui-icon-listBullet mw-ui-icon-wikimedia-listBullet"></span>
+
+<span class="vector-dropdown-label-text">Toggle the table of contents</span>
+	</label>
+	<div class="vector-dropdown-content">
+
+
+							<div id="vector-page-titlebar-toc-unpinned-container" class="vector-unpinned-container">
+			</div>
+		
+	</div>
+</div>
+
+					</nav>
+					<h1 id="firstHeading" class="firstHeading mw-first-heading"><span class="mw-page-title-main">Apple</span></h1>
+							
+<div id="p-lang-btn" class="vector-dropdown mw-portlet mw-portlet-lang">
+	<input type="checkbox" id="p-lang-btn-checkbox" role="button" aria-haspopup="true" data-event-name="ui.dropdown-p-lang-btn" class="vector-dropdown-checkbox mw-interlanguage-selector" aria-label="Go to an article in another language. Available in 191 languages">
+	<label id="p-lang-btn-label" for="p-lang-btn-checkbox" class="vector-dropdown-label cdx-button cdx-button--fake-button cdx-button--fake-button--enabled cdx-button--weight-quiet cdx-button--action-progressive mw-portlet-lang-heading-191" aria-hidden="true"><span class="vector-icon mw-ui-icon-language-progressive mw-ui-icon-wikimedia-language-progressive"></span>
+
+<span class="vector-dropdown-label-text">191 languages</span>
+	</label>
+	<div class="vector-dropdown-content">
+
+		<div class="vector-menu-content">
+			
+			<ul class="vector-menu-content-list">
+				
+				<li class="interlanguage-link interwiki-af mw-list-item"><a href="https://af.wikipedia.org/wiki/Appel" title="Appel – Afrikaans" lang="af" hreflang="af" data-title="Appel" data-language-autonym="Afrikaans" data-language-local-name="Afrikaans" class="interlanguage-link-target"><span>Afrikaans</span></a></li><li class="interlanguage-link interwiki-als mw-list-item"><a href="https://als.wikipedia.org/wiki/Apfel" title="Apfel – Alemannic" lang="gsw" hreflang="gsw" data-title="Apfel" data-language-autonym="Alemannisch" data-language-local-name="Alemannic" class="interlanguage-link-target"><span>Alemannisch</span></a></li><li class="interlanguage-link interwiki-am mw-list-item"><a href="https://am.wikipedia.org/wiki/%E1%8D%96%E1%88%9D" title="ፖም – Amharic" lang="am" hreflang="am" data-title="ፖም" data-language-autonym="አማርኛ" data-language-local-name="Amharic" class="interlanguage-link-target"><span>አማርኛ</span></a></li><li class="interlanguage-link interwiki-ang mw-list-item"><a href="https://ang.wikipedia.org/wiki/%C3%86ppel" title="Æppel – Old English" lang="ang" hreflang="ang" data-title="Æppel" data-language-autonym="Ænglisc" data-language-local-name="Old English" class="interlanguage-link-target"><span>Ænglisc</span></a></li><li class="interlanguage-link interwiki-ar mw-list-item"><a href="https://ar.wikipedia.org/wiki/%D8%AA%D9%81%D8%A7%D8%AD" title="تفاح – Arabic" lang="ar" hreflang="ar" data-title="تفاح" data-language-autonym="العربية" data-language-local-name="Arabic" class="interlanguage-link-target"><span>العربية</span></a></li><li class="interlanguage-link interwiki-an mw-list-item"><a href="https://an.wikipedia.org/wiki/Manzana" title="Manzana – Aragonese" lang="an" hreflang="an" data-title="Manzana" data-language-autonym="Aragonés" data-language-local-name="Aragonese" class="interlanguage-link-target"><span>Aragonés</span></a></li><li class="interlanguage-link interwiki-arc mw-list-item"><a 
href="https://arc.wikipedia.org/wiki/%DC%9A%DC%99%DC%98%DC%AA%DC%90" title="ܚܙܘܪܐ – Aramaic" lang="arc" hreflang="arc" data-title="ܚܙܘܪܐ" data-language-autonym="ܐܪܡܝܐ" data-language-local-name="Aramaic" class="interlanguage-link-target"><span>ܐܪܡܝܐ</span></a></li><li class="interlanguage-link interwiki-hyw mw-list-item"><a href="https://hyw.wikipedia.org/wiki/%D4%BD%D5%B6%D5%B1%D5%B8%D6%80" title="Խնձոր – Western Armenian" lang="hyw" hreflang="hyw" data-title="Խնձոր" data-language-autonym="Արեւմտահայերէն" data-language-local-name="Western Armenian" class="interlanguage-link-target"><span>Արեւմտահայերէն</span></a></li><li class="interlanguage-link interwiki-roa-rup mw-list-item"><a href="https://roa-rup.wikipedia.org/wiki/Muz%C3%A2" title="Muzâ – Aromanian" lang="rup" hreflang="rup" data-title="Muzâ" data-language-autonym="Armãneashti" data-language-local-name="Aromanian" class="interlanguage-link-target"><span>Armãneashti</span></a></li><li class="interlanguage-link interwiki-as mw-list-item"><a href="https://as.wikipedia.org/wiki/%E0%A6%86%E0%A6%AA%E0%A7%87%E0%A6%B2" title="আপেল – Assamese" lang="as" hreflang="as" data-title="আপেল" data-language-autonym="অসমীয়া" data-language-local-name="Assamese" class="interlanguage-link-target"><span>অসমীয়া</span></a></li><li class="interlanguage-link interwiki-ast mw-list-item"><a href="https://ast.wikipedia.org/wiki/Mazana" title="Mazana – Asturian" lang="ast" hreflang="ast" data-title="Mazana" data-language-autonym="Asturianu" data-language-local-name="Asturian" class="interlanguage-link-target"><span>Asturianu</span></a></li><li class="interlanguage-link interwiki-atj mw-list-item"><a href="https://atj.wikipedia.org/wiki/Wamin" title="Wamin – Atikamekw" lang="atj" hreflang="atj" data-title="Wamin" data-language-autonym="Atikamekw" data-language-local-name="Atikamekw" class="interlanguage-link-target"><span>Atikamekw</span></a></li><li class="interlanguage-link interwiki-awa mw-list-item"><a 
href="https://awa.wikipedia.org/wiki/%E0%A4%B8%E0%A5%87%E0%A4%B5" title="सेव – Awadhi" lang="awa" hreflang="awa" data-title="सेव" data-language-autonym="अवधी" data-language-local-name="Awadhi" class="interlanguage-link-target"><span>अवधी</span></a></li><li class="interlanguage-link interwiki-gn mw-list-item"><a href="https://gn.wikipedia.org/wiki/Guavirana%27a" title="Guavirana'a – Guarani" lang="gn" hreflang="gn" data-title="Guavirana'a" data-language-autonym="Avañe'ẽ" data-language-local-name="Guarani" class="interlanguage-link-target"><span>Avañe'ẽ</span></a></li><li class="interlanguage-link interwiki-az mw-list-item"><a href="https://az.wikipedia.org/wiki/Alma" title="Alma – Azerbaijani" lang="az" hreflang="az" data-title="Alma" data-language-autonym="Azərbaycanca" data-language-local-name="Azerbaijani" class="interlanguage-link-target"><span>Azərbaycanca</span></a></li><li class="interlanguage-link interwiki-azb mw-list-item"><a href="https://azb.wikipedia.org/wiki/%D8%A2%D9%84%D9%85%D8%A7" title="آلما – South Azerbaijani" lang="azb" hreflang="azb" data-title="آلما" data-language-autonym="تۆرکجه" data-language-local-name="South Azerbaijani" class="interlanguage-link-target"><span>تۆرکجه</span></a></li><li class="interlanguage-link interwiki-ban mw-list-item"><a href="https://ban.wikipedia.org/wiki/Apel" title="Apel – Balinese" lang="ban" hreflang="ban" data-title="Apel" data-language-autonym="Basa Bali" data-language-local-name="Balinese" class="interlanguage-link-target"><span>Basa Bali</span></a></li><li class="interlanguage-link interwiki-bn mw-list-item"><a href="https://bn.wikipedia.org/wiki/%E0%A6%86%E0%A6%AA%E0%A7%87%E0%A6%B2" title="আপেল – Bangla" lang="bn" hreflang="bn" data-title="আপেল" data-language-autonym="বাংলা" data-language-local-name="Bangla" class="interlanguage-link-target"><span>বাংলা</span></a></li><li class="interlanguage-link interwiki-zh-min-nan mw-list-item"><a href="https://zh-min-nan.wikipedia.org/wiki/Ph%C5%8Dng-k%C3%B3" 
title="Phōng-kó – Minnan" lang="nan" hreflang="nan" data-title="Phōng-kó" data-language-autonym="閩南語 / Bân-lâm-gú" data-language-local-name="Minnan" class="interlanguage-link-target"><span>閩南語 / Bân-lâm-gú</span></a></li><li class="interlanguage-link interwiki-map-bms mw-list-item"><a href="https://map-bms.wikipedia.org/wiki/Apel" title="Apel – Banyumasan" lang="jv-x-bms" hreflang="jv-x-bms" data-title="Apel" data-language-autonym="Basa Banyumasan" data-language-local-name="Banyumasan" class="interlanguage-link-target"><span>Basa Banyumasan</span></a></li><li class="interlanguage-link interwiki-ba mw-list-item"><a href="https://ba.wikipedia.org/wiki/%D0%90%D0%BB%D0%BC%D0%B0" title="Алма – Bashkir" lang="ba" hreflang="ba" data-title="Алма" data-language-autonym="Башҡортса" data-language-local-name="Bashkir" class="interlanguage-link-target"><span>Башҡортса</span></a></li><li class="interlanguage-link interwiki-be mw-list-item"><a href="https://be.wikipedia.org/wiki/%D0%AF%D0%B1%D0%BB%D1%8B%D0%BA" title="Яблык – Belarusian" lang="be" hreflang="be" data-title="Яблык" data-language-autonym="Беларуская" data-language-local-name="Belarusian" class="interlanguage-link-target"><span>Беларуская</span></a></li><li class="interlanguage-link interwiki-be-x-old mw-list-item"><a href="https://be-tarask.wikipedia.org/wiki/%D0%AF%D0%B1%D0%BB%D1%8B%D0%BA" title="Яблык – Belarusian (Taraškievica orthography)" lang="be-tarask" hreflang="be-tarask" data-title="Яблык" data-language-autonym="Беларуская (тарашкевіца)" data-language-local-name="Belarusian (Taraškievica orthography)" class="interlanguage-link-target"><span>Беларуская (тарашкевіца)</span></a></li><li class="interlanguage-link interwiki-bh mw-list-item"><a href="https://bh.wikipedia.org/wiki/%E0%A4%B8%E0%A5%87%E0%A4%B5" title="सेव – Bhojpuri" lang="bh" hreflang="bh" data-title="सेव" data-language-autonym="भोजपुरी" data-language-local-name="Bhojpuri" class="interlanguage-link-target"><span>भोजपुरी</span></a></li><li 
class="interlanguage-link interwiki-bcl mw-list-item"><a href="https://bcl.wikipedia.org/wiki/Mansanas" title="Mansanas – Central Bikol" lang="bcl" hreflang="bcl" data-title="Mansanas" data-language-autonym="Bikol Central" data-language-local-name="Central Bikol" class="interlanguage-link-target"><span>Bikol Central</span></a></li><li class="interlanguage-link interwiki-bi mw-list-item"><a href="https://bi.wikipedia.org/wiki/Apol" title="Apol – Bislama" lang="bi" hreflang="bi" data-title="Apol" data-language-autonym="Bislama" data-language-local-name="Bislama" class="interlanguage-link-target"><span>Bislama</span></a></li><li class="interlanguage-link interwiki-bg mw-list-item"><a href="https://bg.wikipedia.org/wiki/%D0%AF%D0%B1%D1%8A%D0%BB%D0%BA%D0%B0" title="Ябълка – Bulgarian" lang="bg" hreflang="bg" data-title="Ябълка" data-language-autonym="Български" data-language-local-name="Bulgarian" class="interlanguage-link-target"><span>Български</span></a></li><li class="interlanguage-link interwiki-bar mw-list-item"><a href="https://bar.wikipedia.org/wiki/Epfe" title="Epfe – Bavarian" lang="bar" hreflang="bar" data-title="Epfe" data-language-autonym="Boarisch" data-language-local-name="Bavarian" class="interlanguage-link-target"><span>Boarisch</span></a></li><li class="interlanguage-link interwiki-bo mw-list-item"><a href="https://bo.wikipedia.org/wiki/%E0%BD%80%E0%BD%B4%E0%BC%8B%E0%BD%A4%E0%BD%B4%E0%BC%8D" title="ཀུ་ཤུ། – Tibetan" lang="bo" hreflang="bo" data-title="ཀུ་ཤུ།" data-language-autonym="བོད་ཡིག" data-language-local-name="Tibetan" class="interlanguage-link-target"><span>བོད་ཡིག</span></a></li><li class="interlanguage-link interwiki-bs mw-list-item"><a href="https://bs.wikipedia.org/wiki/Jabuka" title="Jabuka – Bosnian" lang="bs" hreflang="bs" data-title="Jabuka" data-language-autonym="Bosanski" data-language-local-name="Bosnian" class="interlanguage-link-target"><span>Bosanski</span></a></li><li class="interlanguage-link interwiki-br mw-list-item"><a 
href="https://br.wikipedia.org/wiki/Aval" title="Aval – Breton" lang="br" hreflang="br" data-title="Aval" data-language-autonym="Brezhoneg" data-language-local-name="Breton" class="interlanguage-link-target"><span>Brezhoneg</span></a></li><li class="interlanguage-link interwiki-ca mw-list-item"><a href="https://ca.wikipedia.org/wiki/Poma" title="Poma – Catalan" lang="ca" hreflang="ca" data-title="Poma" data-language-autonym="Català" data-language-local-name="Catalan" class="interlanguage-link-target"><span>Català</span></a></li><li class="interlanguage-link interwiki-cv mw-list-item"><a href="https://cv.wikipedia.org/wiki/%D0%9F%D0%B0%D0%BD%D1%83%D0%BB%D0%BC%D0%B8" title="Панулми – Chuvash" lang="cv" hreflang="cv" data-title="Панулми" data-language-autonym="Чӑвашла" data-language-local-name="Chuvash" class="interlanguage-link-target"><span>Чӑвашла</span></a></li><li class="interlanguage-link interwiki-cs mw-list-item"><a href="https://cs.wikipedia.org/wiki/Jablko" title="Jablko – Czech" lang="cs" hreflang="cs" data-title="Jablko" data-language-autonym="Čeština" data-language-local-name="Czech" class="interlanguage-link-target"><span>Čeština</span></a></li><li class="interlanguage-link interwiki-cy mw-list-item"><a href="https://cy.wikipedia.org/wiki/Afal" title="Afal – Welsh" lang="cy" hreflang="cy" data-title="Afal" data-language-autonym="Cymraeg" data-language-local-name="Welsh" class="interlanguage-link-target"><span>Cymraeg</span></a></li><li class="interlanguage-link interwiki-da mw-list-item"><a href="https://da.wikipedia.org/wiki/%C3%86ble" title="Æble – Danish" lang="da" hreflang="da" data-title="Æble" data-language-autonym="Dansk" data-language-local-name="Danish" class="interlanguage-link-target"><span>Dansk</span></a></li><li class="interlanguage-link interwiki-ary mw-list-item"><a href="https://ary.wikipedia.org/wiki/%D8%AA%D9%81%D8%A7%D8%AD" title="تفاح – Moroccan Arabic" lang="ary" hreflang="ary" data-title="تفاح" data-language-autonym="الدارجة" 
data-language-local-name="Moroccan Arabic" class="interlanguage-link-target"><span>الدارجة</span></a></li><li class="interlanguage-link interwiki-de badge-Q70894304 mw-list-item" title=""><a href="https://de.wikipedia.org/wiki/Tafelapfel" title="Tafelapfel – German" lang="de" hreflang="de" data-title="Tafelapfel" data-language-autonym="Deutsch" data-language-local-name="German" class="interlanguage-link-target"><span>Deutsch</span></a></li><li class="interlanguage-link interwiki-dv mw-list-item"><a href="https://dv.wikipedia.org/wiki/%DE%87%DE%A7%DE%8A%DE%A6%DE%8D%DE%B0" title="އާފަލް – Divehi" lang="dv" hreflang="dv" data-title="އާފަލް" data-language-autonym="ދިވެހިބަސް" data-language-local-name="Divehi" class="interlanguage-link-target"><span>ދިވެހިބަސް</span></a></li><li class="interlanguage-link interwiki-nv mw-list-item"><a href="https://nv.wikipedia.org/wiki/Bilas%C3%A1ana" title="Bilasáana – Navajo" lang="nv" hreflang="nv" data-title="Bilasáana" data-language-autonym="Diné bizaad" data-language-local-name="Navajo" class="interlanguage-link-target"><span>Diné bizaad</span></a></li><li class="interlanguage-link interwiki-dsb mw-list-item"><a href="https://dsb.wikipedia.org/wiki/Jab%C5%82uko" title="Jabłuko – Lower Sorbian" lang="dsb" hreflang="dsb" data-title="Jabłuko" data-language-autonym="Dolnoserbski" data-language-local-name="Lower Sorbian" class="interlanguage-link-target"><span>Dolnoserbski</span></a></li><li class="interlanguage-link interwiki-et mw-list-item"><a href="https://et.wikipedia.org/wiki/%C3%95un" title="Õun – Estonian" lang="et" hreflang="et" data-title="Õun" data-language-autonym="Eesti" data-language-local-name="Estonian" class="interlanguage-link-target"><span>Eesti</span></a></li><li class="interlanguage-link interwiki-el mw-list-item"><a href="https://el.wikipedia.org/wiki/%CE%9C%CE%AE%CE%BB%CE%BF" title="Μήλο – Greek" lang="el" hreflang="el" data-title="Μήλο" data-language-autonym="Ελληνικά" data-language-local-name="Greek" 
class="interlanguage-link-target"><span>Ελληνικά</span></a></li><li class="interlanguage-link interwiki-eml mw-list-item"><a href="https://eml.wikipedia.org/wiki/P%C3%A0m" title="Pàm – Emiliano-Romagnolo" lang="egl" hreflang="egl" data-title="Pàm" data-language-autonym="Emiliàn e rumagnòl" data-language-local-name="Emiliano-Romagnolo" class="interlanguage-link-target"><span>Emiliàn e rumagnòl</span></a></li><li class="interlanguage-link interwiki-es mw-list-item"><a href="https://es.wikipedia.org/wiki/Manzana" title="Manzana – Spanish" lang="es" hreflang="es" data-title="Manzana" data-language-autonym="Español" data-language-local-name="Spanish" class="interlanguage-link-target"><span>Español</span></a></li><li class="interlanguage-link interwiki-eo badge-Q17437798 badge-goodarticle mw-list-item" title="good article badge"><a href="https://eo.wikipedia.org/wiki/Pomo" title="Pomo – Esperanto" lang="eo" hreflang="eo" data-title="Pomo" data-language-autonym="Esperanto" data-language-local-name="Esperanto" class="interlanguage-link-target"><span>Esperanto</span></a></li><li class="interlanguage-link interwiki-eu mw-list-item"><a href="https://eu.wikipedia.org/wiki/Sagar" title="Sagar – Basque" lang="eu" hreflang="eu" data-title="Sagar" data-language-autonym="Euskara" data-language-local-name="Basque" class="interlanguage-link-target"><span>Euskara</span></a></li><li class="interlanguage-link interwiki-fa badge-Q17437798 badge-goodarticle mw-list-item" title="good article badge"><a href="https://fa.wikipedia.org/wiki/%D8%B3%DB%8C%D8%A8" title="سیب – Persian" lang="fa" hreflang="fa" data-title="سیب" data-language-autonym="فارسی" data-language-local-name="Persian" class="interlanguage-link-target"><span>فارسی</span></a></li><li class="interlanguage-link interwiki-hif mw-list-item"><a href="https://hif.wikipedia.org/wiki/Aapul" title="Aapul – Fiji Hindi" lang="hif" hreflang="hif" data-title="Aapul" data-language-autonym="Fiji Hindi" data-language-local-name="Fiji Hindi" 
class="interlanguage-link-target"><span>Fiji Hindi</span></a></li><li class="interlanguage-link interwiki-fr mw-list-item"><a href="https://fr.wikipedia.org/wiki/Pomme" title="Pomme – French" lang="fr" hreflang="fr" data-title="Pomme" data-language-autonym="Français" data-language-local-name="French" class="interlanguage-link-target"><span>Français</span></a></li><li class="interlanguage-link interwiki-fy mw-list-item"><a href="https://fy.wikipedia.org/wiki/Apel" title="Apel – Western Frisian" lang="fy" hreflang="fy" data-title="Apel" data-language-autonym="Frysk" data-language-local-name="Western Frisian" class="interlanguage-link-target"><span>Frysk</span></a></li><li class="interlanguage-link interwiki-fur mw-list-item"><a href="https://fur.wikipedia.org/wiki/Milu%C3%A7%C3%A2r" title="Miluçâr – Friulian" lang="fur" hreflang="fur" data-title="Miluçâr" data-language-autonym="Furlan" data-language-local-name="Friulian" class="interlanguage-link-target"><span>Furlan</span></a></li><li class="interlanguage-link interwiki-ga mw-list-item"><a href="https://ga.wikipedia.org/wiki/%C3%9All" title="Úll – Irish" lang="ga" hreflang="ga" data-title="Úll" data-language-autonym="Gaeilge" data-language-local-name="Irish" class="interlanguage-link-target"><span>Gaeilge</span></a></li><li class="interlanguage-link interwiki-gd mw-list-item"><a href="https://gd.wikipedia.org/wiki/Ubhal" title="Ubhal – Scottish Gaelic" lang="gd" hreflang="gd" data-title="Ubhal" data-language-autonym="Gàidhlig" data-language-local-name="Scottish Gaelic" class="interlanguage-link-target"><span>Gàidhlig</span></a></li><li class="interlanguage-link interwiki-gl mw-list-item"><a href="https://gl.wikipedia.org/wiki/Maz%C3%A1" title="Mazá – Galician" lang="gl" hreflang="gl" data-title="Mazá" data-language-autonym="Galego" data-language-local-name="Galician" class="interlanguage-link-target"><span>Galego</span></a></li><li class="interlanguage-link interwiki-gan mw-list-item"><a 
href="https://gan.wikipedia.org/wiki/%E8%98%8B%E6%9E%9C" title="蘋果 – Gan" lang="gan" hreflang="gan" data-title="蘋果" data-language-autonym="贛語" data-language-local-name="Gan" class="interlanguage-link-target"><span>贛語</span></a></li><li class="interlanguage-link interwiki-gu mw-list-item"><a href="https://gu.wikipedia.org/wiki/%E0%AA%B8%E0%AA%AB%E0%AA%B0%E0%AA%9C%E0%AA%A8" title="સફરજન – Gujarati" lang="gu" hreflang="gu" data-title="સફરજન" data-language-autonym="ગુજરાતી" data-language-local-name="Gujarati" class="interlanguage-link-target"><span>ગુજરાતી</span></a></li><li class="interlanguage-link interwiki-hak mw-list-item"><a href="https://hak.wikipedia.org/wiki/Ph%C3%ACn-k%C3%B3" title="Phìn-kó – Hakka Chinese" lang="hak" hreflang="hak" data-title="Phìn-kó" data-language-autonym="客家語 / Hak-kâ-ngî" data-language-local-name="Hakka Chinese" class="interlanguage-link-target"><span>客家語 / Hak-kâ-ngî</span></a></li><li class="interlanguage-link interwiki-xal mw-list-item"><a href="https://xal.wikipedia.org/wiki/%D0%90%D0%BB%D1%8C%D0%BC%D0%B0%D0%BD" title="Альман – Kalmyk" lang="xal" hreflang="xal" data-title="Альман" data-language-autonym="Хальмг" data-language-local-name="Kalmyk" class="interlanguage-link-target"><span>Хальмг</span></a></li><li class="interlanguage-link interwiki-ko mw-list-item"><a href="https://ko.wikipedia.org/wiki/%EC%82%AC%EA%B3%BC" title="사과 – Korean" lang="ko" hreflang="ko" data-title="사과" data-language-autonym="한국어" data-language-local-name="Korean" class="interlanguage-link-target"><span>한국어</span></a></li><li class="interlanguage-link interwiki-ha mw-list-item"><a href="https://ha.wikipedia.org/wiki/Tuffa" title="Tuffa – Hausa" lang="ha" hreflang="ha" data-title="Tuffa" data-language-autonym="Hausa" data-language-local-name="Hausa" class="interlanguage-link-target"><span>Hausa</span></a></li><li class="interlanguage-link interwiki-hy mw-list-item"><a href="https://hy.wikipedia.org/wiki/%D4%BD%D5%B6%D5%B1%D5%B8%D6%80" title="Խնձոր – Armenian" 
lang="hy" hreflang="hy" data-title="Խնձոր" data-language-autonym="Հայերեն" data-language-local-name="Armenian" class="interlanguage-link-target"><span>Հայերեն</span></a></li><li class="interlanguage-link interwiki-hi mw-list-item"><a href="https://hi.wikipedia.org/wiki/%E0%A4%B8%E0%A5%87%E0%A4%AC" title="सेब – Hindi" lang="hi" hreflang="hi" data-title="सेब" data-language-autonym="हिन्दी" data-language-local-name="Hindi" class="interlanguage-link-target"><span>हिन्दी</span></a></li><li class="interlanguage-link interwiki-hsb mw-list-item"><a href="https://hsb.wikipedia.org/wiki/Jab%C5%82uko" title="Jabłuko – Upper Sorbian" lang="hsb" hreflang="hsb" data-title="Jabłuko" data-language-autonym="Hornjoserbsce" data-language-local-name="Upper Sorbian" class="interlanguage-link-target"><span>Hornjoserbsce</span></a></li><li class="interlanguage-link interwiki-hr mw-list-item"><a href="https://hr.wikipedia.org/wiki/Pitoma_jabuka" title="Pitoma jabuka – Croatian" lang="hr" hreflang="hr" data-title="Pitoma jabuka" data-language-autonym="Hrvatski" data-language-local-name="Croatian" class="interlanguage-link-target"><span>Hrvatski</span></a></li><li class="interlanguage-link interwiki-io mw-list-item"><a href="https://io.wikipedia.org/wiki/Pomo" title="Pomo – Ido" lang="io" hreflang="io" data-title="Pomo" data-language-autonym="Ido" data-language-local-name="Ido" class="interlanguage-link-target"><span>Ido</span></a></li><li class="interlanguage-link interwiki-ig mw-list-item"><a href="https://ig.wikipedia.org/wiki/Apple" title="Apple – Igbo" lang="ig" hreflang="ig" data-title="Apple" data-language-autonym="Igbo" data-language-local-name="Igbo" class="interlanguage-link-target"><span>Igbo</span></a></li><li class="interlanguage-link interwiki-ilo mw-list-item"><a href="https://ilo.wikipedia.org/wiki/Mansanas" title="Mansanas – Iloko" lang="ilo" hreflang="ilo" data-title="Mansanas" data-language-autonym="Ilokano" data-language-local-name="Iloko" 
class="interlanguage-link-target"><span>Ilokano</span></a></li><li class="interlanguage-link interwiki-id badge-Q17437798 badge-goodarticle mw-list-item" title="good article badge"><a href="https://id.wikipedia.org/wiki/Apel" title="Apel – Indonesian" lang="id" hreflang="id" data-title="Apel" data-language-autonym="Bahasa Indonesia" data-language-local-name="Indonesian" class="interlanguage-link-target"><span>Bahasa Indonesia</span></a></li><li class="interlanguage-link interwiki-ia mw-list-item"><a href="https://ia.wikipedia.org/wiki/Pomo" title="Pomo – Interlingua" lang="ia" hreflang="ia" data-title="Pomo" data-language-autonym="Interlingua" data-language-local-name="Interlingua" class="interlanguage-link-target"><span>Interlingua</span></a></li><li class="interlanguage-link interwiki-iu mw-list-item"><a href="https://iu.wikipedia.org/wiki/%E1%91%AD%E1%92%BB%E1%92%A5%E1%93%87%E1%90%85%E1%94%AD%E1%96%85" title="ᑭᒻᒥᓇᐅᔭᖅ – Inuktitut" lang="iu" hreflang="iu" data-title="ᑭᒻᒥᓇᐅᔭᖅ" data-language-autonym="ᐃᓄᒃᑎᑐᑦ / inuktitut" data-language-local-name="Inuktitut" class="interlanguage-link-target"><span>ᐃᓄᒃᑎᑐᑦ / inuktitut</span></a></li><li class="interlanguage-link interwiki-ik mw-list-item"><a href="https://ik.wikipedia.org/wiki/Aapuq" title="Aapuq – Inupiaq" lang="ik" hreflang="ik" data-title="Aapuq" data-language-autonym="Iñupiatun" data-language-local-name="Inupiaq" class="interlanguage-link-target"><span>Iñupiatun</span></a></li><li class="interlanguage-link interwiki-os mw-list-item"><a href="https://os.wikipedia.org/wiki/%D0%A4%C3%A6%D1%82%D0%BA%D1%8A%D1%83%D1%8B" title="Фæткъуы – Ossetic" lang="os" hreflang="os" data-title="Фæткъуы" data-language-autonym="Ирон" data-language-local-name="Ossetic" class="interlanguage-link-target"><span>Ирон</span></a></li><li class="interlanguage-link interwiki-zu mw-list-item"><a href="https://zu.wikipedia.org/wiki/IPhumezi" title="IPhumezi – Zulu" lang="zu" hreflang="zu" data-title="IPhumezi" data-language-autonym="IsiZulu" 
data-language-local-name="Zulu" class="interlanguage-link-target"><span>IsiZulu</span></a></li><li class="interlanguage-link interwiki-is mw-list-item"><a href="https://is.wikipedia.org/wiki/Epli" title="Epli – Icelandic" lang="is" hreflang="is" data-title="Epli" data-language-autonym="Íslenska" data-language-local-name="Icelandic" class="interlanguage-link-target"><span>Íslenska</span></a></li><li class="interlanguage-link interwiki-it mw-list-item"><a href="https://it.wikipedia.org/wiki/Mela" title="Mela – Italian" lang="it" hreflang="it" data-title="Mela" data-language-autonym="Italiano" data-language-local-name="Italian" class="interlanguage-link-target"><span>Italiano</span></a></li><li class="interlanguage-link interwiki-he mw-list-item"><a href="https://he.wikipedia.org/wiki/%D7%AA%D7%A4%D7%95%D7%97" title="תפוח – Hebrew" lang="he" hreflang="he" data-title="תפוח" data-language-autonym="עברית" data-language-local-name="Hebrew" class="interlanguage-link-target"><span>עברית</span></a></li><li class="interlanguage-link interwiki-jv mw-list-item"><a href="https://jv.wikipedia.org/wiki/Apel" title="Apel – Javanese" lang="jv" hreflang="jv" data-title="Apel" data-language-autonym="Jawa" data-language-local-name="Javanese" class="interlanguage-link-target"><span>Jawa</span></a></li><li class="interlanguage-link interwiki-kn mw-list-item"><a href="https://kn.wikipedia.org/wiki/%E0%B2%B8%E0%B3%87%E0%B2%AC%E0%B3%81" title="ಸೇಬು – Kannada" lang="kn" hreflang="kn" data-title="ಸೇಬು" data-language-autonym="ಕನ್ನಡ" data-language-local-name="Kannada" class="interlanguage-link-target"><span>ಕನ್ನಡ</span></a></li><li class="interlanguage-link interwiki-krc mw-list-item"><a href="https://krc.wikipedia.org/wiki/%D0%90%D0%BB%D0%BC%D0%B0" title="Алма – Karachay-Balkar" lang="krc" hreflang="krc" data-title="Алма" data-language-autonym="Къарачай-малкъар" data-language-local-name="Karachay-Balkar" class="interlanguage-link-target"><span>Къарачай-малкъар</span></a></li><li 
class="interlanguage-link interwiki-ks mw-list-item"><a href="https://ks.wikipedia.org/wiki/%DA%98%D9%88%D9%97%D9%86%D9%9B%D9%B9%DA%BE" title="ژوٗنٛٹھ – Kashmiri" lang="ks" hreflang="ks" data-title="ژوٗنٛٹھ" data-language-autonym="कॉशुर / کٲشُر" data-language-local-name="Kashmiri" class="interlanguage-link-target"><span>कॉशुर / کٲشُر</span></a></li><li class="interlanguage-link interwiki-kk mw-list-item"><a href="https://kk.wikipedia.org/wiki/%D0%90%D0%BB%D0%BC%D0%B0" title="Алма – Kazakh" lang="kk" hreflang="kk" data-title="Алма" data-language-autonym="Қазақша" data-language-local-name="Kazakh" class="interlanguage-link-target"><span>Қазақша</span></a></li><li class="interlanguage-link interwiki-rw mw-list-item"><a href="https://rw.wikipedia.org/wiki/Pome" title="Pome – Kinyarwanda" lang="rw" hreflang="rw" data-title="Pome" data-language-autonym="Ikinyarwanda" data-language-local-name="Kinyarwanda" class="interlanguage-link-target"><span>Ikinyarwanda</span></a></li><li class="interlanguage-link interwiki-sw mw-list-item"><a href="https://sw.wikipedia.org/wiki/Tofaa" title="Tofaa – Swahili" lang="sw" hreflang="sw" data-title="Tofaa" data-language-autonym="Kiswahili" data-language-local-name="Swahili" class="interlanguage-link-target"><span>Kiswahili</span></a></li><li class="interlanguage-link interwiki-ht mw-list-item"><a href="https://ht.wikipedia.org/wiki/P%C3%B2m" title="Pòm – Haitian Creole" lang="ht" hreflang="ht" data-title="Pòm" data-language-autonym="Kreyòl ayisyen" data-language-local-name="Haitian Creole" class="interlanguage-link-target"><span>Kreyòl ayisyen</span></a></li><li class="interlanguage-link interwiki-ku mw-list-item"><a href="https://ku.wikipedia.org/wiki/S%C3%AAv" title="Sêv – Kurdish" lang="ku" hreflang="ku" data-title="Sêv" data-language-autonym="Kurdî" data-language-local-name="Kurdish" class="interlanguage-link-target"><span>Kurdî</span></a></li><li class="interlanguage-link interwiki-ky mw-list-item"><a 
href="https://ky.wikipedia.org/wiki/%D0%90%D0%BB%D0%BC%D0%B0" title="Алма – Kyrgyz" lang="ky" hreflang="ky" data-title="Алма" data-language-autonym="Кыргызча" data-language-local-name="Kyrgyz" class="interlanguage-link-target"><span>Кыргызча</span></a></li><li class="interlanguage-link interwiki-lad mw-list-item"><a href="https://lad.wikipedia.org/wiki/Mansana" title="Mansana – Ladino" lang="lad" hreflang="lad" data-title="Mansana" data-language-autonym="Ladino" data-language-local-name="Ladino" class="interlanguage-link-target"><span>Ladino</span></a></li><li class="interlanguage-link interwiki-lo mw-list-item"><a href="https://lo.wikipedia.org/wiki/%E0%BB%9D%E0%BA%B2%E0%BA%81%E0%BA%9B%E0%BA%BB%E0%BB%88%E0%BA%A1" title="ໝາກປົ່ມ – Lao" lang="lo" hreflang="lo" data-title="ໝາກປົ່ມ" data-language-autonym="ລາວ" data-language-local-name="Lao" class="interlanguage-link-target"><span>ລາວ</span></a></li><li class="interlanguage-link interwiki-la mw-list-item"><a href="https://la.wikipedia.org/wiki/Malum" title="Malum – Latin" lang="la" hreflang="la" data-title="Malum" data-language-autonym="Latina" data-language-local-name="Latin" class="interlanguage-link-target"><span>Latina</span></a></li><li class="interlanguage-link interwiki-lv mw-list-item"><a href="https://lv.wikipedia.org/wiki/%C4%80bols" title="Ābols – Latvian" lang="lv" hreflang="lv" data-title="Ābols" data-language-autonym="Latviešu" data-language-local-name="Latvian" class="interlanguage-link-target"><span>Latviešu</span></a></li><li class="interlanguage-link interwiki-lb mw-list-item"><a href="https://lb.wikipedia.org/wiki/Apel" title="Apel – Luxembourgish" lang="lb" hreflang="lb" data-title="Apel" data-language-autonym="Lëtzebuergesch" data-language-local-name="Luxembourgish" class="interlanguage-link-target"><span>Lëtzebuergesch</span></a></li><li class="interlanguage-link interwiki-lt mw-list-item"><a href="https://lt.wikipedia.org/wiki/Obuolys" title="Obuolys – Lithuanian" lang="lt" hreflang="lt" 
data-title="Obuolys" data-language-autonym="Lietuvių" data-language-local-name="Lithuanian" class="interlanguage-link-target"><span>Lietuvių</span></a></li><li class="interlanguage-link interwiki-lij mw-list-item"><a href="https://lij.wikipedia.org/wiki/Mei" title="Mei – Ligurian" lang="lij" hreflang="lij" data-title="Mei" data-language-autonym="Ligure" data-language-local-name="Ligurian" class="interlanguage-link-target"><span>Ligure</span></a></li><li class="interlanguage-link interwiki-li mw-list-item"><a href="https://li.wikipedia.org/wiki/Appel" title="Appel – Limburgish" lang="li" hreflang="li" data-title="Appel" data-language-autonym="Limburgs" data-language-local-name="Limburgish" class="interlanguage-link-target"><span>Limburgs</span></a></li><li class="interlanguage-link interwiki-olo mw-list-item"><a href="https://olo.wikipedia.org/wiki/Juablokku" title="Juablokku – Livvi-Karelian" lang="olo" hreflang="olo" data-title="Juablokku" data-language-autonym="Livvinkarjala" data-language-local-name="Livvi-Karelian" class="interlanguage-link-target"><span>Livvinkarjala</span></a></li><li class="interlanguage-link interwiki-jbo mw-list-item"><a href="https://jbo.wikipedia.org/wiki/plise" title="plise – Lojban" lang="jbo" hreflang="jbo" data-title="plise" data-language-autonym="La .lojban." 
data-language-local-name="Lojban" class="interlanguage-link-target"><span>La .lojban.</span></a></li><li class="interlanguage-link interwiki-mk mw-list-item"><a href="https://mk.wikipedia.org/wiki/%D0%88%D0%B0%D0%B1%D0%BE%D0%BB%D0%BA%D0%BE" title="Јаболко – Macedonian" lang="mk" hreflang="mk" data-title="Јаболко" data-language-autonym="Македонски" data-language-local-name="Macedonian" class="interlanguage-link-target"><span>Македонски</span></a></li><li class="interlanguage-link interwiki-mg mw-list-item"><a href="https://mg.wikipedia.org/wiki/Paoma" title="Paoma – Malagasy" lang="mg" hreflang="mg" data-title="Paoma" data-language-autonym="Malagasy" data-language-local-name="Malagasy" class="interlanguage-link-target"><span>Malagasy</span></a></li><li class="interlanguage-link interwiki-ml mw-list-item"><a href="https://ml.wikipedia.org/wiki/%E0%B4%86%E0%B4%AA%E0%B5%8D%E0%B4%AA%E0%B4%BF%E0%B5%BE" title="ആപ്പിൾ – Malayalam" lang="ml" hreflang="ml" data-title="ആപ്പിൾ" data-language-autonym="മലയാളം" data-language-local-name="Malayalam" class="interlanguage-link-target"><span>മലയാളം</span></a></li><li class="interlanguage-link interwiki-mi mw-list-item"><a href="https://mi.wikipedia.org/wiki/%C4%80poro" title="Āporo – Māori" lang="mi" hreflang="mi" data-title="Āporo" data-language-autonym="Māori" data-language-local-name="Māori" class="interlanguage-link-target"><span>Māori</span></a></li><li class="interlanguage-link interwiki-mr mw-list-item"><a href="https://mr.wikipedia.org/wiki/%E0%A4%B8%E0%A4%AB%E0%A4%B0%E0%A4%9A%E0%A4%82%E0%A4%A6" title="सफरचंद – Marathi" lang="mr" hreflang="mr" data-title="सफरचंद" data-language-autonym="मराठी" data-language-local-name="Marathi" class="interlanguage-link-target"><span>मराठी</span></a></li><li class="interlanguage-link interwiki-arz mw-list-item"><a href="https://arz.wikipedia.org/wiki/%D8%AA%D9%81%D8%A7%D8%AD" title="تفاح – Egyptian Arabic" lang="arz" hreflang="arz" data-title="تفاح" data-language-autonym="مصرى" 
data-language-local-name="Egyptian Arabic" class="interlanguage-link-target"><span>مصرى</span></a></li><li class="interlanguage-link interwiki-ms mw-list-item"><a href="https://ms.wikipedia.org/wiki/Epal" title="Epal – Malay" lang="ms" hreflang="ms" data-title="Epal" data-language-autonym="Bahasa Melayu" data-language-local-name="Malay" class="interlanguage-link-target"><span>Bahasa Melayu</span></a></li><li class="interlanguage-link interwiki-mni mw-list-item"><a href="https://mni.wikipedia.org/wiki/%EA%AF%81%EA%AF%A6%EA%AF%9D_(%EA%AF%8D%EA%AF%A9)" title="ꯁꯦꯝ (ꯍꯩ) – Manipuri" lang="mni" hreflang="mni" data-title="ꯁꯦꯝ (ꯍꯩ)" data-language-autonym="ꯃꯤꯇꯩ ꯂꯣꯟ" data-language-local-name="Manipuri" class="interlanguage-link-target"><span>ꯃꯤꯇꯩ ꯂꯣꯟ</span></a></li><li class="interlanguage-link interwiki-cdo mw-list-item"><a href="https://cdo.wikipedia.org/wiki/B%C3%ACng-gu%C5%8D" title="Bìng-guō – Mindong" lang="cdo" hreflang="cdo" data-title="Bìng-guō" data-language-autonym="閩東語 / Mìng-dĕ̤ng-ngṳ̄" data-language-local-name="Mindong" class="interlanguage-link-target"><span>閩東語 / Mìng-dĕ̤ng-ngṳ̄</span></a></li><li class="interlanguage-link interwiki-mwl mw-list-item"><a href="https://mwl.wikipedia.org/wiki/Ma%C3%A7ana" title="Maçana – Mirandese" lang="mwl" hreflang="mwl" data-title="Maçana" data-language-autonym="Mirandés" data-language-local-name="Mirandese" class="interlanguage-link-target"><span>Mirandés</span></a></li><li class="interlanguage-link interwiki-mdf mw-list-item"><a href="https://mdf.wikipedia.org/wiki/%D0%9C%D0%B0%D1%80%D1%8C%D1%81%D1%8C" title="Марьсь – Moksha" lang="mdf" hreflang="mdf" data-title="Марьсь" data-language-autonym="Мокшень" data-language-local-name="Moksha" class="interlanguage-link-target"><span>Мокшень</span></a></li><li class="interlanguage-link interwiki-my mw-list-item"><a href="https://my.wikipedia.org/wiki/%E1%80%95%E1%80%94%E1%80%BA%E1%80%B8%E1%80%9E%E1%80%AE%E1%80%B8" title="ပန်းသီး – Burmese" lang="my" hreflang="my" 
data-title="ပန်းသီး" data-language-autonym="မြန်မာဘာသာ" data-language-local-name="Burmese" class="interlanguage-link-target"><span>မြန်မာဘာသာ</span></a></li><li class="interlanguage-link interwiki-fj mw-list-item"><a href="https://fj.wikipedia.org/wiki/Yapolo" title="Yapolo – Fijian" lang="fj" hreflang="fj" data-title="Yapolo" data-language-autonym="Na Vosa Vakaviti" data-language-local-name="Fijian" class="interlanguage-link-target"><span>Na Vosa Vakaviti</span></a></li><li class="interlanguage-link interwiki-nl mw-list-item"><a href="https://nl.wikipedia.org/wiki/Appel_(vrucht)" title="Appel (vrucht) – Dutch" lang="nl" hreflang="nl" data-title="Appel (vrucht)" data-language-autonym="Nederlands" data-language-local-name="Dutch" class="interlanguage-link-target"><span>Nederlands</span></a></li><li class="interlanguage-link interwiki-ne mw-list-item"><a href="https://ne.wikipedia.org/wiki/%E0%A4%B8%E0%A5%8D%E0%A4%AF%E0%A4%BE%E0%A4%89" title="स्याउ – Nepali" lang="ne" hreflang="ne" data-title="स्याउ" data-language-autonym="नेपाली" data-language-local-name="Nepali" class="interlanguage-link-target"><span>नेपाली</span></a></li><li class="interlanguage-link interwiki-new mw-list-item"><a href="https://new.wikipedia.org/wiki/%E0%A4%B8%E0%A5%8D%E0%A4%AF%E0%A4%BE%E0%A4%89" title="स्याउ – Newari" lang="new" hreflang="new" data-title="स्याउ" data-language-autonym="नेपाल भाषा" data-language-local-name="Newari" class="interlanguage-link-target"><span>नेपाल भाषा</span></a></li><li class="interlanguage-link interwiki-ja mw-list-item"><a href="https://ja.wikipedia.org/wiki/%E3%83%AA%E3%83%B3%E3%82%B4" title="リンゴ – Japanese" lang="ja" hreflang="ja" data-title="リンゴ" data-language-autonym="日本語" data-language-local-name="Japanese" class="interlanguage-link-target"><span>日本語</span></a></li><li class="interlanguage-link interwiki-nap mw-list-item"><a href="https://nap.wikipedia.org/wiki/Milo" title="Milo – Neapolitan" lang="nap" hreflang="nap" data-title="Milo" 
data-language-autonym="Napulitano" data-language-local-name="Neapolitan" class="interlanguage-link-target"><span>Napulitano</span></a></li><li class="interlanguage-link interwiki-ce mw-list-item"><a href="https://ce.wikipedia.org/wiki/%D3%80%D0%B0%D0%B6" title="Ӏаж – Chechen" lang="ce" hreflang="ce" data-title="Ӏаж" data-language-autonym="Нохчийн" data-language-local-name="Chechen" class="interlanguage-link-target"><span>Нохчийн</span></a></li><li class="interlanguage-link interwiki-no mw-list-item"><a href="https://no.wikipedia.org/wiki/Eple" title="Eple – Norwegian Bokmål" lang="nb" hreflang="nb" data-title="Eple" data-language-autonym="Norsk bokmål" data-language-local-name="Norwegian Bokmål" class="interlanguage-link-target"><span>Norsk bokmål</span></a></li><li class="interlanguage-link interwiki-nn mw-list-item"><a href="https://nn.wikipedia.org/wiki/Eple" title="Eple – Norwegian Nynorsk" lang="nn" hreflang="nn" data-title="Eple" data-language-autonym="Norsk nynorsk" data-language-local-name="Norwegian Nynorsk" class="interlanguage-link-target"><span>Norsk nynorsk</span></a></li><li class="interlanguage-link interwiki-nrm mw-list-item"><a href="https://nrm.wikipedia.org/wiki/Poume" title="Poume – Norman" lang="nrf" hreflang="nrf" data-title="Poume" data-language-autonym="Nouormand" data-language-local-name="Norman" class="interlanguage-link-target"><span>Nouormand</span></a></li><li class="interlanguage-link interwiki-oc mw-list-item"><a href="https://oc.wikipedia.org/wiki/Poma" title="Poma – Occitan" lang="oc" hreflang="oc" data-title="Poma" data-language-autonym="Occitan" data-language-local-name="Occitan" class="interlanguage-link-target"><span>Occitan</span></a></li><li class="interlanguage-link interwiki-mhr mw-list-item"><a href="https://mhr.wikipedia.org/wiki/%D0%9E%D0%BB%D0%BC%D0%B0" title="Олма – Eastern Mari" lang="mhr" hreflang="mhr" data-title="Олма" data-language-autonym="Олык марий" data-language-local-name="Eastern Mari" 
class="interlanguage-link-target"><span>Олык марий</span></a></li><li class="interlanguage-link interwiki-om mw-list-item"><a href="https://om.wikipedia.org/wiki/Appilii" title="Appilii – Oromo" lang="om" hreflang="om" data-title="Appilii" data-language-autonym="Oromoo" data-language-local-name="Oromo" class="interlanguage-link-target"><span>Oromoo</span></a></li><li class="interlanguage-link interwiki-uz mw-list-item"><a href="https://uz.wikipedia.org/wiki/Olma" title="Olma – Uzbek" lang="uz" hreflang="uz" data-title="Olma" data-language-autonym="Oʻzbekcha / ўзбекча" data-language-local-name="Uzbek" class="interlanguage-link-target"><span>Oʻzbekcha / ўзбекча</span></a></li><li class="interlanguage-link interwiki-pa mw-list-item"><a href="https://pa.wikipedia.org/wiki/%E0%A8%B8%E0%A9%87%E0%A8%AC" title="ਸੇਬ – Punjabi" lang="pa" hreflang="pa" data-title="ਸੇਬ" data-language-autonym="ਪੰਜਾਬੀ" data-language-local-name="Punjabi" class="interlanguage-link-target"><span>ਪੰਜਾਬੀ</span></a></li><li class="interlanguage-link interwiki-pnb mw-list-item"><a href="https://pnb.wikipedia.org/wiki/%D8%B3%DB%8C%D8%A8" title="سیب – Western Punjabi" lang="pnb" hreflang="pnb" data-title="سیب" data-language-autonym="پنجابی" data-language-local-name="Western Punjabi" class="interlanguage-link-target"><span>پنجابی</span></a></li><li class="interlanguage-link interwiki-pl mw-list-item"><a href="https://pl.wikipedia.org/wiki/Jab%C5%82ko" title="Jabłko – Polish" lang="pl" hreflang="pl" data-title="Jabłko" data-language-autonym="Polski" data-language-local-name="Polish" class="interlanguage-link-target"><span>Polski</span></a></li><li class="interlanguage-link interwiki-pt mw-list-item"><a href="https://pt.wikipedia.org/wiki/Ma%C3%A7%C3%A3" title="Maçã – Portuguese" lang="pt" hreflang="pt" data-title="Maçã" data-language-autonym="Português" data-language-local-name="Portuguese" class="interlanguage-link-target"><span>Português</span></a></li><li class="interlanguage-link interwiki-kaa 
mw-list-item"><a href="https://kaa.wikipedia.org/wiki/Alma" title="Alma – Kara-Kalpak" lang="kaa" hreflang="kaa" data-title="Alma" data-language-autonym="Qaraqalpaqsha" data-language-local-name="Kara-Kalpak" class="interlanguage-link-target"><span>Qaraqalpaqsha</span></a></li><li class="interlanguage-link interwiki-crh mw-list-item"><a href="https://crh.wikipedia.org/wiki/Alma" title="Alma – Crimean Tatar" lang="crh" hreflang="crh" data-title="Alma" data-language-autonym="Qırımtatarca" data-language-local-name="Crimean Tatar" class="interlanguage-link-target"><span>Qırımtatarca</span></a></li><li class="interlanguage-link interwiki-ksh mw-list-item"><a href="https://ksh.wikipedia.org/wiki/Appel" title="Appel – Colognian" lang="ksh" hreflang="ksh" data-title="Appel" data-language-autonym="Ripoarisch" data-language-local-name="Colognian" class="interlanguage-link-target"><span>Ripoarisch</span></a></li><li class="interlanguage-link interwiki-ro mw-list-item"><a href="https://ro.wikipedia.org/wiki/M%C4%83r" title="Măr – Romanian" lang="ro" hreflang="ro" data-title="Măr" data-language-autonym="Română" data-language-local-name="Romanian" class="interlanguage-link-target"><span>Română</span></a></li><li class="interlanguage-link interwiki-rmy mw-list-item"><a href="https://rmy.wikipedia.org/wiki/Pomalo" title="Pomalo – Vlax Romani" lang="rmy" hreflang="rmy" data-title="Pomalo" data-language-autonym="Romani čhib" data-language-local-name="Vlax Romani" class="interlanguage-link-target"><span>Romani čhib</span></a></li><li class="interlanguage-link interwiki-rue mw-list-item"><a href="https://rue.wikipedia.org/wiki/%D0%AF%D0%B1%D0%BA%D0%BE" title="Ябко – Rusyn" lang="rue" hreflang="rue" data-title="Ябко" data-language-autonym="Русиньскый" data-language-local-name="Rusyn" class="interlanguage-link-target"><span>Русиньскый</span></a></li><li class="interlanguage-link interwiki-ru mw-list-item"><a href="https://ru.wikipedia.org/wiki/%D0%AF%D0%B1%D0%BB%D0%BE%D0%BA%D0%BE" 
title="Яблоко – Russian" lang="ru" hreflang="ru" data-title="Яблоко" data-language-autonym="Русский" data-language-local-name="Russian" class="interlanguage-link-target"><span>Русский</span></a></li><li class="interlanguage-link interwiki-sah mw-list-item"><a href="https://sah.wikipedia.org/wiki/%D0%94%D1%8C%D0%B0%D0%B0%D0%B1%D1%8B%D0%BB%D1%8B%D0%BA%D0%B0" title="Дьаабылыка – Yakut" lang="sah" hreflang="sah" data-title="Дьаабылыка" data-language-autonym="Саха тыла" data-language-local-name="Yakut" class="interlanguage-link-target"><span>Саха тыла</span></a></li><li class="interlanguage-link interwiki-szy mw-list-item"><a href="https://szy.wikipedia.org/wiki/dayas_siku" title="dayas siku – Sakizaya" lang="szy" hreflang="szy" data-title="dayas siku" data-language-autonym="Sakizaya" data-language-local-name="Sakizaya" class="interlanguage-link-target"><span>Sakizaya</span></a></li><li class="interlanguage-link interwiki-sm mw-list-item"><a href="https://sm.wikipedia.org/wiki/Apu" title="Apu – Samoan" lang="sm" hreflang="sm" data-title="Apu" data-language-autonym="Gagana Samoa" data-language-local-name="Samoan" class="interlanguage-link-target"><span>Gagana Samoa</span></a></li><li class="interlanguage-link interwiki-sa mw-list-item"><a href="https://sa.wikipedia.org/wiki/%E0%A4%B8%E0%A5%87%E0%A4%B5%E0%A4%AB%E0%A4%B2%E0%A4%AE%E0%A5%8D" title="सेवफलम् – Sanskrit" lang="sa" hreflang="sa" data-title="सेवफलम्" data-language-autonym="संस्कृतम्" data-language-local-name="Sanskrit" class="interlanguage-link-target"><span>संस्कृतम्</span></a></li><li class="interlanguage-link interwiki-skr mw-list-item"><a href="https://skr.wikipedia.org/wiki/%D8%B3%DB%8C%D8%A8" title="سیب – Saraiki" lang="skr" hreflang="skr" data-title="سیب" data-language-autonym="سرائیکی" data-language-local-name="Saraiki" class="interlanguage-link-target"><span>سرائیکی</span></a></li><li class="interlanguage-link interwiki-sco mw-list-item"><a href="https://sco.wikipedia.org/wiki/Aiple" title="Aiple – 
Scots" lang="sco" hreflang="sco" data-title="Aiple" data-language-autonym="Scots" data-language-local-name="Scots" class="interlanguage-link-target"><span>Scots</span></a></li><li class="interlanguage-link interwiki-nso mw-list-item"><a href="https://nso.wikipedia.org/wiki/Apole" title="Apole – Northern Sotho" lang="nso" hreflang="nso" data-title="Apole" data-language-autonym="Sesotho sa Leboa" data-language-local-name="Northern Sotho" class="interlanguage-link-target"><span>Sesotho sa Leboa</span></a></li><li class="interlanguage-link interwiki-tn mw-list-item"><a href="https://tn.wikipedia.org/wiki/Apole" title="Apole – Tswana" lang="tn" hreflang="tn" data-title="Apole" data-language-autonym="Setswana" data-language-local-name="Tswana" class="interlanguage-link-target"><span>Setswana</span></a></li><li class="interlanguage-link interwiki-sq mw-list-item"><a href="https://sq.wikipedia.org/wiki/Molla" title="Molla – Albanian" lang="sq" hreflang="sq" data-title="Molla" data-language-autonym="Shqip" data-language-local-name="Albanian" class="interlanguage-link-target"><span>Shqip</span></a></li><li class="interlanguage-link interwiki-scn mw-list-item"><a href="https://scn.wikipedia.org/wiki/Pumu" title="Pumu – Sicilian" lang="scn" hreflang="scn" data-title="Pumu" data-language-autonym="Sicilianu" data-language-local-name="Sicilian" class="interlanguage-link-target"><span>Sicilianu</span></a></li><li class="interlanguage-link interwiki-simple mw-list-item"><a href="https://simple.wikipedia.org/wiki/Apple" title="Apple – Simple English" lang="en-simple" hreflang="en-simple" data-title="Apple" data-language-autonym="Simple English" data-language-local-name="Simple English" class="interlanguage-link-target"><span>Simple English</span></a></li><li class="interlanguage-link interwiki-sd mw-list-item"><a href="https://sd.wikipedia.org/wiki/%D8%B5%D9%88%D9%81" title="صوف – Sindhi" lang="sd" hreflang="sd" data-title="صوف" data-language-autonym="سنڌي" 
data-language-local-name="Sindhi" class="interlanguage-link-target"><span>سنڌي</span></a></li><li class="interlanguage-link interwiki-sk mw-list-item"><a href="https://sk.wikipedia.org/wiki/Jablko" title="Jablko – Slovak" lang="sk" hreflang="sk" data-title="Jablko" data-language-autonym="Slovenčina" data-language-local-name="Slovak" class="interlanguage-link-target"><span>Slovenčina</span></a></li><li class="interlanguage-link interwiki-sl mw-list-item"><a href="https://sl.wikipedia.org/wiki/Jabolko" title="Jabolko – Slovenian" lang="sl" hreflang="sl" data-title="Jabolko" data-language-autonym="Slovenščina" data-language-local-name="Slovenian" class="interlanguage-link-target"><span>Slovenščina</span></a></li><li class="interlanguage-link interwiki-ckb mw-list-item"><a href="https://ckb.wikipedia.org/wiki/%D8%B3%DB%8E%D9%88" title="سێو – Central Kurdish" lang="ckb" hreflang="ckb" data-title="سێو" data-language-autonym="کوردی" data-language-local-name="Central Kurdish" class="interlanguage-link-target"><span>کوردی</span></a></li><li class="interlanguage-link interwiki-sr mw-list-item"><a href="https://sr.wikipedia.org/wiki/%D0%88%D0%B0%D0%B1%D1%83%D0%BA%D0%B0" title="Јабука – Serbian" lang="sr" hreflang="sr" data-title="Јабука" data-language-autonym="Српски / srpski" data-language-local-name="Serbian" class="interlanguage-link-target"><span>Српски / srpski</span></a></li><li class="interlanguage-link interwiki-sh mw-list-item"><a href="https://sh.wikipedia.org/wiki/Jabuka" title="Jabuka – Serbo-Croatian" lang="sh" hreflang="sh" data-title="Jabuka" data-language-autonym="Srpskohrvatski / српскохрватски" data-language-local-name="Serbo-Croatian" class="interlanguage-link-target"><span>Srpskohrvatski / српскохрватски</span></a></li><li class="interlanguage-link interwiki-su mw-list-item"><a href="https://su.wikipedia.org/wiki/Apel" title="Apel – Sundanese" lang="su" hreflang="su" data-title="Apel" data-language-autonym="Sunda" data-language-local-name="Sundanese" 
class="interlanguage-link-target"><span>Sunda</span></a></li><li class="interlanguage-link interwiki-fi mw-list-item"><a href="https://fi.wikipedia.org/wiki/Omena" title="Omena – Finnish" lang="fi" hreflang="fi" data-title="Omena" data-language-autonym="Suomi" data-language-local-name="Finnish" class="interlanguage-link-target"><span>Suomi</span></a></li><li class="interlanguage-link interwiki-sv mw-list-item"><a href="https://sv.wikipedia.org/wiki/%C3%84pple" title="Äpple – Swedish" lang="sv" hreflang="sv" data-title="Äpple" data-language-autonym="Svenska" data-language-local-name="Swedish" class="interlanguage-link-target"><span>Svenska</span></a></li><li class="interlanguage-link interwiki-tl mw-list-item"><a href="https://tl.wikipedia.org/wiki/Mansanas" title="Mansanas – Tagalog" lang="tl" hreflang="tl" data-title="Mansanas" data-language-autonym="Tagalog" data-language-local-name="Tagalog" class="interlanguage-link-target"><span>Tagalog</span></a></li><li class="interlanguage-link interwiki-ta badge-Q17437796 badge-featuredarticle mw-list-item" title="featured article badge"><a href="https://ta.wikipedia.org/wiki/%E0%AE%86%E0%AE%AA%E0%AF%8D%E0%AE%AA%E0%AE%BF%E0%AE%B3%E0%AF%8D" title="ஆப்பிள் – Tamil" lang="ta" hreflang="ta" data-title="ஆப்பிள்" data-language-autonym="தமிழ்" data-language-local-name="Tamil" class="interlanguage-link-target"><span>தமிழ்</span></a></li><li class="interlanguage-link interwiki-shi mw-list-item"><a href="https://shi.wikipedia.org/wiki/Adffuy" title="Adffuy – Tachelhit" lang="shi" hreflang="shi" data-title="Adffuy" data-language-autonym="Taclḥit" data-language-local-name="Tachelhit" class="interlanguage-link-target"><span>Taclḥit</span></a></li><li class="interlanguage-link interwiki-kab mw-list-item"><a href="https://kab.wikipedia.org/wiki/Adeffu" title="Adeffu – Kabyle" lang="kab" hreflang="kab" data-title="Adeffu" data-language-autonym="Taqbaylit" data-language-local-name="Kabyle" 
class="interlanguage-link-target"><span>Taqbaylit</span></a></li><li class="interlanguage-link interwiki-tt mw-list-item"><a href="https://tt.wikipedia.org/wiki/%D0%90%D0%BB%D0%BC%D0%B0" title="Алма – Tatar" lang="tt" hreflang="tt" data-title="Алма" data-language-autonym="Татарча / tatarça" data-language-local-name="Tatar" class="interlanguage-link-target"><span>Татарча / tatarça</span></a></li><li class="interlanguage-link interwiki-shn mw-list-item"><a href="https://shn.wikipedia.org/wiki/%E1%80%99%E1%81%A2%E1%81%B5%E1%80%BA%E1%82%87%E1%81%B5%E1%82%85%E1%80%99%E1%80%BA%E1%82%88%E1%81%B6%E1%80%BD%E1%80%84%E1%80%BA%E1%82%87" title="မၢၵ်ႇၵႅမ်ႈၶွင်ႇ – Shan" lang="shn" hreflang="shn" data-title="မၢၵ်ႇၵႅမ်ႈၶွင်ႇ" data-language-autonym="ၽႃႇသႃႇတႆး " data-language-local-name="Shan" class="interlanguage-link-target"><span>ၽႃႇသႃႇတႆး </span></a></li><li class="interlanguage-link interwiki-te mw-list-item"><a href="https://te.wikipedia.org/wiki/%E0%B0%86%E0%B0%AA%E0%B0%BF%E0%B0%B2%E0%B1%8D" title="ఆపిల్ – Telugu" lang="te" hreflang="te" data-title="ఆపిల్" data-language-autonym="తెలుగు" data-language-local-name="Telugu" class="interlanguage-link-target"><span>తెలుగు</span></a></li><li class="interlanguage-link interwiki-th mw-list-item"><a href="https://th.wikipedia.org/wiki/%E0%B9%81%E0%B8%AD%E0%B8%9B%E0%B9%80%E0%B8%9B%E0%B8%B4%E0%B8%A5" title="แอปเปิล – Thai" lang="th" hreflang="th" data-title="แอปเปิล" data-language-autonym="ไทย" data-language-local-name="Thai" class="interlanguage-link-target"><span>ไทย</span></a></li><li class="interlanguage-link interwiki-tg mw-list-item"><a href="https://tg.wikipedia.org/wiki/%D0%A1%D0%B5%D0%B1" title="Себ – Tajik" lang="tg" hreflang="tg" data-title="Себ" data-language-autonym="Тоҷикӣ" data-language-local-name="Tajik" class="interlanguage-link-target"><span>Тоҷикӣ</span></a></li><li class="interlanguage-link interwiki-chr mw-list-item"><a href="https://chr.wikipedia.org/wiki/%E1%8F%92%E1%8E%A6%E1%8F%94" title="ᏒᎦᏔ – Cherokee" lang="chr" 
hreflang="chr" data-title="ᏒᎦᏔ" data-language-autonym="ᏣᎳᎩ" data-language-local-name="Cherokee" class="interlanguage-link-target"><span>ᏣᎳᎩ</span></a></li><li class="interlanguage-link interwiki-chy mw-list-item"><a href="https://chy.wikipedia.org/wiki/M%C3%A1%27xeme" title="Má'xeme – Cheyenne" lang="chy" hreflang="chy" data-title="Má'xeme" data-language-autonym="Tsetsêhestâhese" data-language-local-name="Cheyenne" class="interlanguage-link-target"><span>Tsetsêhestâhese</span></a></li><li class="interlanguage-link interwiki-ve mw-list-item"><a href="https://ve.wikipedia.org/wiki/Apula" title="Apula – Venda" lang="ve" hreflang="ve" data-title="Apula" data-language-autonym="Tshivenda" data-language-local-name="Venda" class="interlanguage-link-target"><span>Tshivenda</span></a></li><li class="interlanguage-link interwiki-tr mw-list-item"><a href="https://tr.wikipedia.org/wiki/Elma" title="Elma – Turkish" lang="tr" hreflang="tr" data-title="Elma" data-language-autonym="Türkçe" data-language-local-name="Turkish" class="interlanguage-link-target"><span>Türkçe</span></a></li><li class="interlanguage-link interwiki-tk mw-list-item"><a href="https://tk.wikipedia.org/wiki/Alma" title="Alma – Turkmen" lang="tk" hreflang="tk" data-title="Alma" data-language-autonym="Türkmençe" data-language-local-name="Turkmen" class="interlanguage-link-target"><span>Türkmençe</span></a></li><li class="interlanguage-link interwiki-tyv mw-list-item"><a href="https://tyv.wikipedia.org/wiki/%D0%AF%D0%B1%D0%BB%D0%BE%D0%BA%D0%BE" title="Яблоко – Tuvinian" lang="tyv" hreflang="tyv" data-title="Яблоко" data-language-autonym="Тыва дыл" data-language-local-name="Tuvinian" class="interlanguage-link-target"><span>Тыва дыл</span></a></li><li class="interlanguage-link interwiki-uk mw-list-item"><a href="https://uk.wikipedia.org/wiki/%D0%AF%D0%B1%D0%BB%D1%83%D0%BA%D0%BE" title="Яблуко – Ukrainian" lang="uk" hreflang="uk" data-title="Яблуко" data-language-autonym="Українська" 
data-language-local-name="Ukrainian" class="interlanguage-link-target"><span>Українська</span></a></li><li class="interlanguage-link interwiki-ur mw-list-item"><a href="https://ur.wikipedia.org/wiki/%D8%B3%DB%8C%D8%A8" title="سیب – Urdu" lang="ur" hreflang="ur" data-title="سیب" data-language-autonym="اردو" data-language-local-name="Urdu" class="interlanguage-link-target"><span>اردو</span></a></li><li class="interlanguage-link interwiki-ug mw-list-item"><a href="https://ug.wikipedia.org/wiki/%D8%A6%D8%A7%D9%84%D9%85%D8%A7" title="ئالما – Uyghur" lang="ug" hreflang="ug" data-title="ئالما" data-language-autonym="ئۇيغۇرچە / Uyghurche" data-language-local-name="Uyghur" class="interlanguage-link-target"><span>ئۇيغۇرچە / Uyghurche</span></a></li><li class="interlanguage-link interwiki-za mw-list-item"><a href="https://za.wikipedia.org/wiki/Makbinzgoj" title="Makbinzgoj – Zhuang" lang="za" hreflang="za" data-title="Makbinzgoj" data-language-autonym="Vahcuengh" data-language-local-name="Zhuang" class="interlanguage-link-target"><span>Vahcuengh</span></a></li><li class="interlanguage-link interwiki-vec mw-list-item"><a href="https://vec.wikipedia.org/wiki/Pomo" title="Pomo – Venetian" lang="vec" hreflang="vec" data-title="Pomo" data-language-autonym="Vèneto" data-language-local-name="Venetian" class="interlanguage-link-target"><span>Vèneto</span></a></li><li class="interlanguage-link interwiki-vep mw-list-item"><a href="https://vep.wikipedia.org/wiki/Jablok" title="Jablok – Veps" lang="vep" hreflang="vep" data-title="Jablok" data-language-autonym="Vepsän kel’" data-language-local-name="Veps" class="interlanguage-link-target"><span>Vepsän kel’</span></a></li><li class="interlanguage-link interwiki-vi badge-Q17437798 badge-goodarticle mw-list-item" title="good article badge"><a href="https://vi.wikipedia.org/wiki/T%C3%A1o_t%C3%A2y" title="Táo tây – Vietnamese" lang="vi" hreflang="vi" data-title="Táo tây" data-language-autonym="Tiếng Việt" data-language-local-name="Vietnamese" 
class="interlanguage-link-target"><span>Tiếng Việt</span></a></li><li class="interlanguage-link interwiki-vo mw-list-item"><a href="https://vo.wikipedia.org/wiki/Pod" title="Pod – Volapük" lang="vo" hreflang="vo" data-title="Pod" data-language-autonym="Volapük" data-language-local-name="Volapük" class="interlanguage-link-target"><span>Volapük</span></a></li><li class="interlanguage-link interwiki-fiu-vro mw-list-item"><a href="https://fiu-vro.wikipedia.org/wiki/Upin" title="Upin – Võro" lang="vro" hreflang="vro" data-title="Upin" data-language-autonym="Võro" data-language-local-name="Võro" class="interlanguage-link-target"><span>Võro</span></a></li><li class="interlanguage-link interwiki-wa mw-list-item"><a href="https://wa.wikipedia.org/wiki/Pem%C3%AE" title="Pemî – Walloon" lang="wa" hreflang="wa" data-title="Pemî" data-language-autonym="Walon" data-language-local-name="Walloon" class="interlanguage-link-target"><span>Walon</span></a></li><li class="interlanguage-link interwiki-vls mw-list-item"><a href="https://vls.wikipedia.org/wiki/Appel" title="Appel – West Flemish" lang="vls" hreflang="vls" data-title="Appel" data-language-autonym="West-Vlams" data-language-local-name="West Flemish" class="interlanguage-link-target"><span>West-Vlams</span></a></li><li class="interlanguage-link interwiki-war mw-list-item"><a href="https://war.wikipedia.org/wiki/Mansanas" title="Mansanas – Waray" lang="war" hreflang="war" data-title="Mansanas" data-language-autonym="Winaray" data-language-local-name="Waray" class="interlanguage-link-target"><span>Winaray</span></a></li><li class="interlanguage-link interwiki-wuu mw-list-item"><a href="https://wuu.wikipedia.org/wiki/%E8%8B%B9%E6%9E%9C" title="苹果 – Wu" lang="wuu" hreflang="wuu" data-title="苹果" data-language-autonym="吴语" data-language-local-name="Wu" class="interlanguage-link-target"><span>吴语</span></a></li><li class="interlanguage-link interwiki-yi mw-list-item"><a href="https://yi.wikipedia.org/wiki/%D7%A2%D7%A4%D7%9C" 
title="עפל – Yiddish" lang="yi" hreflang="yi" data-title="עפל" data-language-autonym="ייִדיש" data-language-local-name="Yiddish" class="interlanguage-link-target"><span>ייִדיש</span></a></li><li class="interlanguage-link interwiki-zh-yue mw-list-item"><a href="https://zh-yue.wikipedia.org/wiki/%E8%98%8B%E6%9E%9C" title="蘋果 – Cantonese" lang="yue" hreflang="yue" data-title="蘋果" data-language-autonym="粵語" data-language-local-name="Cantonese" class="interlanguage-link-target"><span>粵語</span></a></li><li class="interlanguage-link interwiki-diq mw-list-item"><a href="https://diq.wikipedia.org/wiki/Saye" title="Saye – Zazaki" lang="diq" hreflang="diq" data-title="Saye" data-language-autonym="Zazaki" data-language-local-name="Zazaki" class="interlanguage-link-target"><span>Zazaki</span></a></li><li class="interlanguage-link interwiki-bat-smg mw-list-item"><a href="https://bat-smg.wikipedia.org/wiki/Vuobols" title="Vuobols – Samogitian" lang="sgs" hreflang="sgs" data-title="Vuobols" data-language-autonym="Žemaitėška" data-language-local-name="Samogitian" class="interlanguage-link-target"><span>Žemaitėška</span></a></li><li class="interlanguage-link interwiki-zh mw-list-item"><a href="https://zh.wikipedia.org/wiki/%E8%8B%B9%E6%9E%9C" title="苹果 – Chinese" lang="zh" hreflang="zh" data-title="苹果" data-language-autonym="中文" data-language-local-name="Chinese" class="interlanguage-link-target"><span>中文</span></a></li><li class="interlanguage-link interwiki-bdr mw-list-item"><a href="https://bdr.wikipedia.org/wiki/Ipol" title="Ipol – West Coast Bajau" lang="bdr" hreflang="bdr" data-title="Ipol" data-language-autonym="Bajau Sama" data-language-local-name="West Coast Bajau" class="interlanguage-link-target"><span>Bajau Sama</span></a></li><li class="interlanguage-link interwiki-iba mw-list-item"><a href="https://iba.wikipedia.org/wiki/Ipul" title="Ipul – Iban" lang="iba" hreflang="iba" data-title="Ipul" data-language-autonym="Jaku Iban" data-language-local-name="Iban" 
class="interlanguage-link-target"><span>Jaku Iban</span></a></li><li class="interlanguage-link interwiki-kge mw-list-item"><a href="https://kge.wikipedia.org/wiki/Apel" title="Apel – Komering" lang="kge" hreflang="kge" data-title="Apel" data-language-autonym="Kumoring" data-language-local-name="Komering" class="interlanguage-link-target"><span>Kumoring</span></a></li><li class="interlanguage-link interwiki-tly mw-list-item"><a href="https://tly.wikipedia.org/wiki/Sef" title="Sef – Talysh" lang="tly" hreflang="tly" data-title="Sef" data-language-autonym="Tolışi" data-language-local-name="Talysh" class="interlanguage-link-target"><span>Tolışi</span></a></li>
+			</ul>
+			<div class="after-portlet after-portlet-lang"><span class="wb-langlinks-edit wb-langlinks-link"><a href="https://www.wikidata.org/wiki/Special:EntityPage/Q89#sitelinks-wikipedia" title="Edit interlanguage links" class="wbc-editpage">Edit links</a></span></div>
+		</div>
+
+	</div>
+</div>
+</header>
+				<div class="vector-page-toolbar">
+					<div class="vector-page-toolbar-container">
+						<div id="left-navigation">
+							<nav aria-label="Namespaces">
+								
+<div id="p-associated-pages" class="vector-menu vector-menu-tabs mw-portlet mw-portlet-associated-pages">
+	<div class="vector-menu-content">
+		
+		<ul class="vector-menu-content-list">
+			
+			<li id="ca-nstab-main" class="selected vector-tab-noicon mw-list-item"><a href="/wiki/Apple" title="View the content page [ctrl-option-c]" accesskey="c"><span>Article</span></a></li><li id="ca-talk" class="vector-tab-noicon mw-list-item"><a href="/wiki/Talk:Apple" rel="discussion" title="Discuss improvements to the content page [ctrl-option-t]" accesskey="t"><span>Talk</span></a></li>
+		</ul>
+		
+	</div>
+</div>
+
+								
+<div id="vector-variants-dropdown" class="vector-dropdown emptyPortlet">
+	<input type="checkbox" id="vector-variants-dropdown-checkbox" role="button" aria-haspopup="true" data-event-name="ui.dropdown-vector-variants-dropdown" class="vector-dropdown-checkbox " aria-label="Change language variant">
+	<label id="vector-variants-dropdown-label" for="vector-variants-dropdown-checkbox" class="vector-dropdown-label cdx-button cdx-button--fake-button cdx-button--fake-button--enabled cdx-button--weight-quiet" aria-hidden="true"><span class="vector-dropdown-label-text">English</span>
+	</label>
+	<div class="vector-dropdown-content">
+
+
+					
+<div id="p-variants" class="vector-menu mw-portlet mw-portlet-variants emptyPortlet">
+	<div class="vector-menu-content">
+		
+		<ul class="vector-menu-content-list">
+			
+			
+		</ul>
+		
+	</div>
+</div>
+
+				
+	</div>
+</div>
+
+							</nav>
+						</div>
+						<div id="right-navigation" class="vector-collapsible">
+							<nav aria-label="Views">
+								
+<div id="p-views" class="vector-menu vector-menu-tabs mw-portlet mw-portlet-views">
+	<div class="vector-menu-content">
+		
+		<ul class="vector-menu-content-list">
+			
+			<li id="ca-view" class="selected vector-tab-noicon mw-list-item"><a href="/wiki/Apple"><span>Read</span></a></li><li id="ca-viewsource" class="vector-tab-noicon mw-list-item"><a href="/w/index.php?title=Apple&amp;action=edit" title="This page is protected.
+You can view its source [ctrl-option-e]" accesskey="e"><span>View source</span></a></li><li id="ca-history" class="vector-tab-noicon mw-list-item"><a href="/w/index.php?title=Apple&amp;action=history" title="Past revisions of this page [ctrl-option-h]" accesskey="h"><span>View history</span></a></li>
+		</ul>
+		
+	</div>
+</div>
+
+							</nav>
+				
+							<nav class="vector-page-tools-landmark" aria-label="Page tools">
+								
+<div id="vector-page-tools-dropdown" class="vector-dropdown vector-page-tools-dropdown">
+	<input type="checkbox" id="vector-page-tools-dropdown-checkbox" role="button" aria-haspopup="true" data-event-name="ui.dropdown-vector-page-tools-dropdown" class="vector-dropdown-checkbox " aria-label="Tools">
+	<label id="vector-page-tools-dropdown-label" for="vector-page-tools-dropdown-checkbox" class="vector-dropdown-label cdx-button cdx-button--fake-button cdx-button--fake-button--enabled cdx-button--weight-quiet" aria-hidden="true"><span class="vector-dropdown-label-text">Tools</span>
+	</label>
+	<div class="vector-dropdown-content">
+
+
+									<div id="vector-page-tools-unpinned-container" class="vector-unpinned-container">
+						
+<div id="vector-page-tools" class="vector-page-tools vector-pinnable-element">
+	<div class="vector-pinnable-header vector-page-tools-pinnable-header vector-pinnable-header-unpinned" data-feature-name="page-tools-pinned" data-pinnable-element-id="vector-page-tools" data-pinned-container-id="vector-page-tools-pinned-container" data-unpinned-container-id="vector-page-tools-unpinned-container" data-saved-pinned-state="false">
+	<div class="vector-pinnable-header-label">Tools</div>
+	<button class="vector-pinnable-header-toggle-button vector-pinnable-header-pin-button" data-event-name="pinnable-header.vector-page-tools.pin">move to sidebar</button>
+	<button class="vector-pinnable-header-toggle-button vector-pinnable-header-unpin-button" data-event-name="pinnable-header.vector-page-tools.unpin">hide</button>
+</div>
+
+	
+<div id="p-cactions" class="vector-menu mw-portlet mw-portlet-cactions emptyPortlet vector-has-collapsible-items" title="More options">
+	<div class="vector-menu-heading">
+		Actions
+	</div>
+	<div class="vector-menu-content">
+		
+		<ul class="vector-menu-content-list">
+			
+			<li id="ca-more-view" class="selected vector-more-collapsible-item mw-list-item"><a href="/wiki/Apple"><span>Read</span></a></li><li id="ca-more-viewsource" class="vector-more-collapsible-item mw-list-item"><a href="/w/index.php?title=Apple&amp;action=edit"><span>View source</span></a></li><li id="ca-more-history" class="vector-more-collapsible-item mw-list-item"><a href="/w/index.php?title=Apple&amp;action=history"><span>View history</span></a></li>
+		</ul>
+		
+	</div>
+</div>
+
+<div id="p-tb" class="vector-menu mw-portlet mw-portlet-tb">
+	<div class="vector-menu-heading">
+		General
+	</div>
+	<div class="vector-menu-content">
+		
+		<ul class="vector-menu-content-list">
+			
+			<li id="t-whatlinkshere" class="mw-list-item"><a href="/wiki/Special:WhatLinksHere/Apple" title="List of all English Wikipedia pages containing links to this page [ctrl-option-j]" accesskey="j"><span>What links here</span></a></li><li id="t-recentchangeslinked" class="mw-list-item"><a href="/wiki/Special:RecentChangesLinked/Apple" rel="nofollow" title="Recent changes in pages linked from this page [ctrl-option-k]" accesskey="k"><span>Related changes</span></a></li><li id="t-upload" class="mw-list-item"><a href="/wiki/Wikipedia:File_Upload_Wizard" title="Upload files [ctrl-option-u]" accesskey="u"><span>Upload file</span></a></li><li id="t-specialpages" class="mw-list-item"><a href="/wiki/Special:SpecialPages" title="A list of all special pages [ctrl-option-q]" accesskey="q"><span>Special pages</span></a></li><li id="t-permalink" class="mw-list-item"><a href="https://en.wikipedia.org/w/index.php?title=Apple&amp;oldid=1256174424" title="Permanent link to this revision of this page"><span>Permanent link</span></a></li><li id="t-info" class="mw-list-item"><a href="/w/index.php?title=Apple&amp;action=info" title="More information about this page"><span>Page information</span></a></li><li id="t-cite" class="mw-list-item"><a href="/w/index.php?title=Special:CiteThisPage&amp;page=Apple&amp;id=1256174424&amp;wpFormIdentifier=titleform" title="Information on how to cite this page"><span>Cite this page</span></a></li><li id="t-urlshortener" class="mw-list-item"><a href="/w/index.php?title=Special:UrlShortener&amp;url=https%3A%2F%2Fen.wikipedia.org%2Fwiki%2FApple" aria-haspopup="dialog"><span>Get shortened URL</span></a></li><li id="t-urlshortener-qrcode" class="mw-list-item"><a href="/w/index.php?title=Special:QrCode&amp;url=https%3A%2F%2Fen.wikipedia.org%2Fwiki%2FApple"><span>Download QR code</span></a></li>
+		<li class="mw-list-item mw-list-item-js" id="t-collapsible-toggle-all"><a href="#" title="Expand all collapsible elements on the current page" role="button" aria-expanded="false"><span>Expand all</span></a></li><li class="mw-list-item mw-list-item-js" id="wbc-editpage"><a href="https://www.wikidata.org/wiki/Special:EntityPage/Q89#sitelinks-wikipedia" title="Edit interlanguage links"><span>Edit interlanguage links</span></a></li></ul>
+		
+	</div>
+</div>
+
+<div id="p-coll-print_export" class="vector-menu mw-portlet mw-portlet-coll-print_export">
+	<div class="vector-menu-heading">
+		Print/export
+	</div>
+	<div class="vector-menu-content">
+		
+		<ul class="vector-menu-content-list">
+			
+			<li id="coll-download-as-rl" class="mw-list-item"><a href="/w/index.php?title=Special:DownloadAsPdf&amp;page=Apple&amp;action=show-download-screen" title="Download this page as a PDF file"><span>Download as PDF</span></a></li><li id="t-print" class="mw-list-item"><a href="/w/index.php?title=Apple&amp;printable=yes" title="Printable version of this page [ctrl-option-p]" accesskey="p"><span>Printable version</span></a></li>
+		</ul>
+		
+	</div>
+</div>
+
+<div id="p-wikibase-otherprojects" class="vector-menu mw-portlet mw-portlet-wikibase-otherprojects">
+	<div class="vector-menu-heading">
+		In other projects
+	</div>
+	<div class="vector-menu-content">
+		
+		<ul class="vector-menu-content-list">
+			
+			<li class="wb-otherproject-link wb-otherproject-commons mw-list-item"><a href="https://commons.wikimedia.org/wiki/Apple" hreflang="en"><span>Wikimedia Commons</span></a></li><li class="wb-otherproject-link wb-otherproject-wikibooks mw-list-item"><a href="https://en.wikibooks.org/wiki/Cookbook:Apple" hreflang="en"><span>Wikibooks</span></a></li><li class="wb-otherproject-link wb-otherproject-wikiquote mw-list-item"><a href="https://en.wikiquote.org/wiki/Apples" hreflang="en"><span>Wikiquote</span></a></li><li id="t-wikibase" class="wb-otherproject-link wb-otherproject-wikibase-dataitem mw-list-item"><a href="https://www.wikidata.org/wiki/Special:EntityPage/Q89" title="Structured data on this page hosted by Wikidata [ctrl-option-g]" accesskey="g"><span>Wikidata item</span></a></li>
+		</ul>
+		
+	</div>
+</div>
+
+</div>
+
+									</div>
+				
+	</div>
+</div>
+
+							</nav>
+						</div>
+					</div>
+				</div>
+				<div class="vector-column-end">
+					<div class="vector-sticky-pinned-container">
+						<nav class="vector-page-tools-landmark" aria-label="Page tools">
+							<div id="vector-page-tools-pinned-container" class="vector-pinned-container">
+				
+							</div>
+		</nav>
+						<nav class="vector-appearance-landmark" aria-label="Appearance">
+							<div id="vector-appearance-pinned-container" class="vector-pinned-container">
+				<div id="vector-appearance" class="vector-appearance vector-pinnable-element">
+	<div class="vector-pinnable-header vector-appearance-pinnable-header vector-pinnable-header-pinned" data-feature-name="appearance-pinned" data-pinnable-element-id="vector-appearance" data-pinned-container-id="vector-appearance-pinned-container" data-unpinned-container-id="vector-appearance-unpinned-container" data-saved-pinned-state="true">
+	<div class="vector-pinnable-header-label">Appearance</div>
+	<button class="vector-pinnable-header-toggle-button vector-pinnable-header-pin-button" data-event-name="pinnable-header.vector-appearance.pin">move to sidebar</button>
+	<button class="vector-pinnable-header-toggle-button vector-pinnable-header-unpin-button" data-event-name="pinnable-header.vector-appearance.unpin">hide</button>
+</div>
+
+
+<div class="mw-portlet mw-portlet-skin-client-prefs-vector-feature-custom-font-size vector-menu" id="skin-client-prefs-vector-feature-custom-font-size"><div class="vector-menu-heading">Text</div><div class="vector-menu-content"><ul class="vector-menu-content-list"><li class="mw-list-item mw-list-item-js"><div class=""><form><div class="cdx-radio"><input name="skin-client-pref-vector-feature-custom-font-size-group" id="skin-client-pref-vector-feature-custom-font-size-value-0" type="radio" value="0" data-event-name="skin-client-pref-vector-feature-custom-font-size-value-0" class="cdx-radio__input"><span class="cdx-radio__icon"></span><label for="skin-client-pref-vector-feature-custom-font-size-value-0" class="cdx-radio__label">Small</label></div><div class="cdx-radio"><input name="skin-client-pref-vector-feature-custom-font-size-group" id="skin-client-pref-vector-feature-custom-font-size-value-1" type="radio" value="1" data-event-name="skin-client-pref-vector-feature-custom-font-size-value-1" class="cdx-radio__input"><span class="cdx-radio__icon"></span><label for="skin-client-pref-vector-feature-custom-font-size-value-1" class="cdx-radio__label">Standard</label></div><div class="cdx-radio"><input name="skin-client-pref-vector-feature-custom-font-size-group" id="skin-client-pref-vector-feature-custom-font-size-value-2" type="radio" value="2" data-event-name="skin-client-pref-vector-feature-custom-font-size-value-2" class="cdx-radio__input"><span class="cdx-radio__icon"></span><label for="skin-client-pref-vector-feature-custom-font-size-value-2" class="cdx-radio__label">Large</label></div></form></div></li></ul><span class="skin-client-pref-exclusion-notice">This page always uses small font size</span></div></div><div class="mw-portlet mw-portlet-skin-client-prefs-vector-feature-limited-width vector-menu" id="skin-client-prefs-vector-feature-limited-width"><div class="vector-menu-heading">Width</div><div class="vector-menu-content"><ul 
class="vector-menu-content-list"><li class="mw-list-item mw-list-item-js"><div class=""><form><div class="cdx-radio"><input name="skin-client-pref-vector-feature-limited-width-group" id="skin-client-pref-vector-feature-limited-width-value-1" type="radio" value="1" data-event-name="skin-client-pref-vector-feature-limited-width-value-1" class="cdx-radio__input"><span class="cdx-radio__icon"></span><label for="skin-client-pref-vector-feature-limited-width-value-1" class="cdx-radio__label">Standard</label></div><div class="cdx-radio"><input name="skin-client-pref-vector-feature-limited-width-group" id="skin-client-pref-vector-feature-limited-width-value-0" type="radio" value="0" data-event-name="skin-client-pref-vector-feature-limited-width-value-0" class="cdx-radio__input"><span class="cdx-radio__icon"></span><label for="skin-client-pref-vector-feature-limited-width-value-0" class="cdx-radio__label">Wide</label></div></form></div></li></ul><span class="skin-client-pref-exclusion-notice">The content is as wide as possible for your browser window.</span></div></div><div class="mw-portlet mw-portlet-skin-client-prefs-skin-theme vector-menu" id="skin-client-prefs-skin-theme"><div class="vector-menu-heading">Color <span><span>(beta)</span></span></div><div class="vector-menu-content"><ul class="vector-menu-content-list"><li class="mw-list-item mw-list-item-js"><div class=""><form><div class="cdx-radio"><input name="skin-client-pref-skin-theme-group" id="skin-client-pref-skin-theme-value-os" type="radio" value="os" data-event-name="skin-client-pref-skin-theme-value-os" class="cdx-radio__input"><span class="cdx-radio__icon"></span><label for="skin-client-pref-skin-theme-value-os" class="cdx-radio__label">Automatic</label></div><div class="cdx-radio"><input name="skin-client-pref-skin-theme-group" id="skin-client-pref-skin-theme-value-day" type="radio" value="day" data-event-name="skin-client-pref-skin-theme-value-day" class="cdx-radio__input"><span 
class="cdx-radio__icon"></span><label for="skin-client-pref-skin-theme-value-day" class="cdx-radio__label">Light</label></div><div class="cdx-radio"><input name="skin-client-pref-skin-theme-group" id="skin-client-pref-skin-theme-value-night" type="radio" value="night" data-event-name="skin-client-pref-skin-theme-value-night" class="cdx-radio__input"><span class="cdx-radio__icon"></span><label for="skin-client-pref-skin-theme-value-night" class="cdx-radio__label">Dark</label></div></form><span id="skin-theme-beta-notice"></span></div></li></ul><span class="skin-client-pref-exclusion-notice">This page is always in light mode.</span></div></div></div>
+
+							</div>
+		</nav>
+					</div>
+				</div>
+				<div id="bodyContent" class="vector-body ve-init-mw-desktopArticleTarget-targetContainer" aria-labelledby="firstHeading" data-mw-ve-target-container="">
+					<div class="vector-body-before-content">
+							<div class="mw-indicators">
+		<div id="mw-indicator-good-star" class="mw-indicator"><div class="mw-parser-output"><span typeof="mw:File"><a href="/wiki/Wikipedia:Good_articles*" title="This is a good article. Click here for more information."><img alt="This is a good article. Click here for more information." src="//upload.wikimedia.org/wikipedia/en/thumb/9/94/Symbol_support_vote.svg/19px-Symbol_support_vote.svg.png" decoding="async" width="19" height="20" class="mw-file-element" srcset="//upload.wikimedia.org/wikipedia/en/thumb/9/94/Symbol_support_vote.svg/29px-Symbol_support_vote.svg.png 1.5x, //upload.wikimedia.org/wikipedia/en/thumb/9/94/Symbol_support_vote.svg/39px-Symbol_support_vote.svg.png 2x" data-file-width="180" data-file-height="185"></a></span></div></div>
+		<div id="mw-indicator-pp-default" class="mw-indicator"><div class="mw-parser-output"><span typeof="mw:File"><a href="/wiki/Wikipedia:Protection_policy#semi" title="This article is semi-protected."><img alt="Page semi-protected" src="//upload.wikimedia.org/wikipedia/en/thumb/1/1b/Semi-protection-shackle.svg/20px-Semi-protection-shackle.svg.png" decoding="async" width="20" height="20" class="mw-file-element" srcset="//upload.wikimedia.org/wikipedia/en/thumb/1/1b/Semi-protection-shackle.svg/30px-Semi-protection-shackle.svg.png 1.5x, //upload.wikimedia.org/wikipedia/en/thumb/1/1b/Semi-protection-shackle.svg/40px-Semi-protection-shackle.svg.png 2x" data-file-width="512" data-file-height="512"></a></span></div></div>
+		</div>
+
+						<div id="siteSub" class="noprint">From Wikipedia, the free encyclopedia</div>
+					</div>
+					<div id="contentSub"><div id="mw-content-subtitle"></div></div>
+					
+					
+					<div id="mw-content-text" class="mw-body-content"><div class="mw-content-ltr mw-parser-output" lang="en" dir="ltr"><div class="shortdescription nomobile noexcerpt noprint searchaux" style="display:none">Fruit that grows on a tree</div>
+<style data-mw-deduplicate="TemplateStyles:r1236090951">.mw-parser-output .hatnote{font-style:italic}.mw-parser-output div.hatnote{padding-left:1.6em;margin-bottom:0.5em}.mw-parser-output .hatnote i{font-style:normal}.mw-parser-output .hatnote+link+.hatnote{margin-top:-0.5em}@media print{body.ns-0 .mw-parser-output .hatnote{display:none!important}}</style><div role="note" class="hatnote navigation-not-searchable">This article is about the fruit. For the technology company, see <a href="/wiki/Apple_Inc." title="Apple Inc.">Apple Inc.</a> For other uses, see <a href="/wiki/Apple_(disambiguation)" class="mw-disambig" title="Apple (disambiguation)">Apple (disambiguation)</a>.</div>
+<link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1236090951"><div role="note" class="hatnote navigation-not-searchable">"Apple tree" redirects here. For other uses, see <a href="/wiki/Apple_tree_(disambiguation)" class="mw-disambig" title="Apple tree (disambiguation)">Apple tree (disambiguation)</a>.</div>
+<p class="mw-empty-elt">
+
+
+
+</p>
+<table class="infobox biota" style="text-align: left; width: 200px; font-size: 100%">
+
+<tbody><tr>
+<th colspan="2" style="color:inherit; text-align: center; background-color: rgb(180,250,180)">Apple
+</th></tr>
+<tr>
+<td colspan="2" style="text-align: center"><span class="mw-default-size" typeof="mw:File/Frameless"><a href="/wiki/File:Pink_lady_and_cross_section.jpg" class="mw-file-description"><img src="//upload.wikimedia.org/wikipedia/commons/thumb/a/a6/Pink_lady_and_cross_section.jpg/220px-Pink_lady_and_cross_section.jpg" decoding="async" width="220" height="75" class="mw-file-element" srcset="//upload.wikimedia.org/wikipedia/commons/thumb/a/a6/Pink_lady_and_cross_section.jpg/330px-Pink_lady_and_cross_section.jpg 1.5x, //upload.wikimedia.org/wikipedia/commons/thumb/a/a6/Pink_lady_and_cross_section.jpg/440px-Pink_lady_and_cross_section.jpg 2x" data-file-width="2800" data-file-height="950"></a></span>
+</td></tr>
+<tr>
+<td colspan="2" style="text-align: center; font-size: 88%">'<a href="/wiki/Cripps_Pink" title="Cripps Pink">Cripps Pink</a>' apples
+</td></tr>
+<tr>
+<td colspan="2" style="text-align: center"><span class="mw-default-size notpageimage" typeof="mw:File/Frameless"><a href="/wiki/File:Malus_domestica_a1.jpg" class="mw-file-description"><img src="//upload.wikimedia.org/wikipedia/commons/thumb/2/22/Malus_domestica_a1.jpg/220px-Malus_domestica_a1.jpg" decoding="async" width="220" height="164" class="mw-file-element" srcset="//upload.wikimedia.org/wikipedia/commons/thumb/2/22/Malus_domestica_a1.jpg/330px-Malus_domestica_a1.jpg 1.5x, //upload.wikimedia.org/wikipedia/commons/thumb/2/22/Malus_domestica_a1.jpg/440px-Malus_domestica_a1.jpg 2x" data-file-width="1280" data-file-height="956"></a></span>
+</td></tr>
+<tr>
+<td colspan="2" style="text-align: center; font-size: 88%">Flowers
+</td></tr>
+
+
+
+
+<tr>
+<th colspan="2" style="color:inherit; min-width:15em; text-align: center; background-color: rgb(180,250,180)"><a href="/wiki/Taxonomy_(biology)" title="Taxonomy (biology)">Scientific classification</a> <span class="plainlinks taxobox-edit-taxonomy skin-invert" style="font-size:smaller; float:right; padding-right:0.4em; margin-left:-3em;"><span typeof="mw:File"><a href="/wiki/Template:Taxonomy/Malus" title="Edit this classification"><img alt="Edit this classification" src="//upload.wikimedia.org/wikipedia/commons/thumb/8/8a/OOjs_UI_icon_edit-ltr.svg/15px-OOjs_UI_icon_edit-ltr.svg.png" decoding="async" width="15" height="15" class="mw-file-element" srcset="//upload.wikimedia.org/wikipedia/commons/thumb/8/8a/OOjs_UI_icon_edit-ltr.svg/23px-OOjs_UI_icon_edit-ltr.svg.png 1.5x, //upload.wikimedia.org/wikipedia/commons/thumb/8/8a/OOjs_UI_icon_edit-ltr.svg/30px-OOjs_UI_icon_edit-ltr.svg.png 2x" data-file-width="20" data-file-height="20"></a></span></span>
+</th></tr>
+<tr>
+<td>Kingdom:
+</td>
+<td><a href="/wiki/Plant" title="Plant">Plantae</a>
+</td></tr>
+<tr>
+<td><i>Clade</i>:
+</td>
+<td><a href="/wiki/Vascular_plant" title="Vascular plant">Tracheophytes</a>
+</td></tr>
+<tr>
+<td><i>Clade</i>:
+</td>
+<td><a href="/wiki/Flowering_plant" title="Flowering plant">Angiosperms</a>
+</td></tr>
+<tr>
+<td><i>Clade</i>:
+</td>
+<td><a href="/wiki/Eudicots" title="Eudicots">Eudicots</a>
+</td></tr>
+<tr>
+<td><i>Clade</i>:
+</td>
+<td><a href="/wiki/Rosids" title="Rosids">Rosids</a>
+</td></tr>
+<tr>
+<td>Order:
+</td>
+<td><a href="/wiki/Rosales" title="Rosales">Rosales</a>
+</td></tr>
+<tr>
+<td>Family:
+</td>
+<td><a href="/wiki/Rosaceae" title="Rosaceae">Rosaceae</a>
+</td></tr>
+<tr>
+<td>Genus:
+</td>
+<td><a href="/wiki/Malus" title="Malus"><i>Malus</i></a>
+</td></tr>
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+<tr>
+<td>Species:
+</td>
+<td><div style="display:inline" class="species"><i><b>M.&nbsp;domestica</b></i></div>
+</td></tr>
+
+
+
+
+
+
+
+
+<tr>
+<th colspan="2" style="color:inherit; text-align: center; background-color: rgb(180,250,180)"><a href="/wiki/Binomial_nomenclature" title="Binomial nomenclature">Binomial name</a>
+</th></tr>
+<tr>
+<td colspan="2" style="text-align: center"><b><span class="binomial"><span style="font-weight:normal;"></span><i>Malus domestica</i></span></b><br><div style="font-size: 85%;">(<a href="/wiki/Georg_Adolf_Suckow" title="Georg Adolf Suckow">Suckow</a>) <a href="/wiki/Borkh." class="mw-redirect" title="Borkh.">Borkh.</a></div>
+</td></tr>
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+<tr>
+<th colspan="2" style="color:inherit; text-align: center; background-color: rgb(180,250,180)"><a href="/wiki/Synonym_(taxonomy)" title="Synonym (taxonomy)">Synonyms</a><sup id="cite_ref-FNA_1-0" class="reference"><a href="#cite_note-FNA-1"><span class="cite-bracket">[</span>1<span class="cite-bracket">]</span></a></sup><sup id="cite_ref-POWO_2-0" class="reference"><a href="#cite_note-POWO-2"><span class="cite-bracket">[</span>2<span class="cite-bracket">]</span></a></sup>
+</th></tr>
+<tr>
+<td colspan="2" style="text-align: left">
+<ul><li><i>M.&nbsp;communis</i> <small>Desf., 1768</small></li>
+<li><i>M.&nbsp;pumila</i> <small>Mil.</small></li>
+<li><i>M.&nbsp;frutescens</i> <small>Medik.</small></li>
+<li><i>M.&nbsp;paradisiaca</i> <small>(L.) Medikus</small></li>
+<li><i>M.&nbsp;sylvestris</i> <small>Mil.</small></li>
+<li><i>Pyrus malus</i> <small>L.</small></li>
+<li><i>Pyrus malus</i> var. <i>paradisiaca</i> <small>L.</small></li>
+<li><i>Pyrus dioica</i> <small>Moench</small></li></ul>
+</td></tr>
+
+</tbody></table><style data-mw-deduplicate="TemplateStyles:r1238732961">@media screen{html.skin-theme-clientpref-night .mw-parser-output .infobox.biota tr{background:transparent!important}html.skin-theme-clientpref-night .mw-parser-output .infobox.biota img{background:transparent}}@media screen and (prefers-color-scheme:dark){html.skin-theme-clientpref-os .mw-parser-output .infobox.biota tr{background:transparent!important}html.skin-theme-clientpref-os .mw-parser-output .infobox.biota img{background:white}}.mw-parser-output .infobox.biota .taxobox-edit-taxonomy img{background:transparent!important}body.skin-vector .mw-parser-output table.biota.infobox{margin-top:0.5em}body.skin--responsive .mw-parser-output table.biota.infobox tr.taxonrow td{padding:2px 10px}</style>
+<p>An <b>apple</b> is a round, edible <a href="/wiki/Fruit" title="Fruit">fruit</a> produced by an <b>apple tree</b> (<a href="/wiki/Malus" title="Malus"><i>Malus spp.</i></a>, among them the <b>domestic</b> or <b>orchard apple</b>; <i><b>Malus domestica</b></i>). Apple <a href="/wiki/Fruit_tree" title="Fruit tree">trees</a> are <a href="/wiki/Agriculture" title="Agriculture">cultivated</a> worldwide and are the most widely grown species in the <a href="/wiki/Genus" title="Genus">genus</a> <i><a href="/wiki/Malus" title="Malus">Malus</a></i>. The <a href="/wiki/Tree" title="Tree">tree</a> originated in <a href="/wiki/Central_Asia" title="Central Asia">Central Asia</a>, where its wild ancestor, <i><a href="/wiki/Malus_sieversii" title="Malus sieversii">Malus sieversii</a></i>, is still found. Apples have been grown for thousands of years in Eurasia and were introduced to North America by <a href="/wiki/European_colonization_of_the_Americas" title="European colonization of the Americas">European colonists</a>. Apples have <a href="/wiki/Religious" class="mw-redirect" title="Religious">religious</a> and <a href="/wiki/Mythological" class="mw-redirect" title="Mythological">mythological</a> significance in many cultures, including <a href="/wiki/Norse_mythology" title="Norse mythology">Norse</a>, <a href="/wiki/Greek_mythology" title="Greek mythology">Greek</a>, and <a href="/wiki/European_Christian" class="mw-redirect" title="European Christian">European Christian</a> tradition.
+</p><p>Apples grown from seed tend to be very different from those of their parents, and the resultant fruit frequently lacks desired characteristics. For commercial purposes, including botanical evaluation, apple <a href="/wiki/Cultivar" title="Cultivar">cultivars</a> are propagated by clonal <a href="/wiki/Grafting" title="Grafting">grafting</a> onto <a href="/wiki/Rootstock" title="Rootstock">rootstocks</a>. Apple trees grown without rootstocks tend to be larger and much slower to fruit after planting. Rootstocks are used to control the speed of growth and the size of the resulting tree, allowing for easier harvesting.
+</p><p>There are <a href="/wiki/List_of_apple_cultivars" title="List of apple cultivars">more than 7,500 cultivars of apples</a>. Different cultivars are bred for various tastes and uses, including <a href="/wiki/Cooking_apple" title="Cooking apple">cooking</a>, eating raw, and <a href="/wiki/Cider" title="Cider">cider</a> or <a href="/wiki/Apple_cider" title="Apple cider">apple juice</a> production. Trees and fruit are prone to <a href="/wiki/Fungal" class="mw-redirect" title="Fungal">fungal</a>, bacterial, and pest problems, which can be controlled by a number of <a href="/wiki/Organic_farming" title="Organic farming">organic</a> and non-organic means. In 2010, the fruit's <a href="/wiki/Genome" title="Genome">genome</a> was <a href="/wiki/DNA_sequencing" title="DNA sequencing">sequenced</a> as part of research on disease control and selective breeding in apple production.
+</p>
+<meta property="mw:PageProp/toc">
+<div class="mw-heading mw-heading2"><h2 id="Etymology">Etymology</h2></div>
+<p>The word <i>apple</i>, whose <a href="/wiki/Old_English" title="Old English">Old English</a> ancestor is <span title="Old English (ca. 450-1100)-language text"><i lang="ang-Latn">æppel</i></span>, is descended from the <a href="/wiki/Proto-Germanic" class="mw-redirect" title="Proto-Germanic">Proto-Germanic</a> noun <span title="Proto-Germanic-language text">*<i lang="gem">aplaz</i></span>, descended in turn from <a href="/wiki/Proto-Indo-European" class="mw-redirect" title="Proto-Indo-European">Proto-Indo-European</a> <span title="Proto-Indo-European-language text">*<i lang="ine">h₂ébōl</i></span>.<sup id="cite_ref-Lisa_Lim_3-0" class="reference"><a href="#cite_note-Lisa_Lim-3"><span class="cite-bracket">[</span>3<span class="cite-bracket">]</span></a></sup> As late as the 17th century, the word also functioned as a generic term for all fruit, including <a href="/wiki/Nut_(fruit)" title="Nut (fruit)">nuts</a>. This can be compared to the 14th-century <a href="/wiki/Middle_English" title="Middle English">Middle English</a> expression <span title="Middle English (1100-1500)-language text"><i lang="enm">appel of paradis</i></span>, meaning a <a href="/wiki/Banana" title="Banana">banana</a>.<sup id="cite_ref-4" class="reference"><a href="#cite_note-4"><span class="cite-bracket">[</span>4<span class="cite-bracket">]</span></a></sup>
+</p>
+<div class="mw-heading mw-heading2"><h2 id="Description">Description</h2></div>
+<p>The apple is a <a href="/wiki/Deciduous" title="Deciduous">deciduous</a> tree, generally standing 2 to 4.5 metres (6 to 15 feet) tall in cultivation and up to 15&nbsp;m (49&nbsp;ft) in the wild, though more typically 2 to 10&nbsp;m (6.5 to 33&nbsp;ft).<sup id="cite_ref-UofGeorgia_5-0" class="reference"><a href="#cite_note-UofGeorgia-5"><span class="cite-bracket">[</span>5<span class="cite-bracket">]</span></a></sup><sup id="cite_ref-FNA_1-1" class="reference"><a href="#cite_note-FNA-1"><span class="cite-bracket">[</span>1<span class="cite-bracket">]</span></a></sup> When cultivated, the size, shape and branch density are determined by <a href="/wiki/Rootstock" title="Rootstock">rootstock</a> selection and trimming method.<sup id="cite_ref-UofGeorgia_5-1" class="reference"><a href="#cite_note-UofGeorgia-5"><span class="cite-bracket">[</span>5<span class="cite-bracket">]</span></a></sup> Apple trees may naturally have a rounded to erect crown with a dense canopy of leaves.<sup id="cite_ref-NC_Extension_6-0" class="reference"><a href="#cite_note-NC_Extension-6"><span class="cite-bracket">[</span>6<span class="cite-bracket">]</span></a></sup> The bark of the trunk is dark gray or gray-brown, but young branches are reddish or dark-brown with a smooth texture.<sup id="cite_ref-FNA_1-2" class="reference"><a href="#cite_note-FNA-1"><span class="cite-bracket">[</span>1<span class="cite-bracket">]</span></a></sup><sup id="cite_ref-Heil_et_al._7-0" class="reference"><a href="#cite_note-Heil_et_al.-7"><span class="cite-bracket">[</span>7<span class="cite-bracket">]</span></a></sup> When young, twigs are covered in very fine downy hairs; they become hairless as they become older.<sup id="cite_ref-Heil_et_al._7-1" class="reference"><a href="#cite_note-Heil_et_al.-7"><span class="cite-bracket">[</span>7<span class="cite-bracket">]</span></a></sup>
+</p><p>The buds are egg-shaped and dark red or purple in color; they range in size from 3 to 5&nbsp;millimeters, but are usually less than 4&nbsp;mm. The <a href="/wiki/Bud_scale" class="mw-redirect" title="Bud scale">bud scales</a> have very hairy edges. When emerging from the buds, the leaves are <dfn><a href="/wiki/Glossary_of_botanical_terms#convolute" title="Glossary of botanical terms"><span title="See entry at: Glossary of botanical terms § convolute" style="color:inherit;" class="glossary-link">convolute</span></a></dfn>, meaning that their edges overlap each other.<sup id="cite_ref-FNA_1-3" class="reference"><a href="#cite_note-FNA-1"><span class="cite-bracket">[</span>1<span class="cite-bracket">]</span></a></sup> Leaves can be  simple ovals (<a href="/wiki/Elliptic_leaves" class="mw-redirect" title="Elliptic leaves">elliptic</a>), medium or wide in width, somewhat egg-shaped with the wider portion toward their base (<a href="/wiki/Ovate_leaves" class="mw-redirect" title="Ovate leaves">ovate</a>), or even with sides that are more parallel to each other instead of curved (<a href="/wiki/Oblong_leaves" class="mw-redirect" title="Oblong leaves">oblong</a>) with a narrow pointed end.<sup id="cite_ref-Heil_et_al._7-2" class="reference"><a href="#cite_note-Heil_et_al.-7"><span class="cite-bracket">[</span>7<span class="cite-bracket">]</span></a></sup><sup id="cite_ref-FNA_1-4" class="reference"><a href="#cite_note-FNA-1"><span class="cite-bracket">[</span>1<span class="cite-bracket">]</span></a></sup> The edges have broadly-angled teeth, but do not have lobes. 
The top surface of the leaves are <dfn><a href="/wiki/Glossary_of_botanical_terms#glabrescent" title="Glossary of botanical terms"><span title="See entry at: Glossary of botanical terms § glabrescent" style="color:inherit;" class="glossary-link">glabrescent</span></a></dfn>, almost hairless, while the undersides are densely covered in fine hairs.<sup id="cite_ref-FNA_1-5" class="reference"><a href="#cite_note-FNA-1"><span class="cite-bracket">[</span>1<span class="cite-bracket">]</span></a></sup> The leaves are attached <a href="/wiki/Alternate_leaf" class="mw-redirect" title="Alternate leaf">alternately</a> by short leaf stems <style data-mw-deduplicate="TemplateStyles:r1154941027">.mw-parser-output .frac{white-space:nowrap}.mw-parser-output .frac .num,.mw-parser-output .frac .den{font-size:80%;line-height:0;vertical-align:super}.mw-parser-output .frac .den{vertical-align:sub}.mw-parser-output .sr-only{border:0;clip:rect(0,0,0,0);clip-path:polygon(0px 0px,0px 0px,0px 0px);height:1px;margin:-1px;overflow:hidden;padding:0;position:absolute;width:1px}</style>1-to-3.5&nbsp;cm (<span class="frac"><span class="num">1</span>⁄<span class="den">2</span></span>-to-<span class="frac">1<span class="sr-only">+</span><span class="num">1</span>⁄<span class="den">2</span></span>&nbsp;in) long.<sup id="cite_ref-NC_Extension_6-1" class="reference"><a href="#cite_note-NC_Extension-6"><span class="cite-bracket">[</span>6<span class="cite-bracket">]</span></a></sup><sup id="cite_ref-FNA_1-6" class="reference"><a href="#cite_note-FNA-1"><span class="cite-bracket">[</span>1<span class="cite-bracket">]</span></a></sup>
+</p><p><a href="/wiki/Blossoms" class="mw-redirect" title="Blossoms">Blossoms</a> are produced in <a href="/wiki/Spring_(season)" title="Spring (season)">spring</a> simultaneously with the budding of the leaves and are produced on spurs and some long <a href="/wiki/Shoot_(botany)" title="Shoot (botany)">shoots</a>.<sup id="cite_ref-UofGeorgia_5-2" class="reference"><a href="#cite_note-UofGeorgia-5"><span class="cite-bracket">[</span>5<span class="cite-bracket">]</span></a></sup> When the flower buds first begin to open, the <a href="/wiki/Petal" title="Petal">petals</a> are rose-pink and fade to white or light pink when fully open with each flower <link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1154941027">3-to-4-centimeter (1-to-<span class="frac">1<span class="sr-only">+</span><span class="num">1</span>⁄<span class="den">2</span></span>-inch) in diameter.<sup id="cite_ref-FNA_1-7" class="reference"><a href="#cite_note-FNA-1"><span class="cite-bracket">[</span>1<span class="cite-bracket">]</span></a></sup> The five-petaled flowers are grouped in an <a href="/wiki/Inflorescence" title="Inflorescence">inflorescence</a> consisting of a <a href="/wiki/Cyme_(botany)" class="mw-redirect" title="Cyme (botany)">cyme</a> with 3–7 flowers.<sup id="cite_ref-Lim_2012_8-0" class="reference"><a href="#cite_note-Lim_2012-8"><span class="cite-bracket">[</span>8<span class="cite-bracket">]</span></a></sup> The central flower of the inflorescence is called the "king bloom"; it opens first and can develop a larger fruit.<sup id="cite_ref-NC_Extension_6-2" class="reference"><a href="#cite_note-NC_Extension-6"><span class="cite-bracket">[</span>6<span class="cite-bracket">]</span></a></sup> Open apple blossoms are damaged by even brief exposures to temperatures −2&nbsp;°C (28&nbsp;°F) or less, although the overwintering wood and buds are hardy down to −40&nbsp;°C (−40&nbsp;°F).<sup id="cite_ref-Lim_2012_8-1" class="reference"><a href="#cite_note-Lim_2012-8"><span 
class="cite-bracket">[</span>8<span class="cite-bracket">]</span></a></sup>
+</p>
+<style data-mw-deduplicate="TemplateStyles:r1248256098">@media all and (max-width:720px){.mw-parser-output .mod-gallery{width:100%!important}}.mw-parser-output .mod-gallery{display:table}.mw-parser-output .mod-gallery-default{background:transparent;margin-top:4px}.mw-parser-output .mod-gallery-center{margin-left:auto;margin-right:auto}.mw-parser-output .mod-gallery-left{float:left}.mw-parser-output .mod-gallery-right{float:right}.mw-parser-output .mod-gallery-none{float:none}.mw-parser-output .mod-gallery-collapsible{width:100%}.mw-parser-output .mod-gallery .title,.mw-parser-output .mod-gallery .main,.mw-parser-output .mod-gallery .footer{display:table-row}.mw-parser-output .mod-gallery .title>div{display:table-cell;padding:0 4px 4px;text-align:center;font-weight:bold}.mw-parser-output .mod-gallery .main>div{display:table-cell}.mw-parser-output .mod-gallery .gallery{line-height:1.35em}.mw-parser-output .mod-gallery .footer>div{display:table-cell;padding:4px;text-align:right;font-size:85%;line-height:1em}.mw-parser-output .mod-gallery .title>div *,.mw-parser-output .mod-gallery .footer>div *{overflow:visible}.mw-parser-output .mod-gallery .gallerybox img{background:none!important}.mw-parser-output .mod-gallery .bordered-images .thumb img{border:solid var(--background-color-neutral,#eaecf0)1px}.mw-parser-output .mod-gallery .whitebg .thumb{background:var(--background-color-base,#fff)!important}</style><div class="mod-gallery mod-gallery-default mod-gallery-center"><div class="main"><div><ul class="gallery mw-gallery-packed nochecker bordered-images whitebg">
+		<li class="gallerybox" style="width: 268.382px;">
+			<div class="thumb" style="width: 266.382px;"><span typeof="mw:File"><a href="/wiki/File:Apple_Blossom_@_Manali.jpg" class="mw-file-description" title="Apple blossoms"><img alt="Apple blossoms" src="//upload.wikimedia.org/wikipedia/commons/thumb/b/b3/Apple_Blossom_%40_Manali.jpg/405px-Apple_Blossom_%40_Manali.jpg" decoding="async" width="405" height="270" class="mw-file-element" srcset="//upload.wikimedia.org/wikipedia/commons/thumb/b/b3/Apple_Blossom_%40_Manali.jpg/608px-Apple_Blossom_%40_Manali.jpg 1.5x, //upload.wikimedia.org/wikipedia/commons/thumb/b/b3/Apple_Blossom_%40_Manali.jpg/810px-Apple_Blossom_%40_Manali.jpg 2x" data-file-width="6000" data-file-height="4000"></a></span></div>
+			<div class="gallerytext">Apple blossoms</div>
+		</li>
+		<li class="gallerybox" style="width: 143.399px;">
+			<div class="thumb" style="width: 142.071px;"><span typeof="mw:File"><a href="/wiki/File:Malus_domestica_-_K%C3%B6hler%E2%80%93s_Medizinal-Pflanzen-108.jpg" class="mw-file-description" title="Botanical illustration"><img alt="Botanical illustration" src="//upload.wikimedia.org/wikipedia/commons/thumb/c/c9/Malus_domestica_-_K%C3%B6hler%E2%80%93s_Medizinal-Pflanzen-108.jpg/215px-Malus_domestica_-_K%C3%B6hler%E2%80%93s_Medizinal-Pflanzen-108.jpg" decoding="async" width="215" height="270" class="mw-file-element" srcset="//upload.wikimedia.org/wikipedia/commons/thumb/c/c9/Malus_domestica_-_K%C3%B6hler%E2%80%93s_Medizinal-Pflanzen-108.jpg/322px-Malus_domestica_-_K%C3%B6hler%E2%80%93s_Medizinal-Pflanzen-108.jpg 1.5x, //upload.wikimedia.org/wikipedia/commons/thumb/c/c9/Malus_domestica_-_K%C3%B6hler%E2%80%93s_Medizinal-Pflanzen-108.jpg/430px-Malus_domestica_-_K%C3%B6hler%E2%80%93s_Medizinal-Pflanzen-108.jpg 2x" data-file-width="465" data-file-height="584"></a></span></div>
+			<div class="gallerytext">Botanical illustration</div>
+		</li>
+</ul></div></div></div>
+<div class="mw-heading mw-heading3"><h3 id="Fruit">Fruit</h3></div>
+<p>The <a href="/wiki/Fruit" title="Fruit">fruit</a> is a <a href="/wiki/Pome" title="Pome">pome</a> that matures in late <a href="/wiki/Summer" title="Summer">summer</a> or <a href="/wiki/Autumn" title="Autumn">autumn</a>.<sup id="cite_ref-FNA_1-8" class="reference"><a href="#cite_note-FNA-1"><span class="cite-bracket">[</span>1<span class="cite-bracket">]</span></a></sup> The true fruits or <a href="/wiki/Carpel" class="mw-redirect" title="Carpel">carpels</a> are the harder interior chambers inside the apple's core. There are usually five carpels inside an apple, but there may be as few as three. Each of the chambers contains one or two seeds.<sup id="cite_ref-9" class="reference"><a href="#cite_note-9"><span class="cite-bracket">[</span>9<span class="cite-bracket">]</span></a></sup> The edible flesh is formed from the receptacle at the base of the flower.<sup id="cite_ref-10" class="reference"><a href="#cite_note-10"><span class="cite-bracket">[</span>10<span class="cite-bracket">]</span></a></sup>
+</p>
+<ul class="gallery mw-gallery-nolines center">
+		<li class="gallerybox" style="width: 405px">
+			<div class="thumb" style="width: 400px;"><span typeof="mw:File"><a href="/wiki/File:Apple_anatomy,_flower_and_fruit_compared.svg" class="mw-file-description" title="How apple fruit derives from flower structures"><img alt="How apple fruit derives from flower structures" src="//upload.wikimedia.org/wikipedia/commons/thumb/e/e8/Apple_anatomy%2C_flower_and_fruit_compared.svg/400px-Apple_anatomy%2C_flower_and_fruit_compared.svg.png" decoding="async" width="400" height="225" class="mw-file-element" srcset="//upload.wikimedia.org/wikipedia/commons/thumb/e/e8/Apple_anatomy%2C_flower_and_fruit_compared.svg/600px-Apple_anatomy%2C_flower_and_fruit_compared.svg.png 1.5x, //upload.wikimedia.org/wikipedia/commons/thumb/e/e8/Apple_anatomy%2C_flower_and_fruit_compared.svg/800px-Apple_anatomy%2C_flower_and_fruit_compared.svg.png 2x" data-file-width="1280" data-file-height="720"></a></span></div>
+			<div class="gallerytext">How apple fruit derives from flower structures</div>
+		</li>
+</ul>
+<p>The seeds are egg- to pear-shaped and may be colored from light brown or tan to a very dark brown, often with red shades or even purplish-black. They may have a blunt or sharp point.<sup id="cite_ref-11" class="reference"><a href="#cite_note-11"><span class="cite-bracket">[</span>11<span class="cite-bracket">]</span></a></sup> The five sepals remain attached and stand out from the surface of the apple.<sup id="cite_ref-FNA_1-9" class="reference"><a href="#cite_note-FNA-1"><span class="cite-bracket">[</span>1<span class="cite-bracket">]</span></a></sup>
+</p><p>The fruit varies widely in size between cultivars, but generally has a diameter between 2.5 and 12&nbsp;cm (1 and 5&nbsp;in).<sup id="cite_ref-Heil_et_al._7-3" class="reference"><a href="#cite_note-Heil_et_al.-7"><span class="cite-bracket">[</span>7<span class="cite-bracket">]</span></a></sup> The shape is quite variable and may be nearly round, elongated, conical, or short and wide.<sup id="cite_ref-12" class="reference"><a href="#cite_note-12"><span class="cite-bracket">[</span>12<span class="cite-bracket">]</span></a></sup>
+</p><p>The groundcolor of ripe apples is yellow, green, yellow-green or whitish yellow. The overcolor of ripe apples can be orange-red, pink-red, red, purple-red or brown-red.  The overcolor amount can be 0–100%.<sup id="cite_ref-Janick_13-0" class="reference"><a href="#cite_note-Janick-13"><span class="cite-bracket">[</span>13<span class="cite-bracket">]</span></a></sup> The skin may be wholly or partly <a href="/wiki/Russeting" title="Russeting">russeted</a>, making it rough and brown. The skin is covered in a protective layer of <a href="/wiki/Epicuticular_wax" title="Epicuticular wax">epicuticular wax</a>.<sup id="cite_ref-14" class="reference"><a href="#cite_note-14"><span class="cite-bracket">[</span>14<span class="cite-bracket">]</span></a></sup> The skin may also be marked with scattered dots.<sup id="cite_ref-FNA_1-10" class="reference"><a href="#cite_note-FNA-1"><span class="cite-bracket">[</span>1<span class="cite-bracket">]</span></a></sup> The flesh is generally pale yellowish-white, though it can be pink, yellow or green.<sup id="cite_ref-Janick_13-1" class="reference"><a href="#cite_note-Janick-13"><span class="cite-bracket">[</span>13<span class="cite-bracket">]</span></a></sup>
+</p>
+<ul class="gallery mw-gallery-packed">
+	<li class="gallerycaption">Apples can have any amount of overcolor, a darker tint over a pale groundcolor.</li>
+		<li class="gallerybox" style="width: 99.3281px;">
+			<div class="thumb" style="width: 98px;"><span typeof="mw:File"><a href="/wiki/File:Yellow_Transparent_(cropped).jpg" class="mw-file-description" title="0% overcolor"><img alt="0% overcolor" src="//upload.wikimedia.org/wikipedia/commons/thumb/a/a2/Yellow_Transparent_%28cropped%29.jpg/146px-Yellow_Transparent_%28cropped%29.jpg" decoding="async" width="146" height="179" class="mw-file-element" srcset="//upload.wikimedia.org/wikipedia/commons/thumb/a/a2/Yellow_Transparent_%28cropped%29.jpg/220px-Yellow_Transparent_%28cropped%29.jpg 1.5x, //upload.wikimedia.org/wikipedia/commons/thumb/a/a2/Yellow_Transparent_%28cropped%29.jpg/293px-Yellow_Transparent_%28cropped%29.jpg 2x" data-file-width="748" data-file-height="919"></a></span></div>
+			<div class="gallerytext">0% overcolor</div>
+		</li>
+		<li class="gallerybox" style="width: 115.328px;">
+			<div class="thumb" style="width: 114px;"><span typeof="mw:File"><a href="/wiki/File:Lobo_(apple)_(cropped).jpg" class="mw-file-description" title="100% overcolor"><img alt="100% overcolor" src="//upload.wikimedia.org/wikipedia/commons/thumb/f/f1/Lobo_%28apple%29_%28cropped%29.jpg/170px-Lobo_%28apple%29_%28cropped%29.jpg" decoding="async" width="170" height="180" class="mw-file-element" srcset="//upload.wikimedia.org/wikipedia/commons/thumb/f/f1/Lobo_%28apple%29_%28cropped%29.jpg/255px-Lobo_%28apple%29_%28cropped%29.jpg 1.5x, //upload.wikimedia.org/wikipedia/commons/thumb/f/f1/Lobo_%28apple%29_%28cropped%29.jpg/340px-Lobo_%28apple%29_%28cropped%29.jpg 2x" data-file-width="1327" data-file-height="1406"></a></span></div>
+			<div class="gallerytext">100% overcolor</div>
+		</li>
+</ul>
+<div class="mw-heading mw-heading3"><h3 id="Chemistry">Chemistry</h3></div>
+<p>Important volatile compounds in apples that contribute to their scent and flavour include <a href="/wiki/Acetaldehyde" title="Acetaldehyde">acetaldehyde</a>, <a href="/wiki/Ethyl_acetate" title="Ethyl acetate">ethyl acetate</a>, <a href="/wiki/Butyraldehyde" title="Butyraldehyde">1-butanal</a>, <a href="/wiki/Ethanol" title="Ethanol">ethanol</a>, 2-methylbutanal, <a href="/wiki/3-methylbutanal" class="mw-redirect" title="3-methylbutanal">3-methylbutanal</a>, <a href="/wiki/Ethyl_propionate" title="Ethyl propionate">ethyl propionate</a>, ethyl 2-methylpropionate, <a href="/wiki/Ethyl_butyrate" title="Ethyl butyrate">ethyl butyrate</a>, ethyl 2-methyl butyrate, <a href="/wiki/Hexanal" title="Hexanal">hexanal</a>, <a href="/wiki/1-butanol" class="mw-redirect" title="1-butanol">1-butanol</a>, <a href="/wiki/3-methylbutyl_acetate" class="mw-redirect" title="3-methylbutyl acetate">3-methylbutyl acetate</a>, 2-methylbutyl acetate, 1-propyl butyrate, <a href="/wiki/Ethyl_pentanoate" title="Ethyl pentanoate">ethyl pentanoate</a>, <a href="/wiki/Amyl_acetate" title="Amyl acetate">amyl acetate</a>, <a href="/wiki/2-methyl-1-butanol" class="mw-redirect" title="2-methyl-1-butanol">2-methyl-1-butanol</a>, trans-2-hexenal, <a href="/wiki/Ethyl_hexanoate" title="Ethyl hexanoate">ethyl hexanoate</a>, <a href="/wiki/Hexanol" title="Hexanol">hexanol</a>.<sup id="cite_ref-15" class="reference"><a href="#cite_note-15"><span class="cite-bracket">[</span>15<span class="cite-bracket">]</span></a></sup><sup id="cite_ref-16" class="reference"><a href="#cite_note-16"><span class="cite-bracket">[</span>16<span class="cite-bracket">]</span></a></sup>
+</p>
+<div class="mw-heading mw-heading2"><h2 id="Taxonomy">Taxonomy</h2></div>
+<p>The apple as a species has more than 100 alternative scientific names, or <a href="/wiki/Synonym_(taxonomy)" title="Synonym (taxonomy)">synonyms</a>.<sup id="cite_ref-Proposal_to_conserve_17-0" class="reference"><a href="#cite_note-Proposal_to_conserve-17"><span class="cite-bracket">[</span>17<span class="cite-bracket">]</span></a></sup> In modern times, <i>Malus pumila</i> and <i>Malus domestica</i> are the two main names in use. <i>M.&nbsp;pumila</i> is the older name, but <i>M.&nbsp;domestica</i> has become much more commonly used starting in the 21st century, especially in the western world. Two proposals were made to make <i>M.&nbsp;domestica</i> a <a href="/wiki/Conserved_name" title="Conserved name">conserved name</a>: the earlier proposal was voted down by the Committee for Vascular Plants of the <a href="/wiki/International_Association_for_Plant_Taxonomy" title="International Association for Plant Taxonomy">IAPT</a> in 2014, but in April 2017 the Committee decided, with a narrow majority, that the newly popular name should be conserved.<sup id="cite_ref-18" class="reference"><a href="#cite_note-18"><span class="cite-bracket">[</span>18<span class="cite-bracket">]</span></a></sup> The General Committee of the IAPT decided in June 2017 to approve this change, officially conserving <i>M.&nbsp;domestica</i>.<sup id="cite_ref-19" class="reference"><a href="#cite_note-19"><span class="cite-bracket">[</span>19<span class="cite-bracket">]</span></a></sup> Nevertheless, some works published after 2017 still use <i>M.&nbsp;pumila</i> as the <a href="/wiki/Correct_name" title="Correct name">correct name</a>, under an alternate taxonomy.<sup id="cite_ref-POWO_2-1" class="reference"><a href="#cite_note-POWO-2"><span class="cite-bracket">[</span>2<span class="cite-bracket">]</span></a></sup>
+</p><p>When first classified by <a href="/wiki/Linnaeus" class="mw-redirect" title="Linnaeus">Linnaeus</a> in 1753, the pears, apples, and quinces were combined into one genus that he named <i><a href="/wiki/Pyrus" class="mw-redirect" title="Pyrus">Pyrus</a></i> and he named the apple as <i>Pyrus malus</i>. This was widely accepted, however the botanist <a href="/wiki/Philip_Miller" title="Philip Miller">Philip Miller</a> published an alternate classification in <a href="/wiki/The_Gardeners_Dictionary" title="The Gardeners Dictionary">The Gardeners Dictionary</a> with the apple species separated from <i>Pyrus</i> in 1754. He did not clearly indicate that by <i>Malus pumila</i> he meant the domesticated apple. Nonetheless, it was used as such by many botanists. When <a href="/wiki/Moritz_Balthasar_Borkhausen" title="Moritz Balthasar Borkhausen">Moritz Balthasar Borkhausen</a> published his scientific description of the apple in 1803 it may have been a new combination of <i>P.&nbsp;malus</i> var. <i>domestica</i>, but this was not directly referenced by Borkhausen.<sup id="cite_ref-Proposal_to_conserve_17-1" class="reference"><a href="#cite_note-Proposal_to_conserve-17"><span class="cite-bracket">[</span>17<span class="cite-bracket">]</span></a></sup> The earliest use of var. <i>domestica</i> for the apple was by <a href="/wiki/Georg_Adolf_Suckow" title="Georg Adolf Suckow">Georg Adolf Suckow</a> in 1786.<sup id="cite_ref-POWO_2-2" class="reference"><a href="#cite_note-POWO-2"><span class="cite-bracket">[</span>2<span class="cite-bracket">]</span></a></sup>
+</p>
+<div class="mw-heading mw-heading3"><h3 id="Genome">Genome</h3></div>
+<link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1236090951"><div role="note" class="hatnote navigation-not-searchable">Further information: <a href="/wiki/Apple_genome" title="Apple genome">Apple genome</a></div>
+<p>Apples are <a href="/wiki/Diploid" class="mw-redirect" title="Diploid">diploid</a>, with two sets of <a href="/wiki/Chromosome" title="Chromosome">chromosomes</a> per cell (though triploid cultivars, with three sets, are not uncommon), have 17 chromosomes and an estimated <a href="/wiki/Genome" title="Genome">genome</a> size of approximately 650 Mb. Several whole genome sequences have been completed and made available. The first one in 2010 was based on the diploid cultivar '<a href="/wiki/Golden_Delicious" title="Golden Delicious">Golden Delicious</a>'.<sup id="cite_ref-Velasco_et_al._20-0" class="reference"><a href="#cite_note-Velasco_et_al.-20"><span class="cite-bracket">[</span>20<span class="cite-bracket">]</span></a></sup> However, this first whole genome sequence contained several errors,<sup id="cite_ref-21" class="reference"><a href="#cite_note-21"><span class="cite-bracket">[</span>21<span class="cite-bracket">]</span></a></sup> in part owing to the high degree of <a href="/wiki/Heterozygosity" class="mw-redirect" title="Heterozygosity">heterozygosity</a> in diploid apples which, in combination with an ancient genome duplication, complicated the assembly. Recently, double- and trihaploid individuals have been sequenced, yielding whole genome sequences of higher quality.<sup id="cite_ref-Daccord_et_al._22-0" class="reference"><a href="#cite_note-Daccord_et_al.-22"><span class="cite-bracket">[</span>22<span class="cite-bracket">]</span></a></sup><sup id="cite_ref-Zhang_et_al._23-0" class="reference"><a href="#cite_note-Zhang_et_al.-23"><span class="cite-bracket">[</span>23<span class="cite-bracket">]</span></a></sup>
+</p><p>The first whole genome assembly was estimated to contain around 57,000 genes,<sup id="cite_ref-Velasco_et_al._20-1" class="reference"><a href="#cite_note-Velasco_et_al.-20"><span class="cite-bracket">[</span>20<span class="cite-bracket">]</span></a></sup> though the more recent genome sequences support estimates between 42,000 and 44,700 protein-coding genes.<sup id="cite_ref-Daccord_et_al._22-1" class="reference"><a href="#cite_note-Daccord_et_al.-22"><span class="cite-bracket">[</span>22<span class="cite-bracket">]</span></a></sup><sup id="cite_ref-Zhang_et_al._23-1" class="reference"><a href="#cite_note-Zhang_et_al.-23"><span class="cite-bracket">[</span>23<span class="cite-bracket">]</span></a></sup> The availability of whole genome sequences has provided evidence that the wild ancestor of the cultivated apple most likely is <i>Malus sieversii</i>. Re-sequencing of multiple accessions has supported this, while also suggesting extensive introgression from <i>Malus sylvestris</i> following domestication.<sup id="cite_ref-Duan_2017_24-0" class="reference"><a href="#cite_note-Duan_2017-24"><span class="cite-bracket">[</span>24<span class="cite-bracket">]</span></a></sup>
+</p>
+<div class="mw-heading mw-heading2"><h2 id="Cultivation">Cultivation</h2></div>
+<div class="mw-heading mw-heading3"><h3 id="History">History</h3></div>
+<figure class="mw-default-size" typeof="mw:File/Thumb"><a href="/wiki/File:Apple_origins_map.svg" class="mw-file-description"><img src="//upload.wikimedia.org/wikipedia/commons/thumb/3/31/Apple_origins_map.svg/550px-Apple_origins_map.svg.png" decoding="async" width="550" height="310" class="mw-file-element" srcset="//upload.wikimedia.org/wikipedia/commons/thumb/3/31/Apple_origins_map.svg/825px-Apple_origins_map.svg.png 1.5x, //upload.wikimedia.org/wikipedia/commons/thumb/3/31/Apple_origins_map.svg/1100px-Apple_origins_map.svg.png 2x" data-file-width="1280" data-file-height="720"></a><figcaption>Map of the origins of the cultivated apple. The wild origin is in Kazakhstan; hybridisations and repeated domestications followed, modifying many attributes of the fruit.<sup id="cite_ref-Duan_2017_24-1" class="reference"><a href="#cite_note-Duan_2017-24"><span class="cite-bracket">[</span>24<span class="cite-bracket">]</span></a></sup></figcaption></figure>
+<figure class="mw-default-size" typeof="mw:File/Thumb"><a href="/wiki/File:95apple.jpeg" class="mw-file-description"><img alt="color photograph of a hand holding a red apple" src="//upload.wikimedia.org/wikipedia/commons/thumb/9/92/95apple.jpeg/220px-95apple.jpeg" decoding="async" width="220" height="165" class="mw-file-element" srcset="//upload.wikimedia.org/wikipedia/commons/thumb/9/92/95apple.jpeg/330px-95apple.jpeg 1.5x, //upload.wikimedia.org/wikipedia/commons/thumb/9/92/95apple.jpeg/440px-95apple.jpeg 2x" data-file-width="600" data-file-height="450"></a><figcaption>Wild <i><a href="/wiki/Malus_sieversii" title="Malus sieversii">Malus sieversii</a></i> apple in Kazakhstan</figcaption></figure>
+<p><a href="/wiki/Central_Asia" title="Central Asia">Central Asia</a> is generally considered the center of origin for apples due to the genetic variability in specimens there.<sup id="cite_ref-Richards_Volk_2009_25-0" class="reference"><a href="#cite_note-Richards_Volk_2009-25"><span class="cite-bracket">[</span>25<span class="cite-bracket">]</span></a></sup> The wild ancestor of <i>Malus domestica</i> was <i><a href="/wiki/Malus_sieversii" title="Malus sieversii">Malus sieversii</a></i>, found growing wild in the <a href="/wiki/Mountains_of_Central_Asia" title="Mountains of Central Asia">mountains of Central Asia</a> in southern <a href="/wiki/Kazakhstan" title="Kazakhstan">Kazakhstan</a>, <a href="/wiki/Kyrgyzstan" title="Kyrgyzstan">Kyrgyzstan</a>, <a href="/wiki/Tajikistan" title="Tajikistan">Tajikistan</a>, and <a href="/wiki/Xinjiang" title="Xinjiang">northwestern China</a>.<sup id="cite_ref-UofGeorgia_5-3" class="reference"><a href="#cite_note-UofGeorgia-5"><span class="cite-bracket">[</span>5<span class="cite-bracket">]</span></a></sup><sup id="cite_ref-26" class="reference"><a href="#cite_note-26"><span class="cite-bracket">[</span>26<span class="cite-bracket">]</span></a></sup> Cultivation of the species, most likely beginning on the forested flanks of the <a href="/wiki/Tian_Shan" title="Tian Shan">Tian Shan</a> mountains, progressed over a long period of time and permitted secondary <a href="/wiki/Introgression" title="Introgression">introgression</a> of genes from other species into the open-pollinated seeds. Significant exchange with <i><a href="/wiki/Malus_sylvestris" title="Malus sylvestris">Malus sylvestris</a></i>, the crabapple, resulted in populations of apples being more related to crabapples than to the more <a href="/wiki/Morphology_(biology)" title="Morphology (biology)">morphologically</a> similar progenitor <i>Malus sieversii</i>. 
In strains without recent admixture the contribution of the latter predominates.<sup id="cite_ref-Cornille_2012_27-0" class="reference"><a href="#cite_note-Cornille_2012-27"><span class="cite-bracket">[</span>27<span class="cite-bracket">]</span></a></sup><sup id="cite_ref-28" class="reference"><a href="#cite_note-28"><span class="cite-bracket">[</span>28<span class="cite-bracket">]</span></a></sup><sup id="cite_ref-29" class="reference"><a href="#cite_note-29"><span class="cite-bracket">[</span>29<span class="cite-bracket">]</span></a></sup>
+</p><p>The apple is thought to have been domesticated 4,000–10,000 years ago in the <a href="/wiki/Tian_Shan" title="Tian Shan">Tian Shan</a> mountains, and then to have travelled along the <a href="/wiki/Silk_Road" title="Silk Road">Silk Road</a> to Europe, with hybridization and introgression of wild crabapples from Siberia (<i>M.&nbsp;baccata</i>), the Caucasus (<i>M.&nbsp;orientalis</i>), and Europe (<i>M.&nbsp;sylvestris</i>). Only the <i>M.&nbsp;sieversii</i> trees growing on the western side of the Tian Shan mountains contributed genetically to the domesticated apple, not the isolated population on the eastern side.<sup id="cite_ref-Duan_2017_24-2" class="reference"><a href="#cite_note-Duan_2017-24"><span class="cite-bracket">[</span>24<span class="cite-bracket">]</span></a></sup>
+</p><p>Chinese soft apples, such as <i><a href="/wiki/Malus_asiatica" title="Malus asiatica">M.&nbsp;asiatica</a></i> and <i><a href="/wiki/Malus_prunifolia" title="Malus prunifolia">M.&nbsp;prunifolia</a></i>, have been cultivated as dessert apples for more than 2,000 years in China. These are thought to be hybrids between <i>M.&nbsp;baccata</i> and <i>M.&nbsp;sieversii</i> in Kazakhstan.<sup id="cite_ref-Duan_2017_24-3" class="reference"><a href="#cite_note-Duan_2017-24"><span class="cite-bracket">[</span>24<span class="cite-bracket">]</span></a></sup>
+</p><p>Among the traits selected for by human growers are size, fruit acidity, color, firmness, and soluble sugar. Unusually for domesticated fruits, the wild <i>M.&nbsp;sieversii</i> origin is only slightly smaller than the modern domesticated apple.<sup id="cite_ref-Duan_2017_24-4" class="reference"><a href="#cite_note-Duan_2017-24"><span class="cite-bracket">[</span>24<span class="cite-bracket">]</span></a></sup>
+</p><p>At the Sammardenchia-Cueis site near Udine in Northeastern Italy, seeds from some form of apples have been found in material carbon dated to between 6570 and 5684 BCE.<sup id="cite_ref-30" class="reference"><a href="#cite_note-30"><span class="cite-bracket">[</span>30<span class="cite-bracket">]</span></a></sup> Genetic analysis has not yet been successfully used to determine whether such ancient apples were wild <i>Malus sylvestris</i> or <i>Malus domestica</i> containing <i>Malus sieversii</i> ancestry. It is hard to distinguish in the archeological record between foraged wild apples and apple plantations.<sup id="cite_ref-Ancient_DNA_31-0" class="reference"><a href="#cite_note-Ancient_DNA-31"><span class="cite-bracket">[</span>31<span class="cite-bracket">]</span></a></sup>
+</p><p>There is indirect evidence of apple cultivation in the third millennium BCE in the <a href="/wiki/Middle_East" title="Middle East">Middle East</a>.<sup id="cite_ref-Ancient_DNA_31-1" class="reference"><a href="#cite_note-Ancient_DNA-31"><span class="cite-bracket">[</span>31<span class="cite-bracket">]</span></a></sup> There is direct evidence, apple cores, dated to the 10th century BCE from a Judean site between the Sinai and Negev.
+<sup id="cite_ref-32" class="reference"><a href="#cite_note-32"><span class="cite-bracket">[</span>32<span class="cite-bracket">]</span></a></sup> There was substantial apple production in European classical antiquity, and grafting was certainly known then.<sup id="cite_ref-Ancient_DNA_31-2" class="reference"><a href="#cite_note-Ancient_DNA-31"><span class="cite-bracket">[</span>31<span class="cite-bracket">]</span></a></sup> Grafting is an essential part of modern domesticated apple production, to be able to propagate the best cultivars; it is unclear when apple tree grafting was invented.<sup id="cite_ref-Ancient_DNA_31-3" class="reference"><a href="#cite_note-Ancient_DNA-31"><span class="cite-bracket">[</span>31<span class="cite-bracket">]</span></a></sup>
+</p>
+<style data-mw-deduplicate="TemplateStyles:r1235681985">.mw-parser-output .side-box{margin:4px 0;box-sizing:border-box;border:1px solid #aaa;font-size:88%;line-height:1.25em;background-color:var(--background-color-interactive-subtle,#f8f9fa);display:flow-root}.mw-parser-output .side-box-abovebelow,.mw-parser-output .side-box-text{padding:0.25em 0.9em}.mw-parser-output .side-box-image{padding:2px 0 2px 0.9em;text-align:center}.mw-parser-output .side-box-imageright{padding:2px 0.9em 2px 0;text-align:center}@media(min-width:500px){.mw-parser-output .side-box-flex{display:flex;align-items:center}.mw-parser-output .side-box-text{flex:1;min-width:0}}@media(min-width:720px){.mw-parser-output .side-box{width:238px}.mw-parser-output .side-box-right{clear:right;float:right;margin-left:1em}.mw-parser-output .side-box-left{margin-right:1em}}</style><style data-mw-deduplicate="TemplateStyles:r1096940132">.mw-parser-output .listen .side-box-text{line-height:1.1em}.mw-parser-output .listen-plain{border:none;background:transparent}.mw-parser-output .listen-embedded{width:100%;margin:0;border-width:1px 0 0 0;background:transparent}.mw-parser-output .listen-header{padding:2px}.mw-parser-output .listen-embedded .listen-header{padding:2px 0}.mw-parser-output .listen-file-header{padding:4px 0}.mw-parser-output .listen .description{padding-top:2px}.mw-parser-output .listen .mw-tmh-player{max-width:100%}@media(max-width:719px){.mw-parser-output .listen{clear:both}}@media(min-width:720px){.mw-parser-output .listen:not(.listen-noimage){width:320px}.mw-parser-output .listen-left{overflow:visible;float:left}.mw-parser-output .listen-center{float:none;margin-left:auto;margin-right:auto}}</style><div class="side-box side-box-right listen noprint"><style data-mw-deduplicate="TemplateStyles:r1126788409">.mw-parser-output .plainlist ol,.mw-parser-output .plainlist ul{line-height:inherit;list-style:none;margin:0;padding:0}.mw-parser-output .plainlist ol li,.mw-parser-output .plainlist ul 
li{margin-bottom:0}</style>
+<div class="side-box-flex">
+<div class="side-box-image"><span typeof="mw:File"><a href="/wiki/File:Open_book_01.svg" class="mw-file-description"><img src="//upload.wikimedia.org/wikipedia/commons/thumb/f/f3/Open_book_01.svg/60px-Open_book_01.svg.png" decoding="async" width="60" height="60" class="mw-file-element" srcset="//upload.wikimedia.org/wikipedia/commons/thumb/f/f3/Open_book_01.svg/90px-Open_book_01.svg.png 1.5x, //upload.wikimedia.org/wikipedia/commons/thumb/f/f3/Open_book_01.svg/120px-Open_book_01.svg.png 2x" data-file-width="360" data-file-height="360"></a></span></div>
+<div class="side-box-text plainlist"><div class="haudio">
+<div class="listen-file-header"><a href="/wiki/File:Wild_Apples_by_Henry_David_Thoreau_-_read_by_Kevin_S_for_LibriVox%27s_Short_Nonfiction_Collection_Vol._065_(2019).ogg" title="File:Wild Apples by Henry David Thoreau - read by Kevin S for LibriVox's Short Nonfiction Collection Vol. 065 (2019).ogg">"Wild Apples"<br>by Henry David Thoreau<br><small>Read by Kevin S for LibriVox</small></a></div>
+<div><span typeof="mw:File"><span><span class="mw-tmh-player audio mw-file-element" style="width:232px;"><audio id="mwe_player_0_placeholder" preload="none" data-mw-tmh="" class="" width="232" style="width:232px;" data-durationhint="3696" data-mwtitle="Wild_Apples_by_Henry_David_Thoreau_-_read_by_Kevin_S_for_LibriVox's_Short_Nonfiction_Collection_Vol._065_(2019).ogg" data-mwprovider="wikimediacommons" playsinline="" disabled="disabled" tabindex="-1"></audio><a class="mw-tmh-play" href="/wiki/File:Wild_Apples_by_Henry_David_Thoreau_-_read_by_Kevin_S_for_LibriVox%27s_Short_Nonfiction_Collection_Vol._065_(2019).ogg" title="Play audio" role="button"><span class="mw-tmh-play-icon notheme"></span></a><span class="mw-tmh-duration mw-tmh-label"><span class="sr-only">Duration: 1 hour, 1 minute and 36 seconds.</span><span aria-hidden="true">1:01:36</span></span></span></span></span></div>
+<div class="description">Audio 01:01:35 (<a rel="nofollow" class="external text" href="https://archive.org/details/excursions1863thor/page/266">full text</a>)</div></div></div></div>
+<div class="side-box-abovebelow"><hr><i class="selfreference">Problems playing this file? See <a href="/wiki/Help:Media" title="Help:Media">media help</a>.</i></div>
+</div>
+<p>The Roman writer <a href="/wiki/Pliny_the_Elder" title="Pliny the Elder">Pliny the Elder</a> describes a method of storage for apples from his time in the 1st century. He says they should be placed in a room with good air circulation from a north facing window on a bed of straw, chaff, or mats with windfalls kept separately.<sup id="cite_ref-33" class="reference"><a href="#cite_note-33"><span class="cite-bracket">[</span>33<span class="cite-bracket">]</span></a></sup> Though methods like this will extend the availability of reasonably fresh apples, without refrigeration their lifespan is limited. Even sturdy winter apple varieties will only keep well until December in cool climates.<sup id="cite_ref-34" class="reference"><a href="#cite_note-34"><span class="cite-bracket">[</span>34<span class="cite-bracket">]</span></a></sup> For longer storage medieval Europeans strung up cored and peeled apples to dry, either whole or sliced into rings.<sup id="cite_ref-35" class="reference"><a href="#cite_note-35"><span class="cite-bracket">[</span>35<span class="cite-bracket">]</span></a></sup>
+</p><p>Of the many Old World plants that the Spanish introduced to <a href="/wiki/Chilo%C3%A9_Archipelago" title="Chiloé Archipelago">Chiloé Archipelago</a> in the 16th century, apple trees became particularly well adapted.<sup id="cite_ref-Torrejonetal2004_36-0" class="reference"><a href="#cite_note-Torrejonetal2004-36"><span class="cite-bracket">[</span>36<span class="cite-bracket">]</span></a></sup> Apples were introduced to North America by colonists in the 17th century,<sup id="cite_ref-UofGeorgia_5-4" class="reference"><a href="#cite_note-UofGeorgia-5"><span class="cite-bracket">[</span>5<span class="cite-bracket">]</span></a></sup> and the first named apple cultivar was introduced in <a href="/wiki/Boston" title="Boston">Boston</a> by Reverend <a href="/wiki/William_Blaxton" title="William Blaxton">William Blaxton</a> in 1640.<sup id="cite_ref-37" class="reference"><a href="#cite_note-37"><span class="cite-bracket">[</span>37<span class="cite-bracket">]</span></a></sup> The only apples native to North America are <a href="/wiki/Crab_apples" class="mw-redirect" title="Crab apples">crab apples</a>.<sup id="cite_ref-Harrowsmith_38-0" class="reference"><a href="#cite_note-Harrowsmith-38"><span class="cite-bracket">[</span>38<span class="cite-bracket">]</span></a></sup>
+</p><p>Apple cultivars brought as seed from Europe were spread along Native American trade routes, as well as being cultivated on colonial farms. An 1845 United States apple nursery catalogue sold 350 of the "best" cultivars, showing the proliferation of new North American cultivars by the early 19th century.<sup id="cite_ref-Harrowsmith_38-1" class="reference"><a href="#cite_note-Harrowsmith-38"><span class="cite-bracket">[</span>38<span class="cite-bracket">]</span></a></sup> In the 20th century, irrigation projects in <a href="/wiki/Eastern_Washington" title="Eastern Washington">Eastern Washington</a> began and allowed the development of the multibillion-dollar fruit industry, of which the apple is the leading product.<sup id="cite_ref-UofGeorgia_5-5" class="reference"><a href="#cite_note-UofGeorgia-5"><span class="cite-bracket">[</span>5<span class="cite-bracket">]</span></a></sup>
+</p><p>Until the 20th century, farmers stored apples in <a href="/wiki/Root_cellar" title="Root cellar">frostproof cellars</a> during the winter for their own use or for sale. Improved transportation of fresh apples by train and road replaced the necessity for storage.<sup id="cite_ref-39" class="reference"><a href="#cite_note-39"><span class="cite-bracket">[</span>39<span class="cite-bracket">]</span></a></sup><sup id="cite_ref-40" class="reference"><a href="#cite_note-40"><span class="cite-bracket">[</span>40<span class="cite-bracket">]</span></a></sup> <a href="/wiki/Controlled_atmosphere" title="Controlled atmosphere">Controlled atmosphere</a> facilities are used to keep apples fresh year-round. Controlled atmosphere facilities use high humidity, low oxygen, and controlled carbon dioxide levels to maintain fruit freshness. They were first researched at Cambridge University in the 1920s and first used in the United States in the 1950s.<sup id="cite_ref-41" class="reference"><a href="#cite_note-41"><span class="cite-bracket">[</span>41<span class="cite-bracket">]</span></a></sup>
+</p>
+<div class="mw-heading mw-heading3"><h3 id="Breeding">Breeding</h3></div>
+<link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1236090951"><div role="note" class="hatnote navigation-not-searchable">See also: <a href="/wiki/Fruit_tree_propagation" title="Fruit tree propagation">Fruit tree propagation</a> and <a href="/wiki/Malling_series" title="Malling series">Malling series</a></div>
+<figure class="mw-default-size" typeof="mw:File/Thumb"><a href="/wiki/File:Apfelbaum_Winterrambour_Hochstamm.jpg" class="mw-file-description"><img src="//upload.wikimedia.org/wikipedia/commons/thumb/5/51/Apfelbaum_Winterrambour_Hochstamm.jpg/220px-Apfelbaum_Winterrambour_Hochstamm.jpg" decoding="async" width="220" height="147" class="mw-file-element" srcset="//upload.wikimedia.org/wikipedia/commons/thumb/5/51/Apfelbaum_Winterrambour_Hochstamm.jpg/330px-Apfelbaum_Winterrambour_Hochstamm.jpg 1.5x, //upload.wikimedia.org/wikipedia/commons/thumb/5/51/Apfelbaum_Winterrambour_Hochstamm.jpg/440px-Apfelbaum_Winterrambour_Hochstamm.jpg 2x" data-file-width="1792" data-file-height="1200"></a><figcaption>An apple tree in Germany</figcaption></figure>
+<p>Many apples grow readily from seeds. However, apples must be propagated asexually to obtain cuttings with the characteristics of the parent. This is because seedling apples are "<a href="/wiki/Zygosity" title="Zygosity">extreme heterozygotes</a>". Rather than resembling their parents, seedlings are all different from each other and from their parents.<sup id="cite_ref-42" class="reference"><a href="#cite_note-42"><span class="cite-bracket">[</span>42<span class="cite-bracket">]</span></a></sup> <a href="/wiki/Polyploid" class="mw-redirect" title="Polyploid">Triploid</a> cultivars have an additional reproductive barrier in that three sets of chromosomes cannot be divided evenly during meiosis, yielding unequal segregation of the chromosomes (aneuploids). Even in the case when a triploid plant can produce a seed (apples are an example), it occurs infrequently, and seedlings rarely survive.<sup id="cite_ref-43" class="reference"><a href="#cite_note-43"><span class="cite-bracket">[</span>43<span class="cite-bracket">]</span></a></sup>
+</p><p>Because apples are not <a href="/wiki/True-breeding_organism" class="mw-redirect" title="True-breeding organism">true breeders</a> when planted as seeds, propagation usually involves <a href="/wiki/Grafting" title="Grafting">grafting</a> of cuttings. The <a href="/wiki/Rootstock" title="Rootstock">rootstock</a> used for the bottom of the graft can be selected to produce trees of a large variety of sizes, as well as changing the winter hardiness, insect and disease resistance, and soil preference of the resulting tree. Dwarf rootstocks can be used to produce very small trees (less than 3.0&nbsp;m or 10&nbsp;ft high at maturity), which bear fruit many years earlier in their life cycle than full size trees, and are easier to harvest.<sup id="cite_ref-44" class="reference"><a href="#cite_note-44"><span class="cite-bracket">[</span>44<span class="cite-bracket">]</span></a></sup>
+</p><p>Dwarf rootstocks for apple trees can be traced as far back as 300 BCE, to the area of <a href="/wiki/Persia" class="mw-redirect" title="Persia">Persia</a> and <a href="/wiki/Asia_Minor" class="mw-redirect" title="Asia Minor">Asia Minor</a>. <a href="/wiki/Alexander_the_Great" title="Alexander the Great">Alexander the Great</a> sent samples of dwarf apple trees to <a href="/wiki/Aristotle" title="Aristotle">Aristotle</a>'s <a href="/wiki/Lyceum" title="Lyceum">Lyceum</a>. Dwarf rootstocks became common by the 15th century and later went through several cycles of popularity and decline throughout the world.<sup id="cite_ref-45" class="reference"><a href="#cite_note-45"><span class="cite-bracket">[</span>45<span class="cite-bracket">]</span></a></sup> The majority of the rootstocks used to control size in apples were developed in England in the early 1900s. The <a href="/wiki/East_Malling_Research_Station" title="East Malling Research Station">East Malling Research Station</a> conducted extensive research into rootstocks, and their rootstocks are given an "M" prefix to designate their origin. Rootstocks marked with an "MM" prefix are Malling-series cultivars later crossed with trees of '<a href="/wiki/Northern_Spy" title="Northern Spy">Northern Spy</a>' in <a href="/wiki/London_Borough_of_Merton" title="London Borough of Merton">Merton, England</a>.<sup id="cite_ref-46" class="reference"><a href="#cite_note-46"><span class="cite-bracket">[</span>46<span class="cite-bracket">]</span></a></sup>
+</p><p>Most new apple cultivars originate as seedlings, which either arise by chance or are bred by deliberately crossing cultivars with promising characteristics.<sup id="cite_ref-47" class="reference"><a href="#cite_note-47"><span class="cite-bracket">[</span>47<span class="cite-bracket">]</span></a></sup> The words "seedling", "pippin", and "kernel" in the name of an apple cultivar suggest that it originated as a seedling. Apples can also form <a href="/wiki/Bud_sport" class="mw-redirect" title="Bud sport">bud sports</a> (mutations on a single branch). Some bud sports turn out to be improved strains of the parent cultivar. Some differ sufficiently from the parent tree to be considered new cultivars.<sup id="cite_ref-Polomski_&amp;_Reighard_48-0" class="reference"><a href="#cite_note-Polomski_&amp;_Reighard-48"><span class="cite-bracket">[</span>48<span class="cite-bracket">]</span></a></sup>
+</p><p>Apples have been acclimatized in Ecuador at very high altitudes, where they can often, with the needed factors, provide crops twice per year because of constant temperate conditions year-round.<sup id="cite_ref-49" class="reference"><a href="#cite_note-49"><span class="cite-bracket">[</span>49<span class="cite-bracket">]</span></a></sup>
+</p>
+<div class="mw-heading mw-heading3"><h3 id="Pollination">Pollination</h3></div>
+<link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1236090951"><div role="note" class="hatnote navigation-not-searchable">See also: <a href="/wiki/Fruit_tree_pollination" title="Fruit tree pollination">Fruit tree pollination</a></div>
+<figure class="mw-default-size" typeof="mw:File/Thumb"><a href="/wiki/File:Apple_tree_blossom.JPG" class="mw-file-description"><img src="//upload.wikimedia.org/wikipedia/commons/thumb/c/c3/Apple_tree_blossom.JPG/220px-Apple_tree_blossom.JPG" decoding="async" width="220" height="165" class="mw-file-element" srcset="//upload.wikimedia.org/wikipedia/commons/thumb/c/c3/Apple_tree_blossom.JPG/330px-Apple_tree_blossom.JPG 1.5x, //upload.wikimedia.org/wikipedia/commons/thumb/c/c3/Apple_tree_blossom.JPG/440px-Apple_tree_blossom.JPG 2x" data-file-width="2288" data-file-height="1712"></a><figcaption>Apple blossom from an old <a href="/wiki/Ayrshire" title="Ayrshire">Ayrshire</a> cultivar</figcaption></figure>
+<figure class="mw-default-size" typeof="mw:File/Thumb"><a href="/wiki/File:Orchmason.jpg" class="mw-file-description"><img src="//upload.wikimedia.org/wikipedia/commons/thumb/4/47/Orchmason.jpg/220px-Orchmason.jpg" decoding="async" width="220" height="190" class="mw-file-element" srcset="//upload.wikimedia.org/wikipedia/commons/thumb/4/47/Orchmason.jpg/330px-Orchmason.jpg 1.5x, //upload.wikimedia.org/wikipedia/commons/thumb/4/47/Orchmason.jpg/440px-Orchmason.jpg 2x" data-file-width="474" data-file-height="410"></a><figcaption>An <a href="/wiki/Orchard_mason_bee" class="mw-redirect" title="Orchard mason bee">orchard mason bee</a> on an apple bloom in <a href="/wiki/British_Columbia" title="British Columbia">British Columbia</a>, Canada</figcaption></figure>
+<p>Apples are self-incompatible; they must <a href="/wiki/Pollination" title="Pollination">cross-pollinate</a> to develop fruit. During the flowering each season, apple growers often utilize <a href="/wiki/Pollinator" title="Pollinator">pollinators</a> to carry pollen. <a href="/wiki/Honey_bee" title="Honey bee">Honey bees</a> are most commonly used. <a href="/wiki/Osmia_lignaria" title="Osmia lignaria">Orchard mason bees</a> are also used as supplemental pollinators in commercial orchards. <a href="/wiki/Bumblebee" title="Bumblebee">Bumblebee</a> <a href="/wiki/Queen_bee" title="Queen bee">queens</a> are sometimes present in orchards, but not usually in sufficient number to be significant pollinators.<sup id="cite_ref-Polomski_&amp;_Reighard_48-1" class="reference"><a href="#cite_note-Polomski_&amp;_Reighard-48"><span class="cite-bracket">[</span>48<span class="cite-bracket">]</span></a></sup><sup id="cite_ref-50" class="reference"><a href="#cite_note-50"><span class="cite-bracket">[</span>50<span class="cite-bracket">]</span></a></sup>
+</p><p>Cultivars are sometimes classified by the day of peak bloom in the average 30-day blossom period, with pollinizers selected from cultivars within a 6-day overlap period. There are four to seven pollination groups in apples, depending on climate:
+</p>
+<ul><li>Group A – Early flowering, 1 to 3 May in England ('<a href="/wiki/Gravenstein" title="Gravenstein">Gravenstein</a>', 'Red Astrachan')</li>
+<li>Group B – 4 to 7 May ('<a href="/wiki/Idared" title="Idared">Idared</a>', '<a href="/wiki/McIntosh_(apple)" title="McIntosh (apple)">McIntosh</a>')</li>
+<li>Group C – Mid-season flowering, 8 to 11 May ('<a href="/wiki/Granny_Smith" title="Granny Smith">Granny Smith</a>', '<a href="/wiki/Cox%27s_Orange_Pippin" title="Cox's Orange Pippin">Cox's Orange Pippin</a>')</li>
+<li>Group D – Mid/late season flowering, 12 to 15 May ('<a href="/wiki/Golden_Delicious" title="Golden Delicious">Golden Delicious</a>', 'Calville blanc d'hiver')</li>
+<li>Group E – Late flowering, 16 to 18 May ('<a href="/wiki/Braeburn" title="Braeburn">Braeburn</a>', 'Reinette d'Orléans')</li>
+<li>Group F – 19 to 23 May ('Suntan')</li>
+<li>Group H – 24 to 28 May ('Court-Pendu Gris' – also called Court-Pendu plat)</li></ul>
+<p>One cultivar can be pollinated by a compatible cultivar from the same group or close (A with A, or A with B, but not A with C or D).<sup id="cite_ref-51" class="reference"><a href="#cite_note-51"><span class="cite-bracket">[</span>51<span class="cite-bracket">]</span></a></sup>
+</p>
+<div class="mw-heading mw-heading3"><h3 id="Maturation_and_harvest">Maturation and harvest</h3></div>
+<link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1236090951"><div role="note" class="hatnote navigation-not-searchable">See also: <a href="/wiki/Fruit_picking" title="Fruit picking">Fruit picking</a> and <a href="/wiki/Fruit_tree_pruning" title="Fruit tree pruning">Fruit tree pruning</a></div>
+<figure class="mw-default-size" typeof="mw:File/Thumb"><a href="/wiki/File:Relander_and_apples.jpg" class="mw-file-description"><img src="//upload.wikimedia.org/wikipedia/commons/thumb/6/61/Relander_and_apples.jpg/220px-Relander_and_apples.jpg" decoding="async" width="220" height="156" class="mw-file-element" srcset="//upload.wikimedia.org/wikipedia/commons/thumb/6/61/Relander_and_apples.jpg/330px-Relander_and_apples.jpg 1.5x, //upload.wikimedia.org/wikipedia/commons/thumb/6/61/Relander_and_apples.jpg/440px-Relander_and_apples.jpg 2x" data-file-width="1462" data-file-height="1040"></a><figcaption><a href="/wiki/L._K._Relander" class="mw-redirect" title="L. K. Relander">L. K. Relander</a>, the former <a href="/wiki/President_of_Finland" title="President of Finland">President of Finland</a>, with his family picking apples in the 1930s</figcaption></figure>
+<p>Cultivars vary in their yield and the ultimate size of the tree, even when grown on the same rootstock. Some cultivars, if left unpruned, grow very large—letting them bear more fruit, but making harvesting more difficult. Depending on tree density (number of trees planted per unit surface area), mature trees typically bear 40–200&nbsp;kg (90–440&nbsp;lb) of apples each year, though productivity can be close to zero in poor years. Apples are harvested using three-point ladders that are designed to fit amongst the branches. Trees grafted on dwarfing rootstocks bear about 10–80&nbsp;kg (20–180&nbsp;lb) of fruit per year.<sup id="cite_ref-Polomski_&amp;_Reighard_48-2" class="reference"><a href="#cite_note-Polomski_&amp;_Reighard-48"><span class="cite-bracket">[</span>48<span class="cite-bracket">]</span></a></sup>
+</p><p>Some farms with apple orchards open them to the public so consumers can pick their own apples.<sup id="cite_ref-52" class="reference"><a href="#cite_note-52"><span class="cite-bracket">[</span>52<span class="cite-bracket">]</span></a></sup>
+</p><p>Crops ripen at different times of the year according to the cultivar. Cultivars that yield their crop in the summer include '<a href="/wiki/Sweet_Bough" title="Sweet Bough">Sweet Bough</a>' and 'Duchess'; fall producers include 'Blenheim'; winter producers include 'King', '<a href="/wiki/Swazie_(apple)" title="Swazie (apple)">Swayzie</a>', and 'Tolman Sweet'.<sup id="cite_ref-Harrowsmith_38-2" class="reference"><a href="#cite_note-Harrowsmith-38"><span class="cite-bracket">[</span>38<span class="cite-bracket">]</span></a></sup>
+</p>
+<div class="mw-heading mw-heading3"><h3 id="Storage">Storage</h3></div>
+<figure class="mw-default-size" typeof="mw:File/Thumb"><a href="/wiki/File:MIN_Rungis_pommes.jpg" class="mw-file-description"><img src="//upload.wikimedia.org/wikipedia/commons/thumb/3/3a/MIN_Rungis_pommes.jpg/220px-MIN_Rungis_pommes.jpg" decoding="async" width="220" height="147" class="mw-file-element" srcset="//upload.wikimedia.org/wikipedia/commons/thumb/3/3a/MIN_Rungis_pommes.jpg/330px-MIN_Rungis_pommes.jpg 1.5x, //upload.wikimedia.org/wikipedia/commons/thumb/3/3a/MIN_Rungis_pommes.jpg/440px-MIN_Rungis_pommes.jpg 2x" data-file-width="2130" data-file-height="1420"></a><figcaption>Different apple <a href="/wiki/List_of_apple_cultivars" title="List of apple cultivars">cultivars</a> in a wholesale food market</figcaption></figure>
+<p>Commercially, apples can be stored for months in <a href="/wiki/Controlled_atmosphere" title="Controlled atmosphere">controlled atmosphere</a> chambers. Apples are commonly stored in chambers with lowered concentrations of <a href="/wiki/Oxygen" title="Oxygen">oxygen</a> to reduce respiration and slow softening and other changes if the fruit is already fully ripe. The gas <a href="/wiki/Ethylene" title="Ethylene">ethylene</a> is used by plants as a <a href="/wiki/Hormone" title="Hormone">hormone</a> which promotes ripening, decreasing the time an apple can be stored. For storage longer than about six months the apples are picked earlier, before full ripeness, when ethylene production by the fruit is low. However, in many varieties this increases their sensitivity to <a href="/wiki/Carbon_dioxide" title="Carbon dioxide">carbon dioxide</a>, which also must be controlled.<sup id="cite_ref-53" class="reference"><a href="#cite_note-53"><span class="cite-bracket">[</span>53<span class="cite-bracket">]</span></a></sup>
+</p><p>For home storage, most cultivars of apple can be stored for three weeks in a pantry and four to six weeks from the date of purchase in a refrigerator that maintains 4 to 0&nbsp;°C (39 to 32&nbsp;°F).<sup id="cite_ref-54" class="reference"><a href="#cite_note-54"><span class="cite-bracket">[</span>54<span class="cite-bracket">]</span></a></sup><sup id="cite_ref-55" class="reference"><a href="#cite_note-55"><span class="cite-bracket">[</span>55<span class="cite-bracket">]</span></a></sup> Some varieties of apples (e.g. '<a href="/wiki/Granny_Smith" title="Granny Smith">Granny Smith</a>' and '<a href="/wiki/Fuji_(apple)" title="Fuji (apple)">Fuji</a>') have more than three times the storage life of others.<sup id="cite_ref-56" class="reference"><a href="#cite_note-56"><span class="cite-bracket">[</span>56<span class="cite-bracket">]</span></a></sup>
+</p><p>Non-organic apples may be sprayed with the substance <a href="/wiki/1-methylcyclopropene" class="mw-redirect" title="1-methylcyclopropene">1-methylcyclopropene</a>, which blocks the apples' ethylene receptors, temporarily preventing them from ripening.<sup id="cite_ref-57" class="reference"><a href="#cite_note-57"><span class="cite-bracket">[</span>57<span class="cite-bracket">]</span></a></sup>
+</p>
+<div class="mw-heading mw-heading3"><h3 id="Pests_and_diseases">Pests and diseases</h3></div>
+<link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1236090951"><div role="note" class="hatnote navigation-not-searchable">Further information: <a href="/wiki/List_of_apple_diseases" title="List of apple diseases">List of apple diseases</a></div>
+<figure class="mw-default-size" typeof="mw:File/Thumb"><a href="/wiki/File:Madige-Apfel-Frucht.jpg" class="mw-file-description"><img src="//upload.wikimedia.org/wikipedia/commons/thumb/c/c6/Madige-Apfel-Frucht.jpg/220px-Madige-Apfel-Frucht.jpg" decoding="async" width="220" height="164" class="mw-file-element" srcset="//upload.wikimedia.org/wikipedia/commons/thumb/c/c6/Madige-Apfel-Frucht.jpg/330px-Madige-Apfel-Frucht.jpg 1.5x, //upload.wikimedia.org/wikipedia/commons/thumb/c/c6/Madige-Apfel-Frucht.jpg/440px-Madige-Apfel-Frucht.jpg 2x" data-file-width="500" data-file-height="372"></a><figcaption><a href="/wiki/Codling_moth" title="Codling moth">Codling moth</a> larva tunnelling inside an apple</figcaption></figure>
+<p>Apple trees are susceptible to <a href="/wiki/Fungal" class="mw-redirect" title="Fungal">fungal</a> and <a href="/wiki/Bacterial" class="mw-redirect" title="Bacterial">bacterial</a> diseases, and to damage by insect pests. Many commercial orchards pursue a program of chemical sprays to maintain high fruit quality, tree health, and high yields. Organic programs, by contrast, prohibit the use of synthetic pesticides, though some older pesticides are allowed. <a href="/wiki/Organic_farming" title="Organic farming">Organic</a> methods include, for instance, introducing a particular pest's natural predator to reduce its population.
+</p><p>A wide range of pests and diseases can affect the plant. Three of the more common diseases or pests are mildew, aphids, and apple scab.
+</p>
+<ul><li><a href="/wiki/Mildew" title="Mildew">Mildew</a> is characterized by light grey powdery patches appearing on the leaves, shoots and flowers, normally in spring. The flowers turn a creamy yellow color and do not develop correctly. This can be treated similarly to <a href="/wiki/Botryotinia" title="Botryotinia"><i>Botrytis</i></a>—eliminating the conditions that caused the disease and burning the infected plants are among recommended actions.<sup id="cite_ref-58" class="reference"><a href="#cite_note-58"><span class="cite-bracket">[</span>58<span class="cite-bracket">]</span></a></sup></li>
+<li><a href="/wiki/Aphid" title="Aphid">Aphids</a> are small insects with <a href="/wiki/Insect_mouthparts" title="Insect mouthparts">sucking mouthparts</a>. Five species of aphids commonly attack apples: apple grain aphid, rosy apple aphid, apple aphid, spirea aphid, and the woolly apple aphid. The aphid species can be identified by color, time of year, and by differences in the cornicles (small paired projections from their rear).<sup id="cite_ref-59" class="reference"><a href="#cite_note-59"><span class="cite-bracket">[</span>59<span class="cite-bracket">]</span></a></sup> Aphids feed on foliage using needle-like mouth parts to suck out plant juices. When present in high numbers, certain species reduce tree growth and vigor.<sup id="cite_ref-60" class="reference"><a href="#cite_note-60"><span class="cite-bracket">[</span>60<span class="cite-bracket">]</span></a></sup></li>
+<li><a href="/wiki/Apple_scab" title="Apple scab">Apple scab</a>: Apple scab causes leaves to develop olive-brown spots with a velvety texture that later turn brown and become cork-like in texture. The disease also affects the fruit, which also develops similar brown spots with velvety or cork-like textures. Apple scab is spread through fungus growing in old apple leaves on the ground and spreads during warm spring weather to infect the new year's growth.<sup id="cite_ref-Bradley_61-0" class="reference"><a href="#cite_note-Bradley-61"><span class="cite-bracket">[</span>61<span class="cite-bracket">]</span></a></sup></li></ul>
+<p>Among the most serious disease problems is a bacterial disease called <a href="/wiki/Fireblight" class="mw-redirect" title="Fireblight">fireblight</a>, and three fungal diseases: <i><a href="/wiki/Gymnosporangium" title="Gymnosporangium">Gymnosporangium</a></i> rust, <a href="/wiki/Black_Spot_(disease)" class="mw-redirect" title="Black Spot (disease)">black spot</a>,<sup id="cite_ref-62" class="reference"><a href="#cite_note-62"><span class="cite-bracket">[</span>62<span class="cite-bracket">]</span></a></sup> and <a href="/wiki/Bitter_rot_of_apple" title="Bitter rot of apple">bitter rot</a>.<sup id="cite_ref-63" class="reference"><a href="#cite_note-63"><span class="cite-bracket">[</span>63<span class="cite-bracket">]</span></a></sup> <a href="/wiki/Codling_moth" title="Codling moth">Codling moths</a>, and the <a href="/wiki/Apple_maggot" title="Apple maggot">apple maggots</a> of fruit flies, cause serious damage to apple fruits, making them unsaleable. Young apple trees are also prone to mammal pests like mice and deer, which feed on the soft bark of the trees, especially in winter.<sup id="cite_ref-Bradley_61-1" class="reference"><a href="#cite_note-Bradley-61"><span class="cite-bracket">[</span>61<span class="cite-bracket">]</span></a></sup> The larvae of the <a href="/wiki/Synanthedon_myopaeformis" title="Synanthedon myopaeformis">apple clearwing moth (red-belted clearwing)</a> burrow through the bark and into the phloem of apple trees, potentially causing significant damage.<sup id="cite_ref-64" class="reference"><a href="#cite_note-64"><span class="cite-bracket">[</span>64<span class="cite-bracket">]</span></a></sup>
+</p>
+<div class="mw-heading mw-heading3"><h3 id="Cultivars">Cultivars</h3></div>
+<link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1236090951"><div role="note" class="hatnote navigation-not-searchable">Main article: <a href="/wiki/List_of_apple_cultivars" title="List of apple cultivars">List of apple cultivars</a></div>
+<figure class="mw-default-size" typeof="mw:File/Thumb"><a href="/wiki/File:Apples.jpg" class="mw-file-description"><img src="//upload.wikimedia.org/wikipedia/commons/thumb/e/ee/Apples.jpg/170px-Apples.jpg" decoding="async" width="170" height="255" class="mw-file-element" srcset="//upload.wikimedia.org/wikipedia/commons/thumb/e/ee/Apples.jpg/255px-Apples.jpg 1.5x, //upload.wikimedia.org/wikipedia/commons/thumb/e/ee/Apples.jpg/340px-Apples.jpg 2x" data-file-width="1800" data-file-height="2700"></a><figcaption>An assortment of apple cultivars</figcaption></figure>
+<p>There are more than 7,500 known <a href="/wiki/Cultivar" title="Cultivar">cultivars</a> (cultivated varieties) of apples.<sup id="cite_ref-65" class="reference"><a href="#cite_note-65"><span class="cite-bracket">[</span>65<span class="cite-bracket">]</span></a></sup> Cultivars vary in their <a href="/wiki/Crop_yield" title="Crop yield">yield</a> and the ultimate size of the tree, even when grown on the same <a href="/wiki/Rootstock" title="Rootstock">rootstock</a>.<sup id="cite_ref-England_66-0" class="reference"><a href="#cite_note-England-66"><span class="cite-bracket">[</span>66<span class="cite-bracket">]</span></a></sup> Different cultivars are available for <a href="/wiki/Temperate" class="mw-redirect" title="Temperate">temperate</a> and <a href="/wiki/Subtropical" class="mw-redirect" title="Subtropical">subtropical</a> climates. The UK's National Fruit Collection, which is the responsibility of the Department of Environment, Food, and Rural Affairs, includes a collection of over 2,000 cultivars of apple tree in Kent.<sup id="cite_ref-67" class="reference"><a href="#cite_note-67"><span class="cite-bracket">[</span>67<span class="cite-bracket">]</span></a></sup> The <a href="/wiki/University_of_Reading" title="University of Reading">University of Reading</a>, which is responsible for developing the UK national collection database, provides access to search the national collection. The University of Reading's work is part of the European Cooperative Programme for Plant Genetic Resources of which there are 38 countries participating in the Malus/Pyrus work group.<sup id="cite_ref-68" class="reference"><a href="#cite_note-68"><span class="cite-bracket">[</span>68<span class="cite-bracket">]</span></a></sup>
+</p><p>The UK's national fruit collection database contains much information on the characteristics and origin of many apples, including alternative names for what is essentially the same "genetic" apple cultivar. Most of these cultivars are bred for eating fresh (dessert apples), though some are cultivated specifically for cooking (<a href="/wiki/Cooking_apple" title="Cooking apple">cooking apples</a>) or producing <a href="/wiki/Cider" title="Cider">cider</a>. <a href="/wiki/Cider_apple" title="Cider apple">Cider apples</a> are typically too tart and astringent to eat fresh, but they give the beverage a rich flavor that dessert apples cannot.<sup id="cite_ref-apples1_69-0" class="reference"><a href="#cite_note-apples1-69"><span class="cite-bracket">[</span>69<span class="cite-bracket">]</span></a></sup>
+</p><p>In the United States there are many apple breeding programs associated with universities. <a href="/wiki/Cornell_University" title="Cornell University">Cornell University</a> has had a program operating since 1880 in <a href="/wiki/Geneva,_New_York" title="Geneva, New York">Geneva, New York</a>. Among their recent well known apples is the 'SnapDragon' cultivar released in 2013. In the west <a href="/wiki/Washington_State_University" title="Washington State University">Washington State University</a> started a program to support their apple industry in 1994 and released the '<a href="/wiki/Cosmic_Crisp" title="Cosmic Crisp">Cosmic Crisp</a>' cultivar in 2017. The third most grown apple cultivar in the United States is the '<a href="/wiki/Honeycrisp" title="Honeycrisp">Honeycrisp</a>', released by the <a href="/wiki/University_of_Minnesota" title="University of Minnesota">University of Minnesota</a> program in 1991.<sup id="cite_ref-70" class="reference"><a href="#cite_note-70"><span class="cite-bracket">[</span>70<span class="cite-bracket">]</span></a></sup> Unusually for a popular cultivar, the 'Honeycrisp' is not directly related to another popular apple cultivar but instead to two unsuccessful cultivars.<sup id="cite_ref-71" class="reference"><a href="#cite_note-71"><span class="cite-bracket">[</span>71<span class="cite-bracket">]</span></a></sup> In Europe there are also many breeding programs such as the <a href="/wiki/Julius_K%C3%BChn-Institut" title="Julius Kühn-Institut">Julius Kühn-Institut</a>, the German federal research center for cultivated plants.<sup id="cite_ref-72" class="reference"><a href="#cite_note-72"><span class="cite-bracket">[</span>72<span class="cite-bracket">]</span></a></sup>
+</p><p>Commercially popular apple cultivars are soft but crisp. Other desirable qualities in modern commercial apple breeding are a colorful skin, absence of <a href="/wiki/Russet_apple" title="Russet apple">russeting</a>, ease of shipping, lengthy storage ability, high yields, disease resistance, common apple shape, and developed flavor.<sup id="cite_ref-England_66-1" class="reference"><a href="#cite_note-England-66"><span class="cite-bracket">[</span>66<span class="cite-bracket">]</span></a></sup> Modern apples are generally sweeter than older cultivars, as popular tastes in apples have varied over time. Most North Americans and Europeans favor sweet, subacid apples, but tart apples have a strong minority following.<sup id="cite_ref-World_73-0" class="reference"><a href="#cite_note-World-73"><span class="cite-bracket">[</span>73<span class="cite-bracket">]</span></a></sup> Extremely sweet apples with barely any acid flavor are popular in Asia,<sup id="cite_ref-World_73-1" class="reference"><a href="#cite_note-World-73"><span class="cite-bracket">[</span>73<span class="cite-bracket">]</span></a></sup> especially the <a href="/wiki/Indian_subcontinent" title="Indian subcontinent">Indian subcontinent</a>.<sup id="cite_ref-apples1_69-1" class="reference"><a href="#cite_note-apples1-69"><span class="cite-bracket">[</span>69<span class="cite-bracket">]</span></a></sup>
+</p>
+<figure class="mw-default-size" typeof="mw:File/Thumb"><a href="/wiki/File:Mele_non_comuni.jpg" class="mw-file-description"><img src="//upload.wikimedia.org/wikipedia/commons/thumb/7/71/Mele_non_comuni.jpg/220px-Mele_non_comuni.jpg" decoding="async" width="220" height="147" class="mw-file-element" srcset="//upload.wikimedia.org/wikipedia/commons/thumb/7/71/Mele_non_comuni.jpg/330px-Mele_non_comuni.jpg 1.5x, //upload.wikimedia.org/wikipedia/commons/thumb/7/71/Mele_non_comuni.jpg/440px-Mele_non_comuni.jpg 2x" data-file-width="3000" data-file-height="2000"></a><figcaption>Less common apple cultivars from an orchard in Italy</figcaption></figure>
+<p>Old cultivars are often oddly shaped, russeted, and grow in a variety of textures and colors. Some find them to have better flavor than modern cultivars, but they may have other problems that make them commercially unviable—low yield, disease susceptibility, poor tolerance for storage or transport, or just being the "wrong" size.<sup id="cite_ref-Hobby_Farms_Mag._74-0" class="reference"><a href="#cite_note-Hobby_Farms_Mag.-74"><span class="cite-bracket">[</span>74<span class="cite-bracket">]</span></a></sup> A few old cultivars are still produced on a large scale, but many have been preserved by home gardeners and farmers that sell directly to local markets. Many unusual and locally important cultivars with their own unique taste and appearance exist; apple conservation campaigns have sprung up around the world to preserve such local cultivars from extinction. In the United Kingdom, old cultivars such as '<a href="/wiki/Cox%27s_Orange_Pippin" title="Cox's Orange Pippin">Cox's Orange Pippin</a>' and '<a href="/wiki/Egremont_Russet" title="Egremont Russet">Egremont Russet</a>' are still commercially important even though by modern standards they are low yielding and susceptible to disease.<sup id="cite_ref-UofGeorgia_5-6" class="reference"><a href="#cite_note-UofGeorgia-5"><span class="cite-bracket">[</span>5<span class="cite-bracket">]</span></a></sup>
+</p>
+<div class="mw-heading mw-heading3"><h3 id="Production">Production</h3></div>
+<link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1236090951"><div role="note" class="hatnote navigation-not-searchable">Main article: <a href="/wiki/List_of_countries_by_apple_production" title="List of countries by apple production">List of countries by apple production</a></div>
+<table class="wikitable floatright" style="width:13em; text-align:center">
+<tbody><tr>
+<th colspan="2">Apple production<br>
+<p><small>2022, millions of <a href="/wiki/Tonne" title="Tonne">tonnes</a></small><br>
+</p>
+</th></tr>
+<tr>
+<td><span class="flagicon"><span class="mw-image-border" typeof="mw:File"><span><img alt="" src="//upload.wikimedia.org/wikipedia/commons/thumb/f/fa/Flag_of_the_People%27s_Republic_of_China.svg/23px-Flag_of_the_People%27s_Republic_of_China.svg.png" decoding="async" width="23" height="15" class="mw-file-element" srcset="//upload.wikimedia.org/wikipedia/commons/thumb/f/fa/Flag_of_the_People%27s_Republic_of_China.svg/35px-Flag_of_the_People%27s_Republic_of_China.svg.png 1.5x, //upload.wikimedia.org/wikipedia/commons/thumb/f/fa/Flag_of_the_People%27s_Republic_of_China.svg/45px-Flag_of_the_People%27s_Republic_of_China.svg.png 2x" data-file-width="900" data-file-height="600"></span></span>&nbsp;</span><a href="/wiki/China" title="China">China</a></td>
+<td>47.6
+</td></tr>
+<tr>
+<td><span class="flagicon"><span class="mw-image-border" typeof="mw:File"><span><img alt="" src="//upload.wikimedia.org/wikipedia/commons/thumb/5/5d/Flag_of_the_United_States_%2823px%29.png/23px-Flag_of_the_United_States_%2823px%29.png" decoding="async" width="23" height="13" class="mw-file-element" srcset="//upload.wikimedia.org/wikipedia/commons/thumb/5/5d/Flag_of_the_United_States_%2823px%29.png/35px-Flag_of_the_United_States_%2823px%29.png 1.5x, //upload.wikimedia.org/wikipedia/commons/thumb/5/5d/Flag_of_the_United_States_%2823px%29.png/46px-Flag_of_the_United_States_%2823px%29.png 2x" data-file-width="69" data-file-height="39"></span></span>&nbsp;</span><a href="/wiki/United_States" title="United States">United States</a></td>
+<td>4.8
+</td></tr>
+<tr>
+<td><span class="flagicon"><span class="mw-image-border" typeof="mw:File"><span><img alt="" src="//upload.wikimedia.org/wikipedia/commons/thumb/b/b4/Flag_of_Turkey.svg/23px-Flag_of_Turkey.svg.png" decoding="async" width="23" height="15" class="mw-file-element" srcset="//upload.wikimedia.org/wikipedia/commons/thumb/b/b4/Flag_of_Turkey.svg/35px-Flag_of_Turkey.svg.png 1.5x, //upload.wikimedia.org/wikipedia/commons/thumb/b/b4/Flag_of_Turkey.svg/45px-Flag_of_Turkey.svg.png 2x" data-file-width="1200" data-file-height="800"></span></span>&nbsp;</span><a href="/wiki/Turkey" title="Turkey">Turkey</a></td>
+<td>4.4
+</td></tr>
+<tr>
+<td><span class="flagicon"><span class="mw-image-border" typeof="mw:File"><span><img alt="" src="//upload.wikimedia.org/wikipedia/en/thumb/1/12/Flag_of_Poland.svg/23px-Flag_of_Poland.svg.png" decoding="async" width="23" height="14" class="mw-file-element" srcset="//upload.wikimedia.org/wikipedia/en/thumb/1/12/Flag_of_Poland.svg/35px-Flag_of_Poland.svg.png 1.5x, //upload.wikimedia.org/wikipedia/en/thumb/1/12/Flag_of_Poland.svg/46px-Flag_of_Poland.svg.png 2x" data-file-width="1280" data-file-height="800"></span></span>&nbsp;</span><a href="/wiki/Poland" title="Poland">Poland</a></td>
+<td>4.3
+</td></tr>
+<tr>
+<td><span class="flagicon"><span class="mw-image-border" typeof="mw:File"><span><img alt="" src="//upload.wikimedia.org/wikipedia/en/thumb/4/41/Flag_of_India.svg/23px-Flag_of_India.svg.png" decoding="async" width="23" height="15" class="mw-file-element" srcset="//upload.wikimedia.org/wikipedia/en/thumb/4/41/Flag_of_India.svg/35px-Flag_of_India.svg.png 1.5x, //upload.wikimedia.org/wikipedia/en/thumb/4/41/Flag_of_India.svg/45px-Flag_of_India.svg.png 2x" data-file-width="900" data-file-height="600"></span></span>&nbsp;</span><a href="/wiki/India" title="India">India</a></td>
+<td>2.6
+</td></tr>
+<tr>
+<td><b>World</b></td>
+<td><b>95.8</b>
+</td></tr>
+<tr>
+<td colspan="2" style="text-align: center;"><small>Source: <a href="/wiki/FAOSTAT" class="mw-redirect" title="FAOSTAT">FAOSTAT</a> of the United Nations</small><sup id="cite_ref-faostat_75-0" class="reference"><a href="#cite_note-faostat-75"><span class="cite-bracket">[</span>75<span class="cite-bracket">]</span></a></sup>
+</td></tr></tbody></table>
+<p>World production of apples in 2022 was 96 million <a href="/wiki/Tonne" title="Tonne">tonnes</a>, with China producing 50% of the total (table).<sup id="cite_ref-faostat_75-1" class="reference"><a href="#cite_note-faostat-75"><span class="cite-bracket">[</span>75<span class="cite-bracket">]</span></a></sup> Secondary producers were the United States, <a href="/wiki/Turkey" title="Turkey">Turkey</a>, and <a href="/wiki/Poland" title="Poland">Poland</a>.<sup id="cite_ref-faostat_75-2" class="reference"><a href="#cite_note-faostat-75"><span class="cite-bracket">[</span>75<span class="cite-bracket">]</span></a></sup>
+</p>
+<div class="mw-heading mw-heading2"><h2 id="Toxicity">Toxicity</h2></div>
+<div class="mw-heading mw-heading3"><h3 id="Amygdalin">Amygdalin</h3></div>
+<p>Apple seeds contain small amounts of <a href="/wiki/Amygdalin" title="Amygdalin">amygdalin</a>, a sugar and <a href="/wiki/Cyanide" title="Cyanide">cyanide</a> compound known as a <a href="/wiki/Cyanogenic_glycoside" class="mw-redirect" title="Cyanogenic glycoside">cyanogenic glycoside</a>. Ingesting small amounts of apple seeds causes no ill effects, but consumption of extremely large doses can cause <a href="/wiki/Adverse_reaction" class="mw-redirect" title="Adverse reaction">adverse reactions</a>. It may take several hours before the poison takes effect, as cyanogenic glycosides must be <a href="/wiki/Hydrolyzed" class="mw-redirect" title="Hydrolyzed">hydrolyzed</a> before the cyanide ion is released.<sup id="cite_ref-76" class="reference"><a href="#cite_note-76"><span class="cite-bracket">[</span>76<span class="cite-bracket">]</span></a></sup> The U.S. <a href="/wiki/National_Library_of_Medicine" class="mw-redirect" title="National Library of Medicine">National Library of Medicine</a>'s <a href="/wiki/Hazardous_Substances_Data_Bank" title="Hazardous Substances Data Bank">Hazardous Substances Data Bank</a> records no cases of amygdalin poisoning from consuming apple seeds.<sup id="cite_ref-77" class="reference"><a href="#cite_note-77"><span class="cite-bracket">[</span>77<span class="cite-bracket">]</span></a></sup>
+</p>
+<div class="mw-heading mw-heading3"><h3 id="Allergy">Allergy</h3></div>
+<p>One form of apple allergy, often found in northern Europe, is called birch-apple syndrome and is found in people who are also allergic to <a href="/wiki/Birch" title="Birch">birch</a> <a href="/wiki/Pollen" title="Pollen">pollen</a>.<sup id="cite_ref-EU_78-0" class="reference"><a href="#cite_note-EU-78"><span class="cite-bracket">[</span>78<span class="cite-bracket">]</span></a></sup> Allergic reactions are triggered by a protein in apples that is similar to birch pollen, and people affected by this protein can also develop allergies to other fruits, nuts, and vegetables. Reactions, which entail <a href="/wiki/Oral_allergy_syndrome" title="Oral allergy syndrome">oral allergy syndrome</a> (OAS), generally involve itching and inflammation of the mouth and throat,<sup id="cite_ref-EU_78-1" class="reference"><a href="#cite_note-EU-78"><span class="cite-bracket">[</span>78<span class="cite-bracket">]</span></a></sup> but in rare cases can also include life-threatening <a href="/wiki/Anaphylaxis" title="Anaphylaxis">anaphylaxis</a>.<sup id="cite_ref-79" class="reference"><a href="#cite_note-79"><span class="cite-bracket">[</span>79<span class="cite-bracket">]</span></a></sup> This reaction only occurs when raw fruit is consumed—the allergen is neutralized in the cooking process. The variety of apple, maturity and storage conditions can change the amount of allergen present in individual fruits. Long storage times can increase the amount of proteins that cause birch-apple syndrome.<sup id="cite_ref-EU_78-2" class="reference"><a href="#cite_note-EU-78"><span class="cite-bracket">[</span>78<span class="cite-bracket">]</span></a></sup>
+</p><p>In other areas, such as the Mediterranean, some individuals have adverse reactions to apples because of their similarity to peaches.<sup id="cite_ref-EU_78-3" class="reference"><a href="#cite_note-EU-78"><span class="cite-bracket">[</span>78<span class="cite-bracket">]</span></a></sup> This form of apple allergy also includes OAS, but often has more severe symptoms, such as vomiting, abdominal pain and <a href="/wiki/Urticaria" class="mw-redirect" title="Urticaria">urticaria</a>, and can be life-threatening. Individuals with this form of allergy can also develop reactions to other fruits and nuts. Cooking does not break down the protein causing this particular reaction, so affected individuals cannot eat raw or cooked apples. Freshly harvested, over-ripe fruits tend to have the highest levels of the protein that causes this reaction.<sup id="cite_ref-EU_78-4" class="reference"><a href="#cite_note-EU-78"><span class="cite-bracket">[</span>78<span class="cite-bracket">]</span></a></sup>
+</p><p>Breeding efforts have yet to produce a <a href="/wiki/Hypoallergenic" title="Hypoallergenic">hypoallergenic</a> fruit suitable for either of the two forms of apple allergy.<sup id="cite_ref-EU_78-5" class="reference"><a href="#cite_note-EU-78"><span class="cite-bracket">[</span>78<span class="cite-bracket">]</span></a></sup>
+</p>
+<div class="mw-heading mw-heading2"><h2 id="Uses">Uses</h2></div>
+<link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1236090951"><div role="note" class="hatnote navigation-not-searchable">See also: <a href="/wiki/Cooking_apple" title="Cooking apple">Cooking apple</a> and <a href="/wiki/Cider_apple" title="Cider apple">Cider apple</a></div>
+<div class="mw-heading mw-heading3"><h3 id="Nutrition">Nutrition</h3></div>
+<style data-mw-deduplicate="TemplateStyles:r1034237262">.mw-parser-output .stack{box-sizing:border-box}.mw-parser-output .stack>div{margin:1px;overflow:hidden}@media all and (min-width:720px){.mw-parser-output .stack-clear-left{float:left;clear:left}.mw-parser-output .stack-clear-right{float:right;clear:right}.mw-parser-output .stack-left{float:left}.mw-parser-output .stack-right{float:right}.mw-parser-output .stack-margin-clear-left{float:left;clear:left;margin-right:1em}.mw-parser-output .stack-margin-clear-right{float:right;clear:right;margin-left:1em}.mw-parser-output .stack-margin-left{float:left;margin-right:1em}.mw-parser-output .stack-margin-right{float:right;margin-left:1em}}</style><div class="stack mw-stack stack-right"><div>
+<style data-mw-deduplicate="TemplateStyles:r1257001546">.mw-parser-output .infobox-subbox{padding:0;border:none;margin:-3px;width:auto;min-width:100%;font-size:100%;clear:none;float:none;background-color:transparent}.mw-parser-output .infobox-3cols-child{margin:auto}.mw-parser-output .infobox .navbar{font-size:100%}@media screen{html.skin-theme-clientpref-night .mw-parser-output .infobox-full-data:not(.notheme)>div:not(.notheme)[style]{background:#1f1f23!important;color:#f8f9fa}}@media screen and (prefers-color-scheme:dark){html.skin-theme-clientpref-os .mw-parser-output .infobox-full-data:not(.notheme) div:not(.notheme){background:#1f1f23!important;color:#f8f9fa}}@media(min-width:640px){body.skin--responsive .mw-parser-output .infobox-table{display:table!important}body.skin--responsive .mw-parser-output .infobox-table>caption{display:table-caption!important}body.skin--responsive .mw-parser-output .infobox-table>tbody{display:table-row-group}body.skin--responsive .mw-parser-output .infobox-table tr{display:table-row!important}body.skin--responsive .mw-parser-output .infobox-table th,body.skin--responsive .mw-parser-output .infobox-table td{padding-left:inherit;padding-right:inherit}}</style><table class="infobox nowrap"><caption class="infobox-title" style="white-space:normal; padding-bottom:0.15em;">Apples, with skin (edible parts)</caption><tbody><tr><th colspan="2" class="infobox-header">Nutritional value per 100&nbsp;g (3.5&nbsp;oz)</th></tr><tr><th scope="row" class="infobox-label"><a href="/wiki/Food_energy" title="Food energy">Energy</a></th><td class="infobox-data">218&nbsp;kJ (52&nbsp;kcal)</td></tr><tr><td colspan="2" class="infobox-full-data"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1257001546"></td></tr><tr><th scope="row" class="infobox-label" style="padding-left:0.65em;line-height:1.1em;font-weight:normal;padding-right:0.25em;"><div style="position:relative;left:-0.65em;"><b><a href="/wiki/Carbohydrate" 
title="Carbohydrate">Carbohydrates</a></b></div></th><td class="infobox-data" style="vertical-align:middle;padding-left:0.65em;line-height:1.1em;"><div style="position:relative;left:-0.65em;">13.81 g</div></td></tr><tr><th scope="row" class="infobox-label" style="padding-left:0.65em;line-height:1.1em;font-weight:normal;padding-right:0.25em;"><a href="/wiki/Sugar" title="Sugar">Sugars</a></th><td class="infobox-data" style="vertical-align:middle;padding-left:0.65em;line-height:1.1em;">10.39</td></tr><tr><th scope="row" class="infobox-label" style="padding-left:0.65em;line-height:1.1em;font-weight:normal;padding-right:0.25em;"><a href="/wiki/Dietary_fiber" title="Dietary fiber">Dietary fiber</a></th><td class="infobox-data" style="vertical-align:middle;padding-left:0.65em;line-height:1.1em;">2.4 g</td></tr><tr style="display:none"><td colspan="2">
+</td></tr><tr><td colspan="2" class="infobox-full-data"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1257001546"></td></tr><tr><th scope="row" class="infobox-label" style="padding-left:0.65em;line-height:1.1em;font-weight:normal;padding-right:0.25em;"><div style="position:relative;left:-0.65em;"><b><a href="/wiki/Fat" title="Fat">Fat</a></b></div></th><td class="infobox-data" style="vertical-align:middle;padding-left:0.65em;line-height:1.1em;"><div style="position:relative;left:-0.65em;">0.17 g</div></td></tr><tr style="display:none"><td colspan="2">
+</td></tr><tr><td colspan="2" class="infobox-full-data"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1257001546"></td></tr><tr><th scope="row" class="infobox-label" style="padding-left:0.65em;line-height:1.1em;font-weight:normal;padding-right:0.25em;"><div style="position:relative;left:-0.65em;"><b><a href="/wiki/Protein_(nutrient)" title="Protein (nutrient)">Protein</a></b></div></th><td class="infobox-data" style="vertical-align:middle;padding-left:0.65em;line-height:1.1em;"><div style="position:relative;left:-0.65em;">0.26 g</div></td></tr>
+<tr><td colspan="2">
+<table class="mw-collapsible mw-collapsed mw-made-collapsible" style="; ; width:100%;">
+
+<tbody><tr>
+<th colspan="2" style="line-height:normal; padding:0.2em; ;"><button type="button" class="mw-collapsible-toggle mw-collapsible-toggle-default mw-collapsible-toggle-collapsed" aria-expanded="false" tabindex="0"><span class="mw-collapsible-text">show</span></button><div style="text-align: center; padding: 0 0.4em; margin: 0 3.3em">Vitamins and minerals</div></th>
+</tr><tr style="display:none"><td colspan="2">
+</td></tr><tr style="display: none;"><td colspan="2" class="infobox-full-data"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1257001546"></td></tr><tr style="display: none;"><th scope="row" class="infobox-label" style="padding-left:0.65em;line-height:1.1em;font-weight:normal;padding-right:0.25em;"><b style="margin-left:-0.65em"><a href="/wiki/Vitamin" title="Vitamin">Vitamins</a></b></th><td class="infobox-data" style="vertical-align:middle;padding-left:0.65em;line-height:1.1em;"><b>Quantity</b> <div style="float: right;"><abbr title="Percentage of Daily Value"><b>%DV</b></abbr><sup>†</sup></div></td></tr><tr style="display: none;"><th scope="row" class="infobox-label" style="padding-left:0.65em;line-height:1.1em;font-weight:normal;padding-right:0.25em;"><a href="/wiki/Vitamin_A" title="Vitamin A">Vitamin A equiv.</a><div style="padding-left:0.65em;padding-top:0.25em;font-weight:normal;"><a href="/wiki/Beta-Carotene" class="mw-redirect" title="Beta-Carotene">beta-Carotene</a></div><div style="padding-left:0.65em;padding-top:0.25em;font-weight:normal;"><a href="/wiki/Lutein" title="Lutein">lutein</a> <a href="/wiki/Zeaxanthin" title="Zeaxanthin">zeaxanthin</a></div></th><td class="infobox-data" style="vertical-align:middle;padding-left:0.65em;line-height:1.1em;"><div style="float: right;">0%</div> 3 μg<div style="padding-left:0.65em;padding-top:0.25em;"><div style="float: right;">0%</div>27 μg</div><div style="padding-left:0.65em;padding-top:0.25em;">29 μg</div></td></tr><tr style="display: none;"><th scope="row" class="infobox-label" style="padding-left:0.65em;line-height:1.1em;font-weight:normal;padding-right:0.25em;"><a href="/wiki/Thiamine" title="Thiamine">Thiamine (B<span style="position: relative; top: 0.35em;">1</span>)</a></th><td class="infobox-data" style="vertical-align:middle;padding-left:0.65em;line-height:1.1em;"><div style="float: right;">1%</div> 0.017 mg</td></tr><tr style="display: none;"><th scope="row" 
class="infobox-label" style="padding-left:0.65em;line-height:1.1em;font-weight:normal;padding-right:0.25em;"><a href="/wiki/Riboflavin" title="Riboflavin">Riboflavin (B<span style="position: relative; top: 0.35em;">2</span>)</a></th><td class="infobox-data" style="vertical-align:middle;padding-left:0.65em;line-height:1.1em;"><div style="float: right;">2%</div> 0.026 mg</td></tr><tr style="display: none;"><th scope="row" class="infobox-label" style="padding-left:0.65em;line-height:1.1em;font-weight:normal;padding-right:0.25em;"><a href="/wiki/Niacin_(nutrient)" class="mw-redirect" title="Niacin (nutrient)">Niacin (B<span style="position: relative; top: 0.35em;">3</span>)</a></th><td class="infobox-data" style="vertical-align:middle;padding-left:0.65em;line-height:1.1em;"><div style="float: right;">1%</div> 0.091 mg</td></tr><tr style="display: none;"><th scope="row" class="infobox-label" style="padding-left:0.65em;line-height:1.1em;font-weight:normal;padding-right:0.25em;"><a href="/wiki/Pantothenic_acid" title="Pantothenic acid">Pantothenic acid (B<span style="position: relative; top: 0.35em;">5</span>)</a></th><td class="infobox-data" style="vertical-align:middle;padding-left:0.65em;line-height:1.1em;"><div style="float: right;">1%</div> 0.061 mg</td></tr><tr style="display: none;"><th scope="row" class="infobox-label" style="padding-left:0.65em;line-height:1.1em;font-weight:normal;padding-right:0.25em;"><a href="/wiki/Vitamin_B6" title="Vitamin B6">Vitamin B<span style="position: relative; top: 0.3em;">6</span></a></th><td class="infobox-data" style="vertical-align:middle;padding-left:0.65em;line-height:1.1em;"><div style="float: right;">2%</div> 0.041 mg</td></tr><tr style="display: none;"><th scope="row" class="infobox-label" style="padding-left:0.65em;line-height:1.1em;font-weight:normal;padding-right:0.25em;"><a href="/wiki/Folate" title="Folate">Folate (B<span style="position: relative; top: 0.35em;">9</span>)</a></th><td class="infobox-data" 
style="vertical-align:middle;padding-left:0.65em;line-height:1.1em;"><div style="float: right;">1%</div> 3 μg</td></tr><tr style="display: none;"><th scope="row" class="infobox-label" style="padding-left:0.65em;line-height:1.1em;font-weight:normal;padding-right:0.25em;"><a href="/wiki/Vitamin_C" title="Vitamin C">Vitamin C</a></th><td class="infobox-data" style="vertical-align:middle;padding-left:0.65em;line-height:1.1em;"><div style="float: right;">5%</div> 4.6 mg</td></tr><tr style="display: none;"><th scope="row" class="infobox-label" style="padding-left:0.65em;line-height:1.1em;font-weight:normal;padding-right:0.25em;"><a href="/wiki/Vitamin_E" title="Vitamin E">Vitamin E</a></th><td class="infobox-data" style="vertical-align:middle;padding-left:0.65em;line-height:1.1em;"><div style="float: right;">1%</div> 0.18 mg</td></tr><tr style="display: none;"><th scope="row" class="infobox-label" style="padding-left:0.65em;line-height:1.1em;font-weight:normal;padding-right:0.25em;"><a href="/wiki/Vitamin_K" title="Vitamin K">Vitamin K</a></th><td class="infobox-data" style="vertical-align:middle;padding-left:0.65em;line-height:1.1em;"><div style="float: right;">2%</div> 2.2 μg</td></tr><tr style="display:none"><td colspan="2">
+</td></tr><tr style="display: none;"><td colspan="2" class="infobox-full-data"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1257001546"></td></tr><tr style="display: none;"><th scope="row" class="infobox-label" style="padding-left:0.65em;line-height:1.1em;font-weight:normal;padding-right:0.25em;"><b style="margin-left:-0.65em"><a href="/wiki/Mineral_(nutrient)" title="Mineral (nutrient)">Minerals</a></b></th><td class="infobox-data" style="vertical-align:middle;padding-left:0.65em;line-height:1.1em;"><b>Quantity</b> <div style="float: right;"><abbr title="Percentage of Daily Value"><b>%DV</b></abbr><sup>†</sup></div></td></tr><tr style="display: none;"><th scope="row" class="infobox-label" style="padding-left:0.65em;line-height:1.1em;font-weight:normal;padding-right:0.25em;"><a href="/wiki/Calcium_in_biology#Humans" title="Calcium in biology">Calcium</a></th><td class="infobox-data" style="vertical-align:middle;padding-left:0.65em;line-height:1.1em;"><div style="float: right;">0%</div> 6 mg</td></tr><tr style="display: none;"><th scope="row" class="infobox-label" style="padding-left:0.65em;line-height:1.1em;font-weight:normal;padding-right:0.25em;"><a href="/wiki/Human_iron_metabolism" title="Human iron metabolism">Iron</a></th><td class="infobox-data" style="vertical-align:middle;padding-left:0.65em;line-height:1.1em;"><div style="float: right;">1%</div> 0.12 mg</td></tr><tr style="display: none;"><th scope="row" class="infobox-label" style="padding-left:0.65em;line-height:1.1em;font-weight:normal;padding-right:0.25em;"><a href="/wiki/Magnesium_in_biology" title="Magnesium in biology">Magnesium</a></th><td class="infobox-data" style="vertical-align:middle;padding-left:0.65em;line-height:1.1em;"><div style="float: right;">1%</div> 5 mg</td></tr><tr style="display: none;"><th scope="row" class="infobox-label" style="padding-left:0.65em;line-height:1.1em;font-weight:normal;padding-right:0.25em;"><a 
href="/wiki/Manganese#Human_health_and_nutrition" title="Manganese">Manganese</a></th><td class="infobox-data" style="vertical-align:middle;padding-left:0.65em;line-height:1.1em;"><div style="float: right;">2%</div> 0.035 mg</td></tr><tr style="display: none;"><th scope="row" class="infobox-label" style="padding-left:0.65em;line-height:1.1em;font-weight:normal;padding-right:0.25em;"><a href="/wiki/Phosphorus#Biological_role" title="Phosphorus">Phosphorus</a></th><td class="infobox-data" style="vertical-align:middle;padding-left:0.65em;line-height:1.1em;"><div style="float: right;">1%</div> 11 mg</td></tr><tr style="display: none;"><th scope="row" class="infobox-label" style="padding-left:0.65em;line-height:1.1em;font-weight:normal;padding-right:0.25em;"><a href="/wiki/Potassium_in_biology" title="Potassium in biology">Potassium</a></th><td class="infobox-data" style="vertical-align:middle;padding-left:0.65em;line-height:1.1em;"><div style="float: right;">4%</div> 107 mg</td></tr><tr style="display: none;"><th scope="row" class="infobox-label" style="padding-left:0.65em;line-height:1.1em;font-weight:normal;padding-right:0.25em;"><a href="/wiki/Sodium_in_biology" title="Sodium in biology">Sodium</a></th><td class="infobox-data" style="vertical-align:middle;padding-left:0.65em;line-height:1.1em;"><div style="float: right;">0%</div> 1 mg</td></tr><tr style="display: none;"><th scope="row" class="infobox-label" style="padding-left:0.65em;line-height:1.1em;font-weight:normal;padding-right:0.25em;"><a href="/wiki/Zinc#Biological_role" title="Zinc">Zinc</a></th><td class="infobox-data" style="vertical-align:middle;padding-left:0.65em;line-height:1.1em;"><div style="float: right;">0%</div> 0.04 mg</td></tr><tr style="display: none;"><td colspan="2">
+</td></tr></tbody></table></td></tr><tr><td colspan="2" class="infobox-full-data"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1257001546"></td></tr><tr><th scope="row" class="infobox-label" style="padding-left:0.65em;line-height:1.1em;font-weight:normal;padding-right:0.25em;"><b style="margin-left:-0.65em">Other constituents</b></th><td class="infobox-data" style="vertical-align:middle;padding-left:0.65em;line-height:1.1em;"><b>Quantity</b></td></tr><tr><th scope="row" class="infobox-label" style="padding-left:0.65em;line-height:1.1em;font-weight:normal;padding-right:0.25em;">Water</th><td class="infobox-data" style="vertical-align:middle;padding-left:0.65em;line-height:1.1em;">85.56 g</td></tr><tr style="display:none"><td colspan="2">
+</td></tr><tr><td colspan="2" class="infobox-full-data"><hr><div class="wrap" style="padding:0.3em;line-height:1.2em;"><a rel="nofollow" class="external text" href="https://fdc.nal.usda.gov/fdc-app.html#/food-details/1102644/nutrients">Link to Full Nutrient Report of USDA Database entry</a></div></td></tr><tr><td colspan="2" class="infobox-below wrap" style="background:#e0e0e0;padding:0.3em;line-height:1.5em;font-weight:normal;font-size:0.9em"><sup>†</sup>Percentages estimated using <a href="/wiki/Reference_Daily_Intake#Daily_Values" title="Reference Daily Intake">US&nbsp;recommendations</a> for adults,<sup id="cite_ref-FDADailyValues_80-0" class="reference"><a href="#cite_note-FDADailyValues-80"><span class="cite-bracket">[</span>80<span class="cite-bracket">]</span></a></sup> except for potassium, which is estimated based on expert recommendation from <a href="/wiki/National_Academies_of_Sciences,_Engineering,_and_Medicine" title="National Academies of Sciences, Engineering, and Medicine">the National Academies</a>.<sup id="cite_ref-NationalAcademiesPotassium_81-0" class="reference"><a href="#cite_note-NationalAcademiesPotassium-81"><span class="cite-bracket">[</span>81<span class="cite-bracket">]</span></a></sup></td></tr></tbody></table>
+</div></div>
+<p>A raw apple is 86% water and 14% <a href="/wiki/Carbohydrate" title="Carbohydrate">carbohydrates</a>, with negligible content of <a href="/wiki/Fat" title="Fat">fat</a> and <a href="/wiki/Protein" title="Protein">protein</a> (table). A reference serving of a raw apple with skin weighing 100&nbsp;g (3.5&nbsp;oz) provides 52 <a href="/wiki/Calorie" title="Calorie">calories</a> and a moderate content of <a href="/wiki/Dietary_fiber" title="Dietary fiber">dietary fiber</a> (table). Otherwise, there is low content of <a href="/wiki/Micronutrient" title="Micronutrient">micronutrients</a>, with the <a href="/wiki/Daily_Value" class="mw-redirect" title="Daily Value">Daily Values</a> of all falling below 10% (table).
+</p>
+<div class="mw-heading mw-heading3"><h3 id="Culinary">Culinary</h3></div>
+<link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1236090951"><div role="note" class="hatnote navigation-not-searchable">Further information: <a href="/wiki/List_of_apple_dishes" title="List of apple dishes">List of apple dishes</a></div>
+<figure class="mw-default-size mw-halign-left" typeof="mw:File/Thumb"><a href="/wiki/File:Paring,_slicing_and_coring_machine_%E2%80%A2_p279_%E2%80%A2_Scammell%27s_Cyclopedia.tif" class="mw-file-description"><img src="//upload.wikimedia.org/wikipedia/commons/thumb/a/a3/Paring%2C_slicing_and_coring_machine_%E2%80%A2_p279_%E2%80%A2_Scammell%27s_Cyclopedia.tif/lossy-page1-220px-Paring%2C_slicing_and_coring_machine_%E2%80%A2_p279_%E2%80%A2_Scammell%27s_Cyclopedia.tif.jpg" decoding="async" width="220" height="173" class="mw-file-element" srcset="//upload.wikimedia.org/wikipedia/commons/thumb/a/a3/Paring%2C_slicing_and_coring_machine_%E2%80%A2_p279_%E2%80%A2_Scammell%27s_Cyclopedia.tif/lossy-page1-330px-Paring%2C_slicing_and_coring_machine_%E2%80%A2_p279_%E2%80%A2_Scammell%27s_Cyclopedia.tif.jpg 1.5x, //upload.wikimedia.org/wikipedia/commons/thumb/a/a3/Paring%2C_slicing_and_coring_machine_%E2%80%A2_p279_%E2%80%A2_Scammell%27s_Cyclopedia.tif/lossy-page1-440px-Paring%2C_slicing_and_coring_machine_%E2%80%A2_p279_%E2%80%A2_Scammell%27s_Cyclopedia.tif.jpg 2x" data-file-width="1350" data-file-height="1060"></a><figcaption>Machine for paring, coring, and slicing apples, from Henry B. Scammell's 1897 handbook <i>Cyclopedia of Valuable Receipts</i></figcaption></figure>
+<p>Apple varieties can be grouped as <a href="/wiki/Cooking_apple" title="Cooking apple">cooking apples</a>, <a href="/wiki/Table_apple" title="Table apple">eating apples</a>, and <a href="/wiki/Cider_apple" title="Cider apple">cider apples</a>, the last so astringent as to be "almost inedible".<sup id="cite_ref-Davidson_2014_82-0" class="reference"><a href="#cite_note-Davidson_2014-82"><span class="cite-bracket">[</span>82<span class="cite-bracket">]</span></a></sup> Apples are consumed as <a href="/wiki/Apple_juice" title="Apple juice">juice</a>, raw in salads, baked in <a href="/wiki/Apple_pie" title="Apple pie">pies</a>, cooked into <a href="/wiki/Apple_sauce" title="Apple sauce">sauces</a> and <a href="/wiki/Apple_butter" title="Apple butter">apple butter</a>, or baked.<sup id="cite_ref-83" class="reference"><a href="#cite_note-83"><span class="cite-bracket">[</span>83<span class="cite-bracket">]</span></a></sup> They are sometimes used as an ingredient in savory foods, such as sausage and stuffing.<sup id="cite_ref-84" class="reference"><a href="#cite_note-84"><span class="cite-bracket">[</span>84<span class="cite-bracket">]</span></a></sup>
+</p><p>Several techniques are used to preserve apples and apple products. Traditional methods include drying and making <a href="/wiki/Apple_butter" title="Apple butter">apple butter</a>.<sup id="cite_ref-Davidson_2014_82-1" class="reference"><a href="#cite_note-Davidson_2014-82"><span class="cite-bracket">[</span>82<span class="cite-bracket">]</span></a></sup> Juice and cider are produced commercially; cider is a significant industry in regions such as the <a href="/wiki/West_of_England" title="West of England">West of England</a> and <a href="/wiki/Normandy" title="Normandy">Normandy</a>.<sup id="cite_ref-Davidson_2014_82-2" class="reference"><a href="#cite_note-Davidson_2014-82"><span class="cite-bracket">[</span>82<span class="cite-bracket">]</span></a></sup>
+</p><p>A <a href="/wiki/Toffee_apple" class="mw-redirect" title="Toffee apple">toffee apple</a> (UK) or <a href="/wiki/Caramel_apple" title="Caramel apple">caramel apple</a> (US) is a confection made by coating an apple in hot <a href="/wiki/Toffee" title="Toffee">toffee</a> or <a href="/wiki/Caramel" title="Caramel">caramel</a> candy respectively and allowing it to cool.<sup id="cite_ref-85" class="reference"><a href="#cite_note-85"><span class="cite-bracket">[</span>85<span class="cite-bracket">]</span></a></sup><sup id="cite_ref-Lim_2012_8-2" class="reference"><a href="#cite_note-Lim_2012-8"><span class="cite-bracket">[</span>8<span class="cite-bracket">]</span></a></sup> <a href="/wiki/Apples_and_honey" title="Apples and honey">Apples and honey</a> are a ritual <a href="/wiki/Food_pairing" title="Food pairing">food pairing</a> eaten during the Jewish New Year of <a href="/wiki/Rosh_Hashanah" title="Rosh Hashanah">Rosh Hashanah</a>.<sup id="cite_ref-86" class="reference"><a href="#cite_note-86"><span class="cite-bracket">[</span>86<span class="cite-bracket">]</span></a></sup>
+</p><p>Apples are an important ingredient in many desserts, such as <a href="/wiki/Apple_pie" title="Apple pie">pies</a>, <a href="/wiki/Crumble" title="Crumble">crumbles</a>, and <a href="/wiki/Apple_cake" title="Apple cake">cakes</a>. When cooked, some apple cultivars easily form a puree known as <a href="/wiki/Apple_sauce" title="Apple sauce">apple sauce</a>, which can be cooked down to form a preserve, apple butter. They are often <a href="/wiki/Baked" class="mw-redirect" title="Baked">baked</a> or <a href="/wiki/Stewed" class="mw-redirect" title="Stewed">stewed</a>, and are cooked in some meat dishes.<sup id="cite_ref-Davidson_2014_82-3" class="reference"><a href="#cite_note-Davidson_2014-82"><span class="cite-bracket">[</span>82<span class="cite-bracket">]</span></a></sup>
+</p>
+<link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1235681985"><style data-mw-deduplicate="TemplateStyles:r1237033735">@media print{body.ns-0 .mw-parser-output .sistersitebox{display:none!important}}@media screen{html.skin-theme-clientpref-night .mw-parser-output .sistersitebox img[src*="Wiktionary-logo-en-v2.svg"]{background-color:white}}@media screen and (prefers-color-scheme:dark){html.skin-theme-clientpref-os .mw-parser-output .sistersitebox img[src*="Wiktionary-logo-en-v2.svg"]{background-color:white}}</style><div class="side-box side-box-right plainlinks sistersitebox"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1126788409">
+<div class="side-box-flex">
+<div class="side-box-image"><span class="noviewer" typeof="mw:File"><span><img alt="" src="//upload.wikimedia.org/wikipedia/commons/thumb/d/df/Wikibooks-logo-en-noslogan.svg/40px-Wikibooks-logo-en-noslogan.svg.png" decoding="async" width="40" height="40" class="mw-file-element" srcset="//upload.wikimedia.org/wikipedia/commons/thumb/d/df/Wikibooks-logo-en-noslogan.svg/60px-Wikibooks-logo-en-noslogan.svg.png 1.5x, //upload.wikimedia.org/wikipedia/commons/thumb/d/df/Wikibooks-logo-en-noslogan.svg/80px-Wikibooks-logo-en-noslogan.svg.png 2x" data-file-width="400" data-file-height="400"></span></span></div>
+<div class="side-box-text plainlist">Wikibooks <a href="https://en.wikibooks.org/wiki/Cookbook" class="extiw" title="wikibooks:Cookbook">Cookbook</a> has a recipe/module on
+<link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1126788409"><div class="plainlist" style="margin-left: 1.6em;">
+<ul><li><i><b><a href="https://en.wikibooks.org/wiki/Cookbook:Apple" class="extiw" title="wikibooks:Cookbook:Apple"> Apple</a></b></i></li></ul>
+</div></div></div>
+</div>
+<p>Apples are <a href="/wiki/Cider_mill" title="Cider mill">milled</a> or <a href="/wiki/Fruit_press#Cider_press" title="Fruit press">pressed</a> to produce <a href="/wiki/Apple_juice" title="Apple juice">apple juice</a>, which may be drunk unfiltered (called <a href="/wiki/Apple_cider" title="Apple cider">apple cider</a> in North America), or filtered. Filtered juice is often concentrated and frozen, then reconstituted later and consumed. Apple juice can be <a href="/wiki/Fermentation_(food)" class="mw-redirect" title="Fermentation (food)">fermented</a> to make <a href="/wiki/Cider" title="Cider">cider</a> (called hard cider in North America), <a href="/wiki/Ciderkin" title="Ciderkin">ciderkin</a>, and vinegar.<sup id="cite_ref-Lim_2012_8-3" class="reference"><a href="#cite_note-Lim_2012-8"><span class="cite-bracket">[</span>8<span class="cite-bracket">]</span></a></sup> Through <a href="/wiki/Distillation" title="Distillation">distillation</a>, various alcoholic beverages can be produced, such as <a href="/wiki/Applejack_(beverage)" class="mw-redirect" title="Applejack (beverage)">applejack</a>, <a href="/wiki/Calvados" title="Calvados">Calvados</a>, and <a href="/wiki/Apple_brandy" class="mw-redirect" title="Apple brandy">apple brandy</a>.<sup id="cite_ref-Lim_2012_8-4" class="reference"><a href="#cite_note-Lim_2012-8"><span class="cite-bracket">[</span>8<span class="cite-bracket">]</span></a></sup><sup id="cite_ref-87" class="reference"><a href="#cite_note-87"><span class="cite-bracket">[</span>87<span class="cite-bracket">]</span></a></sup>
+</p>
+<div class="mw-heading mw-heading3"><h3 id="Organic_production">Organic production</h3></div>
+<p><a href="/wiki/Organic_farming" title="Organic farming">Organic</a> apples are commonly produced in the United States.<sup id="cite_ref-organic_88-0" class="reference"><a href="#cite_note-organic-88"><span class="cite-bracket">[</span>88<span class="cite-bracket">]</span></a></sup> Due to infestations by key insects and diseases, organic production is difficult in Europe.<sup id="cite_ref-croplife_89-0" class="reference"><a href="#cite_note-croplife-89"><span class="cite-bracket">[</span>89<span class="cite-bracket">]</span></a></sup> The use of pesticides containing chemicals, such as sulfur, copper, microorganisms, viruses, clay powders, or plant extracts (<a href="/wiki/Pyrethrum" title="Pyrethrum">pyrethrum</a>, <a href="/wiki/Neem" class="mw-redirect" title="Neem">neem</a>) has been approved by the EU Organic Standing Committee to improve organic yield and quality.<sup id="cite_ref-croplife_89-1" class="reference"><a href="#cite_note-croplife-89"><span class="cite-bracket">[</span>89<span class="cite-bracket">]</span></a></sup> A light coating of <a href="/wiki/Kaolin" class="mw-redirect" title="Kaolin">kaolin</a>, which forms a physical barrier to some pests, also may help prevent apple sun scalding.<sup id="cite_ref-Polomski_&amp;_Reighard_48-3" class="reference"><a href="#cite_note-Polomski_&amp;_Reighard-48"><span class="cite-bracket">[</span>48<span class="cite-bracket">]</span></a></sup>
+</p>
+<div class="mw-heading mw-heading3"><h3 id="Non-browning_apples">Non-browning apples</h3></div>
+<p>Apple skins and seeds contain <a href="/wiki/Polyphenol" title="Polyphenol">polyphenols</a>.<sup id="cite_ref-Ribeiro2014_90-0" class="reference"><a href="#cite_note-Ribeiro2014-90"><span class="cite-bracket">[</span>90<span class="cite-bracket">]</span></a></sup> These are oxidised by the <a href="/wiki/Enzyme" title="Enzyme">enzyme</a> <a href="/wiki/Polyphenol_oxidase" title="Polyphenol oxidase">polyphenol oxidase</a>, which causes <a href="/wiki/Food_browning" title="Food browning">browning</a> in sliced or bruised apples, by <a href="/wiki/Catalysis" title="Catalysis">catalyzing</a> the <a href="/wiki/Oxidation" class="mw-redirect" title="Oxidation">oxidation</a> of phenolic compounds to <a href="/wiki/O-quinone" class="mw-redirect" title="O-quinone">o-quinones</a>, a browning factor.<sup id="cite_ref-nic_91-0" class="reference"><a href="#cite_note-nic-91"><span class="cite-bracket">[</span>91<span class="cite-bracket">]</span></a></sup> Browning reduces apple taste, color, and food value. 
<a href="/wiki/Arctic_apples" class="mw-redirect" title="Arctic apples">Arctic apples</a>, a non-browning group of apples introduced to the United States market in 2019, have been <a href="/wiki/Genetically_modified_food" title="Genetically modified food">genetically modified</a> to silence the <a href="/wiki/Gene_expression" title="Gene expression">expression</a> of polyphenol oxidase, thereby delaying a browning effect and improving apple eating quality.<sup id="cite_ref-92" class="reference"><a href="#cite_note-92"><span class="cite-bracket">[</span>92<span class="cite-bracket">]</span></a></sup><sup id="cite_ref-93" class="reference"><a href="#cite_note-93"><span class="cite-bracket">[</span>93<span class="cite-bracket">]</span></a></sup> The US <a href="/wiki/Food_and_Drug_Administration" title="Food and Drug Administration">Food and Drug Administration</a> in 2015, and <a href="/wiki/Canadian_Food_Inspection_Agency" title="Canadian Food Inspection Agency">Canadian Food Inspection Agency</a> in 2017, determined that Arctic apples are as safe and nutritious as conventional apples.<sup id="cite_ref-fda2015_94-0" class="reference"><a href="#cite_note-fda2015-94"><span class="cite-bracket">[</span>94<span class="cite-bracket">]</span></a></sup><sup id="cite_ref-cfia_95-0" class="reference"><a href="#cite_note-cfia-95"><span class="cite-bracket">[</span>95<span class="cite-bracket">]</span></a></sup>
+</p>
+<div class="mw-heading mw-heading3"><h3 id="Other_products">Other products</h3></div>
+<p><a href="/wiki/Apple_seed_oil" title="Apple seed oil">Apple seed oil</a> is obtained by <a href="/wiki/Expeller_pressing" title="Expeller pressing">pressing</a> apple seeds for manufacturing <a href="/wiki/Cosmetics" title="Cosmetics">cosmetics</a>.<sup id="cite_ref-96" class="reference"><a href="#cite_note-96"><span class="cite-bracket">[</span>96<span class="cite-bracket">]</span></a></sup>
+</p>
+<div class="mw-heading mw-heading2"><h2 id="In_culture">In culture</h2></div>
+<link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1236090951"><div role="note" class="hatnote navigation-not-searchable">Main article: <a href="/wiki/Apple_(symbolism)" title="Apple (symbolism)">Apple (symbolism)</a></div>
+<div class="mw-heading mw-heading3"><h3 id="Germanic_paganism">Germanic paganism</h3></div>
+<figure class="mw-default-size" typeof="mw:File/Thumb"><a href="/wiki/File:Carl_Larsson_Brita_as_Iduna.jpg" class="mw-file-description"><img alt="Illustration of girl in a red dress, holding 3 candles in one hand and a basket of apples in the other" src="//upload.wikimedia.org/wikipedia/commons/thumb/1/11/Carl_Larsson_Brita_as_Iduna.jpg/170px-Carl_Larsson_Brita_as_Iduna.jpg" decoding="async" width="170" height="240" class="mw-file-element" srcset="//upload.wikimedia.org/wikipedia/commons/thumb/1/11/Carl_Larsson_Brita_as_Iduna.jpg/255px-Carl_Larsson_Brita_as_Iduna.jpg 1.5x, //upload.wikimedia.org/wikipedia/commons/thumb/1/11/Carl_Larsson_Brita_as_Iduna.jpg/340px-Carl_Larsson_Brita_as_Iduna.jpg 2x" data-file-width="390" data-file-height="550"></a><figcaption>"Brita as <a href="/wiki/I%C3%B0unn" title="Iðunn">Iduna</a>" (1901) by <a href="/wiki/Carl_Larsson" title="Carl Larsson">Carl Larsson</a></figcaption></figure>
+<p>In <a href="/wiki/Norse_mythology" title="Norse mythology">Norse mythology</a>, the goddess <a href="/wiki/I%C3%B0unn" title="Iðunn">Iðunn</a> is portrayed in the <i><a href="/wiki/Prose_Edda" title="Prose Edda">Prose Edda</a></i> (written in the 13th century by <a href="/wiki/Snorri_Sturluson" title="Snorri Sturluson">Snorri Sturluson</a>) as providing apples to the <a href="/wiki/Gods" class="mw-redirect" title="Gods">gods</a> that give them <a href="/wiki/Eternal_youth" title="Eternal youth">eternal youthfulness</a>. The English scholar <a href="/wiki/H._R._Ellis_Davidson" class="mw-redirect" title="H. R. Ellis Davidson">H. R. Ellis Davidson</a> links apples to religious practices in <a href="/wiki/Germanic_paganism" title="Germanic paganism">Germanic paganism</a>, from which <a href="/wiki/Norse_paganism" class="mw-redirect" title="Norse paganism">Norse paganism</a> developed. She points out that buckets of apples were found in the <a href="/wiki/Oseberg_ship" class="mw-redirect" title="Oseberg ship">Oseberg ship</a> burial site in Norway, that fruit and nuts (Iðunn having been described as being transformed into a nut in <i><a href="/wiki/Sk%C3%A1ldskaparm%C3%A1l" title="Skáldskaparmál">Skáldskaparmál</a></i>) have been found in the early graves of the <a href="/wiki/Germanic_peoples" title="Germanic peoples">Germanic peoples</a> in England and elsewhere on the continent of Europe, which may have had a symbolic meaning, and that nuts are still a recognized symbol of <a href="/wiki/Fertility" title="Fertility">fertility</a> in southwest England.<sup id="cite_ref-Davidson_1990_97-0" class="reference"><a href="#cite_note-Davidson_1990-97"><span class="cite-bracket">[</span>97<span class="cite-bracket">]</span></a></sup>
+</p><p>Davidson notes a connection between apples and the <a href="/wiki/Vanir" title="Vanir">Vanir</a>, a tribe of gods associated with <a href="/wiki/Fertility" title="Fertility">fertility</a> in Norse mythology, citing an instance of eleven "golden apples" being given to woo the beautiful <a href="/wiki/Ger%C3%B0r" title="Gerðr">Gerðr</a> by <a href="/wiki/Sk%C3%ADrnir" title="Skírnir">Skírnir</a>, who was acting as messenger for the major Vanir god <a href="/wiki/Freyr" title="Freyr">Freyr</a> in stanzas 19 and 20 of <i><a href="/wiki/Sk%C3%ADrnism%C3%A1l" title="Skírnismál">Skírnismál</a></i>. Davidson also notes a further connection between fertility and apples in Norse mythology in chapter 2 of the <i><a href="/wiki/V%C3%B6lsunga_saga" title="Völsunga saga">Völsunga saga</a></i>: when the major goddess <a href="/wiki/Frigg" title="Frigg">Frigg</a> sends King <a href="/wiki/Rerir" title="Rerir">Rerir</a> an apple after he prays to Odin for a child, Frigg's messenger (in the guise of a crow) drops the apple in his lap as he sits atop a <a href="/wiki/Tumulus" title="Tumulus">mound</a>.<sup id="cite_ref-Davidson_1990_97-1" class="reference"><a href="#cite_note-Davidson_1990-97"><span class="cite-bracket">[</span>97<span class="cite-bracket">]</span></a></sup> Rerir's wife's consumption of the apple results in a six-year pregnancy and the birth (by <a href="/wiki/Caesarean_section" title="Caesarean section">Caesarean section</a>) of their son—the hero <a href="/wiki/V%C3%B6lsung" title="Völsung">Völsung</a>.<sup id="cite_ref-98" class="reference"><a href="#cite_note-98"><span class="cite-bracket">[</span>98<span class="cite-bracket">]</span></a></sup>
+</p><p>Further, Davidson points out the "strange" phrase "Apples of <a href="/wiki/Hel_(location)" title="Hel (location)">Hel</a>" used in an 11th-century poem by the <a href="/wiki/Skald" title="Skald">skald</a> Thorbiorn Brúnarson. She states this may imply that the apple was thought of by Brúnarson as the food of the dead. Further, Davidson notes that the potentially Germanic goddess <a href="/wiki/Nehalennia" title="Nehalennia">Nehalennia</a> is sometimes depicted with apples and that parallels exist in early Irish stories. Davidson asserts that while cultivation of the apple in Northern Europe extends back to at least the time of the <a href="/wiki/Roman_Empire" title="Roman Empire">Roman Empire</a> and came to Europe from the <a href="/wiki/Near_East" title="Near East">Near East</a>, the native varieties of apple trees growing in Northern Europe are small and bitter. Davidson concludes that in the figure of Iðunn "we must have a dim reflection of an old symbol: that of the guardian goddess of the life-giving fruit of the other world."<sup id="cite_ref-Davidson_1990_97-2" class="reference"><a href="#cite_note-Davidson_1990-97"><span class="cite-bracket">[</span>97<span class="cite-bracket">]</span></a></sup>
+</p>
+<div class="mw-heading mw-heading3"><h3 id="Greek_mythology">Greek mythology</h3></div>
+<figure class="mw-default-size mw-halign-right" typeof="mw:File/Thumb"><a href="/wiki/File:Hercules_Musei_Capitolini_MC1265_n2.jpg" class="mw-file-description"><img src="//upload.wikimedia.org/wikipedia/commons/thumb/4/4d/Hercules_Musei_Capitolini_MC1265_n2.jpg/170px-Hercules_Musei_Capitolini_MC1265_n2.jpg" decoding="async" width="170" height="298" class="mw-file-element" srcset="//upload.wikimedia.org/wikipedia/commons/thumb/4/4d/Hercules_Musei_Capitolini_MC1265_n2.jpg/255px-Hercules_Musei_Capitolini_MC1265_n2.jpg 1.5x, //upload.wikimedia.org/wikipedia/commons/thumb/4/4d/Hercules_Musei_Capitolini_MC1265_n2.jpg/340px-Hercules_Musei_Capitolini_MC1265_n2.jpg 2x" data-file-width="564" data-file-height="990"></a><figcaption><a href="/wiki/Heracles" title="Heracles">Heracles</a> with the apple of <a href="/wiki/Hesperides" title="Hesperides">Hesperides</a> </figcaption></figure>
+<p>Apples appear in many <a href="/wiki/World_religions" title="World religions">religious traditions</a>, including Greek and Roman <a href="/wiki/Mythology" class="mw-redirect" title="Mythology">mythology</a> where they have an ambiguous symbolism of discord, fertility, or courtship.<sup id="cite_ref-99" class="reference"><a href="#cite_note-99"><span class="cite-bracket">[</span>99<span class="cite-bracket">]</span></a></sup> In <a href="/wiki/Greek_mythology" title="Greek mythology">Greek mythology</a>, the <a href="/wiki/Greek_hero" class="mw-redirect" title="Greek hero">Greek hero</a> <a href="/wiki/Heracles" title="Heracles">Heracles</a>, as a part of his <a href="/wiki/Twelve_Labours" class="mw-redirect" title="Twelve Labours">Twelve Labours</a>, was required to travel to the Garden of the Hesperides and pick the golden apples off the <a href="/wiki/Hesperides#The_Garden_of_the_Hesperides" title="Hesperides">Tree of Life</a> growing at its center.<sup id="cite_ref-Ruck_2001_100-0" class="reference"><a href="#cite_note-Ruck_2001-100"><span class="cite-bracket">[</span>100<span class="cite-bracket">]</span></a></sup>
+</p><p>The Greek goddess of discord, <a href="/wiki/Eris_(mythology)" title="Eris (mythology)">Eris</a>, became disgruntled after she was excluded from the wedding of <a href="/wiki/Peleus" title="Peleus">Peleus</a> and <a href="/wiki/Thetis" title="Thetis">Thetis</a>.<sup id="cite_ref-101" class="reference"><a href="#cite_note-101"><span class="cite-bracket">[</span>101<span class="cite-bracket">]</span></a></sup> In retaliation, she tossed a <a href="/wiki/Apple_of_Discord" title="Apple of Discord">golden apple</a> inscribed <a href="/wiki/Kallisti" class="mw-redirect" title="Kallisti">Καλλίστη</a> (<i>Kallistē</i>, "For the most beautiful one"), into the wedding party. Three goddesses claimed the apple: <a href="/wiki/Hera" title="Hera">Hera</a>, <a href="/wiki/Athena" title="Athena">Athena</a>, and <a href="/wiki/Aphrodite" title="Aphrodite">Aphrodite</a>. <a href="/wiki/Paris_(mythology)" title="Paris (mythology)">Paris</a> of <a href="/wiki/Troy" title="Troy">Troy</a> was appointed to select the recipient. After Paris had been offered bribes by both Hera and Athena, Aphrodite tempted him with the most beautiful woman in the world, <a href="/wiki/Helen_of_Troy" title="Helen of Troy">Helen</a> of <a href="/wiki/Sparta" title="Sparta">Sparta</a>. He awarded the apple to Aphrodite, thus indirectly causing the <a href="/wiki/Trojan_War" title="Trojan War">Trojan War</a>.<sup id="cite_ref-102" class="reference"><a href="#cite_note-102"><span class="cite-bracket">[</span>102<span class="cite-bracket">]</span></a></sup><sup id="cite_ref-103" class="reference"><a href="#cite_note-103"><span class="cite-bracket">[</span>103<span class="cite-bracket">]</span></a></sup>
+</p><p>The apple was thus considered, in ancient Greece, sacred to Aphrodite. To throw an apple at someone was to symbolically declare one's love; and similarly, to catch it was to symbolically show one's acceptance of that love. An epigram claiming authorship by Plato states:<sup id="cite_ref-104" class="reference"><a href="#cite_note-104"><span class="cite-bracket">[</span>104<span class="cite-bracket">]</span></a></sup>
+</p>
+<style data-mw-deduplicate="TemplateStyles:r1244412712">.mw-parser-output .templatequote{overflow:hidden;margin:1em 0;padding:0 32px}.mw-parser-output .templatequotecite{line-height:1.5em;text-align:left;margin-top:0}@media(min-width:500px){.mw-parser-output .templatequotecite{padding-left:1.6em}}</style><blockquote class="templatequote"><p>I throw the apple at you, and if you are willing to love me, take it and share your girlhood with me; but if your thoughts are what I pray they are not, even then take it, and consider how short-lived is beauty.</p><div class="templatequotecite">— <cite><a href="/wiki/Plato" title="Plato">Plato</a>, Epigram VII</cite></div></blockquote>
+<p><a href="/wiki/Atalanta" title="Atalanta">Atalanta</a>, also of Greek mythology, raced all her suitors in an attempt to avoid marriage. She outran all but <a href="/wiki/Hippomenes" title="Hippomenes">Hippomenes</a> (also known as <a href="/wiki/Melanion" class="mw-redirect" title="Melanion">Melanion</a>, a name possibly derived from <i>melon</i>, the Greek word for both "apple" and fruit in general),<sup id="cite_ref-Ruck_2001_100-1" class="reference"><a href="#cite_note-Ruck_2001-100"><span class="cite-bracket">[</span>100<span class="cite-bracket">]</span></a></sup> who defeated her by cunning, not speed. Hippomenes knew that he could not win in a fair race, so he used three golden apples (gifts of Aphrodite, the goddess of love) to distract Atalanta. It took all three apples and all of his speed, but Hippomenes was finally successful, winning the race and Atalanta's hand.<sup id="cite_ref-105" class="reference"><a href="#cite_note-105"><span class="cite-bracket">[</span>105<span class="cite-bracket">]</span></a></sup><sup id="cite_ref-106" class="reference"><a href="#cite_note-106"><span class="cite-bracket">[</span>106<span class="cite-bracket">]</span></a></sup>
+</p>
+<div class="mw-heading mw-heading3"><h3 id="Celtic_mythology">Celtic mythology</h3></div>
+<p>In <a href="/wiki/Celtic_mythology" title="Celtic mythology">Celtic mythology</a>, the <a href="/wiki/Otherworld" title="Otherworld">otherworld</a> has many names, including <i>Emain Ablach</i>, "Emain of the Apple-trees". A version of this is <a href="/wiki/Avalon" title="Avalon">Avalon</a> in <a href="/wiki/Arthurian_legend" class="mw-redirect" title="Arthurian legend">Arthurian legend</a>, or in <a href="/wiki/Welsh_language" title="Welsh language">Welsh</a> <i>Ynys Afallon</i>, "Island of Apples".<sup id="cite_ref-107" class="reference"><a href="#cite_note-107"><span class="cite-bracket">[</span>107<span class="cite-bracket">]</span></a></sup>
+</p>
+<div class="mw-heading mw-heading3"><h3 id="China">China</h3></div>
+<figure class="mw-default-size" typeof="mw:File/Thumb"><a href="/wiki/File:Christmas_apples_at_FamilyMart_Beijing_West_Railway_Station_store_(20171224194116).jpg" class="mw-file-description"><img src="//upload.wikimedia.org/wikipedia/commons/thumb/9/9b/Christmas_apples_at_FamilyMart_Beijing_West_Railway_Station_store_%2820171224194116%29.jpg/220px-Christmas_apples_at_FamilyMart_Beijing_West_Railway_Station_store_%2820171224194116%29.jpg" decoding="async" width="219" height="151" class="mw-file-element" srcset="//upload.wikimedia.org/wikipedia/commons/thumb/9/9b/Christmas_apples_at_FamilyMart_Beijing_West_Railway_Station_store_%2820171224194116%29.jpg/330px-Christmas_apples_at_FamilyMart_Beijing_West_Railway_Station_store_%2820171224194116%29.jpg 1.5x, //upload.wikimedia.org/wikipedia/commons/thumb/9/9b/Christmas_apples_at_FamilyMart_Beijing_West_Railway_Station_store_%2820171224194116%29.jpg/440px-Christmas_apples_at_FamilyMart_Beijing_West_Railway_Station_store_%2820171224194116%29.jpg 2x" data-file-width="2981" data-file-height="2051"></a><figcaption><i>Píngānguǒ</i> ("Peace apples") on sale in Beijing for Christmas Eve (2017)</figcaption></figure>
+<p>In China, apples symbolise <a href="/wiki/Peace" title="Peace">peace</a>, since the sounds of the first element ("píng") in the words "apple" (苹果, <i>Píngguǒ</i>) and "peace" (平安, <i>Píng'ān</i>) are <a href="/wiki/Homophone" title="Homophone">homophonous</a> in Mandarin and Cantonese.<sup id="cite_ref-Lisa_Lim_3-1" class="reference"><a href="#cite_note-Lisa_Lim-3"><span class="cite-bracket">[</span>3<span class="cite-bracket">]</span></a></sup><sup id="cite_ref-English_in_China_108-0" class="reference"><a href="#cite_note-English_in_China-108"><span class="cite-bracket">[</span>108<span class="cite-bracket">]</span></a></sup> When these two words are combined, the word <i>Píngānguǒ</i> (平安果, "Peace apples") is formed. This association developed further as the name for <a href="/wiki/Christmas_Eve" title="Christmas Eve">Christmas Eve</a> in Mandarin is <i>Píngānyè</i> (平安夜, "Peaceful/Quiet Evening"), which made the <a href="/wiki/Gift" title="Gift">gifting</a> of apples at this season to friends and associates popular, as a way to wish them peace and safety.<sup id="cite_ref-English_in_China_108-1" class="reference"><a href="#cite_note-English_in_China-108"><span class="cite-bracket">[</span>108<span class="cite-bracket">]</span></a></sup>
+</p>
+<div class="mw-heading mw-heading3"><h3 id="Christian_art">Christian art</h3></div>
+<figure class="mw-default-size" typeof="mw:File/Thumb"><a href="/wiki/File:Albrecht_D%C3%BCrer_-_Adam_and_Eve_(Prado)_2.jpg" class="mw-file-description"><img src="//upload.wikimedia.org/wikipedia/commons/thumb/a/a2/Albrecht_D%C3%BCrer_-_Adam_and_Eve_%28Prado%29_2.jpg/220px-Albrecht_D%C3%BCrer_-_Adam_and_Eve_%28Prado%29_2.jpg" decoding="async" width="220" height="276" class="mw-file-element" srcset="//upload.wikimedia.org/wikipedia/commons/thumb/a/a2/Albrecht_D%C3%BCrer_-_Adam_and_Eve_%28Prado%29_2.jpg/330px-Albrecht_D%C3%BCrer_-_Adam_and_Eve_%28Prado%29_2.jpg 1.5x, //upload.wikimedia.org/wikipedia/commons/thumb/a/a2/Albrecht_D%C3%BCrer_-_Adam_and_Eve_%28Prado%29_2.jpg/440px-Albrecht_D%C3%BCrer_-_Adam_and_Eve_%28Prado%29_2.jpg 2x" data-file-width="2337" data-file-height="2934"></a><figcaption><i><a href="/wiki/Adam_and_Eve" title="Adam and Eve">Adam and Eve</a></i> by <a href="/wiki/Albrecht_D%C3%BCrer" title="Albrecht Dürer">Albrecht Dürer</a> (1507), showcasing the apple as a symbol of sin</figcaption></figure>
+<p>Though the <a href="/wiki/Forbidden_fruit" title="Forbidden fruit">forbidden fruit</a> of <a href="/wiki/Garden_of_Eden" title="Garden of Eden">Eden</a> in the <a href="/wiki/Book_of_Genesis" title="Book of Genesis">Book of Genesis</a> is not identified, popular Christian tradition has held that it was an apple that <a href="/wiki/Eve" title="Eve">Eve</a> coaxed <a href="/wiki/Adam" title="Adam">Adam</a> to share with her.<sup id="cite_ref-Macrone_109-0" class="reference"><a href="#cite_note-Macrone-109"><span class="cite-bracket">[</span>109<span class="cite-bracket">]</span></a></sup> The origin of the popular identification with a fruit unknown in the Middle East in biblical times is found in wordplay with the <a href="/wiki/Latin" title="Latin">Latin</a> words <i>mālum</i> (an apple) and <i>mălum</i> (an evil), each of which is normally written <i>malum</i>.<sup id="cite_ref-110" class="reference"><a href="#cite_note-110"><span class="cite-bracket">[</span>110<span class="cite-bracket">]</span></a></sup> The tree of the forbidden fruit is called "the tree of the knowledge of good and evil" in Genesis 2:17,<sup id="cite_ref-111" class="reference"><a href="#cite_note-111"><span class="cite-bracket">[</span>111<span class="cite-bracket">]</span></a></sup> and the Latin for "good and evil" is <i>bonum et malum</i>.<sup id="cite_ref-112" class="reference"><a href="#cite_note-112"><span class="cite-bracket">[</span>112<span class="cite-bracket">]</span></a></sup>
+</p><p><a href="/wiki/Renaissance" title="Renaissance">Renaissance</a> painters may also have been influenced by the story of the <a href="/wiki/Golden_apple" title="Golden apple">golden apples</a> in the <a href="/wiki/Hesperides#The_Garden_of_the_Hesperides" title="Hesperides">Garden of Hesperides</a>. As a result, in the story of Adam and Eve, the apple became a symbol for knowledge, immortality, temptation, the fall of man into sin, and sin itself. The <a href="/wiki/Larynx" title="Larynx">larynx</a> in the human throat has been called the "<a href="/wiki/Adam%27s_apple" title="Adam's apple">Adam's apple</a>" because of a notion that it was caused by the forbidden fruit remaining in the throat of Adam. The apple as a symbol of sexual <a href="/wiki/Seduction" title="Seduction">seduction</a> has been used to imply human sexuality, possibly in an ironic vein.<sup id="cite_ref-Macrone_109-1" class="reference"><a href="#cite_note-Macrone-109"><span class="cite-bracket">[</span>109<span class="cite-bracket">]</span></a></sup>
+</p>
+<div class="mw-heading mw-heading3"><h3 id="Proverb">Proverb</h3></div>
+<p>The <a href="/wiki/Proverb" title="Proverb">proverb</a>, "<a href="/wiki/An_apple_a_day_keeps_the_doctor_away" title="An apple a day keeps the doctor away">An apple a day keeps the doctor away</a>", addressing the supposed health benefits of the fruit, has been traced to 19th-century <a href="/wiki/Wales" title="Wales">Wales</a>, where the original phrase was "Eat an apple on going to bed, and you'll keep the doctor from earning his bread".<sup id="cite_ref-113" class="reference"><a href="#cite_note-113"><span class="cite-bracket">[</span>113<span class="cite-bracket">]</span></a></sup> In the 19th century and early 20th, the phrase evolved to "an apple a day, no doctor to pay" and "an apple a day sends the doctor away"; the phrasing now commonly used was first recorded in 1922.<sup id="cite_ref-114" class="reference"><a href="#cite_note-114"><span class="cite-bracket">[</span>114<span class="cite-bracket">]</span></a></sup>
+</p>
+<div class="mw-heading mw-heading2"><h2 id="See_also">See also</h2></div>
+<ul><li><a href="/wiki/Apple_chip" title="Apple chip">Apple chip</a></li>
+<li><a href="/wiki/Applecrab" title="Applecrab">Applecrab</a>, apple–crabapple hybrids for eating</li>
+<li><a href="/wiki/Johnny_Appleseed" title="Johnny Appleseed">Johnny Appleseed</a></li></ul>
+<div class="mw-heading mw-heading2"><h2 id="References">References</h2></div>
+<style data-mw-deduplicate="TemplateStyles:r1239543626">.mw-parser-output .reflist{margin-bottom:0.5em;list-style-type:decimal}@media screen{.mw-parser-output .reflist{font-size:90%}}.mw-parser-output .reflist .references{font-size:100%;margin-bottom:0;list-style-type:inherit}.mw-parser-output .reflist-columns-2{column-width:30em}.mw-parser-output .reflist-columns-3{column-width:25em}.mw-parser-output .reflist-columns{margin-top:0.3em}.mw-parser-output .reflist-columns ol{margin-top:0}.mw-parser-output .reflist-columns li{page-break-inside:avoid;break-inside:avoid-column}.mw-parser-output .reflist-upper-alpha{list-style-type:upper-alpha}.mw-parser-output .reflist-upper-roman{list-style-type:upper-roman}.mw-parser-output .reflist-lower-alpha{list-style-type:lower-alpha}.mw-parser-output .reflist-lower-greek{list-style-type:lower-greek}.mw-parser-output .reflist-lower-roman{list-style-type:lower-roman}</style><div class="reflist">
+<div class="mw-references-wrap mw-references-columns"><ol class="references">
+<li id="cite_note-FNA-1"><span class="mw-cite-backlink">^ <a href="#cite_ref-FNA_1-0"><span class="cite-accessibility-label">Jump up to: </span><sup><i><b>a</b></i></sup></a> <a href="#cite_ref-FNA_1-1"><sup><i><b>b</b></i></sup></a> <a href="#cite_ref-FNA_1-2"><sup><i><b>c</b></i></sup></a> <a href="#cite_ref-FNA_1-3"><sup><i><b>d</b></i></sup></a> <a href="#cite_ref-FNA_1-4"><sup><i><b>e</b></i></sup></a> <a href="#cite_ref-FNA_1-5"><sup><i><b>f</b></i></sup></a> <a href="#cite_ref-FNA_1-6"><sup><i><b>g</b></i></sup></a> <a href="#cite_ref-FNA_1-7"><sup><i><b>h</b></i></sup></a> <a href="#cite_ref-FNA_1-8"><sup><i><b>i</b></i></sup></a> <a href="#cite_ref-FNA_1-9"><sup><i><b>j</b></i></sup></a> <a href="#cite_ref-FNA_1-10"><sup><i><b>k</b></i></sup></a></span> <span class="reference-text"><style data-mw-deduplicate="TemplateStyles:r1238218222">.mw-parser-output cite.citation{font-style:inherit;word-wrap:break-word}.mw-parser-output .citation q{quotes:"\"""\"""'""'"}.mw-parser-output .citation:target{background-color:rgba(0,127,255,0.133)}.mw-parser-output .id-lock-free.id-lock-free a{background:url("//upload.wikimedia.org/wikipedia/commons/6/65/Lock-green.svg")right 0.1em center/9px no-repeat}.mw-parser-output .id-lock-limited.id-lock-limited a,.mw-parser-output .id-lock-registration.id-lock-registration a{background:url("//upload.wikimedia.org/wikipedia/commons/d/d6/Lock-gray-alt-2.svg")right 0.1em center/9px no-repeat}.mw-parser-output .id-lock-subscription.id-lock-subscription a{background:url("//upload.wikimedia.org/wikipedia/commons/a/aa/Lock-red-alt-2.svg")right 0.1em center/9px no-repeat}.mw-parser-output .cs1-ws-icon a{background:url("//upload.wikimedia.org/wikipedia/commons/4/4c/Wikisource-logo.svg")right 0.1em center/12px no-repeat}body:not(.skin-timeless):not(.skin-minerva) .mw-parser-output .id-lock-free a,body:not(.skin-timeless):not(.skin-minerva) .mw-parser-output .id-lock-limited a,body:not(.skin-timeless):not(.skin-minerva) .mw-parser-output 
.id-lock-registration a,body:not(.skin-timeless):not(.skin-minerva) .mw-parser-output .id-lock-subscription a,body:not(.skin-timeless):not(.skin-minerva) .mw-parser-output .cs1-ws-icon a{background-size:contain;padding:0 1em 0 0}.mw-parser-output .cs1-code{color:inherit;background:inherit;border:none;padding:inherit}.mw-parser-output .cs1-hidden-error{display:none;color:var(--color-error,#d33)}.mw-parser-output .cs1-visible-error{color:var(--color-error,#d33)}.mw-parser-output .cs1-maint{display:none;color:#085;margin-left:0.3em}.mw-parser-output .cs1-kern-left{padding-left:0.2em}.mw-parser-output .cs1-kern-right{padding-right:0.2em}.mw-parser-output .citation .mw-selflink{font-weight:inherit}@media screen{.mw-parser-output .cs1-format{font-size:95%}html.skin-theme-clientpref-night .mw-parser-output .cs1-maint{color:#18911f}}@media screen and (prefers-color-scheme:dark){html.skin-theme-clientpref-os .mw-parser-output .cs1-maint{color:#18911f}}</style><cite id="CITEREFDickson2021" class="citation web cs1">Dickson, Elizabeth E. (28 May 2021). <a rel="nofollow" class="external text" href="http://floranorthamerica.org/Malus_domestica">"<i>Malus domestica</i>"</a>. <i><a href="/wiki/Flora_of_North_America" title="Flora of North America">Flora of North America</a></i>. <a rel="nofollow" class="external text" href="https://web.archive.org/web/20240728060606/http://floranorthamerica.org/Malus_domestica">Archived</a> from the original on 28 July 2024<span class="reference-accessdate">. Retrieved <span class="nowrap">27 July</span> 2024</span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=unknown&amp;rft.jtitle=Flora+of+North+America&amp;rft.atitle=Malus+domestica&amp;rft.date=2021-05-28&amp;rft.aulast=Dickson&amp;rft.aufirst=Elizabeth+E.&amp;rft_id=http%3A%2F%2Ffloranorthamerica.org%2FMalus_domestica&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-POWO-2"><span class="mw-cite-backlink">^ <a href="#cite_ref-POWO_2-0"><span class="cite-accessibility-label">Jump up to: </span><sup><i><b>a</b></i></sup></a> <a href="#cite_ref-POWO_2-1"><sup><i><b>b</b></i></sup></a> <a href="#cite_ref-POWO_2-2"><sup><i><b>c</b></i></sup></a></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite class="citation web cs1"><a rel="nofollow" class="external text" href="https://powo.science.kew.org/taxon/726282-1">"<i>Malus domestica</i> (Suckow) Borkh"</a>. <i><a href="/wiki/Plants_of_the_World_Online" title="Plants of the World Online">Plants of the World Online</a></i>. <a href="/wiki/Royal_Botanic_Gardens,_Kew" title="Royal Botanic Gardens, Kew">Royal Botanic Gardens, Kew</a><span class="reference-accessdate">. Retrieved <span class="nowrap">31 July</span> 2024</span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=unknown&amp;rft.jtitle=Plants+of+the+World+Online&amp;rft.atitle=Malus+domestica+%28Suckow%29+Borkh.&amp;rft_id=https%3A%2F%2Fpowo.science.kew.org%2Ftaxon%2F726282-1&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-Lisa_Lim-3"><span class="mw-cite-backlink">^ <a href="#cite_ref-Lisa_Lim_3-0"><span class="cite-accessibility-label">Jump up to: </span><sup><i><b>a</b></i></sup></a> <a href="#cite_ref-Lisa_Lim_3-1"><sup><i><b>b</b></i></sup></a></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFLim2021" class="citation news cs1">Lim, Lisa (6 July 2021). <a rel="nofollow" class="external text" href="https://www.scmp.com/magazines/post-magazine/article/3139890/where-word-apple-came-and-why-forbidden-fruit-was-unlucky">"Where the word 'apple' came from and why the forbidden fruit was unlucky to be linked with the fall of man"</a>. Language Matters. <i><a href="/wiki/South_China_Morning_Post" title="South China Morning Post">South China Morning Post</a></i>. Hong Kong, China: <a href="/wiki/Alibaba_Group" title="Alibaba Group">Alibaba Group</a>. <a rel="nofollow" class="external text" href="https://web.archive.org/web/20230628112156/https://www.scmp.com/magazines/post-magazine/article/3139890/where-word-apple-came-and-why-forbidden-fruit-was-unlucky">Archived</a> from the original on 28 June 2023<span class="reference-accessdate">. Retrieved <span class="nowrap">28 June</span> 2023</span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=article&amp;rft.jtitle=South+China+Morning+Post&amp;rft.atitle=Where+the+word+%27apple%27+came+from+and+why+the+forbidden+fruit+was+unlucky+to+be+linked+with+the+fall+of+man&amp;rft.date=2021-07-06&amp;rft.aulast=Lim&amp;rft.aufirst=Lisa&amp;rft_id=https%3A%2F%2Fwww.scmp.com%2Fmagazines%2Fpost-magazine%2Farticle%2F3139890%2Fwhere-word-apple-came-and-why-forbidden-fruit-was-unlucky&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-4"><span class="mw-cite-backlink"><b><a href="#cite_ref-4" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite class="citation web cs1"><a rel="nofollow" class="external text" href="https://www.etymonline.com/word/apple">"Origin and meaning of "apple" by Online Etymology Dictionary"</a>. <i><a href="/wiki/Online_Etymology_Dictionary" title="Online Etymology Dictionary">Online Etymology Dictionary</a></i>. <a rel="nofollow" class="external text" href="https://web.archive.org/web/20191221020212/https://www.etymonline.com/word/apple">Archived</a> from the original on 21 December 2019<span class="reference-accessdate">. Retrieved <span class="nowrap">22 November</span> 2019</span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=unknown&amp;rft.jtitle=Online+Etymology+Dictionary&amp;rft.atitle=Origin+and+meaning+of+%22apple%22+by+Online+Etymology+Dictionary&amp;rft_id=https%3A%2F%2Fwww.etymonline.com%2Fword%2Fapple&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-UofGeorgia-5"><span class="mw-cite-backlink">^ <a href="#cite_ref-UofGeorgia_5-0"><span class="cite-accessibility-label">Jump up to: </span><sup><i><b>a</b></i></sup></a> <a href="#cite_ref-UofGeorgia_5-1"><sup><i><b>b</b></i></sup></a> <a href="#cite_ref-UofGeorgia_5-2"><sup><i><b>c</b></i></sup></a> <a href="#cite_ref-UofGeorgia_5-3"><sup><i><b>d</b></i></sup></a> <a href="#cite_ref-UofGeorgia_5-4"><sup><i><b>e</b></i></sup></a> <a href="#cite_ref-UofGeorgia_5-5"><sup><i><b>f</b></i></sup></a> <a href="#cite_ref-UofGeorgia_5-6"><sup><i><b>g</b></i></sup></a></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFRieger" class="citation web cs1">Rieger, Mark. <a rel="nofollow" class="external text" href="https://web.archive.org/web/20080121045236/http://www.uga.edu/fruit/apple.html">"Apple - <i>Malus domestica</i>"</a>. <i>HORT 3020: Intro Fruit Crops</i>. <a href="/wiki/University_of_Georgia" title="University of Georgia">University of Georgia</a>. Archived from <a rel="nofollow" class="external text" href="http://www.uga.edu/fruit/apple.html">the original</a> on 21 January 2008<span class="reference-accessdate">. Retrieved <span class="nowrap">22 January</span> 2008</span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=unknown&amp;rft.jtitle=HORT+3020%3A+Intro+Fruit+Crops&amp;rft.atitle=Apple+-+Malus+domestica&amp;rft.aulast=Rieger&amp;rft.aufirst=Mark&amp;rft_id=http%3A%2F%2Fwww.uga.edu%2Ffruit%2Fapple.html&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-NC_Extension-6"><span class="mw-cite-backlink">^ <a href="#cite_ref-NC_Extension_6-0"><span class="cite-accessibility-label">Jump up to: </span><sup><i><b>a</b></i></sup></a> <a href="#cite_ref-NC_Extension_6-1"><sup><i><b>b</b></i></sup></a> <a href="#cite_ref-NC_Extension_6-2"><sup><i><b>c</b></i></sup></a></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite class="citation web cs1"><a rel="nofollow" class="external text" href="https://plants.ces.ncsu.edu/plants/malus-domestica/common-name/apples/">"Apples - <i>Malus domestica</i>"</a>. <i>North Carolina Extension Gardener Plant Toolbox</i>. <a href="/wiki/North_Carolina_State_University" title="North Carolina State University">North Carolina State University</a>. <a rel="nofollow" class="external text" href="https://web.archive.org/web/20240531122432/https://plants.ces.ncsu.edu/plants/malus-domestica/common-name/apples/">Archived</a> from the original on 31 May 2024<span class="reference-accessdate">. Retrieved <span class="nowrap">31 July</span> 2024</span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=unknown&amp;rft.jtitle=North+Carolina+Extension+Gardener+Plant+Toolbox&amp;rft.atitle=Apples+-+Malus+domestica&amp;rft_id=https%3A%2F%2Fplants.ces.ncsu.edu%2Fplants%2Fmalus-domestica%2Fcommon-name%2Fapples%2F&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-Heil_et_al.-7"><span class="mw-cite-backlink">^ <a href="#cite_ref-Heil_et_al._7-0"><span class="cite-accessibility-label">Jump up to: </span><sup><i><b>a</b></i></sup></a> <a href="#cite_ref-Heil_et_al._7-1"><sup><i><b>b</b></i></sup></a> <a href="#cite_ref-Heil_et_al._7-2"><sup><i><b>c</b></i></sup></a> <a href="#cite_ref-Heil_et_al._7-3"><sup><i><b>d</b></i></sup></a></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFHeilO'Kane,_Jr.ReevesClifford2013" class="citation book cs1">Heil, Kenneth D.; O'Kane, Jr., Steve L.; Reeves, Linda Mary; Clifford, Arnold (2013). <a rel="nofollow" class="external text" href="https://archive.org/details/mobot31753003888887/page/n926"><i>Flora of the Four Corners Region: Vascular Plants of the San Juan River Drainage, Arizona, Colorado, New Mexico, and Utah</i></a> (First&nbsp;ed.). St. Louis, Missouri: <a href="/wiki/Missouri_Botanical_Garden" title="Missouri Botanical Garden">Missouri Botanical Garden</a>. p.&nbsp;909. <a href="/wiki/ISBN_(identifier)" class="mw-redirect" title="ISBN (identifier)">ISBN</a>&nbsp;<a href="/wiki/Special:BookSources/978-1-930723-84-9" title="Special:BookSources/978-1-930723-84-9"><bdi>978-1-930723-84-9</bdi></a>. <a href="/wiki/ISSN_(identifier)" class="mw-redirect" title="ISSN (identifier)">ISSN</a>&nbsp;<a rel="nofollow" class="external text" href="https://search.worldcat.org/issn/0161-1542">0161-1542</a>. <a href="/wiki/LCCN_(identifier)" class="mw-redirect" title="LCCN (identifier)">LCCN</a>&nbsp;<a rel="nofollow" class="external text" href="https://lccn.loc.gov/2012949654">2012949654</a>. <a href="/wiki/OCLC_(identifier)" class="mw-redirect" title="OCLC (identifier)">OCLC</a>&nbsp;<a rel="nofollow" class="external text" href="https://search.worldcat.org/oclc/859541992">859541992</a><span class="reference-accessdate">. 
Retrieved <span class="nowrap">27 July</span> 2024</span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=book&amp;rft.btitle=Flora+of+the+Four+Corners+Region%3A+Vascular+Plants+of+the+San+Juan+River+Drainage%2C+Arizona%2C+Colorado%2C+New+Mexico%2C+and+Utah&amp;rft.place=St.+Louis%2C+Missouri&amp;rft.pages=909&amp;rft.edition=First&amp;rft.pub=Missouri+Botanical+Garden&amp;rft.date=2013&amp;rft_id=info%3Aoclcnum%2F859541992&amp;rft.issn=0161-1542&amp;rft_id=info%3Alccn%2F2012949654&amp;rft.isbn=978-1-930723-84-9&amp;rft.aulast=Heil&amp;rft.aufirst=Kenneth+D.&amp;rft.au=O%27Kane%2C+Jr.%2C+Steve+L.&amp;rft.au=Reeves%2C+Linda+Mary&amp;rft.au=Clifford%2C+Arnold&amp;rft_id=https%3A%2F%2Farchive.org%2Fdetails%2Fmobot31753003888887%2Fpage%2Fn926&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-Lim_2012-8"><span class="mw-cite-backlink">^ <a href="#cite_ref-Lim_2012_8-0"><span class="cite-accessibility-label">Jump up to: </span><sup><i><b>a</b></i></sup></a> <a href="#cite_ref-Lim_2012_8-1"><sup><i><b>b</b></i></sup></a> <a href="#cite_ref-Lim_2012_8-2"><sup><i><b>c</b></i></sup></a> <a href="#cite_ref-Lim_2012_8-3"><sup><i><b>d</b></i></sup></a> <a href="#cite_ref-Lim_2012_8-4"><sup><i><b>e</b></i></sup></a></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFLim2012" class="citation book cs1 cs1-prop-long-vol">Lim, Tong Kwee (2012). "<i>Malus</i> x <i>domestica</i>". <i>Edible Medicinal and Non-Medicinal Plants</i>. Vol.&nbsp;4, Fruit (First&nbsp;ed.). Dordrecht, the Netherlands: <a href="/wiki/Springer_Publishing" title="Springer Publishing">Springer</a>. pp.&nbsp;414–415. <a href="/wiki/Doi_(identifier)" class="mw-redirect" title="Doi (identifier)">doi</a>:<a rel="nofollow" class="external text" href="https://doi.org/10.1007%2F978-94-007-4053-2_49">10.1007/978-94-007-4053-2_49</a>. <a href="/wiki/ISBN_(identifier)" class="mw-redirect" title="ISBN (identifier)">ISBN</a>&nbsp;<a href="/wiki/Special:BookSources/978-94-007-4053-2" title="Special:BookSources/978-94-007-4053-2"><bdi>978-94-007-4053-2</bdi></a>. 
<a href="/wiki/OCLC_(identifier)" class="mw-redirect" title="OCLC (identifier)">OCLC</a>&nbsp;<a rel="nofollow" class="external text" href="https://search.worldcat.org/oclc/795503871">795503871</a>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=bookitem&amp;rft.atitle=Malus+x+domestica&amp;rft.btitle=Edible+Medicinal+and+Non-Medicinal+Plants&amp;rft.place=Dordrecht%2C+the+Netherlands&amp;rft.pages=414-415&amp;rft.edition=First&amp;rft.pub=Springer&amp;rft.date=2012&amp;rft_id=info%3Aoclcnum%2F795503871&amp;rft_id=info%3Adoi%2F10.1007%2F978-94-007-4053-2_49&amp;rft.isbn=978-94-007-4053-2&amp;rft.aulast=Lim&amp;rft.aufirst=Tong+Kwee&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-9"><span class="mw-cite-backlink"><b><a href="#cite_ref-9" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFJuniperMabberley2006" class="citation book cs1"><a href="/wiki/Barrie_Juniper" title="Barrie Juniper">Juniper, Barrie E.</a>; <a href="/wiki/David_Mabberley" title="David Mabberley">Mabberley, David J.</a> (2006). <span class="id-lock-registration" title="Free registration required"><a rel="nofollow" class="external text" href="https://archive.org/details/storyofapple0000juni"><i>The Story of the Apple</i></a></span> (First&nbsp;ed.). Portland, Oregon: <a href="/wiki/Timber_Press" class="mw-redirect" title="Timber Press">Timber Press</a>. p.&nbsp;27. <a href="/wiki/ISBN_(identifier)" class="mw-redirect" title="ISBN (identifier)">ISBN</a>&nbsp;<a href="/wiki/Special:BookSources/978-0-88192-784-9" title="Special:BookSources/978-0-88192-784-9"><bdi>978-0-88192-784-9</bdi></a>. <a href="/wiki/LCCN_(identifier)" class="mw-redirect" title="LCCN (identifier)">LCCN</a>&nbsp;<a rel="nofollow" class="external text" href="https://lccn.loc.gov/2006011869">2006011869</a>. <a href="/wiki/OCLC_(identifier)" class="mw-redirect" title="OCLC (identifier)">OCLC</a>&nbsp;<a rel="nofollow" class="external text" href="https://search.worldcat.org/oclc/67383484">67383484</a><span class="reference-accessdate">. 
Retrieved <span class="nowrap">1 August</span> 2024</span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=book&amp;rft.btitle=The+Story+of+the+Apple&amp;rft.place=Portland%2C+Oregon&amp;rft.pages=27&amp;rft.edition=First&amp;rft.pub=Timber+Press&amp;rft.date=2006&amp;rft_id=info%3Aoclcnum%2F67383484&amp;rft_id=info%3Alccn%2F2006011869&amp;rft.isbn=978-0-88192-784-9&amp;rft.aulast=Juniper&amp;rft.aufirst=Barrie+E.&amp;rft.au=Mabberley%2C+David+J.&amp;rft_id=https%3A%2F%2Farchive.org%2Fdetails%2Fstoryofapple0000juni&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-10"><span class="mw-cite-backlink"><b><a href="#cite_ref-10" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite class="citation web cs1"><a rel="nofollow" class="external text" href="https://schoolgardening.rhs.org.uk/Resources/Info-Sheet/Fruit-Glossary">"Fruit glossary"</a>. Royal Horticultural Society. <a rel="nofollow" class="external text" href="https://web.archive.org/web/20240807071550/https://schoolgardening.rhs.org.uk/Resources/Info-Sheet/Fruit-Glossary">Archived</a> from the original on 7 August 2024<span class="reference-accessdate">. Retrieved <span class="nowrap">7 August</span> 2024</span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=unknown&amp;rft.btitle=Fruit+glossary&amp;rft.pub=Royal+Horticultural+Society&amp;rft_id=https%3A%2F%2Fschoolgardening.rhs.org.uk%2FResources%2FInfo-Sheet%2FFruit-Glossary&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-11"><span class="mw-cite-backlink"><b><a href="#cite_ref-11" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFBurford2013" class="citation book cs1"><a href="/wiki/Tom_Burford" title="Tom Burford">Burford, Tom</a> (2013). <span class="id-lock-limited" title="Free access subject to limited trial, subscription normally required"><a rel="nofollow" class="external text" href="https://archive.org/details/applesofnorthame0000burf"><i>Apples of North America&nbsp;: 192 Exceptional Varieties for Gardeners, Growers and Cooks</i></a></span> (First&nbsp;ed.). Portland, Oregon: <a href="/wiki/Timber_Press" class="mw-redirect" title="Timber Press">Timber Press</a>. pp.&nbsp;22, 50, 55, 122, 123, 137, 141, 147, 159, 245, 246. <a href="/wiki/ISBN_(identifier)" class="mw-redirect" title="ISBN (identifier)">ISBN</a>&nbsp;<a href="/wiki/Special:BookSources/978-1-60469-249-5" title="Special:BookSources/978-1-60469-249-5"><bdi>978-1-60469-249-5</bdi></a>. <a href="/wiki/LCCN_(identifier)" class="mw-redirect" title="LCCN (identifier)">LCCN</a>&nbsp;<a rel="nofollow" class="external text" href="https://lccn.loc.gov/2012045130">2012045130</a>. 
<a href="/wiki/OCLC_(identifier)" class="mw-redirect" title="OCLC (identifier)">OCLC</a>&nbsp;<a rel="nofollow" class="external text" href="https://search.worldcat.org/oclc/819860825">819860825</a>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=book&amp;rft.btitle=Apples+of+North+America+%3A+192+Exceptional+Varieties+for+Gardeners%2C+Growers+and+Cooks&amp;rft.place=Portland%2C+Oregon&amp;rft.pages=22%2C+50%2C+55%2C+122%2C+123%2C+137%2C+141%2C+147%2C+159%2C+245%2C+246&amp;rft.edition=First&amp;rft.pub=Timber+Press&amp;rft.date=2013&amp;rft_id=info%3Aoclcnum%2F819860825&amp;rft_id=info%3Alccn%2F2012045130&amp;rft.isbn=978-1-60469-249-5&amp;rft.aulast=Burford&amp;rft.aufirst=Tom&amp;rft_id=https%3A%2F%2Farchive.org%2Fdetails%2Fapplesofnorthame0000burf&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-12"><span class="mw-cite-backlink"><b><a href="#cite_ref-12" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite class="citation web cs1"><a rel="nofollow" class="external text" href="https://agresearch.montana.edu/warc/guides/apples/heritage_orchard_management_guide/heritage-fruit-id-guide/apple_id_characteristics/appleid_shape.html">"Shape"</a>. <i>Western Agricultural Research Center</i>. <a href="/wiki/Montana_State_University" title="Montana State University">Montana State University</a>. <a rel="nofollow" class="external text" href="https://web.archive.org/web/20240423183929/https://agresearch.montana.edu/warc/guides/apples/heritage_orchard_management_guide/heritage-fruit-id-guide/apple_id_characteristics/appleid_shape.html">Archived</a> from the original on 23 April 2024<span class="reference-accessdate">. Retrieved <span class="nowrap">30 July</span> 2024</span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=unknown&amp;rft.jtitle=Western+Agricultural+Research+Center&amp;rft.atitle=Shape&amp;rft_id=https%3A%2F%2Fagresearch.montana.edu%2Fwarc%2Fguides%2Fapples%2Fheritage_orchard_management_guide%2Fheritage-fruit-id-guide%2Fapple_id_characteristics%2Fappleid_shape.html&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-Janick-13"><span class="mw-cite-backlink">^ <a href="#cite_ref-Janick_13-0"><span class="cite-accessibility-label">Jump up to: </span><sup><i><b>a</b></i></sup></a> <a href="#cite_ref-Janick_13-1"><sup><i><b>b</b></i></sup></a></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFJanickCumminsBrownHemmat1996" class="citation book cs1 cs1-prop-long-vol">Janick, Jules; Cummins, James N.; Brown, Susan K.; Hemmat, Minou (1996). <a rel="nofollow" class="external text" href="http://www.hort.purdue.edu/newcrop/pri/chapter.pdf">"Chapter 1: Apples"</a> <span class="cs1-format">(PDF)</span>. <i>Fruit Breeding</i>. Vol.&nbsp;I: Tree and Tropical Fruits. New York: <a href="/wiki/John_Wiley_%26_Sons" class="mw-redirect" title="John Wiley &amp; Sons">John Wiley &amp; Sons</a>. pp.&nbsp;9, 48. <a href="/wiki/ISBN_(identifier)" class="mw-redirect" title="ISBN (identifier)">ISBN</a>&nbsp;<a href="/wiki/Special:BookSources/978-0-471-31014-3" title="Special:BookSources/978-0-471-31014-3"><bdi>978-0-471-31014-3</bdi></a>. <a href="/wiki/LCCN_(identifier)" class="mw-redirect" title="LCCN (identifier)">LCCN</a>&nbsp;<a rel="nofollow" class="external text" href="https://lccn.loc.gov/95016407">95016407</a>. <a href="/wiki/OCLC_(identifier)" class="mw-redirect" title="OCLC (identifier)">OCLC</a>&nbsp;<a rel="nofollow" class="external text" href="https://search.worldcat.org/oclc/1302621533">1302621533</a>. <a rel="nofollow" class="external text" href="https://web.archive.org/web/20130719085631/http://www.hort.purdue.edu/newcrop/pri/chapter.pdf">Archived</a> <span class="cs1-format">(PDF)</span> from the original on 19 July 2013<span class="reference-accessdate">. 
Retrieved <span class="nowrap">30 August</span> 2024</span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=bookitem&amp;rft.atitle=Chapter+1%3A+Apples&amp;rft.btitle=Fruit+Breeding&amp;rft.place=New+York&amp;rft.pages=9%2C+48&amp;rft.pub=John+Wiley+%26+Sons&amp;rft.date=1996&amp;rft_id=info%3Aoclcnum%2F1302621533&amp;rft_id=info%3Alccn%2F95016407&amp;rft.isbn=978-0-471-31014-3&amp;rft.aulast=Janick&amp;rft.aufirst=Jules&amp;rft.au=Cummins%2C+James+N.&amp;rft.au=Brown%2C+Susan+K.&amp;rft.au=Hemmat%2C+Minou&amp;rft_id=http%3A%2F%2Fwww.hort.purdue.edu%2Fnewcrop%2Fpri%2Fchapter.pdf&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-14"><span class="mw-cite-backlink"><b><a href="#cite_ref-14" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite class="citation web cs1"><a rel="nofollow" class="external text" href="https://web.archive.org/web/20130524130738/http://postharvest.tfrec.wsu.edu/pages/N2I2A">"Natural Waxes on Fruits"</a>. Postharvest.tfrec.wsu.edu. 29 October 2010. Archived from <a rel="nofollow" class="external text" href="http://postharvest.tfrec.wsu.edu/pages/N2I2A">the original</a> on 24 May 2013<span class="reference-accessdate">. Retrieved <span class="nowrap">14 June</span> 2013</span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=unknown&amp;rft.btitle=Natural+Waxes+on+Fruits&amp;rft.pub=Postharvest.tfrec.wsu.edu&amp;rft.date=2010-10-29&amp;rft_id=http%3A%2F%2Fpostharvest.tfrec.wsu.edu%2Fpages%2FN2I2A&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-15"><span class="mw-cite-backlink"><b><a href="#cite_ref-15" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFFlathBlackForreyMcDonald1969" class="citation journal cs1">Flath, R. A.; Black, D. R.; Forrey, R. R.; McDonald, G. M.; Mon, T. R.; Teranishi, R. (1 August 1969). "Volatiles in Gravenstein Apple Essence Identified by GC-Mass Spectrometry". <i>Journal of Chromatographic Science</i>. <b>7</b> (8): 508. <a href="/wiki/Doi_(identifier)" class="mw-redirect" title="Doi (identifier)">doi</a>:<a rel="nofollow" class="external text" href="https://doi.org/10.1093%2FCHROMSCI%2F7.8.508">10.1093/CHROMSCI/7.8.508</a>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=article&amp;rft.jtitle=Journal+of+Chromatographic+Science&amp;rft.atitle=Volatiles+in+Gravenstein+Apple+Essence+Identified+by+GC-Mass+Spectrometry&amp;rft.volume=7&amp;rft.issue=8&amp;rft.pages=508&amp;rft.date=1969-08-01&amp;rft_id=info%3Adoi%2F10.1093%2FCHROMSCI%2F7.8.508&amp;rft.aulast=Flath&amp;rft.aufirst=R.+A.&amp;rft.au=Black%2C+D.+R.&amp;rft.au=Forrey%2C+R.+R.&amp;rft.au=McDonald%2C+G.+M.&amp;rft.au=Mon%2C+T.+R.&amp;rft.au=Teranishi%2C+R.&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-16"><span class="mw-cite-backlink"><b><a href="#cite_ref-16" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFFlathBlackGuadagniMcFadden1967" class="citation journal cs1">Flath, Robert A.; Black, Dale Robert.; Guadagni, Dante G.; McFadden, William H.; Schultz, Thomas H. (January 1967). "Identification and organoleptic evaluation of compounds in Delicious apple essence". <i><a href="/wiki/Journal_of_Agricultural_and_Food_Chemistry" title="Journal of Agricultural and Food Chemistry">Journal of Agricultural and Food Chemistry</a></i>. <b>15</b> (1): 29. <a href="/wiki/Doi_(identifier)" class="mw-redirect" title="Doi (identifier)">doi</a>:<a rel="nofollow" class="external text" href="https://doi.org/10.1021%2Fjf60149a032">10.1021/jf60149a032</a>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=article&amp;rft.jtitle=Journal+of+Agricultural+and+Food+Chemistry&amp;rft.atitle=Identification+and+organoleptic+evaluation+of+compounds+in+Delicious+apple+essence&amp;rft.volume=15&amp;rft.issue=1&amp;rft.pages=29&amp;rft.date=1967-01&amp;rft_id=info%3Adoi%2F10.1021%2Fjf60149a032&amp;rft.aulast=Flath&amp;rft.aufirst=Robert+A.&amp;rft.au=Black%2C+Dale+Robert.&amp;rft.au=Guadagni%2C+Dante+G.&amp;rft.au=McFadden%2C+William+H.&amp;rft.au=Schultz%2C+Thomas+H.&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-Proposal_to_conserve-17"><span class="mw-cite-backlink">^ <a href="#cite_ref-Proposal_to_conserve_17-0"><span class="cite-accessibility-label">Jump up to: </span><sup><i><b>a</b></i></sup></a> <a href="#cite_ref-Proposal_to_conserve_17-1"><sup><i><b>b</b></i></sup></a></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFQianLiuTang2010" class="citation journal cs1">Qian, Guan-Ze; Liu, Lian-Fen; Tang, Geng-Guo (April 2010). "(1933) Proposal to conserve the name <i>Malus domestica</i> against <i>M.&nbsp;pumila</i>, <i>M.&nbsp;communis</i>, <i>M.&nbsp;frutescens</i>, and <i>Pyrus dioica</i> ( Rosaceae )". <i><a href="/wiki/Taxon_(journal)" title="Taxon (journal)">Taxon</a></i>. <b>59</b> (2): 650–652. <a href="/wiki/Doi_(identifier)" class="mw-redirect" title="Doi (identifier)">doi</a>:<a rel="nofollow" class="external text" href="https://doi.org/10.1002%2Ftax.592038">10.1002/tax.592038</a>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=article&amp;rft.jtitle=Taxon&amp;rft.atitle=%281933%29+Proposal+to+conserve+the+name+Malus+domestica+against+M.+pumila%2C+M.+communis%2C+M.+frutescens%2C+and+Pyrus+dioica+%28+Rosaceae+%29&amp;rft.volume=59&amp;rft.issue=2&amp;rft.pages=650-652&amp;rft.date=2010-04&amp;rft_id=info%3Adoi%2F10.1002%2Ftax.592038&amp;rft.aulast=Qian&amp;rft.aufirst=Guan-Ze&amp;rft.au=Liu%2C+Lian-Fen&amp;rft.au=Tang%2C+Geng-Guo&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-18"><span class="mw-cite-backlink"><b><a href="#cite_ref-18" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFApplequist2017" class="citation journal cs1">Applequist, Wendy L. (2017). <a rel="nofollow" class="external text" href="https://apirs.plants.ifas.ufl.edu/site/assets/files/375067/375067.pdf">"Report of the Nomenclature Committee for Vascular Plants: 69"</a> <span class="cs1-format">(PDF)</span>. <i><a href="/wiki/Taxon_(journal)" title="Taxon (journal)">Taxon</a></i>. <b>66</b> (2): 500–513. <a href="/wiki/Doi_(identifier)" class="mw-redirect" title="Doi (identifier)">doi</a>:<a rel="nofollow" class="external text" href="https://doi.org/10.12705%2F662.17">10.12705/662.17</a>. <a rel="nofollow" class="external text" href="https://web.archive.org/web/20240507042204/https://apirs.plants.ifas.ufl.edu/site/assets/files/375067/375067.pdf">Archived</a> <span class="cs1-format">(PDF)</span> from the original on 7 May 2024.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=article&amp;rft.jtitle=Taxon&amp;rft.atitle=Report+of+the+Nomenclature+Committee+for+Vascular+Plants%3A+69&amp;rft.volume=66&amp;rft.issue=2&amp;rft.pages=500-513&amp;rft.date=2017&amp;rft_id=info%3Adoi%2F10.12705%2F662.17&amp;rft.aulast=Applequist&amp;rft.aufirst=Wendy+L.&amp;rft_id=https%3A%2F%2Fapirs.plants.ifas.ufl.edu%2Fsite%2Fassets%2Ffiles%2F375067%2F375067.pdf&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-19"><span class="mw-cite-backlink"><b><a href="#cite_ref-19" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFWilson2017" class="citation journal cs1">Wilson, Karen L. (June 2017). <a rel="nofollow" class="external text" href="https://doi.org/10.12705%2F663.15">"Report of the General Committee: 18"</a>. <i>Taxon</i>. <b>66</b> (3): 742. <a href="/wiki/Doi_(identifier)" class="mw-redirect" title="Doi (identifier)">doi</a>:<span class="id-lock-free" title="Freely accessible"><a rel="nofollow" class="external text" href="https://doi.org/10.12705%2F663.15">10.12705/663.15</a></span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=article&amp;rft.jtitle=Taxon&amp;rft.atitle=Report+of+the+General+Committee%3A+18&amp;rft.volume=66&amp;rft.issue=3&amp;rft.pages=742&amp;rft.date=2017-06&amp;rft_id=info%3Adoi%2F10.12705%2F663.15&amp;rft.aulast=Wilson&amp;rft.aufirst=Karen+L.&amp;rft_id=https%3A%2F%2Fdoi.org%2F10.12705%252F663.15&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-Velasco_et_al.-20"><span class="mw-cite-backlink">^ <a href="#cite_ref-Velasco_et_al._20-0"><span class="cite-accessibility-label">Jump up to: </span><sup><i><b>a</b></i></sup></a> <a href="#cite_ref-Velasco_et_al._20-1"><sup><i><b>b</b></i></sup></a></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFVelascoZharkikhAffourtitDhingra2010" class="citation journal cs1">Velasco, Riccardo; Zharkikh, Andrey; Affourtit, Jason; Dhingra, Amit; Cestaro, Alessandro; et&nbsp;al. (2010). <a rel="nofollow" class="external text" href="https://doi.org/10.1038%2Fng.654">"The genome of the domesticated apple (<i>Malus</i> × <i>domestica</i> Borkh.)"</a>. <i>Nature Genetics</i>. <b>42</b> (10): 833–839. <a href="/wiki/Doi_(identifier)" class="mw-redirect" title="Doi (identifier)">doi</a>:<span class="id-lock-free" title="Freely accessible"><a rel="nofollow" class="external text" href="https://doi.org/10.1038%2Fng.654">10.1038/ng.654</a></span>. <a href="/wiki/PMID_(identifier)" class="mw-redirect" title="PMID (identifier)">PMID</a>&nbsp;<a rel="nofollow" class="external text" href="https://pubmed.ncbi.nlm.nih.gov/20802477">20802477</a>. 
<a href="/wiki/S2CID_(identifier)" class="mw-redirect" title="S2CID (identifier)">S2CID</a>&nbsp;<a rel="nofollow" class="external text" href="https://api.semanticscholar.org/CorpusID:14854514">14854514</a>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=article&amp;rft.jtitle=Nature+Genetics&amp;rft.atitle=The+genome+of+the+domesticated+apple+%28Malus+%C3%97+domestica+Borkh.%29&amp;rft.volume=42&amp;rft.issue=10&amp;rft.pages=833-839&amp;rft.date=2010&amp;rft_id=https%3A%2F%2Fapi.semanticscholar.org%2FCorpusID%3A14854514%23id-name%3DS2CID&amp;rft_id=info%3Apmid%2F20802477&amp;rft_id=info%3Adoi%2F10.1038%2Fng.654&amp;rft.aulast=Velasco&amp;rft.aufirst=Riccardo&amp;rft.au=Zharkikh%2C+Andrey&amp;rft.au=Affourtit%2C+Jason&amp;rft.au=Dhingra%2C+Amit&amp;rft.au=Cestaro%2C+Alessandro&amp;rft.au=Kalyanaraman%2C+Ananth&amp;rft.au=Fontana%2C+Paolo&amp;rft.au=Bhatnagar%2C+Satish+K.&amp;rft.au=Troggio%2C+Michela&amp;rft.au=Pruss%2C+Dmitry&amp;rft.au=Salvi%2C+Silvio&amp;rft.au=Pindo%2C+Massimo&amp;rft.au=Baldi%2C+Paolo&amp;rft.au=Castelletti%2C+Sara&amp;rft.au=Cavaiuolo%2C+Marina&amp;rft.au=Coppola%2C+Giuseppina&amp;rft.au=Costa%2C+Fabrizio&amp;rft.au=Cova%2C+Valentina&amp;rft.au=Dal+Ri%2C+Antonio&amp;rft.au=Goremykin%2C+Vadim&amp;rft.au=Komjanc%2C+Matteo&amp;rft.au=Longhi%2C+Sara&amp;rft.au=Magnago%2C+Pierluigi&amp;rft.au=Malacarne%2C+Giulia&amp;rft.au=Malnoy%2C+Mickael&amp;rft.au=Micheletti%2C+Diego&amp;rft.au=Moretto%2C+Marco&amp;rft.au=Perazzolli%2C+Michele&amp;rft.au=Si-Ammour%2C+Azeddine&amp;rft.au=Vezzulli%2C+Silvia&amp;rft_id=https%3A%2F%2Fdoi.org%2F10.1038%252Fng.654&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-21"><span class="mw-cite-backlink"><b><a href="#cite_ref-21" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFDi_PierroGianfranceschiDi_GuardoKoehorst-Van_Putten2016" class="citation journal cs1">Di Pierro, Erica A.; Gianfranceschi, Luca; Di Guardo, Mario; Koehorst-Van Putten, Herma J.J.; Kruisselbrink, Johannes W.; et&nbsp;al. (2016). <a rel="nofollow" class="external text" href="https://www.ncbi.nlm.nih.gov/pmc/articles/PMC5120355">"A high-density, multi-parental SNP genetic map on apple validates a new mapping approach for outcrossing species"</a>. <i><a href="/wiki/Horticulture_Research" class="mw-redirect" title="Horticulture Research">Horticulture Research</a></i>. <b>3</b> (1): 16057. <a href="/wiki/Bibcode_(identifier)" class="mw-redirect" title="Bibcode (identifier)">Bibcode</a>:<a rel="nofollow" class="external text" href="https://ui.adsabs.harvard.edu/abs/2016HorR....316057D">2016HorR....316057D</a>. <a href="/wiki/Doi_(identifier)" class="mw-redirect" title="Doi (identifier)">doi</a>:<a rel="nofollow" class="external text" href="https://doi.org/10.1038%2Fhortres.2016.57">10.1038/hortres.2016.57</a>. <a href="/wiki/PMC_(identifier)" class="mw-redirect" title="PMC (identifier)">PMC</a>&nbsp;<span class="id-lock-free" title="Freely accessible"><a rel="nofollow" class="external text" href="https://www.ncbi.nlm.nih.gov/pmc/articles/PMC5120355">5120355</a></span>. 
<a href="/wiki/PMID_(identifier)" class="mw-redirect" title="PMID (identifier)">PMID</a>&nbsp;<a rel="nofollow" class="external text" href="https://pubmed.ncbi.nlm.nih.gov/27917289">27917289</a>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=article&amp;rft.jtitle=Horticulture+Research&amp;rft.atitle=A+high-density%2C+multi-parental+SNP+genetic+map+on+apple+validates+a+new+mapping+approach+for+outcrossing+species&amp;rft.volume=3&amp;rft.issue=1&amp;rft.pages=16057&amp;rft.date=2016&amp;rft_id=https%3A%2F%2Fwww.ncbi.nlm.nih.gov%2Fpmc%2Farticles%2FPMC5120355%23id-name%3DPMC&amp;rft_id=info%3Apmid%2F27917289&amp;rft_id=info%3Adoi%2F10.1038%2Fhortres.2016.57&amp;rft_id=info%3Abibcode%2F2016HorR....316057D&amp;rft.aulast=Di+Pierro&amp;rft.aufirst=Erica+A.&amp;rft.au=Gianfranceschi%2C+Luca&amp;rft.au=Di+Guardo%2C+Mario&amp;rft.au=Koehorst-Van+Putten%2C+Herma+J.J.&amp;rft.au=Kruisselbrink%2C+Johannes+W.&amp;rft.au=Longhi%2C+Sara&amp;rft.au=Troggio%2C+Michela&amp;rft.au=Bianco%2C+Luca&amp;rft.au=Muranty%2C+H%C3%A9l%C3%A8ne&amp;rft.au=Pagliarani%2C+Giulia&amp;rft.au=Tartarini%2C+Stefano&amp;rft.au=Letschka%2C+Thomas&amp;rft.au=Lozano+Luis%2C+Lidia&amp;rft.au=Garkava-Gustavsson%2C+Larisa&amp;rft.au=Micheletti%2C+Diego&amp;rft.au=Bink%2C+Marco+C.A.M.&amp;rft.au=Voorrips%2C+Roeland+E.&amp;rft.au=Aziz%2C+Ebrahimi&amp;rft.au=Velasco%2C+Riccardo&amp;rft.au=Laurens%2C+Fran%C3%A7ois&amp;rft.au=Van+De+Weg%2C+W.+Eric&amp;rft_id=https%3A%2F%2Fwww.ncbi.nlm.nih.gov%2Fpmc%2Farticles%2FPMC5120355&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-Daccord_et_al.-22"><span class="mw-cite-backlink">^ <a href="#cite_ref-Daccord_et_al._22-0"><span class="cite-accessibility-label">Jump up to: </span><sup><i><b>a</b></i></sup></a> <a href="#cite_ref-Daccord_et_al._22-1"><sup><i><b>b</b></i></sup></a></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFDaccordCeltonLinsmithBecker2017" class="citation journal cs1">Daccord, Nicolas; Celton, Jean-Marc; Linsmith, Gareth; et&nbsp;al. (2017). <a rel="nofollow" class="external text" href="https://doi.org/10.1038%2Fng.3886">"High-quality de novo assembly of the apple genome and methylome dynamics of early fruit development"</a>. <i>Nature Genetics</i>. <b>49</b> (7). Nature Communications: 1099–1106. <a href="/wiki/Doi_(identifier)" class="mw-redirect" title="Doi (identifier)">doi</a>:<span class="id-lock-free" title="Freely accessible"><a rel="nofollow" class="external text" href="https://doi.org/10.1038%2Fng.3886">10.1038/ng.3886</a></span>. <a href="/wiki/Hdl_(identifier)" class="mw-redirect" title="Hdl (identifier)">hdl</a>:<span class="id-lock-free" title="Freely accessible"><a rel="nofollow" class="external text" href="https://hdl.handle.net/10449%2F42064">10449/42064</a></span>. <a href="/wiki/PMID_(identifier)" class="mw-redirect" title="PMID (identifier)">PMID</a>&nbsp;<a rel="nofollow" class="external text" href="https://pubmed.ncbi.nlm.nih.gov/28581499">28581499</a>. 
<a href="/wiki/S2CID_(identifier)" class="mw-redirect" title="S2CID (identifier)">S2CID</a>&nbsp;<a rel="nofollow" class="external text" href="https://api.semanticscholar.org/CorpusID:24690391">24690391</a>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=article&amp;rft.jtitle=Nature+Genetics&amp;rft.atitle=High-quality+de+novo+assembly+of+the+apple+genome+and+methylome+dynamics+of+early+fruit+development&amp;rft.volume=49&amp;rft.issue=7&amp;rft.pages=1099-1106&amp;rft.date=2017&amp;rft_id=info%3Ahdl%2F10449%2F42064&amp;rft_id=https%3A%2F%2Fapi.semanticscholar.org%2FCorpusID%3A24690391%23id-name%3DS2CID&amp;rft_id=info%3Apmid%2F28581499&amp;rft_id=info%3Adoi%2F10.1038%2Fng.3886&amp;rft.aulast=Daccord&amp;rft.aufirst=Nicolas&amp;rft.au=Celton%2C+Jean-Marc&amp;rft.au=Linsmith%2C+Gareth&amp;rft.au=Becker%2C+Claude&amp;rft.au=Choisne%2C+Nathalie&amp;rft.au=Schijlen%2C+Elio&amp;rft.au=Van+De+Geest%2C+Henri&amp;rft.au=Bianco%2C+Luca&amp;rft.au=Micheletti%2C+Diego&amp;rft.au=Velasco%2C+Riccardo&amp;rft.au=Di+Pierro%2C+Erica+Adele&amp;rft.au=Gouzy%2C+J%C3%A9r%C3%B4me&amp;rft.au=Rees%2C+D+Jasper+G.&amp;rft.au=Gu%C3%A9rif%2C+Philippe&amp;rft.au=Muranty%2C+H%C3%A9l%C3%A8ne&amp;rft.au=Durel%2C+Charles-Eric&amp;rft.au=Laurens%2C+Fran%C3%A7ois&amp;rft.au=Lespinasse%2C+Yves&amp;rft.au=Gaillard%2C+Sylvain&amp;rft.au=Aubourg%2C+S%C3%A9bastien&amp;rft.au=Quesneville%2C+Hadi&amp;rft.au=Weigel%2C+Detlef&amp;rft.au=Van+De+Weg%2C+Eric&amp;rft.au=Troggio%2C+Michela&amp;rft.au=Bucher%2C+Etienne&amp;rft_id=https%3A%2F%2Fdoi.org%2F10.1038%252Fng.3886&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-Zhang_et_al.-23"><span class="mw-cite-backlink">^ <a href="#cite_ref-Zhang_et_al._23-0"><span class="cite-accessibility-label">Jump up to: </span><sup><i><b>a</b></i></sup></a> <a href="#cite_ref-Zhang_et_al._23-1"><sup><i><b>b</b></i></sup></a></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFZhangHuHanLi2019" class="citation journal cs1">Zhang, Liyi; Hu, Jiang; Han, Xiaolei; Li, Jingjing; Gao, Yuan; et&nbsp;al. (2019). <a rel="nofollow" class="external text" href="https://www.ncbi.nlm.nih.gov/pmc/articles/PMC6445120">"A high-quality apple genome assembly reveals the association of a retrotransposon and red fruit colour"</a>. <i>Nature Communications</i>. <b>10</b> (1). Nature Genetics: 1494. <a href="/wiki/Bibcode_(identifier)" class="mw-redirect" title="Bibcode (identifier)">Bibcode</a>:<a rel="nofollow" class="external text" href="https://ui.adsabs.harvard.edu/abs/2019NatCo..10.1494Z">2019NatCo..10.1494Z</a>. <a href="/wiki/Doi_(identifier)" class="mw-redirect" title="Doi (identifier)">doi</a>:<a rel="nofollow" class="external text" href="https://doi.org/10.1038%2Fs41467-019-09518-x">10.1038/s41467-019-09518-x</a>. <a href="/wiki/PMC_(identifier)" class="mw-redirect" title="PMC (identifier)">PMC</a>&nbsp;<span class="id-lock-free" title="Freely accessible"><a rel="nofollow" class="external text" href="https://www.ncbi.nlm.nih.gov/pmc/articles/PMC6445120">6445120</a></span>. 
<a href="/wiki/PMID_(identifier)" class="mw-redirect" title="PMID (identifier)">PMID</a>&nbsp;<a rel="nofollow" class="external text" href="https://pubmed.ncbi.nlm.nih.gov/30940818">30940818</a>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=article&amp;rft.jtitle=Nature+Communications&amp;rft.atitle=A+high-quality+apple+genome+assembly+reveals+the+association+of+a+retrotransposon+and+red+fruit+colour&amp;rft.volume=10&amp;rft.issue=1&amp;rft.pages=1494&amp;rft.date=2019&amp;rft_id=https%3A%2F%2Fwww.ncbi.nlm.nih.gov%2Fpmc%2Farticles%2FPMC6445120%23id-name%3DPMC&amp;rft_id=info%3Apmid%2F30940818&amp;rft_id=info%3Adoi%2F10.1038%2Fs41467-019-09518-x&amp;rft_id=info%3Abibcode%2F2019NatCo..10.1494Z&amp;rft.aulast=Zhang&amp;rft.aufirst=Liyi&amp;rft.au=Hu%2C+Jiang&amp;rft.au=Han%2C+Xiaolei&amp;rft.au=Li%2C+Jingjing&amp;rft.au=Gao%2C+Yuan&amp;rft.au=Richards%2C+Christopher+M.&amp;rft.au=Zhang%2C+Caixia&amp;rft.au=Tian%2C+Yi&amp;rft.au=Liu%2C+Guiming&amp;rft.au=Gul%2C+Hera&amp;rft.au=Wang%2C+Dajiang&amp;rft.au=Tian%2C+Yu&amp;rft.au=Yang%2C+Chuanxin&amp;rft.au=Meng%2C+Minghui&amp;rft.au=Yuan%2C+Gaopeng&amp;rft.au=Kang%2C+Guodong&amp;rft.au=Wu%2C+Yonglong&amp;rft.au=Wang%2C+Kun&amp;rft.au=Zhang%2C+Hengtao&amp;rft.au=Wang%2C+Depeng&amp;rft.au=Cong%2C+Peihua&amp;rft_id=https%3A%2F%2Fwww.ncbi.nlm.nih.gov%2Fpmc%2Farticles%2FPMC6445120&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-Duan_2017-24"><span class="mw-cite-backlink">^ <a href="#cite_ref-Duan_2017_24-0"><span class="cite-accessibility-label">Jump up to: </span><sup><i><b>a</b></i></sup></a> <a href="#cite_ref-Duan_2017_24-1"><sup><i><b>b</b></i></sup></a> <a href="#cite_ref-Duan_2017_24-2"><sup><i><b>c</b></i></sup></a> <a href="#cite_ref-Duan_2017_24-3"><sup><i><b>d</b></i></sup></a> <a href="#cite_ref-Duan_2017_24-4"><sup><i><b>e</b></i></sup></a></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFDuanBaiSunWang2017" class="citation journal cs1">Duan, Naibin; Bai, Yang; Sun, Honghe; Wang, Nan; Ma, Yumin; et&nbsp;al. (2017). <a rel="nofollow" class="external text" href="https://www.ncbi.nlm.nih.gov/pmc/articles/PMC5557836">"Genome re-sequencing reveals the history of apple and supports a two-stage model for fruit enlargement"</a>. <i>Nature Communications</i>. <b>8</b> (1): 249. <a href="/wiki/Bibcode_(identifier)" class="mw-redirect" title="Bibcode (identifier)">Bibcode</a>:<a rel="nofollow" class="external text" href="https://ui.adsabs.harvard.edu/abs/2017NatCo...8..249D">2017NatCo...8..249D</a>. <a href="/wiki/Doi_(identifier)" class="mw-redirect" title="Doi (identifier)">doi</a>:<a rel="nofollow" class="external text" href="https://doi.org/10.1038%2Fs41467-017-00336-7">10.1038/s41467-017-00336-7</a>. <a href="/wiki/PMC_(identifier)" class="mw-redirect" title="PMC (identifier)">PMC</a>&nbsp;<span class="id-lock-free" title="Freely accessible"><a rel="nofollow" class="external text" href="https://www.ncbi.nlm.nih.gov/pmc/articles/PMC5557836">5557836</a></span>. 
<a href="/wiki/PMID_(identifier)" class="mw-redirect" title="PMID (identifier)">PMID</a>&nbsp;<a rel="nofollow" class="external text" href="https://pubmed.ncbi.nlm.nih.gov/28811498">28811498</a>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=article&amp;rft.jtitle=Nature+Communications&amp;rft.atitle=Genome+re-sequencing+reveals+the+history+of+apple+and+supports+a+two-stage+model+for+fruit+enlargement&amp;rft.volume=8&amp;rft.issue=1&amp;rft.pages=249&amp;rft.date=2017&amp;rft_id=https%3A%2F%2Fwww.ncbi.nlm.nih.gov%2Fpmc%2Farticles%2FPMC5557836%23id-name%3DPMC&amp;rft_id=info%3Apmid%2F28811498&amp;rft_id=info%3Adoi%2F10.1038%2Fs41467-017-00336-7&amp;rft_id=info%3Abibcode%2F2017NatCo...8..249D&amp;rft.aulast=Duan&amp;rft.aufirst=Naibin&amp;rft.au=Bai%2C+Yang&amp;rft.au=Sun%2C+Honghe&amp;rft.au=Wang%2C+Nan&amp;rft.au=Ma%2C+Yumin&amp;rft.au=Li%2C+Mingjun&amp;rft.au=Wang%2C+Xin&amp;rft.au=Jiao%2C+Chen&amp;rft.au=Legall%2C+Noah&amp;rft.au=Mao%2C+Linyong&amp;rft.au=Wan%2C+Sibao&amp;rft.au=Wang%2C+Kun&amp;rft.au=He%2C+Tianming&amp;rft.au=Feng%2C+Shouqian&amp;rft.au=Zhang%2C+Zongying&amp;rft.au=Mao%2C+Zhiquan&amp;rft.au=Shen%2C+Xiang&amp;rft.au=Chen%2C+Xiaoliu&amp;rft.au=Jiang%2C+Yuanmao&amp;rft.au=Wu%2C+Shujing&amp;rft.au=Yin%2C+Chengmiao&amp;rft.au=Ge%2C+Shunfeng&amp;rft.au=Yang%2C+Long&amp;rft.au=Jiang%2C+Shenghui&amp;rft.au=Xu%2C+Haifeng&amp;rft.au=Liu%2C+Jingxuan&amp;rft.au=Wang%2C+Deyun&amp;rft.au=Qu%2C+Changzhi&amp;rft.au=Wang%2C+Yicheng&amp;rft.au=Zuo%2C+Weifang&amp;rft_id=https%3A%2F%2Fwww.ncbi.nlm.nih.gov%2Fpmc%2Farticles%2FPMC5557836&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-Richards_Volk_2009-25"><span class="mw-cite-backlink"><b><a href="#cite_ref-Richards_Volk_2009_25-0" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFRichardsVolk,_Gayle_M.Reilley,_Ann_A.Henk,_Adam_D.2009" class="citation journal cs1">Richards, Christopher M.; Volk, Gayle M.; Reilley, Ann A.; Henk, Adam D.; Lockwood, Dale R.; et&nbsp;al. (2009). "Genetic diversity and population structure in <i>Malus sieversii</i>, a wild progenitor species of domesticated apple". <i>Tree Genetics &amp; Genomes</i>. <b>5</b> (2): 339–347. <a href="/wiki/Doi_(identifier)" class="mw-redirect" title="Doi (identifier)">doi</a>:<a rel="nofollow" class="external text" href="https://doi.org/10.1007%2Fs11295-008-0190-9">10.1007/s11295-008-0190-9</a>. <a href="/wiki/S2CID_(identifier)" class="mw-redirect" title="S2CID (identifier)">S2CID</a>&nbsp;<a rel="nofollow" class="external text" href="https://api.semanticscholar.org/CorpusID:19847067">19847067</a>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=article&amp;rft.jtitle=Tree+Genetics+%26+Genomes&amp;rft.atitle=Genetic+diversity+and+population+structure+in+Malus+sieversii%2C+a+wild+progenitor+species+of+domesticated+apple&amp;rft.volume=5&amp;rft.issue=2&amp;rft.pages=339-347&amp;rft.date=2009&amp;rft_id=info%3Adoi%2F10.1007%2Fs11295-008-0190-9&amp;rft_id=https%3A%2F%2Fapi.semanticscholar.org%2FCorpusID%3A19847067%23id-name%3DS2CID&amp;rft.aulast=Richards&amp;rft.aufirst=Christopher+M.&amp;rft.au=Volk%2C+Gayle+M.&amp;rft.au=Reilley%2C+Ann+A.&amp;rft.au=Henk%2C+Adam+D.&amp;rft.au=Lockwood%2C+Dale+R.&amp;rft.au=Reeves%2C+Patrick+A.&amp;rft.au=Forsline%2C+Philip+L.&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-26"><span class="mw-cite-backlink"><b><a href="#cite_ref-26" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFLauriMaguyloTrottier2006" class="citation journal cs1">Lauri, Pierre-éric; Maguylo, Karen; Trottier, Catherine (March 2006). <a rel="nofollow" class="external text" href="https://bsapubs.onlinelibrary.wiley.com/doi/full/10.3732/ajb.93.3.357">"Architecture and size relations: an essay on the apple (Malus × domestica, Rosaceae) tree"</a>. <i>American Journal of Botany</i>. <b>93</b> (3): 357–368. <a href="/wiki/Doi_(identifier)" class="mw-redirect" title="Doi (identifier)">doi</a>:<a rel="nofollow" class="external text" href="https://doi.org/10.3732%2Fajb.93.3.357">10.3732/ajb.93.3.357</a>. <a href="/wiki/PMID_(identifier)" class="mw-redirect" title="PMID (identifier)">PMID</a>&nbsp;<a rel="nofollow" class="external text" href="https://pubmed.ncbi.nlm.nih.gov/21646196">21646196</a>. <a rel="nofollow" class="external text" href="https://web.archive.org/web/20190420154707/https://bsapubs.onlinelibrary.wiley.com/doi/full/10.3732/ajb.93.3.357">Archived</a> from the original on 20 April 2019<span class="reference-accessdate">. 
Retrieved <span class="nowrap">27 July</span> 2024</span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=article&amp;rft.jtitle=American+Journal+of+Botany&amp;rft.atitle=Architecture+and+size+relations%3A+an+essay+on+the+apple+%28Malus+%C3%97+domestica%2C+Rosaceae%29+tree&amp;rft.volume=93&amp;rft.issue=3&amp;rft.pages=357-368&amp;rft.date=2006-03&amp;rft_id=info%3Adoi%2F10.3732%2Fajb.93.3.357&amp;rft_id=info%3Apmid%2F21646196&amp;rft.aulast=Lauri&amp;rft.aufirst=Pierre-%C3%A9ric&amp;rft.au=Maguylo%2C+Karen&amp;rft.au=Trottier%2C+Catherine&amp;rft_id=https%3A%2F%2Fbsapubs.onlinelibrary.wiley.com%2Fdoi%2Ffull%2F10.3732%2Fajb.93.3.357&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-Cornille_2012-27"><span class="mw-cite-backlink"><b><a href="#cite_ref-Cornille_2012_27-0" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFCornilleGladieuxSmuldersRoldán-Ruiz2012" class="citation journal cs1">Cornille, Amandine; Gladieux, Pierre; Smulders, Marinus J. M.; Roldán-Ruiz, Isabel; Laurens, François; et&nbsp;al. (2012). Mauricio, Rodney (ed.). <a rel="nofollow" class="external text" href="https://www.ncbi.nlm.nih.gov/pmc/articles/PMC3349737">"New Insight into the History of Domesticated Apple: Secondary Contribution of the European Wild Apple to the Genome of Cultivated Varieties"</a>. <i>PLOS Genetics</i>. <b>8</b> (5): e1002703. <a href="/wiki/Doi_(identifier)" class="mw-redirect" title="Doi (identifier)">doi</a>:<span class="id-lock-free" title="Freely accessible"><a rel="nofollow" class="external text" href="https://doi.org/10.1371%2Fjournal.pgen.1002703">10.1371/journal.pgen.1002703</a></span>. <a href="/wiki/PMC_(identifier)" class="mw-redirect" title="PMC (identifier)">PMC</a>&nbsp;<span class="id-lock-free" title="Freely accessible"><a rel="nofollow" class="external text" href="https://www.ncbi.nlm.nih.gov/pmc/articles/PMC3349737">3349737</a></span>. 
<a href="/wiki/PMID_(identifier)" class="mw-redirect" title="PMID (identifier)">PMID</a>&nbsp;<a rel="nofollow" class="external text" href="https://pubmed.ncbi.nlm.nih.gov/22589740">22589740</a>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=article&amp;rft.jtitle=PLOS+Genetics&amp;rft.atitle=New+Insight+into+the+History+of+Domesticated+Apple%3A+Secondary+Contribution+of+the+European+Wild+Apple+to+the+Genome+of+Cultivated+Varieties&amp;rft.volume=8&amp;rft.issue=5&amp;rft.pages=e1002703&amp;rft.date=2012&amp;rft_id=https%3A%2F%2Fwww.ncbi.nlm.nih.gov%2Fpmc%2Farticles%2FPMC3349737%23id-name%3DPMC&amp;rft_id=info%3Apmid%2F22589740&amp;rft_id=info%3Adoi%2F10.1371%2Fjournal.pgen.1002703&amp;rft.aulast=Cornille&amp;rft.aufirst=Amandine&amp;rft.au=Gladieux%2C+Pierre&amp;rft.au=Smulders%2C+Marinus+J.+M.&amp;rft.au=Rold%C3%A1n-Ruiz%2C+Isabel&amp;rft.au=Laurens%2C+Fran%C3%A7ois&amp;rft.au=Le+Cam%2C+Bruno&amp;rft.au=Nersesyan%2C+Anush&amp;rft.au=Clavel%2C+Joanne&amp;rft.au=Olonova%2C+Marina&amp;rft_id=https%3A%2F%2Fwww.ncbi.nlm.nih.gov%2Fpmc%2Farticles%2FPMC3349737&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-28"><span class="mw-cite-backlink"><b><a href="#cite_ref-28" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFKean2012" class="citation web cs1">Kean, Sam (17 May 2012). <a rel="nofollow" class="external text" href="https://www.science.org/content/article/scienceshot-secret-history-domesticated-apple">"ScienceShot: The Secret History of the Domesticated Apple"</a>. <a rel="nofollow" class="external text" href="https://web.archive.org/web/20160611184017/http://www.sciencemag.org/news/2012/05/scienceshot-secret-history-domesticated-apple">Archived</a> from the original on 11 June 2016.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=unknown&amp;rft.btitle=ScienceShot%3A+The+Secret+History+of+the+Domesticated+Apple&amp;rft.date=2012-05-17&amp;rft.aulast=Kean&amp;rft.aufirst=Sam&amp;rft_id=https%3A%2F%2Fwww.science.org%2Fcontent%2Farticle%2Fscienceshot-secret-history-domesticated-apple&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-29"><span class="mw-cite-backlink"><b><a href="#cite_ref-29" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFCoartVan_GlabekeDe_LooseLarsen2006" class="citation journal cs1">Coart, E.; Van Glabeke, S.; De Loose, M.; Larsen, A.S.; Roldán-Ruiz, I. (2006). "Chloroplast diversity in the genus <i>Malus</i>: new insights into the relationship between the European wild apple (<i>Malus sylvestris</i> (L.) Mill.) and the domesticated apple (<i>Malus domestica</i> Borkh.)". <i>Mol. Ecol</i>. <b>15</b> (8): 2171–2182. <a href="/wiki/Bibcode_(identifier)" class="mw-redirect" title="Bibcode (identifier)">Bibcode</a>:<a rel="nofollow" class="external text" href="https://ui.adsabs.harvard.edu/abs/2006MolEc..15.2171C">2006MolEc..15.2171C</a>. <a href="/wiki/Doi_(identifier)" class="mw-redirect" title="Doi (identifier)">doi</a>:<a rel="nofollow" class="external text" href="https://doi.org/10.1111%2Fj.1365-294x.2006.02924.x">10.1111/j.1365-294x.2006.02924.x</a>. <a href="/wiki/PMID_(identifier)" class="mw-redirect" title="PMID (identifier)">PMID</a>&nbsp;<a rel="nofollow" class="external text" href="https://pubmed.ncbi.nlm.nih.gov/16780433">16780433</a>. 
<a href="/wiki/S2CID_(identifier)" class="mw-redirect" title="S2CID (identifier)">S2CID</a>&nbsp;<a rel="nofollow" class="external text" href="https://api.semanticscholar.org/CorpusID:31481730">31481730</a>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=article&amp;rft.jtitle=Mol.+Ecol.&amp;rft.atitle=Chloroplast+diversity+in+the+genus+Malus%3A+new+insights+into+the+relationship+between+the+European+wild+apple+%28Malus+sylvestris+%28L.%29+Mill.%29+and+the+domesticated+apple+%28Malus+domestica+Borkh.%29&amp;rft.volume=15&amp;rft.issue=8&amp;rft.pages=2171-2182&amp;rft.date=2006&amp;rft_id=info%3Adoi%2F10.1111%2Fj.1365-294x.2006.02924.x&amp;rft_id=https%3A%2F%2Fapi.semanticscholar.org%2FCorpusID%3A31481730%23id-name%3DS2CID&amp;rft_id=info%3Apmid%2F16780433&amp;rft_id=info%3Abibcode%2F2006MolEc..15.2171C&amp;rft.aulast=Coart&amp;rft.aufirst=E.&amp;rft.au=Van+Glabeke%2C+S.&amp;rft.au=De+Loose%2C+M.&amp;rft.au=Larsen%2C+A.S.&amp;rft.au=Rold%C3%A1n-Ruiz%2C+I.&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-30"><span class="mw-cite-backlink"><b><a href="#cite_ref-30" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFRottoliPessina2007" class="citation book cs1">Rottoli, Mauro; Pessina, Andrea (2007). "Chapter 9: Neolithic agriculture in Italy: an update of archaeobotanical data with particular emphasis on northern settlements". In Colledge, Sue; Conolly, James (eds.). <span class="id-lock-limited" title="Free access subject to limited trial, subscription normally required"><a rel="nofollow" class="external text" href="https://archive.org/details/originsspreadofd0000unse"><i>The Origins and Spread of Domestic Plants in Southwest Asia and Europe</i></a></span> (First&nbsp;ed.). Walnut Creek, California: <a href="/wiki/Left_Coast_Press" title="Left Coast Press">Left Coast Press</a>; University College London Institute of Archaeology Publications. pp.&nbsp;142–143. <a href="/wiki/ISBN_(identifier)" class="mw-redirect" title="ISBN (identifier)">ISBN</a>&nbsp;<a href="/wiki/Special:BookSources/978-1-59874-988-5" title="Special:BookSources/978-1-59874-988-5"><bdi>978-1-59874-988-5</bdi></a>. 
<a href="/wiki/OCLC_(identifier)" class="mw-redirect" title="OCLC (identifier)">OCLC</a>&nbsp;<a rel="nofollow" class="external text" href="https://search.worldcat.org/oclc/84838157">84838157</a>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=bookitem&amp;rft.atitle=Chapter+9%3A+Neolithic+agriculture+in+Italy%3A+an+update+of+archaeobotanical+data+with+particular+emphasis+on+northern+settlements&amp;rft.btitle=The+Origins+and+Spread+of+Domestic+Plants+in+Southwest+Asia+and+Europe&amp;rft.place=Walnut+Creek%2C+California&amp;rft.pages=142-143&amp;rft.edition=First&amp;rft.pub=Left+Coast+Press%3B+University+College+London+Institute+of+Archaeology+Publications&amp;rft.date=2007&amp;rft_id=info%3Aoclcnum%2F84838157&amp;rft.isbn=978-1-59874-988-5&amp;rft.aulast=Rottoli&amp;rft.aufirst=Mauro&amp;rft.au=Pessina%2C+Andrea&amp;rft_id=https%3A%2F%2Farchive.org%2Fdetails%2Foriginsspreadofd0000unse&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-Ancient_DNA-31"><span class="mw-cite-backlink">^ <a href="#cite_ref-Ancient_DNA_31-0"><span class="cite-accessibility-label">Jump up to: </span><sup><i><b>a</b></i></sup></a> <a href="#cite_ref-Ancient_DNA_31-1"><sup><i><b>b</b></i></sup></a> <a href="#cite_ref-Ancient_DNA_31-2"><sup><i><b>c</b></i></sup></a> <a href="#cite_ref-Ancient_DNA_31-3"><sup><i><b>d</b></i></sup></a></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFSchlumbaumvan_GlabekeRoldan-Ruiz2012" class="citation journal cs1">Schlumbaum, Angela; van Glabeke, Sabine; Roldan-Ruiz, Isabel (January 2012). "Towards the onset of fruit tree growing north of the Alps: Ancient DNA from waterlogged apple (<i>Malus</i> sp.) seed fragments". <i>Annals of Anatomy - Anatomischer Anzeiger</i>. <b>194</b> (1): 157–162. <a href="/wiki/Doi_(identifier)" class="mw-redirect" title="Doi (identifier)">doi</a>:<a rel="nofollow" class="external text" href="https://doi.org/10.1016%2Fj.aanat.2011.03.004">10.1016/j.aanat.2011.03.004</a>. <a href="/wiki/PMID_(identifier)" class="mw-redirect" title="PMID (identifier)">PMID</a>&nbsp;<a rel="nofollow" class="external text" href="https://pubmed.ncbi.nlm.nih.gov/21501956">21501956</a>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=article&amp;rft.jtitle=Annals+of+Anatomy+-+Anatomischer+Anzeiger&amp;rft.atitle=Towards+the+onset+of+fruit+tree+growing+north+of+the+Alps%3A+Ancient+DNA+from+waterlogged+apple+%28Malus+sp.%29+seed+fragments&amp;rft.volume=194&amp;rft.issue=1&amp;rft.pages=157-162&amp;rft.date=2012-01&amp;rft_id=info%3Adoi%2F10.1016%2Fj.aanat.2011.03.004&amp;rft_id=info%3Apmid%2F21501956&amp;rft.aulast=Schlumbaum&amp;rft.aufirst=Angela&amp;rft.au=van+Glabeke%2C+Sabine&amp;rft.au=Roldan-Ruiz%2C+Isabel&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-32"><span class="mw-cite-backlink"><b><a href="#cite_ref-32" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFSauer1993" class="citation book cs1"><a href="/wiki/Jonathan_Deininger_Sauer" title="Jonathan Deininger Sauer">Sauer, Jonathan D.</a> (1993). <i>Historical Geography of Crop Plants: A Select Roster</i> (First&nbsp;ed.). Boca Raton, Florida: <a href="/wiki/CRC_Press" title="CRC Press">CRC Press</a>. pp.&nbsp;109–113. <a href="/wiki/ISBN_(identifier)" class="mw-redirect" title="ISBN (identifier)">ISBN</a>&nbsp;<a href="/wiki/Special:BookSources/978-0-8493-8901-6" title="Special:BookSources/978-0-8493-8901-6"><bdi>978-0-8493-8901-6</bdi></a>. <a href="/wiki/LCCN_(identifier)" class="mw-redirect" title="LCCN (identifier)">LCCN</a>&nbsp;<a rel="nofollow" class="external text" href="https://lccn.loc.gov/92045590">92045590</a>. <a href="/wiki/OCLC_(identifier)" class="mw-redirect" title="OCLC (identifier)">OCLC</a>&nbsp;<a rel="nofollow" class="external text" href="https://search.worldcat.org/oclc/27224696">27224696</a>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=book&amp;rft.btitle=Historical+Geography+of+Crop+Plants%3A+A+Select+Roster&amp;rft.place=Boca+Raton%2C+Florida&amp;rft.pages=109-113&amp;rft.edition=First&amp;rft.pub=CRC+Press&amp;rft.date=1993&amp;rft_id=info%3Aoclcnum%2F27224696&amp;rft_id=info%3Alccn%2F92045590&amp;rft.isbn=978-0-8493-8901-6&amp;rft.aulast=Sauer&amp;rft.aufirst=Jonathan+D.&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-33"><span class="mw-cite-backlink"><b><a href="#cite_ref-33" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFPlinius1855" class="citation book cs1"><a href="/wiki/Pliny_the_Elder" title="Pliny the Elder">Plinius, Gaius Secundus</a> (1855). <a rel="nofollow" class="external text" href="https://archive.org/details/naturalhistoryof03plin/page/303"><i>The Natural History of Pliny</i></a>. Vol.&nbsp;III. Translated by <a href="/wiki/John_Bostock_(physician)" title="John Bostock (physician)">Bostock, John</a>; <a href="/wiki/Henry_Thomas_Riley" title="Henry Thomas Riley">Riley, Henry T.</a> London: <a href="/wiki/Henry_G._Bohn" class="mw-redirect" title="Henry G. Bohn">Henry G. Bohn</a>. p.&nbsp;303<span class="reference-accessdate">. Retrieved <span class="nowrap">3 August</span> 2024</span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=book&amp;rft.btitle=The+Natural+History+of+Pliny&amp;rft.place=London&amp;rft.pages=303&amp;rft.pub=Henry+G.+Bohn&amp;rft.date=1855&amp;rft.aulast=Plinius&amp;rft.aufirst=Gaius+Secundus&amp;rft_id=https%3A%2F%2Farchive.org%2Fdetails%2Fnaturalhistoryof03plin%2Fpage%2F303&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-34"><span class="mw-cite-backlink"><b><a href="#cite_ref-34" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFMartin1976" class="citation book cs1">Martin, Alice A. (1976). <a rel="nofollow" class="external text" href="https://archive.org/details/allaboutapples0000mart/page/64"><i>All About Apples</i></a> (First&nbsp;ed.). Boston, Massachusetts: <a href="/wiki/Houghton_Mifflin_Company" class="mw-redirect" title="Houghton Mifflin Company">Houghton Mifflin Company</a>. pp.&nbsp;64–65. <a href="/wiki/ISBN_(identifier)" class="mw-redirect" title="ISBN (identifier)">ISBN</a>&nbsp;<a href="/wiki/Special:BookSources/978-0-395-20724-6" title="Special:BookSources/978-0-395-20724-6"><bdi>978-0-395-20724-6</bdi></a>. <a href="/wiki/OCLC_(identifier)" class="mw-redirect" title="OCLC (identifier)">OCLC</a>&nbsp;<a rel="nofollow" class="external text" href="https://search.worldcat.org/oclc/1733691">1733691</a><span class="reference-accessdate">. Retrieved <span class="nowrap">3 August</span> 2024</span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=book&amp;rft.btitle=All+About+Apples&amp;rft.place=Boston%2C+Massachusetts&amp;rft.pages=64-65&amp;rft.edition=First&amp;rft.pub=Houghton+Mifflin+Company&amp;rft.date=1976&amp;rft_id=info%3Aoclcnum%2F1733691&amp;rft.isbn=978-0-395-20724-6&amp;rft.aulast=Martin&amp;rft.aufirst=Alice+A.&amp;rft_id=https%3A%2F%2Farchive.org%2Fdetails%2Fallaboutapples0000mart%2Fpage%2F64&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-35"><span class="mw-cite-backlink"><b><a href="#cite_ref-35" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFAdamson2004" class="citation book cs1">Adamson, Melitta Weiss (2004). <span class="id-lock-limited" title="Free access subject to limited trial, subscription normally required"><a rel="nofollow" class="external text" href="https://archive.org/details/foodinmedievalti0000adam"><i>Food in Medieval Times</i></a></span> (First&nbsp;ed.). Westport, Connecticut: <a href="/wiki/Greenwood_Press" class="mw-redirect" title="Greenwood Press">Greenwood Press</a>. pp.&nbsp;19–20. <a href="/wiki/ISBN_(identifier)" class="mw-redirect" title="ISBN (identifier)">ISBN</a>&nbsp;<a href="/wiki/Special:BookSources/978-0-313-32147-4" title="Special:BookSources/978-0-313-32147-4"><bdi>978-0-313-32147-4</bdi></a>. <a href="/wiki/LCCN_(identifier)" class="mw-redirect" title="LCCN (identifier)">LCCN</a>&nbsp;<a rel="nofollow" class="external text" href="https://lccn.loc.gov/2004014054">2004014054</a>. <a href="/wiki/OCLC_(identifier)" class="mw-redirect" title="OCLC (identifier)">OCLC</a>&nbsp;<a rel="nofollow" class="external text" href="https://search.worldcat.org/oclc/55738647">55738647</a>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=book&amp;rft.btitle=Food+in+Medieval+Times&amp;rft.place=Westport%2C+Connecticut&amp;rft.pages=19-20&amp;rft.edition=First&amp;rft.pub=Greenwood+Press&amp;rft.date=2004&amp;rft_id=info%3Aoclcnum%2F55738647&amp;rft_id=info%3Alccn%2F2004014054&amp;rft.isbn=978-0-313-32147-4&amp;rft.aulast=Adamson&amp;rft.aufirst=Melitta+Weiss&amp;rft_id=https%3A%2F%2Farchive.org%2Fdetails%2Ffoodinmedievalti0000adam&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-Torrejonetal2004-36"><span class="mw-cite-backlink"><b><a href="#cite_ref-Torrejonetal2004_36-0" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFTorrejónCisternasAraneda2004" class="citation journal cs1 cs1-prop-foreign-lang-source">Torrejón, Fernando; Cisternas, Marco; Araneda, Alberto (2004). <a rel="nofollow" class="external text" href="https://doi.org/10.4067%2Fs0716-078x2004000400009">"Efectos ambientales de la colonización española desde el río Maullín al archipiélago de Chiloé, sur de Chile"</a> [Environmental effects of the spanish colonization from de Maullín river to the Chiloé archipelago, southern Chile]. <i><a href="/wiki/Revista_Chilena_de_Historia_Natural" title="Revista Chilena de Historia Natural">Revista Chilena de Historia Natural</a></i> (in Spanish). <b>77</b> (4): 661–677. <a href="/wiki/Doi_(identifier)" class="mw-redirect" title="Doi (identifier)">doi</a>:<span class="id-lock-free" title="Freely accessible"><a rel="nofollow" class="external text" href="https://doi.org/10.4067%2Fs0716-078x2004000400009">10.4067/s0716-078x2004000400009</a></span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=article&amp;rft.jtitle=Revista+Chilena+de+Historia+Natural&amp;rft.atitle=Efectos+ambientales+de+la+colonizaci%C3%B3n+espa%C3%B1ola+desde+el+r%C3%ADo+Maull%C3%ADn+al+archipi%C3%A9lago+de+Chilo%C3%A9%2C+sur+de+Chile&amp;rft.volume=77&amp;rft.issue=4&amp;rft.pages=661-677&amp;rft.date=2004&amp;rft_id=info%3Adoi%2F10.4067%2Fs0716-078x2004000400009&amp;rft.aulast=Torrej%C3%B3n&amp;rft.aufirst=Fernando&amp;rft.au=Cisternas%2C+Marco&amp;rft.au=Araneda%2C+Alberto&amp;rft_id=https%3A%2F%2Fdoi.org%2F10.4067%252Fs0716-078x2004000400009&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-37"><span class="mw-cite-backlink"><b><a href="#cite_ref-37" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFSmith1963" class="citation book cs1">Smith, Archibald William (1963). <span class="id-lock-registration" title="Free registration required"><a rel="nofollow" class="external text" href="https://archive.org/details/gardenersbookofp00smit/page/40"><i>A Gardener's Book of Plant Names&nbsp;: A Handbook of the Meaning and Origins of Plant Names</i></a></span> (First&nbsp;ed.). New York: <a href="/wiki/Harper_%26_Row" class="mw-redirect" title="Harper &amp; Row">Harper &amp; Row</a>. p.&nbsp;40. <a href="/wiki/LCCN_(identifier)" class="mw-redirect" title="LCCN (identifier)">LCCN</a>&nbsp;<a rel="nofollow" class="external text" href="https://lccn.loc.gov/62009906">62009906</a>. <a href="/wiki/OCLC_(identifier)" class="mw-redirect" title="OCLC (identifier)">OCLC</a>&nbsp;<a rel="nofollow" class="external text" href="https://search.worldcat.org/oclc/710612">710612</a><span class="reference-accessdate">. Retrieved <span class="nowrap">10 August</span> 2024</span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=book&amp;rft.btitle=A+Gardener%27s+Book+of+Plant+Names+%3A+A+Handbook+of+the+Meaning+and+Origins+of+Plant+Names&amp;rft.place=New+York&amp;rft.pages=40&amp;rft.edition=First&amp;rft.pub=Harper+%26+Row&amp;rft.date=1963&amp;rft_id=info%3Aoclcnum%2F710612&amp;rft_id=info%3Alccn%2F62009906&amp;rft.aulast=Smith&amp;rft.aufirst=Archibald+William&amp;rft_id=https%3A%2F%2Farchive.org%2Fdetails%2Fgardenersbookofp00smit%2Fpage%2F40&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-Harrowsmith-38"><span class="mw-cite-backlink">^ <a href="#cite_ref-Harrowsmith_38-0"><span class="cite-accessibility-label">Jump up to: </span><sup><i><b>a</b></i></sup></a> <a href="#cite_ref-Harrowsmith_38-1"><sup><i><b>b</b></i></sup></a> <a href="#cite_ref-Harrowsmith_38-2"><sup><i><b>c</b></i></sup></a></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFPoole1980" class="citation book cs1">Poole, Mike (1980). <span class="id-lock-registration" title="Free registration required"><a rel="nofollow" class="external text" href="https://archive.org/details/harrowsmithreade0000unse_k4b7/page/122">"Heirloom Apples"</a></span>. In Lawrence, James (ed.). <i>The Harrowsmith Reader Volume II</i>. Camden East, Ontario: <a href="/wiki/Camden_House_Publishing" title="Camden House Publishing">Camden House Publishing</a>. p.&nbsp;122. <a href="/wiki/ISBN_(identifier)" class="mw-redirect" title="ISBN (identifier)">ISBN</a>&nbsp;<a href="/wiki/Special:BookSources/978-0-920656-11-2" title="Special:BookSources/978-0-920656-11-2"><bdi>978-0-920656-11-2</bdi></a>. <a href="/wiki/OCLC_(identifier)" class="mw-redirect" title="OCLC (identifier)">OCLC</a>&nbsp;<a rel="nofollow" class="external text" href="https://search.worldcat.org/oclc/1336124440">1336124440</a><span class="reference-accessdate">. 
Retrieved <span class="nowrap">10 August</span> 2024</span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=bookitem&amp;rft.atitle=Heirloom+Apples&amp;rft.btitle=The+Harrowsmith+Reader+Volume+II&amp;rft.place=Camden+East%2C+Ontario&amp;rft.pages=122&amp;rft.pub=Camden+House+Publishing&amp;rft.date=1980&amp;rft_id=info%3Aoclcnum%2F1336124440&amp;rft.isbn=978-0-920656-11-2&amp;rft.aulast=Poole&amp;rft.aufirst=Mike&amp;rft_id=https%3A%2F%2Farchive.org%2Fdetails%2Fharrowsmithreade0000unse_k4b7%2Fpage%2F122&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-39"><span class="mw-cite-backlink"><b><a href="#cite_ref-39" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFVan_Valen1900" class="citation book cs1">Van Valen, James M. (1900). <a rel="nofollow" class="external text" href="https://archive.org/details/historybergenco00valegoog/page/33"><i>History of Bergen County, New Jersey</i></a>. New York: New Jersey Publishing and Engraving Company. pp.&nbsp;33–34. <a href="/wiki/OCLC_(identifier)" class="mw-redirect" title="OCLC (identifier)">OCLC</a>&nbsp;<a rel="nofollow" class="external text" href="https://search.worldcat.org/oclc/25697876">25697876</a><span class="reference-accessdate">. Retrieved <span class="nowrap">9 August</span> 2024</span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=book&amp;rft.btitle=History+of+Bergen+County%2C+New+Jersey&amp;rft.place=New+York&amp;rft.pages=33-34&amp;rft.pub=New+Jersey+Publishing+and+Engraving+Company&amp;rft.date=1900&amp;rft_id=info%3Aoclcnum%2F25697876&amp;rft.aulast=Van+Valen&amp;rft.aufirst=James+M.&amp;rft_id=https%3A%2F%2Farchive.org%2Fdetails%2Fhistorybergenco00valegoog%2Fpage%2F33&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-40"><span class="mw-cite-backlink"><b><a href="#cite_ref-40" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFBrox1999" class="citation book cs1"><a href="/wiki/Jane_Brox" title="Jane Brox">Brox, Jane</a> (1999). <span class="id-lock-registration" title="Free registration required"><a rel="nofollow" class="external text" href="https://archive.org/details/fivethousanddays00brox/page/150"><i>Five Thousand Days Like This One</i></a></span> (First&nbsp;ed.). Boston, Massachusetts: Beacon Press. pp.&nbsp;150–151. <a href="/wiki/ISBN_(identifier)" class="mw-redirect" title="ISBN (identifier)">ISBN</a>&nbsp;<a href="/wiki/Special:BookSources/978-0-8070-2106-4" title="Special:BookSources/978-0-8070-2106-4"><bdi>978-0-8070-2106-4</bdi></a>. <a href="/wiki/LCCN_(identifier)" class="mw-redirect" title="LCCN (identifier)">LCCN</a>&nbsp;<a rel="nofollow" class="external text" href="https://lccn.loc.gov/98035051">98035051</a>. <a href="/wiki/OCLC_(identifier)" class="mw-redirect" title="OCLC (identifier)">OCLC</a>&nbsp;<a rel="nofollow" class="external text" href="https://search.worldcat.org/oclc/39605684">39605684</a><span class="reference-accessdate">. Retrieved <span class="nowrap">9 August</span> 2024</span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=book&amp;rft.btitle=Five+Thousand+Days+Like+This+One&amp;rft.place=Boston%2C+Massachusetts&amp;rft.pages=150-151&amp;rft.edition=First&amp;rft.pub=Beacon+Press&amp;rft.date=1999&amp;rft_id=info%3Aoclcnum%2F39605684&amp;rft_id=info%3Alccn%2F98035051&amp;rft.isbn=978-0-8070-2106-4&amp;rft.aulast=Brox&amp;rft.aufirst=Jane&amp;rft_id=https%3A%2F%2Farchive.org%2Fdetails%2Ffivethousanddays00brox%2Fpage%2F150&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-41"><span class="mw-cite-backlink"><b><a href="#cite_ref-41" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFCohen2018" class="citation web cs1">Cohen, Rachel D. (26 November 2018). <a rel="nofollow" class="external text" href="https://www.npr.org/sections/thesalt/2018/11/26/668256349/thanks-to-science-you-can-eat-an-apple-every-day">"Thanks To Science, You Can Eat An Apple Every Day"</a>. <i>The Salt</i>. <a href="/wiki/NPR" title="NPR">NPR</a>. <a rel="nofollow" class="external text" href="https://web.archive.org/web/20240618003023/https://www.npr.org/sections/thesalt/2018/11/26/668256349/thanks-to-science-you-can-eat-an-apple-every-day">Archived</a> from the original on 18 June 2024<span class="reference-accessdate">. Retrieved <span class="nowrap">1 August</span> 2024</span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=unknown&amp;rft.jtitle=The+Salt&amp;rft.atitle=Thanks+To+Science%2C+You+Can+Eat+An+Apple+Every+Day&amp;rft.date=2018-11-26&amp;rft.aulast=Cohen&amp;rft.aufirst=Rachel+D.&amp;rft_id=https%3A%2F%2Fwww.npr.org%2Fsections%2Fthesalt%2F2018%2F11%2F26%2F668256349%2Fthanks-to-science-you-can-eat-an-apple-every-day&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-42"><span class="mw-cite-backlink"><b><a href="#cite_ref-42" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite class="citation web cs1"><a rel="nofollow" class="external text" href="https://blogs.cornell.edu/jentsch/the-heirloom-orchard/">"The Heirloom Apple Orchard"</a>. <i>The Jentsch Lab</i>. <a href="/wiki/Cornell_University" title="Cornell University">Cornell University</a>. <a rel="nofollow" class="external text" href="https://web.archive.org/web/20240730203237/https://blogs.cornell.edu/jentsch/the-heirloom-orchard/">Archived</a> from the original on 30 July 2024<span class="reference-accessdate">. Retrieved <span class="nowrap">9 August</span> 2024</span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=unknown&amp;rft.jtitle=The+Jentsch+Lab&amp;rft.atitle=The+Heirloom+Apple+Orchard&amp;rft_id=https%3A%2F%2Fblogs.cornell.edu%2Fjentsch%2Fthe-heirloom-orchard%2F&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-43"><span class="mw-cite-backlink"><b><a href="#cite_ref-43" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFRanney" class="citation conference cs1">Ranney, Thomas G. <a rel="nofollow" class="external text" href="https://web.archive.org/web/20100723170402/http://www.ces.ncsu.edu/fletcher/programs/nursery/metria/metria11/ranney/index.html">"Polyploidy: From Evolution to Landscape Plant Improvement"</a>. <i>Proceedings of the 11th Metropolitan Tree Improvement Alliance (METRIA) Conference</i>. <a rel="nofollow" class="external text" href="https://www.ces.ncsu.edu/fletcher/programs/nursery/metria/metria11/index.html">11th Metropolitan Tree Improvement Alliance Conference held in Gresham, Oregon, August 23–24, 2000</a>. <i>METRIA (NCSU.edu)</i>. METRIA. Archived from <a rel="nofollow" class="external text" href="http://www.ces.ncsu.edu/fletcher/programs/nursery/metria/metria11/ranney/index.html">the original</a> on 23 July 2010<span class="reference-accessdate">. Retrieved <span class="nowrap">7 November</span> 2010</span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=conference&amp;rft.jtitle=METRIA+%28NCSU.edu%29&amp;rft.atitle=Proceedings+of+the+11th+Metropolitan+Tree+Improvement+Alliance+%28METRIA%29+Conference&amp;rft.aulast=Ranney&amp;rft.aufirst=Thomas+G.&amp;rft_id=http%3A%2F%2Fwww.ces.ncsu.edu%2Ffletcher%2Fprograms%2Fnursery%2Fmetria%2Fmetria11%2Franney%2Findex.html&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-44"><span class="mw-cite-backlink"><b><a href="#cite_ref-44" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFLordOuellette2010" class="citation web cs1">Lord, William G.; Ouellette, Amy (February 2010). <a rel="nofollow" class="external text" href="https://web.archive.org/web/20130930151829/http://extension.unh.edu/resources/files/Resource000583_Rep605.pdf">"Dwarf Rootstocks for Apple Trees in the Home Garden"</a> <span class="cs1-format">(PDF)</span>. <a href="/wiki/University_of_New_Hampshire" title="University of New Hampshire">University of New Hampshire</a>. Archived from <a rel="nofollow" class="external text" href="http://extension.unh.edu/resources/files/resource000583_rep605.pdf">the original</a> <span class="cs1-format">(PDF)</span> on 30 September 2013<span class="reference-accessdate">. Retrieved <span class="nowrap">1 September</span> 2013</span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=unknown&amp;rft.btitle=Dwarf+Rootstocks+for+Apple+Trees+in+the+Home+Garden&amp;rft.pub=University+of+New+Hampshire&amp;rft.date=2010-02&amp;rft.aulast=Lord&amp;rft.aufirst=William+G.&amp;rft.au=Ouellette%2C+Amy&amp;rft_id=http%3A%2F%2Fextension.unh.edu%2Fresources%2Ffiles%2Fresource000583_rep605.pdf&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-45"><span class="mw-cite-backlink"><b><a href="#cite_ref-45" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFFallahiColtFallahiChun2002" class="citation journal cs1">Fallahi, Esmaeil; Colt, W. Michael; Fallahi, Bahar; Chun, Ik-Jo (January 2002). <a rel="nofollow" class="external text" href="https://journals.ashs.org/horttech/view/journals/horttech/12/1/article-p38.xml">"The Importance of Apple Rootstocks on Tree Growth, Yield, Fruit Quality, Leaf Nutrition, and Photosynthesis with an Emphasis on 'Fuji'<span class="cs1-kern-right"></span>"</a>. <i>HortTechnology</i>. <b>12</b> (1): 38–44. <a href="/wiki/Doi_(identifier)" class="mw-redirect" title="Doi (identifier)">doi</a>:<a rel="nofollow" class="external text" href="https://doi.org/10.21273%2FHORTTECH.12.1.38">10.21273/HORTTECH.12.1.38</a>. <a rel="nofollow" class="external text" href="https://web.archive.org/web/20140211173706/http://horttech.ashspublications.org/content/12/1/38.full.pdf">Archived</a> <span class="cs1-format">(PDF)</span> from the original on 11 February 2014<span class="reference-accessdate">. 
Retrieved <span class="nowrap">9 August</span> 2024</span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=article&amp;rft.jtitle=HortTechnology&amp;rft.atitle=The+Importance+of+Apple+Rootstocks+on+Tree+Growth%2C+Yield%2C+Fruit+Quality%2C+Leaf+Nutrition%2C+and+Photosynthesis+with+an+Emphasis+on+%27Fuji%27&amp;rft.volume=12&amp;rft.issue=1&amp;rft.pages=38-44&amp;rft.date=2002-01&amp;rft_id=info%3Adoi%2F10.21273%2FHORTTECH.12.1.38&amp;rft.aulast=Fallahi&amp;rft.aufirst=Esmaeil&amp;rft.au=Colt%2C+W.+Michael&amp;rft.au=Fallahi%2C+Bahar&amp;rft.au=Chun%2C+Ik-Jo&amp;rft_id=https%3A%2F%2Fjournals.ashs.org%2Fhorttech%2Fview%2Fjournals%2Fhorttech%2F12%2F1%2Farticle-p38.xml&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-46"><span class="mw-cite-backlink"><b><a href="#cite_ref-46" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFParker1993" class="citation web cs1">Parker, M.L. (September 1993). <a rel="nofollow" class="external text" href="https://web.archive.org/web/20130911051127/http://www.ces.ncsu.edu/hil/hil-300-a.html">"Apple Rootstocks and Tree Spacing"</a>. <i>North Carolina Cooperative Extension Service</i>. Archived from <a rel="nofollow" class="external text" href="http://www.ces.ncsu.edu/hil/hil-300-a.html">the original</a> on 11 September 2013<span class="reference-accessdate">. Retrieved <span class="nowrap">1 September</span> 2013</span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=unknown&amp;rft.jtitle=North+Carolina+Cooperative+Extension+Service&amp;rft.atitle=Apple+Rootstocks+and+Tree+Spacing&amp;rft.date=1993-09&amp;rft.aulast=Parker&amp;rft.aufirst=M.L.&amp;rft_id=http%3A%2F%2Fwww.ces.ncsu.edu%2Fhil%2Fhil-300-a.html&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-47"><span class="mw-cite-backlink"><b><a href="#cite_ref-47" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFFerreeWarrington2003" class="citation book cs1">Ferree, David Curtis; Warrington, Ian J. (2003). <i>Apples: Botany, Production, and Uses</i>. New York: Centre for Agriculture and Bioscience International. pp.&nbsp;33–35. <a href="/wiki/ISBN_(identifier)" class="mw-redirect" title="ISBN (identifier)">ISBN</a>&nbsp;<a href="/wiki/Special:BookSources/978-0851995922" title="Special:BookSources/978-0851995922"><bdi>978-0851995922</bdi></a>. <a href="/wiki/OCLC_(identifier)" class="mw-redirect" title="OCLC (identifier)">OCLC</a>&nbsp;<a rel="nofollow" class="external text" href="https://search.worldcat.org/oclc/133167834">133167834</a>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=book&amp;rft.btitle=Apples%3A+Botany%2C+Production%2C+and+Uses&amp;rft.place=New+York&amp;rft.pages=33-35&amp;rft.pub=Centre+for+Agriculture+and+Bioscience+International&amp;rft.date=2003&amp;rft_id=info%3Aoclcnum%2F133167834&amp;rft.isbn=978-0851995922&amp;rft.aulast=Ferree&amp;rft.aufirst=David+Curtis&amp;rft.au=Warrington%2C+Ian+J.&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-Polomski_&amp;_Reighard-48"><span class="mw-cite-backlink">^ <a href="#cite_ref-Polomski_&amp;_Reighard_48-0"><span class="cite-accessibility-label">Jump up to: </span><sup><i><b>a</b></i></sup></a> <a href="#cite_ref-Polomski_&amp;_Reighard_48-1"><sup><i><b>b</b></i></sup></a> <a href="#cite_ref-Polomski_&amp;_Reighard_48-2"><sup><i><b>c</b></i></sup></a> <a href="#cite_ref-Polomski_&amp;_Reighard_48-3"><sup><i><b>d</b></i></sup></a></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFPolomskiReighard" class="citation web cs1">Polomski, Bob; Reighard, Greg. <a rel="nofollow" class="external text" href="https://web.archive.org/web/20080228131352/http://hgic.clemson.edu/factsheets/HGIC1350.htm">"Apple HGIC 1350"</a>. <i>Home &amp; Garden Information Center</i>. <a href="/wiki/Clemson_University" title="Clemson University">Clemson University</a>. Archived from <a rel="nofollow" class="external text" href="http://hgic.clemson.edu/factsheets/HGIC1350.htm">the original</a> on 28 February 2008<span class="reference-accessdate">. Retrieved <span class="nowrap">22 January</span> 2008</span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=unknown&amp;rft.jtitle=Home+%26+Garden+Information+Center&amp;rft.atitle=Apple+HGIC+1350&amp;rft.aulast=Polomski&amp;rft.aufirst=Bob&amp;rft.au=Reighard%2C+Greg&amp;rft_id=http%3A%2F%2Fhgic.clemson.edu%2Ffactsheets%2FHGIC1350.htm&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-49"><span class="mw-cite-backlink"><b><a href="#cite_ref-49" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFBarahona1992" class="citation journal cs1">Barahona, M. (1992). "Adaptation of Apple Varieties in Ecuador". <i>Acta Horticulturae</i> (310): 135–142. <a href="/wiki/Doi_(identifier)" class="mw-redirect" title="Doi (identifier)">doi</a>:<a rel="nofollow" class="external text" href="https://doi.org/10.17660%2FActaHortic.1992.310.17">10.17660/ActaHortic.1992.310.17</a>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=article&amp;rft.jtitle=Acta+Horticulturae&amp;rft.atitle=Adaptation+of+Apple+Varieties+in+Ecuador&amp;rft.issue=310&amp;rft.pages=135-142&amp;rft.date=1992&amp;rft_id=info%3Adoi%2F10.17660%2FActaHortic.1992.310.17&amp;rft.aulast=Barahona&amp;rft.aufirst=M.&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-50"><span class="mw-cite-backlink"><b><a href="#cite_ref-50" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFAdamson2011" class="citation thesis cs1">Adamson, Nancy Lee (2011). <a rel="nofollow" class="external text" href="http://www.step-project.net/NPDOCS/Adamson_NL_D_2011.pdf"><i>An Assessment of Non-Apis Bees as Fruit and Vegetable Crop Pollinators in Southwest Virginia</i></a> <span class="cs1-format">(PDF)</span> (Doctor of Philosophy in Entomology thesis). <a href="/wiki/Virginia_Polytechnic_Institute_and_State_University" class="mw-redirect" title="Virginia Polytechnic Institute and State University">Virginia Polytechnic Institute and State University</a>. <a rel="nofollow" class="external text" href="https://web.archive.org/web/20151120230411/http://www.step-project.net/NPDOCS/Adamson_NL_D_2011.pdf">Archived</a> <span class="cs1-format">(PDF)</span> from the original on 20 November 2015<span class="reference-accessdate">. Retrieved <span class="nowrap">15 October</span> 2015</span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Adissertation&amp;rft.title=An+Assessment+of+Non-Apis+Bees+as+Fruit+and+Vegetable+Crop+Pollinators+in+Southwest+Virginia&amp;rft.degree=Doctor+of+Philosophy+in+Entomology&amp;rft.inst=Virginia+Polytechnic+Institute+and+State+University&amp;rft.date=2011&amp;rft.aulast=Adamson&amp;rft.aufirst=Nancy+Lee&amp;rft_id=http%3A%2F%2Fwww.step-project.net%2FNPDOCS%2FAdamson_NL_D_2011.pdf&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-51"><span class="mw-cite-backlink"><b><a href="#cite_ref-51" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFPowell1986" class="citation journal cs1">Powell, L.E. (1986). "The Chilling Requirement in Apple and Its Role in Regulating Time of Flowering in Spring in Cold-Winter Climate". <i>Acta Horticulturae</i> (179). Wageningen, Netherlands: <a href="/wiki/International_Society_for_Horticultural_Science" title="International Society for Horticultural Science">International Society for Horticultural Science</a>: 129–140. <a href="/wiki/Doi_(identifier)" class="mw-redirect" title="Doi (identifier)">doi</a>:<a rel="nofollow" class="external text" href="https://doi.org/10.17660%2FActaHortic.1986.179.10">10.17660/ActaHortic.1986.179.10</a>. <a href="/wiki/ISBN_(identifier)" class="mw-redirect" title="ISBN (identifier)">ISBN</a>&nbsp;<a href="/wiki/Special:BookSources/978-90-6605-182-9" title="Special:BookSources/978-90-6605-182-9"><bdi>978-90-6605-182-9</bdi></a>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=article&amp;rft.jtitle=Acta+Horticulturae&amp;rft.atitle=The+Chilling+Requirement+in+Apple+and+Its+Role+in+Regulating+Time+of+Flowering+in+Spring+in+Cold-Winter+Climate&amp;rft.issue=179&amp;rft.pages=129-140&amp;rft.date=1986&amp;rft_id=info%3Adoi%2F10.17660%2FActaHortic.1986.179.10&amp;rft.isbn=978-90-6605-182-9&amp;rft.aulast=Powell&amp;rft.aufirst=L.E.&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-52"><span class="mw-cite-backlink"><b><a href="#cite_ref-52" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFRomano2023" class="citation web cs1">Romano, Andrea (10 September 2023). <a rel="nofollow" class="external text" href="https://www.travelandleisure.com/trip-ideas/fall-vacations/best-orchards-for-apple-picking">"20 Best Places to Go Apple Picking in the United States"</a>. <i>Travel + Leisure</i>. <a rel="nofollow" class="external text" href="https://web.archive.org/web/20240421140207/https://www.travelandleisure.com/trip-ideas/fall-vacations/best-orchards-for-apple-picking">Archived</a> from the original on 21 April 2024<span class="reference-accessdate">. Retrieved <span class="nowrap">2 August</span> 2024</span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=unknown&amp;rft.jtitle=Travel+%2B+Leisure&amp;rft.atitle=20+Best+Places+to+Go+Apple+Picking+in+the+United+States&amp;rft.date=2023-09-10&amp;rft.aulast=Romano&amp;rft.aufirst=Andrea&amp;rft_id=https%3A%2F%2Fwww.travelandleisure.com%2Ftrip-ideas%2Ffall-vacations%2Fbest-orchards-for-apple-picking&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-53"><span class="mw-cite-backlink"><b><a href="#cite_ref-53" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFGrazianoFarcuh2021" class="citation web cs1">Graziano, Jack; Farcuh, Macarena (10 September 2021). <a rel="nofollow" class="external text" href="https://extension.umd.edu/resource/controlled-atmosphere-storage-apples">"Controlled Atmosphere Storage of Apples"</a>. <i>University of Maryland Extension</i>. <a rel="nofollow" class="external text" href="https://web.archive.org/web/20230324131954/https://extension.umd.edu/resource/controlled-atmosphere-storage-apples">Archived</a> from the original on 24 March 2023<span class="reference-accessdate">. Retrieved <span class="nowrap">2 August</span> 2024</span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=unknown&amp;rft.jtitle=University+of+Maryland+Extension&amp;rft.atitle=Controlled+Atmosphere+Storage+of+Apples&amp;rft.date=2021-09-10&amp;rft.aulast=Graziano&amp;rft.aufirst=Jack&amp;rft.au=Farcuh%2C+Macarena&amp;rft_id=https%3A%2F%2Fextension.umd.edu%2Fresource%2Fcontrolled-atmosphere-storage-apples&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-54"><span class="mw-cite-backlink"><b><a href="#cite_ref-54" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite class="citation web cs1"><a rel="nofollow" class="external text" href="https://www.foodsafety.gov/keep-food-safe/foodkeeper-app">"FoodKeeper App"</a>. <i>FoodSafety.gov</i>. <a href="/wiki/United_States_Department_of_Health_and_Human_Services" title="United States Department of Health and Human Services">United States Department of Health and Human Services</a>. 26 April 2019<span class="reference-accessdate">. Retrieved <span class="nowrap">17 September</span> 2024</span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=unknown&amp;rft.jtitle=FoodSafety.gov&amp;rft.atitle=FoodKeeper+App&amp;rft.date=2019-04-26&amp;rft_id=https%3A%2F%2Fwww.foodsafety.gov%2Fkeep-food-safe%2Ffoodkeeper-app&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-55"><span class="mw-cite-backlink"><b><a href="#cite_ref-55" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite class="citation web cs1"><a rel="nofollow" class="external text" href="https://www.foodsafety.gov/keep-food-safe/4-steps-to-food-safety">"4 Steps to Food Safety"</a>. <i>FoodSafety.gov</i>. <a href="/wiki/United_States_Department_of_Health_and_Human_Services" title="United States Department of Health and Human Services">United States Department of Health and Human Services</a>. 12 April 2019<span class="reference-accessdate">. Retrieved <span class="nowrap">17 September</span> 2024</span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=unknown&amp;rft.jtitle=FoodSafety.gov&amp;rft.atitle=4+Steps+to+Food+Safety&amp;rft.date=2019-04-12&amp;rft_id=https%3A%2F%2Fwww.foodsafety.gov%2Fkeep-food-safe%2F4-steps-to-food-safety&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-56"><span class="mw-cite-backlink"><b><a href="#cite_ref-56" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite class="citation web cs1"><a rel="nofollow" class="external text" href="https://web.archive.org/web/20150315033439/http://www.csiro.au/en/Research/Health/Food-safety/Refrigerating-foods">"Refrigerated storage of perishable foods"</a>. <a href="/wiki/CSIRO" title="CSIRO">CSIRO</a>. 26 February 2015. Archived from <a rel="nofollow" class="external text" href="http://www.csiro.au/en/Research/Health/Food-safety/Refrigerating-foods">the original</a> on 15 March 2015<span class="reference-accessdate">. Retrieved <span class="nowrap">25 May</span> 2007</span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=unknown&amp;rft.btitle=Refrigerated+storage+of+perishable+foods&amp;rft.pub=CSIRO&amp;rft.date=2015-02-26&amp;rft_id=http%3A%2F%2Fwww.csiro.au%2Fen%2FResearch%2FHealth%2FFood-safety%2FRefrigerating-foods&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-57"><span class="mw-cite-backlink"><b><a href="#cite_ref-57" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFKarp2006" class="citation news cs1">Karp, David (25 October 2006). <a rel="nofollow" class="external text" href="https://www.nytimes.com/2006/10/25/dining/25fruit.html">"Puff the Magic Preservative: Lasting Crunch, but Less Scent"</a>. <i><a href="/wiki/The_New_York_Times" title="The New York Times">The New York Times</a></i>. <a rel="nofollow" class="external text" href="https://web.archive.org/web/20110803082104/http://www.nytimes.com/2006/10/25/dining/25fruit.html">Archived</a> from the original on 3 August 2011<span class="reference-accessdate">. Retrieved <span class="nowrap">26 July</span> 2017</span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=article&amp;rft.jtitle=The+New+York+Times&amp;rft.atitle=Puff+the+Magic+Preservative%3A+Lasting+Crunch%2C+but+Less+Scent&amp;rft.date=2006-10-25&amp;rft.aulast=Karp&amp;rft.aufirst=David&amp;rft_id=https%3A%2F%2Fwww.nytimes.com%2F2006%2F10%2F25%2Fdining%2F25fruit.html&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-58"><span class="mw-cite-backlink"><b><a href="#cite_ref-58" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFJackson1914" class="citation book cs1">Jackson, H.S. (1914). <a rel="nofollow" class="external text" href="https://archive.org/details/CUbiodiversity628875-8748/page/475">"Powdery Mildew"</a>. In Lowther, Granville; Worthington, William (eds.). <i>The Encyclopedia of Practical Horticulture: A Reference System of Commercial Horticulture, Covering the Practical and Scientific Phases of Horticulture, with Special Reference to Fruits and Vegetables</i>. Vol.&nbsp;I. North Yakima, Washington: The Encyclopedia of Horticulture Corporation. pp.&nbsp;475–476<span class="reference-accessdate">. Retrieved <span class="nowrap">1 August</span> 2024</span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=bookitem&amp;rft.atitle=Powdery+Mildew&amp;rft.btitle=The+Encyclopedia+of+Practical+Horticulture%3A+A+Reference+System+of+Commercial+Horticulture%2C+Covering+the+Practical+and+Scientific+Phases+of+Horticulture%2C+with+Special+Reference+to+Fruits+and+Vegetables&amp;rft.place=North+Yakima%2C+Washington&amp;rft.pages=475-476&amp;rft.pub=The+Encyclopedia+of+Horticulture+Corporation&amp;rft.date=1914&amp;rft.aulast=Jackson&amp;rft.aufirst=H.S.&amp;rft_id=https%3A%2F%2Farchive.org%2Fdetails%2FCUbiodiversity628875-8748%2Fpage%2F475&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-59"><span class="mw-cite-backlink"><b><a href="#cite_ref-59" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFLowtherWorthington1914" class="citation book cs1">Lowther, Granville; Worthington, William, eds. (1914). <a rel="nofollow" class="external text" href="https://archive.org/details/CUbiodiversity628875-8748/page/475"><i>The Encyclopedia of Practical Horticulture: A Reference System of Commercial Horticulture, Covering the Practical and Scientific Phases of Horticulture, with Special Reference to Fruits and Vegetables</i></a>. Vol.&nbsp;I. North Yakima, Washington: The Encyclopedia of Horticulture Corporation. pp.&nbsp;45–51<span class="reference-accessdate">. Retrieved <span class="nowrap">1 August</span> 2024</span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=book&amp;rft.btitle=The+Encyclopedia+of+Practical+Horticulture%3A+A+Reference+System+of+Commercial+Horticulture%2C+Covering+the+Practical+and+Scientific+Phases+of+Horticulture%2C+with+Special+Reference+to+Fruits+and+Vegetables&amp;rft.place=North+Yakima%2C+Washington&amp;rft.pages=45-51&amp;rft.pub=The+Encyclopedia+of+Horticulture+Corporation&amp;rft.date=1914&amp;rft_id=https%3A%2F%2Farchive.org%2Fdetails%2FCUbiodiversity628875-8748%2Fpage%2F475&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-60"><span class="mw-cite-backlink"><b><a href="#cite_ref-60" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFColiLos2003" class="citation book cs1">Coli, William M.; Los, Lorraine M., eds. (2003). <a rel="nofollow" class="external text" href="https://web.archive.org/web/20080212130013/http://www.umass.edu/fruitadvisor/NEAPMG/index.htm">"Insect Pests"</a>. <a rel="nofollow" class="external text" href="http://www.umass.edu/fruitadvisor/NEAPMG/index.htm"><i>2003-2004 New England Apple Pest Management Guide</i></a>. <a href="/wiki/University_of_Massachusetts_Amherst" title="University of Massachusetts Amherst">University of Massachusetts Amherst</a>. pp.&nbsp;28–29. Archived from the original on 12 February 2008<span class="reference-accessdate">. Retrieved <span class="nowrap">3 March</span> 2008</span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=bookitem&amp;rft.atitle=Insect+Pests&amp;rft.btitle=2003-2004+New+England+Apple+Pest+Management+Guide&amp;rft.pages=28-29&amp;rft.pub=University+of+Massachusetts+Amherst&amp;rft.date=2003&amp;rft_id=https%3A%2F%2Fweb.archive.org%2Fweb%2F20070221120428%2Fhttp%3A%2F%2Fwww.umass.edu%2Ffruitadvisor%2FNEAPMG%2F28-46.pdf&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span><span class="cs1-maint citation-comment"><code class="cs1-code">{{<a href="/wiki/Template:Cite_book" title="Template:Cite book">cite book</a>}}</code>:  CS1 maint: bot: original URL status unknown (<a href="/wiki/Category:CS1_maint:_bot:_original_URL_status_unknown" title="Category:CS1 maint: bot: original URL status unknown">link</a>)</span></span>
+</li>
+<li id="cite_note-Bradley-61"><span class="mw-cite-backlink">^ <a href="#cite_ref-Bradley_61-0"><span class="cite-accessibility-label">Jump up to: </span><sup><i><b>a</b></i></sup></a> <a href="#cite_ref-Bradley_61-1"><sup><i><b>b</b></i></sup></a></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFAtthoweGilkesonKiteMichalak2009" class="citation book cs1">Atthowe, Helen; Gilkeson, Linda A.; Kite, L. Patricia; Michalak, Patricia S.; Pleasant, Barbara; Reich, Lee; Scheider, Alfred F. (2009). Bradley, Fern Marshall; Ellis, Bardara W.; Martin, Deborah L. (eds.). <span class="id-lock-limited" title="Free access subject to limited trial, subscription normally required"><a rel="nofollow" class="external text" href="https://archive.org/details/organicgardeners00brad_0/page/32"><i>The Organic Gardener's Handbook of Natural Pest and Disease Control</i></a></span>. New York: <a href="/wiki/Rodale,_Inc." title="Rodale, Inc.">Rodale, Inc.</a> pp.&nbsp;32–34. <a href="/wiki/ISBN_(identifier)" class="mw-redirect" title="ISBN (identifier)">ISBN</a>&nbsp;<a href="/wiki/Special:BookSources/978-1-60529-677-7" title="Special:BookSources/978-1-60529-677-7"><bdi>978-1-60529-677-7</bdi></a>. <a href="/wiki/LCCN_(identifier)" class="mw-redirect" title="LCCN (identifier)">LCCN</a>&nbsp;<a rel="nofollow" class="external text" href="https://lccn.loc.gov/2009039996">2009039996</a>. 
<a href="/wiki/OCLC_(identifier)" class="mw-redirect" title="OCLC (identifier)">OCLC</a>&nbsp;<a rel="nofollow" class="external text" href="https://search.worldcat.org/oclc/419860680">419860680</a>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=book&amp;rft.btitle=The+Organic+Gardener%27s+Handbook+of+Natural+Pest+and+Disease+Control&amp;rft.place=New+York&amp;rft.pages=32-34&amp;rft.pub=Rodale%2C+Inc.&amp;rft.date=2009&amp;rft_id=info%3Aoclcnum%2F419860680&amp;rft_id=info%3Alccn%2F2009039996&amp;rft.isbn=978-1-60529-677-7&amp;rft.aulast=Atthowe&amp;rft.aufirst=Helen&amp;rft.au=Gilkeson%2C+Linda+A.&amp;rft.au=Kite%2C+L.+Patricia&amp;rft.au=Michalak%2C+Patricia+S.&amp;rft.au=Pleasant%2C+Barbara&amp;rft.au=Reich%2C+Lee&amp;rft.au=Scheider%2C+Alfred+F.&amp;rft_id=https%3A%2F%2Farchive.org%2Fdetails%2Forganicgardeners00brad_0%2Fpage%2F32&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-62"><span class="mw-cite-backlink"><b><a href="#cite_ref-62" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFColiBerkettSpitko2003" class="citation book cs1">Coli, William M.; Berkett, Lorraine P.; Spitko, Robin, eds. (2003). <a rel="nofollow" class="external text" href="https://web.archive.org/web/20080212130013/http://www.umass.edu/fruitadvisor/NEAPMG/index.htm">"Other Apple Diseases"</a>. <a rel="nofollow" class="external text" href="http://www.umass.edu/fruitadvisor/NEAPMG/index.htm"><i>2003-2004 New England Apple Pest Management Guide</i></a>. <a href="/wiki/University_of_Massachusetts_Amherst" title="University of Massachusetts Amherst">University of Massachusetts Amherst</a>. pp.&nbsp;19–27. Archived from the original on 12 February 2008<span class="reference-accessdate">. Retrieved <span class="nowrap">3 March</span> 2008</span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=bookitem&amp;rft.atitle=Other+Apple+Diseases&amp;rft.btitle=2003-2004+New+England+Apple+Pest+Management+Guide&amp;rft.pages=19-27&amp;rft.pub=University+of+Massachusetts+Amherst&amp;rft.date=2003&amp;rft_id=https%3A%2F%2Fweb.archive.org%2Fweb%2F20070221120311%2Fhttp%3A%2F%2Fwww.umass.edu%2Ffruitadvisor%2FNEAPMG%2F19-27.pdf&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span><span class="cs1-maint citation-comment"><code class="cs1-code">{{<a href="/wiki/Template:Cite_book" title="Template:Cite book">cite book</a>}}</code>:  CS1 maint: bot: original URL status unknown (<a href="/wiki/Category:CS1_maint:_bot:_original_URL_status_unknown" title="Category:CS1 maint: bot: original URL status unknown">link</a>)</span></span>
+</li>
+<li id="cite_note-63"><span class="mw-cite-backlink"><b><a href="#cite_ref-63" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFMartinKrawczykKhodadadiAćimović2021" class="citation journal cs1">Martin, Phillip L.; Krawczyk, Teresa; Khodadadi, Fatemeh; Aćimović, Srđan G.; Peter, Kari A. (2021). <a rel="nofollow" class="external text" href="https://doi.org/10.1094%2FPHYTO-09-20-0432-R">"Bitter Rot of Apple in the Mid-Atlantic United States: Causal Species and Evaluation of the Impacts of Regional Weather Patterns and Cultivar Susceptibility"</a>. <i><a href="/wiki/Phytopathology_(journal)" class="mw-redirect" title="Phytopathology (journal)">Phytopathology</a></i>. <b>111</b> (6): 966–981. <a href="/wiki/Doi_(identifier)" class="mw-redirect" title="Doi (identifier)">doi</a>:<span class="id-lock-free" title="Freely accessible"><a rel="nofollow" class="external text" href="https://doi.org/10.1094%2FPHYTO-09-20-0432-R">10.1094/PHYTO-09-20-0432-R</a></span>. <a href="/wiki/ISSN_(identifier)" class="mw-redirect" title="ISSN (identifier)">ISSN</a>&nbsp;<a rel="nofollow" class="external text" href="https://search.worldcat.org/issn/0031-949X">0031-949X</a>. <a href="/wiki/PMID_(identifier)" class="mw-redirect" title="PMID (identifier)">PMID</a>&nbsp;<a rel="nofollow" class="external text" href="https://pubmed.ncbi.nlm.nih.gov/33487025">33487025</a>. 
<a href="/wiki/S2CID_(identifier)" class="mw-redirect" title="S2CID (identifier)">S2CID</a>&nbsp;<a rel="nofollow" class="external text" href="https://api.semanticscholar.org/CorpusID:231701083">231701083</a>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=article&amp;rft.jtitle=Phytopathology&amp;rft.atitle=Bitter+Rot+of+Apple+in+the+Mid-Atlantic+United+States%3A+Causal+Species+and+Evaluation+of+the+Impacts+of+Regional+Weather+Patterns+and+Cultivar+Susceptibility&amp;rft.volume=111&amp;rft.issue=6&amp;rft.pages=966-981&amp;rft.date=2021&amp;rft.issn=0031-949X&amp;rft_id=https%3A%2F%2Fapi.semanticscholar.org%2FCorpusID%3A231701083%23id-name%3DS2CID&amp;rft_id=info%3Apmid%2F33487025&amp;rft_id=info%3Adoi%2F10.1094%2FPHYTO-09-20-0432-R&amp;rft.aulast=Martin&amp;rft.aufirst=Phillip+L.&amp;rft.au=Krawczyk%2C+Teresa&amp;rft.au=Khodadadi%2C+Fatemeh&amp;rft.au=A%C4%87imovi%C4%87%2C+Sr%C4%91an+G.&amp;rft.au=Peter%2C+Kari+A.&amp;rft_id=https%3A%2F%2Fdoi.org%2F10.1094%252FPHYTO-09-20-0432-R&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-64"><span class="mw-cite-backlink"><b><a href="#cite_ref-64" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFErler2010" class="citation journal cs1">Erler, Fedai (1 January 2010). <a rel="nofollow" class="external text" href="https://www.ncbi.nlm.nih.gov/pmc/articles/PMC3014806">"Efficacy of tree trunk coating materials in the control of the apple clearwing, Synanthedon myopaeformis"</a>. <i>Journal of Insect Science</i>. <b>10</b> (1): 63. <a href="/wiki/Doi_(identifier)" class="mw-redirect" title="Doi (identifier)">doi</a>:<a rel="nofollow" class="external text" href="https://doi.org/10.1673%2F031.010.6301">10.1673/031.010.6301</a>. <a href="/wiki/PMC_(identifier)" class="mw-redirect" title="PMC (identifier)">PMC</a>&nbsp;<span class="id-lock-free" title="Freely accessible"><a rel="nofollow" class="external text" href="https://www.ncbi.nlm.nih.gov/pmc/articles/PMC3014806">3014806</a></span>. <a href="/wiki/PMID_(identifier)" class="mw-redirect" title="PMID (identifier)">PMID</a>&nbsp;<a rel="nofollow" class="external text" href="https://pubmed.ncbi.nlm.nih.gov/20672979">20672979</a>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=article&amp;rft.jtitle=Journal+of+Insect+Science&amp;rft.atitle=Efficacy+of+tree+trunk+coating+materials+in+the+control+of+the+apple+clearwing%2C+Synanthedon+myopaeformis&amp;rft.volume=10&amp;rft.issue=1&amp;rft.pages=63&amp;rft.date=2010-01-01&amp;rft_id=https%3A%2F%2Fwww.ncbi.nlm.nih.gov%2Fpmc%2Farticles%2FPMC3014806%23id-name%3DPMC&amp;rft_id=info%3Apmid%2F20672979&amp;rft_id=info%3Adoi%2F10.1673%2F031.010.6301&amp;rft.aulast=Erler&amp;rft.aufirst=Fedai&amp;rft_id=https%3A%2F%2Fwww.ncbi.nlm.nih.gov%2Fpmc%2Farticles%2FPMC3014806&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-65"><span class="mw-cite-backlink"><b><a href="#cite_ref-65" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFElzebroekWind2008" class="citation book cs1">Elzebroek, A. T. G.; Wind, Koop (2008). <a rel="nofollow" class="external text" href="https://books.google.com/books?id=YvU1XnUVxFQC&amp;q=apple%20cultivars%207%2C500&amp;pg=PT39"><i>Guide to Cultivated Plants</i></a>. Wallingford, United Kingdom: <a href="/wiki/CAB_International" title="CAB International">CABI</a>. p.&nbsp;27. <a href="/wiki/ISBN_(identifier)" class="mw-redirect" title="ISBN (identifier)">ISBN</a>&nbsp;<a href="/wiki/Special:BookSources/978-1-84593-356-2" title="Special:BookSources/978-1-84593-356-2"><bdi>978-1-84593-356-2</bdi></a>. <a href="/wiki/LCCN_(identifier)" class="mw-redirect" title="LCCN (identifier)">LCCN</a>&nbsp;<a rel="nofollow" class="external text" href="https://lccn.loc.gov/2007028459">2007028459</a>. <a href="/wiki/OCLC_(identifier)" class="mw-redirect" title="OCLC (identifier)">OCLC</a>&nbsp;<a rel="nofollow" class="external text" href="https://search.worldcat.org/oclc/156975183">156975183</a>. <a rel="nofollow" class="external text" href="https://web.archive.org/web/20201020231604/https://books.google.com/books?id=YvU1XnUVxFQC&amp;q=apple%20cultivars%207,500&amp;pg=PT39">Archived</a> from the original on 20 October 2020<span class="reference-accessdate">. 
Retrieved <span class="nowrap">6 October</span> 2020</span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=book&amp;rft.btitle=Guide+to+Cultivated+Plants&amp;rft.place=Wallingford%2C+United+Kingdom&amp;rft.pages=27&amp;rft.pub=CABI&amp;rft.date=2008&amp;rft_id=info%3Aoclcnum%2F156975183&amp;rft_id=info%3Alccn%2F2007028459&amp;rft.isbn=978-1-84593-356-2&amp;rft.aulast=Elzebroek&amp;rft.aufirst=A.+T.+G.&amp;rft.au=Wind%2C+Koop&amp;rft_id=https%3A%2F%2Fbooks.google.com%2Fbooks%3Fid%3DYvU1XnUVxFQC%26q%3Dapple%2520cultivars%25207%252C500%26pg%3DPT39&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-England-66"><span class="mw-cite-backlink">^ <a href="#cite_ref-England_66-0"><span class="cite-accessibility-label">Jump up to: </span><sup><i><b>a</b></i></sup></a> <a href="#cite_ref-England_66-1"><sup><i><b>b</b></i></sup></a></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite class="citation web cs1"><a rel="nofollow" class="external text" href="https://web.archive.org/web/20080512000735/http://www.plantpress.com/wildlife/o523-apple.php">"Apple – <i>Malus domestica</i>"</a>. <a href="/wiki/Natural_England" title="Natural England">Natural England</a>. Archived from <a rel="nofollow" class="external text" href="http://www.plantpress.com/wildlife/o523-apple.php">the original</a> on 12 May 2008<span class="reference-accessdate">. Retrieved <span class="nowrap">22 January</span> 2008</span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=unknown&amp;rft.btitle=Apple+%E2%80%93+Malus+domestica&amp;rft.pub=Natural+England&amp;rft_id=http%3A%2F%2Fwww.plantpress.com%2Fwildlife%2Fo523-apple.php&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-67"><span class="mw-cite-backlink"><b><a href="#cite_ref-67" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite class="citation web cs1"><a rel="nofollow" class="external text" href="http://www.nationalfruitcollection.org.uk/index.php">"Home"</a>. <i><a href="/wiki/National_Fruit_Collection" title="National Fruit Collection">National Fruit Collection</a></i>. <a rel="nofollow" class="external text" href="https://web.archive.org/web/20120615145659/http://www.nationalfruitcollection.org.uk/index.php">Archived</a> from the original on 15 June 2012<span class="reference-accessdate">. Retrieved <span class="nowrap">2 December</span> 2012</span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=unknown&amp;rft.jtitle=National+Fruit+Collection&amp;rft.atitle=Home&amp;rft_id=http%3A%2F%2Fwww.nationalfruitcollection.org.uk%2Findex.php&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-68"><span class="mw-cite-backlink"><b><a href="#cite_ref-68" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite class="citation web cs1"><a rel="nofollow" class="external text" href="https://web.archive.org/web/20140826114504/http://www.ecpgr.cgiar.org/index.php?id=2501&amp;tx_wfqbe_pi1%5Buid&amp;">"ECPGR Malus/Pyrus Working Group Members"</a>. <i>Ecpgr.cgiar.org</i>. 22 July 2002. Archived from <a rel="nofollow" class="external text" href="http://www.ecpgr.cgiar.org/index.php?id=2501&amp;tx_wfqbe_pi1%5Buid%5D=59">the original</a> on 26 August 2014<span class="reference-accessdate">. Retrieved <span class="nowrap">25 August</span> 2014</span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=unknown&amp;rft.jtitle=Ecpgr.cgiar.org&amp;rft.atitle=ECPGR+Malus%2FPyrus+Working+Group+Members&amp;rft.date=2002-07-22&amp;rft_id=http%3A%2F%2Fwww.ecpgr.cgiar.org%2Findex.php%3Fid%3D2501%26tx_wfqbe_pi1%26%2391%3Buid%26%2393%3B%3D59&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-apples1-69"><span class="mw-cite-backlink">^ <a href="#cite_ref-apples1_69-0"><span class="cite-accessibility-label">Jump up to: </span><sup><i><b>a</b></i></sup></a> <a href="#cite_ref-apples1_69-1"><sup><i><b>b</b></i></sup></a></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFTarjan,_Sue2006" class="citation web cs1">Tarjan, Sue (Fall 2006). <a rel="nofollow" class="external text" href="https://web.archive.org/web/20070811154017/http://casfs.ucsc.edu/publications/news%20and%20notes/Fall_06_N%26N.pdf">"Autumn Apple Musings"</a> <span class="cs1-format">(PDF)</span>. News &amp; Notes of the UCSC Farm &amp; Garden, Center for Agroecology &amp; Sustainable Food Systems. pp.&nbsp;1–2. Archived from <a rel="nofollow" class="external text" href="http://casfs.ucsc.edu/publications/news%20and%20notes/Fall_06_N&amp;N.pdf">the original</a> <span class="cs1-format">(PDF)</span> on 11 August 2007<span class="reference-accessdate">. Retrieved <span class="nowrap">24 January</span> 2008</span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=unknown&amp;rft.btitle=Autumn+Apple+Musings&amp;rft.pages=1-2&amp;rft.pub=News+%26+Notes+of+the+UCSC+Farm+%26+Garden%2C+Center+for+Agroecology+%26+Sustainable+Food+Systems&amp;rft.date=2006&amp;rft.au=Tarjan%2C+Sue&amp;rft_id=http%3A%2F%2Fcasfs.ucsc.edu%2Fpublications%2Fnews%2520and%2520notes%2FFall_06_N%26N.pdf&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-70"><span class="mw-cite-backlink"><b><a href="#cite_ref-70" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFBeck2020" class="citation news cs1">Beck, Kellen (17 October 2020). <a rel="nofollow" class="external text" href="https://mashable.com/article/apple-breeding">"How breeders bring out the best in new apples"</a>. <i>Mashable</i>. <a rel="nofollow" class="external text" href="https://web.archive.org/web/20240731195019/https://mashable.com/article/apple-breeding">Archived</a> from the original on 31 July 2024<span class="reference-accessdate">. Retrieved <span class="nowrap">31 July</span> 2024</span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=article&amp;rft.jtitle=Mashable&amp;rft.atitle=How+breeders+bring+out+the+best+in+new+apples&amp;rft.date=2020-10-17&amp;rft.aulast=Beck&amp;rft.aufirst=Kellen&amp;rft_id=https%3A%2F%2Fmashable.com%2Farticle%2Fapple-breeding&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-71"><span class="mw-cite-backlink"><b><a href="#cite_ref-71" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFMigicovsky2021" class="citation news cs1">Migicovsky, Zoë (22 August 2021). <a rel="nofollow" class="external text" href="https://theconversation.com/how-a-few-good-apples-spawned-todays-top-varieties-and-why-breeders-must-branch-out-164538">"How a few good apples spawned today's top varieties — and why breeders must branch out"</a>. <i>The Conversation</i>. <a rel="nofollow" class="external text" href="https://web.archive.org/web/20240731195017/https://theconversation.com/how-a-few-good-apples-spawned-todays-top-varieties-and-why-breeders-must-branch-out-164538">Archived</a> from the original on 31 July 2024<span class="reference-accessdate">. Retrieved <span class="nowrap">31 July</span> 2024</span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=article&amp;rft.jtitle=The+Conversation&amp;rft.atitle=How+a+few+good+apples+spawned+today%27s+top+varieties+%E2%80%94+and+why+breeders+must+branch+out&amp;rft.date=2021-08-22&amp;rft.aulast=Migicovsky&amp;rft.aufirst=Zo%C3%AB&amp;rft_id=https%3A%2F%2Ftheconversation.com%2Fhow-a-few-good-apples-spawned-todays-top-varieties-and-why-breeders-must-branch-out-164538&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-72"><span class="mw-cite-backlink"><b><a href="#cite_ref-72" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFPeilDunemannRichterHoefer2008" class="citation journal cs1 cs1-prop-foreign-lang-source">Peil, A.; Dunemann, F.; Richter, K.; Hoefer, M.; Király, I.; Flachowsky, H.; Hanke, M.-V. (2008). <a rel="nofollow" class="external text" href="http://orgprints.org/13698/">"Resistance Breeding in Apple at Dresden-Pillnitz"</a>. <i>Ecofruit - 13th International Conference on Cultivation Technique and Phytopathological Problems in Organic Fruit-Growing: Proceedings to the Conference from 18thFebruary to 20th February 2008 at Weinsberg/Germany</i> (in German): 220–225. <a rel="nofollow" class="external text" href="https://web.archive.org/web/20210128124933/https://orgprints.org/13698/">Archived</a> from the original on 28 January 2021<span class="reference-accessdate">. Retrieved <span class="nowrap">31 July</span> 2024</span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=article&amp;rft.jtitle=Ecofruit+-+13th+International+Conference+on+Cultivation+Technique+and+Phytopathological+Problems+in+Organic+Fruit-Growing%3A+Proceedings+to+the+Conference+from+18thFebruary+to+20th+February+2008+at+Weinsberg%2FGermany&amp;rft.atitle=Resistance+Breeding+in+Apple+at+Dresden-Pillnitz&amp;rft.pages=220-225&amp;rft.date=2008&amp;rft.aulast=Peil&amp;rft.aufirst=A.&amp;rft.au=Dunemann%2C+F.&amp;rft.au=Richter%2C+K.&amp;rft.au=Hoefer%2C+M.&amp;rft.au=Kir%C3%A1ly%2C+I.&amp;rft.au=Flachowsky%2C+H.&amp;rft.au=Hanke%2C+M.-V.&amp;rft_id=http%3A%2F%2Forgprints.org%2F13698%2F&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-World-73"><span class="mw-cite-backlink">^ <a href="#cite_ref-World_73-0"><span class="cite-accessibility-label">Jump up to: </span><sup><i><b>a</b></i></sup></a> <a href="#cite_ref-World_73-1"><sup><i><b>b</b></i></sup></a></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite class="citation web cs1"><a rel="nofollow" class="external text" href="https://web.archive.org/web/20080211120700/http://www.fas.usda.gov/htp2/circular/1998/98-03/applefea.html">"World apple situation"</a>. Archived from <a rel="nofollow" class="external text" href="https://www.fas.usda.gov/htp2/circular/1998/98-03/applefea.html">the original</a> on 11 February 2008<span class="reference-accessdate">. Retrieved <span class="nowrap">24 January</span> 2008</span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=unknown&amp;rft.btitle=World+apple+situation&amp;rft_id=http%3A%2F%2Fwww.fas.usda.gov%2Fhtp2%2Fcircular%2F1998%2F98-03%2Fapplefea.html&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-Hobby_Farms_Mag.-74"><span class="mw-cite-backlink"><b><a href="#cite_ref-Hobby_Farms_Mag._74-0" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFWeaver2003" class="citation magazine cs1">Weaver, Sue (June–July 2003). <a rel="nofollow" class="external text" href="http://www.hobbyfarms.com/apples-of-antiquity-3/">"Crops &amp; Gardening – Apples of Antiquity"</a>. <i>Hobby Farms Magazine</i>. <a rel="nofollow" class="external text" href="https://web.archive.org/web/20170219090902/http://www.hobbyfarms.com/apples-of-antiquity-3/">Archived</a> from the original on 19 February 2017.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=article&amp;rft.jtitle=Hobby+Farms+Magazine&amp;rft.atitle=Crops+%26+Gardening+%E2%80%93+Apples+of+Antiquity&amp;rft.date=2003-06%2F2003-07&amp;rft.aulast=Weaver&amp;rft.aufirst=Sue&amp;rft_id=http%3A%2F%2Fwww.hobbyfarms.com%2Fapples-of-antiquity-3%2F&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-faostat-75"><span class="mw-cite-backlink">^ <a href="#cite_ref-faostat_75-0"><span class="cite-accessibility-label">Jump up to: </span><sup><i><b>a</b></i></sup></a> <a href="#cite_ref-faostat_75-1"><sup><i><b>b</b></i></sup></a> <a href="#cite_ref-faostat_75-2"><sup><i><b>c</b></i></sup></a></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite class="citation web cs1"><a rel="nofollow" class="external text" href="http://www.fao.org/faostat/en/#data/QC">"Apple production in 2022; from pick lists: Crops/World Regions/Production Quantity"</a>. FAOSTAT, UN <a href="/wiki/Food_and_Agriculture_Organization" title="Food and Agriculture Organization">Food and Agriculture Organization</a>, Statistics Division. 2024. <a rel="nofollow" class="external text" href="https://web.archive.org/web/20161112130804/http://www.fao.org/faostat/en/#data/QC">Archived</a> from the original on 12 November 2016<span class="reference-accessdate">. Retrieved <span class="nowrap">18 June</span> 2024</span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=unknown&amp;rft.btitle=Apple+production+in+2022%3B+from+pick+lists%3A+Crops%2FWorld+Regions%2FProduction+Quantity&amp;rft.pub=FAOSTAT%2C+UN+Food+and+Agriculture+Organization%2C+Statistics+Division&amp;rft.date=2024&amp;rft_id=http%3A%2F%2Fwww.fao.org%2Ffaostat%2Fen%2F%23data%2FQC&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-76"><span class="mw-cite-backlink"><b><a href="#cite_ref-76" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFNelsonShihBalick2007" class="citation book cs1">Nelson, Lewis S.; Shih, Richard D.; <a href="/wiki/Michael_Jeffrey_Balick" title="Michael Jeffrey Balick">Balick, Michael J.</a> (2007). <span class="id-lock-registration" title="Free registration required"><a rel="nofollow" class="external text" href="https://archive.org/details/handbookofpoison0000nels/page/211"><i>Handbook of Poisonous and Injurious Plants</i></a></span> (Second&nbsp;ed.). New York: <a href="/wiki/New_York_Botanical_Garden" title="New York Botanical Garden">New York Botanical Garden</a>&nbsp;: <a href="/wiki/Springer_Publishing" title="Springer Publishing">Springer</a>. pp.&nbsp;27, 211–212. <a href="/wiki/ISBN_(identifier)" class="mw-redirect" title="ISBN (identifier)">ISBN</a>&nbsp;<a href="/wiki/Special:BookSources/978-0387-31268-2" title="Special:BookSources/978-0387-31268-2"><bdi>978-0387-31268-2</bdi></a>. <a href="/wiki/LCCN_(identifier)" class="mw-redirect" title="LCCN (identifier)">LCCN</a>&nbsp;<a rel="nofollow" class="external text" href="https://lccn.loc.gov/2005938815">2005938815</a>. <a href="/wiki/OCLC_(identifier)" class="mw-redirect" title="OCLC (identifier)">OCLC</a>&nbsp;<a rel="nofollow" class="external text" href="https://search.worldcat.org/oclc/77537459">77537459</a><span class="reference-accessdate">. 
Retrieved <span class="nowrap">11 September</span> 2024</span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=book&amp;rft.btitle=Handbook+of+Poisonous+and+Injurious+Plants&amp;rft.place=New+York&amp;rft.pages=27%2C+211-212&amp;rft.edition=Second&amp;rft.pub=New+York+Botanical+Garden+%3A+Springer&amp;rft.date=2007&amp;rft_id=info%3Aoclcnum%2F77537459&amp;rft_id=info%3Alccn%2F2005938815&amp;rft.isbn=978-0387-31268-2&amp;rft.aulast=Nelson&amp;rft.aufirst=Lewis+S.&amp;rft.au=Shih%2C+Richard+D.&amp;rft.au=Balick%2C+Michael+J.&amp;rft_id=https%3A%2F%2Farchive.org%2Fdetails%2Fhandbookofpoison0000nels%2Fpage%2F211&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-77"><span class="mw-cite-backlink"><b><a href="#cite_ref-77" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite class="citation web cs1"><a rel="nofollow" class="external text" href="https://toxnet.nlm.nih.gov/cgi-bin/sis/search/a?dbs+hsdb:@term+@DOCNO+3559">"Amygdalin"</a>. Toxnet, US Library of Medicine. <a rel="nofollow" class="external text" href="https://web.archive.org/web/20170421094516/https://toxnet.nlm.nih.gov/cgi-bin/sis/search/a?dbs+hsdb:@term+@DOCNO+3559">Archived</a> from the original on 21 April 2017<span class="reference-accessdate">. Retrieved <span class="nowrap">20 April</span> 2017</span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=unknown&amp;rft.btitle=Amygdalin&amp;rft.pub=Toxnet%2C+US+Library+of+Medicine&amp;rft_id=https%3A%2F%2Ftoxnet.nlm.nih.gov%2Fcgi-bin%2Fsis%2Fsearch%2Fa%3Fdbs%2Bhsdb%3A%40term%2B%40DOCNO%2B3559&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-EU-78"><span class="mw-cite-backlink">^ <a href="#cite_ref-EU_78-0"><span class="cite-accessibility-label">Jump up to: </span><sup><i><b>a</b></i></sup></a> <a href="#cite_ref-EU_78-1"><sup><i><b>b</b></i></sup></a> <a href="#cite_ref-EU_78-2"><sup><i><b>c</b></i></sup></a> <a href="#cite_ref-EU_78-3"><sup><i><b>d</b></i></sup></a> <a href="#cite_ref-EU_78-4"><sup><i><b>e</b></i></sup></a> <a href="#cite_ref-EU_78-5"><sup><i><b>f</b></i></sup></a></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite class="citation web cs1"><a rel="nofollow" class="external text" href="https://web.archive.org/web/20120723201454/http://foodallergens.ifr.ac.uk/food.lasso?selected_food=2">"General Information – Apple"</a>. Informall. Archived from <a rel="nofollow" class="external text" href="http://foodallergens.ifr.ac.uk/food.lasso?selected_food=2#summary">the original</a> on 23 July 2012<span class="reference-accessdate">. Retrieved <span class="nowrap">17 October</span> 2011</span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=unknown&amp;rft.btitle=General+Information+%E2%80%93+Apple&amp;rft.pub=Informall&amp;rft_id=http%3A%2F%2Ffoodallergens.ifr.ac.uk%2Ffood.lasso%3Fselected_food%3D2%23summary&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-79"><span class="mw-cite-backlink"><b><a href="#cite_ref-79" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text">Landau, Elizabeth, <a rel="nofollow" class="external text" href="https://www.cnn.com/2009/HEALTH/04/08/oral.allergy.syndrome/index.html">Oral allergy syndrome may explain mysterious reactions</a>, 8 April 2009, <i>CNN Health</i>, accessed 17 October 2011</span>
+</li>
+<li id="cite_note-FDADailyValues-80"><span class="mw-cite-backlink"><b><a href="#cite_ref-FDADailyValues_80-0" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFUnited_States_Food_and_Drug_Administration2024" class="citation web cs1"><a href="/wiki/Food_and_Drug_Administration" title="Food and Drug Administration">United States Food and Drug Administration</a> (2024). <a rel="nofollow" class="external text" href="https://www.fda.gov/food/nutrition-facts-label/daily-value-nutrition-and-supplement-facts-labels">"Daily Value on the Nutrition and Supplement Facts Labels"</a>. <i>FDA</i>. <a rel="nofollow" class="external text" href="https://web.archive.org/web/20240327175201/https://www.fda.gov/food/nutrition-facts-label/daily-value-nutrition-and-supplement-facts-labels">Archived</a> from the original on 27 March 2024<span class="reference-accessdate">. Retrieved <span class="nowrap">28 March</span> 2024</span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=unknown&amp;rft.jtitle=FDA&amp;rft.atitle=Daily+Value+on+the+Nutrition+and+Supplement+Facts+Labels&amp;rft.date=2024&amp;rft.au=United+States+Food+and+Drug+Administration&amp;rft_id=https%3A%2F%2Fwww.fda.gov%2Ffood%2Fnutrition-facts-label%2Fdaily-value-nutrition-and-supplement-facts-labels&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-NationalAcademiesPotassium-81"><span class="mw-cite-backlink"><b><a href="#cite_ref-NationalAcademiesPotassium_81-0" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFNational_Academies_of_Sciences,_Engineering,_and_MedicineHealth_and_Medicine_DivisionFood_and_Nutrition_BoardCommittee_to_Review_the_Dietary_Reference_Intakes_for_Sodium_and_Potassium2019" class="citation book cs1">National Academies of Sciences, Engineering, and Medicine; Health and Medicine Division; Food and Nutrition Board; Committee to Review the Dietary Reference Intakes for Sodium and Potassium (2019). Oria, Maria; Harrison, Meghan; Stallings, Virginia A. (eds.). <a rel="nofollow" class="external text" href="http://www.ncbi.nlm.nih.gov/books/NBK538102/"><i>Dietary Reference Intakes for Sodium and Potassium</i></a>. The National Academies Collection: Reports funded by National Institutes of Health. Washington, DC: National Academies Press (US). <a href="/wiki/ISBN_(identifier)" class="mw-redirect" title="ISBN (identifier)">ISBN</a>&nbsp;<a href="/wiki/Special:BookSources/978-0-309-48834-1" title="Special:BookSources/978-0-309-48834-1"><bdi>978-0-309-48834-1</bdi></a>. <a href="/wiki/PMID_(identifier)" class="mw-redirect" title="PMID (identifier)">PMID</a>&nbsp;<a rel="nofollow" class="external text" href="https://pubmed.ncbi.nlm.nih.gov/30844154">30844154</a>. <a rel="nofollow" class="external text" href="https://web.archive.org/web/20240509063633/https://www.ncbi.nlm.nih.gov/books/NBK538102/">Archived</a> from the original on 9 May 2024<span class="reference-accessdate">. 
Retrieved <span class="nowrap">21 June</span> 2024</span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=book&amp;rft.btitle=Dietary+Reference+Intakes+for+Sodium+and+Potassium&amp;rft.place=Washington%2C+DC&amp;rft.series=The+National+Academies+Collection%3A+Reports+funded+by+National+Institutes+of+Health&amp;rft.pub=National+Academies+Press+%28US%29&amp;rft.date=2019&amp;rft_id=info%3Apmid%2F30844154&amp;rft.isbn=978-0-309-48834-1&amp;rft.au=National+Academies+of+Sciences%2C+Engineering%2C+and+Medicine&amp;rft.au=Health+and+Medicine+Division&amp;rft.au=Food+and+Nutrition+Board&amp;rft.au=Committee+to+Review+the+Dietary+Reference+Intakes+for+Sodium+and+Potassium&amp;rft_id=http%3A%2F%2Fwww.ncbi.nlm.nih.gov%2Fbooks%2FNBK538102%2F&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-Davidson_2014-82"><span class="mw-cite-backlink">^ <a href="#cite_ref-Davidson_2014_82-0"><span class="cite-accessibility-label">Jump up to: </span><sup><i><b>a</b></i></sup></a> <a href="#cite_ref-Davidson_2014_82-1"><sup><i><b>b</b></i></sup></a> <a href="#cite_ref-Davidson_2014_82-2"><sup><i><b>c</b></i></sup></a> <a href="#cite_ref-Davidson_2014_82-3"><sup><i><b>d</b></i></sup></a></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFDavidson2014" class="citation book cs1"><a href="/wiki/Alan_Davidson_(food_writer)" title="Alan Davidson (food writer)">Davidson, Alan</a> (2014). <span class="id-lock-registration" title="Free registration required"><a rel="nofollow" class="external text" href="https://archive.org/details/oxfordcompaniont0000davi_w2w6/page/27">"Apple"</a></span>. In <a href="/wiki/Tom_Jaine" title="Tom Jaine">Jaine, Tom</a> (ed.). <i><a href="/wiki/The_Oxford_Companion_to_Food" title="The Oxford Companion to Food">The Oxford Companion to Food</a></i>. Illustrated by Soun Vannithone (Third&nbsp;ed.). Oxford: <a href="/wiki/Oxford_University_Press" title="Oxford University Press">Oxford University Press</a>. pp.&nbsp;27–31. <a href="/wiki/ISBN_(identifier)" class="mw-redirect" title="ISBN (identifier)">ISBN</a>&nbsp;<a href="/wiki/Special:BookSources/978-0-19-967733-7" title="Special:BookSources/978-0-19-967733-7"><bdi>978-0-19-967733-7</bdi></a>. <a href="/wiki/LCCN_(identifier)" class="mw-redirect" title="LCCN (identifier)">LCCN</a>&nbsp;<a rel="nofollow" class="external text" href="https://lccn.loc.gov/2013957569">2013957569</a>. <a href="/wiki/OCLC_(identifier)" class="mw-redirect" title="OCLC (identifier)">OCLC</a>&nbsp;<a rel="nofollow" class="external text" href="https://search.worldcat.org/oclc/890807357">890807357</a>. 
<a href="/wiki/OL_(identifier)" class="mw-redirect" title="OL (identifier)">OL</a>&nbsp;<a rel="nofollow" class="external text" href="https://openlibrary.org/books/OL27172691M">27172691M</a><span class="reference-accessdate">. Retrieved <span class="nowrap">18 September</span> 2024</span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=bookitem&amp;rft.atitle=Apple&amp;rft.btitle=The+Oxford+Companion+to+Food&amp;rft.place=Oxford&amp;rft.pages=27-31&amp;rft.edition=Third&amp;rft.pub=Oxford+University+Press&amp;rft.date=2014&amp;rft_id=info%3Aoclcnum%2F890807357&amp;rft_id=info%3Alccn%2F2013957569&amp;rft_id=https%3A%2F%2Fopenlibrary.org%2Fbooks%2FOL27172691M%23id-name%3DOL&amp;rft.isbn=978-0-19-967733-7&amp;rft.aulast=Davidson&amp;rft.aufirst=Alan&amp;rft_id=https%3A%2F%2Farchive.org%2Fdetails%2Foxfordcompaniont0000davi_w2w6%2Fpage%2F27&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-83"><span class="mw-cite-backlink"><b><a href="#cite_ref-83" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFTraverso2011" class="citation book cs1">Traverso, Amy (2011). <span class="id-lock-limited" title="Free access subject to limited trial, subscription normally required"><a rel="nofollow" class="external text" href="https://archive.org/details/appleloverscookb0000trav"><i>The Apple Lover's Cookbook</i></a></span>. Photographs by Squire Fox (First&nbsp;ed.). New York: <a href="/wiki/W.W._Norton_%26_Company" class="mw-redirect" title="W.W. Norton &amp; Company">W.W. Norton &amp; Company</a>. pp.&nbsp;16, 32, 35, 45, 92, 137, 262–263, 275. <a href="/wiki/ISBN_(identifier)" class="mw-redirect" title="ISBN (identifier)">ISBN</a>&nbsp;<a href="/wiki/Special:BookSources/978-0-393-06599-2" title="Special:BookSources/978-0-393-06599-2"><bdi>978-0-393-06599-2</bdi></a>. <a href="/wiki/LCCN_(identifier)" class="mw-redirect" title="LCCN (identifier)">LCCN</a>&nbsp;<a rel="nofollow" class="external text" href="https://lccn.loc.gov/2011016560">2011016560</a>. <a href="/wiki/OCLC_(identifier)" class="mw-redirect" title="OCLC (identifier)">OCLC</a>&nbsp;<a rel="nofollow" class="external text" href="https://search.worldcat.org/oclc/711051767">711051767</a>. 
<a href="/wiki/OL_(identifier)" class="mw-redirect" title="OL (identifier)">OL</a>&nbsp;<a rel="nofollow" class="external text" href="https://openlibrary.org/works/OL16450839W">16450839W</a>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=book&amp;rft.btitle=The+Apple+Lover%27s+Cookbook&amp;rft.place=New+York&amp;rft.pages=16%2C+32%2C+35%2C+45%2C+92%2C+137%2C+262-263%2C+275&amp;rft.edition=First&amp;rft.pub=W.W.+Norton+%26+Company&amp;rft.date=2011&amp;rft_id=info%3Aoclcnum%2F711051767&amp;rft_id=info%3Alccn%2F2011016560&amp;rft_id=https%3A%2F%2Fopenlibrary.org%2Fworks%2FOL16450839W%23id-name%3DOL&amp;rft.isbn=978-0-393-06599-2&amp;rft.aulast=Traverso&amp;rft.aufirst=Amy&amp;rft_id=https%3A%2F%2Farchive.org%2Fdetails%2Fappleloverscookb0000trav&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-84"><span class="mw-cite-backlink"><b><a href="#cite_ref-84" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFKellogg2015" class="citation web cs1">Kellogg, Kristi (15 January 2015). <a rel="nofollow" class="external text" href="https://www.epicurious.com/ingredients/apple-of-my-eye-gallery">"81 Best Apple Recipes: Dinners, Desserts, Salads, and More"</a>. <i>Epicurious</i>. <a rel="nofollow" class="external text" href="https://web.archive.org/web/20201018215038/https://www.epicurious.com/ingredients/apple-of-my-eye-gallery">Archived</a> from the original on 18 October 2020<span class="reference-accessdate">. Retrieved <span class="nowrap">17 October</span> 2020</span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=unknown&amp;rft.jtitle=Epicurious&amp;rft.atitle=81+Best+Apple+Recipes%3A+Dinners%2C+Desserts%2C+Salads%2C+and+More&amp;rft.date=2015-01-15&amp;rft.aulast=Kellogg&amp;rft.aufirst=Kristi&amp;rft_id=https%3A%2F%2Fwww.epicurious.com%2Fingredients%2Fapple-of-my-eye-gallery&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-85"><span class="mw-cite-backlink"><b><a href="#cite_ref-85" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFDavidson2014" class="citation book cs1"><a href="/wiki/Alan_Davidson_(food_writer)" title="Alan Davidson (food writer)">Davidson, Alan</a> (2014). <span class="id-lock-registration" title="Free registration required"><a rel="nofollow" class="external text" href="https://archive.org/details/oxfordcompaniont0000davi_w2w6/page/824/">"Toffee Apple"</a></span>. In <a href="/wiki/Tom_Jaine" title="Tom Jaine">Jaine, Tom</a> (ed.). <i><a href="/wiki/The_Oxford_Companion_to_Food" title="The Oxford Companion to Food">The Oxford Companion to Food</a></i>. Illustrated by Soun Vannithone (Third&nbsp;ed.). Oxford: <a href="/wiki/Oxford_University_Press" title="Oxford University Press">Oxford University Press</a>. p.&nbsp;824. <a href="/wiki/ISBN_(identifier)" class="mw-redirect" title="ISBN (identifier)">ISBN</a>&nbsp;<a href="/wiki/Special:BookSources/978-0-19-967733-7" title="Special:BookSources/978-0-19-967733-7"><bdi>978-0-19-967733-7</bdi></a>. <a href="/wiki/LCCN_(identifier)" class="mw-redirect" title="LCCN (identifier)">LCCN</a>&nbsp;<a rel="nofollow" class="external text" href="https://lccn.loc.gov/2013957569">2013957569</a>. <a href="/wiki/OCLC_(identifier)" class="mw-redirect" title="OCLC (identifier)">OCLC</a>&nbsp;<a rel="nofollow" class="external text" href="https://search.worldcat.org/oclc/890807357">890807357</a>. <a href="/wiki/OL_(identifier)" class="mw-redirect" title="OL (identifier)">OL</a>&nbsp;<a rel="nofollow" class="external text" href="https://openlibrary.org/books/OL27172691M">27172691M</a><span class="reference-accessdate">. 
Retrieved <span class="nowrap">18 September</span> 2024</span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=bookitem&amp;rft.atitle=Toffee+Apple&amp;rft.btitle=The+Oxford+Companion+to+Food&amp;rft.place=Oxford&amp;rft.pages=824&amp;rft.edition=Third&amp;rft.pub=Oxford+University+Press&amp;rft.date=2014&amp;rft_id=info%3Aoclcnum%2F890807357&amp;rft_id=info%3Alccn%2F2013957569&amp;rft_id=https%3A%2F%2Fopenlibrary.org%2Fbooks%2FOL27172691M%23id-name%3DOL&amp;rft.isbn=978-0-19-967733-7&amp;rft.aulast=Davidson&amp;rft.aufirst=Alan&amp;rft_id=https%3A%2F%2Farchive.org%2Fdetails%2Foxfordcompaniont0000davi_w2w6%2Fpage%2F824%2F&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-86"><span class="mw-cite-backlink"><b><a href="#cite_ref-86" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFShurpin" class="citation web cs1">Shurpin, Yehuda. <a rel="nofollow" class="external text" href="https://www.chabad.org/library/article_cdo/aid/3053586/jewish/Why-All-the-Symbolic-Rosh-Hashanah-Foods.htm">"Why All the Symbolic Rosh Hashanah Foods? "בולבול"<span class="cs1-kern-right"></span>"</a>. <i>Chabad.org</i>. <a rel="nofollow" class="external text" href="https://web.archive.org/web/20230321154816/https://www.chabad.org/library/article_cdo/aid/3053586/jewish/Why-All-the-Symbolic-Rosh-Hashanah-Foods.htm">Archived</a> from the original on 21 March 2023<span class="reference-accessdate">. Retrieved <span class="nowrap">21 March</span> 2023</span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=unknown&amp;rft.jtitle=Chabad.org&amp;rft.atitle=Why+All+the+Symbolic+Rosh+Hashanah+Foods%3F+%22%D7%91%D7%95%D7%9C%D7%91%D7%95%D7%9C%22&amp;rft.aulast=Shurpin&amp;rft.aufirst=Yehuda&amp;rft_id=https%3A%2F%2Fwww.chabad.org%2Flibrary%2Farticle_cdo%2Faid%2F3053586%2Fjewish%2FWhy-All-the-Symbolic-Rosh-Hashanah-Foods.htm&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-87"><span class="mw-cite-backlink"><b><a href="#cite_ref-87" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFYepsen2017" class="citation book cs1">Yepsen, Roger B. (2017) [1994]. <i>Apples</i> (Revised and Updated&nbsp;ed.). New York: W.W. Norton &amp; Company. p.&nbsp;52. <a href="/wiki/ISBN_(identifier)" class="mw-redirect" title="ISBN (identifier)">ISBN</a>&nbsp;<a href="/wiki/Special:BookSources/978-1-68268-019-3" title="Special:BookSources/978-1-68268-019-3"><bdi>978-1-68268-019-3</bdi></a>. <a href="/wiki/LCCN_(identifier)" class="mw-redirect" title="LCCN (identifier)">LCCN</a>&nbsp;<a rel="nofollow" class="external text" href="https://lccn.loc.gov/2017010136">2017010136</a>. <a href="/wiki/OCLC_(identifier)" class="mw-redirect" title="OCLC (identifier)">OCLC</a>&nbsp;<a rel="nofollow" class="external text" href="https://search.worldcat.org/oclc/973918728">973918728</a>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=book&amp;rft.btitle=Apples&amp;rft.place=New+York&amp;rft.pages=52&amp;rft.edition=Revised+and+Updated&amp;rft.pub=W.W.+Norton+%26+Company&amp;rft.date=2017&amp;rft_id=info%3Aoclcnum%2F973918728&amp;rft_id=info%3Alccn%2F2017010136&amp;rft.isbn=978-1-68268-019-3&amp;rft.aulast=Yepsen&amp;rft.aufirst=Roger+B.&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-organic-88"><span class="mw-cite-backlink"><b><a href="#cite_ref-organic_88-0" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite class="citation web cs1"><a rel="nofollow" class="external text" href="https://web.archive.org/web/20170224052612/http://www.agmrc.org/commodities-products/fruits/apples/organic-apples/">"Organic apples"</a>. USDA Agricultural Marketing Service. February 2016. Archived from <a rel="nofollow" class="external text" href="http://www.agmrc.org/commodities-products/fruits/apples/organic-apples/">the original</a> on 24 February 2017<span class="reference-accessdate">. Retrieved <span class="nowrap">23 February</span> 2017</span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=unknown&amp;rft.btitle=Organic+apples&amp;rft.pub=USDA+Agricultural+Marketing+Service&amp;rft.date=2016-02&amp;rft_id=http%3A%2F%2Fwww.agmrc.org%2Fcommodities-products%2Ffruits%2Fapples%2Forganic-apples%2F&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-croplife-89"><span class="mw-cite-backlink">^ <a href="#cite_ref-croplife_89-0"><span class="cite-accessibility-label">Jump up to: </span><sup><i><b>a</b></i></sup></a> <a href="#cite_ref-croplife_89-1"><sup><i><b>b</b></i></sup></a></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite class="citation web cs1"><a rel="nofollow" class="external text" href="https://croplife.org/wp-content/uploads/pdf_files/European-Organic-apple-production-demonstrates-the-value-of-pesticides.pdf">"European Organic Apple Production Demonstrates the Value of Pesticides"</a> <span class="cs1-format">(PDF)</span>. CropLife Foundation, Washington, DC. December 2011. <a rel="nofollow" class="external text" href="https://web.archive.org/web/20170224054210/https://croplife.org/wp-content/uploads/pdf_files/European-Organic-apple-production-demonstrates-the-value-of-pesticides.pdf">Archived</a> <span class="cs1-format">(PDF)</span> from the original on 24 February 2017<span class="reference-accessdate">. Retrieved <span class="nowrap">23 February</span> 2017</span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=unknown&amp;rft.btitle=European+Organic+Apple+Production+Demonstrates+the+Value+of+Pesticides&amp;rft.pub=CropLife+Foundation%2C+Washington%2C+DC&amp;rft.date=2011-12&amp;rft_id=https%3A%2F%2Fcroplife.org%2Fwp-content%2Fuploads%2Fpdf_files%2FEuropean-Organic-apple-production-demonstrates-the-value-of-pesticides.pdf&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-Ribeiro2014-90"><span class="mw-cite-backlink"><b><a href="#cite_ref-Ribeiro2014_90-0" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFRibeiroGomes_de_MouraAguiarde_Oliveira2014" class="citation journal cs1">Ribeiro, Flávia A.P.; Gomes de Moura, Carolina F.; Aguiar, Odair; de Oliveira, Flavia; Spadari, Regina C.; Oliveira, Nara R.C.; Oshima, Celina T.F.; Ribeiro, Daniel A. (September 2014). "The chemopreventive activity of apple against carcinogenesis: antioxidant activity and cell cycle control". <i>European Journal of Cancer Prevention</i> (Review). <b>23</b> (5): 477–480. <a href="/wiki/Doi_(identifier)" class="mw-redirect" title="Doi (identifier)">doi</a>:<a rel="nofollow" class="external text" href="https://doi.org/10.1097%2FCEJ.0000000000000005">10.1097/CEJ.0000000000000005</a>. <a href="/wiki/PMID_(identifier)" class="mw-redirect" title="PMID (identifier)">PMID</a>&nbsp;<a rel="nofollow" class="external text" href="https://pubmed.ncbi.nlm.nih.gov/24366437">24366437</a>. 
<a href="/wiki/S2CID_(identifier)" class="mw-redirect" title="S2CID (identifier)">S2CID</a>&nbsp;<a rel="nofollow" class="external text" href="https://api.semanticscholar.org/CorpusID:23026644">23026644</a>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=article&amp;rft.jtitle=European+Journal+of+Cancer+Prevention&amp;rft.atitle=The+chemopreventive+activity+of+apple+against+carcinogenesis%3A+antioxidant+activity+and+cell+cycle+control&amp;rft.volume=23&amp;rft.issue=5&amp;rft.pages=477-480&amp;rft.date=2014-09&amp;rft_id=https%3A%2F%2Fapi.semanticscholar.org%2FCorpusID%3A23026644%23id-name%3DS2CID&amp;rft_id=info%3Apmid%2F24366437&amp;rft_id=info%3Adoi%2F10.1097%2FCEJ.0000000000000005&amp;rft.aulast=Ribeiro&amp;rft.aufirst=Fl%C3%A1via+A.P.&amp;rft.au=Gomes+de+Moura%2C+Carolina+F.&amp;rft.au=Aguiar%2C+Odair&amp;rft.au=de+Oliveira%2C+Flavia&amp;rft.au=Spadari%2C+Regina+C.&amp;rft.au=Oliveira%2C+Nara+R.C.&amp;rft.au=Oshima%2C+Celina+T.F.&amp;rft.au=Ribeiro%2C+Daniel+A.&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-nic-91"><span class="mw-cite-backlink"><b><a href="#cite_ref-nic_91-0" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFNicolasRichard-ForgetGoupyAmiot1994" class="citation journal cs1">Nicolas, J. J.; Richard-Forget, F. C.; Goupy, P. M.; Amiot, M. J.; Aubert, S. Y. (1 January 1994). "Enzymatic browning reactions in apple and apple products". <i>Critical Reviews in Food Science and Nutrition</i>. <b>34</b> (2): 109–157. <a href="/wiki/Doi_(identifier)" class="mw-redirect" title="Doi (identifier)">doi</a>:<a rel="nofollow" class="external text" href="https://doi.org/10.1080%2F10408399409527653">10.1080/10408399409527653</a>. <a href="/wiki/PMID_(identifier)" class="mw-redirect" title="PMID (identifier)">PMID</a>&nbsp;<a rel="nofollow" class="external text" href="https://pubmed.ncbi.nlm.nih.gov/8011143">8011143</a>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=article&amp;rft.jtitle=Critical+Reviews+in+Food+Science+and+Nutrition&amp;rft.atitle=Enzymatic+browning+reactions+in+apple+and+apple+products&amp;rft.volume=34&amp;rft.issue=2&amp;rft.pages=109-157&amp;rft.date=1994-01-01&amp;rft_id=info%3Adoi%2F10.1080%2F10408399409527653&amp;rft_id=info%3Apmid%2F8011143&amp;rft.aulast=Nicolas&amp;rft.aufirst=J.+J.&amp;rft.au=Richard-Forget%2C+F.+C.&amp;rft.au=Goupy%2C+P.+M.&amp;rft.au=Amiot%2C+M.+J.&amp;rft.au=Aubert%2C+S.+Y.&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-92"><span class="mw-cite-backlink"><b><a href="#cite_ref-92" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite class="citation web cs1"><a rel="nofollow" class="external text" href="https://www.okspecialtyfruits.com/our-science/ppo-silencing/">"PPO silencing"</a>. Okanagan Specialty Fruits. 2019. <a rel="nofollow" class="external text" href="https://web.archive.org/web/20210427083033/https://www.okspecialtyfruits.com/our-science/ppo-silencing/">Archived</a> from the original on 27 April 2021<span class="reference-accessdate">. Retrieved <span class="nowrap">14 November</span> 2019</span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=unknown&amp;rft.btitle=PPO+silencing&amp;rft.pub=Okanagan+Specialty+Fruits&amp;rft.date=2019&amp;rft_id=https%3A%2F%2Fwww.okspecialtyfruits.com%2Four-science%2Fppo-silencing%2F&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-93"><span class="mw-cite-backlink"><b><a href="#cite_ref-93" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite class="citation web cs1"><a rel="nofollow" class="external text" href="https://www.freshfruitportal.com/news/2019/08/13/u-s-gm-non-browning-arctic-apple-expands-into-foodservice/">"United States: GM non-browning Arctic apple expands into foodservice"</a>. Fresh Fruit Portal. 13 August 2019. <a rel="nofollow" class="external text" href="https://web.archive.org/web/20210627220702/https://www.freshfruitportal.com/news/2019/08/13/u-s-gm-non-browning-arctic-apple-expands-into-foodservice/">Archived</a> from the original on 27 June 2021<span class="reference-accessdate">. Retrieved <span class="nowrap">14 November</span> 2019</span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=unknown&amp;rft.btitle=United+States%3A+GM+non-browning+Arctic+apple+expands+into+foodservice&amp;rft.pub=Fresh+Fruit+Portal&amp;rft.date=2019-08-13&amp;rft_id=https%3A%2F%2Fwww.freshfruitportal.com%2Fnews%2F2019%2F08%2F13%2Fu-s-gm-non-browning-arctic-apple-expands-into-foodservice%2F&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-fda2015-94"><span class="mw-cite-backlink"><b><a href="#cite_ref-fda2015_94-0" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite class="citation web cs1"><a rel="nofollow" class="external text" href="https://www.fda.gov/Food/IngredientsPackagingLabeling/GEPlants/Submissions/ucm436163.htm">"Okanagan Specialty Fruits: Biotechnology Consultation Agency Response Letter BNF 000132"</a>. <i>U.S. Food and Drug Administration</i>. 20 March 2015. <a rel="nofollow" class="external text" href="https://wayback.archive-it.org/7993/20171031091829/https://www.fda.gov/Food/IngredientsPackagingLabeling/GEPlants/Submissions/ucm436163.htm">Archived</a> from the original on 31 October 2017<span class="reference-accessdate">. Retrieved <span class="nowrap">14 November</span> 2019</span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=unknown&amp;rft.jtitle=U.S.+Food+and+Drug+Administration&amp;rft.atitle=Okanagan+Specialty+Fruits%3A+Biotechnology+Consultation+Agency+Response+Letter+BNF+000132&amp;rft.date=2015-03-20&amp;rft_id=https%3A%2F%2Fwww.fda.gov%2FFood%2FIngredientsPackagingLabeling%2FGEPlants%2FSubmissions%2Fucm436163.htm&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-cfia-95"><span class="mw-cite-backlink"><b><a href="#cite_ref-cfia_95-0" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite class="citation web cs1"><a rel="nofollow" class="external text" href="http://www.inspection.gc.ca/plants/plants-with-novel-traits/general-public/questions-and-answers-arctic-apple/eng/1426884802194/1426884861294">"Questions and answers: Arctic Apple"</a>. Canadian Food Inspection Agency, Government of Canada. 8 September 2017. <a rel="nofollow" class="external text" href="https://web.archive.org/web/20180919152434/http://www.inspection.gc.ca/plants/plants-with-novel-traits/general-public/questions-and-answers-arctic-apple/eng/1426884802194/1426884861294">Archived</a> from the original on 19 September 2018<span class="reference-accessdate">. Retrieved <span class="nowrap">14 November</span> 2019</span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=unknown&amp;rft.btitle=Questions+and+answers%3A+Arctic+Apple&amp;rft.pub=Canadian+Food+Inspection+Agency%2C+Government+of+Canada&amp;rft.date=2017-09-08&amp;rft_id=http%3A%2F%2Fwww.inspection.gc.ca%2Fplants%2Fplants-with-novel-traits%2Fgeneral-public%2Fquestions-and-answers-arctic-apple%2Feng%2F1426884802194%2F1426884861294&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-96"><span class="mw-cite-backlink"><b><a href="#cite_ref-96" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFYuVan_De_VoortLiYue2007" class="citation journal cs1">Yu, Xiuzhu; Van De Voort, Frederick R.; Li, Zhixi; Yue, Tianli (2007). "Proximate Composition of the Apple Seed and Characterization of Its Oil". <i>International Journal of Food Engineering</i>. <b>3</b> (5). <a href="/wiki/Doi_(identifier)" class="mw-redirect" title="Doi (identifier)">doi</a>:<a rel="nofollow" class="external text" href="https://doi.org/10.2202%2F1556-3758.1283">10.2202/1556-3758.1283</a>. <a href="/wiki/S2CID_(identifier)" class="mw-redirect" title="S2CID (identifier)">S2CID</a>&nbsp;<a rel="nofollow" class="external text" href="https://api.semanticscholar.org/CorpusID:98590230">98590230</a>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=article&amp;rft.jtitle=International+Journal+of+Food+Engineering&amp;rft.atitle=Proximate+Composition+of+the+Apple+Seed+and+Characterization+of+Its+Oil&amp;rft.volume=3&amp;rft.issue=5&amp;rft.date=2007&amp;rft_id=info%3Adoi%2F10.2202%2F1556-3758.1283&amp;rft_id=https%3A%2F%2Fapi.semanticscholar.org%2FCorpusID%3A98590230%23id-name%3DS2CID&amp;rft.aulast=Yu&amp;rft.aufirst=Xiuzhu&amp;rft.au=Van+De+Voort%2C+Frederick+R.&amp;rft.au=Li%2C+Zhixi&amp;rft.au=Yue%2C+Tianli&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-Davidson_1990-97"><span class="mw-cite-backlink">^ <a href="#cite_ref-Davidson_1990_97-0"><span class="cite-accessibility-label">Jump up to: </span><sup><i><b>a</b></i></sup></a> <a href="#cite_ref-Davidson_1990_97-1"><sup><i><b>b</b></i></sup></a> <a href="#cite_ref-Davidson_1990_97-2"><sup><i><b>c</b></i></sup></a></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFDavidson1990" class="citation book cs1"><a href="/wiki/Hilda_Ellis_Davidson" title="Hilda Ellis Davidson">Davidson, Hilda Roderick Ellis</a> (1990) [1st pub. 1964]. <i>Gods and Myths of Northern Europe</i>. London: <a href="/wiki/Penguin_Books" title="Penguin Books">Penguin Books</a>. pp.&nbsp;165–166. <a href="/wiki/ISBN_(identifier)" class="mw-redirect" title="ISBN (identifier)">ISBN</a>&nbsp;<a href="/wiki/Special:BookSources/0-14-013627-4" title="Special:BookSources/0-14-013627-4"><bdi>0-14-013627-4</bdi></a>. <a href="/wiki/OCLC_(identifier)" class="mw-redirect" title="OCLC (identifier)">OCLC</a>&nbsp;<a rel="nofollow" class="external text" href="https://search.worldcat.org/oclc/29336401">29336401</a>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=book&amp;rft.btitle=Gods+and+Myths+of+Northern+Europe&amp;rft.place=London&amp;rft.pages=165-166&amp;rft.pub=Penguin+Books&amp;rft.date=1990&amp;rft_id=info%3Aoclcnum%2F29336401&amp;rft.isbn=0-14-013627-4&amp;rft.aulast=Davidson&amp;rft.aufirst=Hilda+Roderick+Ellis&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-98"><span class="mw-cite-backlink"><b><a href="#cite_ref-98" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFDavidson1998" class="citation book cs1"><a href="/wiki/Hilda_Ellis_Davidson" title="Hilda Ellis Davidson">Davidson, Hilda Ellis</a> (1998). <i>Roles of the Northern Goddess</i>. London; New York: <a href="/wiki/Routledge" title="Routledge">Routledge</a>. pp.&nbsp;146–147. <a href="/wiki/Doi_(identifier)" class="mw-redirect" title="Doi (identifier)">doi</a>:<a rel="nofollow" class="external text" href="https://doi.org/10.4324%2F9780203025550">10.4324/9780203025550</a>. <a href="/wiki/ISBN_(identifier)" class="mw-redirect" title="ISBN (identifier)">ISBN</a>&nbsp;<a href="/wiki/Special:BookSources/0-415-13610-5" title="Special:BookSources/0-415-13610-5"><bdi>0-415-13610-5</bdi></a>. <a href="/wiki/LCCN_(identifier)" class="mw-redirect" title="LCCN (identifier)">LCCN</a>&nbsp;<a rel="nofollow" class="external text" href="https://lccn.loc.gov/97018309">97018309</a>. <a href="/wiki/OCLC_(identifier)" class="mw-redirect" title="OCLC (identifier)">OCLC</a>&nbsp;<a rel="nofollow" class="external text" href="https://search.worldcat.org/oclc/48138055">48138055</a>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=book&amp;rft.btitle=Roles+of+the+Northern+Goddess&amp;rft.place=London%3B+New+York&amp;rft.pages=146-147&amp;rft.pub=Routledge&amp;rft.date=1998&amp;rft_id=info%3Aoclcnum%2F48138055&amp;rft_id=info%3Alccn%2F97018309&amp;rft_id=info%3Adoi%2F10.4324%2F9780203025550&amp;rft.isbn=0-415-13610-5&amp;rft.aulast=Davidson&amp;rft.aufirst=Hilda+Ellis&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-99"><span class="mw-cite-backlink"><b><a href="#cite_ref-99" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFBiedermann1992" class="citation book cs1">Biedermann, Hans (1992). <span class="id-lock-registration" title="Free registration required"><a rel="nofollow" class="external text" href="https://archive.org/details/dictionaryofsymb00bied_0/page/16"><i>Dictionary of Symbolism</i></a></span>. Translated by Hulbert, James. New York: Facts on File. pp.&nbsp;16–17. <a href="/wiki/ISBN_(identifier)" class="mw-redirect" title="ISBN (identifier)">ISBN</a>&nbsp;<a href="/wiki/Special:BookSources/978-0-8160-2593-0" title="Special:BookSources/978-0-8160-2593-0"><bdi>978-0-8160-2593-0</bdi></a>. <a href="/wiki/LCCN_(identifier)" class="mw-redirect" title="LCCN (identifier)">LCCN</a>&nbsp;<a rel="nofollow" class="external text" href="https://lccn.loc.gov/91044933">91044933</a>. <a href="/wiki/OCLC_(identifier)" class="mw-redirect" title="OCLC (identifier)">OCLC</a>&nbsp;<a rel="nofollow" class="external text" href="https://search.worldcat.org/oclc/25092926">25092926</a><span class="reference-accessdate">. Retrieved <span class="nowrap">3 October</span> 2024</span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=book&amp;rft.btitle=Dictionary+of+Symbolism&amp;rft.place=New+York&amp;rft.pages=16-17&amp;rft.pub=Facts+on+File&amp;rft.date=1992&amp;rft_id=info%3Aoclcnum%2F25092926&amp;rft_id=info%3Alccn%2F91044933&amp;rft.isbn=978-0-8160-2593-0&amp;rft.aulast=Biedermann&amp;rft.aufirst=Hans&amp;rft_id=https%3A%2F%2Farchive.org%2Fdetails%2Fdictionaryofsymb00bied_0%2Fpage%2F16&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-Ruck_2001-100"><span class="mw-cite-backlink">^ <a href="#cite_ref-Ruck_2001_100-0"><span class="cite-accessibility-label">Jump up to: </span><sup><i><b>a</b></i></sup></a> <a href="#cite_ref-Ruck_2001_100-1"><sup><i><b>b</b></i></sup></a></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFRuckStaplesHeinrich2001" class="citation book cs1"><a href="/wiki/Carl_A._P._Ruck" title="Carl A. P. Ruck">Ruck, Carl A. P.</a>; <a href="/wiki/Blaise_Daniel_Staples" title="Blaise Daniel Staples">Staples, Blaise D.</a>; <a href="/wiki/Clark_Heinrich" title="Clark Heinrich">Heinrich, Clark</a> (2001). <i>The apples of Apollo&nbsp;: pagan and Christian mysteries of the Eucharist</i>. Durham, North Carolina: <a href="/wiki/Carolina_Academic_Press" title="Carolina Academic Press">Carolina Academic Press</a>. pp.&nbsp;64–70. <a href="/wiki/ISBN_(identifier)" class="mw-redirect" title="ISBN (identifier)">ISBN</a>&nbsp;<a href="/wiki/Special:BookSources/978-0-89089-924-3" title="Special:BookSources/978-0-89089-924-3"><bdi>978-0-89089-924-3</bdi></a>. <a href="/wiki/LCCN_(identifier)" class="mw-redirect" title="LCCN (identifier)">LCCN</a>&nbsp;<a rel="nofollow" class="external text" href="https://lccn.loc.gov/00040351">00040351</a>. 
<a href="/wiki/OCLC_(identifier)" class="mw-redirect" title="OCLC (identifier)">OCLC</a>&nbsp;<a rel="nofollow" class="external text" href="https://search.worldcat.org/oclc/46337324">46337324</a>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=book&amp;rft.btitle=The+apples+of+Apollo+%3A+pagan+and+Christian+mysteries+of+the+Eucharist&amp;rft.place=Durham%2C+North+Carolina&amp;rft.pages=64-70&amp;rft.pub=Carolina+Academic+Press&amp;rft.date=2001&amp;rft_id=info%3Aoclcnum%2F46337324&amp;rft_id=info%3Alccn%2F00040351&amp;rft.isbn=978-0-89089-924-3&amp;rft.aulast=Ruck&amp;rft.aufirst=Carl+A.+P.&amp;rft.au=Staples%2C+Blaise+D.&amp;rft.au=Heinrich%2C+Clark&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-101"><span class="mw-cite-backlink"><b><a href="#cite_ref-101" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite class="citation web cs1"><a rel="nofollow" class="external text" href="https://www.theoi.com/Daimon/Eris.html">"Eris - Greek Goddess of Strife &amp; Discord (Roman Discordia)"</a>. <i><a href="/wiki/Theoi_Project" title="Theoi Project">Theoi Project</a></i>. Aaron J. Atsma. <a rel="nofollow" class="external text" href="https://web.archive.org/web/20240925003522/https://www.theoi.com/Daimon/Eris.html">Archived</a> from the original on 25 September 2024<span class="reference-accessdate">. Retrieved <span class="nowrap">26 September</span> 2024</span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=unknown&amp;rft.jtitle=Theoi+Project&amp;rft.atitle=Eris+-+Greek+Goddess+of+Strife+%26+Discord+%28Roman+Discordia%29&amp;rft_id=https%3A%2F%2Fwww.theoi.com%2FDaimon%2FEris.html&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-102"><span class="mw-cite-backlink"><b><a href="#cite_ref-102" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFLucian1905" class="citation book cs1"><a href="/wiki/Lucian" title="Lucian">Lucian</a> (1905). <a rel="nofollow" class="external text" href="https://archive.org/details/worksoflucianofs01luciuoft/page/78"><i>The Works of Lucian of Samosata</i></a>. Vol.&nbsp;I. Translated by <a href="/wiki/H._W._Fowler" title="H. W. Fowler">Fowler, H.W.</a>; <a href="/wiki/Francis_George_Fowler" title="Francis George Fowler">Fowler, F.G.</a> (First&nbsp;ed.). Oxford: <a href="/wiki/Clarendon_Press" class="mw-redirect" title="Clarendon Press">Clarendon Press</a>. pp.&nbsp;78–85. <a href="/wiki/LCCN_(identifier)" class="mw-redirect" title="LCCN (identifier)">LCCN</a>&nbsp;<a rel="nofollow" class="external text" href="https://lccn.loc.gov/06001045">06001045</a>. <a href="/wiki/OCLC_(identifier)" class="mw-redirect" title="OCLC (identifier)">OCLC</a>&nbsp;<a rel="nofollow" class="external text" href="https://search.worldcat.org/oclc/506365">506365</a><span class="reference-accessdate">. Retrieved <span class="nowrap">26 September</span> 2024</span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=book&amp;rft.btitle=The+Works+of+Lucian+of+Samosata&amp;rft.place=Oxford&amp;rft.pages=78-85&amp;rft.edition=First&amp;rft.pub=Clarendon+Press&amp;rft.date=1905&amp;rft_id=info%3Aoclcnum%2F506365&amp;rft_id=info%3Alccn%2F06001045&amp;rft.au=Lucian&amp;rft_id=https%3A%2F%2Farchive.org%2Fdetails%2Fworksoflucianofs01luciuoft%2Fpage%2F78&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-103"><span class="mw-cite-backlink"><b><a href="#cite_ref-103" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite class="citation web cs1"><a rel="nofollow" class="external text" href="https://www.theoi.com/Olympios/JudgementParis.html">"Judgement of Paris - Greek Mythology"</a>. <i><a href="/wiki/Theoi_Project" title="Theoi Project">Theoi Project</a></i>. Aaron J. Atsma. <a rel="nofollow" class="external text" href="https://web.archive.org/web/20240824120807/https://www.theoi.com/Olympios/JudgementParis.html">Archived</a> from the original on 24 August 2024<span class="reference-accessdate">. Retrieved <span class="nowrap">26 September</span> 2024</span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=unknown&amp;rft.jtitle=Theoi+Project&amp;rft.atitle=Judgement+of+Paris+-+Greek+Mythology&amp;rft_id=https%3A%2F%2Fwww.theoi.com%2FOlympios%2FJudgementParis.html&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-104"><span class="mw-cite-backlink"><b><a href="#cite_ref-104" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFPlato1997" class="citation book cs1"><a href="/wiki/Plato" title="Plato">Plato</a> (1997). <span class="id-lock-registration" title="Free registration required"><a rel="nofollow" class="external text" href="https://archive.org/details/completeworks00plat/page/1744">"Epigrams"</a></span>. In Cooper, John M.; Hutchinson, D.S. (eds.). <i>Complete Works</i>. Translated by Edmonds, J.M.; Cooper, John M. Indianapolis, Indiana: <a href="/wiki/Hackett_Publishing_Company" title="Hackett Publishing Company">Hackett Publishing</a>. p.&nbsp;1744. <a href="/wiki/ISBN_(identifier)" class="mw-redirect" title="ISBN (identifier)">ISBN</a>&nbsp;<a href="/wiki/Special:BookSources/0-87220-349-2" title="Special:BookSources/0-87220-349-2"><bdi>0-87220-349-2</bdi></a>. <a href="/wiki/LCCN_(identifier)" class="mw-redirect" title="LCCN (identifier)">LCCN</a>&nbsp;<a rel="nofollow" class="external text" href="https://lccn.loc.gov/96053280">96053280</a>. <a href="/wiki/OCLC_(identifier)" class="mw-redirect" title="OCLC (identifier)">OCLC</a>&nbsp;<a rel="nofollow" class="external text" href="https://search.worldcat.org/oclc/36178550">36178550</a><span class="reference-accessdate">. 
Retrieved <span class="nowrap">27 September</span> 2024</span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=bookitem&amp;rft.atitle=Epigrams&amp;rft.btitle=Complete+Works&amp;rft.place=Indianapolis%2C+Indiana&amp;rft.pages=1744&amp;rft.pub=Hackett+Publishing&amp;rft.date=1997&amp;rft_id=info%3Aoclcnum%2F36178550&amp;rft_id=info%3Alccn%2F96053280&amp;rft.isbn=0-87220-349-2&amp;rft.au=Plato&amp;rft_id=https%3A%2F%2Farchive.org%2Fdetails%2Fcompleteworks00plat%2Fpage%2F1744&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-105"><span class="mw-cite-backlink"><b><a href="#cite_ref-105" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFPinsent1969" class="citation book cs1"><a href="/wiki/John_Pinsent" title="John Pinsent">Pinsent, John</a> (1969). <span class="id-lock-registration" title="Free registration required"><a rel="nofollow" class="external text" href="https://archive.org/details/greekmythology00pins/page/79"><i>Greek Mythology</i></a></span> (First&nbsp;ed.). London: Paul Hamlyn. p.&nbsp;79. <a href="/wiki/ISBN_(identifier)" class="mw-redirect" title="ISBN (identifier)">ISBN</a>&nbsp;<a href="/wiki/Special:BookSources/978-0-600-02422-4" title="Special:BookSources/978-0-600-02422-4"><bdi>978-0-600-02422-4</bdi></a>. <a href="/wiki/LCCN_(identifier)" class="mw-redirect" title="LCCN (identifier)">LCCN</a>&nbsp;<a rel="nofollow" class="external text" href="https://lccn.loc.gov/78449216">78449216</a>. <a href="/wiki/OCLC_(identifier)" class="mw-redirect" title="OCLC (identifier)">OCLC</a>&nbsp;<a rel="nofollow" class="external text" href="https://search.worldcat.org/oclc/61702">61702</a><span class="reference-accessdate">. Retrieved <span class="nowrap">3 October</span> 2024</span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=book&amp;rft.btitle=Greek+Mythology&amp;rft.place=London&amp;rft.pages=79&amp;rft.edition=First&amp;rft.pub=Paul+Hamlyn&amp;rft.date=1969&amp;rft_id=info%3Aoclcnum%2F61702&amp;rft_id=info%3Alccn%2F78449216&amp;rft.isbn=978-0-600-02422-4&amp;rft.aulast=Pinsent&amp;rft.aufirst=John&amp;rft_id=https%3A%2F%2Farchive.org%2Fdetails%2Fgreekmythology00pins%2Fpage%2F79&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-106"><span class="mw-cite-backlink"><b><a href="#cite_ref-106" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite class="citation web cs1"><a rel="nofollow" class="external text" href="https://www.theoi.com/Heroine/Atalanta.html">"Atalanta (Atalante) - Arcadian Heroine of Greek Mythology"</a>. <i><a href="/wiki/Theoi_Project" title="Theoi Project">Theoi Project</a></i>. Aaron J. Atsma. <a rel="nofollow" class="external text" href="https://web.archive.org/web/20240927101406/https://www.theoi.com/Heroine/Atalanta.html">Archived</a> from the original on 27 September 2024<span class="reference-accessdate">. Retrieved <span class="nowrap">3 October</span> 2024</span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=unknown&amp;rft.jtitle=Theoi+Project&amp;rft.atitle=Atalanta+%28Atalante%29+-+Arcadian+Heroine+of+Greek+Mythology&amp;rft_id=https%3A%2F%2Fwww.theoi.com%2FHeroine%2FAtalanta.html&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-107"><span class="mw-cite-backlink"><b><a href="#cite_ref-107" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFFlieger2005" class="citation book cs1"><a href="/wiki/Verlyn_Flieger" title="Verlyn Flieger">Flieger, Verlyn</a> (2005). <i>Interrupted Music&nbsp;: The Making of Tolkien's Mythology</i>. Kent, Ohio: <a href="/wiki/Kent_State_University_Press" class="mw-redirect" title="Kent State University Press">Kent State University Press</a>. pp.&nbsp;122–123. <a href="/wiki/ISBN_(identifier)" class="mw-redirect" title="ISBN (identifier)">ISBN</a>&nbsp;<a href="/wiki/Special:BookSources/978-0-87338-824-5" title="Special:BookSources/978-0-87338-824-5"><bdi>978-0-87338-824-5</bdi></a>. <a href="/wiki/LCCN_(identifier)" class="mw-redirect" title="LCCN (identifier)">LCCN</a>&nbsp;<a rel="nofollow" class="external text" href="https://lccn.loc.gov/2004024490">2004024490</a>. <a href="/wiki/OCLC_(identifier)" class="mw-redirect" title="OCLC (identifier)">OCLC</a>&nbsp;<a rel="nofollow" class="external text" href="https://search.worldcat.org/oclc/56805947">56805947</a>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=book&amp;rft.btitle=Interrupted+Music+%3A+The+Making+of+Tolkien%27s+Mythology&amp;rft.place=Kent%2C+Ohio&amp;rft.pages=122-123&amp;rft.pub=Kent+State+University+Press&amp;rft.date=2005&amp;rft_id=info%3Aoclcnum%2F56805947&amp;rft_id=info%3Alccn%2F2004024490&amp;rft.isbn=978-0-87338-824-5&amp;rft.aulast=Flieger&amp;rft.aufirst=Verlyn&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-English_in_China-108"><span class="mw-cite-backlink">^ <a href="#cite_ref-English_in_China_108-0"><span class="cite-accessibility-label">Jump up to: </span><sup><i><b>a</b></i></sup></a> <a href="#cite_ref-English_in_China_108-1"><sup><i><b>b</b></i></sup></a></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite class="citation web cs1"><a rel="nofollow" class="external text" href="https://teach-english-in-china.co.uk/why-do-the-chinese-give-apples-around-christmas/">"Why Do the Chinese Give Apples Around Christmas?"</a>. <i>Teach English In China</i>. 22 December 2019. <a rel="nofollow" class="external text" href="https://web.archive.org/web/20201001003304/https://teach-english-in-china.co.uk/why-do-the-chinese-give-apples-around-christmas/">Archived</a> from the original on 1 October 2020<span class="reference-accessdate">. Retrieved <span class="nowrap">3 September</span> 2024</span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=unknown&amp;rft.jtitle=Teach+English+In+China&amp;rft.atitle=Why+Do+the+Chinese+Give+Apples+Around+Christmas%3F&amp;rft.date=2019-12-22&amp;rft_id=https%3A%2F%2Fteach-english-in-china.co.uk%2Fwhy-do-the-chinese-give-apples-around-christmas%2F&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-Macrone-109"><span class="mw-cite-backlink">^ <a href="#cite_ref-Macrone_109-0"><span class="cite-accessibility-label">Jump up to: </span><sup><i><b>a</b></i></sup></a> <a href="#cite_ref-Macrone_109-1"><sup><i><b>b</b></i></sup></a></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFMacrone1998" class="citation book cs1">Macrone, Michael (1998). <a rel="nofollow" class="external text" href="https://archive.org/details/brushupyourbible00macr"><i>Brush up your Bible!</i></a>. New York: <a href="/wiki/Gramercy_Books" class="mw-redirect" title="Gramercy Books">Gramercy Books</a>. pp.&nbsp;15–16, 340–341. <a href="/wiki/ISBN_(identifier)" class="mw-redirect" title="ISBN (identifier)">ISBN</a>&nbsp;<a href="/wiki/Special:BookSources/978-0-517-20189-3" title="Special:BookSources/978-0-517-20189-3"><bdi>978-0-517-20189-3</bdi></a>. <a href="/wiki/OCLC_(identifier)" class="mw-redirect" title="OCLC (identifier)">OCLC</a>&nbsp;<a rel="nofollow" class="external text" href="https://search.worldcat.org/oclc/38270894">38270894</a><span class="reference-accessdate">. Retrieved <span class="nowrap">31 July</span> 2024</span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=book&amp;rft.btitle=Brush+up+your+Bible%21&amp;rft.place=New+York&amp;rft.pages=15-16%2C+340-341&amp;rft.pub=Gramercy+Books&amp;rft.date=1998&amp;rft_id=info%3Aoclcnum%2F38270894&amp;rft.isbn=978-0-517-20189-3&amp;rft.aulast=Macrone&amp;rft.aufirst=Michael&amp;rft_id=https%3A%2F%2Farchive.org%2Fdetails%2Fbrushupyourbible00macr&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-110"><span class="mw-cite-backlink"><b><a href="#cite_ref-110" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFKissling2004" class="citation book cs1">Kissling, Paul J. (2004). <a rel="nofollow" class="external text" href="https://books.google.com/books?id=lotBnvqdmeQC&amp;q=Genesis+apple&amp;pg=PA193"><i>Genesis</i></a>. Vol.&nbsp;1. Joplin, Missouri: College Press. p.&nbsp;193. <a href="/wiki/ISBN_(identifier)" class="mw-redirect" title="ISBN (identifier)">ISBN</a>&nbsp;<a href="/wiki/Special:BookSources/978-0-89900-875-2" title="Special:BookSources/978-0-89900-875-2"><bdi>978-0-89900-875-2</bdi></a>. <a href="/wiki/LCCN_(identifier)" class="mw-redirect" title="LCCN (identifier)">LCCN</a>&nbsp;<a rel="nofollow" class="external text" href="https://lccn.loc.gov/2004022577">2004022577</a>. <a href="/wiki/OCLC_(identifier)" class="mw-redirect" title="OCLC (identifier)">OCLC</a>&nbsp;<a rel="nofollow" class="external text" href="https://search.worldcat.org/oclc/56672257">56672257</a>. <a rel="nofollow" class="external text" href="https://web.archive.org/web/20210126053142/https://books.google.com/books?id=lotBnvqdmeQC&amp;q=Genesis+apple&amp;pg=PA193">Archived</a> from the original on 26 January 2021<span class="reference-accessdate">. 
Retrieved <span class="nowrap">6 October</span> 2020</span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=book&amp;rft.btitle=Genesis&amp;rft.place=Joplin%2C+Missouri&amp;rft.pages=193&amp;rft.pub=College+Press&amp;rft.date=2004&amp;rft_id=info%3Aoclcnum%2F56672257&amp;rft_id=info%3Alccn%2F2004022577&amp;rft.isbn=978-0-89900-875-2&amp;rft.aulast=Kissling&amp;rft.aufirst=Paul+J.&amp;rft_id=https%3A%2F%2Fbooks.google.com%2Fbooks%3Fid%3DlotBnvqdmeQC%26q%3DGenesis%2Bapple%26pg%3DPA193&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-111"><span class="mw-cite-backlink"><b><a href="#cite_ref-111" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><a rel="nofollow" class="external text" href="https://www.esv.org/Genesis+2:17">Genesis 2:17</a></span>
+</li>
+<li id="cite_note-112"><span class="mw-cite-backlink"><b><a href="#cite_ref-112" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFHendel2013" class="citation book cs1">Hendel, Ronald S. (2013). <a rel="nofollow" class="external text" href="https://books.google.com/books?id=xBPpIHwcZMUC&amp;q=Genesis+apple+malum&amp;pg=PA114"><i>The Book of Genesis: A Biography</i></a>. Princeton, New Jersey: <a href="/wiki/Princeton_University_Press" title="Princeton University Press">Princeton University Press</a>. p.&nbsp;114. <a href="/wiki/ISBN_(identifier)" class="mw-redirect" title="ISBN (identifier)">ISBN</a>&nbsp;<a href="/wiki/Special:BookSources/978-0-69114012-4" title="Special:BookSources/978-0-69114012-4"><bdi>978-0-69114012-4</bdi></a>. <a href="/wiki/LCCN_(identifier)" class="mw-redirect" title="LCCN (identifier)">LCCN</a>&nbsp;<a rel="nofollow" class="external text" href="https://lccn.loc.gov/2012015634">2012015634</a>. <a href="/wiki/OCLC_(identifier)" class="mw-redirect" title="OCLC (identifier)">OCLC</a>&nbsp;<a rel="nofollow" class="external text" href="https://search.worldcat.org/oclc/788265521">788265521</a>. <a rel="nofollow" class="external text" href="https://web.archive.org/web/20230305222115/https://books.google.com/books?id=xBPpIHwcZMUC&amp;q=Genesis+apple+malum&amp;pg=PA114#v=snippet&amp;q=Genesis%20apple%20malum&amp;f=false">Archived</a> from the original on 5 March 2023<span class="reference-accessdate">. 
Retrieved <span class="nowrap">4 October</span> 2024</span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=book&amp;rft.btitle=The+Book+of+Genesis%3A+A+Biography&amp;rft.place=Princeton%2C+New+Jersey&amp;rft.pages=114&amp;rft.pub=Princeton+University+Press&amp;rft.date=2013&amp;rft_id=info%3Aoclcnum%2F788265521&amp;rft_id=info%3Alccn%2F2012015634&amp;rft.isbn=978-0-69114012-4&amp;rft.aulast=Hendel&amp;rft.aufirst=Ronald+S.&amp;rft_id=https%3A%2F%2Fbooks.google.com%2Fbooks%3Fid%3DxBPpIHwcZMUC%26q%3DGenesis%2Bapple%2Bmalum%26pg%3DPA114&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span> </span>
+</li>
+<li id="cite_note-113"><span class="mw-cite-backlink"><b><a href="#cite_ref-113" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFMiederKingsburyHarder1996" class="citation book cs1"><a href="/wiki/Wolfgang_Mieder" title="Wolfgang Mieder">Mieder, Wolfgang</a>; Kingsbury, Stewart A.; <a href="/wiki/Kelsie_B._Harder" title="Kelsie B. Harder">Harder, Kelsie B.</a>, eds. (1996) [1992]. <span class="id-lock-registration" title="Free registration required"><a rel="nofollow" class="external text" href="https://archive.org/details/dictionaryofamer00wolf_0/page/23"><i>A Dictionary of American Proverbs</i></a></span> (Paperback&nbsp;ed.). New York: Oxford University Press. p.&nbsp;23. <a href="/wiki/ISBN_(identifier)" class="mw-redirect" title="ISBN (identifier)">ISBN</a>&nbsp;<a href="/wiki/Special:BookSources/978-0-19-511133-0" title="Special:BookSources/978-0-19-511133-0"><bdi>978-0-19-511133-0</bdi></a>. <a href="/wiki/LCCN_(identifier)" class="mw-redirect" title="LCCN (identifier)">LCCN</a>&nbsp;<a rel="nofollow" class="external text" href="https://lccn.loc.gov/91015508">91015508</a>. <a href="/wiki/OCLC_(identifier)" class="mw-redirect" title="OCLC (identifier)">OCLC</a>&nbsp;<a rel="nofollow" class="external text" href="https://search.worldcat.org/oclc/23693799">23693799</a><span class="reference-accessdate">. 
Retrieved <span class="nowrap">23 August</span> 2024</span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=book&amp;rft.btitle=A+Dictionary+of+American+Proverbs&amp;rft.place=New+York&amp;rft.pages=23&amp;rft.edition=Paperback&amp;rft.pub=Oxford+University+Press&amp;rft.date=1996&amp;rft_id=info%3Aoclcnum%2F23693799&amp;rft_id=info%3Alccn%2F91015508&amp;rft.isbn=978-0-19-511133-0&amp;rft_id=https%3A%2F%2Farchive.org%2Fdetails%2Fdictionaryofamer00wolf_0%2Fpage%2F23&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+<li id="cite_note-114"><span class="mw-cite-backlink"><b><a href="#cite_ref-114" aria-label="Jump up" title="Jump up">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFPollan2001" class="citation book cs1"><a href="/wiki/Michael_Pollan" title="Michael Pollan">Pollan, Michael</a> (2001). <span class="id-lock-limited" title="Free access subject to limited trial, subscription normally required"><a rel="nofollow" class="external text" href="https://archive.org/details/botanyofdesirepl0000poll_v5w7"><i>The Botany of Desire: A Plant's-Eye View of the World</i></a></span> (First&nbsp;ed.). New York: <a href="/wiki/Random_House" title="Random House">Random House</a>. pp.&nbsp;9, 22, 50. <a href="/wiki/ISBN_(identifier)" class="mw-redirect" title="ISBN (identifier)">ISBN</a>&nbsp;<a href="/wiki/Special:BookSources/978-0-375-50129-6" title="Special:BookSources/978-0-375-50129-6"><bdi>978-0-375-50129-6</bdi></a>. <a href="/wiki/LCCN_(identifier)" class="mw-redirect" title="LCCN (identifier)">LCCN</a>&nbsp;<a rel="nofollow" class="external text" href="https://lccn.loc.gov/00066479">00066479</a>. <a href="/wiki/OCLC_(identifier)" class="mw-redirect" title="OCLC (identifier)">OCLC</a>&nbsp;<a rel="nofollow" class="external text" href="https://search.worldcat.org/oclc/49803415">49803415</a>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=book&amp;rft.btitle=The+Botany+of+Desire%3A+A+Plant%27s-Eye+View+of+the+World&amp;rft.place=New+York&amp;rft.pages=9%2C+22%2C+50&amp;rft.edition=First&amp;rft.pub=Random+House&amp;rft.date=2001&amp;rft_id=info%3Aoclcnum%2F49803415&amp;rft_id=info%3Alccn%2F00066479&amp;rft.isbn=978-0-375-50129-6&amp;rft.aulast=Pollan&amp;rft.aufirst=Michael&amp;rft_id=https%3A%2F%2Farchive.org%2Fdetails%2Fbotanyofdesirepl0000poll_v5w7&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></span>
+</li>
+</ol></div></div>
+<div class="mw-heading mw-heading2"><h2 id="Further_reading">Further reading</h2></div>
+<ul><li><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite class="citation book cs1"><a href="/wiki/Frank_Browning_(author)" title="Frank Browning (author)">Browning, Frank</a> (1998). <span class="id-lock-registration" title="Free registration required"><a rel="nofollow" class="external text" href="https://archive.org/details/apples00brow"><i>Apples</i></a></span> (First&nbsp;ed.). New York: <a href="/wiki/North_Point_Press" class="mw-redirect" title="North Point Press">North Point Press</a>. <a href="/wiki/ISBN_(identifier)" class="mw-redirect" title="ISBN (identifier)">ISBN</a>&nbsp;<a href="/wiki/Special:BookSources/978-0-86547-537-3" title="Special:BookSources/978-0-86547-537-3"><bdi>978-0-86547-537-3</bdi></a>. <a href="/wiki/LCCN_(identifier)" class="mw-redirect" title="LCCN (identifier)">LCCN</a>&nbsp;<a rel="nofollow" class="external text" href="https://lccn.loc.gov/98027252">98027252</a>. <a href="/wiki/OCLC_(identifier)" class="mw-redirect" title="OCLC (identifier)">OCLC</a>&nbsp;<a rel="nofollow" class="external text" href="https://search.worldcat.org/oclc/39235786">39235786</a>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=book&amp;rft.btitle=Apples&amp;rft.place=New+York&amp;rft.edition=First&amp;rft.pub=North+Point+Press&amp;rft.date=1998&amp;rft_id=info%3Aoclcnum%2F39235786&amp;rft_id=info%3Alccn%2F98027252&amp;rft.isbn=978-0-86547-537-3&amp;rft.aulast=Browning&amp;rft.aufirst=Frank&amp;rft_id=https%3A%2F%2Farchive.org%2Fdetails%2Fapples00brow&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></li>
+<li><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite class="citation book cs1">Hanson, Beth; Marinelli, Janet; Saphire, Sigrun Wolff; Tebbitt, Mark, eds. (2003). <span class="id-lock-registration" title="Free registration required"><a rel="nofollow" class="external text" href="https://archive.org/details/bestapplestobuyg0000unse"><i>The Best Apples to Buy and Grow</i></a></span> (First&nbsp;ed.). Brooklyn, New York: <a href="/wiki/Brooklyn_Botanic_Garden" title="Brooklyn Botanic Garden">Brooklyn Botanic Garden</a>. <a href="/wiki/ISBN_(identifier)" class="mw-redirect" title="ISBN (identifier)">ISBN</a>&nbsp;<a href="/wiki/Special:BookSources/978-1-889538-66-2" title="Special:BookSources/978-1-889538-66-2"><bdi>978-1-889538-66-2</bdi></a>. <a href="/wiki/OCLC_(identifier)" class="mw-redirect" title="OCLC (identifier)">OCLC</a>&nbsp;<a rel="nofollow" class="external text" href="https://search.worldcat.org/oclc/60384060">60384060</a>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=book&amp;rft.btitle=The+Best+Apples+to+Buy+and+Grow&amp;rft.place=Brooklyn%2C+New+York&amp;rft.edition=First&amp;rft.pub=Brooklyn+Botanic+Garden&amp;rft.date=2003&amp;rft_id=info%3Aoclcnum%2F60384060&amp;rft.isbn=978-1-889538-66-2&amp;rft_id=https%3A%2F%2Farchive.org%2Fdetails%2Fbestapplestobuyg0000unse&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></li>
+<li><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite class="citation book cs1"><a href="/wiki/Barrie_Juniper" title="Barrie Juniper">Juniper, Barrie E.</a>; <a href="/wiki/David_Mabberley" title="David Mabberley">Mabberley, David J.</a> (2006). <span class="id-lock-registration" title="Free registration required"><a rel="nofollow" class="external text" href="https://archive.org/details/storyofapple0000juni"><i>The Story of the Apple</i></a></span> (First&nbsp;ed.). Portland, Oregon: <a href="/wiki/Timber_Press" class="mw-redirect" title="Timber Press">Timber Press</a>. <a href="/wiki/ISBN_(identifier)" class="mw-redirect" title="ISBN (identifier)">ISBN</a>&nbsp;<a href="/wiki/Special:BookSources/978-0-88192-784-9" title="Special:BookSources/978-0-88192-784-9"><bdi>978-0-88192-784-9</bdi></a>. <a href="/wiki/LCCN_(identifier)" class="mw-redirect" title="LCCN (identifier)">LCCN</a>&nbsp;<a rel="nofollow" class="external text" href="https://lccn.loc.gov/2006011869">2006011869</a>. <a href="/wiki/OCLC_(identifier)" class="mw-redirect" title="OCLC (identifier)">OCLC</a>&nbsp;<a rel="nofollow" class="external text" href="https://search.worldcat.org/oclc/67383484">67383484</a>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=book&amp;rft.btitle=The+Story+of+the+Apple&amp;rft.place=Portland%2C+Oregon&amp;rft.edition=First&amp;rft.pub=Timber+Press&amp;rft.date=2006&amp;rft_id=info%3Aoclcnum%2F67383484&amp;rft_id=info%3Alccn%2F2006011869&amp;rft.isbn=978-0-88192-784-9&amp;rft.aulast=Juniper&amp;rft.aufirst=Barrie+E.&amp;rft.au=Mabberley%2C+David+J.&amp;rft_id=https%3A%2F%2Farchive.org%2Fdetails%2Fstoryofapple0000juni&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></li>
+<li><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite class="citation book cs1">Phillips, Michael (1998). <span class="id-lock-registration" title="Free registration required"><a rel="nofollow" class="external text" href="https://archive.org/details/applegrowerguide0000phil"><i>The Apple Grower&nbsp;: A Guide for the Organic Orchardist</i></a></span> (First&nbsp;ed.). White River Junction, Vermont: <a href="/wiki/Chelsea_Green_Publishing" title="Chelsea Green Publishing">Chelsea Green Publishing</a>. <a href="/wiki/ISBN_(identifier)" class="mw-redirect" title="ISBN (identifier)">ISBN</a>&nbsp;<a href="/wiki/Special:BookSources/978-1-890132-04-0" title="Special:BookSources/978-1-890132-04-0"><bdi>978-1-890132-04-0</bdi></a>. <a href="/wiki/LCCN_(identifier)" class="mw-redirect" title="LCCN (identifier)">LCCN</a>&nbsp;<a rel="nofollow" class="external text" href="https://lccn.loc.gov/98003631">98003631</a>. <a href="/wiki/OCLC_(identifier)" class="mw-redirect" title="OCLC (identifier)">OCLC</a>&nbsp;<a rel="nofollow" class="external text" href="https://search.worldcat.org/oclc/38731995">38731995</a>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=book&amp;rft.btitle=The+Apple+Grower+%3A+A+Guide+for+the+Organic+Orchardist&amp;rft.place=White+River+Junction%2C+Vermont&amp;rft.edition=First&amp;rft.pub=Chelsea+Green+Publishing&amp;rft.date=1998&amp;rft_id=info%3Aoclcnum%2F38731995&amp;rft_id=info%3Alccn%2F98003631&amp;rft.isbn=978-1-890132-04-0&amp;rft.aulast=Phillips&amp;rft.aufirst=Michael&amp;rft_id=https%3A%2F%2Farchive.org%2Fdetails%2Fapplegrowerguide0000phil&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></li>
+<li><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite class="citation book cs1">Sanders, Rosie (2010). <i>The Apple Book</i> (Second&nbsp;ed.). London: <a href="/wiki/Frances_Lincoln_Limited" class="mw-redirect" title="Frances Lincoln Limited">Frances Lincoln Limited</a>. <a href="/wiki/ISBN_(identifier)" class="mw-redirect" title="ISBN (identifier)">ISBN</a>&nbsp;<a href="/wiki/Special:BookSources/9780711231412" title="Special:BookSources/9780711231412"><bdi>9780711231412</bdi></a>. <a href="/wiki/OCLC_(identifier)" class="mw-redirect" title="OCLC (identifier)">OCLC</a>&nbsp;<a rel="nofollow" class="external text" href="https://search.worldcat.org/oclc/646397065">646397065</a>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=book&amp;rft.btitle=The+Apple+Book&amp;rft.place=London&amp;rft.edition=Second&amp;rft.pub=Frances+Lincoln+Limited&amp;rft.date=2010&amp;rft_id=info%3Aoclcnum%2F646397065&amp;rft.isbn=9780711231412&amp;rft.aulast=Sanders&amp;rft.aufirst=Rosie&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AApple" class="Z3988"></span></li></ul>
+<div class="mw-heading mw-heading2"><h2 id="External_links">External links</h2></div>
+<ul><li><span class="noviewer" typeof="mw:File"><a href="/wiki/File:Commons-logo.svg" class="mw-file-description"><img alt="" src="//upload.wikimedia.org/wikipedia/en/thumb/4/4a/Commons-logo.svg/12px-Commons-logo.svg.png" decoding="async" width="12" height="16" class="mw-file-element" srcset="//upload.wikimedia.org/wikipedia/en/thumb/4/4a/Commons-logo.svg/18px-Commons-logo.svg.png 1.5x, //upload.wikimedia.org/wikipedia/en/thumb/4/4a/Commons-logo.svg/24px-Commons-logo.svg.png 2x" data-file-width="1024" data-file-height="1376"></a></span> Media related to <a href="https://commons.wikimedia.org/wiki/Category:Apples" class="extiw" title="commons:Category:Apples">Apples</a> at Wikimedia Commons</li></ul>
+<div class="navbox-styles"><style data-mw-deduplicate="TemplateStyles:r1129693374">.mw-parser-output .hlist dl,.mw-parser-output .hlist ol,.mw-parser-output .hlist ul{margin:0;padding:0}.mw-parser-output .hlist dd,.mw-parser-output .hlist dt,.mw-parser-output .hlist li{margin:0;display:inline}.mw-parser-output .hlist.inline,.mw-parser-output .hlist.inline dl,.mw-parser-output .hlist.inline ol,.mw-parser-output .hlist.inline ul,.mw-parser-output .hlist dl dl,.mw-parser-output .hlist dl ol,.mw-parser-output .hlist dl ul,.mw-parser-output .hlist ol dl,.mw-parser-output .hlist ol ol,.mw-parser-output .hlist ol ul,.mw-parser-output .hlist ul dl,.mw-parser-output .hlist ul ol,.mw-parser-output .hlist ul ul{display:inline}.mw-parser-output .hlist .mw-empty-li{display:none}.mw-parser-output .hlist dt::after{content:": "}.mw-parser-output .hlist dd::after,.mw-parser-output .hlist li::after{content:" · ";font-weight:bold}.mw-parser-output .hlist dd:last-child::after,.mw-parser-output .hlist dt:last-child::after,.mw-parser-output .hlist li:last-child::after{content:none}.mw-parser-output .hlist dd dd:first-child::before,.mw-parser-output .hlist dd dt:first-child::before,.mw-parser-output .hlist dd li:first-child::before,.mw-parser-output .hlist dt dd:first-child::before,.mw-parser-output .hlist dt dt:first-child::before,.mw-parser-output .hlist dt li:first-child::before,.mw-parser-output .hlist li dd:first-child::before,.mw-parser-output .hlist li dt:first-child::before,.mw-parser-output .hlist li li:first-child::before{content:" (";font-weight:normal}.mw-parser-output .hlist dd dd:last-child::after,.mw-parser-output .hlist dd dt:last-child::after,.mw-parser-output .hlist dd li:last-child::after,.mw-parser-output .hlist dt dd:last-child::after,.mw-parser-output .hlist dt dt:last-child::after,.mw-parser-output .hlist dt li:last-child::after,.mw-parser-output .hlist li dd:last-child::after,.mw-parser-output .hlist li dt:last-child::after,.mw-parser-output .hlist li 
li:last-child::after{content:")";font-weight:normal}.mw-parser-output .hlist ol{counter-reset:listitem}.mw-parser-output .hlist ol>li{counter-increment:listitem}.mw-parser-output .hlist ol>li::before{content:" "counter(listitem)"\a0 "}.mw-parser-output .hlist dd ol>li:first-child::before,.mw-parser-output .hlist dt ol>li:first-child::before,.mw-parser-output .hlist li ol>li:first-child::before{content:" ("counter(listitem)"\a0 "}</style><style data-mw-deduplicate="TemplateStyles:r1236075235">.mw-parser-output .navbox{box-sizing:border-box;border:1px solid #a2a9b1;width:100%;clear:both;font-size:88%;text-align:center;padding:1px;margin:1em auto 0}.mw-parser-output .navbox .navbox{margin-top:0}.mw-parser-output .navbox+.navbox,.mw-parser-output .navbox+.navbox-styles+.navbox{margin-top:-1px}.mw-parser-output .navbox-inner,.mw-parser-output .navbox-subgroup{width:100%}.mw-parser-output .navbox-group,.mw-parser-output .navbox-title,.mw-parser-output .navbox-abovebelow{padding:0.25em 1em;line-height:1.5em;text-align:center}.mw-parser-output .navbox-group{white-space:nowrap;text-align:right}.mw-parser-output .navbox,.mw-parser-output .navbox-subgroup{background-color:#fdfdfd}.mw-parser-output .navbox-list{line-height:1.5em;border-color:#fdfdfd}.mw-parser-output .navbox-list-with-group{text-align:left;border-left-width:2px;border-left-style:solid}.mw-parser-output tr+tr>.navbox-abovebelow,.mw-parser-output tr+tr>.navbox-group,.mw-parser-output tr+tr>.navbox-image,.mw-parser-output tr+tr>.navbox-list{border-top:2px solid #fdfdfd}.mw-parser-output .navbox-title{background-color:#ccf}.mw-parser-output .navbox-abovebelow,.mw-parser-output .navbox-group,.mw-parser-output .navbox-subgroup .navbox-title{background-color:#ddf}.mw-parser-output .navbox-subgroup .navbox-group,.mw-parser-output .navbox-subgroup .navbox-abovebelow{background-color:#e6e6ff}.mw-parser-output .navbox-even{background-color:#f7f7f7}.mw-parser-output 
.navbox-odd{background-color:transparent}.mw-parser-output .navbox .hlist td dl,.mw-parser-output .navbox .hlist td ol,.mw-parser-output .navbox .hlist td ul,.mw-parser-output .navbox td.hlist dl,.mw-parser-output .navbox td.hlist ol,.mw-parser-output .navbox td.hlist ul{padding:0.125em 0}.mw-parser-output .navbox .navbar{display:block;font-size:100%}.mw-parser-output .navbox-title .navbar{float:left;text-align:left;margin-right:0.5em}body.skin--responsive .mw-parser-output .navbox-image img{max-width:none!important}@media print{body.ns-0 .mw-parser-output .navbox{display:none!important}}</style></div><div role="navigation" class="navbox" aria-labelledby="Apples" style="padding:3px"><table class="nowraplinks hlist mw-collapsible autocollapse navbox-inner mw-made-collapsible mw-collapsed" style="border-spacing:0;background:transparent;color:inherit"><tbody><tr><th scope="col" class="navbox-title" colspan="2" style="background:name;"><button type="button" class="mw-collapsible-toggle mw-collapsible-toggle-default mw-collapsible-toggle-collapsed" aria-expanded="false" tabindex="0"><span class="mw-collapsible-text">show</span></button><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1129693374"><style data-mw-deduplicate="TemplateStyles:r1239400231">.mw-parser-output .navbar{display:inline;font-size:88%;font-weight:normal}.mw-parser-output .navbar-collapse{float:left;text-align:left}.mw-parser-output .navbar-boxtext{word-spacing:0}.mw-parser-output .navbar ul{display:inline-block;white-space:nowrap;line-height:inherit}.mw-parser-output .navbar-brackets::before{margin-right:-0.125em;content:"[ "}.mw-parser-output .navbar-brackets::after{margin-left:-0.125em;content:" ]"}.mw-parser-output .navbar li{word-spacing:-0.125em}.mw-parser-output .navbar a>span,.mw-parser-output .navbar a>abbr{text-decoration:inherit}.mw-parser-output .navbar-mini abbr{font-variant:small-caps;border-bottom:none;text-decoration:none;cursor:inherit}.mw-parser-output 
.navbar-ct-full{font-size:114%;margin:0 7em}.mw-parser-output .navbar-ct-mini{font-size:114%;margin:0 4em}html.skin-theme-clientpref-night .mw-parser-output .navbar li a abbr{color:var(--color-base)!important}@media(prefers-color-scheme:dark){html.skin-theme-clientpref-os .mw-parser-output .navbar li a abbr{color:var(--color-base)!important}}@media print{.mw-parser-output .navbar{display:none!important}}</style><div class="navbar plainlinks hlist navbar-mini"><ul><li class="nv-view"><a href="/wiki/Template:Apples" title="Template:Apples"><abbr title="View this template">v</abbr></a></li><li class="nv-talk"><a href="/wiki/Template_talk:Apples" title="Template talk:Apples"><abbr title="Discuss this template">t</abbr></a></li><li class="nv-edit"><a href="/wiki/Special:EditPage/Template:Apples" title="Special:EditPage/Template:Apples"><abbr title="Edit this template">e</abbr></a></li></ul></div><div id="Apples" style="font-size:114%;margin:0 4em"><a class="mw-selflink selflink">Apples</a></div></th></tr><tr style="display: none;"><td class="navbox-abovebelow" colspan="2"><div>
+<ul><li><a href="/wiki/List_of_apple_cultivars" title="List of apple cultivars">List of apple cultivars</a></li></ul>
+</div></td></tr><tr style="display: none;"><th scope="row" class="navbox-group" style="width:1%">Species</th><td class="navbox-list-with-group navbox-list navbox-odd" style="width:100%;padding:0"><div style="padding:0 0.25em">
+<ul><li><a class="mw-selflink selflink"><i>Malus domestica</i></a></li>
+<li><i><a href="/wiki/Malus_niedzwetzkyana" title="Malus niedzwetzkyana">Malus niedzwetzkyana</a></i></li>
+<li><i><a href="/wiki/Malus_sieversii" title="Malus sieversii">Malus sieversii</a></i></li></ul>
+</div></td></tr><tr style="display: none;"><th scope="row" class="navbox-group" style="width:1%"><a href="/wiki/Table_apple" title="Table apple">Table apples</a></th><td class="navbox-list-with-group navbox-list navbox-even" style="width:100%;padding:0"><div style="padding:0 0.25em">
+<ul><li><a href="/wiki/Adams_Pearmain" title="Adams Pearmain">Adams Pearmain</a></li>
+<li><a href="/wiki/Aia_Ilu" title="Aia Ilu">Aia Ilu</a></li>
+<li><a href="/wiki/Airlie_Red_Flesh" title="Airlie Red Flesh">Airlie Red Flesh</a></li>
+<li><a href="/wiki/Akane_(apple)" title="Akane (apple)">Akane</a></li>
+<li><a href="/wiki/%C3%85ker%C3%B6" title="Åkerö">Åkerö</a></li>
+<li><a href="/wiki/Alkmene_(apple)" title="Alkmene (apple)">Alkmene</a></li>
+<li><a href="/wiki/Allington_Pippin" title="Allington Pippin">Allington Pippin</a></li>
+<li><a href="/wiki/Ambrosia_(apple)" title="Ambrosia (apple)">Ambrosia</a></li>
+<li><a href="/wiki/Anna_(apple)" title="Anna (apple)">Anna</a></li>
+<li><a href="/wiki/Annurca" title="Annurca">Annurca</a></li>
+<li><a href="/wiki/Ariane_(apple)" title="Ariane (apple)">Ariane</a></li>
+<li><a href="/wiki/Arkansas_Black" title="Arkansas Black">Arkansas Black</a></li>
+<li><a href="/wiki/Ashmead%27s_Kernel" title="Ashmead's Kernel">Ashmead's Kernel</a></li>
+<li><a href="/wiki/Aurora_Golden_Gala" title="Aurora Golden Gala">Aurora Golden Gala</a></li>
+<li><a href="/wiki/Autumn_Bough" title="Autumn Bough">Autumn Bough</a></li>
+<li><a href="/wiki/Autumn_Glory" title="Autumn Glory">Autumn Glory</a></li>
+<li><a href="/wiki/Baldwin_(apple)" title="Baldwin (apple)">Baldwin</a></li>
+<li><a href="/wiki/Beacon_(apple)" title="Beacon (apple)">Beacon</a></li>
+<li><a href="/wiki/Beauty_of_Bath" title="Beauty of Bath">Beauty of Bath</a></li>
+<li><a href="/wiki/Belle_de_Boskoop" title="Belle de Boskoop">Belle de Boskoop</a></li>
+<li><a href="/wiki/Bellflower_apple" title="Bellflower apple">Bellflower</a></li>
+<li><a href="/wiki/Ben_Davis_(apple)" title="Ben Davis (apple)">Ben Davis</a></li>
+<li><a href="/wiki/Birgit_Bonnier" title="Birgit Bonnier">Birgit Bonnier</a></li>
+<li><a href="/wiki/Braeburn" title="Braeburn">Braeburn</a></li>
+<li><a href="/wiki/Brina" title="Brina">Brina</a></li>
+<li><a href="/wiki/Cameo_(apple)" title="Cameo (apple)">Cameo</a></li>
+<li><a href="/wiki/Champion_(apple)" title="Champion (apple)">Champion</a></li>
+<li><a href="/wiki/Civni_apple" title="Civni apple">Civni (Rubens)</a></li>
+<li><a href="/wiki/Claygate_Pearmain" title="Claygate Pearmain">Claygate Pearmain</a></li>
+<li><a href="/wiki/Clivia_(apple)" title="Clivia (apple)">Clivia</a></li>
+<li><a href="/wiki/Cornish_Aromatic" title="Cornish Aromatic">Cornish Aromatic</a></li>
+<li><a href="/wiki/Cornish_Gilliflower" title="Cornish Gilliflower">Cornish Gilliflower</a></li>
+<li><a href="/wiki/Cortland_(apple)" title="Cortland (apple)">Cortland</a></li>
+<li><a href="/wiki/Cosmic_Crisp" title="Cosmic Crisp">Cosmic Crisp</a></li>
+<li><a href="/wiki/Court_Pendu_Plat" title="Court Pendu Plat">Court Pendu Plat</a></li>
+<li><a href="/wiki/Cox%27s_Orange_Pippin" title="Cox's Orange Pippin">Cox's Orange Pippin</a></li>
+<li><a href="/wiki/Crimson_Gold_(apple)" title="Crimson Gold (apple)">Crimson Gold</a></li>
+<li><a href="/wiki/Cripps_Red" title="Cripps Red">Cripps Red</a></li>
+<li><a href="/wiki/Cripps_Pink" title="Cripps Pink">Cripps Pink (Pink Lady)</a></li>
+<li><a href="/wiki/Delbard_Jubil%C3%A9e" title="Delbard Jubilée">Delbard Jubilée</a></li>
+<li><a href="/wiki/Delbarestivale" title="Delbarestivale">Delbarestivale</a></li>
+<li><a href="/wiki/Delrouval" title="Delrouval">Delrouval</a></li>
+<li><a href="/wiki/Devonshire_Quarrenden" title="Devonshire Quarrenden">Devonshire Quarrenden</a></li>
+<li><a href="/wiki/Discovery_(apple)" title="Discovery (apple)">Discovery</a></li>
+<li><a href="/wiki/Dorsett_Golden" title="Dorsett Golden">Dorsett Golden</a></li>
+<li><a href="/wiki/Dougherty_(apple)" title="Dougherty (apple)">Dougherty</a></li>
+<li><a href="/wiki/Duchess_of_Oldenburg_(apple)" title="Duchess of Oldenburg (apple)">Duchess of Oldenburg</a></li>
+<li><a href="/wiki/Dumelow%27s_Seedling" title="Dumelow's Seedling">Dumelow's Seedling</a></li>
+<li><a href="/wiki/Egremont_Russet" title="Egremont Russet">Egremont Russet</a></li>
+<li><a href="/wiki/Ellison%27s_Orange" title="Ellison's Orange">Ellison's Orange</a></li>
+<li><a href="/wiki/Elstar" title="Elstar">Elstar</a></li>
+<li><a href="/wiki/Empire_(apple)" title="Empire (apple)">Empire</a></li>
+<li><a href="/wiki/Enterprise_(apple)" title="Enterprise (apple)">Enterprise</a></li>
+<li><a href="/wiki/Envy_(apple)" title="Envy (apple)">Envy</a></li>
+<li><a href="/wiki/Esopus_Spitzenburg" title="Esopus Spitzenburg">Esopus Spitzenburg</a></li>
+<li><a href="/wiki/Eva_(apple)" title="Eva (apple)">Eva</a></li>
+<li><a href="/wiki/EverCrisp" title="EverCrisp">EverCrisp</a></li>
+<li><a href="/wiki/Fiesta_(apple)" title="Fiesta (apple)">Fiesta</a></li>
+<li><a href="/wiki/Filippa_(apple)" title="Filippa (apple)">Filippa</a></li>
+<li><a href="/wiki/Flamenco_(apple)" title="Flamenco (apple)">Flamenco</a></li>
+<li><a href="/wiki/Florina_(apple)" title="Florina (apple)">Florina</a></li>
+<li><a href="/wiki/Fuji_(apple)" title="Fuji (apple)">Fuji</a></li>
+<li><a href="/wiki/Gala_(apple)" title="Gala (apple)">Gala</a></li>
+<li><a href="/wiki/Gascoyne%27s_Scarlet" title="Gascoyne's Scarlet">Gascoyne's Scarlet</a></li>
+<li><a href="/wiki/Geheimrat_Dr._Oldenburg" title="Geheimrat Dr. Oldenburg">Geheimrat Dr. Oldenburg</a></li>
+<li><a href="/wiki/Ginger_Gold" title="Ginger Gold">Ginger Gold</a></li>
+<li><a href="/wiki/Golden_Delicious" title="Golden Delicious">Golden Delicious</a></li>
+<li><a href="/wiki/Golden_Orange_(apple)" title="Golden Orange (apple)">Golden Orange</a></li>
+<li><a href="/wiki/Goldspur" title="Goldspur">Goldspur</a></li>
+<li><a href="/wiki/Granny_Smith" title="Granny Smith">Granny Smith</a></li>
+<li><a href="/wiki/Gravenstein" title="Gravenstein">Gravenstein</a></li>
+<li><a href="/wiki/Grimes_Golden" title="Grimes Golden">Grimes Golden</a></li>
+<li><a href="/wiki/Haralson_(apple)" title="Haralson (apple)">Haralson</a></li>
+<li><a href="/wiki/Hokuto_(apple)" title="Hokuto (apple)">Hokuto</a></li>
+<li><a href="/wiki/Honeycrisp" title="Honeycrisp">Honeycrisp</a></li>
+<li><a href="/wiki/Honeygold" title="Honeygold">Honeygold</a></li>
+<li><a href="/wiki/Idared" title="Idared">Idared</a></li>
+<li><a href="/wiki/Ingrid_Marie" title="Ingrid Marie">Ingrid Marie</a></li>
+<li><a href="/wiki/James_Grieve_(apple)" title="James Grieve (apple)">James Grieve</a></li>
+<li><a href="/wiki/Jazz_(apple)" title="Jazz (apple)">Jazz</a></li>
+<li><a href="/wiki/Jersey_Black" title="Jersey Black">Jersey Black</a></li>
+<li><a href="/wiki/Jonadel" title="Jonadel">Jonadel</a></li>
+<li><a href="/wiki/Jonagold" title="Jonagold">Jonagold</a></li>
+<li><a href="/wiki/Jonathan_(apple)" title="Jonathan (apple)">Jonathan</a></li>
+<li><a href="/wiki/Jubilee_apple" title="Jubilee apple">Jubilee</a></li>
+<li><a href="/wiki/Julieta_(apple)" title="Julieta (apple)">Julieta</a></li>
+<li><a href="/wiki/Jupiter_(apple)" title="Jupiter (apple)">Jupiter</a></li>
+<li><a href="/wiki/Kanzi_(apple)" title="Kanzi (apple)">Kanzi</a></li>
+<li><a href="/wiki/Karmijn_de_Sonnaville" title="Karmijn de Sonnaville">Karmijn de Sonnaville</a></li>
+<li><a href="/wiki/King_of_the_Pippins" title="King of the Pippins">King of the Pippins</a></li>
+<li><a href="/wiki/Knobby_Russet" title="Knobby Russet">Knobby Russet</a></li>
+<li><a href="/wiki/Lady_Alice_(apple)" title="Lady Alice (apple)">Lady Alice</a></li>
+<li><a href="/wiki/Laxton%27s_Superb" title="Laxton's Superb">Laxton's Superb</a></li>
+<li><a href="/wiki/Liberty_(apple)" title="Liberty (apple)">Liberty</a></li>
+<li><a href="/wiki/Liveland_Raspberry_apple" title="Liveland Raspberry apple">Liveland Raspberry</a></li>
+<li><a href="/wiki/Lodi_(apple)" title="Lodi (apple)">Lodi</a></li>
+<li><a href="/wiki/Lord_Lambourne_(apple)" title="Lord Lambourne (apple)">Lord Lambourne</a></li>
+<li><a href="/wiki/Lucombe%27s_Seedling" title="Lucombe's Seedling">Lucombe's Seedling</a></li>
+<li><a href="/wiki/Macoun_apple" title="Macoun apple">Macoun</a></li>
+<li><a href="/wiki/McIntosh_(apple)" title="McIntosh (apple)">McIntosh</a></li>
+<li><a href="/wiki/Melba_(apple)" title="Melba (apple)">Melba</a></li>
+<li><a href="/wiki/Melrose_(apple)" title="Melrose (apple)">Melrose</a></li>
+<li><a href="/wiki/Mutsu_(apple)" title="Mutsu (apple)">Mutsu</a></li>
+<li><a href="/wiki/Newtown_Pippin" title="Newtown Pippin">Newtown Pippin</a></li>
+<li><a href="/wiki/Nicola_(apple)" title="Nicola (apple)">Nicola</a></li>
+<li><a href="/wiki/Opal_(apple)" title="Opal (apple)">Opal</a></li>
+<li><a href="/wiki/Sciros" title="Sciros">Sciros (Pacific Rose)</a></li>
+<li><a href="/wiki/Pam%27s_Delight" title="Pam's Delight">Pam's Delight</a></li>
+<li><a href="/wiki/Papirovka" title="Papirovka">Papirovka</a></li>
+<li><a href="/wiki/Paula_Red" title="Paula Red">Paula Red</a></li>
+<li><a href="/wiki/Pink_Pearl_(apple)" title="Pink Pearl (apple)">Pink Pearl</a></li>
+<li><a href="/wiki/Pinova" title="Pinova">Pinova</a></li>
+<li><a href="/wiki/Prima_apple" title="Prima apple">Prima</a></li>
+<li><a href="/wiki/Pristine_apple" title="Pristine apple">Pristine</a></li>
+<li><a href="/wiki/Rajka_(apple)" title="Rajka (apple)">Rajka</a></li>
+<li><a href="/wiki/Ralls_Janet" title="Ralls Janet">Ralls Janet</a></li>
+<li><a href="/wiki/Rambo_apple" title="Rambo apple">Rambo</a></li>
+<li><a href="/wiki/MN55_(apple)" title="MN55 (apple)">Rave</a></li>
+<li><a href="/wiki/Red_Astrachan" title="Red Astrachan">Red Astrachan</a></li>
+<li><a href="/wiki/Red_Delicious" title="Red Delicious">Red Delicious</a></li>
+<li><a href="/wiki/Red_Pineapple_(apple)" title="Red Pineapple (apple)">Red Pineapple</a></li>
+<li><a href="/wiki/Redlove_apples" title="Redlove apples">Redlove apples</a></li>
+<li><a href="/wiki/Rhode_Island_Greening" title="Rhode Island Greening">Rhode Island Greening</a></li>
+<li><a href="/wiki/Ribston_Pippin" title="Ribston Pippin">Ribston Pippin</a></li>
+<li><a href="/wiki/Roxbury_Russet" title="Roxbury Russet">Roxbury Russet</a></li>
+<li><a href="/wiki/Sandow_(apple)" title="Sandow (apple)">Sandow</a></li>
+<li><a href="/wiki/Sansa_apple" title="Sansa apple">Sansa</a></li>
+<li><a href="/wiki/Sekai_Ichi" title="Sekai Ichi">Sekai Ichi</a></li>
+<li><a href="/wiki/Spartan_(apple)" title="Spartan (apple)">Spartan</a></li>
+<li><a href="/wiki/Splendour_(apple)" title="Splendour (apple)">Splendour</a></li>
+<li><a href="/wiki/Star_of_Devon" title="Star of Devon">Star of Devon</a></li>
+<li><a href="/wiki/Stayman_(apple)" title="Stayman (apple)">Stayman</a></li>
+<li><a href="/wiki/Sturmer_Pippin" title="Sturmer Pippin">Sturmer Pippin</a></li>
+<li><a href="/wiki/Summerfree" title="Summerfree">Summerfree</a></li>
+<li><a href="/wiki/Cripps_Red" title="Cripps Red">Sundowner</a></li>
+<li><a href="/wiki/Sunset_(apple)" title="Sunset (apple)">Sunset</a></li>
+<li><a href="/wiki/Suntan_(apple)" title="Suntan (apple)">Suntan</a></li>
+<li><a href="/wiki/SweeTango" title="SweeTango">SweeTango</a></li>
+<li><a href="/wiki/Taliaferro_(apple)" title="Taliaferro (apple)">Taliaferro</a></li>
+<li><a href="/wiki/Tartu_Rose" title="Tartu Rose">Tartu Rose</a></li>
+<li><a href="/wiki/Tentation" title="Tentation">Tentation</a></li>
+<li><a href="/wiki/Tompkins_King" title="Tompkins King">Tompkins King</a></li>
+<li><a href="/wiki/Topaz_(apple)" title="Topaz (apple)">Topaz</a></li>
+<li><a href="/wiki/Wealthy_(apple)" title="Wealthy (apple)">Wealthy</a></li>
+<li><a href="/wiki/Winesap" title="Winesap">Winesap</a></li>
+<li><a href="/wiki/Winston_(apple)" title="Winston (apple)">Winston</a></li>
+<li><a href="/wiki/Worcester_Pearmain" title="Worcester Pearmain">Worcester Pearmain</a></li>
+<li><a href="/wiki/Wyken_Pippin" title="Wyken Pippin">Wyken Pippin</a></li>
+<li><a href="/wiki/York_Imperial" title="York Imperial">York Imperial</a></li>
+<li><a href="/wiki/Zestar_apple" title="Zestar apple">Zestar</a></li></ul>
+</div></td></tr><tr style="display: none;"><th scope="row" class="navbox-group" style="width:1%"><a href="/wiki/Cooking_apple" title="Cooking apple">Cooking apples</a></th><td class="navbox-list-with-group navbox-list navbox-odd" style="width:100%;padding:0"><div style="padding:0 0.25em">
+<ul><li><a href="/wiki/Antonovka" title="Antonovka">Antonovka</a></li>
+<li><a href="/wiki/Bismarck_(apple)" title="Bismarck (apple)">Bismarck</a></li>
+<li><a href="/wiki/Blenheim_Orange" title="Blenheim Orange">Blenheim Orange</a></li>
+<li><a href="/wiki/Bramley_apple" title="Bramley apple">Bramley</a></li>
+<li><a href="/wiki/Calville_Blanc_d%27hiver" title="Calville Blanc d'hiver">Calville Blanc d'hiver</a></li>
+<li><a href="/wiki/Campanino" title="Campanino">Campanino</a></li>
+<li><a href="/wiki/Cellini_(apple)" title="Cellini (apple)">Cellini</a></li>
+<li><a href="/wiki/Chelmsford_Wonder" title="Chelmsford Wonder">Chelmsford Wonder</a></li>
+<li><a href="/wiki/Costard_(apple)" title="Costard (apple)">Costard</a></li>
+<li><a href="/wiki/Creston_(apple)" title="Creston (apple)">Creston</a></li>
+<li><a href="/wiki/Crimson_Bramley" title="Crimson Bramley">Crimson Bramley</a></li>
+<li><a href="/wiki/Flower_of_Kent" title="Flower of Kent">Flower of Kent</a></li>
+<li><a href="/wiki/Golden_Noble" title="Golden Noble">Golden Noble</a></li>
+<li><a href="/wiki/Granny_Smith" title="Granny Smith">Granny Smith</a></li>
+<li><a href="/wiki/Grenadier_(apple)" title="Grenadier (apple)">Grenadier</a></li>
+<li><a href="/wiki/King_Byerd" title="King Byerd">King Byerd</a></li>
+<li><a href="/wiki/Manks_Codlin" title="Manks Codlin">Manks Codlin</a></li>
+<li><a href="/wiki/Newton_Wonder" title="Newton Wonder">Newton Wonder</a></li>
+<li><a href="/wiki/Norfolk_Biffin" title="Norfolk Biffin">Norfolk Biffin</a></li>
+<li><a href="/wiki/Northern_Spy" title="Northern Spy">Northern Spy</a></li>
+<li><a href="/wiki/Reinette_du_Canada" title="Reinette du Canada">Reinette du Canada</a></li>
+<li><a href="/wiki/Rome_apple" title="Rome apple">Rome</a></li>
+<li><a href="/wiki/Upton_Pyne_apple" title="Upton Pyne apple">Upton Pyne</a></li>
+<li><a href="/wiki/White_Transparent" title="White Transparent">White Transparent</a></li>
+<li><a href="/wiki/Wolf_River_(apple)" title="Wolf River (apple)">Wolf River</a></li></ul>
+</div></td></tr><tr style="display: none;"><th scope="row" class="navbox-group" style="width:1%"><a href="/wiki/Cider_apple" title="Cider apple">Cider apples</a></th><td class="navbox-list-with-group navbox-list navbox-even" style="width:100%;padding:0"><div style="padding:0 0.25em">
+<ul><li><a href="/wiki/Brown_Snout" title="Brown Snout">Brown Snout</a></li>
+<li><a href="/wiki/Cap_of_Liberty_(apple)" title="Cap of Liberty (apple)">Cap of Liberty</a></li>
+<li><a href="/wiki/Chisel_Jersey" title="Chisel Jersey">Chisel Jersey</a></li>
+<li><a href="/wiki/Coccagee" title="Coccagee">Coccagee</a></li>
+<li><a href="/wiki/Crimson_King_(apple)" title="Crimson King (apple)">Crimson King</a></li>
+<li><a href="/wiki/Dabinett" title="Dabinett">Dabinett</a></li>
+<li><a href="/wiki/Dufflin_(apple)" title="Dufflin (apple)">Dufflin</a></li>
+<li><a href="/wiki/Ellis_Bitter" title="Ellis Bitter">Ellis Bitter</a></li>
+<li><a href="/wiki/Foxwhelp" title="Foxwhelp">Foxwhelp</a></li>
+<li><a href="/wiki/Golden_Russet" title="Golden Russet">Golden Russet</a></li>
+<li><a href="/wiki/Golden_Spire" title="Golden Spire">Golden Spire</a></li>
+<li><a href="/wiki/Hangdown_(apple)" title="Hangdown (apple)">Hangdown</a></li>
+<li><a href="/wiki/Harrison_Cider_Apple" title="Harrison Cider Apple">Harrison Cider</a></li>
+<li><a href="/wiki/Kingston_Black" title="Kingston Black">Kingston Black</a></li>
+<li><a href="/wiki/Major_(cider_apple)" title="Major (cider apple)">Major</a></li>
+<li><a href="/wiki/Michelin_(apple)" title="Michelin (apple)">Michelin</a></li>
+<li><a href="/wiki/Poveshon" title="Poveshon">Poveshon</a></li>
+<li><a href="/wiki/Redstreak" title="Redstreak">Redstreak</a></li>
+<li><a href="/wiki/Slack-ma-Girdle" title="Slack-ma-Girdle">Slack-ma-Girdle</a></li>
+<li><a href="/wiki/Styre" title="Styre">Styre</a></li>
+<li><a href="/wiki/Tom_Putt" title="Tom Putt">Tom Putt</a></li>
+<li><a href="/wiki/Woodcock_(apple)" title="Woodcock (apple)">Woodcock</a></li>
+<li><a href="/wiki/Yarlington_Mill" title="Yarlington Mill">Yarlington Mill</a></li></ul>
+</div></td></tr><tr style="display: none;"><th scope="row" class="navbox-group" style="width:1%"><a href="/wiki/Ornamental_plant" title="Ornamental plant">Ornamental apple</a></th><td class="navbox-list-with-group navbox-list navbox-odd" style="width:100%;padding:0"><div style="padding:0 0.25em">
+<ul><li><a href="/wiki/Flamenco_(apple)" title="Flamenco (apple)">Flamenco</a></li>
+<li><a href="/wiki/Goldspur" title="Goldspur">Goldspur</a></li>
+<li><a href="/wiki/Wijcik_McIntosh" title="Wijcik McIntosh">Wijcik McIntosh</a></li></ul>
+</div></td></tr><tr style="display: none;"><th scope="row" class="navbox-group" style="width:1%"><a href="/wiki/List_of_apple_dishes" title="List of apple dishes">Apple products</a></th><td class="navbox-list-with-group navbox-list navbox-odd" style="width:100%;padding:0"><div style="padding:0 0.25em"></div><table class="nowraplinks navbox-subgroup" style="border-spacing:0"><tbody><tr><th scope="row" class="navbox-group" style="width:1%">Food</th><td class="navbox-list-with-group navbox-list navbox-even" style="width:100%;padding:0"><div style="padding:0 0.25em">
+<ul><li><a href="/wiki/Apple_butter" title="Apple butter">Apple butter</a></li>
+<li><a href="/wiki/Apple_cake" title="Apple cake">Apple cake</a></li>
+<li><a href="/wiki/Apple_cheese" title="Apple cheese">Apple cheese</a></li>
+<li><a href="/wiki/Apple_chip" title="Apple chip">Apple chip</a></li>
+<li><a href="/wiki/Apple_cider_vinegar" title="Apple cider vinegar">Apple cider vinegar</a></li>
+<li><a href="/wiki/Apple_crisp" title="Apple crisp">Apple crisp</a></li>
+<li><a href="/wiki/Apple_flour" title="Apple flour">Apple flour</a></li>
+<li><a href="/wiki/Apple_pie" title="Apple pie">Apple pie</a></li>
+<li><a href="/wiki/Apple_sauce" title="Apple sauce">Apple sauce</a></li>
+<li><a href="/wiki/Apple_seed_oil" title="Apple seed oil">Apple seed oil</a></li>
+<li><a href="/wiki/Apple_strudel" title="Apple strudel">Apple strudel</a></li>
+<li><a href="/wiki/Cooking_apple" title="Cooking apple">Baked apple</a></li>
+<li><a href="/wiki/Candy_apple" title="Candy apple">Candy apple</a></li>
+<li><a href="/wiki/Caramel_apple" title="Caramel apple">Caramel apple</a></li>
+<li><a href="/wiki/Himmel_und_Erde" title="Himmel und Erde">Himmel und Erde</a></li>
+<li><a href="/wiki/Jewish_apple_cake" title="Jewish apple cake">Jewish apple cake</a></li>
+<li><a href="/wiki/Pectin" title="Pectin">Pectin</a></li></ul>
+</div></td></tr><tr><th scope="row" class="navbox-group" style="width:1%">Drink</th><td class="navbox-list-with-group navbox-list navbox-odd" style="width:100%;padding:0"><div style="padding:0 0.25em">
+<ul><li><a href="/wiki/Apfelwein" title="Apfelwein">Apfelwein</a></li>
+<li><a href="/wiki/Apple_cider" title="Apple cider">Apple cider</a></li>
+<li><a href="/wiki/Apple_juice" title="Apple juice">Apple juice</a></li>
+<li><a href="/wiki/Applejack_(drink)" title="Applejack (drink)">Applejack</a></li>
+<li><a href="/wiki/Calvados" title="Calvados">Calvados</a></li>
+<li><a href="/wiki/Cider" title="Cider">Cider</a></li>
+<li><a href="/wiki/Ice_cider" title="Ice cider">Ice cider</a></li>
+<li><a href="/wiki/Pommeau" title="Pommeau">Pommeau</a></li></ul>
+</div></td></tr></tbody></table><div></div></td></tr><tr style="display: none;"><th scope="row" class="navbox-group" style="width:1%">Agriculture</th><td class="navbox-list-with-group navbox-list navbox-even" style="width:100%;padding:0"><div style="padding:0 0.25em">
+<ul><li><a href="/wiki/Apple_picking" class="mw-redirect" title="Apple picking">Apple picking</a></li>
+<li><a href="/wiki/Apple_scab" title="Apple scab">Apple scab</a></li>
+<li><a href="/wiki/Applecrab" title="Applecrab">Applecrab</a></li>
+<li><a href="/wiki/Arctic_Apples" title="Arctic Apples">Arctic Apples</a></li>
+<li><a href="/wiki/Fruit_tree_pruning" title="Fruit tree pruning">Fruit tree pruning</a></li>
+<li><i><a href="/wiki/Gymnosporangium_juniperi-virginianae" title="Gymnosporangium juniperi-virginianae">Gymnosporangium juniperi-virginianae</a></i></li>
+<li><a href="/wiki/Johnny_Appleseed" title="Johnny Appleseed">Johnny Appleseed</a></li>
+<li><a href="/wiki/Malling_series" title="Malling series">Malling series</a></li>
+<li><i><a href="/wiki/Malus" title="Malus">Malus</a></i></li>
+<li><a href="/wiki/Pearmain" title="Pearmain">Pearmain</a></li>
+<li><a href="/wiki/Fruit_tree_pollination#Apples" title="Fruit tree pollination">Pollination</a></li>
+<li><a href="/wiki/Pome" title="Pome">Pome</a></li>
+<li><a href="/wiki/PRI_disease_resistant_apple_breeding_program" title="PRI disease resistant apple breeding program">PRI disease resistant apple breeding program</a></li>
+<li><a href="/wiki/Reinette" title="Reinette">Reinette</a></li>
+<li><a href="/wiki/Russet_apple" title="Russet apple">Russeting</a></li>
+<li><a href="/wiki/US_Apple_Association" class="mw-redirect" title="US Apple Association">US Apple Association</a></li>
+<li>Lists
+<ul><li><a href="/wiki/List_of_countries_by_apple_production" title="List of countries by apple production">Countries by apple production</a></li>
+<li><a href="/wiki/List_of_apple_diseases" title="List of apple diseases">Apple diseases</a></li></ul></li></ul>
+</div></td></tr><tr style="display: none;"><td class="navbox-abovebelow hlist" colspan="2"><div>
+<ul><li><span class="noviewer" typeof="mw:File"><span title="Category"><img alt="" src="//upload.wikimedia.org/wikipedia/en/thumb/9/96/Symbol_category_class.svg/16px-Symbol_category_class.svg.png" decoding="async" width="16" height="16" class="mw-file-element" srcset="//upload.wikimedia.org/wikipedia/en/thumb/9/96/Symbol_category_class.svg/23px-Symbol_category_class.svg.png 1.5x, //upload.wikimedia.org/wikipedia/en/thumb/9/96/Symbol_category_class.svg/31px-Symbol_category_class.svg.png 2x" data-file-width="180" data-file-height="185"></span></span> <a href="/wiki/Category:Apples" title="Category:Apples">Apples</a></li>
+<li><span class="noviewer" typeof="mw:File"><span title="Category"><img alt="" src="//upload.wikimedia.org/wikipedia/en/thumb/9/96/Symbol_category_class.svg/16px-Symbol_category_class.svg.png" decoding="async" width="16" height="16" class="mw-file-element" srcset="//upload.wikimedia.org/wikipedia/en/thumb/9/96/Symbol_category_class.svg/23px-Symbol_category_class.svg.png 1.5x, //upload.wikimedia.org/wikipedia/en/thumb/9/96/Symbol_category_class.svg/31px-Symbol_category_class.svg.png 2x" data-file-width="180" data-file-height="185"></span></span> <a href="/wiki/Category:Apple_cultivars" title="Category:Apple cultivars">Cultivars</a></li>
+<li><span class="noviewer" typeof="mw:File"><span title="Category"><img alt="" src="//upload.wikimedia.org/wikipedia/en/thumb/9/96/Symbol_category_class.svg/16px-Symbol_category_class.svg.png" decoding="async" width="16" height="16" class="mw-file-element" srcset="//upload.wikimedia.org/wikipedia/en/thumb/9/96/Symbol_category_class.svg/23px-Symbol_category_class.svg.png 1.5x, //upload.wikimedia.org/wikipedia/en/thumb/9/96/Symbol_category_class.svg/31px-Symbol_category_class.svg.png 2x" data-file-width="180" data-file-height="185"></span></span> <a href="/wiki/Category:Apple_production" title="Category:Apple production">Production</a></li></ul>
+</div></td></tr></tbody></table></div>
+<div class="navbox-styles"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1129693374"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1236075235"></div><div role="navigation" class="navbox" aria-labelledby="&amp;quot;Crabapple&amp;quot;_or_&amp;quot;Wild_apple&amp;quot;_(of_the_genus_Malus)" style="padding:3px"><table class="nowraplinks hlist mw-collapsible autocollapse navbox-inner mw-made-collapsible mw-collapsed" style="border-spacing:0;background:transparent;color:inherit"><tbody><tr><th scope="col" class="navbox-title" colspan="3" style="background:name;"><button type="button" class="mw-collapsible-toggle mw-collapsible-toggle-default mw-collapsible-toggle-collapsed" aria-expanded="false" tabindex="0"><span class="mw-collapsible-text">show</span></button><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1129693374"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1239400231"><div class="navbar plainlinks hlist navbar-mini"><ul><li class="nv-view"><a href="/wiki/Template:Crabapple" title="Template:Crabapple"><abbr title="View this template">v</abbr></a></li><li class="nv-talk"><a href="/wiki/Template_talk:Crabapple" title="Template talk:Crabapple"><abbr title="Discuss this template">t</abbr></a></li><li class="nv-edit"><a href="/wiki/Special:EditPage/Template:Crabapple" title="Special:EditPage/Template:Crabapple"><abbr title="Edit this template">e</abbr></a></li></ul></div><div id="&amp;quot;Crabapple&amp;quot;_or_&amp;quot;Wild_apple&amp;quot;_(of_the_genus_Malus)" style="font-size:114%;margin:0 4em">"<a href="/wiki/Malus" title="Malus">Crabapple</a>" <small>or</small> "Wild apple" <small>(of the <a href="/wiki/Genus" title="Genus">genus</a></small> <i><a href="/wiki/Malus" title="Malus">Malus</a></i>)</div></th></tr><tr style="display: none;"><th scope="row" class="navbox-group" style="width:1%"><a href="/wiki/Species" title="Species">Species</a>, <a 
href="/wiki/Variety_(botany)" title="Variety (botany)">varieties</a><br> and <a href="/wiki/Cultivar" title="Cultivar">cultivars</a></th><td class="navbox-list-with-group navbox-list navbox-odd" style="width:100%;padding:0"><div style="padding:0 0.25em">
+<ul><li><i><a href="/wiki/Malus_angustifolia" title="Malus angustifolia">Malus angustifolia</a></i> <small>(Southern)</small></li>
+<li><i><a href="/wiki/Malus_asiatica" title="Malus asiatica">Malus asiatica</a></i> <small>(Chinese pearleaf)</small></li>
+<li><i><a href="/wiki/Malus_baccata" title="Malus baccata">Malus baccata</a></i> <small>(Siberian)</small></li>
+<li><i><a href="/wiki/Malus_bracteata" class="mw-redirect" title="Malus bracteata">Malus bracteata</a></i></li>
+<li><i><a href="/wiki/Malus_brevipes" title="Malus brevipes">Malus brevipes</a></i></li>
+<li><i><a href="/wiki/Malus_coronaria" title="Malus coronaria">Malus coronaria</a></i> <small>(Sweet)</small></li>
+<li><i><a href="/wiki/Malus_crescimannoi" title="Malus crescimannoi">Malus crescimannoi</a></i></li>
+<li><i><a href="/wiki/Malus_doumeri" title="Malus doumeri">Malus doumeri</a></i></li>
+<li><i><a href="/wiki/Malus_%27Evereste%27" title="Malus 'Evereste'">Malus 'Evereste'</a></i></li>
+<li><i><a href="/wiki/Malus_florentina" title="Malus florentina">Malus florentina</a></i></li>
+<li><i><a href="/wiki/Malus_floribunda" title="Malus floribunda">Malus floribunda</a></i> <small>(Japanese)</small></li>
+<li><i><a href="/wiki/Malus_fusca" title="Malus fusca">Malus fusca</a></i> <small>(Oregon/Pacific)</small></li>
+<li><i><a href="/wiki/Malus_glabrata" class="mw-redirect" title="Malus glabrata">Malus glabrata</a></i></li>
+<li><i><a href="/wiki/Malus_glaucescens" class="mw-redirect" title="Malus glaucescens">Malus glaucescens</a></i></li>
+<li><i><a href="/wiki/Malus_halliana" title="Malus halliana">Malus halliana</a></i></li>
+<li><i><a href="/wiki/Malus_honanensis" title="Malus honanensis">Malus honanensis</a></i></li>
+<li><i><a href="/wiki/Malus_hupehensis" title="Malus hupehensis">Malus hupehensis</a></i> <small>(Tea)</small></li>
+<li><i><a href="/wiki/Malus_ioensis" title="Malus ioensis">Malus ioensis</a></i> <small>(Prairie)</small></li>
+<li><i><a href="/wiki/Malus_kansuensis" title="Malus kansuensis">Malus kansuensis</a></i></li>
+<li><i><a href="/wiki/Malus_lancifolia" class="mw-redirect" title="Malus lancifolia">Malus lancifolia</a></i></li>
+<li><i><a href="/wiki/Malus_mandshurica" title="Malus mandshurica">Malus mandshurica</a></i> <small>(Manchurian)</small></li>
+<li><i><a href="/wiki/Malus_niedzwetskyana" class="mw-redirect" title="Malus niedzwetskyana">Malus niedzwetskyana</a></i></li>
+<li><i><a href="/wiki/Malus_orientalis" title="Malus orientalis">Malus orientalis</a></i> (Caucasian)</li>
+<li><i><a href="/wiki/Malus_prattii" title="Malus prattii">Malus prattii</a></i></li>
+<li><i><a href="/wiki/Malus_prunifolia" title="Malus prunifolia">Malus prunifolia</a></i></li>
+<li><i><a href="/wiki/Malus_rockii" title="Malus rockii">Malus rockii</a></i></li>
+<li><i><a href="/wiki/Malus_sargentii" title="Malus sargentii">Malus sargentii</a></i></li>
+<li><i><a href="/wiki/Malus_sieboldii" title="Malus sieboldii">Malus sieboldii</a></i></li>
+<li><i><a href="/wiki/Malus_sieversii" title="Malus sieversii">Malus sieversii</a></i> <small>(Asian wild/Almaty)</small></li>
+<li><i><a href="/wiki/Malus_sikkimensis" title="Malus sikkimensis">Malus sikkimensis</a></i></li>
+<li><i><a href="/wiki/Malus_spectabilis" title="Malus spectabilis">Malus spectabilis</a></i></li>
+<li><i><a href="/wiki/Malus_sublobata" class="mw-redirect" title="Malus sublobata">Malus sublobata</a></i></li>
+<li><i><a href="/wiki/Malus_sylvestris" title="Malus sylvestris">Malus sylvestris</a></i> <small>(European wild)</small></li>
+<li><i><a href="/wiki/Malus_toringoides" title="Malus toringoides">Malus toringoides</a></i></li>
+<li><i><a href="/wiki/Malus_transitoria" title="Malus transitoria">Malus transitoria</a></i></li>
+<li><i><a href="/wiki/Malus_trilobata" title="Malus trilobata">Malus trilobata</a></i></li>
+<li><i><a href="/wiki/Malus_tschonoskii" class="mw-redirect" title="Malus tschonoskii">Malus tschonoskii</a></i></li>
+<li><i><a href="/wiki/Malus_yunnanensis" title="Malus yunnanensis">Malus yunnanensis</a></i></li></ul>
+</div></td><td class="noviewer navbox-image" rowspan="2" style="width:1px;padding:0 0 0 2px"><div><span typeof="mw:File"><a href="/wiki/File:Crab_apples_by_the_roadside_-_geograph.org.uk_-_978786.jpg" class="mw-file-description" title="Crab apples by the roadside"><img alt="Crab apples by the roadside" src="//upload.wikimedia.org/wikipedia/commons/thumb/0/01/Crab_apples_by_the_roadside_-_geograph.org.uk_-_978786.jpg/100px-Crab_apples_by_the_roadside_-_geograph.org.uk_-_978786.jpg" decoding="async" width="100" height="133" class="mw-file-element" srcset="//upload.wikimedia.org/wikipedia/commons/thumb/0/01/Crab_apples_by_the_roadside_-_geograph.org.uk_-_978786.jpg/150px-Crab_apples_by_the_roadside_-_geograph.org.uk_-_978786.jpg 1.5x, //upload.wikimedia.org/wikipedia/commons/thumb/0/01/Crab_apples_by_the_roadside_-_geograph.org.uk_-_978786.jpg/200px-Crab_apples_by_the_roadside_-_geograph.org.uk_-_978786.jpg 2x" data-file-width="480" data-file-height="640"></a></span></div></td></tr><tr style="display: none;"><th scope="row" class="navbox-group" style="width:1%">Topics</th><td class="navbox-list-with-group navbox-list navbox-even" style="width:100%;padding:0"><div style="padding:0 0.25em">
+<ul><li><a class="mw-selflink selflink">Apple</a></li>
+<li><a href="/wiki/Applecrab" title="Applecrab">Applecrab</a></li>
+<li><a href="/wiki/Malling_series" title="Malling series">Malling series</a></li></ul>
+</div></td></tr><tr style="display: none;"><td class="navbox-abovebelow" colspan="3" style="font-weight:bold;"><div>
+<ul><li><span class="noviewer" typeof="mw:File"><span title="Category"><img alt="" src="//upload.wikimedia.org/wikipedia/en/thumb/9/96/Symbol_category_class.svg/16px-Symbol_category_class.svg.png" decoding="async" width="16" height="16" class="mw-file-element" srcset="//upload.wikimedia.org/wikipedia/en/thumb/9/96/Symbol_category_class.svg/23px-Symbol_category_class.svg.png 1.5x, //upload.wikimedia.org/wikipedia/en/thumb/9/96/Symbol_category_class.svg/31px-Symbol_category_class.svg.png 2x" data-file-width="180" data-file-height="185"></span></span> <a href="/wiki/Category:Apple_cultivars" title="Category:Apple cultivars">Category</a></li>
+<li><span class="noviewer" typeof="mw:File"><span title="Commons page"><img alt="" src="//upload.wikimedia.org/wikipedia/en/thumb/4/4a/Commons-logo.svg/12px-Commons-logo.svg.png" decoding="async" width="12" height="16" class="mw-file-element" srcset="//upload.wikimedia.org/wikipedia/en/thumb/4/4a/Commons-logo.svg/18px-Commons-logo.svg.png 1.5x, //upload.wikimedia.org/wikipedia/en/thumb/4/4a/Commons-logo.svg/24px-Commons-logo.svg.png 2x" data-file-width="1024" data-file-height="1376"></span></span> <a href="https://commons.wikimedia.org/wiki/Category:Apple_cultivars" class="extiw" title="commons:Category:Apple cultivars">Commons</a></li></ul>
+</div></td></tr></tbody></table></div>
+<div class="navbox-styles"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1129693374"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1236075235"></div><div role="navigation" class="navbox" aria-labelledby="Taxon_identifiers" style="padding:3px"><table class="nowraplinks hlist navbox-inner" style="border-spacing:0;background:transparent;color:inherit"><tbody><tr><th scope="col" class="navbox-title" colspan="2"><div id="Taxon_identifiers" style="font-size:114%;margin:0 4em"><a href="/wiki/Help:Taxon_identifiers" title="Help:Taxon identifiers">Taxon identifiers</a></div></th></tr><tr><th scope="row" class="navbox-group" style="width:1%;text-align: left;"><i>Malus domestica</i></th><td class="navbox-list-with-group navbox-list navbox-odd" style="width:100%;padding:0"><div style="padding:0 0.25em">
+<ul><li><span style="white-space:nowrap;"><a href="/wiki/Wikidata" title="Wikidata">Wikidata</a>: <span class="uid"><span class="external"><a href="https://www.wikidata.org/wiki/Q18674606" class="extiw" title="wikidata:Q18674606">Q18674606</a></span></span></span></li>
+<li><span style="white-space:nowrap;"><a href="/wiki/Wikispecies" title="Wikispecies">Wikispecies</a>: <span class="uid"><span class="external"><a href="https://species.wikimedia.org/wiki/Malus_domestica" class="extiw" title="wikispecies:Malus domestica">Malus domestica</a></span></span></span></li>
+<li><span style="white-space:nowrap;">APDB: <span class="uid"><a rel="nofollow" class="external text" href="https://africanplantdatabase.ch/en/nomen/152668">152668</a></span></span></li>
+<li><span style="white-space:nowrap;"><a href="/wiki/Australian_Plant_Name_Index" title="Australian Plant Name Index">APNI</a>: <span class="uid"><a rel="nofollow" class="external text" href="https://id.biodiversity.org.au/name/apni/122984">122984</a></span></span></li>
+<li><span style="white-space:nowrap;">BioLib: <span class="uid"><a rel="nofollow" class="external text" href="https://www.biolib.cz/en/taxon/id39552">39552</a></span></span></li>
+<li><span style="white-space:nowrap;"><a href="/wiki/Barcode_of_Life_Data_System" title="Barcode of Life Data System">BOLD</a>: <span class="uid"><a rel="nofollow" class="external text" href="http://www.boldsystems.org/index.php/TaxBrowser_TaxonPage?taxid=254406">254406</a></span></span></li>
+<li><span style="white-space:nowrap;"><a href="/wiki/Catalogue_of_Life" title="Catalogue of Life">CoL</a>: <span class="uid"><a rel="nofollow" class="external text" href="https://www.catalogueoflife.org/data/taxon/7NHJZ">7NHJZ</a></span></span></li>
+<li><span style="white-space:nowrap;"><a href="/wiki/Ecocrop" title="Ecocrop">Ecocrop</a>: <span class="uid"><a rel="nofollow" class="external text" href="https://ecocrop.review.fao.org/ecocrop/srv/en/cropView?id=1407">1407</a></span></span></li>
+<li><span style="white-space:nowrap;"><a href="/wiki/EPPO_Code" title="EPPO Code">EPPO</a>: <span class="uid"><a rel="nofollow" class="external text" href="https://gd.eppo.int/taxon/MABSD">MABSD</a></span></span></li>
+<li><span style="white-space:nowrap;"><a href="/wiki/European_Nature_Information_System" class="mw-redirect" title="European Nature Information System">EUNIS</a>: <span class="uid"><a rel="nofollow" class="external text" href="https://eunis.eea.europa.eu/species/180045">180045</a></span></span></li>
+<li><span style="white-space:nowrap;"><a href="/wiki/Flora_of_North_America" title="Flora of North America">FNA</a>: <span class="uid"><a rel="nofollow" class="external text" href="http://www.efloras.org/florataxon.aspx?flora_id=1&amp;taxon_id=242331459">242331459</a></span></span></li>
+<li><span style="white-space:nowrap;"><a href="/wiki/Global_Biodiversity_Information_Facility" title="Global Biodiversity Information Facility">GBIF</a>: <span class="uid"><a rel="nofollow" class="external text" href="https://www.gbif.org/species/3001244">3001244</a></span></span></li>
+<li><span style="white-space:nowrap;"><a href="/wiki/Germplasm_Resources_Information_Network" title="Germplasm Resources Information Network">GRIN</a>: <span class="uid"><a rel="nofollow" class="external text" href="https://npgsweb.ars-grin.gov/gringlobal/taxonomydetail.aspx?id=104681">104681</a></span></span></li>
+<li><span style="white-space:nowrap;"><a href="/wiki/INaturalist" title="INaturalist">iNaturalist</a>: <span class="uid"><a rel="nofollow" class="external text" href="https://inaturalist.org/taxa/469472">469472</a></span></span></li>
+<li><span style="white-space:nowrap;"><a href="/wiki/International_Plant_Names_Index" title="International Plant Names Index">IPNI</a>: <span class="uid"><a rel="nofollow" class="external text" href="https://www.ipni.org/n/726282-1">726282-1</a></span></span></li>
+<li><span style="white-space:nowrap;"><a href="/wiki/Integrated_Taxonomic_Information_System" title="Integrated Taxonomic Information System">ITIS</a>: <span class="uid"><a rel="nofollow" class="external text" href="https://www.itis.gov/servlet/SingleRpt/SingleRpt?search_topic=TSN&amp;search_value=516655">516655</a></span></span></li>
+<li><span style="white-space:nowrap;"><a href="/wiki/National_Center_for_Biotechnology_Information" title="National Center for Biotechnology Information">NCBI</a>: <span class="uid"><a rel="nofollow" class="external text" href="https://www.ncbi.nlm.nih.gov/Taxonomy/Browser/wwwtax.cgi?mode=Info&amp;id=3750">3750</a></span></span></li>
+<li><span style="white-space:nowrap;">NZOR: <span class="uid"><a rel="nofollow" class="external text" href="https://www.nzor.org.nz/names/14d024a2-d821-48e3-95d8-f0dd206c70a0">14d024a2-d821-48e3-95d8-f0dd206c70a0</a></span></span></li>
+<li><span style="white-space:nowrap;"><a href="/wiki/Observation.org" title="Observation.org">Observation.org</a>: <span class="uid"><a rel="nofollow" class="external text" href="https://observation.org/species/123770/">123770</a></span></span></li>
+<li><span style="white-space:nowrap;"><a href="/wiki/Open_Tree_of_Life" title="Open Tree of Life">Open Tree of Life</a>: <span class="uid"><a rel="nofollow" class="external text" href="https://tree.opentreeoflife.org/taxonomy/browse?id=3902985">3902985</a></span></span></li>
+<li><span style="white-space:nowrap;"><a href="/wiki/Plants_for_a_Future" title="Plants for a Future">PfaF</a>: <span class="uid"><a rel="nofollow" class="external text" href="https://pfaf.org/user/Plant.aspx?LatinName=Malus+domestica">Malus domestica</a></span></span></li>
+<li><span style="white-space:nowrap;">PFI: <span class="uid"><a rel="nofollow" class="external text" href="http://dryades.units.it/floritaly/index.php?procedure=taxon_page&amp;tipo=all&amp;id=2175">2175</a></span></span></li>
+<li><span style="white-space:nowrap;"><a href="/wiki/The_Plant_List" title="The Plant List">Plant List</a>: <span class="uid"><a rel="nofollow" class="external text" href="http://www.theplantlist.org/tpl1.1/record/rjp-454">rjp-454</a></span></span></li>
+<li><span style="white-space:nowrap;"><a href="/wiki/Plants_of_the_World_Online" title="Plants of the World Online">POWO</a>: <span class="uid"><a rel="nofollow" class="external text" href="https://powo.science.kew.org/taxon/urn%3Alsid%3Aipni.org%3Anames%3A726282-1">urn:lsid:ipni.org:names:726282-1</a></span></span></li>
+<li><span style="white-space:nowrap;"><a href="/wiki/Tropicos" title="Tropicos">Tropicos</a>: <span class="uid"><a rel="nofollow" class="external text" href="http://legacy.tropicos.org/Name/27804420">27804420</a></span></span></li>
+<li><span style="white-space:nowrap;">VASCAN: <span class="uid"><a rel="nofollow" class="external text" href="https://data.canadensys.net/vascan/taxon/20142">20142</a></span></span></li>
+<li><span style="white-space:nowrap;"><a href="/wiki/National_Herbarium_of_Victoria" title="National Herbarium of Victoria">VicFlora</a>: <span class="uid"><a rel="nofollow" class="external text" href="https://vicflora.rbg.vic.gov.au/flora/taxon/e41b929d-b709-4f4c-8dbe-2a9241e2342b">e41b929d-b709-4f4c-8dbe-2a9241e2342b</a></span></span></li>
+<li><span style="white-space:nowrap;"><a href="/wiki/World_Flora_Online" title="World Flora Online">WFO</a>: <span class="uid"><a rel="nofollow" class="external text" href="https://list.worldfloraonline.org/wfo-0001008355">wfo-0001008355</a></span></span></li></ul>
+</div></td></tr><tr><th scope="row" class="navbox-group" style="width:1%;text-align: left;"><i>Malus pumila</i></th><td class="navbox-list-with-group navbox-list navbox-even" style="width:100%;padding:0"><div style="padding:0 0.25em">
+<ul><li><span style="white-space:nowrap;"><a href="/wiki/Wikidata" title="Wikidata">Wikidata</a>: <span class="uid"><span class="external"><a href="https://www.wikidata.org/wiki/Q158657" class="extiw" title="wikidata:Q158657">Q158657</a></span></span></span></li>
+<li><span style="white-space:nowrap;"><a href="/wiki/Wikispecies" title="Wikispecies">Wikispecies</a>: <span class="uid"><span class="external"><a href="https://species.wikimedia.org/wiki/Malus_pumila" class="extiw" title="wikispecies:Malus pumila">Malus pumila</a></span></span></span></li>
+<li><span style="white-space:nowrap;">APA: <span class="uid"><a rel="nofollow" class="external text" href="http://floraofalabama.org/Plant.aspx?id=3159">3159</a></span></span></li>
+<li><span style="white-space:nowrap;">APDB: <span class="uid"><a rel="nofollow" class="external text" href="https://africanplantdatabase.ch/en/nomen/225375">225375</a></span></span></li>
+<li><span style="white-space:nowrap;"><a href="/wiki/Australian_Plant_Name_Index" title="Australian Plant Name Index">APNI</a>: <span class="uid"><a rel="nofollow" class="external text" href="https://id.biodiversity.org.au/name/apni/201024">201024</a></span></span></li>
+<li><span style="white-space:nowrap;">BioLib: <span class="uid"><a rel="nofollow" class="external text" href="https://www.biolib.cz/en/taxon/id214890">214890</a></span></span></li>
+<li><span style="white-space:nowrap;"><a href="/wiki/Barcode_of_Life_Data_System" title="Barcode of Life Data System">BOLD</a>: <span class="uid"><a rel="nofollow" class="external text" href="http://www.boldsystems.org/index.php/TaxBrowser_TaxonPage?taxid=121191">121191</a></span></span></li>
+<li><span style="white-space:nowrap;">Calflora: <span class="uid"><a rel="nofollow" class="external text" href="https://www.calflora.org/cgi-bin/species_query.cgi?where-calrecnum=10099">10099</a></span></span></li>
+<li><span style="white-space:nowrap;"><a href="/wiki/Encyclopedia_of_Life" title="Encyclopedia of Life">EoL</a>: <span class="uid"><a rel="nofollow" class="external text" href="https://eol.org/pages/629943">629943</a></span></span></li>
+<li><span style="white-space:nowrap;"><a href="/wiki/EPPO_Code" title="EPPO Code">EPPO</a>: <span class="uid"><a rel="nofollow" class="external text" href="https://gd.eppo.int/taxon/MABPM">MABPM</a></span></span></li>
+<li><span style="white-space:nowrap;"><a href="/wiki/European_Nature_Information_System" class="mw-redirect" title="European Nature Information System">EUNIS</a>: <span class="uid"><a rel="nofollow" class="external text" href="https://eunis.eea.europa.eu/species/179710">179710</a></span></span></li>
+<li><span style="white-space:nowrap;"><a href="/wiki/Flora_of_North_America" title="Flora of North America">FNA</a>: <span class="uid"><a rel="nofollow" class="external text" href="http://www.efloras.org/florataxon.aspx?flora_id=1&amp;taxon_id=200010913">200010913</a></span></span></li>
+<li><span style="white-space:nowrap;"><a href="/wiki/Flora_of_China_(series)" title="Flora of China (series)">FoC</a>: <span class="uid"><a rel="nofollow" class="external text" href="http://www.efloras.org/florataxon.aspx?flora_id=2&amp;taxon_id=200010913">200010913</a></span></span></li>
+<li><span style="white-space:nowrap;"><a href="/wiki/Global_Biodiversity_Information_Facility" title="Global Biodiversity Information Facility">GBIF</a>: <span class="uid"><a rel="nofollow" class="external text" href="https://www.gbif.org/species/3001093">3001093</a></span></span></li>
+<li><span style="white-space:nowrap;"><a href="/wiki/Germplasm_Resources_Information_Network" title="Germplasm Resources Information Network">GRIN</a>: <span class="uid"><a rel="nofollow" class="external text" href="https://npgsweb.ars-grin.gov/gringlobal/taxonomydetail.aspx?id=23261">23261</a></span></span></li>
+<li><span style="white-space:nowrap;"><a href="/wiki/INaturalist" title="INaturalist">iNaturalist</a>: <span class="uid"><a rel="nofollow" class="external text" href="https://inaturalist.org/taxa/77949">77949</a></span></span></li>
+<li><span style="white-space:nowrap;"><a href="/wiki/International_Plant_Names_Index" title="International Plant Names Index">IPNI</a>: <span class="uid"><a rel="nofollow" class="external text" href="https://www.ipni.org/n/726372-1">726372-1</a></span></span></li>
+<li><span style="white-space:nowrap;"><a href="/wiki/Integrated_Taxonomic_Information_System" title="Integrated Taxonomic Information System">ITIS</a>: <span class="uid"><a rel="nofollow" class="external text" href="https://www.itis.gov/servlet/SingleRpt/SingleRpt?search_topic=TSN&amp;search_value=25262">25262</a></span></span></li>
+<li><span style="white-space:nowrap;">MichiganFlora: <span class="uid"><a rel="nofollow" class="external text" href="https://michiganflora.net/species.aspx?id=2499">2499</a></span></span></li>
+<li><span style="white-space:nowrap;"><a href="/wiki/NatureServe" title="NatureServe">NatureServe</a>: <span class="uid"><a rel="nofollow" class="external text" href="https://explorer.natureserve.org/Taxon/ELEMENT_GLOBAL.2.160610/">2.160610</a></span></span></li>
+<li><span style="white-space:nowrap;"><a href="/wiki/National_Biodiversity_Network" title="National Biodiversity Network">NBN</a>: <span class="uid"><a rel="nofollow" class="external text" href="https://data.nbn.org.uk/Taxa/NHMSYS0000460571">NHMSYS0000460571</a></span></span></li>
+<li><span style="white-space:nowrap;"><a href="/wiki/National_Center_for_Biotechnology_Information" title="National Center for Biotechnology Information">NCBI</a>: <span class="uid"><a rel="nofollow" class="external text" href="https://www.ncbi.nlm.nih.gov/Taxonomy/Browser/wwwtax.cgi?mode=Info&amp;id=283210">283210</a></span></span></li>
+<li><span style="white-space:nowrap;">NZOR: <span class="uid"><a rel="nofollow" class="external text" href="https://www.nzor.org.nz/names/e2b9e72c-b9bc-4ede-91f2-9ddceb5ffea6">e2b9e72c-b9bc-4ede-91f2-9ddceb5ffea6</a></span></span></li>
+<li><span style="white-space:nowrap;"><a href="/wiki/Observation.org" title="Observation.org">Observation.org</a>: <span class="uid"><a rel="nofollow" class="external text" href="https://observation.org/species/140258/">140258</a></span></span></li>
+<li><span style="white-space:nowrap;"><a href="/wiki/Open_Tree_of_Life" title="Open Tree of Life">Open Tree of Life</a>: <span class="uid"><a rel="nofollow" class="external text" href="https://tree.opentreeoflife.org/taxonomy/browse?id=854961">854961</a></span></span></li>
+<li><span style="white-space:nowrap;"><a href="/wiki/Plants_for_a_Future" title="Plants for a Future">PfaF</a>: <span class="uid"><a rel="nofollow" class="external text" href="https://pfaf.org/user/Plant.aspx?LatinName=Malus+pumila">Malus pumila</a></span></span></li>
+<li><span style="white-space:nowrap;"><a href="/wiki/The_Plant_List" title="The Plant List">Plant List</a>: <span class="uid"><a rel="nofollow" class="external text" href="http://www.theplantlist.org/tpl1.1/record/rjp-5777">rjp-5777</a></span></span></li>
+<li><span style="white-space:nowrap;"><a href="/wiki/Natural_Resources_Conservation_Service#Plants" title="Natural Resources Conservation Service">PLANTS</a>: <span class="uid"><a rel="nofollow" class="external text" href="https://plants.sc.egov.usda.gov/plant-profile/MAPU">MAPU</a></span></span></li>
+<li><span style="white-space:nowrap;"><a href="/wiki/Plants_of_the_World_Online" title="Plants of the World Online">POWO</a>: <span class="uid"><a rel="nofollow" class="external text" href="https://powo.science.kew.org/taxon/urn%3Alsid%3Aipni.org%3Anames%3A726372-1">urn:lsid:ipni.org:names:726372-1</a></span></span></li>
+<li><span style="white-space:nowrap;"><a href="/wiki/Tropicos" title="Tropicos">Tropicos</a>: <span class="uid"><a rel="nofollow" class="external text" href="http://legacy.tropicos.org/Name/27800985">27800985</a></span></span></li>
+<li><span style="white-space:nowrap;">VASCAN: <span class="uid"><a rel="nofollow" class="external text" href="https://data.canadensys.net/vascan/taxon/8790">8790</a></span></span></li>
+<li><span style="white-space:nowrap;"><a href="/wiki/National_Herbarium_of_Victoria" title="National Herbarium of Victoria">VicFlora</a>: <span class="uid"><a rel="nofollow" class="external text" href="https://vicflora.rbg.vic.gov.au/flora/taxon/5ba9c4cd-b261-4bf2-871d-d893d1bc15a8">5ba9c4cd-b261-4bf2-871d-d893d1bc15a8</a></span></span></li>
+<li><span style="white-space:nowrap;">WisFlora: <span class="uid"><a rel="nofollow" class="external text" href="https://wisflora.herbarium.wisc.edu/taxa/index.php?taxon=4188">4188</a></span></span></li>
+<li><span style="white-space:nowrap;"><a href="/wiki/World_Flora_Online" title="World Flora Online">WFO</a>: <span class="uid"><a rel="nofollow" class="external text" href="https://list.worldfloraonline.org/wfo-0001013584">wfo-0001013584</a></span></span></li></ul>
+</div></td></tr></tbody></table></div>
+<div class="navbox-styles"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1129693374"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1236075235"><style data-mw-deduplicate="TemplateStyles:r1038841319">.mw-parser-output .tooltip-dotted{border-bottom:1px dotted;cursor:help}</style><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1038841319"></div><div role="navigation" class="navbox authority-control" aria-labelledby="Authority_control_databases_frameless&amp;#124;text-top&amp;#124;10px&amp;#124;alt=Edit_this_at_Wikidata&amp;#124;link=https&amp;#58;//www.wikidata.org/wiki/Q89#identifiers&amp;#124;class=noprint&amp;#124;Edit_this_at_Wikidata" style="padding:3px"><table class="nowraplinks hlist mw-collapsible autocollapse navbox-inner mw-made-collapsible mw-collapsed" style="border-spacing:0;background:transparent;color:inherit"><tbody><tr><th scope="col" class="navbox-title" colspan="2"><button type="button" class="mw-collapsible-toggle mw-collapsible-toggle-default mw-collapsible-toggle-collapsed" aria-expanded="false" tabindex="0"><span class="mw-collapsible-text">show</span></button><div id="Authority_control_databases_frameless&amp;#124;text-top&amp;#124;10px&amp;#124;alt=Edit_this_at_Wikidata&amp;#124;link=https&amp;#58;//www.wikidata.org/wiki/Q89#identifiers&amp;#124;class=noprint&amp;#124;Edit_this_at_Wikidata" style="font-size:114%;margin:0 4em"><a href="/wiki/Help:Authority_control" title="Help:Authority control">Authority control databases</a> <span class="mw-valign-text-top noprint" typeof="mw:File/Frameless"><a href="https://www.wikidata.org/wiki/Q89#identifiers" title="Edit this at Wikidata"><img alt="Edit this at Wikidata" src="//upload.wikimedia.org/wikipedia/en/thumb/8/8a/OOjs_UI_icon_edit-ltr-progressive.svg/10px-OOjs_UI_icon_edit-ltr-progressive.svg.png" decoding="async" width="10" height="10" class="mw-file-element" 
srcset="//upload.wikimedia.org/wikipedia/en/thumb/8/8a/OOjs_UI_icon_edit-ltr-progressive.svg/15px-OOjs_UI_icon_edit-ltr-progressive.svg.png 1.5x, //upload.wikimedia.org/wikipedia/en/thumb/8/8a/OOjs_UI_icon_edit-ltr-progressive.svg/20px-OOjs_UI_icon_edit-ltr-progressive.svg.png 2x" data-file-width="20" data-file-height="20"></a></span></div></th></tr><tr style="display: none;"><th scope="row" class="navbox-group" style="width:1%">National</th><td class="navbox-list-with-group navbox-list navbox-odd" style="width:100%;padding:0"><div style="padding:0 0.25em"><ul><li><span class="uid"><span class="rt-commentedText tooltip tooltip-dotted" title="Apfel"><a rel="nofollow" class="external text" href="https://d-nb.info/gnd/4002405-2">Germany</a></span></span></li><li><span class="uid"><a rel="nofollow" class="external text" href="https://id.loc.gov/authorities/sh85006106">United States</a></span></li><li><span class="uid"><a rel="nofollow" class="external text" href="https://id.ndl.go.jp/auth/ndlna/00569482">Japan</a></span></li><li><span class="uid"><span class="rt-commentedText tooltip tooltip-dotted" title="jablka"><a rel="nofollow" class="external text" href="https://aleph.nkp.cz/F/?func=find-c&amp;local_base=aut&amp;ccl_term=ica=ph121262&amp;CON_LNG=ENG">Czech Republic</a></span></span></li><li><span class="uid"><a rel="nofollow" class="external text" href="https://kopkatalogs.lv/F?func=direct&amp;local_base=lnc10&amp;doc_number=000326810&amp;P_CON_LNG=ENG">Latvia</a></span></li><li><span class="uid"><a rel="nofollow" class="external text" href="http://olduli.nli.org.il/F/?func=find-b&amp;local_base=NLX10&amp;find_code=UID&amp;request=987007294178805171">Israel</a></span></li></ul></div></td></tr><tr style="display: none;"><th scope="row" class="navbox-group" style="width:1%">Other</th><td class="navbox-list-with-group navbox-list navbox-even" style="width:100%;padding:0"><div style="padding:0 0.25em"><ul><li><span class="uid"><a rel="nofollow" class="external text" 
href="https://catalog.archives.gov/id/10647441">NARA</a></span></li></ul></div></td></tr></tbody></table></div>
+
+
+
+<!-- 
+NewPP limit report
+Parsed by mw‐web.codfw.main‐77cffc86c8‐8h9g9
+Cached time: 20241112180350
+Cache expiry: 2592000
+Reduced expiry: false
+Complications: [vary‐revision‐sha1, show‐toc]
+CPU time usage: 2.306 seconds
+Real time usage: 2.864 seconds
+Preprocessor visited node count: 16631/1000000
+Post‐expand include size: 467066/2097152 bytes
+Template argument size: 31637/2097152 bytes
+Highest expansion depth: 20/100
+Expensive parser function count: 80/500
+Unstrip recursion depth: 1/20
+Unstrip post‐expand size: 512506/5000000 bytes
+Lua time usage: 1.533/10.000 seconds
+Lua memory usage: 21410160/52428800 bytes
+Lua Profile:
+    MediaWiki\Extension\Scribunto\Engines\LuaSandbox\LuaSandboxCallback::getEntity      260 ms       16.2%
+    MediaWiki\Extension\Scribunto\Engines\LuaSandbox\LuaSandboxCallback::callParserFunction      220 ms       13.8%
+    dataWrapper <mw.lua:672>                                         220 ms       13.8%
+    ?                                                                200 ms       12.5%
+    MediaWiki\Extension\Scribunto\Engines\LuaSandbox\LuaSandboxCallback::expandTemplate      100 ms        6.2%
+    MediaWiki\Extension\Scribunto\Engines\LuaSandbox\LuaSandboxCallback::getExpandedArgument       80 ms        5.0%
+    <mw.lua:694>                                                      40 ms        2.5%
+    MediaWiki\Extension\Scribunto\Engines\LuaSandbox\LuaSandboxCallback::getEntityStatements       40 ms        2.5%
+    type                                                              40 ms        2.5%
+    MediaWiki\Extension\Scribunto\Engines\LuaSandbox\LuaSandboxCallback::gsub       40 ms        2.5%
+    [others]                                                         360 ms       22.5%
+Number of Wikibase entities loaded: 37/400
+-->
+<!--
+Transclusion expansion time report (%,ms,calls,template)
+100.00% 2484.540      1 -total
+ 31.75%  788.898      1 Template:Reflist
+ 16.19%  402.247      1 Template:Taxonbar
+ 10.00%  248.415      1 Template:Speciesbox
+  9.71%  241.219      1 Template:Taxobox/core
+  9.68%  240.597     45 Template:Cite_book
+  9.15%  227.420     39 Template:Cite_web
+  7.83%  194.645      7 Template:Infobox
+  7.54%  187.436     25 Template:Cite_journal
+  5.30%  131.578      1 Template:Stack
+-->
+
+<!-- Saved in parser cache with key enwiki:pcache:idhash:18978754-0!canonical and timestamp 20241112180350 and revision id 1256174424. Rendering was triggered because: page-view
+ -->
+</div><!--esi <esi:include src="/esitest-fa8a495983347898/content" /> --><noscript><img src="https://login.wikimedia.org/wiki/Special:CentralAutoLogin/start?type=1x1" alt="" width="1" height="1" style="border: none; position: absolute;"></noscript>
+<div class="printfooter" data-nosnippet="">Retrieved from "<a dir="ltr" href="https://en.wikipedia.org/w/index.php?title=Apple&amp;oldid=1256174424">https://en.wikipedia.org/w/index.php?title=Apple&amp;oldid=1256174424</a>"</div></div>
+					<div id="catlinks" class="catlinks" data-mw="interface"><div id="mw-normal-catlinks" class="mw-normal-catlinks"><a href="/wiki/Help:Category" title="Help:Category">Categories</a>: <ul><li><a href="/wiki/Category:Apples" title="Category:Apples">Apples</a></li><li><a href="/wiki/Category:Fruit" title="Category:Fruit">Fruit</a></li><li><a href="/wiki/Category:Fruits_originating_in_Asia" title="Category:Fruits originating in Asia">Fruits originating in Asia</a></li><li><a href="/wiki/Category:Malus" title="Category:Malus">Malus</a></li><li><a href="/wiki/Category:Plants_described_in_1768" title="Category:Plants described in 1768">Plants described in 1768</a></li></ul></div><div id="mw-hidden-catlinks" class="mw-hidden-catlinks mw-hidden-cats-hidden">Hidden categories: <ul><li><a href="/wiki/Category:CS1:_long_volume_value" title="Category:CS1: long volume value">CS1: long volume value</a></li><li><a href="/wiki/Category:CS1_Spanish-language_sources_(es)" title="Category:CS1 Spanish-language sources (es)">CS1 Spanish-language sources (es)</a></li><li><a href="/wiki/Category:CS1_maint:_bot:_original_URL_status_unknown" title="Category:CS1 maint: bot: original URL status unknown">CS1 maint: bot: original URL status unknown</a></li><li><a href="/wiki/Category:CS1_German-language_sources_(de)" title="Category:CS1 German-language sources (de)">CS1 German-language sources (de)</a></li><li><a href="/wiki/Category:Articles_with_short_description" title="Category:Articles with short description">Articles with short description</a></li><li><a href="/wiki/Category:Short_description_is_different_from_Wikidata" title="Category:Short description is different from Wikidata">Short description is different from Wikidata</a></li><li><a href="/wiki/Category:Wikipedia_indefinitely_semi-protected_pages" title="Category:Wikipedia indefinitely semi-protected pages">Wikipedia indefinitely semi-protected pages</a></li><li><a 
href="/wiki/Category:Wikipedia_indefinitely_move-protected_pages" title="Category:Wikipedia indefinitely move-protected pages">Wikipedia indefinitely move-protected pages</a></li><li><a href="/wiki/Category:Use_dmy_dates_from_September_2019" title="Category:Use dmy dates from September 2019">Use dmy dates from September 2019</a></li><li><a href="/wiki/Category:Good_articles" title="Category:Good articles">Good articles</a></li><li><a href="/wiki/Category:Articles_with_%27species%27_microformats" title="Category:Articles with 'species' microformats">Articles with 'species' microformats</a></li><li><a href="/wiki/Category:Articles_containing_Old_English_(ca._450-1100)-language_text" title="Category:Articles containing Old English (ca. 450-1100)-language text">Articles containing Old English (ca. 450-1100)-language text</a></li><li><a href="/wiki/Category:Articles_containing_Proto-Germanic-language_text" title="Category:Articles containing Proto-Germanic-language text">Articles containing Proto-Germanic-language text</a></li><li><a href="/wiki/Category:Articles_containing_Proto-Indo-European-language_text" title="Category:Articles containing Proto-Indo-European-language text">Articles containing Proto-Indo-European-language text</a></li><li><a href="/wiki/Category:Articles_containing_Middle_English_(1100-1500)-language_text" title="Category:Articles containing Middle English (1100-1500)-language text">Articles containing Middle English (1100-1500)-language text</a></li><li><a href="/wiki/Category:Articles_with_hAudio_microformats" title="Category:Articles with hAudio microformats">Articles with hAudio microformats</a></li><li><a href="/wiki/Category:Commons_category_link_is_on_Wikidata" title="Category:Commons category link is on Wikidata">Commons category link is on Wikidata</a></li><li><a href="/wiki/Category:Taxonbars_desynced_from_Wikidata" title="Category:Taxonbars desynced from Wikidata">Taxonbars desynced from Wikidata</a></li><li><a 
href="/wiki/Category:Taxonbars_on_possible_non-taxon_pages" title="Category:Taxonbars on possible non-taxon pages">Taxonbars on possible non-taxon pages</a></li><li><a href="/wiki/Category:Taxonbars_with_multiple_manual_Wikidata_items" title="Category:Taxonbars with multiple manual Wikidata items">Taxonbars with multiple manual Wikidata items</a></li><li><a href="/wiki/Category:Taxonbars_with_25%E2%80%9329_taxon_IDs" title="Category:Taxonbars with 25–29 taxon IDs">Taxonbars with 25–29 taxon IDs</a></li><li><a href="/wiki/Category:Taxonbars_with_30%E2%80%9334_taxon_IDs" title="Category:Taxonbars with 30–34 taxon IDs">Taxonbars with 30–34 taxon IDs</a></li></ul></div></div>
+				</div>
+			</main>
+			
+		</div>
+		<div class="mw-footer-container">
+			
+<footer id="footer" class="mw-footer">
+	<ul id="footer-info">
+	<li id="footer-info-lastmod"> This page was last edited on 8 November 2024, at 16:30<span class="anonymous-show">&nbsp;(UTC)</span>.</li>
+	<li id="footer-info-copyright">Text is available under the <a href="/wiki/Wikipedia:Text_of_the_Creative_Commons_Attribution-ShareAlike_4.0_International_License" title="Wikipedia:Text of the Creative Commons Attribution-ShareAlike 4.0 International License">Creative Commons Attribution-ShareAlike 4.0 License</a>;
+additional terms may apply. By using this site, you agree to the <a href="https://foundation.wikimedia.org/wiki/Special:MyLanguage/Policy:Terms_of_Use" class="extiw" title="foundation:Special:MyLanguage/Policy:Terms of Use">Terms of Use</a> and <a href="https://foundation.wikimedia.org/wiki/Special:MyLanguage/Policy:Privacy_policy" class="extiw" title="foundation:Special:MyLanguage/Policy:Privacy policy">Privacy Policy</a>. Wikipedia® is a registered trademark of the <a rel="nofollow" class="external text" href="https://wikimediafoundation.org/">Wikimedia Foundation, Inc.</a>, a non-profit organization.</li>
+</ul>
+
+	<ul id="footer-places">
+	<li id="footer-places-privacy"><a href="https://foundation.wikimedia.org/wiki/Special:MyLanguage/Policy:Privacy_policy">Privacy policy</a></li>
+	<li id="footer-places-about"><a href="/wiki/Wikipedia:About">About Wikipedia</a></li>
+	<li id="footer-places-disclaimers"><a href="/wiki/Wikipedia:General_disclaimer">Disclaimers</a></li>
+	<li id="footer-places-contact"><a href="//en.wikipedia.org/wiki/Wikipedia:Contact_us">Contact Wikipedia</a></li>
+	<li id="footer-places-wm-codeofconduct"><a href="https://foundation.wikimedia.org/wiki/Special:MyLanguage/Policy:Universal_Code_of_Conduct">Code of Conduct</a></li>
+	<li id="footer-places-developers"><a href="https://developer.wikimedia.org">Developers</a></li>
+	<li id="footer-places-statslink"><a href="https://stats.wikimedia.org/#/en.wikipedia.org">Statistics</a></li>
+	<li id="footer-places-cookiestatement"><a href="https://foundation.wikimedia.org/wiki/Special:MyLanguage/Policy:Cookie_statement">Cookie statement</a></li>
+	<li id="footer-places-mobileview"><a href="//en.m.wikipedia.org/w/index.php?title=Apple&amp;mobileaction=toggle_view_mobile" class="noprint stopMobileRedirectToggle">Mobile view</a></li>
+<li style="display: none;"><a href="#">Edit preview settings</a></li></ul>
+
+	<ul id="footer-icons" class="noprint">
+	<li id="footer-copyrightico"><a href="https://wikimediafoundation.org/" class="cdx-button cdx-button--fake-button cdx-button--size-large cdx-button--fake-button--enabled"><img src="/static/images/footer/wikimedia-button.svg" width="84" height="29" alt="Wikimedia Foundation" loading="lazy"></a></li>
+	<li id="footer-poweredbyico"><a href="https://www.mediawiki.org/" class="cdx-button cdx-button--fake-button cdx-button--size-large cdx-button--fake-button--enabled"><img src="/w/resources/assets/poweredby_mediawiki.svg" alt="Powered by MediaWiki" width="88" height="31" loading="lazy"></a></li>
+</ul>
+
+</footer>
+
+		</div>
+	</div> 
+</div> 
+<div class="vector-settings" id="p-dock-bottom">
+	<ul></ul>
+</div><script>(RLQ=window.RLQ||[]).push(function(){mw.config.set({"wgHostname":"mw-web.codfw.main-5847db6f8b-nhdnp","wgBackendResponseTime":188,"wgPageParseReport":{"limitreport":{"cputime":"2.306","walltime":"2.864","ppvisitednodes":{"value":16631,"limit":1000000},"postexpandincludesize":{"value":467066,"limit":2097152},"templateargumentsize":{"value":31637,"limit":2097152},"expansiondepth":{"value":20,"limit":100},"expensivefunctioncount":{"value":80,"limit":500},"unstrip-depth":{"value":1,"limit":20},"unstrip-size":{"value":512506,"limit":5000000},"entityaccesscount":{"value":37,"limit":400},"timingprofile":["100.00% 2484.540      1 -total"," 31.75%  788.898      1 Template:Reflist"," 16.19%  402.247      1 Template:Taxonbar"," 10.00%  248.415      1 Template:Speciesbox","  9.71%  241.219      1 Template:Taxobox/core","  9.68%  240.597     45 Template:Cite_book","  9.15%  227.420     39 Template:Cite_web","  7.83%  194.645      7 Template:Infobox","  7.54%  187.436     25 Template:Cite_journal","  5.30%  131.578      1 Template:Stack"]},"scribunto":{"limitreport-timeusage":{"value":"1.533","limit":"10.000"},"limitreport-memusage":{"value":21410160,"limit":52428800},"limitreport-profile":[["MediaWiki\\Extension\\Scribunto\\Engines\\LuaSandbox\\LuaSandboxCallback::getEntity","260","16.2"],["MediaWiki\\Extension\\Scribunto\\Engines\\LuaSandbox\\LuaSandboxCallback::callParserFunction","220","13.8"],["dataWrapper 
\u003Cmw.lua:672\u003E","220","13.8"],["?","200","12.5"],["MediaWiki\\Extension\\Scribunto\\Engines\\LuaSandbox\\LuaSandboxCallback::expandTemplate","100","6.2"],["MediaWiki\\Extension\\Scribunto\\Engines\\LuaSandbox\\LuaSandboxCallback::getExpandedArgument","80","5.0"],["\u003Cmw.lua:694\u003E","40","2.5"],["MediaWiki\\Extension\\Scribunto\\Engines\\LuaSandbox\\LuaSandboxCallback::getEntityStatements","40","2.5"],["type","40","2.5"],["MediaWiki\\Extension\\Scribunto\\Engines\\LuaSandbox\\LuaSandboxCallback::gsub","40","2.5"],["[others]","360","22.5"]]},"cachereport":{"origin":"mw-web.codfw.main-77cffc86c8-8h9g9","timestamp":"20241112180350","ttl":2592000,"transientcontent":false}}});});</script>
+<script type="application/ld+json">{"@context":"https:\/\/schema.org","@type":"Article","name":"Apple","url":"https:\/\/en.wikipedia.org\/wiki\/Apple","sameAs":"http:\/\/www.wikidata.org\/entity\/Q89","mainEntity":"http:\/\/www.wikidata.org\/entity\/Q89","author":{"@type":"Organization","name":"Contributors to Wikimedia projects"},"publisher":{"@type":"Organization","name":"Wikimedia Foundation, Inc.","logo":{"@type":"ImageObject","url":"https:\/\/www.wikimedia.org\/static\/images\/wmf-hor-googpub.png"}},"datePublished":"2001-10-24T01:47:59Z","dateModified":"2024-11-08T16:30:32Z","image":"https:\/\/upload.wikimedia.org\/wikipedia\/commons\/a\/a6\/Pink_lady_and_cross_section.jpg","headline":"fruit of the apple tree"}</script>
+
+<div class="rt-overlay"></div><div id="mw-teleport-target" class="vector-body"></div><a accesskey="v" href="https://en.wikipedia.org/wiki/Apple?action=edit" class="oo-ui-element-hidden"></a></body></html>
\ No newline at end of file
diff --git a/tests/async/test_content_scraper_strategy.py b/tests/async/test_content_scraper_strategy.py
new file mode 100644
index 00000000..5dfa6362
--- /dev/null
+++ b/tests/async/test_content_scraper_strategy.py
@@ -0,0 +1,162 @@
+import asyncio
+from bs4 import BeautifulSoup
+from typing import Dict, Any
+import os
+import sys
+import time
+import csv
+from tabulate import tabulate
+from dataclasses import dataclass
+from typing import List, Dict
+
+parent_dir = os.path.dirname(os.path.dirname(os.path.dirname(os.path.abspath(__file__))))  # directory two levels above this file's own directory
+sys.path.append(parent_dir)  # appended before the crawl4ai imports below so they can be looked up from parent_dir
+__location__ = os.path.realpath(os.path.join(os.getcwd(), os.path.dirname(__file__)))  # resolved directory of this file; used to locate the HTML fixture and the CSV output
+
+from crawl4ai.content_scrapping_strategy import WebScrapingStrategy
+from crawl4ai.content_scrapping_strategy import WebScrapingStrategy as WebScrapingStrategyCurrent
+# from crawl4ai.content_scrapping_strategy_current import WebScrapingStrategy as WebScrapingStrategyCurrent
+
+@dataclass
+class TestResult:  # metrics recorded for one scraper on one named test case
+    name: str  # label of the test case
+    success: bool  # the 'success' value of the scraper's result dict
+    images: int  # number of entries in result['media']['images']
+    internal_links: int  # number of entries in result['links']['internal']
+    external_links: int  # number of entries in result['links']['external']
+    markdown_length: int  # len() of result['markdown']
+    execution_time: float  # wall-clock seconds measured with time.time() around the scrape call
+
+class StrategyTester:  # runs identical scrape options through two scraper objects and reports their metrics side by side
+    def __init__(self):  # builds both scrapers and loads the HTML fixture from disk
+        self.new_scraper = WebScrapingStrategy()
+        self.current_scraper = WebScrapingStrategyCurrent()  # NOTE(review): as imported in this file, both names come from the same module, so both scrapers are the same class
+        with open(__location__ + '/sample_wikipedia.html', 'r', encoding='utf-8') as f:
+            self.WIKI_HTML = f.read()  # the same HTML text is fed to every test case
+        self.results = {'new': [], 'current': []}  # not read by any method of this class
+        
+    def run_test(self, name: str, **kwargs) -> tuple[TestResult, TestResult]:  # kwargs are forwarded unchanged to each scraper; returns (new, current)
+        results = []
+        for scraper in [self.new_scraper, self.current_scraper]:  # order matters: index 0 is "new", index 1 is "current"
+            start_time = time.time()
+            result = scraper._get_content_of_website_optimized(
+                url="https://en.wikipedia.org/wiki/Test",
+                html=self.WIKI_HTML,
+                **kwargs
+            )
+            execution_time = time.time() - start_time  # times only the scrape call, not the metric extraction below
+            
+            test_result = TestResult(
+                name=name,
+                success=result['success'],
+                images=len(result['media']['images']),
+                internal_links=len(result['links']['internal']),
+                external_links=len(result['links']['external']),
+                markdown_length=len(result['markdown']),
+                execution_time=execution_time
+            )
+            results.append(test_result)
+        
+        return results[0], results[1]  # new, current
+
+    def run_all_tests(self):  # runs every case below, then writes the CSV and prints the comparison table
+        test_cases = [  # (display name, keyword arguments passed through run_test to the scraper)
+            ("Basic Extraction", {}),
+            ("Exclude Tags", {'excluded_tags': ['table', 'div.infobox', 'div.navbox']}),
+            ("Word Threshold", {'word_count_threshold': 50}),
+            ("CSS Selector", {'css_selector': 'div.mw-parser-output > p'}),
+            ("Link Exclusions", {
+                'exclude_external_links': True,
+                'exclude_social_media_links': True,
+                'exclude_domains': ['facebook.com', 'twitter.com']
+            }),
+            ("Media Handling", {
+                'exclude_external_images': True,
+                'image_description_min_word_threshold': 20
+            }),
+            ("Text Only", {
+                'only_text': True,
+                'remove_forms': True
+            }),
+            ("HTML Cleaning", {
+                'clean_html': True,
+                'keep_data_attributes': True
+            }),
+            ("HTML2Text Options", {
+                'html2text': {
+                    'skip_internal_links': True,
+                    'single_line_break': True,
+                    'mark_code': True,
+                    'preserve_tags': ['pre', 'code']
+                }
+            })
+        ]
+
+        all_results = []  # (name, new_result, current_result) for each case that completed
+        for name, kwargs in test_cases:
+            try:
+                new_result, current_result = self.run_test(name, **kwargs)
+                all_results.append((name, new_result, current_result))
+            except Exception as e:  # a failing case is reported and left out of the results; the remaining cases still run
+                print(f"Error in {name}: {str(e)}")
+                
+        self.save_results_to_csv(all_results)
+        self.print_comparison_table(all_results)
+
+    def save_results_to_csv(self, all_results: List[tuple]):  # writes two rows per test case (New, then Current)
+        csv_file = os.path.join(__location__, 'strategy_comparison_results.csv')  # output lands next to this file
+        with open(csv_file, 'w', newline='') as f:  # 'w' overwrites any earlier results file
+            writer = csv.writer(f)
+            writer.writerow(['Test Name', 'Strategy', 'Success', 'Images', 'Internal Links', 
+                           'External Links', 'Markdown Length', 'Execution Time'])
+            
+            for name, new_result, current_result in all_results:
+                writer.writerow([name, 'New', new_result.success, new_result.images,
+                               new_result.internal_links, new_result.external_links,
+                               new_result.markdown_length, f"{new_result.execution_time:.3f}"])
+                writer.writerow([name, 'Current', current_result.success, current_result.images,
+                               current_result.internal_links, current_result.external_links,
+                               current_result.markdown_length, f"{current_result.execution_time:.3f}"])
+
+    def print_comparison_table(self, all_results: List[tuple]):  # prints a grid table with a New and a Current row per test case
+        table_data = []
+        headers = ['Test Name', 'Strategy', 'Success', 'Images', 'Internal Links', 
+                  'External Links', 'Markdown Length', 'Time (s)']
+
+        for name, new_result, current_result in all_results:
+            # Check for differences (only the four count/length metrics; success and time are not compared)
+            differences = []
+            if new_result.images != current_result.images: differences.append('images')
+            if new_result.internal_links != current_result.internal_links: differences.append('internal_links')
+            if new_result.external_links != current_result.external_links: differences.append('external_links')
+            if new_result.markdown_length != current_result.markdown_length: differences.append('markdown')
+            
+            # Add row for new strategy
+            new_row = [
+                name, 'New', new_result.success, new_result.images,
+                new_result.internal_links, new_result.external_links,
+                new_result.markdown_length, f"{new_result.execution_time:.3f}"
+            ]
+            table_data.append(new_row)
+            
+            # Add row for current strategy (test name left blank because the row above already shows it)
+            current_row = [
+                '', 'Current', current_result.success, current_result.images,
+                current_result.internal_links, current_result.external_links,
+                current_result.markdown_length, f"{current_result.execution_time:.3f}"
+            ]
+            table_data.append(current_row)
+            
+            # Add difference summary if any
+            if differences:
+                table_data.append(['', '⚠️ Differences', ', '.join(differences), '', '', '', '', ''])
+            
+            # Add empty row for better readability
+            table_data.append([''] * len(headers))
+
+        print("\nStrategy Comparison Results:")
+        print(tabulate(table_data, headers=headers, tablefmt='grid'))
+
+if __name__ == "__main__":  # script entry point: nothing below runs on import
+    tester = StrategyTester()  # the constructor reads sample_wikipedia.html from this file's directory
+    tester.run_all_tests()  # writes strategy_comparison_results.csv and prints the comparison table
\ No newline at end of file

From 17913f5acf28cfac775085b74496d1ed5aafcae6 Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Wed, 13 Nov 2024 20:00:29 +0800
Subject: [PATCH 018/115] feat(crawler): support local files and raw HTML input
 in AsyncWebCrawler

---
 crawl4ai/async_webcrawler.py | 49 +++++++++++++++++++++---------------
 1 file changed, 29 insertions(+), 20 deletions(-)

diff --git a/crawl4ai/async_webcrawler.py b/crawl4ai/async_webcrawler.py
index 9d0340dc..8415f9b9 100644
--- a/crawl4ai/async_webcrawler.py
+++ b/crawl4ai/async_webcrawler.py
@@ -104,6 +104,10 @@ class AsyncWebCrawler:
             extracted_content = None
             
             is_web_url = url.startswith(('http://', 'https://'))
+            is_local_file = url.startswith("file://")
+            is_raw_html = url.startswith("raw:")
+            _url = url if not is_raw_html else "Raw HTML"
+            
             if is_web_url and not bypass_cache and not self.always_by_pass_cache:
                 cached = await async_db_manager.aget_cached_url(url)
                         
@@ -131,7 +135,7 @@ class AsyncWebCrawler:
                 t2 = time.time()
                 if verbose:
                     print(
-                        f"[LOG] 🚀 Crawling done for {url}, success: {bool(html)}, time taken: {t2 - t1:.2f} seconds"
+                        f"[LOG] 🚀 Crawling done for {_url}, success: {bool(html)}, time taken: {t2 - t1:.2f} seconds"
                     )
 
             crawl_result = await self.aprocess_html(
@@ -147,6 +151,9 @@ class AsyncWebCrawler:
                 is_cached=bool(cached),
                 async_response=async_response,
                 bypass_cache=bypass_cache,
+                is_web_url = is_web_url,
+                is_local_file = is_local_file,
+                is_raw_html = is_raw_html,
                 **kwargs,
             )
             
@@ -164,8 +171,8 @@ class AsyncWebCrawler:
         except Exception as e:
             if not hasattr(e, "msg"):
                 e.msg = str(e)
-            print(f"[ERROR] 🚫 arun(): Failed to crawl {url}, error: {e.msg}")
-            return CrawlResult(url=url, html="", markdown = f"[ERROR] 🚫 arun(): Failed to crawl {url}, error: {e.msg}", success=False, error_message=e.msg)
+            print(f"[ERROR] 🚫 arun(): Failed to crawl {_url}, error: {e.msg}")
+            return CrawlResult(url=url, html="", markdown = f"[ERROR] 🚫 arun(): Failed to crawl {_url}, error: {e.msg}", success=False, error_message=e.msg)
 
     async def arun_many(
         self,
@@ -233,6 +240,7 @@ class AsyncWebCrawler:
         t = time.time()
         # Extract content from HTML
         try:
+            _url = url if not kwargs.get("is_raw_html", False) else "Raw HTML"
             t1 = time.time()
             scrapping_strategy = WebScrapingStrategy()
             # result = await scrapping_strategy.ascrap(
@@ -249,7 +257,7 @@ class AsyncWebCrawler:
             )
             if verbose:
                 print(
-                    f"[LOG] 🚀 Content extracted for {url}, success: True, time taken: {time.time() - t1:.2f} seconds"
+                    f"[LOG] 🚀 Content extracted for {_url}, success: True, time taken: {time.time() - t1:.2f} seconds"
                 )
 
             if result is None:
@@ -270,7 +278,7 @@ class AsyncWebCrawler:
         if extracted_content is None and extraction_strategy and chunking_strategy:
             if verbose:
                 print(
-                    f"[LOG] 🔥 Extracting semantic blocks for {url}, Strategy: {self.__class__.__name__}"
+                    f"[LOG] 🔥 Extracting semantic blocks for {_url}, Strategy: {self.__class__.__name__}"
                 )
 
             # Check if extraction strategy is type of JsonCssExtractionStrategy
@@ -285,7 +293,7 @@ class AsyncWebCrawler:
 
         if verbose:
             print(
-                f"[LOG] 🚀 Extraction done for {url}, time taken: {time.time() - t:.2f} seconds."
+                f"[LOG] 🚀 Extraction done for {_url}, time taken: {time.time() - t:.2f} seconds."
             )
 
         screenshot = None if not screenshot else screenshot
@@ -296,20 +304,21 @@ class AsyncWebCrawler:
             response_headers = json.dumps(async_response.response_headers, ensure_ascii=False)
 
 
-        if not is_cached or kwargs.get("bypass_cache", False) or self.always_by_pass_cache:
-            await async_db_manager.acache_url(
-                url,
-                html,
-                cleaned_html,
-                markdown,
-                extracted_content,
-                True,
-                json.dumps(media),
-                json.dumps(links),
-                json.dumps(metadata),
-                screenshot=screenshot,
-                response_headers=response_headers,
-            )
+        if not kwargs.get("is_raw_html", False):
+            if not is_cached or kwargs.get("bypass_cache", False) or self.always_by_pass_cache:
+                await async_db_manager.acache_url(
+                    url,
+                    html,
+                    cleaned_html,
+                    markdown,
+                    extracted_content,
+                    True,
+                    json.dumps(media),
+                    json.dumps(links),
+                    json.dumps(metadata),
+                    screenshot=screenshot,
+                    response_headers=response_headers,
+                )
 
         return CrawlResult(
             url=url,

From 3d00fee6c28e16556c7a51035586faad7f5e1639 Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Thu, 14 Nov 2024 22:50:59 +0800
Subject: [PATCH 019/115] - In this commit, the library is updated to process
 file downloads. Users can now specify a download folder and trigger the
 download process via JavaScript or other means, with all files being saved.
 The list of downloaded files will also be added to the crawl result object. -
 Another thing this commit introduces is the concept of the Relevance Content
 Filter. This is an improvement over Fit Markdown. This class of strategies
 aims to extract the main content from a given page - the part that really
 matters and is useful to be processed. One strategy has been created using
 the BM25 algorithm, which finds chunks of text from the web page relevant to
 its title, descriptions, and keywords, or supports a given user query and
 matches them. The result is then returned to the main engine to be converted
 to Markdown. Plans include adding approaches using language models as well. -
 The cache database was updated to hold information about response headers and
 downloaded files.

---
 crawl4ai/async_crawler_strategy.py        |  63 +-
 crawl4ai/async_crawler_strategy_0.3.73.py | 965 ----------------------
 crawl4ai/async_database.py                |  22 +-
 crawl4ai/async_webcrawler.py              |  47 +-
 crawl4ai/content_cleaning_strategy.py     | 198 -----
 crawl4ai/content_filter_strategy.py       | 344 ++++++++
 crawl4ai/content_scrapping_strategy.py    |  14 +-
 crawl4ai/models.py                        |  18 +-
 crawl4ai/utils.py                         |  55 ++
 tests/async/test_async_doanloader.py      | 229 +++++
 10 files changed, 739 insertions(+), 1216 deletions(-)
 delete mode 100644 crawl4ai/async_crawler_strategy_0.3.73.py
 delete mode 100644 crawl4ai/content_cleaning_strategy.py
 create mode 100644 crawl4ai/content_filter_strategy.py
 create mode 100644 tests/async/test_async_doanloader.py

diff --git a/crawl4ai/async_crawler_strategy.py b/crawl4ai/async_crawler_strategy.py
index baa06e47..83933a35 100644
--- a/crawl4ai/async_crawler_strategy.py
+++ b/crawl4ai/async_crawler_strategy.py
@@ -14,6 +14,7 @@ from pydantic import BaseModel
 import hashlib
 import json
 import uuid
+from .models import AsyncCrawlResponse
 
 from playwright_stealth import StealthConfig, stealth_async
 
@@ -148,15 +149,6 @@ class ManagedBrowser:
             except Exception as e:
                 print(f"Error removing temporary directory: {e}")
 
-class AsyncCrawlResponse(BaseModel):
-    html: str
-    response_headers: Dict[str, str]
-    status_code: int
-    screenshot: Optional[str] = None
-    get_delayed_content: Optional[Callable[[Optional[float]], Awaitable[str]]] = None
-
-    class Config:
-        arbitrary_types_allowed = True
 
 class AsyncCrawlerStrategy(ABC):
     @abstractmethod
@@ -215,6 +207,13 @@ class AsyncPlaywrightCrawlerStrategy(AsyncCrawlerStrategy):
             'before_retrieve_html': None
         }
         self.extra_args = kwargs.get("extra_args", [])
+        self.accept_downloads = kwargs.get("accept_downloads", False)
+        self.downloads_path = kwargs.get("downloads_path")
+        self._downloaded_files = []  # Track downloaded files for current crawl
+        if self.accept_downloads and not self.downloads_path:
+            self.downloads_path = os.path.join(os.getcwd(), "downloads")
+            os.makedirs(self.downloads_path, exist_ok=True)        
+        
 
     async def __aenter__(self):
         await self.start()
@@ -250,7 +249,12 @@ class AsyncPlaywrightCrawlerStrategy(AsyncCrawlerStrategy):
                 # Set up the default context
                 if self.default_context:
                     await self.default_context.set_extra_http_headers(self.headers)
-                    
+                    if self.accept_downloads:
+                        await self.default_context.set_default_timeout(60000)
+                        await self.default_context.set_default_navigation_timeout(60000)
+                        self.default_context._impl_obj._options["accept_downloads"] = True
+                        self.default_context._impl_obj._options["downloads_path"] = self.downloads_path
+                        
                     if self.user_agent:
                         await self.default_context.set_extra_http_headers({
                             "User-Agent": self.user_agent
@@ -301,12 +305,14 @@ class AsyncPlaywrightCrawlerStrategy(AsyncCrawlerStrategy):
                         if self.use_persistent_context and self.user_data_dir:
                             self.browser = await self.playwright.chromium.launch_persistent_context(
                                 user_data_dir=self.user_data_dir,
+                                accept_downloads=self.accept_downloads,
+                                downloads_path=self.downloads_path if self.accept_downloads else None,                                
                                 **browser_args
                             )
                             self.default_context = self.browser
                         else:
                             self.browser = await self.playwright.chromium.launch(**browser_args)
-
+                                
                 except Exception as e:
                     # Fallback to chromium if Chrome channel fails
                     if "chrome" in str(e) and browser_args.get("channel") == "chrome":
@@ -565,6 +571,9 @@ class AsyncPlaywrightCrawlerStrategy(AsyncCrawlerStrategy):
         response_headers = {}
         status_code = None
         
+        # Reset downloaded files list for new crawl
+        self._downloaded_files = []
+        
         self._cleanup_expired_sessions()
         session_id = kwargs.get("session_id")
         
@@ -592,10 +601,11 @@ class AsyncPlaywrightCrawlerStrategy(AsyncCrawlerStrategy):
                         # Normal context creation for non-persistent or non-Chrome browsers
                         context = await self.browser.new_context(
                             user_agent=self.user_agent,
-                            viewport={"width": 1920, "height": 1080},
+                            viewport={"width": 1200, "height": 800},
                             proxy={"server": self.proxy} if self.proxy else None,
-                            accept_downloads=True,
-                            java_script_enabled=True
+                            java_script_enabled=True,
+                            accept_downloads=self.accept_downloads,
+                            downloads_path=self.downloads_path if self.accept_downloads else None
                         )
                         await context.add_cookies([{"name": "cookiesEnabled", "value": "true", "url": url}])
                         await context.set_extra_http_headers(self.headers)
@@ -655,6 +665,10 @@ class AsyncPlaywrightCrawlerStrategy(AsyncCrawlerStrategy):
             page.on("pageerror", lambda exc: print(f"Page Error: {exc}"))
         
         try:
+            # Set up download handling if enabled
+            if self.accept_downloads:
+                page.on("download", lambda download: asyncio.create_task(self._handle_download(download)))
+
             if self.verbose:
                 print(f"[LOG] 🕸️ Crawling {url} using AsyncPlaywrightCrawlerStrategy...")
 
@@ -886,7 +900,8 @@ class AsyncPlaywrightCrawlerStrategy(AsyncCrawlerStrategy):
                 response_headers=response_headers, 
                 status_code=status_code,
                 screenshot=screenshot_data,
-                get_delayed_content=get_delayed_content
+                get_delayed_content=get_delayed_content,
+                downloaded_files=self._downloaded_files if self._downloaded_files else None
             )
             return response
         except Error as e:
@@ -896,6 +911,24 @@ class AsyncPlaywrightCrawlerStrategy(AsyncCrawlerStrategy):
         #         await page.close()
         #         await context.close()
 
+    async def _handle_download(self, download):
+        """Handle file downloads."""
+        try:
+            suggested_filename = download.suggested_filename
+            download_path = os.path.join(self.downloads_path, suggested_filename)
+            
+            if self.verbose:
+                print(f"[LOG] 📥 Downloading {suggested_filename} to {download_path}")
+                
+            await download.save_as(download_path)
+            self._downloaded_files.append(download_path)
+            
+            if self.verbose:
+                print(f"[LOG] ✅ Downloaded {suggested_filename} successfully")
+        except Exception as e:
+            if self.verbose:
+                print(f"[ERROR] Failed to handle download: {str(e)}")
+    
     async def crawl_many(self, urls: List[str], **kwargs) -> List[AsyncCrawlResponse]:
         semaphore_count = kwargs.get('semaphore_count', 5)  # Adjust as needed
         semaphore = asyncio.Semaphore(semaphore_count)
diff --git a/crawl4ai/async_crawler_strategy_0.3.73.py b/crawl4ai/async_crawler_strategy_0.3.73.py
deleted file mode 100644
index 54835dad..00000000
--- a/crawl4ai/async_crawler_strategy_0.3.73.py
+++ /dev/null
@@ -1,965 +0,0 @@
-import asyncio
-import base64
-import time
-from abc import ABC, abstractmethod
-from typing import Callable, Dict, Any, List, Optional, Awaitable
-import os, sys, shutil
-import tempfile, subprocess
-from playwright.async_api import async_playwright, Page, Browser, Error
-from io import BytesIO
-from PIL import Image, ImageDraw, ImageFont
-from pathlib import Path
-from playwright.async_api import ProxySettings
-from pydantic import BaseModel
-import hashlib
-import json
-import uuid
-
-from playwright_stealth import StealthConfig, stealth_async
-
-stealth_config = StealthConfig(
-    webdriver=True,
-    chrome_app=True,
-    chrome_csi=True,
-    chrome_load_times=True,
-    chrome_runtime=True,
-    navigator_languages=True,
-    navigator_plugins=True,
-    navigator_permissions=True,
-    webgl_vendor=True,
-    outerdimensions=True,
-    navigator_hardware_concurrency=True,
-    media_codecs=True,
-)
-
-
-class ManagedBrowser:
-    def __init__(self, browser_type: str = "chromium", user_data_dir: Optional[str] = None, headless: bool = False):
-        self.browser_type = browser_type
-        self.user_data_dir = user_data_dir
-        self.headless = headless
-        self.browser_process = None
-        self.temp_dir = None
-        self.debugging_port = 9222
-
-    async def start(self) -> str:
-        """
-        Starts the browser process and returns the CDP endpoint URL.
-        If user_data_dir is not provided, creates a temporary directory.
-        """
-        
-        # Create temp dir if needed
-        if not self.user_data_dir:
-            self.temp_dir = tempfile.mkdtemp(prefix="browser-profile-")
-            self.user_data_dir = self.temp_dir
-
-        # Get browser path and args based on OS and browser type
-        browser_path = self._get_browser_path()
-        args = self._get_browser_args()
-
-        # Start browser process
-        try:
-            self.browser_process = subprocess.Popen(
-                args,
-                stdout=subprocess.PIPE,
-                stderr=subprocess.PIPE
-            )
-            await asyncio.sleep(2)  # Give browser time to start
-            return f"http://localhost:{self.debugging_port}"
-        except Exception as e:
-            await self.cleanup()
-            raise Exception(f"Failed to start browser: {e}")
-
-    def _get_browser_path(self) -> str:
-        """Returns the browser executable path based on OS and browser type"""
-        if sys.platform == "darwin":  # macOS
-            paths = {
-                "chromium": "/Applications/Google Chrome.app/Contents/MacOS/Google Chrome",
-                "firefox": "/Applications/Firefox.app/Contents/MacOS/firefox",
-                "webkit": "/Applications/Safari.app/Contents/MacOS/Safari"
-            }
-        elif sys.platform == "win32":  # Windows
-            paths = {
-                "chromium": "C:\\Program Files\\Google\\Chrome\\Application\\chrome.exe",
-                "firefox": "C:\\Program Files\\Mozilla Firefox\\firefox.exe",
-                "webkit": None  # WebKit not supported on Windows
-            }
-        else:  # Linux
-            paths = {
-                "chromium": "google-chrome",
-                "firefox": "firefox",
-                "webkit": None  # WebKit not supported on Linux
-            }
-        
-        return paths.get(self.browser_type)
-
-    def _get_browser_args(self) -> List[str]:
-        """Returns browser-specific command line arguments"""
-        base_args = [self._get_browser_path()]
-        
-        if self.browser_type == "chromium":
-            args = [
-                f"--remote-debugging-port={self.debugging_port}",
-                f"--user-data-dir={self.user_data_dir}",
-            ]
-            if self.headless:
-                args.append("--headless=new")
-        elif self.browser_type == "firefox":
-            args = [
-                "--remote-debugging-port", str(self.debugging_port),
-                "--profile", self.user_data_dir,
-            ]
-            if self.headless:
-                args.append("--headless")
-        else:
-            raise NotImplementedError(f"Browser type {self.browser_type} not supported")
-            
-        return base_args + args
-
-    async def cleanup(self):
-        """Cleanup browser process and temporary directory"""
-        if self.browser_process:
-            try:
-                self.browser_process.terminate()
-                await asyncio.sleep(1)
-                if self.browser_process.poll() is None:
-                    self.browser_process.kill()
-            except Exception as e:
-                print(f"Error terminating browser: {e}")
-
-        if self.temp_dir and os.path.exists(self.temp_dir):
-            try:
-                shutil.rmtree(self.temp_dir)
-            except Exception as e:
-                print(f"Error removing temporary directory: {e}")
-
-class AsyncCrawlResponse(BaseModel):
-    html: str
-    response_headers: Dict[str, str]
-    status_code: int
-    screenshot: Optional[str] = None
-    get_delayed_content: Optional[Callable[[Optional[float]], Awaitable[str]]] = None
-
-    class Config:
-        arbitrary_types_allowed = True
-
-class AsyncCrawlerStrategy(ABC):
-    @abstractmethod
-    async def crawl(self, url: str, **kwargs) -> AsyncCrawlResponse:
-        pass
-    
-    @abstractmethod
-    async def crawl_many(self, urls: List[str], **kwargs) -> List[AsyncCrawlResponse]:
-        pass
-    
-    @abstractmethod
-    async def take_screenshot(self, **kwargs) -> str:
-        pass
-    
-    @abstractmethod
-    def update_user_agent(self, user_agent: str):
-        pass
-    
-    @abstractmethod
-    def set_hook(self, hook_type: str, hook: Callable):
-        pass
-
-class AsyncPlaywrightCrawlerStrategy(AsyncCrawlerStrategy):
-    def __init__(self, use_cached_html=False, js_code=None, **kwargs):
-        self.use_cached_html = use_cached_html
-        self.user_agent = kwargs.get(
-            "user_agent",
-            "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 "
-            "(KHTML, like Gecko) Chrome/91.0.4472.124 Safari/537.36"
-        )
-        self.proxy = kwargs.get("proxy")
-        self.proxy_config = kwargs.get("proxy_config")
-        self.headless = kwargs.get("headless", True)
-        self.browser_type = kwargs.get("browser_type", "chromium")
-        self.headers = kwargs.get("headers", {})
-        self.sessions = {}
-        self.session_ttl = 1800 
-        self.js_code = js_code
-        self.verbose = kwargs.get("verbose", False)
-        self.playwright = None
-        self.browser = None
-        self.sleep_on_close = kwargs.get("sleep_on_close", False)
-        self.use_managed_browser = kwargs.get("use_managed_browser", False)
-        self.user_data_dir = kwargs.get("user_data_dir", None)
-        self.use_persistent_context = kwargs.get("use_persistent_context", False)
-        self.chrome_channel = kwargs.get("chrome_channel", "chrome")
-        self.managed_browser = None
-        self.default_context = None
-        self.hooks = {
-            'on_browser_created': None,
-            'on_user_agent_updated': None,
-            'on_execution_started': None,
-            'before_goto': None,
-            'after_goto': None,
-            'before_return_html': None,
-            'before_retrieve_html': None
-        }
-        self.extra_args = kwargs.get("extra_args", [])
-
-    async def __aenter__(self):
-        await self.start()
-        return self
-
-    async def __aexit__(self, exc_type, exc_val, exc_tb):
-        await self.close()
-
-    async def start(self):
-        if self.playwright is None:
-            self.playwright = await async_playwright().start()
-        if self.browser is None:
-            if self.use_managed_browser:
-                # Use managed browser approach
-                self.managed_browser = ManagedBrowser(
-                    browser_type=self.browser_type,
-                    user_data_dir=self.user_data_dir,
-                    headless=self.headless
-                )
-                cdp_url = await self.managed_browser.start()
-                self.browser = await self.playwright.chromium.connect_over_cdp(cdp_url)
-                
-                # Get the default context that maintains the user profile
-                contexts = self.browser.contexts
-                if contexts:
-                    self.default_context = contexts[0]
-                else:
-                    # If no default context exists, create one
-                    self.default_context = await self.browser.new_context(
-                        viewport={"width": 1920, "height": 1080}
-                    )
-                
-                # Set up the default context
-                if self.default_context:
-                    await self.default_context.set_extra_http_headers(self.headers)
-                    
-                    if self.user_agent:
-                        await self.default_context.set_extra_http_headers({
-                            "User-Agent": self.user_agent
-                        })
-            else:
-                browser_args = {
-                    "headless": self.headless,
-                    "args": [
-                        "--disable-gpu",
-                        "--no-sandbox",
-                        "--disable-dev-shm-usage",
-                        "--disable-blink-features=AutomationControlled",
-                        "--disable-infobars",
-                        "--window-position=0,0",
-                        "--ignore-certificate-errors",
-                        "--ignore-certificate-errors-spki-list",
-                        # "--disable-http2",
-                        # "--headless=new",  # Use the new headless mode
-                    ]
-                }
-                
-                # Add extra args if provided
-                if self.extra_args:
-                    browser_args["args"].extend(self.extra_args)
-                
-                # Add proxy settings if a proxy is specified
-                if self.proxy:
-                    proxy_settings = ProxySettings(server=self.proxy)
-                    browser_args["proxy"] = proxy_settings
-                elif self.proxy_config:
-                    proxy_settings = ProxySettings(server=self.proxy_config.get("server"), username=self.proxy_config.get("username"), password=self.proxy_config.get("password"))
-                    browser_args["proxy"] = proxy_settings
-                    
-                # Select the appropriate browser based on the browser_type
-                if self.browser_type == "firefox":
-                    self.browser = await self.playwright.firefox.launch(**browser_args)
-                elif self.browser_type == "webkit":
-                    self.browser = await self.playwright.webkit.launch(**browser_args)
-                else:
-                    self.browser = await self.playwright.chromium.launch(**browser_args)
-                    
-                # Update the headless configuration
-                if self.headless:
-                    # Use the new headless mode explicitly
-                    browser_args["args"].append("--headless=new")
-
-            await self.execute_hook('on_browser_created', self.browser)
-
-    async def close(self):
-        if self.sleep_on_close:
-            await asyncio.sleep(0.5)
-            
-        # Close all active sessions
-        session_ids = list(self.sessions.keys())
-        for session_id in session_ids:
-            await self.kill_session(session_id)
-            
-        if self.browser:
-            await self.browser.close()
-            self.browser = None
-            
-        if self.managed_browser:
-            await self.managed_browser.cleanup()
-            self.managed_browser = None
-            
-        if self.playwright:
-            await self.playwright.stop()
-            self.playwright = None
-
-    def __del__(self):
-        if self.browser or self.playwright:
-            asyncio.get_event_loop().run_until_complete(self.close())
-
-    def set_hook(self, hook_type: str, hook: Callable):
-        if hook_type in self.hooks:
-            self.hooks[hook_type] = hook
-        else:
-            raise ValueError(f"Invalid hook type: {hook_type}")
-
-    async def execute_hook(self, hook_type: str, *args):
-        hook = self.hooks.get(hook_type)
-        if hook:
-            if asyncio.iscoroutinefunction(hook):
-                return await hook(*args)
-            else:
-                return hook(*args)
-        return args[0] if args else None
-
-    def update_user_agent(self, user_agent: str):
-        self.user_agent = user_agent
-
-    def set_custom_headers(self, headers: Dict[str, str]):
-        self.headers = headers
-
-    async def kill_session(self, session_id: str):
-        if session_id in self.sessions:
-            context, page, _ = self.sessions[session_id]
-            await page.close()
-            if not self.use_managed_browser:
-                await context.close()
-            del self.sessions[session_id]
-
-    def _cleanup_expired_sessions(self):
-        current_time = time.time()
-        expired_sessions = [
-            sid for sid, (_, _, last_used) in self.sessions.items() 
-            if current_time - last_used > self.session_ttl
-        ]
-        for sid in expired_sessions:
-            asyncio.create_task(self.kill_session(sid))
-            
-    async def smart_wait(self, page: Page, wait_for: str, timeout: float = 30000):
-        wait_for = wait_for.strip()
-        
-        if wait_for.startswith('js:'):
-            # Explicitly specified JavaScript
-            js_code = wait_for[3:].strip()
-            return await self.csp_compliant_wait(page, js_code, timeout)
-        elif wait_for.startswith('css:'):
-            # Explicitly specified CSS selector
-            css_selector = wait_for[4:].strip()
-            try:
-                await page.wait_for_selector(css_selector, timeout=timeout)
-            except Error as e:
-                if 'Timeout' in str(e):
-                    raise TimeoutError(f"Timeout after {timeout}ms waiting for selector '{css_selector}'")
-                else:
-                    raise ValueError(f"Invalid CSS selector: '{css_selector}'")
-        else:
-            # Auto-detect based on content
-            if wait_for.startswith('()') or wait_for.startswith('function'):
-                # It's likely a JavaScript function
-                return await self.csp_compliant_wait(page, wait_for, timeout)
-            else:
-                # Assume it's a CSS selector first
-                try:
-                    await page.wait_for_selector(wait_for, timeout=timeout)
-                except Error as e:
-                    if 'Timeout' in str(e):
-                        raise TimeoutError(f"Timeout after {timeout}ms waiting for selector '{wait_for}'")
-                    else:
-                        # If it's not a timeout error, it might be an invalid selector
-                        # Let's try to evaluate it as a JavaScript function as a fallback
-                        try:
-                            return await self.csp_compliant_wait(page, f"() => {{{wait_for}}}", timeout)
-                        except Error:
-                            raise ValueError(f"Invalid wait_for parameter: '{wait_for}'. "
-                                             "It should be either a valid CSS selector, a JavaScript function, "
-                                             "or explicitly prefixed with 'js:' or 'css:'.")
-    
-    async def csp_compliant_wait(self, page: Page, user_wait_function: str, timeout: float = 30000):
-        wrapper_js = f"""
-        async () => {{
-            const userFunction = {user_wait_function};
-            const startTime = Date.now();
-            while (true) {{
-                if (await userFunction()) {{
-                    return true;
-                }}
-                if (Date.now() - startTime > {timeout}) {{
-                    throw new Error('Timeout waiting for condition');
-                }}
-                await new Promise(resolve => setTimeout(resolve, 100));
-            }}
-        }}
-        """
-        
-        try:
-            await page.evaluate(wrapper_js)
-        except TimeoutError:
-            raise TimeoutError(f"Timeout after {timeout}ms waiting for condition")
-        except Exception as e:
-            raise RuntimeError(f"Error in wait condition: {str(e)}")
-
-    async def process_iframes(self, page):
-        # Find all iframes
-        iframes = await page.query_selector_all('iframe')
-        
-        for i, iframe in enumerate(iframes):
-            try:
-                # Add a unique identifier to the iframe
-                await iframe.evaluate(f'(element) => element.id = "iframe-{i}"')
-                
-                # Get the frame associated with this iframe
-                frame = await iframe.content_frame()
-                
-                if frame:
-                    # Wait for the frame to load
-                    await frame.wait_for_load_state('load', timeout=30000)  # 30 seconds timeout
-                    
-                    # Extract the content of the iframe's body
-                    iframe_content = await frame.evaluate('() => document.body.innerHTML')
-                    
-                    # Generate a unique class name for this iframe
-                    class_name = f'extracted-iframe-content-{i}'
-                    
-                    # Replace the iframe with a div containing the extracted content
-                    _iframe = iframe_content.replace('`', '\\`')
-                    await page.evaluate(f"""
-                        () => {{
-                            const iframe = document.getElementById('iframe-{i}');
-                            const div = document.createElement('div');
-                            div.innerHTML = `{_iframe}`;
-                            div.className = '{class_name}';
-                            iframe.replaceWith(div);
-                        }}
-                    """)
-                else:
-                    print(f"Warning: Could not access content frame for iframe {i}")
-            except Exception as e:
-                print(f"Error processing iframe {i}: {str(e)}")
-
-        # Return the page object
-        return page  
-    
-    async def crawl(self, url: str, **kwargs) -> AsyncCrawlResponse:
-        response_headers = {}
-        status_code = None
-        
-        self._cleanup_expired_sessions()
-        session_id = kwargs.get("session_id")
-        
-        # Handle page creation differently for managed browser
-        if self.use_managed_browser:
-            if session_id:
-                # Reuse existing session if available
-                context, page, _ = self.sessions.get(session_id, (None, None, None))
-                if not page:
-                    # Create new page in default context if session doesn't exist
-                    page = await self.default_context.new_page()
-                    self.sessions[session_id] = (self.default_context, page, time.time())
-            else:
-                # Create new page in default context for non-session requests
-                page = await self.default_context.new_page()
-        else:
-            if session_id:
-                context, page, _ = self.sessions.get(session_id, (None, None, None))
-                if not context:
-                    context = await self.browser.new_context(
-                        user_agent=self.user_agent,
-                        viewport={"width": 1920, "height": 1080},
-                        proxy={"server": self.proxy} if self.proxy else None,
-                        accept_downloads=True,
-                        java_script_enabled=True
-                    )
-                    await context.add_cookies([{"name": "cookiesEnabled", "value": "true", "url": url}])
-                    await context.set_extra_http_headers(self.headers)
-                    page = await context.new_page()
-                    self.sessions[session_id] = (context, page, time.time())
-            else:
-                context = await self.browser.new_context(
-                    user_agent=self.user_agent,
-                    viewport={"width": 1920, "height": 1080},
-                    proxy={"server": self.proxy} if self.proxy else None
-                )
-                await context.set_extra_http_headers(self.headers)
-                
-                if kwargs.get("override_navigator", False) or kwargs.get("simulate_user", False) or kwargs.get("magic", False):
-                    # Inject scripts to override navigator properties
-                    await context.add_init_script("""
-                        // Pass the Permissions Test.
-                        const originalQuery = window.navigator.permissions.query;
-                        window.navigator.permissions.query = (parameters) => (
-                            parameters.name === 'notifications' ?
-                                Promise.resolve({ state: Notification.permission }) :
-                                originalQuery(parameters)
-                        );
-                        Object.defineProperty(navigator, 'webdriver', {
-                            get: () => undefined
-                        });
-                        window.navigator.chrome = {
-                            runtime: {},
-                            // Add other properties if necessary
-                        };
-                        Object.defineProperty(navigator, 'plugins', {
-                            get: () => [1, 2, 3, 4, 5],
-                        });
-                        Object.defineProperty(navigator, 'languages', {
-                            get: () => ['en-US', 'en'],
-                        });
-                        Object.defineProperty(document, 'hidden', {
-                            get: () => false
-                        });
-                        Object.defineProperty(document, 'visibilityState', {
-                            get: () => 'visible'
-                        });
-                    """)
-                
-                page = await context.new_page()
-                if kwargs.get("magic", False):
-                    await stealth_async(page, stealth_config)
-
-        # Add console message and error logging
-        if kwargs.get("log_console", False):
-            page.on("console", lambda msg: print(f"Console: {msg.text}"))
-            page.on("pageerror", lambda exc: print(f"Page Error: {exc}"))
-        
-        try:
-            if self.verbose:
-                print(f"[LOG] 🕸️ Crawling {url} using AsyncPlaywrightCrawlerStrategy...")
-
-            if self.use_cached_html:
-                cache_file_path = os.path.join(
-                    Path.home(), ".crawl4ai", "cache", hashlib.md5(url.encode()).hexdigest()
-                )
-                if os.path.exists(cache_file_path):
-                    html = ""
-                    with open(cache_file_path, "r") as f:
-                        html = f.read()
-                    # retrieve response headers and status code from cache
-                    with open(cache_file_path + ".meta", "r") as f:
-                        meta = json.load(f)
-                        response_headers = meta.get("response_headers", {})
-                        status_code = meta.get("status_code")
-                    response = AsyncCrawlResponse(
-                        html=html, response_headers=response_headers, status_code=status_code
-                    )
-                    return response
-
-            if not kwargs.get("js_only", False):
-                await self.execute_hook('before_goto', page)
-                
-                # response = await page.goto(
-                #     url, wait_until="domcontentloaded", timeout=kwargs.get("page_timeout", 60000)
-                # )
-                
-                # Add retry logic for HTTP2 errors
-                max_retries = kwargs.get("max_retries", 3)
-                current_try = 0
-                
-                while current_try < max_retries:
-                    try:
-                        response = await page.goto(
-                            url,
-                            # wait_until=kwargs.get("wait_until", ["domcontentloaded", "networkidle"]),
-                            wait_until=kwargs.get("wait_until", "networkidle"),
-                            timeout=kwargs.get("page_timeout", 60000)
-                        )
-                        break
-                    except Exception as e:
-                        current_try += 1
-                        if "ERR_HTTP2_PROTOCOL_ERROR" in str(e):
-                            if current_try < max_retries:
-                                # Add exponential backoff
-                                await asyncio.sleep(2 ** current_try)
-                                # Try with different protocol
-                                if 'args' not in kwargs:
-                                    kwargs['args'] = []
-                                kwargs['args'].extend(['--disable-http2'])
-                                continue
-                        if current_try == max_retries:
-                            raise
-                
-                # response = await page.goto("about:blank")
-                # await page.evaluate(f"window.location.href = '{url}'")
-                
-                await self.execute_hook('after_goto', page)
-                
-                # Get status code and headers
-                status_code = response.status
-                response_headers = response.headers
-            else:
-                status_code = 200
-                response_headers = {}
-
-            # Replace the current wait_for_selector line with this more robust check:
-            try:
-                # First wait for body to exist, regardless of visibility
-                await page.wait_for_selector('body', state='attached', timeout=30000)
-                
-                # Then wait for it to become visible by checking CSS
-                await page.wait_for_function("""
-                    () => {
-                        const body = document.body;
-                        const style = window.getComputedStyle(body);
-                        return style.display !== 'none' && 
-                            style.visibility !== 'hidden' && 
-                            style.opacity !== '0';
-                    }
-                """, timeout=30000)
-                
-            except Error as e:
-                # If waiting fails, let's try to diagnose the issue
-                visibility_info = await page.evaluate("""
-                    () => {
-                        const body = document.body;
-                        const style = window.getComputedStyle(body);
-                        return {
-                            display: style.display,
-                            visibility: style.visibility,
-                            opacity: style.opacity,
-                            hasContent: body.innerHTML.length,
-                            classList: Array.from(body.classList)
-                        }
-                    }
-                """)
-                
-                if self.verbose:
-                    print(f"Body visibility debug info: {visibility_info}")
-                
-                # Even if body is hidden, we might still want to proceed
-                if kwargs.get('ignore_body_visibility', True):
-                    if self.verbose:
-                        print("Proceeding despite hidden body...")
-                    pass
-                else:
-                    raise Error(f"Body element is hidden: {visibility_info}")
-            
-            await page.evaluate("window.scrollTo(0, document.body.scrollHeight)")
-
-            js_code = kwargs.get("js_code", kwargs.get("js", self.js_code))
-            if js_code:
-                if isinstance(js_code, str):
-                    await page.evaluate(js_code)
-                elif isinstance(js_code, list):
-                    for js in js_code:
-                        await page.evaluate(js)
-                
-                await page.wait_for_load_state('networkidle')
-                # Check for on execution event
-                await self.execute_hook('on_execution_started', page)
-                
-            if kwargs.get("simulate_user", False) or kwargs.get("magic", False):
-                # Simulate user interactions
-                await page.mouse.move(100, 100)
-                await page.mouse.down()
-                await page.mouse.up()
-                await page.keyboard.press('ArrowDown')
-
-            # Handle the wait_for parameter
-            wait_for = kwargs.get("wait_for")
-            if wait_for:
-                try:
-                    await self.smart_wait(page, wait_for, timeout=kwargs.get("page_timeout", 60000))
-                except Exception as e:
-                    raise RuntimeError(f"Wait condition failed: {str(e)}")
-
-            # Update image dimensions
-            update_image_dimensions_js = """
-            () => {
-                return new Promise((resolve) => {
-                    const filterImage = (img) => {
-                        // Filter out images that are too small
-                        if (img.width < 100 && img.height < 100) return false;
-                        
-                        // Filter out images that are not visible
-                        const rect = img.getBoundingClientRect();
-                        if (rect.width === 0 || rect.height === 0) return false;
-                        
-                        // Filter out images with certain class names (e.g., icons, thumbnails)
-                        if (img.classList.contains('icon') || img.classList.contains('thumbnail')) return false;
-                        
-                        // Filter out images with certain patterns in their src (e.g., placeholder images)
-                        if (img.src.includes('placeholder') || img.src.includes('icon')) return false;
-                        
-                        return true;
-                    };
-
-                    const images = Array.from(document.querySelectorAll('img')).filter(filterImage);
-                    let imagesLeft = images.length;
-                    
-                    if (imagesLeft === 0) {
-                        resolve();
-                        return;
-                    }
-
-                    const checkImage = (img) => {
-                        if (img.complete && img.naturalWidth !== 0) {
-                            img.setAttribute('width', img.naturalWidth);
-                            img.setAttribute('height', img.naturalHeight);
-                            imagesLeft--;
-                            if (imagesLeft === 0) resolve();
-                        }
-                    };
-
-                    images.forEach(img => {
-                        checkImage(img);
-                        if (!img.complete) {
-                            img.onload = () => {
-                                checkImage(img);
-                            };
-                            img.onerror = () => {
-                                imagesLeft--;
-                                if (imagesLeft === 0) resolve();
-                            };
-                        }
-                    });
-
-                    // Fallback timeout of 5 seconds
-                    // setTimeout(() => resolve(), 5000);
-                    resolve();
-                });
-            }
-            """
-            await page.evaluate(update_image_dimensions_js)
-
-            # Wait a bit for any onload events to complete
-            await page.wait_for_timeout(100)
-
-            # Process iframes
-            if kwargs.get("process_iframes", False):
-                page = await self.process_iframes(page)
-            
-            await self.execute_hook('before_retrieve_html', page)
-            # Check if delay_before_return_html is set then wait for that time
-            delay_before_return_html = kwargs.get("delay_before_return_html")
-            if delay_before_return_html:
-                await asyncio.sleep(delay_before_return_html)
-                
-            # Check for remove_overlay_elements parameter
-            if kwargs.get("remove_overlay_elements", False):
-                await self.remove_overlay_elements(page)
-            
-            html = await page.content()
-            await self.execute_hook('before_return_html', page, html)
-            
-            # Check if kwargs has screenshot=True then take screenshot
-            screenshot_data = None
-            if kwargs.get("screenshot"):
-                # Check we have screenshot_wait_for parameter, if we have simply wait for that time
-                screenshot_wait_for = kwargs.get("screenshot_wait_for")
-                if screenshot_wait_for:
-                    await asyncio.sleep(screenshot_wait_for)
-                screenshot_data = await self.take_screenshot(page)          
-
-            if self.verbose:
-                print(f"[LOG] ✅ Crawled {url} successfully!")
-
-            if self.use_cached_html:
-                cache_file_path = os.path.join(
-                    Path.home(), ".crawl4ai", "cache", hashlib.md5(url.encode()).hexdigest()
-                )
-                with open(cache_file_path, "w", encoding="utf-8") as f:
-                    f.write(html)
-                # store response headers and status code in cache
-                with open(cache_file_path + ".meta", "w", encoding="utf-8") as f:
-                    json.dump({
-                        "response_headers": response_headers,
-                        "status_code": status_code
-                    }, f)
-
-            async def get_delayed_content(delay: float = 5.0) -> str:
-                if self.verbose:
-                    print(f"[LOG] Waiting for {delay} seconds before retrieving content for {url}")
-                await asyncio.sleep(delay)
-                return await page.content()
-                
-            response = AsyncCrawlResponse(
-                html=html, 
-                response_headers=response_headers, 
-                status_code=status_code,
-                screenshot=screenshot_data,
-                get_delayed_content=get_delayed_content
-            )
-            return response
-        except Error as e:
-            raise Error(f"[ERROR] 🚫 crawl(): Failed to crawl {url}: {str(e)}")
-        # finally:
-        #     if not session_id:
-        #         await page.close()
-        #         await context.close()
-
-    async def crawl_many(self, urls: List[str], **kwargs) -> List[AsyncCrawlResponse]:
-        semaphore_count = kwargs.get('semaphore_count', 5)  # Adjust as needed
-        semaphore = asyncio.Semaphore(semaphore_count)
-
-        async def crawl_with_semaphore(url):
-            async with semaphore:
-                return await self.crawl(url, **kwargs)
-
-        tasks = [crawl_with_semaphore(url) for url in urls]
-        results = await asyncio.gather(*tasks, return_exceptions=True)
-        return [result if not isinstance(result, Exception) else str(result) for result in results]
-
-    async def remove_overlay_elements(self, page: Page) -> None:
-        """
-        Removes popup overlays, modals, cookie notices, and other intrusive elements from the page.
-        
-        Args:
-            page (Page): The Playwright page instance
-        """
-        remove_overlays_js = """
-        async () => {
-            // Function to check if element is visible
-            const isVisible = (elem) => {
-                const style = window.getComputedStyle(elem);
-                return style.display !== 'none' && 
-                       style.visibility !== 'hidden' && 
-                       style.opacity !== '0';
-            };
-
-            // Common selectors for popups and overlays
-            const commonSelectors = [
-                // Close buttons first
-                'button[class*="close" i]', 'button[class*="dismiss" i]', 
-                'button[aria-label*="close" i]', 'button[title*="close" i]',
-                'a[class*="close" i]', 'span[class*="close" i]',
-                
-                // Cookie notices
-                '[class*="cookie-banner" i]', '[id*="cookie-banner" i]',
-                '[class*="cookie-consent" i]', '[id*="cookie-consent" i]',
-                
-                // Newsletter/subscription dialogs
-                '[class*="newsletter" i]', '[class*="subscribe" i]',
-                
-                // Generic popups/modals
-                '[class*="popup" i]', '[class*="modal" i]', 
-                '[class*="overlay" i]', '[class*="dialog" i]',
-                '[role="dialog"]', '[role="alertdialog"]'
-            ];
-
-            // Try to click close buttons first
-            for (const selector of commonSelectors.slice(0, 6)) {
-                const closeButtons = document.querySelectorAll(selector);
-                for (const button of closeButtons) {
-                    if (isVisible(button)) {
-                        try {
-                            button.click();
-                            await new Promise(resolve => setTimeout(resolve, 100));
-                        } catch (e) {
-                            console.log('Error clicking button:', e);
-                        }
-                    }
-                }
-            }
-
-            // Remove remaining overlay elements
-            const removeOverlays = () => {
-                // Find elements with high z-index
-                const allElements = document.querySelectorAll('*');
-                for (const elem of allElements) {
-                    const style = window.getComputedStyle(elem);
-                    const zIndex = parseInt(style.zIndex);
-                    const position = style.position;
-                    
-                    if (
-                        isVisible(elem) && 
-                        (zIndex > 999 || position === 'fixed' || position === 'absolute') &&
-                        (
-                            elem.offsetWidth > window.innerWidth * 0.5 ||
-                            elem.offsetHeight > window.innerHeight * 0.5 ||
-                            style.backgroundColor.includes('rgba') ||
-                            parseFloat(style.opacity) < 1
-                        )
-                    ) {
-                        elem.remove();
-                    }
-                }
-
-                // Remove elements matching common selectors
-                for (const selector of commonSelectors) {
-                    const elements = document.querySelectorAll(selector);
-                    elements.forEach(elem => {
-                        if (isVisible(elem)) {
-                            elem.remove();
-                        }
-                    });
-                }
-            };
-
-            // Remove overlay elements
-            removeOverlays();
-
-            // Remove any fixed/sticky position elements at the top/bottom
-            const removeFixedElements = () => {
-                const elements = document.querySelectorAll('*');
-                elements.forEach(elem => {
-                    const style = window.getComputedStyle(elem);
-                    if (
-                        (style.position === 'fixed' || style.position === 'sticky') &&
-                        isVisible(elem)
-                    ) {
-                        elem.remove();
-                    }
-                });
-            };
-
-            removeFixedElements();
-            
-            // Remove empty block elements as: div, p, span, etc.
-            const removeEmptyBlockElements = () => {
-                const blockElements = document.querySelectorAll('div, p, span, section, article, header, footer, aside, nav, main, ul, ol, li, dl, dt, dd, h1, h2, h3, h4, h5, h6');
-                blockElements.forEach(elem => {
-                    if (elem.innerText.trim() === '') {
-                        elem.remove();
-                    }
-                });
-            };
-
-            // Remove margin-right and padding-right from body (often added by modal scripts)
-            document.body.style.marginRight = '0px';
-            document.body.style.paddingRight = '0px';
-            document.body.style.overflow = 'auto';
-
-            // Wait a bit for any animations to complete
-            await new Promise(resolve => setTimeout(resolve, 100));
-        }
-        """
-        
-        try:
-            await page.evaluate(remove_overlays_js)
-            await page.wait_for_timeout(500)  # Wait for any animations to complete
-        except Exception as e:
-            if self.verbose:
-                print(f"Warning: Failed to remove overlay elements: {str(e)}")
-
-    async def take_screenshot(self, page: Page) -> str:
-        try:
-            # The page is already loaded, just take the screenshot
-            screenshot = await page.screenshot(full_page=True)
-            return base64.b64encode(screenshot).decode('utf-8')
-        except Exception as e:
-            error_message = f"Failed to take screenshot: {str(e)}"
-            print(error_message)
-
-            # Generate an error image
-            img = Image.new('RGB', (800, 600), color='black')
-            draw = ImageDraw.Draw(img)
-            font = ImageFont.load_default()
-            draw.text((10, 10), error_message, fill=(255, 255, 255), font=font)
-            
-            buffered = BytesIO()
-            img.save(buffered, format="JPEG")
-            return base64.b64encode(buffered.getvalue()).decode('utf-8')
-        finally:
-            await page.close()
-
diff --git a/crawl4ai/async_database.py b/crawl4ai/async_database.py
index 273ca6c9..c52e3db6 100644
--- a/crawl4ai/async_database.py
+++ b/crawl4ai/async_database.py
@@ -91,7 +91,8 @@ class AsyncDatabaseManager:
                     links TEXT DEFAULT "{}",
                     metadata TEXT DEFAULT "{}",
                     screenshot TEXT DEFAULT "",
-                    response_headers TEXT DEFAULT "{}"  -- New column added
+                    response_headers TEXT DEFAULT "{}",
+                    downloaded_files TEXT DEFAULT "{}"  -- New column added
                 )
             ''')
         
@@ -108,7 +109,7 @@ class AsyncDatabaseManager:
         column_names = await self.execute_with_retry(_check_columns)
         
         # List of new columns to add
-        new_columns = ['media', 'links', 'metadata', 'screenshot', 'response_headers']
+        new_columns = ['media', 'links', 'metadata', 'screenshot', 'response_headers', 'downloaded_files']
         
         for column in new_columns:
             if column not in column_names:
@@ -130,7 +131,7 @@ class AsyncDatabaseManager:
         async def _get(db):
             async with db.execute(
                 '''
-                SELECT url, html, cleaned_html, markdown, extracted_content, success, media, links, metadata, screenshot, response_headers
+                SELECT url, html, cleaned_html, markdown, extracted_content, success, media, links, metadata, screenshot, response_headers, downloaded_files
                 FROM crawled_data WHERE url = ?
                 ''',
                 (url,)
@@ -149,7 +150,8 @@ class AsyncDatabaseManager:
                         json.loads(row[7] or '{}'),  # links
                         json.loads(row[8] or '{}'),  # metadata
                         row[9],  # screenshot
-                        json.loads(row[10] or '{}')  # response_headers
+                        json.loads(row[10] or '{}'),  # response_headers
+                        json.loads(row[11] or '[]')  # downloaded_files
                     )
                 return None
 
@@ -171,15 +173,16 @@ class AsyncDatabaseManager:
         links: str = "{}",
         metadata: str = "{}",
         screenshot: str = "",
-        response_headers: str = "{}"  # New parameter added
+        response_headers: str = "{}",
+        downloaded_files: str = "[]"
     ):
         """Cache URL data with retry logic"""
         async def _cache(db):
             await db.execute('''
                 INSERT INTO crawled_data (
-                    url, html, cleaned_html, markdown, extracted_content, success, media, links, metadata, screenshot, response_headers
+                    url, html, cleaned_html, markdown, extracted_content, success, media, links, metadata, screenshot, response_headers, downloaded_files
                 )
-                VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?)
+                VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?)
                 ON CONFLICT(url) DO UPDATE SET
                     html = excluded.html,
                     cleaned_html = excluded.cleaned_html,
@@ -190,8 +193,9 @@ class AsyncDatabaseManager:
                     links = excluded.links,    
                     metadata = excluded.metadata,      
                     screenshot = excluded.screenshot,
-                    response_headers = excluded.response_headers  -- Update response_headers
-            ''', (url, html, cleaned_html, markdown, extracted_content, success, media, links, metadata, screenshot, response_headers))
+                    response_headers = excluded.response_headers,  -- Update response_headers
+                    downloaded_files = excluded.downloaded_files
+            ''', (url, html, cleaned_html, markdown, extracted_content, success, media, links, metadata, screenshot, response_headers, downloaded_files))
 
         try:
             await self.execute_with_retry(_cache)
diff --git a/crawl4ai/async_webcrawler.py b/crawl4ai/async_webcrawler.py
index 8415f9b9..cec1ace0 100644
--- a/crawl4ai/async_webcrawler.py
+++ b/crawl4ai/async_webcrawler.py
@@ -160,12 +160,35 @@ class AsyncWebCrawler:
             if async_response:
                 crawl_result.status_code = async_response.status_code
                 crawl_result.response_headers = async_response.response_headers
+                crawl_result.downloaded_files = async_response.downloaded_files
             else:
                 crawl_result.status_code = 200
                 crawl_result.response_headers = cached[10]
+                # crawl_result.downloaded_files = cached[11]
 
             crawl_result.success = bool(html)
             crawl_result.session_id = kwargs.get("session_id", None)
+
+
+            if not is_raw_html:
+                if not bool(cached) or kwargs.get("bypass_cache", False) or self.always_by_pass_cache:
+                    await async_db_manager.acache_url(
+                        url = url,
+                        html = html,
+                        cleaned_html = crawl_result.cleaned_html,
+                        markdown = crawl_result.markdown,
+                        extracted_content = extracted_content,
+                        success = True,
+                        media = json.dumps(crawl_result.media),
+                        links = json.dumps(crawl_result.links),
+                        metadata = json.dumps(crawl_result.metadata),
+                        screenshot=screenshot,
+                        response_headers=json.dumps(crawl_result.response_headers),
+                        downloaded_files=json.dumps(crawl_result.downloaded_files),
+                        
+                    )
+
+
             return crawl_result
         
         except Exception as e:
@@ -233,8 +256,6 @@ class AsyncWebCrawler:
         css_selector: str,
         screenshot: str,
         verbose: bool,
-        is_cached: bool,
-        async_response: Optional[AsyncCrawlResponse],
         **kwargs,
     ) -> CrawlResult:
         t = time.time()
@@ -298,28 +319,6 @@ class AsyncWebCrawler:
 
         screenshot = None if not screenshot else screenshot
         
-        response_headers = "{}"  # Default value
-        if async_response:
-            # Serialize response_headers dict to JSON string
-            response_headers = json.dumps(async_response.response_headers, ensure_ascii=False)
-
-
-        if not kwargs.get("is_raw_html", False):
-            if not is_cached or kwargs.get("bypass_cache", False) or self.always_by_pass_cache:
-                await async_db_manager.acache_url(
-                    url,
-                    html,
-                    cleaned_html,
-                    markdown,
-                    extracted_content,
-                    True,
-                    json.dumps(media),
-                    json.dumps(links),
-                    json.dumps(metadata),
-                    screenshot=screenshot,
-                    response_headers=response_headers,
-                )
-
         return CrawlResult(
             url=url,
             html=html,
diff --git a/crawl4ai/content_cleaning_strategy.py b/crawl4ai/content_cleaning_strategy.py
deleted file mode 100644
index b8a5053d..00000000
--- a/crawl4ai/content_cleaning_strategy.py
+++ /dev/null
@@ -1,198 +0,0 @@
-from bs4 import BeautifulSoup, Tag
-import re
-from typing import Optional
-
-class ContentCleaningStrategy:
-    def __init__(self):
-        # Precompile regex patterns for performance
-        self.negative_patterns = re.compile(r'nav|footer|header|sidebar|ads|comment', re.I)
-        self.positive_patterns = re.compile(r'content|article|main|post', re.I)
-        self.priority_tags = {'article', 'main', 'section', 'div'}
-        self.non_content_tags = {'nav', 'footer', 'header', 'aside'}
-        # Thresholds
-        self.text_density_threshold = 9.0
-        self.min_word_count = 50
-        self.link_density_threshold = 0.2
-        self.max_dom_depth = 10  # To prevent excessive DOM traversal
-
-    def clean(self, clean_html: str, soup = None) -> str:
-        """
-        Main function that takes cleaned HTML and returns super cleaned HTML.
-
-        Args:
-            clean_html (str): The cleaned HTML content.
-
-        Returns:
-            str: The super cleaned HTML containing only the main content.
-        """
-        try:
-            if not clean_html or not isinstance(clean_html, str):
-                return ''
-            if not soup:
-                # soup = BeautifulSoup(clean_html, 'html.parser')
-                soup = BeautifulSoup(clean_html, 'lxml')
-            main_content = self.extract_main_content(soup)
-            if main_content:
-                super_clean_element = self.clean_element(main_content)
-                return super_clean_element.encode_contents().decode('utf-8')
-            else:
-                return ''
-        except Exception:
-            # Handle exceptions silently or log them as needed
-            return ''
-
-    def extract_main_content(self, soup) -> Optional[Tag]:
-        """
-        Identifies and extracts the main content element from the HTML.
-
-        Args:
-            soup (BeautifulSoup): The parsed HTML soup.
-
-        Returns:
-            Optional[Tag]: The Tag object containing the main content, or None if not found.
-        """
-        candidates = []
-        for element in soup.find_all(self.priority_tags):
-            if self.is_non_content_tag(element):
-                continue
-            if self.has_negative_class_id(element):
-                continue
-            score = self.calculate_content_score(element)
-            candidates.append((score, element))
-        
-        if not candidates:
-            return None
-
-        # Sort candidates by score in descending order
-        candidates.sort(key=lambda x: x[0], reverse=True)
-        # Select the element with the highest score
-        best_element = candidates[0][1]
-        return best_element
-
-    def calculate_content_score(self, element: Tag) -> float:
-        """
-        Calculates a score for an element based on various heuristics.
-
-        Args:
-            element (Tag): The HTML element to score.
-
-        Returns:
-            float: The content score of the element.
-        """
-        score = 0.0
-
-        if self.is_priority_tag(element):
-            score += 5.0
-        if self.has_positive_class_id(element):
-            score += 3.0
-        if self.has_negative_class_id(element):
-            score -= 3.0
-        if self.is_high_text_density(element):
-            score += 2.0
-        if self.is_low_link_density(element):
-            score += 2.0
-        if self.has_sufficient_content(element):
-            score += 2.0
-        if self.has_headings(element):
-            score += 3.0
-
-        dom_depth = self.calculate_dom_depth(element)
-        score += min(dom_depth, self.max_dom_depth) * 0.5  # Adjust weight as needed
-
-        return score
-
-    def is_priority_tag(self, element: Tag) -> bool:
-        """Checks if the element is a priority tag."""
-        return element.name in self.priority_tags
-
-    def is_non_content_tag(self, element: Tag) -> bool:
-        """Checks if the element is a non-content tag."""
-        return element.name in self.non_content_tags
-
-    def has_negative_class_id(self, element: Tag) -> bool:
-        """Checks if the element has negative indicators in its class or id."""
-        class_id = ' '.join(filter(None, [
-            self.get_attr_str(element.get('class')),
-            element.get('id', '')
-        ]))
-        return bool(self.negative_patterns.search(class_id))
-
-    def has_positive_class_id(self, element: Tag) -> bool:
-        """Checks if the element has positive indicators in its class or id."""
-        class_id = ' '.join(filter(None, [
-            self.get_attr_str(element.get('class')),
-            element.get('id', '')
-        ]))
-        return bool(self.positive_patterns.search(class_id))
-
-    @staticmethod
-    def get_attr_str(attr) -> str:
-        """Converts an attribute value to a string."""
-        if isinstance(attr, list):
-            return ' '.join(attr)
-        elif isinstance(attr, str):
-            return attr
-        else:
-            return ''
-
-    def is_high_text_density(self, element: Tag) -> bool:
-        """Determines if the element has high text density."""
-        text_density = self.calculate_text_density(element)
-        return text_density > self.text_density_threshold
-
-    def calculate_text_density(self, element: Tag) -> float:
-        """Calculates the text density of an element."""
-        text_length = len(element.get_text(strip=True))
-        tag_count = len(element.find_all())
-        tag_count = tag_count or 1  # Prevent division by zero
-        return text_length / tag_count
-
-    def is_low_link_density(self, element: Tag) -> bool:
-        """Determines if the element has low link density."""
-        link_density = self.calculate_link_density(element)
-        return link_density < self.link_density_threshold
-
-    def calculate_link_density(self, element: Tag) -> float:
-        """Calculates the link density of an element."""
-        text = element.get_text(strip=True)
-        if not text:
-            return 0.0
-        link_text = ' '.join(a.get_text(strip=True) for a in element.find_all('a'))
-        return len(link_text) / len(text) if text else 0.0
-
-    def has_sufficient_content(self, element: Tag) -> bool:
-        """Checks if the element has sufficient word count."""
-        word_count = len(element.get_text(strip=True).split())
-        return word_count >= self.min_word_count
-
-    def calculate_dom_depth(self, element: Tag) -> int:
-        """Calculates the depth of an element in the DOM tree."""
-        depth = 0
-        current_element = element
-        while current_element.parent and depth < self.max_dom_depth:
-            depth += 1
-            current_element = current_element.parent
-        return depth
-
-    def has_headings(self, element: Tag) -> bool:
-        """Checks if the element contains heading tags."""
-        return bool(element.find(['h1', 'h2', 'h3']))
-
-    def clean_element(self, element: Tag) -> Tag:
-        """
-        Cleans the selected element by removing unnecessary attributes and nested non-content elements.
-
-        Args:
-            element (Tag): The HTML element to clean.
-
-        Returns:
-            Tag: The cleaned HTML element.
-        """
-        for tag in element.find_all(['script', 'style', 'aside']):
-            tag.decompose()
-        for tag in element.find_all():
-            attrs = dict(tag.attrs)
-            for attr in attrs:
-                if attr in ['style', 'onclick', 'onmouseover', 'align', 'bgcolor']:
-                    del tag.attrs[attr]
-        return element
diff --git a/crawl4ai/content_filter_strategy.py b/crawl4ai/content_filter_strategy.py
new file mode 100644
index 00000000..850ebf11
--- /dev/null
+++ b/crawl4ai/content_filter_strategy.py
@@ -0,0 +1,344 @@
+import os
+import re
+import time
+from bs4 import BeautifulSoup, Tag
+from typing import List, Tuple, Dict
+from rank_bm25 import BM25Okapi
+import nltk
+from time import perf_counter
+from html5lib import parse, treebuilders
+from time import perf_counter
+from collections import deque
+from bs4 import BeautifulSoup, NavigableString, Tag
+from .utils import clean_tokens
+from abc import ABC, abstractmethod
+
+class RelevantContentFilter(ABC):
+    def __init__(self, user_query: str = None):
+        self.user_query = user_query
+        self.included_tags = {
+            # Primary structure
+            'article', 'main', 'section', 'div', 
+            # List structures
+            'ul', 'ol', 'li', 'dl', 'dt', 'dd',
+            # Text content
+            'p', 'span', 'blockquote', 'pre', 'code',
+            # Headers
+            'h1', 'h2', 'h3', 'h4', 'h5', 'h6',
+            # Tables
+            'table', 'thead', 'tbody', 'tr', 'td', 'th',
+            # Other semantic elements
+            'figure', 'figcaption', 'details', 'summary',
+            # Text formatting
+            'em', 'strong', 'b', 'i', 'mark', 'small',
+            # Rich content
+            'time', 'address', 'cite', 'q'
+        }
+        self.excluded_tags = {
+            'nav', 'footer', 'header', 'aside', 'script',
+            'style', 'form', 'iframe', 'noscript'
+        }
+        self.header_tags = {'h1', 'h2', 'h3', 'h4', 'h5', 'h6'}
+        self.negative_patterns = re.compile(
+            r'nav|footer|header|sidebar|ads|comment|promo|advert|social|share',
+            re.I
+        )
+        self.min_word_count = 2
+        
+    @abstractmethod
+    def filter_content(self, html: str) -> List[str]:
+        """Abstract method to be implemented by specific filtering strategies"""
+        pass
+    
+    def extract_page_query(self, soup: BeautifulSoup, body: Tag) -> str:
+        """Common method to extract page metadata with fallbacks"""
+        if self.user_query:
+            return self.user_query
+
+        query_parts = []
+        
+        # Title
+        if soup.title:
+            query_parts.append(soup.title.string)
+        elif soup.find('h1'):
+            query_parts.append(soup.find('h1').get_text())
+            
+        # Meta tags
+        temp = ""
+        for meta_name in ['keywords', 'description']:
+            meta = soup.find('meta', attrs={'name': meta_name})
+            if meta and meta.get('content'):
+                query_parts.append(meta['content'])
+                temp += meta['content']
+                
+        # If still empty, grab first significant paragraph
+        if not temp:
+            # Find the first <p> tag whose text contains more than 150 characters
+            for p in body.find_all('p'):
+                if len(p.get_text()) > 150:
+                    query_parts.append(p.get_text()[:150])
+                    break        
+                                
+        return ' '.join(filter(None, query_parts))
+
+
+    def extract_text_chunks(self, body: Tag) -> List[Tuple[str, str]]:
+        """
+        Extracts text chunks from a BeautifulSoup body element while preserving order.
+        Returns list of tuples (text, tag_name) for classification.
+        
+        Args:
+            body: BeautifulSoup Tag object representing the body element
+            
+        Returns:
+            List of (text, tag_name) tuples
+        """
+        # Tags to ignore - inline elements that shouldn't break text flow
+        INLINE_TAGS = {
+            'a', 'abbr', 'acronym', 'b', 'bdo', 'big', 'br', 'button', 'cite', 'code',
+            'dfn', 'em', 'i', 'img', 'input', 'kbd', 'label', 'map', 'object', 'q',
+            'samp', 'script', 'select', 'small', 'span', 'strong', 'sub', 'sup',
+            'textarea', 'time', 'tt', 'var'
+        }
+        
+        # Tags that typically contain meaningful headers
+        HEADER_TAGS = {'h1', 'h2', 'h3', 'h4', 'h5', 'h6', 'header'}
+        
+        chunks = []
+        current_text = []
+        chunk_index = 0
+    
+        def should_break_chunk(tag: Tag) -> bool:
+            """Determine if a tag should cause a break in the current text chunk"""
+            return (
+                tag.name not in INLINE_TAGS
+                and not (tag.name == 'p' and len(current_text) == 0)
+            )
+        
+        # Use deque for efficient push/pop operations
+        stack = deque([(body, False)])
+        
+        while stack:
+            element, visited = stack.pop()
+            
+            if visited:
+                # End of block element - flush accumulated text
+                if current_text and should_break_chunk(element):
+                    text = ' '.join(''.join(current_text).split())
+                    if text:
+                        tag_type = 'header' if element.name in HEADER_TAGS else 'content'
+                        chunks.append((chunk_index, text, tag_type, element))
+                        chunk_index += 1
+                    current_text = []
+                continue
+                
+            if isinstance(element, NavigableString):
+                if str(element).strip():
+                    current_text.append(str(element).strip())
+                continue
+                
+            # Pre-allocate children to avoid multiple list operations
+            children = list(element.children)
+            if not children:
+                continue
+                
+            # Mark block for revisit after processing children
+            stack.append((element, True))
+            
+            # Add children in reverse order for correct processing
+            for child in reversed(children):
+                if isinstance(child, (Tag, NavigableString)):
+                    stack.append((child, False))
+        
+        # Handle any remaining text
+        if current_text:
+            text = ' '.join(''.join(current_text).split())
+            if text:
+                chunks.append((chunk_index, text, 'content', body))
+        
+        return chunks    
+    
+
+    def extract_text_chunks1(self, soup: BeautifulSoup) -> List[Tuple[int, str, Tag]]:
+        """Common method for extracting text chunks"""
+        _text_cache = {}
+        def fast_text(element: Tag) -> str:
+            elem_id = id(element)
+            if elem_id in _text_cache:
+                return _text_cache[elem_id]
+            texts = []
+            for content in element.contents:
+                if isinstance(content, str):
+                    text = content.strip()
+                    if text:
+                        texts.append(text)
+            result = ' '.join(texts)
+            _text_cache[elem_id] = result
+            return result
+        
+        candidates = []
+        index = 0
+        
+        def dfs(element):
+            nonlocal index
+            if isinstance(element, Tag):
+                if element.name in self.included_tags:
+                    if not self.is_excluded(element):
+                        text = fast_text(element)
+                        word_count = len(text.split())
+                        
+                        # Headers pass through with adjusted minimum
+                        if element.name in self.header_tags:
+                            if word_count >= 3:  # Minimal sanity check for headers
+                                candidates.append((index, text, element))
+                                index += 1
+                        # Regular content uses standard minimum
+                        elif word_count >= self.min_word_count:
+                            candidates.append((index, text, element))
+                            index += 1
+                            
+                for child in element.children:
+                    dfs(child)
+
+        dfs(soup.body if soup.body else soup)
+        return candidates
+
+    def is_excluded(self, tag: Tag) -> bool:
+        """Common method for exclusion logic"""
+        if tag.name in self.excluded_tags:
+            return True
+        class_id = ' '.join(filter(None, [
+            ' '.join(tag.get('class', [])),
+            tag.get('id', '')
+        ]))
+        return bool(self.negative_patterns.search(class_id))
+
+    def clean_element(self, tag: Tag) -> str:
+        """Common method for cleaning HTML elements with minimal overhead"""
+        if not tag or not isinstance(tag, Tag):
+            return ""
+            
+        unwanted_tags = {'script', 'style', 'aside', 'form', 'iframe', 'noscript'}
+        unwanted_attrs = {'style', 'onclick', 'onmouseover', 'align', 'bgcolor', 'class', 'id'}
+        
+        # Use string builder pattern for better performance
+        builder = []
+        
+        def render_tag(elem):
+            if not isinstance(elem, Tag):
+                if isinstance(elem, str):
+                    builder.append(elem.strip())
+                return
+                
+            if elem.name in unwanted_tags:
+                return
+                
+            # Start tag
+            builder.append(f'<{elem.name}')
+            
+            # Add cleaned attributes
+            attrs = {k: v for k, v in elem.attrs.items() if k not in unwanted_attrs}
+            for key, value in attrs.items():
+                builder.append(f' {key}="{value}"')
+                
+            builder.append('>')
+            
+            # Process children
+            for child in elem.children:
+                render_tag(child)
+                
+            # Close tag
+            builder.append(f'</{elem.name}>')
+        
+        try:
+            render_tag(tag)
+            return ''.join(builder)
+        except Exception:
+            return str(tag)  # Fallback to original if anything fails
+
+class BM25ContentFilter(RelevantContentFilter):
+    def __init__(self, user_query: str = None, bm25_threshold: float = 1.0):
+        super().__init__(user_query=user_query)
+        self.bm25_threshold = bm25_threshold
+        self.priority_tags = {
+            'h1': 5.0,
+            'h2': 4.0,
+            'h3': 3.0,
+            'title': 4.0,
+            'strong': 2.0,
+            'b': 1.5,
+            'em': 1.5,
+            'blockquote': 2.0,
+            'code': 2.0,
+            'pre': 1.5,
+            'th': 1.5,  # Table headers
+        }
+
+    def filter_content(self, html: str) -> List[str]:
+        """Implements content filtering using BM25 algorithm with priority tag handling"""
+        if not html or not isinstance(html, str):
+            return []
+
+        soup = BeautifulSoup(html, 'lxml')
+        body = soup.find('body')
+        query = self.extract_page_query(soup.find('head'), body)
+        candidates = self.extract_text_chunks(body)
+
+        if not candidates:
+            return []
+
+        # Split into priority and regular candidates
+        priority_candidates = []
+        regular_candidates = []
+        
+        for index, chunk, tag_type, tag in candidates:
+            if tag.name in self.priority_tags:
+                priority_candidates.append((index, chunk, tag_type, tag))
+            else:
+                regular_candidates.append((index, chunk, tag_type, tag))
+
+        # Process regular content with BM25
+        tokenized_corpus = [chunk.lower().split() for _, chunk, _, _ in regular_candidates]
+        tokenized_query = query.lower().split()
+        
+        # Clean from stop words and noise
+        tokenized_corpus = [clean_tokens(tokens) for tokens in tokenized_corpus]
+        tokenized_query = clean_tokens(tokenized_query)
+        
+        bm25 = BM25Okapi(tokenized_corpus)
+        scores = bm25.get_scores(tokenized_query)
+
+        # Score regular candidates (boost is always 1.0 here; priority tags were split out above)
+        scored_candidates = [
+            (score * self.priority_tags.get(tag.name, 1.0), index, chunk, tag_type, tag)
+            for score, (index, chunk, tag_type, tag) in zip(scores, regular_candidates)
+        ]
+        scored_candidates.sort(key=lambda x: x[0], reverse=True)
+
+        # Process scored candidates
+        selected_tags = set()
+        selected_candidates = []
+
+        # First add all priority candidates
+        for index, chunk, tag_type, tag in priority_candidates:
+            tag_id = id(tag)
+            if tag_id not in selected_tags:
+                selected_candidates.append((index, chunk, tag))
+                selected_tags.add(tag_id)
+
+        # Then add scored regular candidates that meet threshold
+        for score, index, chunk, tag_type, tag in scored_candidates:
+            if score < self.bm25_threshold:
+                continue
+            tag_id = id(tag)
+            if tag_id not in selected_tags:
+                selected_candidates.append((index, chunk, tag))
+                selected_tags.add(tag_id)
+
+        if not selected_candidates:
+            return []
+
+        # Sort by original document order
+        selected_candidates.sort(key=lambda x: x[0])
+        return [self.clean_element(tag) for _, _, tag in selected_candidates]
+
diff --git a/crawl4ai/content_scrapping_strategy.py b/crawl4ai/content_scrapping_strategy.py
index a2dbbd96..9c81638c 100644
--- a/crawl4ai/content_scrapping_strategy.py
+++ b/crawl4ai/content_scrapping_strategy.py
@@ -8,7 +8,8 @@ from .config import *
 from bs4 import element, NavigableString, Comment
 from urllib.parse import urljoin
 from requests.exceptions import InvalidSchema
-from .content_cleaning_strategy import ContentCleaningStrategy
+# from .content_cleaning_strategy import ContentCleaningStrategy
+from .content_filter_strategy import RelevantContentFilter, BM25ContentFilter
 
 from .utils import (
     sanitize_input_encode,
@@ -532,8 +533,15 @@ class WebScrapingStrategy(ContentScrapingStrategy):
         fit_markdown = "Set flag 'fit_markdown' to True to get cleaned HTML content."
         fit_html = "Set flag 'fit_markdown' to True to get cleaned HTML content."
         if kwargs.get('fit_markdown', False):
-            cleaner = ContentCleaningStrategy()
-            fit_html = cleaner.clean(cleaned_html)
+            # cleaner = ContentCleaningStrategy()
+            # fit_html = cleaner.clean(cleaned_html)
+            # fit_markdown = h.handle(fit_html)
+            content_filter = BM25ContentFilter(
+                user_query= kwargs.get('fit_markdown_user_query', None),
+                bm25_threshold= kwargs.get('fit_markdown_bm25_threshold', 1.0)
+            )
+            fit_html = content_filter.filter_content(html)
+            fit_html = '\n'.join('<div>{}</div>'.format(s) for s in fit_html)
             fit_markdown = h.handle(fit_html)
 
         cleaned_html = sanitize_html(cleaned_html)
diff --git a/crawl4ai/models.py b/crawl4ai/models.py
index 4ac06797..cab4c45b 100644
--- a/crawl4ai/models.py
+++ b/crawl4ai/models.py
@@ -1,5 +1,7 @@
 from pydantic import BaseModel, HttpUrl
-from typing import List, Dict, Optional
+from typing import List, Dict, Optional, Callable, Awaitable
+
+
 
 class UrlModel(BaseModel):
     url: HttpUrl
@@ -12,6 +14,7 @@ class CrawlResult(BaseModel):
     cleaned_html: Optional[str] = None
     media: Dict[str, List[Dict]] = {}
     links: Dict[str, List[Dict]] = {}
+    downloaded_files: Optional[List[str]] = None
     screenshot: Optional[str] = None
     markdown: Optional[str] = None
     fit_markdown: Optional[str] = None
@@ -21,4 +24,15 @@ class CrawlResult(BaseModel):
     error_message: Optional[str] = None
     session_id: Optional[str] = None
     response_headers: Optional[dict] = None
-    status_code: Optional[int] = None
\ No newline at end of file
+    status_code: Optional[int] = None
+    
+class AsyncCrawlResponse(BaseModel):
+    html: str
+    response_headers: Dict[str, str]
+    status_code: int
+    screenshot: Optional[str] = None
+    get_delayed_content: Optional[Callable[[Optional[float]], Awaitable[str]]] = None
+    downloaded_files: Optional[List[str]] = None
+
+    class Config:
+        arbitrary_types_allowed = True
diff --git a/crawl4ai/utils.py b/crawl4ai/utils.py
index d8bd6992..49483f43 100644
--- a/crawl4ai/utils.py
+++ b/crawl4ai/utils.py
@@ -1054,3 +1054,58 @@ def is_external_url(url, base_domain):
         return False
         
     return False
+
+def clean_tokens(tokens: list[str]) -> list[str]:
+    # Set of tokens to remove
+    noise = {'ccp', 'up', '↑', '▲', '⬆️', 'a', 'an', 'at', 'by', 'in', 'of', 'on', 'to', 'the'}
+
+    STOP_WORDS = {
+        'a', 'an', 'and', 'are', 'as', 'at', 'be', 'by', 'for', 'from', 
+        'has', 'he', 'in', 'is', 'it', 'its', 'of', 'on', 'that', 'the', 
+        'to', 'was', 'were', 'will', 'with',
+        
+        # Pronouns
+        'i', 'you', 'he', 'she', 'it', 'we', 'they',
+        'me', 'him', 'her', 'us', 'them',
+        'my', 'your', 'his', 'her', 'its', 'our', 'their',
+        'mine', 'yours', 'hers', 'ours', 'theirs',
+        'myself', 'yourself', 'himself', 'herself', 'itself', 'ourselves', 'themselves',
+        
+        # Common verbs
+        'am', 'is', 'are', 'was', 'were', 'be', 'been', 'being',
+        'have', 'has', 'had', 'having', 'do', 'does', 'did', 'doing',
+        
+        # Prepositions
+        'about', 'above', 'across', 'after', 'against', 'along', 'among', 'around',
+        'at', 'before', 'behind', 'below', 'beneath', 'beside', 'between', 'beyond',
+        'by', 'down', 'during', 'except', 'for', 'from', 'in', 'inside', 'into',
+        'near', 'of', 'off', 'on', 'out', 'outside', 'over', 'past', 'through',
+        'to', 'toward', 'under', 'underneath', 'until', 'up', 'upon', 'with', 'within',
+        
+        # Conjunctions
+        'and', 'but', 'or', 'nor', 'for', 'yet', 'so',
+        'although', 'because', 'since', 'unless',
+        
+        # Articles
+        'a', 'an', 'the',
+        
+        # Other common words
+        'this', 'that', 'these', 'those',
+        'what', 'which', 'who', 'whom', 'whose',
+        'when', 'where', 'why', 'how',
+        'all', 'any', 'both', 'each', 'few', 'more', 'most', 'other', 'some', 'such',
+        'can', 'cannot', "can't", 'could', "couldn't",
+        'may', 'might', 'must', "mustn't",
+        'shall', 'should', "shouldn't",
+        'will', "won't", 'would', "wouldn't",
+        'not', "n't", 'no', 'nor', 'none'
+    }   
+   
+    # Single comprehension, more efficient than multiple passes
+    return [token for token in tokens 
+            if len(token) > 2 
+            and token not in noise 
+            and token not in STOP_WORDS
+            and not token.startswith('↑')
+            and not token.startswith('▲')
+            and not token.startswith('⬆')]
diff --git a/tests/async/test_async_doanloader.py b/tests/async/test_async_doanloader.py
new file mode 100644
index 00000000..4798b4ca
--- /dev/null
+++ b/tests/async/test_async_doanloader.py
@@ -0,0 +1,229 @@
+import os
+import sys
+import asyncio
+import shutil
+from typing import List
+import tempfile
+import time
+
+# Add the parent directory to the Python path
+parent_dir = os.path.dirname(os.path.dirname(os.path.abspath(__file__)))
+sys.path.append(parent_dir)
+
+from crawl4ai.async_webcrawler import AsyncWebCrawler
+
+class TestDownloads:
+    def __init__(self):
+        self.temp_dir = tempfile.mkdtemp(prefix="crawl4ai_test_")
+        self.download_dir = os.path.join(self.temp_dir, "downloads")
+        os.makedirs(self.download_dir, exist_ok=True)
+        self.results: List[str] = []
+        
+    def cleanup(self):
+        shutil.rmtree(self.temp_dir)
+        
+    def log_result(self, test_name: str, success: bool, message: str = ""):
+        result = f"{'✅' if success else '❌'} {test_name}: {message}"
+        self.results.append(result)
+        print(result)
+        
+    async def test_basic_download(self):
+        """Test basic file download functionality"""
+        try:
+            async with AsyncWebCrawler(
+                accept_downloads=True,
+                downloads_path=self.download_dir,
+                verbose=True
+            ) as crawler:
+                # Python.org downloads page typically has stable download links
+                result = await crawler.arun(
+                    url="https://www.python.org/downloads/",
+                    js_code="""
+                    // Click first download link
+                    const downloadLink = document.querySelector('a[href$=".exe"]');
+                    if (downloadLink) downloadLink.click();
+                    """
+                )
+                
+                success = result.downloaded_files is not None and len(result.downloaded_files) > 0
+                self.log_result(
+                    "Basic Download",
+                    success,
+                    f"Downloaded {len(result.downloaded_files or [])} files" if success else "No files downloaded"
+                )
+        except Exception as e:
+            self.log_result("Basic Download", False, str(e))
+
+    async def test_persistent_context_download(self):
+        """Test downloads with persistent context"""
+        try:
+            user_data_dir = os.path.join(self.temp_dir, "user_data")
+            os.makedirs(user_data_dir, exist_ok=True)
+            
+            async with AsyncWebCrawler(
+                accept_downloads=True,
+                downloads_path=self.download_dir,
+                use_persistent_context=True,
+                user_data_dir=user_data_dir,
+                verbose=True
+            ) as crawler:
+                result = await crawler.arun(
+                    url="https://www.python.org/downloads/",
+                    js_code="""
+                    const downloadLink = document.querySelector('a[href$=".exe"]');
+                    if (downloadLink) downloadLink.click();
+                    """
+                )
+                
+                success = result.downloaded_files is not None and len(result.downloaded_files) > 0
+                self.log_result(
+                    "Persistent Context Download",
+                    success,
+                    f"Downloaded {len(result.downloaded_files or [])} files" if success else "No files downloaded"
+                )
+        except Exception as e:
+            self.log_result("Persistent Context Download", False, str(e))
+
+    async def test_multiple_downloads(self):
+        """Test multiple simultaneous downloads"""
+        try:
+            async with AsyncWebCrawler(
+                accept_downloads=True,
+                downloads_path=self.download_dir,
+                verbose=True
+            ) as crawler:
+                result = await crawler.arun(
+                    url="https://www.python.org/downloads/",
+                    js_code="""
+                    // Click multiple download links
+                    const downloadLinks = document.querySelectorAll('a[href$=".exe"]');
+                    downloadLinks.forEach(link => link.click());
+                    """
+                )
+                
+                success = result.downloaded_files is not None and len(result.downloaded_files) > 1
+                self.log_result(
+                    "Multiple Downloads",
+                    success,
+                    f"Downloaded {len(result.downloaded_files or [])} files" if success else "Not enough files downloaded"
+                )
+        except Exception as e:
+            self.log_result("Multiple Downloads", False, str(e))
+
+    async def test_different_browsers(self):
+        """Test downloads across different browser types"""
+        browsers = ["chromium", "firefox", "webkit"]
+        
+        for browser_type in browsers:
+            try:
+                async with AsyncWebCrawler(
+                    accept_downloads=True,
+                    downloads_path=self.download_dir,
+                    browser_type=browser_type,
+                    verbose=True
+                ) as crawler:
+                    result = await crawler.arun(
+                        url="https://www.python.org/downloads/",
+                        js_code="""
+                        const downloadLink = document.querySelector('a[href$=".exe"]');
+                        if (downloadLink) downloadLink.click();
+                        """
+                    )
+                    
+                    success = result.downloaded_files is not None and len(result.downloaded_files) > 0
+                    self.log_result(
+                        f"{browser_type.title()} Download",
+                        success,
+                        f"Downloaded {len(result.downloaded_files or [])} files" if success else "No files downloaded"
+                    )
+            except Exception as e:
+                self.log_result(f"{browser_type.title()} Download", False, str(e))
+
+    async def test_edge_cases(self):
+        """Test various edge cases"""
+        
+        # Test 1: Downloads without specifying download path
+        try:
+            async with AsyncWebCrawler(
+                accept_downloads=True,
+                verbose=True
+            ) as crawler:
+                result = await crawler.arun(
+                    url="https://www.python.org/downloads/",
+                    js_code="document.querySelector('a[href$=\".exe\"]').click()"
+                )
+                self.log_result(
+                    "Default Download Path",
+                    True,
+                    f"Downloaded to default path: {result.downloaded_files[0] if result.downloaded_files else 'None'}"
+                )
+        except Exception as e:
+            self.log_result("Default Download Path", False, str(e))
+
+        # Test 2: Downloads with invalid path
+        try:
+            async with AsyncWebCrawler(
+                accept_downloads=True,
+                downloads_path="/invalid/path/that/doesnt/exist",
+                verbose=True
+            ) as crawler:
+                result = await crawler.arun(
+                    url="https://www.python.org/downloads/",
+                    js_code="document.querySelector('a[href$=\".exe\"]').click()"
+                )
+                self.log_result("Invalid Download Path", False, "Should have raised an error")
+        except Exception as e:
+            self.log_result("Invalid Download Path", True, "Correctly handled invalid path")
+
+        # Test 3: Download with accept_downloads=False
+        try:
+            async with AsyncWebCrawler(
+                accept_downloads=False,
+                verbose=True
+            ) as crawler:
+                result = await crawler.arun(
+                    url="https://www.python.org/downloads/",
+                    js_code="document.querySelector('a[href$=\".exe\"]').click()"
+                )
+                success = result.downloaded_files is None
+                self.log_result(
+                    "Disabled Downloads",
+                    success,
+                    "Correctly ignored downloads" if success else "Unexpectedly downloaded files"
+                )
+        except Exception as e:
+            self.log_result("Disabled Downloads", False, str(e))
+
+    async def run_all_tests(self):
+        """Run all test cases"""
+        print("\n🧪 Running Download Tests...\n")
+        
+        test_methods = [
+            self.test_basic_download,
+            self.test_persistent_context_download,
+            self.test_multiple_downloads,
+            self.test_different_browsers,
+            self.test_edge_cases
+        ]
+        
+        for test in test_methods:
+            print(f"\n📝 Running {test.__doc__}...")
+            await test()
+            await asyncio.sleep(2)  # Brief pause between tests
+            
+        print("\n📊 Test Results Summary:")
+        for result in self.results:
+            print(result)
+            
+        successes = len([r for r in self.results if '✅' in r])
+        total = len(self.results)
+        print(f"\nTotal: {successes}/{total} tests passed")
+        
+        self.cleanup()
+
+async def main():
+    tester = TestDownloads()
+    await tester.run_all_tests()
+
+if __name__ == "__main__":
+    asyncio.run(main())
\ No newline at end of file

From 7f1ae5adcf8552f9520d93eeec446c6ea7cd57e6 Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Thu, 14 Nov 2024 22:51:51 +0800
Subject: [PATCH 020/115] Update changelog

---
 CHANGELOG.md | 7 +++++++
 1 file changed, 7 insertions(+)

diff --git a/CHANGELOG.md b/CHANGELOG.md
index 33d09184..7a00aa2e 100644
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -1,5 +1,12 @@
 # Changelog
 
+# [0.3.74] November 14, 2024
+
+- In this commit, the library is updated to process file downloads. Users can now specify a download folder and trigger the download process via JavaScript or other means, with all files being saved. The list of downloaded files will also be added to the crowd result object.
+- Another thing this commit introduces is the concept of the Relevance Content Filter. This is an improvement over Fit Markdown. This class of strategies aims to extract the main content from a given page - the part that really matters and is useful to be processed. One strategy has been created using the BM25 algorithm, which finds chunks of text from the web page relevant to its title, descriptions, and keywords, or supports a given user query and matches them. The result is then returned to the main engine to be converted to Markdown. Plans include adding approaches using language models as well.
+- The cache database was updated to hold information about response headers and downloaded files.
+
+
 # Changelog - November 13, 2024
 
 ### Added

From 1f269f98344f08bc3390a4f9ec689787cdf5b59b Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Fri, 15 Nov 2024 18:11:11 +0800
Subject: [PATCH 021/115] test(content_filter): add comprehensive tests for
 BM25ContentFilter functionality

---
 tests/async/test_content_filter.py | 175 +++++++++++++++++++++++++++++
 1 file changed, 175 insertions(+)
 create mode 100644 tests/async/test_content_filter.py

diff --git a/tests/async/test_content_filter.py b/tests/async/test_content_filter.py
new file mode 100644
index 00000000..a873c414
--- /dev/null
+++ b/tests/async/test_content_filter.py
@@ -0,0 +1,175 @@
+import os, sys
+import pytest
+from bs4 import BeautifulSoup
+from typing import List
+
+# Add the parent directory to the Python path
+parent_dir = os.path.dirname(os.path.dirname(os.path.abspath(__file__)))
+sys.path.append(parent_dir)
+
+from crawl4ai.content_filter_strategy import BM25ContentFilter
+
+@pytest.fixture
+def basic_html():
+    return """
+    <html>
+        <head>
+            <title>Test Article</title>
+            <meta name="description" content="Test description">
+            <meta name="keywords" content="test, keywords">
+        </head>
+        <body>
+            <h1>Main Heading</h1>
+            <article>
+                <p>This is a long paragraph with more than fifty words. It continues with more text to ensure we meet the minimum word count threshold. We need to make sure this paragraph is substantial enough to be considered for extraction according to our filtering rules. This should be enough words now.</p>
+                <div class="navigation">Skip this nav content</div>
+            </article>
+        </body>
+    </html>
+    """
+
+@pytest.fixture
+def wiki_html():
+    return """
+    <html>
+        <head>
+            <title>Wikipedia Article</title>
+        </head>
+        <body>
+            <h1>Article Title</h1>
+            <h2>Section 1</h2>
+            <p>Short but important section header description.</p>
+            <div class="content">
+                <p>Long paragraph with sufficient words to meet the minimum threshold. This paragraph continues with more text to ensure we have enough content for proper testing. We need to make sure this has enough words to pass our filters and be considered valid content for extraction purposes.</p>
+            </div>
+        </body>
+    </html>
+    """
+
+@pytest.fixture
+def no_meta_html():
+    return """
+    <html>
+        <body>
+            <h1>Simple Page</h1>
+            <p>First paragraph that should be used as fallback for query when no meta tags exist. This text needs to be long enough to serve as a meaningful fallback for our content extraction process.</p>
+        </body>
+    </html>
+    """
+
+class TestBM25ContentFilter:
+    def test_basic_extraction(self, basic_html):
+        """Test basic content extraction functionality"""
+        filter = BM25ContentFilter()
+        contents = filter.filter_content(basic_html)
+        
+        assert contents, "Should extract content"
+        assert len(contents) >= 1, "Should extract at least one content block"
+        assert "long paragraph" in ' '.join(contents).lower()
+        assert "navigation" not in ' '.join(contents).lower()
+
+    def test_user_query_override(self, basic_html):
+        """Test that user query overrides metadata extraction"""
+        user_query = "specific test query"
+        filter = BM25ContentFilter(user_query=user_query)
+        
+        # Access internal state to verify query usage
+        soup = BeautifulSoup(basic_html, 'lxml')
+        extracted_query = filter.extract_page_query(soup.find('head'))
+        
+        assert extracted_query == user_query
+        assert "Test description" not in extracted_query
+
+    def test_header_extraction(self, wiki_html):
+        """Test that headers are properly extracted despite length"""
+        filter = BM25ContentFilter()
+        contents = filter.filter_content(wiki_html)
+        
+        combined_content = ' '.join(contents).lower()
+        assert "section 1" in combined_content, "Should include section header"
+        assert "article title" in combined_content, "Should include main title"
+
+    def test_no_metadata_fallback(self, no_meta_html):
+        """Test fallback behavior when no metadata is present"""
+        filter = BM25ContentFilter()
+        contents = filter.filter_content(no_meta_html)
+        
+        assert contents, "Should extract content even without metadata"
+        assert "First paragraph" in ' '.join(contents), "Should use first paragraph content"
+
+    def test_empty_input(self):
+        """Test handling of empty input"""
+        filter = BM25ContentFilter()
+        assert filter.filter_content("") == []
+        assert filter.filter_content(None) == []
+
+    def test_malformed_html(self):
+        """Test handling of malformed HTML"""
+        malformed_html = "<p>Unclosed paragraph<div>Nested content</p></div>"
+        filter = BM25ContentFilter()
+        contents = filter.filter_content(malformed_html)
+        
+        assert isinstance(contents, list), "Should return list even with malformed HTML"
+        
+    def test_threshold_behavior(self, basic_html):
+        """Test different BM25 threshold values"""
+        strict_filter = BM25ContentFilter(bm25_threshold=2.0)
+        lenient_filter = BM25ContentFilter(bm25_threshold=0.5)
+        
+        strict_contents = strict_filter.filter_content(basic_html)
+        lenient_contents = lenient_filter.filter_content(basic_html)
+        
+        assert len(strict_contents) <= len(lenient_contents), \
+            "Strict threshold should extract fewer elements"
+
+    def test_html_cleaning(self, basic_html):
+        """Test HTML cleaning functionality"""
+        filter = BM25ContentFilter()
+        contents = filter.filter_content(basic_html)
+        
+        cleaned_content = ' '.join(contents)
+        assert 'class=' not in cleaned_content, "Should remove class attributes"
+        assert 'style=' not in cleaned_content, "Should remove style attributes"
+        assert '<script' not in cleaned_content, "Should remove script tags"
+
+    def test_large_content(self):
+        """Test handling of large content blocks"""
+        large_html = f"""
+        <html><body>
+            <article>{'<p>Test content. ' * 1000}</article>
+        </body></html>
+        """
+        filter = BM25ContentFilter()
+        contents = filter.filter_content(large_html)
+        assert contents, "Should handle large content blocks"
+
+    @pytest.mark.parametrize("unwanted_tag", [
+        'script', 'style', 'nav', 'footer', 'header'
+    ])
+    def test_excluded_tags(self, unwanted_tag):
+        """Test that specific tags are properly excluded"""
+        html = f"""
+        <html><body>
+            <{unwanted_tag}>Should not appear</{unwanted_tag}>
+            <p>Should appear</p>
+        </body></html>
+        """
+        filter = BM25ContentFilter()
+        contents = filter.filter_content(html)
+        
+        combined_content = ' '.join(contents).lower()
+        assert "should not appear" not in combined_content
+        
+    def test_performance(self, basic_html):
+        """Test performance with timer"""
+        filter = BM25ContentFilter()
+        
+        import time
+        start = time.perf_counter()
+        filter.filter_content(basic_html)
+        duration = time.perf_counter() - start
+        
+        assert duration < 1.0, f"Processing took too long: {duration:.2f} seconds"
+
+if __name__ == "__main__":
+    pytest.main([__file__])
\ No newline at end of file

From ae7ebc0bd82e6d621f0d13a8a22d537f31dff0f6 Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Fri, 15 Nov 2024 20:16:13 +0800
Subject: [PATCH 022/115] chore: update .gitignore and enhance changelog with
 major feature additions and examples

---
 .gitignore                        |   3 +-
 CHANGELOG.md                      |  30 +++++
 docs/examples/v0.3.74.overview.py | 195 ++++++++++++++++++++++++++++++
 3 files changed, 227 insertions(+), 1 deletion(-)
 create mode 100644 docs/examples/v0.3.74.overview.py

diff --git a/.gitignore b/.gitignore
index aca02959..0acec10f 100644
--- a/.gitignore
+++ b/.gitignore
@@ -209,4 +209,5 @@ git_issues.md
 .tests/
 .issues/
 .docs/
-.issues/
\ No newline at end of file
+.issues/
+.gitboss/
\ No newline at end of file
diff --git a/CHANGELOG.md b/CHANGELOG.md
index 7a00aa2e..e82fa6a2 100644
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -1,5 +1,35 @@
 # Changelog
 
+
+## Version 0.3.74, Major Changes
+
+1. **File Download Processing** (Nov 14, 2024)
+   - Added capability for users to specify download folders
+   - Implemented file download tracking in crawl result object
+   - Created new file: `tests/async/test_async_doanloader.py`
+
+2. **Content Filtering Improvements** (Nov 14, 2024)
+   - Introduced Relevance Content Filter as an improvement over Fit Markdown
+   - Implemented BM25 algorithm for content relevance matching
+   - Added new file: `crawl4ai/content_filter_strategy.py`
+   - Removed deprecated: `crawl4ai/content_cleaning_strategy.py`
+
+3. **Local File and Raw HTML Support** (Nov 13, 2024)
+   - Added support for processing local files
+   - Implemented raw HTML input handling in AsyncWebCrawler
+   - Enhanced `crawl4ai/async_webcrawler.py` with significant performance improvements
+
+4. **Browser Management Enhancements** (Nov 12, 2024)
+   - Implemented new async crawler strategy using Playwright
+   - Introduced ManagedBrowser for better browser session handling
+   - Added support for persistent browser sessions
+   - Updated from playwright_stealth to tf-playwright-stealth
+
+5. **API Server Component**
+   - Added CORS support
+   - Implemented static file serving
+   - Enhanced root redirect functionality
+
 # [0.3.74] November 14, 2024
 
 - In this commit, the library is updated to process file downloads. Users can now specify a download folder and trigger the download process via JavaScript or other means, with all files being saved. The list of downloaded files will also be added to the crowd result object.
diff --git a/docs/examples/v0.3.74.overview.py b/docs/examples/v0.3.74.overview.py
new file mode 100644
index 00000000..579d05dd
--- /dev/null
+++ b/docs/examples/v0.3.74.overview.py
@@ -0,0 +1,195 @@
+import asyncio
+import os
+from pathlib import Path
+import aiohttp
+import json
+from crawl4ai import AsyncWebCrawler
+from crawl4ai.content_filter_strategy import BM25ContentFilter
+
+# 1. File Download Processing Example
+async def download_example():
+    """Example of downloading files from Python.org"""
+    # downloads_path = os.path.join(os.getcwd(), "downloads")
+    downloads_path = os.path.join(Path.home(), ".crawl4ai", "downloads")
+    os.makedirs(downloads_path, exist_ok=True)
+    
+    print(f"Downloads will be saved to: {downloads_path}")
+    
+    async with AsyncWebCrawler(
+        accept_downloads=True,
+        downloads_path=downloads_path,
+        verbose=True
+    ) as crawler:
+        result = await crawler.arun(
+            url="https://www.python.org/downloads/",
+            js_code="""
+            // Find and click the first Windows installer link
+            const downloadLink = document.querySelector('a[href$=".exe"]');
+            if (downloadLink) {
+                console.log('Found download link:', downloadLink.href);
+                downloadLink.click();
+            } else {
+                console.log('No .exe download link found');
+            }
+            """,
+            wait_for=5  # Wait 5 seconds to ensure download starts
+        )
+        
+        if result.downloaded_files:
+            print("\nDownload successful!")
+            print("Downloaded files:")
+            for file_path in result.downloaded_files:
+                print(f"- {file_path}")
+                print(f"  File size: {os.path.getsize(file_path) / (1024*1024):.2f} MB")
+        else:
+            print("\nNo files were downloaded")
+
+# 2. Content Filtering with BM25 Example
+async def content_filtering_example():
+    """Example of using the new BM25 content filtering"""
+    async with AsyncWebCrawler(verbose=True) as crawler:
+        # Create filter with custom query for OpenAI's blog
+        content_filter = BM25ContentFilter(
+            user_query="AI language models research innovation",
+            bm25_threshold=1.0
+        )
+        
+        result = await crawler.arun(
+            url="https://openai.com/blog",
+            extraction_strategy=content_filter
+        )
+        
+        print(f"Filtered content: {result.extracted_content}")
+
+# 3. Local File and Raw HTML Processing Example
+async def local_and_raw_html_example():
+    """Example of processing local files and raw HTML"""
+    # Create a sample HTML file
+    sample_file = "sample.html"
+    with open(sample_file, "w") as f:
+        f.write("""
+        <html><body>
+            <h1>Test Content</h1>
+            <p>This is a test paragraph.</p>
+        </body></html>
+        """)
+    
+    async with AsyncWebCrawler(verbose=True) as crawler:
+        # Process local file
+        local_result = await crawler.arun(
+            url=f"file://{os.path.abspath(sample_file)}"
+        )
+        
+        # Process raw HTML
+        raw_html = """
+        <html><body>
+            <h1>Raw HTML Test</h1>
+            <p>This is a test of raw HTML processing.</p>
+        </body></html>
+        """
+        raw_result = await crawler.arun(
+            url=f"raw:{raw_html}"
+        )
+        
+        # Clean up
+        os.remove(sample_file)
+        
+        print("Local file content:", local_result.markdown)
+        print("\nRaw HTML content:", raw_result.markdown)
+
+# 4. Browser Management Example
+async def browser_management_example():
+    """Example of using enhanced browser management features"""
+    # Use the specified user directory path
+    user_data_dir = os.path.join(Path.home(), ".crawl4ai", "browser_profile")
+    os.makedirs(user_data_dir, exist_ok=True)
+    
+    print(f"Browser profile will be saved to: {user_data_dir}")
+    
+    async with AsyncWebCrawler(
+        use_managed_browser=True,
+        user_data_dir=user_data_dir,
+        headless=False,
+        verbose=True
+    ) as crawler:
+        # Use GitHub as an example - it's a good test for browser management
+        # because it requires proper browser handling
+        result = await crawler.arun(
+            url="https://github.com/trending",
+            session_id="persistent_session_1",
+            js_code="""
+            // Custom JavaScript to execute on GitHub's trending page
+            const repos = document.querySelectorAll('article.Box-row');
+            const data = Array.from(repos).map(repo => ({
+                name: repo.querySelector('h2')?.textContent?.trim(),
+                description: repo.querySelector('p')?.textContent?.trim(),
+                language: repo.querySelector('[itemprop="programmingLanguage"]')?.textContent?.trim()
+            }));
+            console.log('Trending repositories:', JSON.stringify(data, null, 2));
+            """
+        )
+        
+        print("\nBrowser session result:", result.success)
+        if result.success:
+            print("Page title:", result.metadata.get('title', 'No title found'))
+
+# 5. API Usage Example
+async def api_example():
+    """Example of using the new API endpoints"""
+    async with aiohttp.ClientSession() as session:
+        # Submit crawl job
+        crawl_request = {
+            "urls": ["https://news.ycombinator.com"],  # Hacker News as an example
+            "extraction_config": {
+                "type": "json_css",
+                "params": {
+                    "selectors": {
+                        "titles": ".title a",
+                        "scores": ".score",
+                        "comments": ".comment-tree"
+                    }
+                }
+            },
+            "crawler_params": {
+                "headless": True,
+                "use_managed_browser": True
+            },
+            "screenshot": True,
+            "magic": True
+        }
+        
+        async with session.post(
+            "http://localhost:11235/crawl",
+            json=crawl_request
+        ) as response:
+            task_data = await response.json()
+            task_id = task_data["task_id"]
+            
+            # Check task status
+            async with session.get(
+                f"http://localhost:11235/task/{task_id}"
+            ) as status_response:
+                result = await status_response.json()
+                print(f"Task result: {result}")
+
+# Main execution
+async def main():
+    print("Running Crawl4AI feature examples...")
+    
+    print("\n1. Running Download Example:")
+    await download_example()
+    
+    print("\n2. Running Content Filtering Example:")
+    await content_filtering_example()
+    
+    print("\n3. Running Local and Raw HTML Example:")
+    await local_and_raw_html_example()
+    
+    print("\n4. Running Browser Management Example:")
+    await browser_management_example()
+    
+    print("\n5. Running API Example:")
+    await api_example()
+
+if __name__ == "__main__":
+    asyncio.run(main())
\ No newline at end of file

From d0014c67931a27f3969e257da59aa9b70527b4cf Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Sat, 16 Nov 2024 14:54:41 +0800
Subject: [PATCH 023/115]   New async database manager and migration support  
 - Introduced AsyncDatabaseManager for async DB management.   - Added
 migration feature to transition to file-based storage.   - Enhanced web
 crawler with improved caching logic.   - Updated requirements and setup for
 async processing.

---
 crawl4ai/async_database.3.73.py | 285 ++++++++++++++++++++++++++++++++
 crawl4ai/async_database.py      | 185 +++++++++++++++------
 crawl4ai/async_webcrawler.py    | 116 +++++++------
 crawl4ai/config.py              |   4 +-
 crawl4ai/migrations.py          | 152 +++++++++++++++++
 crawl4ai/utils.py               |  27 +++
 requirements.txt                |   1 +
 setup.py                        |  34 +++-
 8 files changed, 685 insertions(+), 119 deletions(-)
 create mode 100644 crawl4ai/async_database.3.73.py
 create mode 100644 crawl4ai/migrations.py

diff --git a/crawl4ai/async_database.3.73.py b/crawl4ai/async_database.3.73.py
new file mode 100644
index 00000000..f86c7f1d
--- /dev/null
+++ b/crawl4ai/async_database.3.73.py
@@ -0,0 +1,285 @@
+import os
+from pathlib import Path
+import aiosqlite
+import asyncio
+from typing import Optional, Tuple, Dict
+from contextlib import asynccontextmanager
+import logging
+import json  # Added for serialization/deserialization
+from .utils import ensure_content_dirs, generate_content_hash
+import xxhash
+import aiofiles
+# Set up logging
+logging.basicConfig(level=logging.INFO)
+logger = logging.getLogger(__name__)
+
+DB_PATH = os.path.join(Path.home(), ".crawl4ai")
+os.makedirs(DB_PATH, exist_ok=True)
+DB_PATH = os.path.join(DB_PATH, "crawl4ai.db")
+
+class AsyncDatabaseManager:
+    def __init__(self, pool_size: int = 10, max_retries: int = 3):
+        self.db_path = DB_PATH
+        self.content_paths = ensure_content_dirs(os.path.dirname(DB_PATH))
+        self.pool_size = pool_size
+        self.max_retries = max_retries
+        self.connection_pool: Dict[int, aiosqlite.Connection] = {}
+        self.pool_lock = asyncio.Lock()
+        self.connection_semaphore = asyncio.Semaphore(pool_size)
+        
+    async def initialize(self):
+        """Initialize the database and connection pool"""
+        await self.ainit_db()
+        
+    async def cleanup(self):
+        """Cleanup connections when shutting down"""
+        async with self.pool_lock:
+            for conn in self.connection_pool.values():
+                await conn.close()
+            self.connection_pool.clear()
+
+    @asynccontextmanager
+    async def get_connection(self):
+        """Connection pool manager"""
+        async with self.connection_semaphore:
+            task_id = id(asyncio.current_task())
+            try:
+                async with self.pool_lock:
+                    if task_id not in self.connection_pool:
+                        conn = await aiosqlite.connect(
+                            self.db_path,
+                            timeout=30.0
+                        )
+                        await conn.execute('PRAGMA journal_mode = WAL')
+                        await conn.execute('PRAGMA busy_timeout = 5000')
+                        self.connection_pool[task_id] = conn
+                    
+                yield self.connection_pool[task_id]
+                
+            except Exception as e:
+                logger.error(f"Connection error: {e}")
+                raise
+            finally:
+                async with self.pool_lock:
+                    if task_id in self.connection_pool:
+                        await self.connection_pool[task_id].close()
+                        del self.connection_pool[task_id]
+
+    async def execute_with_retry(self, operation, *args):
+        """Execute database operations with retry logic"""
+        for attempt in range(self.max_retries):
+            try:
+                async with self.get_connection() as db:
+                    result = await operation(db, *args)
+                    await db.commit()
+                    return result
+            except Exception as e:
+                if attempt == self.max_retries - 1:
+                    logger.error(f"Operation failed after {self.max_retries} attempts: {e}")
+                    raise
+                await asyncio.sleep(1 * (attempt + 1))  # Linear backoff: wait 1s, 2s, ... between attempts
+
+    async def ainit_db(self):
+        """Initialize database schema"""
+        async def _init(db):
+            await db.execute('''
+                CREATE TABLE IF NOT EXISTS crawled_data (
+                    url TEXT PRIMARY KEY,
+                    html TEXT,
+                    cleaned_html TEXT,
+                    markdown TEXT,
+                    extracted_content TEXT,
+                    success BOOLEAN,
+                    media TEXT DEFAULT "{}",
+                    links TEXT DEFAULT "{}",
+                    metadata TEXT DEFAULT "{}",
+                    screenshot TEXT DEFAULT "",
+                    response_headers TEXT DEFAULT "{}",
+                    downloaded_files TEXT DEFAULT "{}"  -- New column added
+                )
+            ''')
+        
+        await self.execute_with_retry(_init)
+        await self.update_db_schema()
+
+    async def update_db_schema(self):
+        """Update database schema if needed"""
+        async def _check_columns(db):
+            cursor = await db.execute("PRAGMA table_info(crawled_data)")
+            columns = await cursor.fetchall()
+            return [column[1] for column in columns]
+
+        column_names = await self.execute_with_retry(_check_columns)
+        
+        # List of new columns to add
+        new_columns = ['media', 'links', 'metadata', 'screenshot', 'response_headers', 'downloaded_files']
+        
+        for column in new_columns:
+            if column not in column_names:
+                await self.aalter_db_add_column(column)
+
+    async def aalter_db_add_column(self, new_column: str):
+        """Add new column to the database"""
+        async def _alter(db):
+            if new_column == 'response_headers':
+                await db.execute(f'ALTER TABLE crawled_data ADD COLUMN {new_column} TEXT DEFAULT "{{}}"')
+            else:
+                await db.execute(f'ALTER TABLE crawled_data ADD COLUMN {new_column} TEXT DEFAULT ""')
+            logger.info(f"Added column '{new_column}' to the database.")
+
+        await self.execute_with_retry(_alter)
+
+
+    async def aget_cached_url(self, url: str) -> Optional[Tuple[str, str, str, str, str, bool, str, str, str, str]]:
+        """Retrieve cached URL data"""
+        async def _get(db):
+            async with db.execute(
+                '''
+                SELECT url, html, cleaned_html, markdown, 
+                    extracted_content, success, media, links,
+                    metadata, screenshot, response_headers,
+                    downloaded_files
+                FROM crawled_data WHERE url = ?
+                ''',
+                (url,)
+            ) as cursor:
+                row = await cursor.fetchone()
+                if row:
+                    # Load content from files using stored hashes
+                    html = await self._load_content(row[1], 'html') if row[1] else ""
+                    cleaned = await self._load_content(row[2], 'cleaned') if row[2] else ""
+                    markdown = await self._load_content(row[3], 'markdown') if row[3] else ""
+                    extracted = await self._load_content(row[4], 'extracted') if row[4] else ""
+                    screenshot = await self._load_content(row[9], 'screenshots') if row[9] else ""
+                    
+                    return (
+                        row[0],  # url
+                        html or "",  # Return empty string if file not found
+                        cleaned or "",
+                        markdown or "", 
+                        extracted or "",
+                        row[5],  # success
+                        json.loads(row[6] or '{}'),  # media
+                        json.loads(row[7] or '{}'),  # links
+                        json.loads(row[8] or '{}'),  # metadata
+                        screenshot or "",
+                        json.loads(row[10] or '{}'),  # response_headers
+                        json.loads(row[11] or '[]')  # downloaded_files
+                    )
+                return None
+
+        try:
+            return await self.execute_with_retry(_get)
+        except Exception as e:
+            logger.error(f"Error retrieving cached URL: {e}")
+            return None
+
+    async def acache_url(self, url: str, html: str, cleaned_html: str, 
+                        markdown: str, extracted_content: str, success: bool,
+                        media: str = "{}", links: str = "{}", 
+                        metadata: str = "{}", screenshot: str = "",
+                        response_headers: str = "{}", downloaded_files: str = "[]"):
+        """Cache URL data with content stored in filesystem"""
+        
+        # Store content files and get hashes
+        html_hash = await self._store_content(html, 'html')
+        cleaned_hash = await self._store_content(cleaned_html, 'cleaned')
+        markdown_hash = await self._store_content(markdown, 'markdown')
+        extracted_hash = await self._store_content(extracted_content, 'extracted')
+        screenshot_hash = await self._store_content(screenshot, 'screenshots')
+
+        async def _cache(db):
+            await db.execute('''
+                INSERT INTO crawled_data (
+                    url, html, cleaned_html, markdown,
+                    extracted_content, success, media, links, metadata,
+                    screenshot, response_headers, downloaded_files
+                )
+                VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?)
+                ON CONFLICT(url) DO UPDATE SET
+                    html = excluded.html,
+                    cleaned_html = excluded.cleaned_html,
+                    markdown = excluded.markdown,
+                    extracted_content = excluded.extracted_content,
+                    success = excluded.success,
+                    media = excluded.media,      
+                    links = excluded.links,    
+                    metadata = excluded.metadata,      
+                    screenshot = excluded.screenshot,
+                    response_headers = excluded.response_headers,
+                    downloaded_files = excluded.downloaded_files
+            ''', (url, html_hash, cleaned_hash, markdown_hash, extracted_hash,
+                success, media, links, metadata, screenshot_hash,
+                response_headers, downloaded_files))
+
+        try:
+            await self.execute_with_retry(_cache)
+        except Exception as e:
+            logger.error(f"Error caching URL: {e}")
+
+
+
+    async def aget_total_count(self) -> int:
+        """Get total number of cached URLs"""
+        async def _count(db):
+            async with db.execute('SELECT COUNT(*) FROM crawled_data') as cursor:
+                result = await cursor.fetchone()
+                return result[0] if result else 0
+
+        try:
+            return await self.execute_with_retry(_count)
+        except Exception as e:
+            logger.error(f"Error getting total count: {e}")
+            return 0
+
+    async def aclear_db(self):
+        """Clear all data from the database"""
+        async def _clear(db):
+            await db.execute('DELETE FROM crawled_data')
+
+        try:
+            await self.execute_with_retry(_clear)
+        except Exception as e:
+            logger.error(f"Error clearing database: {e}")
+
+    async def aflush_db(self):
+        """Drop the entire table"""
+        async def _flush(db):
+            await db.execute('DROP TABLE IF EXISTS crawled_data')
+
+        try:
+            await self.execute_with_retry(_flush)
+        except Exception as e:
+            logger.error(f"Error flushing database: {e}")
+            
+                
+    async def _store_content(self, content: str, content_type: str) -> str:
+        """Store content in filesystem and return hash"""
+        if not content:
+            return ""
+            
+        content_hash = generate_content_hash(content)
+        file_path = os.path.join(self.content_paths[content_type], content_hash)
+        
+        # Only write if file doesn't exist
+        if not os.path.exists(file_path):
+            async with aiofiles.open(file_path, 'w', encoding='utf-8') as f:
+                await f.write(content)
+                
+        return content_hash
+
+    async def _load_content(self, content_hash: str, content_type: str) -> Optional[str]:
+        """Return the text stored under content_hash, or None if the hash is empty or the file cannot be read."""
+        if not content_hash:
+            return None
+        # The file lives at <self.content_paths[content_type]>/<content_hash>.
+        file_path = os.path.join(self.content_paths[content_type], content_hash)
+        try:
+            async with aiofiles.open(file_path, 'r', encoding='utf-8') as f:
+                return await f.read()
+        except Exception:  # not a bare except: task cancellation and KeyboardInterrupt must propagate
+            logger.error(f"Failed to load content: {file_path}")
+            return None
+
+# Create a singleton instance
+async_db_manager = AsyncDatabaseManager()
diff --git a/crawl4ai/async_database.py b/crawl4ai/async_database.py
index c52e3db6..f97d8131 100644
--- a/crawl4ai/async_database.py
+++ b/crawl4ai/async_database.py
@@ -6,7 +6,11 @@ from typing import Optional, Tuple, Dict
 from contextlib import asynccontextmanager
 import logging
 import json  # Added for serialization/deserialization
-
+from .utils import ensure_content_dirs, generate_content_hash
+from .models import CrawlResult
+import xxhash
+import aiofiles
+from .config import NEED_MIGRATION
 # Set up logging
 logging.basicConfig(level=logging.INFO)
 logger = logging.getLogger(__name__)
@@ -18,6 +22,7 @@ DB_PATH = os.path.join(DB_PATH, "crawl4ai.db")
 class AsyncDatabaseManager:
     def __init__(self, pool_size: int = 10, max_retries: int = 3):
         self.db_path = DB_PATH
+        self.content_paths = ensure_content_dirs(os.path.dirname(DB_PATH))
         self.pool_size = pool_size
         self.max_retries = max_retries
         self.connection_pool: Dict[int, aiosqlite.Connection] = {}
@@ -26,8 +31,20 @@ class AsyncDatabaseManager:
         
     async def initialize(self):
         """Initialize the database and connection pool"""
-        await self.ainit_db()
-        
+        try:
+            logger.info("Initializing database...")
+            await self.ainit_db()
+            if NEED_MIGRATION:
+                await self.update_db_schema()
+                from .migrations import run_migration  # Import here to avoid circular imports
+                await run_migration()
+                logger.info("Database initialization and migration completed successfully")
+            else:
+                logger.info("Database initialization completed successfully")
+        except Exception as e:
+            logger.error(f"Database initialization error: {e}")
+            logger.info("Database will be initialized on first use")
+            
     async def cleanup(self):
         """Cleanup connections when shutting down"""
         async with self.pool_lock:
@@ -97,7 +114,7 @@ class AsyncDatabaseManager:
             ''')
         
         await self.execute_with_retry(_init)
-        await self.update_db_schema()
+        
 
     async def update_db_schema(self):
         """Update database schema if needed"""
@@ -126,34 +143,59 @@ class AsyncDatabaseManager:
 
         await self.execute_with_retry(_alter)
 
-    async def aget_cached_url(self, url: str) -> Optional[Tuple[str, str, str, str, str, bool, str, str, str, str]]:
-        """Retrieve cached URL data"""
+    async def aget_cached_url(self, url: str) -> Optional[CrawlResult]:
+        """Retrieve cached URL data as CrawlResult"""
         async def _get(db):
             async with db.execute(
-                '''
-                SELECT url, html, cleaned_html, markdown, extracted_content, success, media, links, metadata, screenshot, response_headers, downloaded_files
-                FROM crawled_data WHERE url = ?
-                ''',
-                (url,)
+                'SELECT * FROM crawled_data WHERE url = ?', (url,)
             ) as cursor:
                 row = await cursor.fetchone()
-                if row:
-                    # Deserialize JSON fields
-                    return (
-                        row[0],  # url
-                        row[1],  # html
-                        row[2],  # cleaned_html
-                        row[3],  # markdown
-                        row[4],  # extracted_content
-                        row[5],  # success
-                        json.loads(row[6] or '{}'),  # media
-                        json.loads(row[7] or '{}'),  # links
-                        json.loads(row[8] or '{}'),  # metadata
-                        row[9],  # screenshot
-                        json.loads(row[10] or '{}'),  # response_headers
-                        json.loads(row[11] or '[]')  # downloaded_files
-                    )
-                return None
+                if not row:
+                    return None
+                    
+                # Get column names
+                columns = [description[0] for description in cursor.description]
+                # Create dict from row data
+                row_dict = dict(zip(columns, row))
+                
+                # Load content from files using stored hashes
+                content_fields = {
+                    'html': row_dict['html'],
+                    'cleaned_html': row_dict['cleaned_html'],
+                    'markdown': row_dict['markdown'],
+                    'extracted_content': row_dict['extracted_content'],
+                    'screenshot': row_dict['screenshot']
+                }
+                
+                for field, hash_value in content_fields.items():
+                    if hash_value:
+                        content = await self._load_content(
+                            hash_value,
+                            'screenshots' if field == 'screenshot' else field.split('_')[0]  # content dir key; acache_url stores screenshots under 'screenshots'
+                        )
+                        row_dict[field] = content or ""
+                    else:
+                        row_dict[field] = ""
+
+                # Parse JSON fields
+                json_fields = ['media', 'links', 'metadata', 'response_headers']
+                for field in json_fields:
+                    try:
+                        row_dict[field] = json.loads(row_dict[field]) if row_dict[field] else {}
+                    except json.JSONDecodeError:
+                        row_dict[field] = {}
+
+                # Parse downloaded_files
+                try:
+                    row_dict['downloaded_files'] = json.loads(row_dict['downloaded_files']) if row_dict['downloaded_files'] else []
+                except json.JSONDecodeError:
+                    row_dict['downloaded_files'] = []
+
+                # Remove any fields not in CrawlResult model
+                valid_fields = CrawlResult.__annotations__.keys()
+                filtered_dict = {k: v for k, v in row_dict.items() if k in valid_fields}
+                
+                return CrawlResult(**filtered_dict)
 
         try:
             return await self.execute_with_retry(_get)
@@ -161,26 +203,27 @@ class AsyncDatabaseManager:
             logger.error(f"Error retrieving cached URL: {e}")
             return None
 
-    async def acache_url(
-        self,
-        url: str,
-        html: str,
-        cleaned_html: str,
-        markdown: str,
-        extracted_content: str,
-        success: bool,
-        media: str = "{}",
-        links: str = "{}",
-        metadata: str = "{}",
-        screenshot: str = "",
-        response_headers: str = "{}",
-        downloaded_files: str = "[]"
-    ):
-        """Cache URL data with retry logic"""
+    async def acache_url(self, result: CrawlResult):
+        """Cache CrawlResult data"""
+        # Store content files and get hashes
+        content_map = {
+            'html': (result.html, 'html'),
+            'cleaned_html': (result.cleaned_html or "", 'cleaned'),
+            'markdown': (result.markdown or "", 'markdown'),
+            'extracted_content': (result.extracted_content or "", 'extracted'),
+            'screenshot': (result.screenshot or "", 'screenshots')
+        }
+        
+        content_hashes = {}
+        for field, (content, content_type) in content_map.items():
+            content_hashes[field] = await self._store_content(content, content_type)
+
         async def _cache(db):
             await db.execute('''
                 INSERT INTO crawled_data (
-                    url, html, cleaned_html, markdown, extracted_content, success, media, links, metadata, screenshot, response_headers, downloaded_files
+                    url, html, cleaned_html, markdown,
+                    extracted_content, success, media, links, metadata,
+                    screenshot, response_headers, downloaded_files
                 )
                 VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?)
                 ON CONFLICT(url) DO UPDATE SET
@@ -189,13 +232,26 @@ class AsyncDatabaseManager:
                     markdown = excluded.markdown,
                     extracted_content = excluded.extracted_content,
                     success = excluded.success,
-                    media = excluded.media,      
-                    links = excluded.links,    
-                    metadata = excluded.metadata,      
+                    media = excluded.media,
+                    links = excluded.links,
+                    metadata = excluded.metadata,
                     screenshot = excluded.screenshot,
-                    response_headers = excluded.response_headers,  -- Update response_headers
+                    response_headers = excluded.response_headers,
                     downloaded_files = excluded.downloaded_files
-            ''', (url, html, cleaned_html, markdown, extracted_content, success, media, links, metadata, screenshot, response_headers, downloaded_files))
+            ''', (
+                result.url,
+                content_hashes['html'],
+                content_hashes['cleaned_html'],
+                content_hashes['markdown'],
+                content_hashes['extracted_content'],
+                result.success,
+                json.dumps(result.media),
+                json.dumps(result.links),
+                json.dumps(result.metadata or {}),
+                content_hashes['screenshot'],
+                json.dumps(result.response_headers or {}),
+                json.dumps(result.downloaded_files or [])
+            ))
 
         try:
             await self.execute_with_retry(_cache)
@@ -234,6 +290,35 @@ class AsyncDatabaseManager:
             await self.execute_with_retry(_flush)
         except Exception as e:
             logger.error(f"Error flushing database: {e}")
+            
+                
+    async def _store_content(self, content: str, content_type: str) -> str:
+        """Write content to a file named by its hash under content_paths[content_type] and return the hash (empty string for falsy content)."""
+        if not content:
+            return ""
+            
+        content_hash = generate_content_hash(content)
+        file_path = os.path.join(self.content_paths[content_type], content_hash)
+        
+        # The file name is the content hash, so an existing file is left untouched rather than rewritten
+        if not os.path.exists(file_path):
+            async with aiofiles.open(file_path, 'w', encoding='utf-8') as f:
+                await f.write(content)
+                
+        return content_hash
+
+    async def _load_content(self, content_hash: str, content_type: str) -> Optional[str]:
+        """Read the file named content_hash under content_paths[content_type]; return its text, or None if the hash is empty or the read fails."""
+        if not content_hash:
+            return None
+            
+        file_path = os.path.join(self.content_paths[content_type], content_hash)
+        try:
+            async with aiofiles.open(file_path, 'r', encoding='utf-8') as f:
+                return await f.read()
+        except Exception as e:  # not a bare except: task cancellation (a BaseException) must propagate
+            logger.error(f"Failed to load content: {file_path}: {e}")
+            return None
 
 # Create a singleton instance
 async_db_manager = AsyncDatabaseManager()
diff --git a/crawl4ai/async_webcrawler.py b/crawl4ai/async_webcrawler.py
index cec1ace0..febc01d3 100644
--- a/crawl4ai/async_webcrawler.py
+++ b/crawl4ai/async_webcrawler.py
@@ -47,17 +47,17 @@ class AsyncWebCrawler:
 
     async def awarmup(self):
         # Print a message for crawl4ai and its version
-        print(f"[LOG] 🚀 Crawl4AI {crawl4ai_version}")
         if self.verbose:
+            print(f"[LOG] 🚀 Crawl4AI {crawl4ai_version}")
             print("[LOG] 🌤️  Warming up the AsyncWebCrawler")
         # await async_db_manager.ainit_db()
-        await async_db_manager.initialize()
-        await self.arun(
-            url="https://google.com/",
-            word_count_threshold=5,
-            bypass_cache=False,
-            verbose=False,
-        )
+        # # await async_db_manager.initialize()
+        # await self.arun(
+        #     url="https://google.com/",
+        #     word_count_threshold=5,
+        #     bypass_cache=False,
+        #     verbose=False,
+        # )
         self.ready = True
         if self.verbose:
             print("[LOG] 🌞 AsyncWebCrawler is ready to crawl")
@@ -73,6 +73,9 @@ class AsyncWebCrawler:
         screenshot: bool = False,
         user_agent: str = None,
         verbose=True,
+        disable_cache: bool = False,
+        no_cache_read: bool = False,
+        no_cache_write: bool = False,
         **kwargs,
     ) -> CrawlResult:
         """
@@ -89,6 +92,11 @@ class AsyncWebCrawler:
             CrawlResult: The result of the crawling and processing.
         """
         try:
+            if disable_cache:
+                bypass_cache = True
+                no_cache_read = True
+                no_cache_write = True
+            
             extraction_strategy = extraction_strategy or NoExtractionStrategy()
             extraction_strategy.verbose = verbose
             if not isinstance(extraction_strategy, ExtractionStrategy):
@@ -108,36 +116,39 @@ class AsyncWebCrawler:
             is_raw_html = url.startswith("raw:")
             _url = url if not is_raw_html else "Raw HTML"
             
-            if is_web_url and not bypass_cache and not self.always_by_pass_cache:
-                cached = await async_db_manager.aget_cached_url(url)
+            start_time = time.perf_counter()
+            cached_result = None
+            if is_web_url and (not bypass_cache or not no_cache_read) and not self.always_by_pass_cache:
+                cached_result = await async_db_manager.aget_cached_url(url)
                         
-            # if not bypass_cache and not self.always_by_pass_cache:
-            #     cached = await async_db_manager.aget_cached_url(url)
-
-            if kwargs.get("warmup", True) and not self.ready:
-                return None
-
-            if cached:
-                html = sanitize_input_encode(cached[1])
-                extracted_content = sanitize_input_encode(cached[4])
+            if cached_result:
+                html = sanitize_input_encode(cached_result.html)
+                extracted_content = sanitize_input_encode(cached_result.extracted_content or "")
                 if screenshot:
-                    screenshot_data = cached[9]
+                    screenshot_data = cached_result.screenshot
                     if not screenshot_data:
-                        cached = None
+                        cached_result = None
+                if verbose:
+                    print(
+                        f"[LOG] 1️⃣  ✅ Page fetched (cache) for {_url}, success: {bool(html)}, time taken: {time.perf_counter() - start_time:.2f} seconds"
+                    )
+
 
             if not cached or not html:
-                t1 = time.time()
+                t1 = time.perf_counter()
+                
                 if user_agent:
                     self.crawler_strategy.update_user_agent(user_agent)
                 async_response: AsyncCrawlResponse = await self.crawler_strategy.crawl(url, screenshot=screenshot, **kwargs)
                 html = sanitize_input_encode(async_response.html)
                 screenshot_data = async_response.screenshot
-                t2 = time.time()
+                t2 = time.perf_counter()
                 if verbose:
                     print(
-                        f"[LOG] 🚀 Crawling done for {_url}, success: {bool(html)}, time taken: {t2 - t1:.2f} seconds"
+                        f"[LOG] 1️⃣  ✅ Page fetched (no-cache) for {_url}, success: {bool(html)}, time taken: {t2 - t1:.2f} seconds"
                     )
 
+            t1 = time.perf_counter()
             crawl_result = await self.aprocess_html(
                 url=url,
                 html=html,
@@ -163,30 +174,19 @@ class AsyncWebCrawler:
                 crawl_result.downloaded_files = async_response.downloaded_files
             else:
                 crawl_result.status_code = 200
-                crawl_result.response_headers = cached[10]
-                # crawl_result.downloaded_files = cached[11]
+                crawl_result.response_headers = cached_result.response_headers if cached_result else {}
 
             crawl_result.success = bool(html)
             crawl_result.session_id = kwargs.get("session_id", None)
 
+            if verbose:
+                print(
+                    f"[LOG] 🔥 🚀 Crawling done for {_url}, success: {crawl_result.success}, time taken: {time.perf_counter() - start_time:.2f} seconds"
+                )
 
-            if not is_raw_html:
-                if not bool(cached) or kwargs.get("bypass_cache", False) or self.always_by_pass_cache:
-                    await async_db_manager.acache_url(
-                        url = url,
-                        html = html,
-                        cleaned_html = crawl_result.cleaned_html,
-                        markdown = crawl_result.markdown,
-                        extracted_content = extracted_content,
-                        success = True,
-                        media = json.dumps(crawl_result.media),
-                        links = json.dumps(crawl_result.links),
-                        metadata = json.dumps(crawl_result.metadata),
-                        screenshot=screenshot,
-                        response_headers=json.dumps(crawl_result.response_headers),
-                        downloaded_files=json.dumps(crawl_result.downloaded_files),
-                        
-                    )
+            if not is_raw_html and not no_cache_write:
+                if not bool(cached_result) or kwargs.get("bypass_cache", False) or self.always_by_pass_cache:
+                    await async_db_manager.acache_url(crawl_result)
 
 
             return crawl_result
@@ -258,11 +258,11 @@ class AsyncWebCrawler:
         verbose: bool,
         **kwargs,
     ) -> CrawlResult:
-        t = time.time()
+        t = time.perf_counter()
         # Extract content from HTML
         try:
             _url = url if not kwargs.get("is_raw_html", False) else "Raw HTML"
-            t1 = time.time()
+            t1 = time.perf_counter()
             scrapping_strategy = WebScrapingStrategy()
             # result = await scrapping_strategy.ascrap(
             result = scrapping_strategy.scrap(
@@ -276,10 +276,6 @@ class AsyncWebCrawler:
                 ),
                 **kwargs,
             )
-            if verbose:
-                print(
-                    f"[LOG] 🚀 Content extracted for {_url}, success: True, time taken: {time.time() - t1:.2f} seconds"
-                )
 
             if result is None:
                 raise ValueError(f"Process HTML, Failed to extract content from the website: {url}")
@@ -295,13 +291,14 @@ class AsyncWebCrawler:
         media = result.get("media", [])
         links = result.get("links", [])
         metadata = result.get("metadata", {})
+        
+        if verbose:
+            print(
+                f"[LOG] 2️⃣  ✅ Scraping done for {_url}, success: True, time taken: {time.perf_counter() - t1:.2f} seconds"
+            )        
 
-        if extracted_content is None and extraction_strategy and chunking_strategy:
-            if verbose:
-                print(
-                    f"[LOG] 🔥 Extracting semantic blocks for {_url}, Strategy: {self.__class__.__name__}"
-                )
-
+        if extracted_content is None and extraction_strategy and chunking_strategy and not isinstance(extraction_strategy, NoExtractionStrategy):
+            t1 = time.perf_counter()
             # Check if extraction strategy is type of JsonCssExtractionStrategy
             if isinstance(extraction_strategy, JsonCssExtractionStrategy) or isinstance(extraction_strategy, JsonCssExtractionStrategy):
                 extraction_strategy.verbose = verbose
@@ -311,11 +308,10 @@ class AsyncWebCrawler:
                 sections = chunking_strategy.chunk(markdown)
                 extracted_content = extraction_strategy.run(url, sections)
                 extracted_content = json.dumps(extracted_content, indent=4, default=str, ensure_ascii=False)
-
-        if verbose:
-            print(
-                f"[LOG] 🚀 Extraction done for {_url}, time taken: {time.time() - t:.2f} seconds."
-            )
+            if verbose:
+                print(
+                    f"[LOG] 3️⃣  ✅ Extraction done for {_url}, time taken: {time.perf_counter() - t1:.2f} seconds"
+                )
 
         screenshot = None if not screenshot else screenshot
         
diff --git a/crawl4ai/config.py b/crawl4ai/config.py
index 16638b6d..5bc284bf 100644
--- a/crawl4ai/config.py
+++ b/crawl4ai/config.py
@@ -52,4 +52,6 @@ SOCIAL_MEDIA_DOMAINS = [
 # If image is in the first half of the total images extracted from the page
 IMAGE_SCORE_THRESHOLD = 2
 
-MAX_METRICS_HISTORY = 1000
\ No newline at end of file
+MAX_METRICS_HISTORY = 1000
+
+NEED_MIGRATION = True
\ No newline at end of file
diff --git a/crawl4ai/migrations.py b/crawl4ai/migrations.py
new file mode 100644
index 00000000..77616086
--- /dev/null
+++ b/crawl4ai/migrations.py
@@ -0,0 +1,152 @@
+import os
+import asyncio
+import logging
+from pathlib import Path
+import aiosqlite
+from typing import Optional
+import xxhash
+import aiofiles
+import shutil
+import time
+from datetime import datetime
+
+logging.basicConfig(level=logging.INFO)
+logger = logging.getLogger(__name__)
+
+class DatabaseMigration:  # Moves the large text columns of crawled_data into hash-named files beside the database
+    def __init__(self, db_path: str):
+        self.db_path = db_path
+        self.content_paths = self._ensure_content_dirs(os.path.dirname(db_path))  # content dirs live next to the db file
+        
+    def _ensure_content_dirs(self, base_path: str) -> dict:  # create the content dirs and map short key -> path
+        dirs = {
+            'html': 'html_content',
+            'cleaned': 'cleaned_html',
+            'markdown': 'markdown_content', 
+            'extracted': 'extracted_content',
+            'screenshots': 'screenshots'
+        }
+        content_paths = {}
+        for key, dirname in dirs.items():
+            path = os.path.join(base_path, dirname)
+            os.makedirs(path, exist_ok=True)
+            content_paths[key] = path
+        return content_paths
+
+    def _generate_content_hash(self, content: str) -> str:  # xxh64 hex digest of the encoded text
+        x = xxhash.xxh64()
+        x.update(content.encode())
+        content_hash = x.hexdigest()
+        return content_hash
+        # Earlier alternative, kept for reference: hashlib.sha256(content.encode()).hexdigest()
+
+    async def _store_content(self, content: str, content_type: str) -> str:  # returns the hash, or "" for empty content
+        if not content:
+            return ""
+        
+        content_hash = self._generate_content_hash(content)
+        file_path = os.path.join(self.content_paths[content_type], content_hash)
+        
+        if not os.path.exists(file_path):  # identical content maps to the same file name, so it is written once
+            async with aiofiles.open(file_path, 'w', encoding='utf-8') as f:
+                await f.write(content)
+                
+        return content_hash
+
+    async def migrate_database(self):
+        """Replace the html, cleaned_html, markdown, extracted_content and screenshot columns of every crawled_data row with content hashes, writing the original text to files."""
+        logger.info("Starting database migration...")
+        
+        try:
+            async with aiosqlite.connect(self.db_path) as db:
+                # Load every row up front (fetchall), so all stored content is held in memory during the migration
+                async with db.execute(
+                    '''SELECT url, html, cleaned_html, markdown, 
+                       extracted_content, screenshot FROM crawled_data'''
+                ) as cursor:
+                    rows = await cursor.fetchall()
+
+                migrated_count = 0
+                for row in rows:
+                    url, html, cleaned_html, markdown, extracted_content, screenshot = row
+                    
+                    # Write each column's text to its content directory; empty/NULL values yield an empty hash
+                    html_hash = await self._store_content(html, 'html')
+                    cleaned_hash = await self._store_content(cleaned_html, 'cleaned')
+                    markdown_hash = await self._store_content(markdown, 'markdown')
+                    extracted_hash = await self._store_content(extracted_content, 'extracted')
+                    screenshot_hash = await self._store_content(screenshot, 'screenshots')
+
+                    # Overwrite the text columns with the hashes; NOTE(review): a second run would hash these hashes again — confirm callers run this once
+                    await db.execute('''
+                        UPDATE crawled_data 
+                        SET html = ?, 
+                            cleaned_html = ?,
+                            markdown = ?,
+                            extracted_content = ?,
+                            screenshot = ?
+                        WHERE url = ?
+                    ''', (html_hash, cleaned_hash, markdown_hash, 
+                         extracted_hash, screenshot_hash, url))
+                    
+                    migrated_count += 1
+                    if migrated_count % 100 == 0:
+                        logger.info(f"Migrated {migrated_count} records...")
+
+                await db.commit()  # single commit after all rows have been updated
+                logger.info(f"Migration completed. {migrated_count} records processed.")
+
+        except Exception as e:
+            logger.error(f"Migration failed: {e}")
+            raise
+
+async def backup_database(db_path: str) -> Optional[str]:
+    """Copy the database to a timestamped sibling file and return the backup path, or None if db_path does not exist."""
+    if not os.path.exists(db_path):
+        logger.info("No existing database found. Skipping backup.")
+        return None
+        
+    # Backup name is the db path plus a local-time timestamp suffix
+    timestamp = datetime.now().strftime('%Y%m%d_%H%M%S')
+    backup_path = f"{db_path}.backup_{timestamp}"
+    
+    try:
+        # Fixed one-second pause before copying; NOTE(review): this does not lock the database — confirm no writer is active
+        await asyncio.sleep(1)
+        
+        # Plain file copy (copy2 also copies file metadata)
+        shutil.copy2(db_path, backup_path)
+        logger.info(f"Database backup created at: {backup_path}")
+        return backup_path
+    except Exception as e:
+        logger.error(f"Backup failed: {e}")
+        raise
+    
+async def run_migration(db_path: Optional[str] = None):
+    """Back up the database at db_path (default ~/.crawl4ai/crawl4ai.db) and migrate it; do nothing if the file does not exist."""
+    if db_path is None:
+        db_path = os.path.join(Path.home(), ".crawl4ai", "crawl4ai.db")
+    
+    if not os.path.exists(db_path):
+        logger.info("No existing database found. Skipping migration.")
+        return
+        
+    # Never migrate without a backup: stop if backup_database returned no path
+    backup_path = await backup_database(db_path)
+    if not backup_path:
+        return
+    
+    migration = DatabaseMigration(db_path)
+    await migration.migrate_database()
+    
+def main():
+    """CLI entry point: parse the optional --db-path argument and run the migration to completion."""
+    import argparse
+    parser = argparse.ArgumentParser(description='Migrate Crawl4AI database to file-based storage')
+    parser.add_argument('--db-path', help='Custom database path')
+    args = parser.parse_args()
+    
+    asyncio.run(run_migration(args.db_path))  # args.db_path is None when the flag is omitted
+
+if __name__ == "__main__":
+    main()
\ No newline at end of file
diff --git a/crawl4ai/utils.py b/crawl4ai/utils.py
index 49483f43..a80cf09a 100644
--- a/crawl4ai/utils.py
+++ b/crawl4ai/utils.py
@@ -14,6 +14,9 @@ from typing import Dict, Any
 from urllib.parse import urljoin
 import requests
 from requests.exceptions import InvalidSchema
+import hashlib
+from typing import Optional, Tuple, Dict, Any
+import xxhash
 
 class InvalidCSSSelectorError(Exception):
     pass
@@ -1109,3 +1112,27 @@ def clean_tokens(tokens: list[str]) -> list[str]:
             and not token.startswith('↑')
             and not token.startswith('▲')
             and not token.startswith('⬆')]
+
+
+def generate_content_hash(content: str) -> str:
+    """Return the xxh64 hex digest of content encoded with str.encode() (a 64-bit hash, so not guaranteed unique)"""
+    return xxhash.xxh64(content.encode()).hexdigest()
+    # Earlier alternative, kept for reference: hashlib.sha256(content.encode()).hexdigest()
+
+def ensure_content_dirs(base_path: str) -> Dict[str, str]:
+    """Create the content directories under base_path if missing and return a mapping of short key to directory path"""
+    dirs = {  # short key -> directory name under base_path
+        'html': 'html_content',
+        'cleaned': 'cleaned_html',
+        'markdown': 'markdown_content', 
+        'extracted': 'extracted_content',
+        'screenshots': 'screenshots'
+    }
+    
+    content_paths = {}
+    for key, dirname in dirs.items():
+        path = os.path.join(base_path, dirname)
+        os.makedirs(path, exist_ok=True)  # no error if the directory already exists
+        content_paths[key] = path
+        
+    return content_paths
\ No newline at end of file
diff --git a/requirements.txt b/requirements.txt
index e83643b3..94f741ca 100644
--- a/requirements.txt
+++ b/requirements.txt
@@ -9,3 +9,4 @@ python-dotenv~=1.0
 requests~=2.26
 beautifulsoup4~=4.12
 tf-playwright-stealth~=1.0
+xxhash~=3.4
diff --git a/setup.py b/setup.py
index 93190291..d3145ac1 100644
--- a/setup.py
+++ b/setup.py
@@ -5,34 +5,37 @@ from pathlib import Path
 import shutil
 import subprocess
 import sys
+import asyncio
 
-# Create the .crawl4ai folder in the user's home directory if it doesn't exist
-# If the folder already exists, remove the cache folder
+# Create the .crawl4ai folder structure
 crawl4ai_folder = Path.home() / ".crawl4ai"
 cache_folder = crawl4ai_folder / "cache"
+content_folders = ['html_content', 'cleaned_html', 'markdown_content', 
+                  'extracted_content', 'screenshots']
 
+# Clean up old cache if exists
 if cache_folder.exists():
     shutil.rmtree(cache_folder)
 
+# Create new folder structure
 crawl4ai_folder.mkdir(exist_ok=True)
 cache_folder.mkdir(exist_ok=True)
+for folder in content_folders:
+    (crawl4ai_folder / folder).mkdir(exist_ok=True)
 
-# Read the requirements from requirements.txt
+# Read requirements and version
 __location__ = os.path.realpath(os.path.join(os.getcwd(), os.path.dirname(__file__)))
 with open(os.path.join(__location__, "requirements.txt")) as f:
     requirements = f.read().splitlines()
     
-# Read version from __init__.py
 with open("crawl4ai/_version.py") as f:
     for line in f:
         if line.startswith("__version__"):
             version = line.split("=")[1].strip().strip('"')
             break
 
-# Define the requirements for different environments
+# Define requirements
 default_requirements = requirements
-# torch_requirements = ["torch", "nltk", "spacy", "scikit-learn"]
-# transformer_requirements = ["transformers", "tokenizers", "onnxruntime"]
 torch_requirements = ["torch", "nltk",  "scikit-learn"]
 transformer_requirements = ["transformers", "tokenizers"]
 cosine_similarity_requirements = ["torch", "transformers", "nltk" ]
@@ -50,10 +53,24 @@ def install_playwright():
         print(f"Unexpected error during Playwright installation: {e}")
         print("Please run 'python -m playwright install' manually after the installation.")
 
+def run_migration():
+    """Initialize the crawl4ai database after install; any failure is printed as a warning instead of aborting the installation."""
+    try:
+        print("Starting database initialization...")
+        from crawl4ai.async_database import async_db_manager  # imported here so a failed import is caught by the handler below
+        asyncio.run(async_db_manager.initialize())
+        print("Database initialization completed successfully.")
+    except ImportError:
+        print("Warning: Database module not found. Will initialize on first use.")
+    except Exception as e:
+        print(f"Warning: Database initialization failed: {e}")
+        print("Database will be initialized on first use")
+
 class PostInstallCommand(install):
     def run(self):
         install.run(self)
         install_playwright()
+        run_migration()
 
 setup(
     name="Crawl4AI",
@@ -66,7 +83,7 @@ setup(
     author_email="unclecode@kidocode.com",
     license="MIT",
     packages=find_packages(),
-    install_requires=default_requirements + ["playwright"],  # Add playwright to default requirements
+    install_requires=default_requirements + ["playwright", "aiofiles"],  # Added aiofiles
     extras_require={
         "torch": torch_requirements,
         "transformer": transformer_requirements,
@@ -77,6 +94,7 @@ setup(
     entry_points={
         'console_scripts': [
             'crawl4ai-download-models=crawl4ai.model_loader:main',
+            'crawl4ai-migrate=crawl4ai.migrations:main',  # Added migration command
         ],
     },
     classifiers=[

From 509844208617673ee4cd066a4386a6c76fdadf91 Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Sat, 16 Nov 2024 15:30:24 +0800
Subject: [PATCH 024/115] refactor: migrate versioning to __version__.py and
 remove deprecated _version.py

---
 crawl4ai/__init__.py                     | 2 +-
 crawl4ai/{_version.py => __version__.py} | 0
 crawl4ai/async_webcrawler.py             | 2 +-
 crawl4ai/content_filter_strategy.py      | 5 -----
 middlewares.py                           | 0
 requirements-dev.txt                     | 5 -----
 requirements.txt                         | 2 ++
 setup.py                                 | 2 +-
 8 files changed, 5 insertions(+), 13 deletions(-)
 rename crawl4ai/{_version.py => __version__.py} (100%)
 delete mode 100644 middlewares.py
 delete mode 100644 requirements-dev.txt

diff --git a/crawl4ai/__init__.py b/crawl4ai/__init__.py
index 1bcc491c..e55aaf73 100644
--- a/crawl4ai/__init__.py
+++ b/crawl4ai/__init__.py
@@ -2,7 +2,7 @@
 
 from .async_webcrawler import AsyncWebCrawler
 from .models import CrawlResult
-from ._version import __version__
+from .__version__ import __version__
 # __version__ = "0.3.73"
 
 __all__ = [
diff --git a/crawl4ai/_version.py b/crawl4ai/__version__.py
similarity index 100%
rename from crawl4ai/_version.py
rename to crawl4ai/__version__.py
diff --git a/crawl4ai/async_webcrawler.py b/crawl4ai/async_webcrawler.py
index febc01d3..03e7a393 100644
--- a/crawl4ai/async_webcrawler.py
+++ b/crawl4ai/async_webcrawler.py
@@ -16,7 +16,7 @@ from .utils import (
     InvalidCSSSelectorError,
     format_html
 )
-from ._version import __version__ as crawl4ai_version
+from .__version__ import __version__ as crawl4ai_version
 
 class AsyncWebCrawler:
     def __init__(
diff --git a/crawl4ai/content_filter_strategy.py b/crawl4ai/content_filter_strategy.py
index 850ebf11..88375da9 100644
--- a/crawl4ai/content_filter_strategy.py
+++ b/crawl4ai/content_filter_strategy.py
@@ -1,12 +1,7 @@
-import os
 import re
-import time
 from bs4 import BeautifulSoup, Tag
 from typing import List, Tuple, Dict
 from rank_bm25 import BM25Okapi
-import nltk
-from time import perf_counter
-from html5lib import parse, treebuilders
 from time import perf_counter
 from collections import deque
 from bs4 import BeautifulSoup, NavigableString, Tag
diff --git a/middlewares.py b/middlewares.py
deleted file mode 100644
index e69de29b..00000000
diff --git a/requirements-dev.txt b/requirements-dev.txt
deleted file mode 100644
index 7bc121a4..00000000
--- a/requirements-dev.txt
+++ /dev/null
@@ -1,5 +0,0 @@
--r requirements.txt
-pytest
-pytest-asyncio
-selenium
-setuptools
diff --git a/requirements.txt b/requirements.txt
index 94f741ca..74e8b3d6 100644
--- a/requirements.txt
+++ b/requirements.txt
@@ -10,3 +10,5 @@ requests~=2.26
 beautifulsoup4~=4.12
 tf-playwright-stealth~=1.0
 xxhash~=3.4
+rank-bm25~=0.2
+aiofiles~=24.0
\ No newline at end of file
diff --git a/setup.py b/setup.py
index d3145ac1..d8ad2cd3 100644
--- a/setup.py
+++ b/setup.py
@@ -28,7 +28,7 @@ __location__ = os.path.realpath(os.path.join(os.getcwd(), os.path.dirname(__file
 with open(os.path.join(__location__, "requirements.txt")) as f:
     requirements = f.read().splitlines()
     
-with open("crawl4ai/_version.py") as f:
+with open("crawl4ai/__version__.py") as f:
     for line in f:
         if line.startswith("__version__"):
             version = line.split("=")[1].strip().strip('"')

From 90df6921b7be573d95795907fcdebd28002dfd9b Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Sat, 16 Nov 2024 15:34:30 +0800
Subject: [PATCH 025/115] feat(crawl_sync): add synchronous crawl endpoint and
 corresponding test

---
 docs/examples/docker_example.py | 21 +++++++++++++++++++++
 main.py                         | 24 ++++++++++++++++++++++++
 2 files changed, 45 insertions(+)

diff --git a/docs/examples/docker_example.py b/docs/examples/docker_example.py
index c22acd55..502f1e52 100644
--- a/docs/examples/docker_example.py
+++ b/docs/examples/docker_example.py
@@ -33,6 +33,13 @@ class Crawl4AiTester:
                 return status
                 
             time.sleep(2)
+            
+    def submit_sync(self, request_data: Dict[str, Any]) -> Dict[str, Any]:  # POST request_data to /crawl_sync and return the decoded JSON body
+        response = requests.post(f"{self.base_url}/crawl_sync", json=request_data, timeout=70)  # longer than the server's ~60 s wait so its 408 can arrive
+        if response.status_code == 408:
+            raise TimeoutError("Task did not complete within server timeout")
+        response.raise_for_status()  # any other 4xx/5xx becomes requests.HTTPError
+        return response.json()
 
 def test_docker_deployment(version="basic"):
     tester = Crawl4AiTester()
@@ -54,6 +61,7 @@ def test_docker_deployment(version="basic"):
     
     # Test cases based on version
     test_basic_crawl(tester)
+    test_basic_crawl_sync(tester)
     
     # if version in ["full", "transformer"]:
     #     test_cosine_extraction(tester)
@@ -78,6 +86,19 @@ def test_basic_crawl(tester: Crawl4AiTester):
     assert result["result"]["success"]
     assert len(result["result"]["markdown"]) > 0
 
+def test_basic_crawl_sync(tester: Crawl4AiTester):  # same checks as the basic crawl, but through the blocking submit_sync call
+    print("\n=== Testing Basic Crawl (Sync) ===")
+    request = {
+        "urls": "https://www.nbcnews.com/business",
+        "priority": 10
+    }
+    
+    result = tester.submit_sync(request)
+    print(f"Basic crawl result length: {len(result['result']['markdown'])}")
+    assert result['status'] == 'completed'
+    assert result['result']['success']
+    assert len(result['result']['markdown']) > 0  # the crawl must have produced non-empty markdown
+    
 def test_js_execution(tester: Crawl4AiTester):
     print("\n=== Testing JS Execution ===")
     request = {
diff --git a/main.py b/main.py
index a5da029c..660c3366 100644
--- a/main.py
+++ b/main.py
@@ -375,6 +375,30 @@ async def get_task_status(task_id: str):
 
     return response
 
+@app.post("/crawl_sync")
+async def crawl_sync(request: CrawlRequest) -> Dict[str, Any]:  # submit the request as a task, then poll until it completes, fails, or the wait expires
+    task_id = await crawler_service.submit_task(request)
+    
+    # Poll once per second, at most 60 times (roughly 60 s in total), for the task to finish
+    for _ in range(60):
+        task_info = crawler_service.task_manager.get_task(task_id)
+        if not task_info:
+            raise HTTPException(status_code=404, detail="Task not found")
+            
+        if task_info.status == TaskStatus.COMPLETED:
+            # A list result is returned under "results", a single result under "result"
+            if isinstance(task_info.result, list):
+                return {"status": task_info.status, "results": [result.dict() for result in task_info.result]}
+            return {"status": task_info.status, "result": task_info.result.dict()}
+            
+        if task_info.status == TaskStatus.FAILED:
+            raise HTTPException(status_code=500, detail=task_info.error)
+            
+        await asyncio.sleep(1)
+    
+    # Loop exhausted without COMPLETED or FAILED: report a request timeout (HTTP 408)
+    raise HTTPException(status_code=408, detail="Task timed out")
+
 @app.get("/health")
 async def health_check():
     available_slots = await crawler_service.resource_monitor.get_available_slots()

From e62c80729559457c937b9740cb3bab960e6103d3 Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Sat, 16 Nov 2024 16:38:13 +0800
Subject: [PATCH 026/115] feat(deploy): add Railway deployment configuration
 and setup instructions

---
 deploy/railway/README.md    | 19 +++++++++++++++++++
 deploy/railway/button.json  | 33 +++++++++++++++++++++++++++++++++
 deploy/railway/railway.toml | 18 ++++++++++++++++++
 3 files changed, 70 insertions(+)
 create mode 100644 deploy/railway/README.md
 create mode 100644 deploy/railway/button.json
 create mode 100644 deploy/railway/railway.toml

diff --git a/deploy/railway/README.md b/deploy/railway/README.md
new file mode 100644
index 00000000..155e7642
--- /dev/null
+++ b/deploy/railway/README.md
@@ -0,0 +1,19 @@
+# Railway Deployment
+
+## Quick Deploy
+[![Deploy on Railway](https://railway.app/button.svg)](https://railway.app/template/crawl4ai)
+
+## Manual Setup
+1. Fork this repository
+2. Create a new Railway project 
+3. Configure environment variables:
+   - `INSTALL_TYPE`: basic or all
+   - `ENABLE_GPU`: true/false
+4. Deploy!
+
+## Configuration
+See `railway.toml` for:
+- Memory limits
+- Health checks
+- Restart policies
+- Scaling options
\ No newline at end of file
diff --git a/deploy/railway/button.json b/deploy/railway/button.json
new file mode 100644
index 00000000..1fc52167
--- /dev/null
+++ b/deploy/railway/button.json
@@ -0,0 +1,33 @@
+{
+    "name": "Crawl4AI",
+    "description": "LLM Friendly Web Crawler & Scraper",
+    "render": {
+      "dockerfile": {
+        "path": "Dockerfile"
+      }
+    },
+    "env": [
+      {
+        "key": "INSTALL_TYPE",
+        "description": "Installation type (basic/all)",
+        "default": "basic",
+        "required": true
+      },
+      {
+        "key": "ENABLE_GPU",
+        "description": "Enable GPU support",
+        "default": "false",
+        "required": false
+      }
+    ],
+    "services": [
+      {
+        "name": "web",
+        "dockerfile": "./Dockerfile",
+        "healthcheck": {
+          "path": "/health",
+          "port": 11235
+        }
+      }
+    ]
+  }
\ No newline at end of file
diff --git a/deploy/railway/railway.toml b/deploy/railway/railway.toml
new file mode 100644
index 00000000..f24d8fab
--- /dev/null
+++ b/deploy/railway/railway.toml
@@ -0,0 +1,18 @@
+# railway.toml
+[build]
+builder = "DOCKERFILE"
+dockerfilePath = "Dockerfile"
+
+[deploy]
+startCommand = "uvicorn main:app --host 0.0.0.0 --port $PORT"
+healthcheckPath = "/health"
+restartPolicyType = "ON_FAILURE"
+restartPolicyMaxRetries = 3
+
+[deploy.memory]
+soft = 2048 # 2GB min for Playwright
+hard = 4096 # 4GB max
+
+[deploy.scaling]
+min = 1
+max = 1

From f77f06a3bd4c1ef6e45b69a64959b55164bf4512 Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Sat, 16 Nov 2024 16:43:31 +0800
Subject: [PATCH 027/115] feat(deploy): add deployment configuration and
 templates for crawl4ai

---
 .do/app.yaml             | 19 +++++++++++++++++++
 .do/deploy.template.yaml | 22 ++++++++++++++++++++++
 2 files changed, 41 insertions(+)
 create mode 100644 .do/app.yaml
 create mode 100644 .do/deploy.template.yaml

diff --git a/.do/app.yaml b/.do/app.yaml
new file mode 100644
index 00000000..7e11aab7
--- /dev/null
+++ b/.do/app.yaml
@@ -0,0 +1,19 @@
+alerts:
+- rule: DEPLOYMENT_FAILED
+- rule: DOMAIN_FAILED
+name: crawl4ai
+region: nyc
+services:
+- dockerfile_path: Dockerfile
+  github:
+    branch: main
+    deploy_on_push: true
+    repo: unclecode/crawl4ai 
+  health_check:
+    http_path: /health
+  http_port: 11235
+  instance_count: 1
+  instance_size_slug: basic-xs
+  name: web
+  routes:
+  - path: /
\ No newline at end of file
diff --git a/.do/deploy.template.yaml b/.do/deploy.template.yaml
new file mode 100644
index 00000000..ab76795d
--- /dev/null
+++ b/.do/deploy.template.yaml
@@ -0,0 +1,22 @@
+spec:
+  name: crawl4ai
+  services:
+    - name: crawl4ai
+      git:
+        branch: main
+        repo_clone_url: https://github.com/unclecode/crawl4ai.git
+      dockerfile_path: Dockerfile
+      http_port: 11235
+      instance_count: 1
+      instance_size_slug: basic-xs
+      health_check:
+        http_path: /health
+      envs:
+        - key: INSTALL_TYPE
+          value: "basic"
+        - key: PYTHON_VERSION  
+          value: "3.10"
+        - key: ENABLE_GPU
+          value: "false"
+      routes:
+        - path: /
\ No newline at end of file

From fca1319b7d1c3e3da5b07898d3890bced4a7719e Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Sat, 16 Nov 2024 17:10:30 +0800
Subject: [PATCH 028/115] feat(docker): add MkDocs installation and build step
 for documentation

---
 Dockerfile | 14 ++++++++++----
 1 file changed, 10 insertions(+), 4 deletions(-)

diff --git a/Dockerfile b/Dockerfile
index 125fb9b8..54ac641c 100644
--- a/Dockerfile
+++ b/Dockerfile
@@ -107,13 +107,19 @@ RUN if [ "$INSTALL_TYPE" = "all" ] ; then \
         pip install -e "." ; \
     fi
 
+    # Install MkDocs and required plugins
+RUN pip install --no-cache-dir \
+    mkdocs \
+    mkdocs-material \
+    mkdocs-terminal \
+    pymdown-extensions
+
+# Build MkDocs documentation
+RUN mkdocs build
+
 # Install Playwright and browsers
 RUN playwright install
 
-# Health check
-HEALTHCHECK --interval=30s --timeout=30s --start-period=5s --retries=3 \
-    CMD curl -f http://localhost:8000/health || exit 1
-
 # Expose port
 EXPOSE 8000 11235 9222 8080
 

From 6f2fe5954f6ce9f7f17fb15802054cd6c5802123 Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Sat, 16 Nov 2024 17:12:41 +0800
Subject: [PATCH 029/115] feat(deploy): update instance size to professional-xs
 and add memory utilization alert

---
 .do/deploy.template.yaml | 7 +++++--
 1 file changed, 5 insertions(+), 2 deletions(-)

diff --git a/.do/deploy.template.yaml b/.do/deploy.template.yaml
index ab76795d..c7db5e7e 100644
--- a/.do/deploy.template.yaml
+++ b/.do/deploy.template.yaml
@@ -8,7 +8,7 @@ spec:
       dockerfile_path: Dockerfile
       http_port: 11235
       instance_count: 1
-      instance_size_slug: basic-xs
+      instance_size_slug: professional-xs # 4GB RAM, 2 vCPUs
       health_check:
         http_path: /health
       envs:
@@ -19,4 +19,7 @@ spec:
         - key: ENABLE_GPU
           value: "false"
       routes:
-        - path: /
\ No newline at end of file
+        - path: /
+  alerts:
+    - rule: MEM_UTILIZATION
+      value: 90  # Alert at 90% memory usage
\ No newline at end of file

From 6b569cceb5332ea481190a86086fbf934c7c89e7 Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Sat, 16 Nov 2024 17:21:45 +0800
Subject: [PATCH 030/115] feat(deploy): update branch to 0.3.74 and change
 instance size to basic-xs

---
 .do/app.yaml             | 2 +-
 .do/deploy.template.yaml | 4 ++--
 2 files changed, 3 insertions(+), 3 deletions(-)

diff --git a/.do/app.yaml b/.do/app.yaml
index 7e11aab7..bff8ff97 100644
--- a/.do/app.yaml
+++ b/.do/app.yaml
@@ -6,7 +6,7 @@ region: nyc
 services:
 - dockerfile_path: Dockerfile
   github:
-    branch: main
+    branch: 0.3.74
     deploy_on_push: true
     repo: unclecode/crawl4ai 
   health_check:
diff --git a/.do/deploy.template.yaml b/.do/deploy.template.yaml
index c7db5e7e..73ee7c5c 100644
--- a/.do/deploy.template.yaml
+++ b/.do/deploy.template.yaml
@@ -3,12 +3,12 @@ spec:
   services:
     - name: crawl4ai
       git:
-        branch: main
+        branch: 0.3.74
         repo_clone_url: https://github.com/unclecode/crawl4ai.git
       dockerfile_path: Dockerfile
       http_port: 11235
       instance_count: 1
-      instance_size_slug: professional-xs # 4GB RAM, 2 vCPUs
+      instance_size_slug: basic-xs # 4GB RAM, 2 vCPUs
       health_check:
         http_path: /health
       envs:

From 67edc2d641a672e9fa5a95fa4341407b9e574851 Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Sat, 16 Nov 2024 17:23:32 +0800
Subject: [PATCH 031/115] feat(deploy): update instance size to professional-xs
 and add memory utilization alert parameters

---
 .do/deploy.template.yaml | 9 +++++++--
 1 file changed, 7 insertions(+), 2 deletions(-)

diff --git a/.do/deploy.template.yaml b/.do/deploy.template.yaml
index 73ee7c5c..49d0012b 100644
--- a/.do/deploy.template.yaml
+++ b/.do/deploy.template.yaml
@@ -8,7 +8,7 @@ spec:
       dockerfile_path: Dockerfile
       http_port: 11235
       instance_count: 1
-      instance_size_slug: basic-xs # 4GB RAM, 2 vCPUs
+      instance_size_slug: professional-xs
       health_check:
         http_path: /health
       envs:
@@ -22,4 +22,9 @@ spec:
         - path: /
   alerts:
     - rule: MEM_UTILIZATION
-      value: 90  # Alert at 90% memory usage
\ No newline at end of file
+      value: 90
+      window: 5m          # Added window parameter
+      operator: GREATER_THAN
+      disabled: false
+    - rule: DEPLOYMENT_FAILED
+    - rule: DOMAIN_FAILED
\ No newline at end of file

From 5d0b13294cfec45c55b07a5593726335c79b6cde Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Sat, 16 Nov 2024 17:25:07 +0800
Subject: [PATCH 032/115] feat(deploy): change instance size to professional-xs
 and update memory utilization alert window to 300 seconds

---
 .do/app.yaml             | 2 +-
 .do/deploy.template.yaml | 2 +-
 2 files changed, 2 insertions(+), 2 deletions(-)

diff --git a/.do/app.yaml b/.do/app.yaml
index bff8ff97..00d7b781 100644
--- a/.do/app.yaml
+++ b/.do/app.yaml
@@ -13,7 +13,7 @@ services:
     http_path: /health
   http_port: 11235
   instance_count: 1
-  instance_size_slug: basic-xs
+  instance_size_slug: professional-xs
   name: web
   routes:
   - path: /
\ No newline at end of file
diff --git a/.do/deploy.template.yaml b/.do/deploy.template.yaml
index 49d0012b..dcd9b2d7 100644
--- a/.do/deploy.template.yaml
+++ b/.do/deploy.template.yaml
@@ -23,7 +23,7 @@ spec:
   alerts:
     - rule: MEM_UTILIZATION
       value: 90
-      window: 5m          # Added window parameter
+      window: 300        # Changed from "5m" to 300 (5 minutes in seconds)
       operator: GREATER_THAN
       disabled: false
     - rule: DEPLOYMENT_FAILED

From 79feab89c4236e7de180ec4cd2257df3f5f3e386 Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Sat, 16 Nov 2024 17:28:42 +0800
Subject: [PATCH 033/115] refactor(deploy): remove memory utilization alert
 configuration from deployment template

---
 .do/deploy.template.yaml | 10 +---------
 1 file changed, 1 insertion(+), 9 deletions(-)

diff --git a/.do/deploy.template.yaml b/.do/deploy.template.yaml
index dcd9b2d7..9a06a366 100644
--- a/.do/deploy.template.yaml
+++ b/.do/deploy.template.yaml
@@ -19,12 +19,4 @@ spec:
         - key: ENABLE_GPU
           value: "false"
       routes:
-        - path: /
-  alerts:
-    - rule: MEM_UTILIZATION
-      value: 90
-      window: 300        # Changed from "5m" to 300 (5 minutes in seconds)
-      operator: GREATER_THAN
-      disabled: false
-    - rule: DEPLOYMENT_FAILED
-    - rule: DOMAIN_FAILED
\ No newline at end of file
+        - path: /
\ No newline at end of file

From 1961adb530baf74dfec16a0f2da795946855459a Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Sat, 16 Nov 2024 17:35:27 +0800
Subject: [PATCH 034/115] refactor(docker): remove shared memory size
 configuration to streamline Dockerfile

---
 Dockerfile | 5 -----
 1 file changed, 5 deletions(-)

diff --git a/Dockerfile b/Dockerfile
index 54ac641c..ba29faf1 100644
--- a/Dockerfile
+++ b/Dockerfile
@@ -123,10 +123,5 @@ RUN playwright install
 # Expose port
 EXPOSE 8000 11235 9222 8080
 
-# Optional: Increase shared memory size to prevent browser crashes
-# when loading heavy pages
-RUN mkdir /dev/shm
-VOLUME /dev/shm
-
 # Start the FastAPI server
 CMD ["uvicorn", "main:app", "--host", "0.0.0.0", "--port", "11235"]
\ No newline at end of file

From 6360d0545ac2812687a1a9a31de95fa64f600ed4 Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Sat, 16 Nov 2024 18:08:56 +0800
Subject: [PATCH 035/115] feat(api): add API token authentication and update
 Dockerfile description

---
 Dockerfile                      |  3 ++-
 docker-compose.yml              | 33 +++++++++++++++++++++++++++++++++
 docs/examples/docker_example.py | 15 ++++++++++-----
 main.py                         | 23 ++++++++++++++++++++---
 4 files changed, 65 insertions(+), 9 deletions(-)
 create mode 100644 docker-compose.yml

diff --git a/Dockerfile b/Dockerfile
index ba29faf1..76b4e1cf 100644
--- a/Dockerfile
+++ b/Dockerfile
@@ -12,7 +12,7 @@ ARG ENABLE_GPU=false
 
 # Platform-specific labels
 LABEL maintainer="unclecode"
-LABEL description="Crawl4AI - Advanced Web Crawler with AI capabilities"
+LABEL description="🔥🕷️ Crawl4AI: Open-source LLM Friendly Web Crawler & scraper"
 LABEL version="1.0"
 
 # Environment setup
@@ -79,6 +79,7 @@ COPY . .
 RUN pip install --no-cache-dir -r requirements.txt
 
 # Install required library for FastAPI
+RUN pip install .
 RUN pip install fastapi uvicorn psutil
 
 # Install ML dependencies first for better layer caching
diff --git a/docker-compose.yml b/docker-compose.yml
new file mode 100644
index 00000000..ef0dc9e4
--- /dev/null
+++ b/docker-compose.yml
@@ -0,0 +1,33 @@
+version: '3.8'
+
+services:
+  crawl4ai:
+    build:
+      context: .
+      dockerfile: Dockerfile
+      args:
+        PYTHON_VERSION: "3.10"  # must be quoted: a bare 3.10 is a YAML float and would reach the build as 3.1
+        INSTALL_TYPE: all
+        ENABLE_GPU: "false"  # quoted so the build arg is the literal string "false", not a YAML boolean
+    ports:
+      - "11235:11235"  # FastAPI server
+      - "8000:8000"    # Alternative port
+      - "9222:9222"    # Browser debugging
+      - "8080:8080"    # Additional port
+    environment:
+      - CRAWL4AI_API_TOKEN=${CRAWL4AI_API_TOKEN:-}  # Optional API token
+    volumes:
+      - /dev/shm:/dev/shm  # Shared memory for browser operations
+    deploy:
+      resources:
+        limits:
+          memory: 4G
+        reservations:
+          memory: 1G
+    restart: unless-stopped
+    healthcheck:
+      test: ["CMD", "curl", "-f", "http://localhost:11235/health"]
+      interval: 30s
+      timeout: 10s
+      retries: 3
+      start_period: 40s
\ No newline at end of file
diff --git a/docs/examples/docker_example.py b/docs/examples/docker_example.py
index 502f1e52..6701f6ac 100644
--- a/docs/examples/docker_example.py
+++ b/docs/examples/docker_example.py
@@ -7,12 +7,14 @@ import os
 from typing import Dict, Any
 
 class Crawl4AiTester:
-    def __init__(self, base_url: str = "http://localhost:11235"):
+    def __init__(self, base_url: str = "http://localhost:11235", api_token: str = None):
         self.base_url = base_url
+        self.api_token = api_token or os.getenv('CRAWL4AI_API_TOKEN')  # Check environment variable as fallback
+        self.headers = {'Authorization': f'Bearer {self.api_token}'} if self.api_token else {}
         
     def submit_and_wait(self, request_data: Dict[str, Any], timeout: int = 300) -> Dict[str, Any]:
         # Submit crawl job
-        response = requests.post(f"{self.base_url}/crawl", json=request_data)
+        response = requests.post(f"{self.base_url}/crawl", json=request_data, headers=self.headers)
         task_id = response.json()["task_id"]
         print(f"Task ID: {task_id}")
         
@@ -22,7 +24,7 @@ class Crawl4AiTester:
             if time.time() - start_time > timeout:
                 raise TimeoutError(f"Task {task_id} did not complete within {timeout} seconds")
                 
-            result = requests.get(f"{self.base_url}/task/{task_id}")
+            result = requests.get(f"{self.base_url}/task/{task_id}", headers=self.headers)
             status = result.json()
             
             if status["status"] == "failed":
@@ -35,14 +37,17 @@ class Crawl4AiTester:
             time.sleep(2)
             
     def submit_sync(self, request_data: Dict[str, Any]) -> Dict[str, Any]:
-        response = requests.post(f"{self.base_url}/crawl_sync", json=request_data, timeout=60)
+        response = requests.post(f"{self.base_url}/crawl_sync", json=request_data, headers=self.headers, timeout=60)
         if response.status_code == 408:
             raise TimeoutError("Task did not complete within server timeout")
         response.raise_for_status()
         return response.json()
 
 def test_docker_deployment(version="basic"):
-    tester = Crawl4AiTester()
+    tester = Crawl4AiTester(
+        # base_url="http://localhost:11235" 
+        base_url="https://crawl4ai-sby74.ondigitalocean.app" 
+    )
     print(f"Testing Crawl4AI Docker {version} version")
     
     # Health check with timeout and retry
diff --git a/main.py b/main.py
index 660c3366..92b1793b 100644
--- a/main.py
+++ b/main.py
@@ -10,6 +10,8 @@ from fastapi.exceptions import RequestValidationError
 from starlette.middleware.base import BaseHTTPMiddleware
 from starlette.responses import FileResponse
 from fastapi.responses import RedirectResponse
+from fastapi.security import HTTPBearer, HTTPAuthorizationCredentials
+from fastapi import Depends, Security
 
 from pydantic import BaseModel, HttpUrl, Field
 from typing import Optional, List, Dict, Any, Union
@@ -322,6 +324,21 @@ app.add_middleware(
 # Mount the pages directory as a static directory
 app.mount("/pages", StaticFiles(directory=__location__ + "/pages"), name="pages")
 
+# API token security
+security = HTTPBearer()
+CRAWL4AI_API_TOKEN = os.getenv("CRAWL4AI_API_TOKEN")
+
+async def verify_token(credentials: HTTPAuthorizationCredentials = Security(security)):
+    if not CRAWL4AI_API_TOKEN:
+        return credentials  # No token verification if CRAWL4AI_API_TOKEN is not set
+    if credentials.credentials != CRAWL4AI_API_TOKEN:
+        raise HTTPException(status_code=401, detail="Invalid token")
+    return credentials
+
+# Helper function to conditionally apply security
+def secure_endpoint():
+    return Depends(verify_token) if CRAWL4AI_API_TOKEN else None
+
 # Check if site directory exists
 if os.path.exists(__location__ + "/site"):
     # Mount the site directory as a static directory
@@ -348,12 +365,12 @@ def read_root():
     return {"message": "Crawl4AI API service is running"}
 
 
-@app.post("/crawl")
+@app.post("/crawl", dependencies=[Depends(verify_token)])
 async def crawl(request: CrawlRequest) -> Dict[str, str]:
     task_id = await crawler_service.submit_task(request)
     return {"task_id": task_id}
 
-@app.get("/task/{task_id}")
+@app.get("/task/{task_id}", dependencies=[Depends(verify_token)])
 async def get_task_status(task_id: str):
     task_info = crawler_service.task_manager.get_task(task_id)
     if not task_info:
@@ -375,7 +392,7 @@ async def get_task_status(task_id: str):
 
     return response
 
-@app.post("/crawl_sync")
+@app.post("/crawl_sync", dependencies=[Depends(verify_token)])
 async def crawl_sync(request: CrawlRequest) -> Dict[str, Any]:
     task_id = await crawler_service.submit_task(request)
     

From 9139ef3125b8a0bc96e2b26f3a06b09ecc60c020 Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Sat, 16 Nov 2024 18:19:44 +0800
Subject: [PATCH 036/115] feat(docker): update Dockerfile for improved
 installation process and enhance deployment documentation with Docker Compose
 setup and API token security

---
 Dockerfile                            |   9 +-
 docs/md_v2/basic/docker-deploymeny.md | 123 +++++++++++++++++---------
 2 files changed, 86 insertions(+), 46 deletions(-)

diff --git a/Dockerfile b/Dockerfile
index 76b4e1cf..aac2280a 100644
--- a/Dockerfile
+++ b/Dockerfile
@@ -79,7 +79,6 @@ COPY . .
 RUN pip install --no-cache-dir -r requirements.txt
 
 # Install required library for FastAPI
-RUN pip install .
 RUN pip install fastapi uvicorn psutil
 
 # Install ML dependencies first for better layer caching
@@ -97,15 +96,15 @@ RUN if [ "$INSTALL_TYPE" = "all" ] ; then \
 
 # Install the package
 RUN if [ "$INSTALL_TYPE" = "all" ] ; then \
-        pip install -e ".[all]" && \
+        pip install ".[all]" && \
         python -m crawl4ai.model_loader ; \
     elif [ "$INSTALL_TYPE" = "torch" ] ; then \
-        pip install -e ".[torch]" ; \
+        pip install ".[torch]" ; \
     elif [ "$INSTALL_TYPE" = "transformer" ] ; then \
-        pip install -e ".[transformer]" && \
+        pip install ".[transformer]" && \
         python -m crawl4ai.model_loader ; \
     else \
-        pip install -e "." ; \
+        pip install "." ; \
     fi
 
     # Install MkDocs and required plugins
diff --git a/docs/md_v2/basic/docker-deploymeny.md b/docs/md_v2/basic/docker-deploymeny.md
index cc11d0d9..a500ee21 100644
--- a/docs/md_v2/basic/docker-deploymeny.md
+++ b/docs/md_v2/basic/docker-deploymeny.md
@@ -1,71 +1,112 @@
-# Docker Deployment
+# Docker Deployment 🐳
 
 Crawl4AI provides official Docker images for easy deployment and scalability. This guide covers installation, configuration, and usage of Crawl4AI in Docker environments.
 
-## Quick Start 🚀
+## Docker Compose Setup 🐳
 
-Pull and run the basic version:
+### Basic Usage
 
-```bash
-docker pull unclecode/crawl4ai:basic
-docker run -p 11235:11235 unclecode/crawl4ai:basic
+Create a `docker-compose.yml`:
+```yaml
+version: '3.8'
+
+services:
+  crawl4ai:
+    image: unclecode/crawl4ai:all
+    ports:
+      - "11235:11235"
+    volumes:
+      - /dev/shm:/dev/shm
+    deploy:
+      resources:
+        limits:
+          memory: 4G
+    restart: unless-stopped
 ```
 
-Test the deployment:
+Run with:
+```bash
+docker-compose up -d
+```
+
+### Secure Mode with API Token
+
+To enable API authentication, simply set the `CRAWL4AI_API_TOKEN`:
+```bash
+CRAWL4AI_API_TOKEN=your-secret-token docker-compose up -d
+```
+
+### Using Environment Variables
+
+Create a `.env` file for your API tokens:
+```env
+# Crawl4AI API Security (optional)
+CRAWL4AI_API_TOKEN=your-secret-token
+
+# LLM Provider API Keys
+OPENAI_API_KEY=sk-...
+ANTHROPIC_API_KEY=sk-ant-...
+GOOGLE_API_KEY=...
+GEMINI_API_KEY=...
+OLLAMA_API_KEY=...
+
+# Additional Configuration
+MAX_CONCURRENT_TASKS=5
+```
+
+Docker Compose will automatically load variables from the `.env` file. No additional configuration needed!
+
+### Testing with API Token
+
 ```python
 import requests
 
-# Test health endpoint
-health = requests.get("http://localhost:11235/health")
-print("Health check:", health.json())
+# Initialize headers with token if using secure mode
+headers = {}
+if api_token := os.getenv('CRAWL4AI_API_TOKEN'):
+    headers['Authorization'] = f'Bearer {api_token}'
 
-# Test basic crawl
+# Test crawl with authentication
 response = requests.post(
     "http://localhost:11235/crawl",
+    headers=headers,
     json={
         "urls": "https://www.nbcnews.com/business",
         "priority": 10
     }
 )
 task_id = response.json()["task_id"]
-print("Task ID:", task_id)
 ```
 
-## Available Images 🏷️
+### Security Best Practices 🔒
 
-- `unclecode/crawl4ai:basic` - Basic web crawling capabilities
-- `unclecode/crawl4ai:all` - Full installation with all features
-- `unclecode/crawl4ai:gpu` - GPU-enabled version for ML features
-
-## Configuration Options 🔧
-
-### Environment Variables
-
-```bash
-docker run -p 11235:11235 \
-    -e MAX_CONCURRENT_TASKS=5 \
-    -e OPENAI_API_KEY=your_key \
-    unclecode/crawl4ai:all
+- Add `.env` to your `.gitignore`
+- Use different API tokens for development and production
+- Rotate API tokens periodically
+- Use secure methods to pass tokens in production environments
 ```
 
-### Volume Mounting
+This addition to your documentation:
+1. Shows how to use Docker Compose
+2. Explains both secure and non-secure modes
+3. Demonstrates environment variable configuration
+4. Provides example code for authenticated requests
+5. Includes security best practices
+
+
+
+
+
+
+
+
+
+
+
+
 
-Mount a directory for persistent data:
-```bash
-docker run -p 11235:11235 \
-    -v $(pwd)/data:/app/data \
-    unclecode/crawl4ai:all
-```
 
-### Resource Limits
 
-Control container resources:
-```bash
-docker run -p 11235:11235 \
-    --memory=4g \
-    --cpus=2 \
-    unclecode/crawl4ai:all
-```
 
 ## Usage Examples 📝
 

From 4b45b28f256ad62272d5ea75ae898de7882618ba Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Sat, 16 Nov 2024 18:44:47 +0800
Subject: [PATCH 037/115] feat(docs): enhance deployment documentation with
 one-click setup, API security details, and Docker Compose examples

---
 README.md                             |  15 ++
 docs/examples/docker_example.py       |  13 +-
 docs/md_v2/basic/docker-deploymeny.md | 230 ++++++++++++++++++++------
 main.py                               |   3 +
 4 files changed, 207 insertions(+), 54 deletions(-)

diff --git a/README.md b/README.md
index d250f936..a2806304 100644
--- a/README.md
+++ b/README.md
@@ -113,6 +113,21 @@ cd crawl4ai
 pip install -e .
 ```
 
+## One-Click Deployment 🚀
+
+Deploy your own instance of Crawl4AI with one click:
+
+[![DigitalOcean Referral Badge](https://web-platforms.sfo2.cdn.digitaloceanspaces.com/WWW/Badge%203.svg)](https://www.digitalocean.com/?repo=https://github.com/unclecode/crawl4ai/tree/0.3.74&refcode=a0780f1bdb3d&utm_campaign=Referral_Invite&utm_medium=Referral_Program&utm_source=badge)
+
+
+> 💡 **Recommended specs**: 4GB RAM minimum. Select "professional-xs" or higher when deploying for stable operation.
+
+The deploy will:
+- Set up a Docker container with Crawl4AI
+- Configure Playwright and all dependencies
+- Start the FastAPI server on port 11235
+- Set up health checks and auto-deployment
+
 ### Using Docker 🐳
 
 Crawl4AI is available as Docker images for easy deployment. You can either pull directly from Docker Hub (recommended) or build from the repository.
diff --git a/docs/examples/docker_example.py b/docs/examples/docker_example.py
index 6701f6ac..b43e8ee6 100644
--- a/docs/examples/docker_example.py
+++ b/docs/examples/docker_example.py
@@ -15,6 +15,8 @@ class Crawl4AiTester:
     def submit_and_wait(self, request_data: Dict[str, Any], timeout: int = 300) -> Dict[str, Any]:
         # Submit crawl job
         response = requests.post(f"{self.base_url}/crawl", json=request_data, headers=self.headers)
+        if response.status_code == 403:
+            raise Exception("API token is invalid or missing")
         task_id = response.json()["task_id"]
         print(f"Task ID: {task_id}")
         
@@ -45,8 +47,9 @@ class Crawl4AiTester:
 
 def test_docker_deployment(version="basic"):
     tester = Crawl4AiTester(
-        # base_url="http://localhost:11235" 
-        base_url="https://crawl4ai-sby74.ondigitalocean.app" 
+        base_url="http://localhost:11235" ,
+        # base_url="https://crawl4ai-sby74.ondigitalocean.app",
+        api_token="test"
     )
     print(f"Testing Crawl4AI Docker {version} version")
     
@@ -83,7 +86,8 @@ def test_basic_crawl(tester: Crawl4AiTester):
     print("\n=== Testing Basic Crawl ===")
     request = {
         "urls": "https://www.nbcnews.com/business",
-        "priority": 10
+        "priority": 10, 
+        "session_id": "test"
     }
     
     result = tester.submit_and_wait(request)
@@ -95,7 +99,8 @@ def test_basic_crawl_sync(tester: Crawl4AiTester):
     print("\n=== Testing Basic Crawl (Sync) ===")
     request = {
         "urls": "https://www.nbcnews.com/business",
-        "priority": 10
+        "priority": 10,
+        "session_id": "test"
     }
     
     result = tester.submit_sync(request)
diff --git a/docs/md_v2/basic/docker-deploymeny.md b/docs/md_v2/basic/docker-deploymeny.md
index a500ee21..30555708 100644
--- a/docs/md_v2/basic/docker-deploymeny.md
+++ b/docs/md_v2/basic/docker-deploymeny.md
@@ -1,12 +1,115 @@
-# Docker Deployment 🐳
+# Docker Deployment
 
 Crawl4AI provides official Docker images for easy deployment and scalability. This guide covers installation, configuration, and usage of Crawl4AI in Docker environments.
 
-## Docker Compose Setup 🐳
+## Quick Start 🚀
 
-### Basic Usage
+Pull and run the basic version:
+
+```bash
+# Basic run without security
+docker pull unclecode/crawl4ai:basic
+docker run -p 11235:11235 unclecode/crawl4ai:basic
+
+# Run with API security enabled
+docker run -p 11235:11235 -e CRAWL4AI_API_TOKEN=your_secret_token unclecode/crawl4ai:basic
+```
+
+## API Security 🔒
+
+### Understanding CRAWL4AI_API_TOKEN
+
+The `CRAWL4AI_API_TOKEN` provides optional security for your Crawl4AI instance:
+
+- If `CRAWL4AI_API_TOKEN` is set: the crawl endpoints (`/crawl`, `/crawl_sync`, `/task/{task_id}`) require an `Authorization: Bearer <token>` header; `/health` stays open
+- If `CRAWL4AI_API_TOKEN` is not set: The API is publicly accessible
+
+```bash
+# Secured Instance
+docker run -p 11235:11235 -e CRAWL4AI_API_TOKEN=your_secret_token unclecode/crawl4ai:all
+
+# Unsecured Instance
+docker run -p 11235:11235 unclecode/crawl4ai:all
+```
+
+### Making API Calls
+
+For secured instances, include the token in all requests:
+
+```python
+import requests
+
+# Setup headers if token is being used
+api_token = "your_secret_token"  # Same token set in CRAWL4AI_API_TOKEN
+headers = {"Authorization": f"Bearer {api_token}"} if api_token else {}
+
+# Making authenticated requests
+response = requests.post(
+    "http://localhost:11235/crawl",
+    headers=headers,
+    json={
+        "urls": "https://example.com",
+        "priority": 10
+    }
+)
+
+# Checking task status
+task_id = response.json()["task_id"]
+status = requests.get(
+    f"http://localhost:11235/task/{task_id}",
+    headers=headers
+)
+```
+
+### Using with Docker Compose
+
+In your `docker-compose.yml`:
+```yaml
+services:
+  crawl4ai:
+    image: unclecode/crawl4ai:all
+    environment:
+      - CRAWL4AI_API_TOKEN=${CRAWL4AI_API_TOKEN:-}  # Optional
+    # ... other configuration
+```
+
+Then either:
+1. Set in `.env` file:
+```env
+CRAWL4AI_API_TOKEN=your_secret_token
+```
+
+2. Or set via command line:
+```bash
+CRAWL4AI_API_TOKEN=your_secret_token docker-compose up
+```
+
+> **Security Note**: If you enable the API token, make sure to keep it secure and never commit it to version control. The token is required for the crawl endpoints (`/crawl`, `/crawl_sync`, `/task/{task_id}`); the health check endpoint (`/health`) does not require it.
+
+## Configuration Options 🔧
+
+### Environment Variables
+
+You can configure the service using environment variables:
+
+```bash
+# Basic configuration
+docker run -p 11235:11235 \
+    -e MAX_CONCURRENT_TASKS=5 \
+    unclecode/crawl4ai:all
+
+# With security and LLM support
+docker run -p 11235:11235 \
+    -e CRAWL4AI_API_TOKEN=your_secret_token \
+    -e OPENAI_API_KEY=sk-... \
+    -e ANTHROPIC_API_KEY=sk-ant-... \
+    unclecode/crawl4ai:all
+```
+
+### Using Docker Compose (Recommended) 🐳
 
 Create a `docker-compose.yml`:
+
 ```yaml
 version: '3.8'
 
@@ -15,83 +118,110 @@ services:
     image: unclecode/crawl4ai:all
     ports:
       - "11235:11235"
+    environment:
+      - CRAWL4AI_API_TOKEN=${CRAWL4AI_API_TOKEN:-}  # Optional API security
+      - MAX_CONCURRENT_TASKS=5
+      # LLM Provider Keys
+      - OPENAI_API_KEY=${OPENAI_API_KEY:-}
+      - ANTHROPIC_API_KEY=${ANTHROPIC_API_KEY:-}
     volumes:
       - /dev/shm:/dev/shm
     deploy:
       resources:
         limits:
           memory: 4G
-    restart: unless-stopped
+        reservations:
+          memory: 1G
 ```
 
-Run with:
+You can run it in two ways:
+
+1. Using environment variables directly:
 ```bash
-docker-compose up -d
+CRAWL4AI_API_TOKEN=secret123 OPENAI_API_KEY=sk-... docker-compose up
 ```
 
-### Secure Mode with API Token
-
-To enable API authentication, simply set the `CRAWL4AI_API_TOKEN`:
-```bash
-CRAWL4AI_API_TOKEN=your-secret-token docker-compose up -d
-```
-
-### Using Environment Variables
-
-Create a `.env` file for your API tokens:
+2. Using a `.env` file (recommended):
+Create a `.env` file in the same directory:
 ```env
-# Crawl4AI API Security (optional)
-CRAWL4AI_API_TOKEN=your-secret-token
+# API Security (optional)
+CRAWL4AI_API_TOKEN=your_secret_token
 
-# LLM Provider API Keys
+# LLM Provider Keys
 OPENAI_API_KEY=sk-...
 ANTHROPIC_API_KEY=sk-ant-...
-GOOGLE_API_KEY=...
-GEMINI_API_KEY=...
-OLLAMA_API_KEY=...
 
-# Additional Configuration
+# Other Configuration
 MAX_CONCURRENT_TASKS=5
 ```
 
-Docker Compose will automatically load variables from the `.env` file. No additional configuration needed!
+Then simply run:
+```bash
+docker-compose up
+```
 
-### Testing with API Token
+### Testing the Deployment 🧪
 
 ```python
 import requests
 
-# Initialize headers with token if using secure mode
-headers = {}
-if api_token := os.getenv('CRAWL4AI_API_TOKEN'):
-    headers['Authorization'] = f'Bearer {api_token}'
+# For unsecured instances
+def test_unsecured():
+    # Health check
+    health = requests.get("http://localhost:11235/health")
+    print("Health check:", health.json())
 
-# Test crawl with authentication
-response = requests.post(
-    "http://localhost:11235/crawl",
-    headers=headers,
-    json={
-        "urls": "https://www.nbcnews.com/business",
-        "priority": 10
+    # Basic crawl
+    response = requests.post(
+        "http://localhost:11235/crawl",
+        json={
+            "urls": "https://www.nbcnews.com/business",
+            "priority": 10
+        }
+    )
+    task_id = response.json()["task_id"]
+    print("Task ID:", task_id)
+
+# For secured instances
+def test_secured(api_token):
+    headers = {"Authorization": f"Bearer {api_token}"}
+    
+    # Basic crawl with authentication
+    response = requests.post(
+        "http://localhost:11235/crawl",
+        headers=headers,
+        json={
+            "urls": "https://www.nbcnews.com/business",
+            "priority": 10
+        }
+    )
+    task_id = response.json()["task_id"]
+    print("Task ID:", task_id)
+```
+
+### LLM Extraction Example 🤖
+
+When you've configured your LLM provider keys (via environment variables or `.env`), you can use LLM extraction:
+
+```python
+request = {
+    "urls": "https://example.com",
+    "extraction_config": {
+        "type": "llm",
+        "params": {
+            "provider": "openai/gpt-4",
+            "instruction": "Extract main topics from the page"
+        }
     }
-)
-task_id = response.json()["task_id"]
+}
+
+# Make the request (add headers if using API security)
+response = requests.post("http://localhost:11235/crawl", json=request)
 ```
 
-### Security Best Practices 🔒
+> **Note**: Remember to add `.env` to your `.gitignore` to keep your API keys secure!
 
-- Add `.env` to your `.gitignore`
-- Use different API tokens for development and production
-- Rotate API tokens periodically
-- Use secure methods to pass tokens in production environments
-```
 
-This addition to your documentation:
-1. Shows how to use Docker Compose
-2. Explains both secure and non-secure modes
-3. Demonstrates environment variable configuration
-4. Provides example code for authenticated requests
-5. Includes security best practices
 
 
 
diff --git a/main.py b/main.py
index 92b1793b..41788d61 100644
--- a/main.py
+++ b/main.py
@@ -65,6 +65,7 @@ class CrawlRequest(BaseModel):
     screenshot: bool = False
     magic: bool = False
     extra: Optional[Dict[str, Any]] = {}
+    session_id: Optional[str] = None
 
 @dataclass
 class TaskInfo:
@@ -284,6 +285,7 @@ class CrawlerService:
                             css_selector=request.css_selector,
                             screenshot=request.screenshot,
                             magic=request.magic,
+                            session_id=request.session_id,
                             **request.extra,
                         )
                     else:
@@ -295,6 +297,7 @@ class CrawlerService:
                             css_selector=request.css_selector,
                             screenshot=request.screenshot,
                             magic=request.magic,
+                            session_id=request.session_id,
                             **request.extra,
                         )
 

From 3a66aa8a60ae7213bb8437003b58a631df208ffb Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Sun, 17 Nov 2024 15:30:56 +0800
Subject: [PATCH 038/115] feat(cache): introduce CacheMode and CacheContext for
 enhanced caching behavior chore(requirements): add colorama dependency
 refactor(config): add SHOW_DEPRECATION_WARNINGS flag and clean up code
 fix(docs): update example scripts for clarity and consistency

---
 crawl4ai/__init__.py               |   3 +-
 crawl4ai/async_crawler_strategy.py |   8 +-
 crawl4ai/async_webcrawler.3.73.py  | 344 +++++++++++++++++++++++++++++
 crawl4ai/async_webcrawler.py       | 285 +++++++++++++++++-------
 crawl4ai/cache_context.py          |  79 +++++++
 crawl4ai/config.py                 |   3 +-
 docs/examples/docker_example.py    |   5 +-
 docs/examples/quickstart_async.py  |  12 +-
 requirements.txt                   |   3 +-
 tests/docker_example.py            | 332 ++++++++++++++++++++++++++++
 10 files changed, 979 insertions(+), 95 deletions(-)
 create mode 100644 crawl4ai/async_webcrawler.3.73.py
 create mode 100644 crawl4ai/cache_context.py
 create mode 100644 tests/docker_example.py

diff --git a/crawl4ai/__init__.py b/crawl4ai/__init__.py
index e55aaf73..ad9475b4 100644
--- a/crawl4ai/__init__.py
+++ b/crawl4ai/__init__.py
@@ -1,6 +1,6 @@
 # __init__.py
 
-from .async_webcrawler import AsyncWebCrawler
+from .async_webcrawler import AsyncWebCrawler, CacheMode
 from .models import CrawlResult
 from .__version__ import __version__
 # __version__ = "0.3.73"
@@ -8,6 +8,7 @@ from .__version__ import __version__
 __all__ = [
     "AsyncWebCrawler",
     "CrawlResult",
+    "CacheMode",
 ]
 
 def is_sync_version_installed():
diff --git a/crawl4ai/async_crawler_strategy.py b/crawl4ai/async_crawler_strategy.py
index 83933a35..a67591af 100644
--- a/crawl4ai/async_crawler_strategy.py
+++ b/crawl4ai/async_crawler_strategy.py
@@ -669,8 +669,8 @@ class AsyncPlaywrightCrawlerStrategy(AsyncCrawlerStrategy):
             if self.accept_downloads:
                 page.on("download", lambda download: asyncio.create_task(self._handle_download(download)))
 
-            if self.verbose:
-                print(f"[LOG] 🕸️ Crawling {url} using AsyncPlaywrightCrawlerStrategy...")
+            # if self.verbose:
+            #     print(f"[LOG] 🕸️ Crawling {url} using AsyncPlaywrightCrawlerStrategy...")
 
             if self.use_cached_html:
                 cache_file_path = os.path.join(
@@ -873,8 +873,8 @@ class AsyncPlaywrightCrawlerStrategy(AsyncCrawlerStrategy):
                     await asyncio.sleep(screenshot_wait_for)
                 screenshot_data = await self.take_screenshot(page)          
 
-            if self.verbose:
-                print(f"[LOG] ✅ Crawled {url} successfully!")
+            # if self.verbose:
+            #     print(f"[LOG] ✅ Crawled {url} successfully!")
            
             if self.use_cached_html:
                 cache_file_path = os.path.join(
diff --git a/crawl4ai/async_webcrawler.3.73.py b/crawl4ai/async_webcrawler.3.73.py
new file mode 100644
index 00000000..03e7a393
--- /dev/null
+++ b/crawl4ai/async_webcrawler.3.73.py
@@ -0,0 +1,344 @@
+import os
+import time
+from pathlib import Path
+from typing import Optional
+import json
+import asyncio
+from .models import CrawlResult
+from .async_database import async_db_manager
+from .chunking_strategy import *
+from .extraction_strategy import *
+from .async_crawler_strategy import AsyncCrawlerStrategy, AsyncPlaywrightCrawlerStrategy, AsyncCrawlResponse
+from .content_scrapping_strategy import WebScrapingStrategy
+from .config import MIN_WORD_THRESHOLD, IMAGE_DESCRIPTION_MIN_WORD_THRESHOLD
+from .utils import (
+    sanitize_input_encode,
+    InvalidCSSSelectorError,
+    format_html
+)
+from .__version__ import __version__ as crawl4ai_version
+
+class AsyncWebCrawler:
+    """Crawl web URLs, local files or raw HTML asynchronously, with a URL cache."""
+    def __init__(
+        self,
+        crawler_strategy: Optional[AsyncCrawlerStrategy] = None,
+        always_by_pass_cache: bool = False,
+        base_directory: str = str(Path.home()),
+        **kwargs,
+    ):
+        """Set up the crawl strategy and create ``<base_directory>/.crawl4ai``.
+
+        Args:
+            crawler_strategy: Page fetcher; defaults to an
+                AsyncPlaywrightCrawlerStrategy built from ``kwargs``.
+            always_by_pass_cache: If True, ``arun`` never reads the cache.
+            base_directory: Directory in which ``.crawl4ai`` is created.
+            **kwargs: Strategy options; ``verbose`` also toggles start-up logs.
+        """
+        self.crawler_strategy = crawler_strategy or AsyncPlaywrightCrawlerStrategy(**kwargs)
+        self.always_by_pass_cache = always_by_pass_cache
+        self.crawl4ai_folder = os.path.join(base_directory, ".crawl4ai")
+        os.makedirs(os.path.join(self.crawl4ai_folder, "cache"), exist_ok=True)
+        self.ready = False
+        self.verbose = kwargs.get("verbose", False)
+
+    async def __aenter__(self):
+        """Enter the strategy's context and mark the crawler ready."""
+        await self.crawler_strategy.__aenter__()
+        await self.awarmup()
+        return self
+
+    async def __aexit__(self, exc_type, exc_val, exc_tb):
+        """Leave the strategy's context, passing the exception details through."""
+        await self.crawler_strategy.__aexit__(exc_type, exc_val, exc_tb)
+
+    async def awarmup(self):
+        """Mark the crawler ready, logging the version banner when verbose."""
+        if self.verbose:
+            print(f"[LOG] 🚀 Crawl4AI {crawl4ai_version}")
+            print("[LOG] 🌤️  Warming up the AsyncWebCrawler")
+        self.ready = True
+        if self.verbose:
+            print("[LOG] 🌞 AsyncWebCrawler is ready to crawl")
+
+    async def arun(
+        self,
+        url: str,
+        word_count_threshold=MIN_WORD_THRESHOLD,
+        extraction_strategy: ExtractionStrategy = None,
+        chunking_strategy: ChunkingStrategy = RegexChunking(),
+        bypass_cache: bool = False,
+        css_selector: str = None,
+        screenshot: bool = False,
+        user_agent: str = None,
+        verbose=True,
+        disable_cache: bool = False,
+        no_cache_read: bool = False,
+        no_cache_write: bool = False,
+        **kwargs,
+    ) -> CrawlResult:
+        """
+        Runs the crawler for a single source: URL (web, local file, or raw HTML).
+
+        Args:
+            url (str): The URL to crawl. Supported prefixes:
+                - 'http://' or 'https://': Web URL to crawl.
+                - 'file://': Local file path to process.
+                - 'raw:': Raw HTML content to process.
+            bypass_cache, no_cache_read: Either one skips the cache lookup.
+            no_cache_write: Do not store the result in the cache.
+            disable_cache: Shorthand for setting all three cache flags.
+            **kwargs: Forwarded to the crawler strategy and to the scraper.
+
+        Returns:
+            CrawlResult: The processed page; on error a result with
+                ``success=False`` and ``error_message`` set is returned.
+        """
+        # Classify the source outside the try so the error handler can use `_url`.
+        is_web_url = url.startswith(('http://', 'https://'))
+        is_local_file = url.startswith("file://")
+        is_raw_html = url.startswith("raw:")
+        _url = url if not is_raw_html else "Raw HTML"
+        try:
+            if disable_cache:
+                bypass_cache = no_cache_read = no_cache_write = True
+
+            extraction_strategy = extraction_strategy or NoExtractionStrategy()
+            if not isinstance(extraction_strategy, ExtractionStrategy):
+                raise ValueError("Unsupported extraction strategy")
+            if not isinstance(chunking_strategy, ChunkingStrategy):
+                raise ValueError("Unsupported chunking strategy")
+            extraction_strategy.verbose = verbose
+            word_count_threshold = max(word_count_threshold, MIN_WORD_THRESHOLD)
+
+            async_response: AsyncCrawlResponse = None
+            screenshot_data = None
+            extracted_content = None
+            start_time = time.perf_counter()
+
+            # Only web URLs are looked up, and any "skip read" flag wins.
+            cached_result = None
+            if is_web_url and not (bypass_cache or no_cache_read or self.always_by_pass_cache):
+                cached_result = await async_db_manager.aget_cached_url(url)
+            if cached_result and screenshot and not cached_result.screenshot:
+                cached_result = None  # entry lacks the requested screenshot
+
+            html = sanitize_input_encode(cached_result.html) if cached_result else None
+            if html:
+                extracted_content = sanitize_input_encode(cached_result.extracted_content or "")
+                if screenshot:
+                    screenshot_data = cached_result.screenshot
+                if verbose:
+                    print(f"[LOG] 1️⃣  ✅ Page fetched (cache) for {_url}, success: {bool(html)}, time taken: {time.perf_counter() - start_time:.2f} seconds")
+            else:
+                # Nothing usable in the cache: fetch live and ignore the entry.
+                cached_result = None
+                t1 = time.perf_counter()
+                if user_agent:
+                    self.crawler_strategy.update_user_agent(user_agent)
+                async_response = await self.crawler_strategy.crawl(url, screenshot=screenshot, **kwargs)
+                html = sanitize_input_encode(async_response.html)
+                screenshot_data = async_response.screenshot
+                t2 = time.perf_counter()
+                if verbose:
+                    print(f"[LOG] 1️⃣  ✅ Page fetched (no-cache) for {_url}, success: {bool(html)}, time taken: {t2 - t1:.2f} seconds")
+
+            crawl_result = await self.aprocess_html(
+                url=url,
+                html=html,
+                extracted_content=extracted_content,
+                word_count_threshold=word_count_threshold,
+                extraction_strategy=extraction_strategy,
+                chunking_strategy=chunking_strategy,
+                css_selector=css_selector,
+                screenshot=screenshot_data,
+                verbose=verbose,
+                is_cached=bool(cached_result),
+                async_response=async_response,
+                bypass_cache=bypass_cache,
+                is_web_url=is_web_url,
+                is_local_file=is_local_file,
+                is_raw_html=is_raw_html,
+                **kwargs,
+            )
+
+            if async_response:
+                crawl_result.status_code = async_response.status_code
+                crawl_result.response_headers = async_response.response_headers
+                crawl_result.downloaded_files = async_response.downloaded_files
+            else:
+                crawl_result.status_code = 200
+                crawl_result.response_headers = cached_result.response_headers if cached_result else {}
+
+            crawl_result.success = bool(html)
+            crawl_result.session_id = kwargs.get("session_id", None)
+
+            if verbose:
+                print(f"[LOG] 🔥 🚀 Crawling done for {_url}, success: {crawl_result.success}, time taken: {time.perf_counter() - start_time:.2f} seconds")
+
+            # Raw HTML is never cached, and a served cache hit is not rewritten.
+            if not (is_raw_html or no_cache_write or cached_result):
+                await async_db_manager.acache_url(crawl_result)
+            return crawl_result
+
+        except Exception as e:
+            error = getattr(e, "msg", str(e))
+            message = f"[ERROR] 🚫 arun(): Failed to crawl {_url}, error: {error}"
+            print(message)
+            return CrawlResult(url=url, html="", markdown=message, success=False, error_message=error)
+
+    async def arun_many(
+        self,
+        urls: List[str],
+        word_count_threshold=MIN_WORD_THRESHOLD,
+        extraction_strategy: ExtractionStrategy = None,
+        chunking_strategy: ChunkingStrategy = RegexChunking(),
+        bypass_cache: bool = False,
+        css_selector: str = None,
+        screenshot: bool = False,
+        user_agent: str = None,
+        verbose=True,
+        **kwargs,
+    ) -> List[CrawlResult]:
+        """
+        Runs the crawler for multiple sources: URLs (web, local files, or raw HTML).
+
+        Args:
+            urls (List[str]): A list of URLs with supported prefixes:
+                - 'http://' or 'https://': Web URL to crawl.
+                - 'file://': Local file path to process.
+                - 'raw:': Raw HTML content to process.
+            **kwargs: ``semaphore_count`` (default 5) caps how many crawls run
+                at once; all keyword arguments are also forwarded to ``arun``.
+            The remaining parameters are passed to ``arun`` unchanged.
+
+        Returns:
+            List[CrawlResult]: One result per URL, in input order. A crawl
+                that raised is reported as a failed CrawlResult.
+        """
+        urls = list(urls)
+        semaphore = asyncio.Semaphore(kwargs.get('semaphore_count', 5))
+
+        async def crawl_with_semaphore(url):
+            async with semaphore:
+                return await self.arun(
+                    url,
+                    word_count_threshold=word_count_threshold,
+                    extraction_strategy=extraction_strategy,
+                    chunking_strategy=chunking_strategy,
+                    bypass_cache=bypass_cache,
+                    css_selector=css_selector,
+                    screenshot=screenshot,
+                    user_agent=user_agent,
+                    verbose=verbose,
+                    **kwargs,
+                )
+
+        results = await asyncio.gather(*map(crawl_with_semaphore, urls), return_exceptions=True)
+        # Keep the declared return type: an exception becomes a failed result.
+        return [
+            CrawlResult(url=url, html="", markdown=str(result), success=False, error_message=str(result))
+            if isinstance(result, Exception) else result
+            for url, result in zip(urls, results)
+        ]
+
+    async def aprocess_html(
+        self,
+        url: str,
+        html: str,
+        extracted_content: str,
+        word_count_threshold: int,
+        extraction_strategy: ExtractionStrategy,
+        chunking_strategy: ChunkingStrategy,
+        css_selector: str,
+        screenshot: str,
+        verbose: bool,
+        **kwargs,
+    ) -> CrawlResult:
+        """Scrape ``html`` and, unless already supplied, run content extraction.
+
+        Args:
+            extracted_content: Previously extracted content; when it is not
+                None the extraction step is skipped and it is returned as is.
+            **kwargs: Forwarded to the scraper; ``is_raw_html`` additionally
+                selects the name shown in log lines.
+
+        Raises:
+            ValueError: If scraping fails or produces no result.
+        """
+        _url = url if not kwargs.get("is_raw_html", False) else "Raw HTML"
+        t1 = time.perf_counter()
+        # These two options are passed explicitly, so take them out of the
+        # forwarded kwargs; passing them twice raises a TypeError.
+        scrap_kwargs = dict(kwargs)
+        only_text = scrap_kwargs.pop("only_text", False)
+        image_threshold = scrap_kwargs.pop("image_description_min_word_threshold", IMAGE_DESCRIPTION_MIN_WORD_THRESHOLD)
+        try:
+            result = WebScrapingStrategy().scrap(
+                url,
+                html,
+                word_count_threshold=word_count_threshold,
+                css_selector=css_selector,
+                only_text=only_text,
+                image_description_min_word_threshold=image_threshold,
+                **scrap_kwargs,
+            )
+        except InvalidCSSSelectorError as e:
+            raise ValueError(str(e)) from e
+        except Exception as e:
+            raise ValueError(f"Process HTML, Failed to extract content from the website: {url}, error: {str(e)}") from e
+        if result is None:
+            raise ValueError(f"Process HTML, Failed to extract content from the website: {url}")
+
+        cleaned_html = sanitize_input_encode(result.get("cleaned_html", ""))
+        markdown = sanitize_input_encode(result.get("markdown", ""))
+        fit_markdown = sanitize_input_encode(result.get("fit_markdown", ""))
+        fit_html = sanitize_input_encode(result.get("fit_html", ""))
+
+        if verbose:
+            print(f"[LOG] 2️⃣  ✅ Scraping done for {_url}, success: True, time taken: {time.perf_counter() - t1:.2f} seconds")
+
+        if extracted_content is None and extraction_strategy and chunking_strategy and not isinstance(extraction_strategy, NoExtractionStrategy):
+            t1 = time.perf_counter()
+            # JSON/CSS extraction reads the raw HTML; every other strategy
+            # reads chunks of the generated markdown.
+            if isinstance(extraction_strategy, JsonCssExtractionStrategy):
+                extraction_strategy.verbose = verbose
+                sections = [html]
+            else:
+                sections = chunking_strategy.chunk(markdown)
+            extracted_content = extraction_strategy.run(url, sections)
+            extracted_content = json.dumps(extracted_content, indent=4, default=str, ensure_ascii=False)
+            if verbose:
+                print(f"[LOG] 3️⃣  ✅ Extraction done for {_url}, time taken: {time.perf_counter() - t1:.2f} seconds")
+
+        return CrawlResult(
+            url=url,
+            html=html,
+            cleaned_html=format_html(cleaned_html),
+            markdown=markdown,
+            fit_markdown=fit_markdown,
+            fit_html=fit_html,
+            media=result.get("media", []),
+            links=result.get("links", []),
+            metadata=result.get("metadata", {}),
+            screenshot=screenshot or None,
+            extracted_content=extracted_content,
+            success=True,
+            error_message="",
+        )
+
+    async def aclear_cache(self):
+        """Run the cache database manager's ``cleanup`` routine."""
+        await async_db_manager.cleanup()
+
+    async def aflush_cache(self):
+        """Run the cache database manager's ``aflush_db`` routine."""
+        await async_db_manager.aflush_db()
+
+    async def aget_cache_size(self):
+        """Return the total count reported by the cache database manager."""
+        return await async_db_manager.aget_total_count()
+
+
diff --git a/crawl4ai/async_webcrawler.py b/crawl4ai/async_webcrawler.py
index 03e7a393..d554576d 100644
--- a/crawl4ai/async_webcrawler.py
+++ b/crawl4ai/async_webcrawler.py
@@ -1,7 +1,10 @@
 import os
 import time
+import warnings
+from enum import Enum
+from colorama import init, Fore, Back, Style
 from pathlib import Path
-from typing import Optional
+from typing import Optional, List, Union
 import json
 import asyncio
 from .models import CrawlResult
@@ -9,8 +12,13 @@ from .async_database import async_db_manager
 from .chunking_strategy import *
 from .extraction_strategy import *
 from .async_crawler_strategy import AsyncCrawlerStrategy, AsyncPlaywrightCrawlerStrategy, AsyncCrawlResponse
+from .cache_context import CacheMode, CacheContext, _legacy_to_cache_mode
 from .content_scrapping_strategy import WebScrapingStrategy
-from .config import MIN_WORD_THRESHOLD, IMAGE_DESCRIPTION_MIN_WORD_THRESHOLD
+from .config import (
+    MIN_WORD_THRESHOLD, 
+    IMAGE_DESCRIPTION_MIN_WORD_THRESHOLD,
+    SHOW_DEPRECATION_WARNINGS  # New import
+)
 from .utils import (
     sanitize_input_encode,
     InvalidCSSSelectorError,
@@ -18,19 +26,77 @@ from .utils import (
 )
 from .__version__ import __version__ as crawl4ai_version
 
+
 class AsyncWebCrawler:
+    """
+    Asynchronous web crawler with flexible caching capabilities.
+    
+    Migration Guide (from version X.X.X):
+    Old way (deprecated):
+        crawler = AsyncWebCrawler(always_by_pass_cache=True)
+        result = await crawler.arun(
+            url="https://example.com",
+            bypass_cache=True,
+            no_cache_read=True,
+            no_cache_write=False
+        )
+    
+    New way (recommended):
+        crawler = AsyncWebCrawler(always_bypass_cache=True)
+        result = await crawler.arun(
+            url="https://example.com",
+            cache_mode=CacheMode.WRITE_ONLY
+        )
+    
+    To disable deprecation warnings:
+        Set SHOW_DEPRECATION_WARNINGS = False in config.py
+    """
+
     def __init__(
         self,
         crawler_strategy: Optional[AsyncCrawlerStrategy] = None,
-        always_by_pass_cache: bool = False,
+        always_bypass_cache: bool = False,
+        always_by_pass_cache: Optional[bool] = None,  # Deprecated parameter
         base_directory: str = str(Path.home()),
         **kwargs,
     ):
-        self.crawler_strategy = crawler_strategy or AsyncPlaywrightCrawlerStrategy(
-            **kwargs
-        )
-        self.always_by_pass_cache = always_by_pass_cache
-        # self.crawl4ai_folder = os.path.join(Path.home(), ".crawl4ai")
+        """
+        Initialize the AsyncWebCrawler.
+
+        Args:
+            crawler_strategy: Strategy for crawling web pages
+            always_bypass_cache: Whether to always bypass cache (new parameter)
+            always_by_pass_cache: Deprecated, use always_bypass_cache instead
+            base_directory: Base directory for storing cache
+        """
+        init()
+        self.log_width = 10  # Width of "[COMPLETE]" 
+        self.tag_format = lambda tag: f"[{tag}]".ljust(self.log_width, ".")
+        self.log_icons = {
+            'INIT': '→',      # Alternative: '▶' or '►'
+            'READY': '✓',     # Alternative: '√'
+            'FETCH': '↓',     # Alternative: '▼'
+            'SCRAPE': '◆',    # Alternative: '♦'
+            'EXTRACT': '■',    # Alternative: '□'
+            'COMPLETE': '●',   # Alternative: '○'
+            'ERROR': '×' 
+        }        
+        self.crawler_strategy = crawler_strategy or AsyncPlaywrightCrawlerStrategy(**kwargs)
+        
+        # Handle deprecated parameter
+        if always_by_pass_cache is not None:
+            if SHOW_DEPRECATION_WARNINGS:
+                warnings.warn(
+                    "'always_by_pass_cache' is deprecated and will be removed in version X.X.X. "
+                    "Use 'always_bypass_cache' instead. "
+                    "Set SHOW_DEPRECATION_WARNINGS=False in config.py to suppress this warning.",
+                    DeprecationWarning,
+                    stacklevel=2
+                )
+            self.always_bypass_cache = always_by_pass_cache
+        else:
+            self.always_bypass_cache = always_bypass_cache
+
         self.crawl4ai_folder = os.path.join(base_directory, ".crawl4ai")
         os.makedirs(self.crawl4ai_folder, exist_ok=True)
         os.makedirs(f"{self.crawl4ai_folder}/cache", exist_ok=True)
@@ -46,21 +112,13 @@ class AsyncWebCrawler:
         await self.crawler_strategy.__aexit__(exc_type, exc_val, exc_tb)
 
     async def awarmup(self):
-        # Print a message for crawl4ai and its version
+        """Initialize the crawler with warm-up sequence."""
         if self.verbose:
-            print(f"[LOG] 🚀 Crawl4AI {crawl4ai_version}")
-            print("[LOG] 🌤️  Warming up the AsyncWebCrawler")
-        # await async_db_manager.ainit_db()
-        # # await async_db_manager.initialize()
-        # await self.arun(
-        #     url="https://google.com/",
-        #     word_count_threshold=5,
-        #     bypass_cache=False,
-        #     verbose=False,
-        # )
+            print(f"{Fore.CYAN}{self.tag_format('INIT')} {self.log_icons['INIT']} Crawl4AI {crawl4ai_version}{Style.RESET_ALL}")
+            print(f"{Fore.CYAN}{self.tag_format('INIT')} {self.log_icons['INIT']} Warming up AsyncWebCrawler{Style.RESET_ALL}")
         self.ready = True
         if self.verbose:
-            print("[LOG] 🌞 AsyncWebCrawler is ready to crawl")
+            print(f"{Fore.GREEN}{self.tag_format('READY')} {self.log_icons['READY']} AsyncWebCrawler initialized{Style.RESET_ALL}")
 
     async def arun(
         self,
@@ -68,35 +126,81 @@ class AsyncWebCrawler:
         word_count_threshold=MIN_WORD_THRESHOLD,
         extraction_strategy: ExtractionStrategy = None,
         chunking_strategy: ChunkingStrategy = RegexChunking(),
+        cache_mode: Optional[CacheMode] = None,
+        # Deprecated parameters
         bypass_cache: bool = False,
+        disable_cache: bool = False,
+        no_cache_read: bool = False,
+        no_cache_write: bool = False,
+        # Other parameters
         css_selector: str = None,
         screenshot: bool = False,
         user_agent: str = None,
         verbose=True,
-        disable_cache: bool = False,
-        no_cache_read: bool = False,
-        no_cache_write: bool = False,
         **kwargs,
     ) -> CrawlResult:
         """
         Runs the crawler for a single source: URL (web, local file, or raw HTML).
 
+        Migration from legacy cache parameters:
+            Old way (deprecated):
+                await crawler.arun(url, bypass_cache=True, no_cache_read=True)
+            
+            New way:
+                await crawler.arun(url, cache_mode=CacheMode.BYPASS)
+
         Args:
-            url (str): The URL to crawl. Supported prefixes:
-                - 'http://' or 'https://': Web URL to crawl.
-                - 'file://': Local file path to process.
-                - 'raw:': Raw HTML content to process.
-            ... [other existing parameters]
+            url: The URL to crawl (http://, https://, file://, or raw:)
+            cache_mode: Cache behavior control (recommended)
+            word_count_threshold: Minimum word count threshold
+            extraction_strategy: Strategy for content extraction
+            chunking_strategy: Strategy for content chunking
+            css_selector: CSS selector for content extraction
+            screenshot: Whether to capture screenshot
+            user_agent: Custom user agent
+            verbose: Enable verbose logging
+            
+            Deprecated Args:
+                bypass_cache: Use cache_mode=CacheMode.BYPASS instead
+                disable_cache: Use cache_mode=CacheMode.DISABLED instead
+                no_cache_read: Use cache_mode=CacheMode.WRITE_ONLY instead
+                no_cache_write: Use cache_mode=CacheMode.READ_ONLY instead
 
         Returns:
-            CrawlResult: The result of the crawling and processing.
+            CrawlResult: The result of crawling and processing
         """
         try:
-            if disable_cache:
-                bypass_cache = True
-                no_cache_read = True
-                no_cache_write = True
+            # Handle deprecated parameters
+            if any([bypass_cache, disable_cache, no_cache_read, no_cache_write]):
+                if SHOW_DEPRECATION_WARNINGS:
+                    warnings.warn(
+                        "Cache control boolean flags are deprecated and will be removed in version X.X.X. "
+                        "Use 'cache_mode' parameter instead. Examples:\n"
+                        "- For bypass_cache=True, use cache_mode=CacheMode.BYPASS\n"
+                        "- For disable_cache=True, use cache_mode=CacheMode.DISABLED\n"
+                        "- For no_cache_read=True, use cache_mode=CacheMode.WRITE_ONLY\n"
+                        "- For no_cache_write=True, use cache_mode=CacheMode.READ_ONLY\n"
+                        "Set SHOW_DEPRECATION_WARNINGS=False in config.py to suppress this warning.",
+                        DeprecationWarning,
+                        stacklevel=2
+                    )
+                
+                # Convert legacy parameters if cache_mode not provided
+                if cache_mode is None:
+                    cache_mode = _legacy_to_cache_mode(
+                        disable_cache=disable_cache,
+                        bypass_cache=bypass_cache,
+                        no_cache_read=no_cache_read,
+                        no_cache_write=no_cache_write
+                    )
             
+            # Default to ENABLED if no cache mode specified
+            if cache_mode is None:
+                cache_mode = CacheMode.ENABLED
+
+            # Create cache context
+            cache_context = CacheContext(url, cache_mode, self.always_bypass_cache)
+
             extraction_strategy = extraction_strategy or NoExtractionStrategy()
             extraction_strategy.verbose = verbose
             if not isinstance(extraction_strategy, ExtractionStrategy):
@@ -107,18 +211,14 @@ class AsyncWebCrawler:
             word_count_threshold = max(word_count_threshold, MIN_WORD_THRESHOLD)
 
             async_response: AsyncCrawlResponse = None
-            cached = None
+            cached_result = None
             screenshot_data = None
             extracted_content = None
             
-            is_web_url = url.startswith(('http://', 'https://'))
-            is_local_file = url.startswith("file://")
-            is_raw_html = url.startswith("raw:")
-            _url = url if not is_raw_html else "Raw HTML"
-            
             start_time = time.perf_counter()
-            cached_result = None
-            if is_web_url and (not bypass_cache or not no_cache_read) and not self.always_by_pass_cache:
+            
+            # Try to get cached result if appropriate
+            if cache_context.should_read():
                 cached_result = await async_db_manager.aget_cached_url(url)
                         
             if cached_result:
@@ -129,26 +229,27 @@ class AsyncWebCrawler:
                     if not screenshot_data:
                         cached_result = None
                 if verbose:
-                    print(
-                        f"[LOG] 1️⃣  ✅ Page fetched (cache) for {_url}, success: {bool(html)}, time taken: {time.perf_counter() - start_time:.2f} seconds"
-                    )
+                    print(f"{Fore.BLUE}{self.tag_format('FETCH')} {self.log_icons['FETCH']} Cache hit for {cache_context.display_url} | Status: {Fore.GREEN if bool(html) else Fore.RED}{bool(html)}{Style.RESET_ALL} | Time: {time.perf_counter() - start_time:.2f}s")
 
 
-            if not cached or not html:
+            # Fetch fresh content if needed
+            if not cached_result or not html:
                 t1 = time.perf_counter()
                 
                 if user_agent:
                     self.crawler_strategy.update_user_agent(user_agent)
-                async_response: AsyncCrawlResponse = await self.crawler_strategy.crawl(url, screenshot=screenshot, **kwargs)
+                async_response: AsyncCrawlResponse = await self.crawler_strategy.crawl(
+                    url, 
+                    screenshot=screenshot, 
+                    **kwargs
+                )
                 html = sanitize_input_encode(async_response.html)
                 screenshot_data = async_response.screenshot
                 t2 = time.perf_counter()
                 if verbose:
-                    print(
-                        f"[LOG] 1️⃣  ✅ Page fetched (no-cache) for {_url}, success: {bool(html)}, time taken: {t2 - t1:.2f} seconds"
-                    )
+                    print(f"{Fore.BLUE}{self.tag_format('FETCH')} {self.log_icons['FETCH']} Live fetch for {cache_context.display_url} | Status: {Fore.GREEN if bool(html) else Fore.RED}{bool(html)}{Style.RESET_ALL} | Time: {t2 - t1:.2f}s")
 
-            t1 = time.perf_counter()
+            # Process the HTML content
             crawl_result = await self.aprocess_html(
                 url=url,
                 html=html,
@@ -159,15 +260,15 @@ class AsyncWebCrawler:
                 css_selector=css_selector,
                 screenshot=screenshot_data,
                 verbose=verbose,
-                is_cached=bool(cached),
+                is_cached=bool(cached_result),
                 async_response=async_response,
-                bypass_cache=bypass_cache,
-                is_web_url = is_web_url,
-                is_local_file = is_local_file,
-                is_raw_html = is_raw_html,
+                is_web_url=cache_context.is_web_url,
+                is_local_file=cache_context.is_local_file,
+                is_raw_html=cache_context.is_raw_html,
                 **kwargs,
             )
             
+            # Set response data
             if async_response:
                 crawl_result.status_code = async_response.status_code
                 crawl_result.response_headers = async_response.response_headers
@@ -180,22 +281,26 @@ class AsyncWebCrawler:
             crawl_result.session_id = kwargs.get("session_id", None)
 
             if verbose:
-                print(
-                    f"[LOG] 🔥 🚀 Crawling done for {_url}, success: {crawl_result.success}, time taken: {time.perf_counter() - start_time:.2f} seconds"
-                )
+                print(f"{Fore.GREEN}{self.tag_format('COMPLETE')} {self.log_icons['COMPLETE']} {cache_context.display_url} | Status: {Fore.GREEN if crawl_result.success else Fore.RED}{crawl_result.success} | {Fore.YELLOW}Total: {time.perf_counter() - start_time:.2f}s{Style.RESET_ALL}")
 
-            if not is_raw_html and not no_cache_write:
-                if not bool(cached_result) or kwargs.get("bypass_cache", False) or self.always_by_pass_cache:
-                    await async_db_manager.acache_url(crawl_result)
 
+            # Update cache if appropriate
+            if cache_context.should_write() and not bool(cached_result):
+                await async_db_manager.acache_url(crawl_result)
 
             return crawl_result
         
         except Exception as e:
             if not hasattr(e, "msg"):
                 e.msg = str(e)
-            print(f"[ERROR] 🚫 arun(): Failed to crawl {_url}, error: {e.msg}")
-            return CrawlResult(url=url, html="", markdown = f"[ERROR] 🚫 arun(): Failed to crawl {_url}, error: {e.msg}", success=False, error_message=e.msg)
+            print(f"{Fore.RED}{self.tag_format('ERROR')} {self.log_icons['ERROR']} Failed to crawl {cache_context.display_url} | {e.msg}{Style.RESET_ALL}")
+            return CrawlResult(
+                url=url, 
+                html="", 
+                markdown=f"[ERROR] 🚫 arun(): Failed to crawl {cache_context.display_url}, error: {e.msg}", 
+                success=False, 
+                error_message=e.msg
+            )
 
     async def arun_many(
         self,
@@ -203,6 +308,8 @@ class AsyncWebCrawler:
         word_count_threshold=MIN_WORD_THRESHOLD,
         extraction_strategy: ExtractionStrategy = None,
         chunking_strategy: ChunkingStrategy = RegexChunking(),
+        cache_mode: Optional[CacheMode] = None,
+        # Deprecated parameters
         bypass_cache: bool = False,
         css_selector: str = None,
         screenshot: bool = False,
@@ -211,19 +318,35 @@ class AsyncWebCrawler:
         **kwargs,
     ) -> List[CrawlResult]:
         """
-        Runs the crawler for multiple sources: URLs (web, local files, or raw HTML).
+        Runs the crawler for multiple URLs concurrently.
+
+        Migration from legacy parameters:
+            Old way (deprecated):
+                results = await crawler.arun_many(urls, bypass_cache=True)
+            
+            New way:
+                results = await crawler.arun_many(urls, cache_mode=CacheMode.BYPASS)
 
         Args:
-            urls (List[str]): A list of URLs with supported prefixes:
-                - 'http://' or 'https://': Web URL to crawl.
-                - 'file://': Local file path to process.
-                - 'raw:': Raw HTML content to process.
-            ... [other existing parameters]
+            urls: List of URLs to crawl
+            cache_mode: Cache behavior control (recommended)
+            [other parameters same as arun()]
 
         Returns:
-            List[CrawlResult]: The results of the crawling and processing.
+            List[CrawlResult]: Results for each URL
         """
-        semaphore_count = kwargs.get('semaphore_count', 5)  # Adjust as needed
+        if bypass_cache:
+            if SHOW_DEPRECATION_WARNINGS:
+                warnings.warn(
+                    "'bypass_cache' is deprecated and will be removed in version X.X.X. "
+                    "Use 'cache_mode=CacheMode.BYPASS' instead. "
+                    "Set SHOW_DEPRECATION_WARNINGS=False in config.py to suppress this warning.",
+                    DeprecationWarning, stacklevel=2)
+            # Map the legacy flag even when the warning is silenced, so it is never dropped.
+            if cache_mode is None:
+                cache_mode = CacheMode.BYPASS
+
+        semaphore_count = kwargs.get('semaphore_count', 5)
         semaphore = asyncio.Semaphore(semaphore_count)
 
         async def crawl_with_semaphore(url):
@@ -233,7 +356,7 @@ class AsyncWebCrawler:
                     word_count_threshold=word_count_threshold,
                     extraction_strategy=extraction_strategy,
                     chunking_strategy=chunking_strategy,
-                    bypass_cache=bypass_cache,
+                    cache_mode=cache_mode,
                     css_selector=css_selector,
                     screenshot=screenshot,
                     user_agent=user_agent,
@@ -245,6 +368,7 @@ class AsyncWebCrawler:
         results = await asyncio.gather(*tasks, return_exceptions=True)
         return [result if not isinstance(result, Exception) else str(result) for result in results]
 
+
     async def aprocess_html(
         self,
         url: str,
@@ -258,7 +382,6 @@ class AsyncWebCrawler:
         verbose: bool,
         **kwargs,
     ) -> CrawlResult:
-        t = time.perf_counter()
         # Extract content from HTML
         try:
             _url = url if not kwargs.get("is_raw_html", False) else "Raw HTML"
@@ -293,9 +416,9 @@ class AsyncWebCrawler:
         metadata = result.get("metadata", {})
         
         if verbose:
-            print(
-                f"[LOG] 2️⃣  ✅ Scraping done for {_url}, success: True, time taken: {time.perf_counter() - t1:.2f} seconds"
-            )        
+            print(f"{Fore.MAGENTA}{self.tag_format('SCRAPE')} {self.log_icons['SCRAPE']} Processed {_url}{Style.RESET_ALL} | Time: {int((time.perf_counter() - t1) * 1000)}ms")
+
+
 
         if extracted_content is None and extraction_strategy and chunking_strategy and not isinstance(extraction_strategy, NoExtractionStrategy):
             t1 = time.perf_counter()
@@ -309,9 +432,9 @@ class AsyncWebCrawler:
                 extracted_content = extraction_strategy.run(url, sections)
                 extracted_content = json.dumps(extracted_content, indent=4, default=str, ensure_ascii=False)
             if verbose:
-                print(
-                    f"[LOG] 3️⃣  ✅ Extraction done for {_url}, time taken: {time.perf_counter() - t1:.2f} seconds"
-                )
+                print(f"{Fore.YELLOW}{self.tag_format('EXTRACT')} {self.log_icons['EXTRACT']} Completed for {_url}{Style.RESET_ALL} | Time: {time.perf_counter() - t1:.2f}s{Style.RESET_ALL}")
+
+                
 
         screenshot = None if not screenshot else screenshot
         
@@ -332,13 +455,15 @@ class AsyncWebCrawler:
         )
 
     async def aclear_cache(self):
-        # await async_db_manager.aclear_db()
+        """Clear the cache database."""
         await async_db_manager.cleanup()
 
     async def aflush_cache(self):
+        """Flush the cache database."""
         await async_db_manager.aflush_db()
 
     async def aget_cache_size(self):
+        """Get the total number of cached items."""
         return await async_db_manager.aget_total_count()
 
 
diff --git a/crawl4ai/cache_context.py b/crawl4ai/cache_context.py
new file mode 100644
index 00000000..429eacc1
--- /dev/null
+++ b/crawl4ai/cache_context.py
@@ -0,0 +1,79 @@
+from enum import Enum
+
+
+class CacheMode(Enum):
+    """
+    Defines the caching behavior for web crawling operations.
+    
+    Modes (read/write as decided by CacheContext.should_read/should_write):
+    - ENABLED: Normal caching behavior (read and write)
+    - DISABLED: No caching at all (neither read nor write)
+    - READ_ONLY: Only read from cache, don't write
+    - WRITE_ONLY: Only write to cache, don't read
+    - BYPASS: Bypass cache for this operation (neither read nor write)
+    """
+    ENABLED = "enabled"
+    DISABLED = "disabled"
+    READ_ONLY = "read_only"
+    WRITE_ONLY = "write_only"
+    BYPASS = "bypass"
+
+
+class CacheContext:
+    """
+    Per-URL holder for cache decisions and URL classification.
+    
+    The URL is classified by prefix (web, local file, raw HTML) at construction;
+    should_read() / should_write() then answer for the configured CacheMode.
+    """
+    def __init__(self, url: str, cache_mode: CacheMode, always_bypass: bool = False):
+        web = url.startswith(('http://', 'https://'))
+        local = url.startswith("file://")
+        raw = url.startswith("raw:")
+        self.url, self.cache_mode, self.always_bypass = url, cache_mode, always_bypass
+        self.is_web_url, self.is_local_file, self.is_raw_html = web, local, raw
+        self.is_cacheable = web or local  # same set as http://, https://, file://
+        # Raw HTML input is displayed as a fixed label rather than the url text.
+        self._url_display = "Raw HTML" if raw else url
+    
+    def should_read(self) -> bool:
+        """Return True when the cache may be consulted for this URL."""
+        if self.is_cacheable and not self.always_bypass:
+            return self.cache_mode in [CacheMode.ENABLED, CacheMode.READ_ONLY]
+        return False
+    
+    def should_write(self) -> bool:
+        """Return True when the crawl result may be stored in the cache."""
+        if self.is_cacheable and not self.always_bypass:
+            return self.cache_mode in [CacheMode.ENABLED, CacheMode.WRITE_ONLY]
+        return False
+    
+    @property
+    def display_url(self) -> str:
+        """URL text for log output ("Raw HTML" for raw: input)."""
+        return self._url_display
+
+
+def _legacy_to_cache_mode(
+    disable_cache: bool = False,
+    bypass_cache: bool = False,
+    no_cache_read: bool = False,
+    no_cache_write: bool = False
+) -> CacheMode:
+    """
+    Translate the deprecated boolean cache flags into one CacheMode.
+    
+    Internal transition helper. Precedence: disable_cache, then bypass_cache,
+    then the no_cache_read / no_cache_write pair; no flag set means ENABLED.
+    """
+    if disable_cache:
+        return CacheMode.DISABLED
+    if bypass_cache:
+        return CacheMode.BYPASS
+    by_read_write_flags = {
+        (True, True): CacheMode.DISABLED,
+        (True, False): CacheMode.WRITE_ONLY,
+        (False, True): CacheMode.READ_ONLY,
+        (False, False): CacheMode.ENABLED,
+    }
+    return by_read_write_flags[bool(no_cache_read), bool(no_cache_write)]
diff --git a/crawl4ai/config.py b/crawl4ai/config.py
index 5bc284bf..6b1324dd 100644
--- a/crawl4ai/config.py
+++ b/crawl4ai/config.py
@@ -54,4 +54,5 @@ IMAGE_SCORE_THRESHOLD = 2
 
 MAX_METRICS_HISTORY = 1000
 
-NEED_MIGRATION = True
\ No newline at end of file
+NEED_MIGRATION = True
+SHOW_DEPRECATION_WARNINGS = True
\ No newline at end of file
diff --git a/docs/examples/docker_example.py b/docs/examples/docker_example.py
index b43e8ee6..898f14da 100644
--- a/docs/examples/docker_example.py
+++ b/docs/examples/docker_example.py
@@ -48,8 +48,8 @@ class Crawl4AiTester:
 def test_docker_deployment(version="basic"):
     tester = Crawl4AiTester(
         base_url="http://localhost:11235" ,
-        # base_url="https://crawl4ai-sby74.ondigitalocean.app",
-        api_token="test"
+        # base_url="https://api.crawl4ai.com" # just for example
+        # api_token="test" # just for example
     )
     print(f"Testing Crawl4AI Docker {version} version")
     
@@ -69,6 +69,7 @@ def test_docker_deployment(version="basic"):
     
     # Test cases based on version
     test_basic_crawl(tester)
+    test_basic_crawl(tester)
     test_basic_crawl_sync(tester)
     
     # if version in ["full", "transformer"]:
diff --git a/docs/examples/quickstart_async.py b/docs/examples/quickstart_async.py
index 9c57f57d..d67a8c30 100644
--- a/docs/examples/quickstart_async.py
+++ b/docs/examples/quickstart_async.py
@@ -71,12 +71,12 @@ async def use_proxy():
         "Note: Replace 'http://your-proxy-url:port' with a working proxy to run this example."
     )
     # Uncomment and modify the following lines to use a proxy
-    # async with AsyncWebCrawler(verbose=True, proxy="http://your-proxy-url:port") as crawler:
-    #     result = await crawler.arun(
-    #         url="https://www.nbcnews.com/business",
-    #         bypass_cache=True
-    #     )
-    #     print(result.markdown[:500])  # Print first 500 characters
+    async with AsyncWebCrawler(verbose=True, proxy="http://your-proxy-url:port") as crawler:
+        result = await crawler.arun(
+            url="https://www.nbcnews.com/business",
+            bypass_cache=True
+        )
+        print(result.markdown[:500])  # Print first 500 characters
 
 async def capture_and_save_screenshot(url: str, output_path: str):
     async with AsyncWebCrawler(verbose=True) as crawler:
diff --git a/requirements.txt b/requirements.txt
index 74e8b3d6..e6294cc5 100644
--- a/requirements.txt
+++ b/requirements.txt
@@ -11,4 +11,5 @@ beautifulsoup4~=4.12
 tf-playwright-stealth~=1.0
 xxhash~=3.4
 rank-bm25~=0.2
-aiofiles~=24.0
\ No newline at end of file
+aiofiles~=24.0
+colorama~=0.4
\ No newline at end of file
diff --git a/tests/docker_example.py b/tests/docker_example.py
new file mode 100644
index 00000000..658e80fd
--- /dev/null
+++ b/tests/docker_example.py
@@ -0,0 +1,332 @@
+import requests
+import json
+import time
+import sys
+import base64
+import os
+from typing import Dict, Any
+
+class Crawl4AiTester:
+    def __init__(self, base_url: str = "http://localhost:11235", api_token: str = None):
+        self.base_url = base_url
+        self.api_token = api_token or os.getenv('CRAWL4AI_API_TOKEN')  # Check environment variable as fallback
+        self.headers = {'Authorization': f'Bearer {self.api_token}'} if self.api_token else {}
+        
+    def submit_and_wait(self, request_data: Dict[str, Any], timeout: int = 300) -> Dict[str, Any]:
+        # Submit crawl job
+        response = requests.post(f"{self.base_url}/crawl", json=request_data, headers=self.headers)
+        if response.status_code == 403:
+            raise Exception("API token is invalid or missing")
+        task_id = response.json()["task_id"]
+        print(f"Task ID: {task_id}")
+        
+        # Poll for result
+        start_time = time.time()
+        while True:
+            if time.time() - start_time > timeout:
+                raise TimeoutError(f"Task {task_id} did not complete within {timeout} seconds")
+                
+            result = requests.get(f"{self.base_url}/task/{task_id}", headers=self.headers)
+            status = result.json()
+            
+            if status["status"] == "failed":
+                print("Task failed:", status.get("error"))
+                raise Exception(f"Task failed: {status.get('error')}")
+                
+            if status["status"] == "completed":
+                return status
+                
+            time.sleep(2)
+            
+    def submit_sync(self, request_data: Dict[str, Any]) -> Dict[str, Any]:
+        response = requests.post(f"{self.base_url}/crawl_sync", json=request_data, headers=self.headers, timeout=60)
+        if response.status_code == 408:
+            raise TimeoutError("Task did not complete within server timeout")
+        response.raise_for_status()
+        return response.json()
+
+def test_docker_deployment(version="basic"):
+    tester = Crawl4AiTester(
+        # base_url="http://localhost:11235" ,
+        base_url="https://crawl4ai-sby74.ondigitalocean.app",
+        api_token="test"
+    )
+    print(f"Testing Crawl4AI Docker {version} version")
+    
+    # Health check with timeout and retry
+    max_retries = 5
+    for i in range(max_retries):
+        try:
+            health = requests.get(f"{tester.base_url}/health", timeout=10)
+            print("Health check:", health.json())
+            break
+        except requests.exceptions.RequestException as e:
+            if i == max_retries - 1:
+                print(f"Failed to connect after {max_retries} attempts")
+                sys.exit(1)
+            print(f"Waiting for service to start (attempt {i+1}/{max_retries})...")
+            time.sleep(5)
+    
+    # Test cases based on version
+    test_basic_crawl(tester)
+    test_basic_crawl(tester)
+    test_basic_crawl_sync(tester)
+    
+    # if version in ["full", "transformer"]:
+    #     test_cosine_extraction(tester)
+
+    # test_js_execution(tester)
+    # test_css_selector(tester)
+    # test_structured_extraction(tester)
+    # test_llm_extraction(tester)
+    # test_llm_with_ollama(tester)
+    # test_screenshot(tester)
+    
+
+def test_basic_crawl(tester: Crawl4AiTester):
+    print("\n=== Testing Basic Crawl ===")
+    request = {
+        "urls": "https://www.nbcnews.com/business",
+        "priority": 10, 
+        "session_id": "test"
+    }
+    
+    result = tester.submit_and_wait(request)
+    print(f"Basic crawl result length: {len(result['result']['markdown'])}")
+    assert result["result"]["success"]
+    assert len(result["result"]["markdown"]) > 0
+
+def test_basic_crawl_sync(tester: Crawl4AiTester):
+    print("\n=== Testing Basic Crawl (Sync) ===")
+    request = {
+        "urls": "https://www.nbcnews.com/business",
+        "priority": 10,
+        "session_id": "test"
+    }
+    
+    result = tester.submit_sync(request)
+    print(f"Basic crawl result length: {len(result['result']['markdown'])}")
+    assert result['status'] == 'completed'
+    assert result['result']['success']
+    assert len(result['result']['markdown']) > 0
+    
+def test_js_execution(tester: Crawl4AiTester):
+    print("\n=== Testing JS Execution ===")
+    request = {
+        "urls": "https://www.nbcnews.com/business",
+        "priority": 8,
+        "js_code": [
+            "const loadMoreButton = Array.from(document.querySelectorAll('button')).find(button => button.textContent.includes('Load More')); loadMoreButton && loadMoreButton.click();"
+        ],
+        "wait_for": "article.tease-card:nth-child(10)",
+        "crawler_params": {
+            "headless": True
+        }
+    }
+    
+    result = tester.submit_and_wait(request)
+    print(f"JS execution result length: {len(result['result']['markdown'])}")
+    assert result["result"]["success"]
+
+def test_css_selector(tester: Crawl4AiTester):
+    print("\n=== Testing CSS Selector ===")
+    request = {
+        "urls": "https://www.nbcnews.com/business",
+        "priority": 7,
+        "css_selector": ".wide-tease-item__description",
+        "crawler_params": {
+            "headless": True
+        },
+        "extra": {"word_count_threshold": 10}
+        
+    }
+    
+    result = tester.submit_and_wait(request)
+    print(f"CSS selector result length: {len(result['result']['markdown'])}")
+    assert result["result"]["success"]
+
+def test_structured_extraction(tester: Crawl4AiTester):
+    print("\n=== Testing Structured Extraction ===")
+    schema = {
+        "name": "Coinbase Crypto Prices",
+        "baseSelector": ".cds-tableRow-t45thuk",
+        "fields": [
+            {
+                "name": "crypto",
+                "selector": "td:nth-child(1) h2",
+                "type": "text",
+            },
+            {
+                "name": "symbol",
+                "selector": "td:nth-child(1) p",
+                "type": "text",
+            },
+            {
+                "name": "price",
+                "selector": "td:nth-child(2)",
+                "type": "text",
+            }
+        ],
+    }
+    
+    request = {
+        "urls": "https://www.coinbase.com/explore",
+        "priority": 9,
+        "extraction_config": {
+            "type": "json_css",
+            "params": {
+                "schema": schema
+            }
+        }
+    }
+    
+    result = tester.submit_and_wait(request)
+    extracted = json.loads(result["result"]["extracted_content"])
+    print(f"Extracted {len(extracted)} items")
+    print("Sample item:", json.dumps(extracted[0], indent=2))
+    assert result["result"]["success"]
+    assert len(extracted) > 0
+
+def test_llm_extraction(tester: Crawl4AiTester):
+    print("\n=== Testing LLM Extraction ===")
+    schema = {
+        "type": "object",
+        "properties": {
+            "model_name": {
+                "type": "string",
+                "description": "Name of the OpenAI model."
+            },
+            "input_fee": {
+                "type": "string",
+                "description": "Fee for input token for the OpenAI model."
+            },
+            "output_fee": {
+                "type": "string",
+                "description": "Fee for output token for the OpenAI model."
+            }
+        },
+        "required": ["model_name", "input_fee", "output_fee"]
+    }
+    
+    request = {
+        "urls": "https://openai.com/api/pricing",
+        "priority": 8,
+        "extraction_config": {
+            "type": "llm",
+            "params": {
+                "provider": "openai/gpt-4o-mini",
+                "api_token": os.getenv("OPENAI_API_KEY"),
+                "schema": schema,
+                "extraction_type": "schema",
+                "instruction": """From the crawled content, extract all mentioned model names along with their fees for input and output tokens."""
+            }
+        },
+        "crawler_params": {"word_count_threshold": 1}
+    }
+    
+    try:
+        result = tester.submit_and_wait(request)
+        extracted = json.loads(result["result"]["extracted_content"])
+        print(f"Extracted {len(extracted)} model pricing entries")
+        print("Sample entry:", json.dumps(extracted[0], indent=2))
+        assert result["result"]["success"]
+    except Exception as e:
+        print(f"LLM extraction test failed (might be due to missing API key): {str(e)}")
+
+def test_llm_with_ollama(tester: Crawl4AiTester):
+    print("\n=== Testing LLM with Ollama ===")
+    schema = {
+        "type": "object",
+        "properties": {
+            "article_title": {
+                "type": "string",
+                "description": "The main title of the news article"
+            },
+            "summary": {
+                "type": "string",
+                "description": "A brief summary of the article content"
+            },
+            "main_topics": {
+                "type": "array",
+                "items": {"type": "string"},
+                "description": "Main topics or themes discussed in the article"
+            }
+        }
+    }
+    
+    request = {
+        "urls": "https://www.nbcnews.com/business",
+        "priority": 8,
+        "extraction_config": {
+            "type": "llm",
+            "params": {
+                "provider": "ollama/llama2",
+                "schema": schema,
+                "extraction_type": "schema",
+                "instruction": "Extract the main article information including title, summary, and main topics."
+            }
+        },
+        "extra": {"word_count_threshold": 1},
+        "crawler_params": {"verbose": True}
+    }
+    
+    try:
+        result = tester.submit_and_wait(request)
+        extracted = json.loads(result["result"]["extracted_content"])
+        print("Extracted content:", json.dumps(extracted, indent=2))
+        assert result["result"]["success"]
+    except Exception as e:
+        print(f"Ollama extraction test failed: {str(e)}")
+
+def test_cosine_extraction(tester: Crawl4AiTester):
+    print("\n=== Testing Cosine Extraction ===")
+    request = {
+        "urls": "https://www.nbcnews.com/business",
+        "priority": 8,
+        "extraction_config": {
+            "type": "cosine",
+            "params": {
+                "semantic_filter": "business finance economy",
+                "word_count_threshold": 10,
+                "max_dist": 0.2,
+                "top_k": 3
+            }
+        }
+    }
+    
+    try:
+        result = tester.submit_and_wait(request)
+        extracted = json.loads(result["result"]["extracted_content"])
+        print(f"Extracted {len(extracted)} text clusters")
+        print("First cluster tags:", extracted[0]["tags"])
+        assert result["result"]["success"]
+    except Exception as e:
+        print(f"Cosine extraction test failed: {str(e)}")
+
+def test_screenshot(tester: Crawl4AiTester):
+    print("\n=== Testing Screenshot ===")
+    request = {
+        "urls": "https://www.nbcnews.com/business",
+        "priority": 5,
+        "screenshot": True,
+        "crawler_params": {
+            "headless": True
+        }
+    }
+    
+    result = tester.submit_and_wait(request)
+    print("Screenshot captured:", bool(result["result"]["screenshot"]))
+    
+    if result["result"]["screenshot"]:
+        # Save screenshot
+        screenshot_data = base64.b64decode(result["result"]["screenshot"])
+        with open("test_screenshot.jpg", "wb") as f:
+            f.write(screenshot_data)
+        print("Screenshot saved as test_screenshot.jpg")
+    
+    assert result["result"]["success"]
+
+if __name__ == "__main__":
+    version = sys.argv[1] if len(sys.argv) > 1 else "basic"
+    # version = "full"
+    test_docker_deployment(version)
\ No newline at end of file

From 3a524a3bdd3afdd58d64c336031e7687fdfe5631 Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Sun, 17 Nov 2024 16:00:39 +0800
Subject: [PATCH 039/115] fix(docs): remove unnecessary blank line in README
 for improved readability

---
 README.md | 1 -
 1 file changed, 1 deletion(-)

diff --git a/README.md b/README.md
index a2806304..069c02b8 100644
--- a/README.md
+++ b/README.md
@@ -119,7 +119,6 @@ Deploy your own instance of Crawl4AI with one click:
 
 [![DigitalOcean Referral Badge](https://web-platforms.sfo2.cdn.digitaloceanspaces.com/WWW/Badge%203.svg)](https://www.digitalocean.com/?repo=https://github.com/unclecode/crawl4ai/tree/0.3.74&refcode=a0780f1bdb3d&utm_campaign=Referral_Invite&utm_medium=Referral_Program&utm_source=badge)
 
-
 > 💡 **Recommended specs**: 4GB RAM minimum. Select "professional-xs" or higher when deploying for stable operation.
 
 The deploy will:

From 2a82455b3dd3427f3099e201c2d88fadcc0c78fc Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Sun, 17 Nov 2024 17:17:34 +0800
Subject: [PATCH 040/115] feat(crawl): implement direct crawl functionality and
 introduce CacheMode for improved caching control

---
 docs/examples/docker_example.py | 33 ++++++++++++--
 docs/md_v2/basic/cache-modes.md | 79 +++++++++++++++++++++++++++++++++
 main.py                         | 46 ++++++++++++++++++-
 mkdocs.yml                      |  1 +
 4 files changed, 153 insertions(+), 6 deletions(-)
 create mode 100644 docs/md_v2/basic/cache-modes.md

diff --git a/docs/examples/docker_example.py b/docs/examples/docker_example.py
index 898f14da..17ef9f04 100644
--- a/docs/examples/docker_example.py
+++ b/docs/examples/docker_example.py
@@ -9,7 +9,7 @@ from typing import Dict, Any
 class Crawl4AiTester:
     def __init__(self, base_url: str = "http://localhost:11235", api_token: str = None):
         self.base_url = base_url
-        self.api_token = api_token or os.getenv('CRAWL4AI_API_TOKEN')  # Check environment variable as fallback
+        self.api_token = api_token or os.getenv('CRAWL4AI_API_TOKEN') or "test_api_code"  # Check environment variable as fallback
         self.headers = {'Authorization': f'Bearer {self.api_token}'} if self.api_token else {}
         
     def submit_and_wait(self, request_data: Dict[str, Any], timeout: int = 300) -> Dict[str, Any]:
@@ -44,6 +44,16 @@ class Crawl4AiTester:
             raise TimeoutError("Task did not complete within server timeout")
         response.raise_for_status()
         return response.json()
+    
+    def crawl_direct(self, request_data: Dict[str, Any]) -> Dict[str, Any]:
+        """Directly crawl without using task queue"""
+        response = requests.post(
+            f"{self.base_url}/crawl_direct", 
+            json=request_data, 
+            headers=self.headers
+        )
+        response.raise_for_status()
+        return response.json()
 
 def test_docker_deployment(version="basic"):
     tester = Crawl4AiTester(
@@ -68,9 +78,10 @@ def test_docker_deployment(version="basic"):
             time.sleep(5)
     
     # Test cases based on version
-    test_basic_crawl(tester)
-    test_basic_crawl(tester)
-    test_basic_crawl_sync(tester)
+    # test_basic_crawl(tester)
+    # test_basic_crawl(tester)
+    # test_basic_crawl_sync(tester)
+    test_basic_crawl_direct(tester)
     
     # if version in ["full", "transformer"]:
     #     test_cosine_extraction(tester)
@@ -110,6 +121,20 @@ def test_basic_crawl_sync(tester: Crawl4AiTester):
     assert result['result']['success']
     assert len(result['result']['markdown']) > 0
     
+def test_basic_crawl_direct(tester: Crawl4AiTester):
+    print("\n=== Testing Basic Crawl (Direct) ===")
+    request = {
+        "urls": "https://www.nbcnews.com/business",
+        "priority": 10,
+        # "session_id": "test"
+        "cache_mode": "bypass"  # or "enabled", "disabled", "read_only", "write_only"
+    }
+    
+    result = tester.crawl_direct(request)
+    print(f"Basic crawl result length: {len(result['result']['markdown'])}")
+    assert result['result']['success']
+    assert len(result['result']['markdown']) > 0
+    
 def test_js_execution(tester: Crawl4AiTester):
     print("\n=== Testing JS Execution ===")
     request = {
diff --git a/docs/md_v2/basic/cache-modes.md b/docs/md_v2/basic/cache-modes.md
new file mode 100644
index 00000000..04a4f218
--- /dev/null
+++ b/docs/md_v2/basic/cache-modes.md
@@ -0,0 +1,79 @@
+# Crawl4AI Cache System and Migration Guide
+
+## Overview
+Starting from version X.X.X, Crawl4AI introduces a new caching system that replaces the old boolean flags with a more intuitive `CacheMode` enum. This change simplifies cache control and makes the behavior more predictable.
+
+## Old vs New Approach
+
+### Old Way (Deprecated)
+The old system used multiple boolean flags:
+- `bypass_cache`: Skip cache entirely
+- `disable_cache`: Disable all caching
+- `no_cache_read`: Don't read from cache
+- `no_cache_write`: Don't write to cache
+
+### New Way (Recommended)
+The new system uses a single `CacheMode` enum:
+- `CacheMode.ENABLED`: Normal caching (read/write)
+- `CacheMode.DISABLED`: No caching at all
+- `CacheMode.READ_ONLY`: Only read from cache
+- `CacheMode.WRITE_ONLY`: Only write to cache
+- `CacheMode.BYPASS`: Skip cache for this operation
+
+## Migration Example
+
+### Old Code (Deprecated)
+```python
+import asyncio
+from crawl4ai import AsyncWebCrawler
+
+async def use_proxy():
+    async with AsyncWebCrawler(verbose=True) as crawler:
+        result = await crawler.arun(
+            url="https://www.nbcnews.com/business",
+            bypass_cache=True  # Old way
+        )
+        print(len(result.markdown))
+
+async def main():
+    await use_proxy()
+
+if __name__ == "__main__":
+    asyncio.run(main())
+```
+
+### New Code (Recommended)
+```python
+import asyncio
+from crawl4ai import AsyncWebCrawler, CacheMode  # Import CacheMode
+
+async def use_proxy():
+    async with AsyncWebCrawler(verbose=True) as crawler:
+        result = await crawler.arun(
+            url="https://www.nbcnews.com/business",
+            cache_mode=CacheMode.BYPASS  # New way
+        )
+        print(len(result.markdown))
+
+async def main():
+    await use_proxy()
+
+if __name__ == "__main__":
+    asyncio.run(main())
+```
+
+## Common Migration Patterns
+
+Old Flag | New Mode
+---------|----------
+`bypass_cache=True` | `cache_mode=CacheMode.BYPASS`
+`disable_cache=True` | `cache_mode=CacheMode.DISABLED`
+`no_cache_read=True` | `cache_mode=CacheMode.WRITE_ONLY`
+`no_cache_write=True` | `cache_mode=CacheMode.READ_ONLY`
+
+## Suppressing Deprecation Warnings
+If you need time to migrate, you can temporarily suppress deprecation warnings:
+```python
+# In crawl4ai/config.py
+SHOW_DEPRECATION_WARNINGS = False
+```
diff --git a/main.py b/main.py
index 41788d61..ee5f7fc6 100644
--- a/main.py
+++ b/main.py
@@ -25,7 +25,7 @@ import logging
 from enum import Enum
 from dataclasses import dataclass
 import json
-from crawl4ai import AsyncWebCrawler, CrawlResult
+from crawl4ai import AsyncWebCrawler, CrawlResult, CacheMode
 from crawl4ai.extraction_strategy import (
     LLMExtractionStrategy,
     CosineStrategy,
@@ -66,6 +66,7 @@ class CrawlRequest(BaseModel):
     magic: bool = False
     extra: Optional[Dict[str, Any]] = {}
     session_id: Optional[str] = None
+    cache_mode: Optional[CacheMode] = None
 
 @dataclass
 class TaskInfo:
@@ -329,7 +330,7 @@ app.mount("/pages", StaticFiles(directory=__location__ + "/pages"), name="pages"
 
 # API token security
 security = HTTPBearer()
-CRAWL4AI_API_TOKEN = os.getenv("CRAWL4AI_API_TOKEN")
+CRAWL4AI_API_TOKEN = os.getenv("CRAWL4AI_API_TOKEN") or "test_api_code"
 
 async def verify_token(credentials: HTTPAuthorizationCredentials = Security(security)):
     if not CRAWL4AI_API_TOKEN:
@@ -419,6 +420,47 @@ async def crawl_sync(request: CrawlRequest) -> Dict[str, Any]:
     # If we get here, task didn't complete within timeout
     raise HTTPException(status_code=408, detail="Task timed out")
 
+@app.post("/crawl_direct", dependencies=[Depends(verify_token)])
+async def crawl_direct(request: CrawlRequest) -> Dict[str, Any]:
+    try:
+        crawler = await crawler_service.crawler_pool.acquire(**request.crawler_params)
+        extraction_strategy = crawler_service._create_extraction_strategy(request.extraction_config)
+        
+        try:
+            if isinstance(request.urls, list):
+                results = await crawler.arun_many(
+                    urls=[str(url) for url in request.urls],
+                    extraction_strategy=extraction_strategy,
+                    js_code=request.js_code,
+                    wait_for=request.wait_for,
+                    css_selector=request.css_selector,
+                    screenshot=request.screenshot,
+                    magic=request.magic,
+                    cache_mode=request.cache_mode,
+                    session_id=request.session_id,
+                    **request.extra,
+                )
+                return {"results": [result.dict() for result in results]}
+            else:
+                result = await crawler.arun(
+                    url=str(request.urls),
+                    extraction_strategy=extraction_strategy,
+                    js_code=request.js_code,
+                    wait_for=request.wait_for,
+                    css_selector=request.css_selector,
+                    screenshot=request.screenshot,
+                    magic=request.magic,
+                    cache_mode=request.cache_mode,
+                    session_id=request.session_id,
+                    **request.extra,
+                )
+                return {"result": result.dict()}
+        finally:
+            await crawler_service.crawler_pool.release(crawler)
+    except Exception as e:
+        logger.error(f"Error in direct crawl: {str(e)}")
+        raise HTTPException(status_code=500, detail=str(e))
+    
 @app.get("/health")
 async def health_check():
     available_slots = await crawler_service.resource_monitor.get_available_slots()
diff --git a/mkdocs.yml b/mkdocs.yml
index b09cb9eb..1b26b9df 100644
--- a/mkdocs.yml
+++ b/mkdocs.yml
@@ -17,6 +17,7 @@ nav:
     - 'Browser Configuration': 'basic/browser-config.md'
     - 'Page Interaction': 'basic/page-interaction.md'
     - 'Content Selection': 'basic/content-selection.md'
+    - 'Cache Modes': 'basic/cache-modes.md'
 
   - Advanced:
     - 'Content Processing': 'advanced/content-processing.md'

From f9fe6f89feafeba175dc35da64ca5f6883839473 Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Sun, 17 Nov 2024 18:09:33 +0800
Subject: [PATCH 041/115] feat(database): implement version management and
 migration checks during initialization

---
 crawl4ai/async_database.py       | 39 +++++++++++++++++++++++++--
 crawl4ai/version_manager.py      | 30 +++++++++++++++++++++
 docs/md_v2/basic/installation.md | 45 ++++++++++++++++++++++++++++++++
 setup.py                         |  2 +-
 4 files changed, 113 insertions(+), 3 deletions(-)
 create mode 100644 crawl4ai/version_manager.py

diff --git a/crawl4ai/async_database.py b/crawl4ai/async_database.py
index f97d8131..7809dfe1 100644
--- a/crawl4ai/async_database.py
+++ b/crawl4ai/async_database.py
@@ -11,6 +11,7 @@ from .models import CrawlResult
 import xxhash
 import aiofiles
 from .config import NEED_MIGRATION
+from .version_manager import VersionManager
 # Set up logging
 logging.basicConfig(level=logging.INFO)
 logger = logging.getLogger(__name__)
@@ -28,22 +29,49 @@ class AsyncDatabaseManager:
         self.connection_pool: Dict[int, aiosqlite.Connection] = {}
         self.pool_lock = asyncio.Lock()
         self.connection_semaphore = asyncio.Semaphore(pool_size)
+        self._initialized = False  
+        self.version_manager = VersionManager()
+        
         
     async def initialize(self):
         """Initialize the database and connection pool"""
         try:
             logger.info("Initializing database...")
+            # Ensure the database file exists
+            os.makedirs(os.path.dirname(self.db_path), exist_ok=True)
+            
+            # Check if version update is needed
+            needs_update = self.version_manager.needs_update()
+            
+            # Always ensure base table exists
             await self.ainit_db()
-            if NEED_MIGRATION:
+            
+            # Verify the table exists
+            async def verify_table(db):
+                async with db.execute(
+                    "SELECT name FROM sqlite_master WHERE type='table' AND name='crawled_data'"
+                ) as cursor:
+                    result = await cursor.fetchone()
+                    if not result:
+                        raise Exception("crawled_data table was not created")
+                    
+            await self.execute_with_retry(verify_table)
+            
+            # If version changed or fresh install, run updates
+            if needs_update:
+                logger.info("New version detected, running updates...")
                 await self.update_db_schema()
                 from .migrations import run_migration  # Import here to avoid circular imports
                 await run_migration()
-                logger.info("Database initialization and migration completed successfully")
+                self.version_manager.update_version()  # Update stored version after successful migration
+                logger.info("Version update completed successfully")
             else:
                 logger.info("Database initialization completed successfully")
+                
         except Exception as e:
             logger.error(f"Database initialization error: {e}")
             logger.info("Database will be initialized on first use")
+            raise
             
     async def cleanup(self):
         """Cleanup connections when shutting down"""
@@ -55,6 +83,12 @@ class AsyncDatabaseManager:
     @asynccontextmanager
     async def get_connection(self):
         """Connection pool manager"""
+        if not self._initialized:
+            async with self.pool_lock:  # Prevent multiple simultaneous initializations
+                if not self._initialized:  # Double-check after acquiring lock
+                    await self.initialize()
+                    self._initialized = True
+
         async with self.connection_semaphore:
             task_id = id(asyncio.current_task())
             try:
@@ -79,6 +113,7 @@ class AsyncDatabaseManager:
                         await self.connection_pool[task_id].close()
                         del self.connection_pool[task_id]
 
+
     async def execute_with_retry(self, operation, *args):
         """Execute database operations with retry logic"""
         for attempt in range(self.max_retries):
diff --git a/crawl4ai/version_manager.py b/crawl4ai/version_manager.py
new file mode 100644
index 00000000..07e0c0e9
--- /dev/null
+++ b/crawl4ai/version_manager.py
@@ -0,0 +1,30 @@
+# version_manager.py
+import os
+from pathlib import Path
+from packaging import version
+from . import __version__
+
+class VersionManager:
+    def __init__(self):
+        self.home_dir = Path.home() / ".crawl4ai"
+        self.version_file = self.home_dir / "version.txt"
+        
+    def get_installed_version(self):
+        """Get the version recorded in home directory"""
+        if not self.version_file.exists():
+            return None
+        try:
+            return version.parse(self.version_file.read_text().strip())
+        except:
+            return None
+            
+    def update_version(self):
+        """Update the version file to current library version"""
+        self.version_file.write_text(__version__)
+        
+    def needs_update(self):
+        """Check if database needs update based on version"""
+        installed = self.get_installed_version()
+        current = version.parse(__version__)
+        return installed is None or installed < current
+
diff --git a/docs/md_v2/basic/installation.md b/docs/md_v2/basic/installation.md
index a4a60857..de8aeafa 100644
--- a/docs/md_v2/basic/installation.md
+++ b/docs/md_v2/basic/installation.md
@@ -58,6 +58,51 @@ crawl4ai-download-models
 
 This is optional but will boost the performance and speed of the crawler. You only need to do this once after installation.
 
+## Playwright Installation Note for Ubuntu
+
+If you encounter issues with Playwright installation on Ubuntu, you may need to install additional dependencies:
+
+```bash
+sudo apt-get install -y \
+    libwoff1 \
+    libopus0 \
+    libwebp7 \
+    libwebpdemux2 \
+    libenchant-2-2 \
+    libgudev-1.0-0 \
+    libsecret-1-0 \
+    libhyphen0 \
+    libgdk-pixbuf2.0-0 \
+    libegl1 \
+    libnotify4 \
+    libxslt1.1 \
+    libevent-2.1-7 \
+    libgles2 \
+    libxcomposite1 \
+    libatk1.0-0 \
+    libatk-bridge2.0-0 \
+    libepoxy0 \
+    libgtk-3-0 \
+    libharfbuzz-icu0 \
+    libgstreamer-gl1.0-0 \
+    libgstreamer-plugins-bad1.0-0 \
+    gstreamer1.0-plugins-good \
+    gstreamer1.0-plugins-bad \
+    libxt6 \
+    libxaw7 \
+    xvfb \
+    fonts-noto-color-emoji \
+    libfontconfig \
+    libfreetype6 \
+    xfonts-cyrillic \
+    xfonts-scalable \
+    fonts-liberation \
+    fonts-ipafont-gothic \
+    fonts-wqy-zenhei \
+    fonts-tlwg-loma-otf \
+    fonts-freefont-ttf
+```
+
 ## Option 2: Using Docker (Coming Soon)
 
 Docker support for Crawl4AI is currently in progress and will be available soon. This will allow you to run Crawl4AI in a containerized environment, ensuring consistency across different systems.
diff --git a/setup.py b/setup.py
index d8ad2cd3..bbc03026 100644
--- a/setup.py
+++ b/setup.py
@@ -70,7 +70,7 @@ class PostInstallCommand(install):
     def run(self):
         install.run(self)
         install_playwright()
-        run_migration()
+        # run_migration()
 
 setup(
     name="Crawl4AI",

From a59c107b237ccdab1036f08123421f2645a628f3 Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Sun, 17 Nov 2024 18:42:43 +0800
Subject: [PATCH 042/115] Update changelog for 0.3.74

---
 CHANGELOG.md | 220 ++++++++++++++++++++++++++++++++++++++++++++++-----
 1 file changed, 201 insertions(+), 19 deletions(-)

diff --git a/CHANGELOG.md b/CHANGELOG.md
index e82fa6a2..8e5cc91a 100644
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -1,7 +1,194 @@
 # Changelog
 
+## [0.3.74] November 17, 2024
 
-## Version 0.3.74, Major Changes
+This changelog details the updates and changes introduced in Crawl4AI version 0.3.74. It's designed to inform developers about new features, modifications to existing components, removals, and other important information.
+
+### 1. File Download Processing
+
+- Users can now specify download folders using the `downloads_path` parameter in the `AsyncWebCrawler` constructor or the `arun` method. If not specified, downloads are saved to a "downloads" folder within the `.crawl4ai` directory.
+- File download tracking is integrated into the `CrawlResult` object.  Successfully downloaded files are listed in the `downloaded_files` attribute, providing their paths.
+- Added `accept_downloads` parameter to the crawler strategies (defaults to `False`). When set to `True`, you can use JS code to trigger a download and the `wait_for` parameter to give the download time to start.
+
+**Example:**
+
+```python
+import asyncio
+import os
+from pathlib import Path
+from crawl4ai import AsyncWebCrawler
+
+async def download_example():
+    downloads_path = os.path.join(Path.home(), ".crawl4ai", "downloads")
+    os.makedirs(downloads_path, exist_ok=True)
+
+    async with AsyncWebCrawler(
+        accept_downloads=True, 
+        downloads_path=downloads_path, 
+        verbose=True
+    ) as crawler:
+        result = await crawler.arun(
+            url="https://www.python.org/downloads/",
+            js_code="""
+                const downloadLink = document.querySelector('a[href$=".exe"]');
+                if (downloadLink) { downloadLink.click(); }
+            """,
+            wait_for=5 # To ensure download has started
+        )
+
+        if result.downloaded_files:
+            print("Downloaded files:")
+            for file in result.downloaded_files:
+                print(f"- {file}")
+
+asyncio.run(download_example())
+
+```
+
+### 2. Refined Content Filtering
+
+- Introduced the `RelevantContentFilter` strategy (and its implementation `BM25ContentFilter`) for extracting relevant content from web pages, replacing Fit Markdown and other content cleaning strategies. This new strategy leverages the BM25 algorithm to identify chunks of text relevant to the page's title, description, keywords, or a user-provided query.
+- The `fit_markdown` flag in the content scraper is used to filter content based on title, meta description, and keywords.
+
+**Example:**
+
+```python
+from crawl4ai import AsyncWebCrawler
+from crawl4ai.content_filter_strategy import BM25ContentFilter
+
+async def filter_content(url, query):
+    async with AsyncWebCrawler() as crawler:
+        content_filter = BM25ContentFilter(user_query=query)
+        result = await crawler.arun(url=url, extraction_strategy=content_filter, fit_markdown=True)
+        print(result.extracted_content)  # Or result.fit_markdown for the markdown version
+        print(result.fit_html)  # HTML containing only the filtered content
+
+asyncio.run(filter_content("https://en.wikipedia.org/wiki/Apple", "fruit nutrition health"))
+```
+
+### 3. Raw HTML and Local File Support
+
+- Added support for crawling local files and raw HTML content directly.
+- Use the `file://` prefix for local file paths.
+- Use the `raw:` prefix for raw HTML strings.
+
+**Example:**
+
+```python
+async def crawl_local_or_raw(crawler, content, content_type):
+    prefix = "file://" if content_type == "local" else "raw:"
+    url = f"{prefix}{content}"
+    result = await crawler.arun(url=url)
+    if result.success:
+        print(f"Markdown Content from {content_type.title()} Source:")
+        print(result.markdown)
+
+# Example usage with local file and raw HTML
+async def main():
+    async with AsyncWebCrawler() as crawler:
+        # Local File
+        await crawl_local_or_raw(
+            crawler, os.path.abspath('tests/async/sample_wikipedia.html'), "local"
+        )
+        # Raw HTML
+        await crawl_local_or_raw(crawler, "<h1>Raw Test</h1><p>This is raw HTML.</p>", "raw")
+        
+
+asyncio.run(main())
+```
+
+### 4. Browser Management
+
+- New asynchronous crawler strategy implemented using Playwright.
+- `ManagedBrowser` class introduced for improved browser session handling, offering features like persistent browser sessions between requests (using the `session_id` parameter) and browser process monitoring.
+- Updated to tf-playwright-stealth for enhanced stealth capabilities.
+- Added `use_managed_browser`, `use_persistent_context`, and `chrome_channel` parameters to AsyncPlaywrightCrawlerStrategy.
+
+
+**Example:**
+```python
+async def browser_management_demo():
+    user_data_dir = os.path.join(Path.home(), ".crawl4ai", "user-data-dir")
+    os.makedirs(user_data_dir, exist_ok=True)  # Ensure directory exists
+    async with AsyncWebCrawler(
+        use_managed_browser=True,
+        user_data_dir=user_data_dir,
+        use_persistent_context=True,
+        verbose=True
+    ) as crawler:
+        result1 = await crawler.arun(
+            url="https://example.com", session_id="my_session"
+        )
+        result2 = await crawler.arun(
+            url="https://example.com/anotherpage", session_id="my_session"
+        )
+
+asyncio.run(browser_management_demo())
+```
+
+
+### 5. API Server & Cache Improvements
+
+- Added CORS support to API server.
+- Implemented static file serving.
+- Enhanced root redirect functionality.
+- Cache database updated to store response headers and downloaded files information. It utilizes a file system approach to manage large content efficiently.
+- New, more efficient caching database built using xxhash and file system approach.
+- Introduced `CacheMode` enum (`ENABLED`, `DISABLED`, `READ_ONLY`, `WRITE_ONLY`, `BYPASS`) and `always_bypass_cache` parameter in AsyncWebCrawler for fine-grained cache control. These replace `bypass_cache`, `disable_cache`, `no_cache_read`, `no_cache_write`, and `always_by_pass_cache`.
+
+
+### 🗑️ Removals
+
+- Removed deprecated: `crawl4ai/content_cleaning_strategy.py`.
+- Removed internal class ContentCleaningStrategy
+- Legacy cache control flags `bypass_cache`, `disable_cache`, `no_cache_read`, `no_cache_write`, and `always_by_pass_cache` are deprecated and slated for removal; they still work for now but have been superseded by `cache_mode` (and `always_bypass_cache`).
+
+
+### ⚙️ Other Changes
+
+- Moved version file to `crawl4ai/__version__.py`.
+- Added `crawl4ai/cache_context.py`.
+- Added `crawl4ai/version_manager.py`.
+- Added `crawl4ai/migrations.py`.
+- Added `crawl4ai-migrate` entry point.
+- Added config `NEED_MIGRATION` and `SHOW_DEPRECATION_WARNINGS`.
+- API server now requires an API token for authentication, configurable with the `CRAWL4AI_API_TOKEN` environment variable.  This enhances API security.
+- Added synchronous crawl endpoint `/crawl_sync` for immediate result retrieval, and direct crawl endpoint `/crawl_direct` bypassing the task queue.
+
+
+### ⚠️ Deprecation Notices
+
+- The synchronous version of `WebCrawler` is being phased out. While still available via `crawl4ai[sync]`, it will eventually be removed. Transition to `AsyncWebCrawler` is strongly recommended. Boolean cache control flags in `arun` are also deprecated; migrate to the `cache_mode` parameter. See the CacheMode migration example below for correct usage.
+
+
+### 🐛 Bug Fixes
+
+- Resolved issue with browser context closing unexpectedly in Docker. This significantly improves stability, particularly within containerized environments. 
+- Fixed memory leaks associated with incorrect asynchronous cleanup by removing the `__del__` method and ensuring the browser context is closed explicitly using context managers.
+- Improved error handling in `WebScrapingStrategy`. More detailed error messages and suggestions for debugging will minimize frustration when running into unexpected issues.
+- Fixed issue with incorrect text parsing in specific HTML structures.
+
+
+### Example of migrating to the new CacheMode:
+
+**Old way:**
+
+```python
+crawler = AsyncWebCrawler(always_by_pass_cache=True)
+result = await crawler.arun(url="https://example.com", bypass_cache=True)
+```
+
+**New way:**
+
+```python
+from crawl4ai import CacheMode
+
+crawler = AsyncWebCrawler(always_bypass_cache=True)
+result = await crawler.arun(url="https://example.com", cache_mode=CacheMode.BYPASS)
+```
+
+
+## [0.3.74] - November 13, 2024
 
 1. **File Download Processing** (Nov 14, 2024)
    - Added capability for users to specify download folders
@@ -30,14 +217,9 @@
    - Implemented static file serving
    - Enhanced root redirect functionality
 
-# [0.3.74] November 14, 2024
-
-- In this commit, the library is updated to process file downloads. Users can now specify a download folder and trigger the download process via JavaScript or other means, with all files being saved. The list of downloaded files will also be added to the crowd result object.
-- Another thing this commit introduces is the concept of the Relevance Content Filter. This is an improvement over Fit Markdown. This class of strategies aims to extract the main content from a given page - the part that really matters and is useful to be processed. One strategy has been created using the BM25 algorithm, which finds chunks of text from the web page relevant to its title, descriptions, and keywords, or supports a given user query and matches them. The result is then returned to the main engine to be converted to Markdown. Plans include adding approaches using language models as well.
-- The cache database was updated to hold information about response headers and downloaded files.
 
 
-# Changelog - November 13, 2024
+## [0.3.731] - November 13, 2024
 
 ### Added
 - Support for raw HTML and local file crawling via URL prefixes ('raw:', 'file://')
@@ -137,7 +319,7 @@
 - Modified database connection management approach
 - Updated API response structure for better consistency
 
-## Migration Guide
+### Migration Guide
 When upgrading to v0.3.73, be aware of the following changes:
 
 1. Docker Deployment:
@@ -159,7 +341,7 @@ When upgrading to v0.3.73, be aware of the following changes:
    - Follow recommended fixes for any identified problems
 
 
-## [2024-11-04 - 13:21:42] Comprehensive Update of Crawl4AI Features and Dependencies
+## [v0.3.73] - 2024-11-04
 This commit introduces several key enhancements, including improved error handling and robust database operations in `async_database.py`, which now features a connection pool and retry logic for better reliability. Updates to the README.md provide clearer instructions and a better user experience with links to documentation sections. The `.gitignore` file has been refined to include additional directories, while the async web crawler now utilizes a managed browser for more efficient crawling. Furthermore, multiple dependency updates and introduction of the `CustomHTML2Text` class enhance text extraction capabilities.
 
 ## [v0.3.73] - 2024-10-24
@@ -405,43 +587,43 @@ These updates aim to provide more flexibility in text processing, improve perfor
 - Allows retrieval of content after a specified delay, useful for dynamically loaded content.
 - **How to use**: Access `result.get_delayed_content(delay_in_seconds)` after crawling.
 
-## Improvements and Optimizations
+### Improvements and Optimizations
 
-### 1. AsyncWebCrawler Enhancements
+#### 1. AsyncWebCrawler Enhancements
 - **Flexible Initialization**: Now accepts arbitrary keyword arguments, passed directly to the crawler strategy.
 - Allows for more customized setups.
 
-### 2. Image Processing Optimization
+#### 2. Image Processing Optimization
 - Enhanced image handling in WebScrapingStrategy.
 - Added filtering for small, invisible, or irrelevant images.
 - Improved image scoring system for better content relevance.
 - Implemented JavaScript-based image dimension updating for more accurate representation.
 
-### 3. Database Schema Auto-updates
+#### 3. Database Schema Auto-updates
 - Automatic database schema updates ensure compatibility with the latest version.
 
-### 4. Enhanced Error Handling and Logging
+#### 4. Enhanced Error Handling and Logging
 - Improved error messages and logging for easier debugging.
 
-### 5. Content Extraction Refinements
+#### 5. Content Extraction Refinements
 - Refined HTML sanitization process.
 - Improved handling of base64 encoded images.
 - Enhanced Markdown conversion process.
 - Optimized content extraction algorithms.
 
-### 6. Utility Function Enhancements
+#### 6. Utility Function Enhancements
 - `perform_completion_with_backoff` function now supports additional arguments for more customized API calls to LLM providers.
 
-## Bug Fixes
+### Bug Fixes
 - Fixed an issue where image tags were being prematurely removed during content extraction.
 
-## Examples and Documentation
+### Examples and Documentation
 - Updated `quickstart_async.py` with examples of:
   - Using custom headers in LLM extraction.
   - Different LLM provider usage (OpenAI, Hugging Face, Ollama).
   - Custom browser type usage.
 
-## Developer Notes
+### Developer Notes
 - Refactored code for better maintainability, flexibility, and performance.
 - Enhanced type hinting throughout the codebase for improved development experience.
 - Expanded error handling for more robust operation.

From df63a4060673b2d5647abdce07810e29cf20e739 Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Sun, 17 Nov 2024 19:44:45 +0800
Subject: [PATCH 043/115] feat(docs): update examples and documentation to
 replace bypass_cache with cache_mode for improved clarity

---
 README.md                                     |  24 ++-
 crawl4ai/async_webcrawler.py                  |  37 +++--
 crawl4ai/content_scrapping_strategy.py        |  15 +-
 docs/examples/v0.3.74.overview.py             |   2 +-
 docs/md_v2/advanced/managed_browser.md        |  84 ++++++++++
 .../advanced/session-management-advanced.md   |  10 +-
 docs/md_v2/advanced/session-management.md     |   2 +-
 docs/md_v2/api/arun.md                        |  42 +++--
 docs/md_v2/api/crawl-result.md                |   1 +
 docs/md_v2/api/parameters.md                  |   3 +-
 docs/md_v2/basic/content_filtering.md         |  84 ++++++++++
 docs/md_v2/basic/file-download.md             | 148 ++++++++++++++++++
 docs/md_v2/basic/quickstart.md                |  22 +--
 docs/md_v2/basic/simple-crawling.md           |  10 +-
 .../episode_11_2_Extraction_Strategies_LLM.md |   4 +-
 ...isode_11_3_Extraction_Strategies_Cosine.md |   4 +-
 docs/md_v2/tutorial/tutorial.md               |  10 +-
 17 files changed, 422 insertions(+), 80 deletions(-)
 create mode 100644 docs/md_v2/advanced/managed_browser.md
 create mode 100644 docs/md_v2/basic/content_filtering.md
 create mode 100644 docs/md_v2/basic/file-download.md

diff --git a/README.md b/README.md
index 069c02b8..9c3796cd 100644
--- a/README.md
+++ b/README.md
@@ -11,21 +11,19 @@
 
 Crawl4AI simplifies asynchronous web crawling and data extraction, making it accessible for large language models (LLMs) and AI applications. 🆓🌐
 
-## 🌟 Meet the Crawl4AI Assistant: Your Copilot for Crawling
+## New in 0.3.74 ✨
 
-Use the [Crawl4AI GPT Assistant](https://tinyurl.com/crawl4ai-gpt) as your AI-powered copilot! With this assistant, you can:
+- 🚀 **Blazing Fast Scraping:**  The scraping process is now significantly faster, often completing in under 100 milliseconds (excluding web fetch time)!
+- 📥 **Download Mastery:** Control downloads, specify folders, and track files within the `CrawlResult` object.
+- 🔎 **Relevance Filtering:** Extract the most important content with the new `RelevantContentFilter` and BM25 algorithm.  Control filtering with the `fit_markdown` flag.
+- 🗂️ **Local & Raw HTML:** Crawl local files (`file://`) and raw HTML strings (`raw:`) directly.
+- 🤖 **Browser Boss:** Manage browser sessions with persistent contexts, process monitoring, and tf-playwright-stealth integration.  Configure using `use_managed_browser`, `user_data_dir`, and `use_persistent_context` parameters.
+- ☁️ **API & Cache Boost:** CORS support, static file serving, and a new filesystem-based cache for blazing-fast performance. Fine-tune caching with the `CacheMode` enum (ENABLED, DISABLED, READ_ONLY, WRITE_ONLY, BYPASS) and the `always_bypass_cache` parameter.
+- 🔒 **API Security:** Protect your API server with token-based authentication using the `CRAWL4AI_API_TOKEN` environment variable.
+- 🔄 **Synchronous & Direct Crawling:** Get immediate results with `/crawl_sync` or bypass the task queue with `/crawl_direct`.
+- 🛠️ **Database Migration:**  A new `crawl4ai-migrate` command ensures smooth upgrades and data integrity between versions.
+- 🐛 **Squashed Bugs:**  Fixed browser context issues in Docker, memory leaks, enhanced error handling, and improved HTML parsing.
 
-- 🧑‍💻 Generate code for complex crawling and extraction tasks
-- 💡 Get tailored support and examples
-- 📘 Learn Crawl4AI faster with step-by-step guidance
-
-## New in 0.3.73 ✨
-
-- 🐳 Docker Ready: Full API server with seamless deployment & scaling
-- 🎯 Browser Takeover: Use your own browser with cookies & history intact (CDP support)
-- 📝 Mockdown+: Enhanced tag preservation & content extraction
-- ⚡️ Parallel Power: Supercharged multi-URL crawling performance
-- 🌟 And many more exciting updates...
 
 ## Try it Now!
 
diff --git a/crawl4ai/async_webcrawler.py b/crawl4ai/async_webcrawler.py
index d554576d..d22e3b1f 100644
--- a/crawl4ai/async_webcrawler.py
+++ b/crawl4ai/async_webcrawler.py
@@ -10,14 +10,14 @@ import asyncio
 from .models import CrawlResult
 from .async_database import async_db_manager
 from .chunking_strategy import *
+from .content_filter_strategy import *
 from .extraction_strategy import *
 from .async_crawler_strategy import AsyncCrawlerStrategy, AsyncPlaywrightCrawlerStrategy, AsyncCrawlResponse
 from .cache_context import CacheMode, CacheContext, _legacy_to_cache_mode
 from .content_scrapping_strategy import WebScrapingStrategy
 from .config import (
     MIN_WORD_THRESHOLD, 
-    IMAGE_DESCRIPTION_MIN_WORD_THRESHOLD,
-    SHOW_DEPRECATION_WARNINGS  # New import
+    IMAGE_DESCRIPTION_MIN_WORD_THRESHOLD
 )
 from .utils import (
     sanitize_input_encode,
@@ -49,7 +49,7 @@ class AsyncWebCrawler:
         )
     
     To disable deprecation warnings:
-        Set SHOW_DEPRECATION_WARNINGS = False in config.py
+        Pass warning=False to suppress the warning.
     """
 
     def __init__(
@@ -85,11 +85,11 @@ class AsyncWebCrawler:
         
         # Handle deprecated parameter
         if always_by_pass_cache is not None:
-            if SHOW_DEPRECATION_WARNINGS:
+            if kwargs.get("warning", True):
                 warnings.warn(
                     "'always_by_pass_cache' is deprecated and will be removed in version X.X.X. "
                     "Use 'always_bypass_cache' instead. "
-                    "Set SHOW_DEPRECATION_WARNINGS=False in config.py to suppress this warning.",
+                    "Pass warning=False to suppress this warning.",
                     DeprecationWarning,
                     stacklevel=2
                 )
@@ -126,6 +126,7 @@ class AsyncWebCrawler:
         word_count_threshold=MIN_WORD_THRESHOLD,
         extraction_strategy: ExtractionStrategy = None,
         chunking_strategy: ChunkingStrategy = RegexChunking(),
+        content_filter: RelevantContentFilter = None,
         cache_mode: Optional[CacheMode] = None,
         # Deprecated parameters
         bypass_cache: bool = False,
@@ -172,7 +173,7 @@ class AsyncWebCrawler:
         try:
             # Handle deprecated parameters
             if any([bypass_cache, disable_cache, no_cache_read, no_cache_write]):
-                if SHOW_DEPRECATION_WARNINGS:
+                if kwargs.get("warning", True):
                     warnings.warn(
                         "Cache control boolean flags are deprecated and will be removed in version X.X.X. "
                         "Use 'cache_mode' parameter instead. Examples:\n"
@@ -180,7 +181,7 @@ class AsyncWebCrawler:
                         "- For disable_cache=True, use cache_mode=CacheMode.DISABLED\n"
                         "- For no_cache_read=True, use cache_mode=CacheMode.WRITE_ONLY\n"
                         "- For no_cache_write=True, use cache_mode=CacheMode.READ_ONLY\n"
-                        "Set SHOW_DEPRECATION_WARNINGS=False in config.py to suppress this warning.",
+                        "Pass warning=False to suppress this warning.",
                         DeprecationWarning,
                         stacklevel=2
                     )
@@ -257,6 +258,7 @@ class AsyncWebCrawler:
                 word_count_threshold=word_count_threshold,
                 extraction_strategy=extraction_strategy,
                 chunking_strategy=chunking_strategy,
+                content_filter=content_filter,
                 css_selector=css_selector,
                 screenshot=screenshot_data,
                 verbose=verbose,
@@ -308,6 +310,7 @@ class AsyncWebCrawler:
         word_count_threshold=MIN_WORD_THRESHOLD,
         extraction_strategy: ExtractionStrategy = None,
         chunking_strategy: ChunkingStrategy = RegexChunking(),
+        content_filter: RelevantContentFilter = None,
         cache_mode: Optional[CacheMode] = None,
         # Deprecated parameters
         bypass_cache: bool = False,
@@ -335,14 +338,15 @@ class AsyncWebCrawler:
         Returns:
             List[CrawlResult]: Results for each URL
         """
-        if bypass_cache and SHOW_DEPRECATION_WARNINGS:
-            warnings.warn(
-                "'bypass_cache' is deprecated and will be removed in version X.X.X. "
-                "Use 'cache_mode=CacheMode.BYPASS' instead. "
-                "Set SHOW_DEPRECATION_WARNINGS=False in config.py to suppress this warning.",
-                DeprecationWarning,
-                stacklevel=2
-            )
+        if bypass_cache:
+            if kwargs.get("warning", True):
+                warnings.warn(
+                    "'bypass_cache' is deprecated and will be removed in version X.X.X. "
+                    "Use 'cache_mode=CacheMode.BYPASS' instead. "
+                    "Pass warning=False to suppress this warning.",
+                    DeprecationWarning,
+                    stacklevel=2
+                )
             if cache_mode is None:
                 cache_mode = CacheMode.BYPASS
 
@@ -356,6 +360,7 @@ class AsyncWebCrawler:
                     word_count_threshold=word_count_threshold,
                     extraction_strategy=extraction_strategy,
                     chunking_strategy=chunking_strategy,
+                    content_filter=content_filter,
                     cache_mode=cache_mode,
                     css_selector=css_selector,
                     screenshot=screenshot,
@@ -377,6 +382,7 @@ class AsyncWebCrawler:
         word_count_threshold: int,
         extraction_strategy: ExtractionStrategy,
         chunking_strategy: ChunkingStrategy,
+        content_filter: RelevantContentFilter,
         css_selector: str,
         screenshot: str,
         verbose: bool,
@@ -397,6 +403,7 @@ class AsyncWebCrawler:
                 image_description_min_word_threshold=kwargs.get(
                     "image_description_min_word_threshold", IMAGE_DESCRIPTION_MIN_WORD_THRESHOLD
                 ),
+                content_filter = content_filter,
                 **kwargs,
             )
 
diff --git a/crawl4ai/content_scrapping_strategy.py b/crawl4ai/content_scrapping_strategy.py
index 9c81638c..d16b0680 100644
--- a/crawl4ai/content_scrapping_strategy.py
+++ b/crawl4ai/content_scrapping_strategy.py
@@ -532,14 +532,13 @@ class WebScrapingStrategy(ContentScrapingStrategy):
             
         fit_markdown = "Set flag 'fit_markdown' to True to get cleaned HTML content."
         fit_html = "Set flag 'fit_markdown' to True to get cleaned HTML content."
-        if kwargs.get('fit_markdown', False):
-            # cleaner = ContentCleaningStrategy()
-            # fit_html = cleaner.clean(cleaned_html)
-            # fit_markdown = h.handle(fit_html)
-            content_filter = BM25ContentFilter(
-                user_query= kwargs.get('fit_markdown_user_query', None),
-                bm25_threshold= kwargs.get('fit_markdown_bm25_threshold', 1.0)
-            )
+        if kwargs.get('content_filter', None) or kwargs.get('fit_markdown', False):
+            content_filter = kwargs.get('content_filter', None)
+            if not content_filter:
+                content_filter = BM25ContentFilter(
+                    user_query= kwargs.get('fit_markdown_user_query', None),
+                    bm25_threshold= kwargs.get('fit_markdown_bm25_threshold', 1.0)
+                )
             fit_html = content_filter.filter_content(html)
             fit_html = '\n'.join('<div>{}</div>'.format(s) for s in fit_html)
             fit_markdown = h.handle(fit_html)
diff --git a/docs/examples/v0.3.74.overview.py b/docs/examples/v0.3.74.overview.py
index 579d05dd..ec3a7d73 100644
--- a/docs/examples/v0.3.74.overview.py
+++ b/docs/examples/v0.3.74.overview.py
@@ -56,7 +56,7 @@ async def content_filtering_example():
         
         result = await crawler.arun(
             url="https://openai.com/blog",
-            extraction_strategy=content_filter
+            content_filter=content_filter
         )
         
         print(f"Filtered content: {result.extracted_content}")
diff --git a/docs/md_v2/advanced/managed_browser.md b/docs/md_v2/advanced/managed_browser.md
new file mode 100644
index 00000000..80d6fc1a
--- /dev/null
+++ b/docs/md_v2/advanced/managed_browser.md
@@ -0,0 +1,84 @@
+# Content Filtering in Crawl4AI
+
+This guide explains how to use content filtering strategies in Crawl4AI to extract the most relevant information from crawled web pages.  You'll learn how to use the built-in `BM25ContentFilter` and how to create your own custom content filtering strategies.
+
+## Relevance Content Filter
+
+The `RelevantContentFilter` is an abstract class that provides a common interface for content filtering strategies. Specific filtering algorithms, like `BM25ContentFilter`, inherit from this class and implement the `filter_content` method. This method takes the HTML content as input and returns a list of filtered text blocks.
+
+## BM25 Algorithm
+
+The `BM25ContentFilter` uses the BM25 algorithm, a ranking function used in information retrieval to estimate the relevance of documents to a given search query. In Crawl4AI, this algorithm helps to identify and extract text chunks that are most relevant to the page's metadata or a user-specified query.
+
+### Usage
+
+To use the `BM25ContentFilter`, initialize it and then pass it as the `content_filter` parameter to the `arun` method of the crawler.
+
+```python
+from crawl4ai import AsyncWebCrawler
+from crawl4ai.content_filter_strategy import BM25ContentFilter
+
+async def filter_content(url, query=None):
+    async with AsyncWebCrawler() as crawler:
+        content_filter = BM25ContentFilter(user_query=query)
+        result = await crawler.arun(url=url, content_filter=content_filter, fit_markdown=True) # Set fit_markdown flag to True to trigger BM25 filtering
+        if result.success:
+            print(f"Filtered Content (JSON):\n{result.extracted_content}")
+            print(f"\nFiltered Markdown:\n{result.fit_markdown}") # New field in CrawlResult object
+            print(f"\nFiltered HTML:\n{result.fit_html}") # New field in CrawlResult object. Note that raw HTML may have tags re-organized due to internal parsing.
+        else:
+            print("Error:", result.error_message)
+
+# Example usage:
+asyncio.run(filter_content("https://en.wikipedia.org/wiki/Apple", "fruit nutrition health")) # with query
+asyncio.run(filter_content("https://en.wikipedia.org/wiki/Apple")) # without query, metadata will be used as the query.
+
+```
+
+### Parameters
+
+- **`user_query`**:  (Optional) A string representing the search query. If not provided, the filter extracts relevant metadata (title, description, keywords) from the page and uses that as the query.
+- **`bm25_threshold`**: (Optional, default 1.0)  A float value that controls the threshold for relevance.  Higher values result in stricter filtering, returning only the most relevant text chunks. Lower values result in more lenient filtering.
+
+
+## Fit Markdown Flag
+
+Setting the `fit_markdown` flag to `True` in the `arun` method activates the BM25 content filtering during the crawl. The `fit_markdown` parameter instructs the scraper to extract and clean the HTML, primarily to prepare for a Large Language Model that cannot process large amounts of data. Setting this flag not only improves the quality of the extracted content but also adds the filtered content to two new attributes in the returned  `CrawlResult` object: `fit_markdown` and `fit_html`.
+
+
+## Custom Content Filtering Strategies
+
+You can create your own custom filtering strategies by inheriting from the `RelevantContentFilter` class and implementing the `filter_content` method.  This allows you to tailor the filtering logic to your specific needs.
+
+```python
+from crawl4ai.content_filter_strategy import RelevantContentFilter
+from bs4 import BeautifulSoup, Tag
+from typing import List
+
+class MyCustomFilter(RelevantContentFilter):
+    def filter_content(self, html: str) -> List[str]:
+        soup = BeautifulSoup(html, 'lxml')
+        # Implement custom filtering logic here
+        # Example: extract all paragraphs within divs with class "article-body"
+        filtered_paragraphs = []
+        for tag in soup.select("div.article-body p"):
+            if isinstance(tag, Tag):
+                filtered_paragraphs.append(str(tag)) # Add the cleaned HTML element.  
+        return filtered_paragraphs
+
+
+
+async def custom_filter_demo(url: str):
+    async with AsyncWebCrawler() as crawler:
+        custom_filter = MyCustomFilter()
+        result = await crawler.arun(url, content_filter=custom_filter)
+        if result.success:
+            print(result.extracted_content)
+
+```
+
+This example demonstrates extracting paragraphs from a specific div class.  You can customize this logic to implement different filtering strategies, use regular expressions, analyze text density, or apply other relevant techniques.
+
+## Conclusion
+
+Content filtering strategies provide a powerful way to refine the output of your crawls. By using `BM25ContentFilter` or creating custom strategies, you can focus on the most pertinent information and improve the efficiency of your data processing pipeline.
diff --git a/docs/md_v2/advanced/session-management-advanced.md b/docs/md_v2/advanced/session-management-advanced.md
index f8c81da2..908828f7 100644
--- a/docs/md_v2/advanced/session-management-advanced.md
+++ b/docs/md_v2/advanced/session-management-advanced.md
@@ -30,7 +30,7 @@ Let's start with a basic example of session-based crawling:
 
 ```python
 import asyncio
-from crawl4ai import AsyncWebCrawler
+from crawl4ai import AsyncWebCrawler, CacheMode
 
 async def basic_session_crawl():
     async with AsyncWebCrawler(verbose=True) as crawler:
@@ -43,7 +43,7 @@ async def basic_session_crawl():
                 session_id=session_id,
                 js_code="document.querySelector('.load-more-button').click();" if page > 0 else None,
                 css_selector=".content-item",
-                bypass_cache=True
+                cache_mode=CacheMode.BYPASS
             )
             
             print(f"Page {page + 1}: Found {result.extracted_content.count('.content-item')} items")
@@ -102,7 +102,7 @@ async def advanced_session_crawl_with_hooks():
                 session_id=session_id,
                 css_selector="li.commit-item",
                 js_code=js_next_page if page > 0 else None,
-                bypass_cache=True,
+                cache_mode=CacheMode.BYPASS,
                 js_only=page > 0
             )
 
@@ -174,7 +174,7 @@ async def integrated_js_and_wait_crawl():
                 extraction_strategy=extraction_strategy,
                 js_code=js_next_page_and_wait if page > 0 else None,
                 js_only=page > 0,
-                bypass_cache=True
+                cache_mode=CacheMode.BYPASS
             )
 
             commits = json.loads(result.extracted_content)
@@ -241,7 +241,7 @@ async def wait_for_parameter_crawl():
                 js_code=js_next_page if page > 0 else None,
                 wait_for=wait_for if page > 0 else None,
                 js_only=page > 0,
-                bypass_cache=True
+                cache_mode=CacheMode.BYPASS
             )
 
             commits = json.loads(result.extracted_content)
diff --git a/docs/md_v2/advanced/session-management.md b/docs/md_v2/advanced/session-management.md
index c38ed852..eae4cf7b 100644
--- a/docs/md_v2/advanced/session-management.md
+++ b/docs/md_v2/advanced/session-management.md
@@ -75,7 +75,7 @@ async def crawl_dynamic_content():
                 js_code=js_next_page if page > 0 else None,
                 wait_for=wait_for if page > 0 else None,
                 js_only=page > 0,
-                bypass_cache=True
+                cache_mode=CacheMode.BYPASS
             )
 
             if result.success:
diff --git a/docs/md_v2/api/arun.md b/docs/md_v2/api/arun.md
index 9ef73aef..509991e5 100644
--- a/docs/md_v2/api/arun.md
+++ b/docs/md_v2/api/arun.md
@@ -8,11 +8,26 @@ The following parameters can be passed to the `arun()` method. They are organize
 await crawler.arun(
     url="https://example.com",   # Required: URL to crawl
     verbose=True,               # Enable detailed logging
-    bypass_cache=False,         # Skip cache for this request
+    cache_mode=CacheMode.ENABLED,  # Control cache behavior
     warmup=True                # Whether to run warmup check
 )
 ```
 
+## Cache Control
+
+```python
+from crawl4ai import CacheMode
+
+await crawler.arun(
+    cache_mode=CacheMode.ENABLED,    # Normal caching (read/write)
+    # Other cache modes:
+    # cache_mode=CacheMode.DISABLED   # No caching at all
+    # cache_mode=CacheMode.READ_ONLY  # Only read from cache
+    # cache_mode=CacheMode.WRITE_ONLY # Only write to cache
+    # cache_mode=CacheMode.BYPASS     # Skip cache for this operation
+)
+```
+
 ## Content Processing Parameters
 
 ### Text Processing
@@ -162,14 +177,13 @@ await crawler.arun(
 
 ## Parameter Interactions and Notes
 
-1. **Magic Mode Combinations**
+1. **Cache and Performance Setup**
    ```python
-   # Full anti-detection setup
+   # Optimal caching for repeated crawls
    await crawler.arun(
-       magic=True,
-       headless=False,
-       simulate_user=True,
-       override_navigator=True
+       cache_mode=CacheMode.ENABLED,
+       word_count_threshold=10,
+       process_iframes=False
    )
    ```
 
@@ -179,7 +193,8 @@ await crawler.arun(
    await crawler.arun(
        js_code="window.scrollTo(0, document.body.scrollHeight);",
        wait_for="css:.lazy-content",
-       delay_before_return_html=2.0
+       delay_before_return_html=2.0,
+       cache_mode=CacheMode.WRITE_ONLY  # Cache results after dynamic load
    )
    ```
 
@@ -192,7 +207,8 @@ await crawler.arun(
        extraction_strategy=my_strategy,
        chunking_strategy=my_chunking,
        process_iframes=True,
-       remove_overlay_elements=True
+       remove_overlay_elements=True,
+       cache_mode=CacheMode.ENABLED
    )
    ```
 
@@ -201,7 +217,7 @@ await crawler.arun(
 1. **Performance Optimization**
    ```python
    await crawler.arun(
-       bypass_cache=False,           # Use cache when possible
+       cache_mode=CacheMode.ENABLED,  # Use full caching
        word_count_threshold=10,      # Filter out noise
        process_iframes=False         # Skip iframes if not needed
    )
@@ -212,7 +228,8 @@ await crawler.arun(
    await crawler.arun(
        magic=True,                   # Enable anti-detection
        delay_before_return_html=1.0, # Wait for dynamic content
-       page_timeout=60000           # Longer timeout for slow pages
+       page_timeout=60000,          # Longer timeout for slow pages
+       cache_mode=CacheMode.WRITE_ONLY  # Cache results after successful crawl
    )
    ```
 
@@ -221,6 +238,7 @@ await crawler.arun(
    await crawler.arun(
        remove_overlay_elements=True,  # Remove popups
        excluded_tags=['nav', 'aside'],# Remove unnecessary elements
-       keep_data_attributes=False     # Remove data attributes
+       keep_data_attributes=False,    # Remove data attributes
+       cache_mode=CacheMode.ENABLED   # Use cache for faster processing
    )
    ```
\ No newline at end of file
diff --git a/docs/md_v2/api/crawl-result.md b/docs/md_v2/api/crawl-result.md
index 06998af3..7e3bda98 100644
--- a/docs/md_v2/api/crawl-result.md
+++ b/docs/md_v2/api/crawl-result.md
@@ -20,6 +20,7 @@ class CrawlResult(BaseModel):
     fit_html: Optional[str] = None          # Most relevant HTML content
     markdown: Optional[str] = None          # HTML converted to markdown
     fit_markdown: Optional[str] = None      # Most relevant markdown content
+    downloaded_files: Optional[List[str]] = None  # Downloaded files
     
     # Extracted Data
     extracted_content: Optional[str] = None  # Content from extraction strategy
diff --git a/docs/md_v2/api/parameters.md b/docs/md_v2/api/parameters.md
index 6c7960d2..c1c4d2ea 100644
--- a/docs/md_v2/api/parameters.md
+++ b/docs/md_v2/api/parameters.md
@@ -32,4 +32,5 @@
 | async_webcrawler.py | warmup | `kwargs.get("warmup", True)` | AsyncWebCrawler | Initialize crawler with warmup request |
 | async_webcrawler.py | session_id | `kwargs.get("session_id", None)` | AsyncWebCrawler | Session identifier for browser reuse |
 | async_webcrawler.py | only_text | `kwargs.get("only_text", False)` | AsyncWebCrawler | Extract only text content |
-| async_webcrawler.py | bypass_cache | `kwargs.get("bypass_cache", False)` | AsyncWebCrawler | Skip cache and force fresh crawl |
\ No newline at end of file
+| async_webcrawler.py | bypass_cache | `kwargs.get("bypass_cache", False)` | AsyncWebCrawler | Skip cache and force fresh crawl |
+| async_webcrawler.py | cache_mode | `kwargs.get("cache_mode", CacheMode.ENABLED)` | AsyncWebCrawler | Cache handling mode for request |
\ No newline at end of file
diff --git a/docs/md_v2/basic/content_filtering.md b/docs/md_v2/basic/content_filtering.md
new file mode 100644
index 00000000..9506c075
--- /dev/null
+++ b/docs/md_v2/basic/content_filtering.md
@@ -0,0 +1,84 @@
+# Content Filtering in Crawl4AI
+
+This guide explains how to use content filtering strategies in Crawl4AI to extract the most relevant information from crawled web pages.  You'll learn how to use the built-in `BM25ContentFilter` and how to create your own custom content filtering strategies.
+
+## Relevance Content Filter
+
+The `RelevantContentFilter` is an abstract class that provides a common interface for content filtering strategies. Specific filtering algorithms, like `BM25ContentFilter`, inherit from this class and implement the `filter_content` method. This method takes the HTML content as input and returns a list of filtered text blocks.
+
+## BM25 Algorithm
+
+The `BM25ContentFilter` uses the BM25 algorithm, a ranking function used in information retrieval to estimate the relevance of documents to a given search query. In Crawl4AI, this algorithm helps to identify and extract text chunks that are most relevant to the page's metadata or a user-specified query.
+
+### Usage
+
+To use the `BM25ContentFilter`, initialize it and then pass it as the `content_filter` parameter to the `arun` method of the crawler.
+
+```python
+from crawl4ai import AsyncWebCrawler
+from crawl4ai.content_filter_strategy import BM25ContentFilter
+
+async def filter_content(url, query=None):
+    async with AsyncWebCrawler() as crawler:
+        content_filter = BM25ContentFilter(user_query=query)
+        result = await crawler.arun(url=url, content_filter=content_filter, fit_markdown=True) # Set fit_markdown flag to True to trigger BM25 filtering
+        if result.success:
+            print(f"Filtered Content (JSON):\n{result.extracted_content}")
+            print(f"\nFiltered Markdown:\n{result.fit_markdown}") # New field in CrawlResult object
+            print(f"\nFiltered HTML:\n{result.fit_html}") # New field in CrawlResult object. Note that raw HTML may have tags re-organized due to internal parsing.
+        else:
+            print("Error:", result.error_message)
+
+# Example usage:
+asyncio.run(filter_content("https://en.wikipedia.org/wiki/Apple", "fruit nutrition health")) # with query
+asyncio.run(filter_content("https://en.wikipedia.org/wiki/Apple")) # without query, metadata will be used as the query.
+
+```
+
+### Parameters
+
+- **`user_query`**:  (Optional) A string representing the search query. If not provided, the filter extracts relevant metadata (title, description, keywords) from the page and uses that as the query.
+- **`bm25_threshold`**: (Optional, default 1.0)  A float value that controls the threshold for relevance.  Higher values result in stricter filtering, returning only the most relevant text chunks. Lower values result in more lenient filtering.
+
+
+## Fit Markdown Flag
+
+Setting the `fit_markdown` flag to `True` in the `arun` method activates the BM25 content filtering during the crawl. The `fit_markdown` parameter instructs the scraper to extract and clean the HTML, primarily to prepare for a Large Language Model that cannot process large amounts of data. Setting this flag not only improves the quality of the extracted content but also adds the filtered content to two new attributes in the returned  `CrawlResult` object: `fit_markdown` and `fit_html`.
+
+
+## Custom Content Filtering Strategies
+
+You can create your own custom filtering strategies by inheriting from the `RelevantContentFilter` class and implementing the `filter_content` method.  This allows you to tailor the filtering logic to your specific needs.
+
+```python
+from crawl4ai.content_filter_strategy import RelevantContentFilter
+from bs4 import BeautifulSoup, Tag
+from typing import List
+
+class MyCustomFilter(RelevantContentFilter):
+    def filter_content(self, html: str) -> List[str]:
+        soup = BeautifulSoup(html, 'lxml')
+        # Implement custom filtering logic here
+        # Example: extract all paragraphs within divs with class "article-body"
+        filtered_paragraphs = []
+        for tag in soup.select("div.article-body p"):
+            if isinstance(tag, Tag):
+                filtered_paragraphs.append(str(tag)) # Add the cleaned HTML element.  
+        return filtered_paragraphs
+
+
+
+async def custom_filter_demo(url: str):
+    async with AsyncWebCrawler() as crawler:
+        custom_filter = MyCustomFilter()
+        result = await crawler.arun(url, content_filter=custom_filter)
+        if result.success:
+            print(result.extracted_content)
+
+```
+
+This example demonstrates extracting paragraphs from a specific div class.  You can customize this logic to implement different filtering strategies, use regular expressions, analyze text density, or apply other relevant techniques.
+
+## Conclusion
+
+Content filtering strategies provide a powerful way to refine the output of your crawls. By using `BM25ContentFilter` or creating custom strategies, you can focus on the most pertinent information and improve the efficiency of your data processing pipeline.
diff --git a/docs/md_v2/basic/file-download.md b/docs/md_v2/basic/file-download.md
new file mode 100644
index 00000000..c37e8812
--- /dev/null
+++ b/docs/md_v2/basic/file-download.md
@@ -0,0 +1,148 @@
+# Download Handling in Crawl4AI
+
+This guide explains how to use Crawl4AI to handle file downloads during crawling.  You'll learn how to trigger downloads, specify download locations, and access downloaded files.
+
+## Enabling Downloads
+
+By default, Crawl4AI does not download files. To enable downloads, set the `accept_downloads` parameter to `True` in either the `AsyncWebCrawler` constructor or the `arun` method.
+
+```python
+from crawl4ai import AsyncWebCrawler
+
+async def main():
+    async with AsyncWebCrawler(accept_downloads=True) as crawler:  # Globally enable downloads
+        # ... your crawling logic ...
+
+asyncio.run(main())
+```
+
+Or, enable it for a specific crawl:
+
+```python
+async def main():
+    async with AsyncWebCrawler() as crawler:
+        result = await crawler.arun(url="...", accept_downloads=True)
+        # ...
+```
+
+## Specifying Download Location
+
+You can specify the download directory using the `downloads_path` parameter. If not provided, Crawl4AI creates a "downloads" directory inside the `.crawl4ai` folder in your home directory.
+
+```python
+import os
+from pathlib import Path
+
+# ... inside your crawl function:
+
+downloads_path = os.path.join(os.getcwd(), "my_downloads")  # Custom download path
+os.makedirs(downloads_path, exist_ok=True)
+
+result = await crawler.arun(url="...", downloads_path=downloads_path, accept_downloads=True)
+
+# ...
+```
+
+If you are setting it globally, provide the path to the AsyncWebCrawler:
+```python
+async def crawl_with_downloads(url: str, download_path: str):
+    async with AsyncWebCrawler(
+        accept_downloads=True,
+        downloads_path=download_path, # or set it on arun
+        verbose=True
+    ) as crawler:
+        result = await crawler.arun(url=url) # you still need to enable downloads per call.
+        # ...
+```
+
+
+
+## Triggering Downloads
+
+Downloads are typically triggered by user interactions on a web page (e.g., clicking a download button).  You can simulate these actions with the `js_code` parameter, injecting JavaScript code to be executed within the browser context.  The `wait_for` parameter might also be crucial to allowing sufficient time for downloads to initiate before the crawler proceeds.
+
+```python
+result = await crawler.arun(
+    url="https://www.python.org/downloads/",
+    js_code="""
+        // Find and click the first Windows installer link
+        const downloadLink = document.querySelector('a[href$=".exe"]');
+        if (downloadLink) {
+            downloadLink.click();
+        }
+    """,
+    wait_for=5  # Wait for 5 seconds for the download to start
+)
+```
+
+## Accessing Downloaded Files
+
+Downloaded file paths are stored in the `downloaded_files` attribute of the returned  `CrawlResult`  object.  This is a list of strings, with each string representing the absolute path to a downloaded file.
+
+```python
+if result.downloaded_files:
+    print("Downloaded files:")
+    for file_path in result.downloaded_files:
+        print(f"- {file_path}")
+        # Perform operations with downloaded files, e.g., check file size
+        file_size = os.path.getsize(file_path)
+        print(f"- File size: {file_size} bytes")
+else:
+    print("No files downloaded.")
+```
+
+
+##  Example: Downloading Multiple Files
+
+```python
+import asyncio
+import os
+from pathlib import Path
+from crawl4ai import AsyncWebCrawler
+
+async def download_multiple_files(url: str, download_path: str):
+
+    async with AsyncWebCrawler(
+        accept_downloads=True,
+        downloads_path=download_path,
+        verbose=True
+    ) as crawler:
+        result = await crawler.arun(
+            url=url,
+            js_code="""
+            // Trigger multiple downloads (example)
+            const downloadLinks = document.querySelectorAll('a[download]'); // Or a more specific selector
+            for (const link of downloadLinks) {
+                link.click();
+                await new Promise(r => setTimeout(r, 2000)); // Add a small delay between clicks if needed
+            }
+            """,
+            wait_for=10 # Adjust the timeout to match the expected time for all downloads to start
+        )
+
+        if result.downloaded_files:
+            print("Downloaded files:")
+            for file in result.downloaded_files:
+                print(f"- {file}")
+        else:
+            print("No files downloaded.")
+            
+
+# Example usage
+download_path = os.path.join(Path.home(), ".crawl4ai", "downloads")
+os.makedirs(download_path, exist_ok=True) # Create directory if it doesn't exist
+
+
+asyncio.run(download_multiple_files("https://www.python.org/downloads/windows/", download_path))
+```
+
+## Important Considerations
+
+- **Browser Context:** Downloads are managed within the browser context.  Ensure your `js_code` correctly targets the download triggers on the specific web page.
+- **Waiting:**  Use `wait_for` to control the timing of the crawl when a download may not start immediately.
+- **Error Handling:** Implement proper error handling to gracefully manage failed downloads or incorrect file paths.
+- **Security:** Downloaded files should be scanned for potential security threats before use.
+
+
+
+This guide provides a foundation for handling downloads with Crawl4AI. You can adapt these techniques to manage downloads in various scenarios and integrate them into more complex crawling workflows.
diff --git a/docs/md_v2/basic/quickstart.md b/docs/md_v2/basic/quickstart.md
index f4904915..95b8a397 100644
--- a/docs/md_v2/basic/quickstart.md
+++ b/docs/md_v2/basic/quickstart.md
@@ -8,7 +8,7 @@ First, let's import the necessary modules and create an instance of `AsyncWebCra
 
 ```python
 import asyncio
-from crawl4ai import AsyncWebCrawler
+from crawl4ai import AsyncWebCrawler, CacheMode
 
 async def main():
     async with AsyncWebCrawler(verbose=True) as crawler:
@@ -42,7 +42,7 @@ async def capture_and_save_screenshot(url: str, output_path: str):
         result = await crawler.arun(
             url=url,
             screenshot=True,
-            bypass_cache=True
+            cache_mode=CacheMode.BYPASS
         )
         
         if result.success and result.screenshot:
@@ -62,15 +62,15 @@ Crawl4AI supports multiple browser engines. Here's how to use different browsers
 ```python
 # Use Firefox
 async with AsyncWebCrawler(browser_type="firefox", verbose=True, headless=True) as crawler:
-    result = await crawler.arun(url="https://www.example.com", bypass_cache=True)
+    result = await crawler.arun(url="https://www.example.com", cache_mode=CacheMode.BYPASS)
 
 # Use WebKit
 async with AsyncWebCrawler(browser_type="webkit", verbose=True, headless=True) as crawler:
-    result = await crawler.arun(url="https://www.example.com", bypass_cache=True)
+    result = await crawler.arun(url="https://www.example.com", cache_mode=CacheMode.BYPASS)
 
 # Use Chromium (default)
 async with AsyncWebCrawler(verbose=True, headless=True) as crawler:
-    result = await crawler.arun(url="https://www.example.com", bypass_cache=True)
+    result = await crawler.arun(url="https://www.example.com", cache_mode=CacheMode.BYPASS)
 ```
 
 ### User Simulation 🎭
@@ -81,7 +81,7 @@ Simulate real user behavior to avoid detection:
 async with AsyncWebCrawler(verbose=True, headless=True) as crawler:
     result = await crawler.arun(
         url="YOUR-URL-HERE",
-        bypass_cache=True,
+        cache_mode=CacheMode.BYPASS,
         simulate_user=True,  # Causes random mouse movements and clicks
         override_navigator=True  # Makes the browser appear more like a real user
     )
@@ -99,7 +99,7 @@ async def main():
         print(f"First crawl result: {result1.markdown[:100]}...")
 
         # Force to crawl again
-        result2 = await crawler.arun(url="https://www.nbcnews.com/business", bypass_cache=True)
+        result2 = await crawler.arun(url="https://www.nbcnews.com/business", cache_mode=CacheMode.BYPASS)
         print(f"Second crawl result: {result2.markdown[:100]}...")
 
 asyncio.run(main())
@@ -189,7 +189,7 @@ extraction_strategy = LLMExtractionStrategy(
 async with AsyncWebCrawler() as crawler:
     result = await crawler.arun(
         url="https://paulgraham.com/love.html",
-        bypass_cache=True,
+        cache_mode=CacheMode.BYPASS,
         extraction_strategy=extraction_strategy
     )
 ```
@@ -239,7 +239,7 @@ async def crawl_dynamic_content():
                 js_code=js_next_page if page > 0 else None,
                 wait_for=wait_for if page > 0 else None,
                 js_only=page > 0,
-                bypass_cache=True,
+                cache_mode=CacheMode.BYPASS,
                 headless=False,
             )
 
@@ -254,7 +254,7 @@ Remove overlay elements and fit content appropriately:
 async with AsyncWebCrawler(headless=False) as crawler:
     result = await crawler.arun(
         url="your-url-here",
-        bypass_cache=True,
+        cache_mode=CacheMode.BYPASS,
         word_count_threshold=10,
         remove_overlay_elements=True,
         screenshot=True
@@ -282,7 +282,7 @@ async with AsyncWebCrawler() as crawler:
     result = await crawler.arun(
         url="https://www.nbcnews.com/business",
         word_count_threshold=0,
-        bypass_cache=True,
+        cache_mode=CacheMode.BYPASS,
         verbose=False,
     )
     end = time.time()
diff --git a/docs/md_v2/basic/simple-crawling.md b/docs/md_v2/basic/simple-crawling.md
index 097d5e61..871fa64c 100644
--- a/docs/md_v2/basic/simple-crawling.md
+++ b/docs/md_v2/basic/simple-crawling.md
@@ -12,7 +12,9 @@ from crawl4ai import AsyncWebCrawler
 
 async def main():
     async with AsyncWebCrawler() as crawler:
-        result = await crawler.arun(url="https://example.com")
+        result = await crawler.arun(
+            url="https://example.com"
+        )
         print(result.markdown)  # Print clean markdown content
 
 if __name__ == "__main__":
@@ -24,7 +26,7 @@ if __name__ == "__main__":
 The `arun()` method returns a `CrawlResult` object with several useful properties. Here's a quick overview (see [CrawlResult](../api/crawl-result.md) for complete details):
 
 ```python
-result = await crawler.arun(url="https://example.com")
+result = await crawler.arun(url="https://example.com", fit_markdown=True)
 
 # Different content formats
 print(result.html)         # Raw HTML
@@ -81,7 +83,7 @@ Here's a more comprehensive example showing common usage patterns:
 
 ```python
 import asyncio
-from crawl4ai import AsyncWebCrawler
+from crawl4ai import AsyncWebCrawler, CacheMode
 
 async def main():
     async with AsyncWebCrawler(verbose=True) as crawler:
@@ -97,7 +99,7 @@ async def main():
             remove_overlay_elements=True,
             
             # Cache control
-            bypass_cache=False  # Use cache if available
+            cache_mode=CacheMode.ENABLE  # Use cache if available
         )
         
         if result.success:
diff --git a/docs/md_v2/tutorial/episode_11_2_Extraction_Strategies_LLM.md b/docs/md_v2/tutorial/episode_11_2_Extraction_Strategies_LLM.md
index 3682425f..a9f00e92 100644
--- a/docs/md_v2/tutorial/episode_11_2_Extraction_Strategies_LLM.md
+++ b/docs/md_v2/tutorial/episode_11_2_Extraction_Strategies_LLM.md
@@ -52,7 +52,7 @@ Here’s a comprehensive outline for the **LLM Extraction Strategy** video, cove
                      extraction_type="schema",
                      instruction="Extract model names and fees for input and output tokens from the page."
                  ),
-                 bypass_cache=True
+                 cache_mode=CacheMode.BYPASS
              )
              print(result.extracted_content)
      ```
@@ -98,7 +98,7 @@ Here’s a comprehensive outline for the **LLM Extraction Strategy** video, cove
              result = await crawler.arun(
                  url="https://example.com/some-article",
                  extraction_strategy=extraction_strategy,
-                 bypass_cache=True
+                 cache_mode=CacheMode.BYPASS
              )
              print(result.extracted_content)
      ```
diff --git a/docs/md_v2/tutorial/episode_11_3_Extraction_Strategies_Cosine.md b/docs/md_v2/tutorial/episode_11_3_Extraction_Strategies_Cosine.md
index 9f1c00ea..6100ae4c 100644
--- a/docs/md_v2/tutorial/episode_11_3_Extraction_Strategies_Cosine.md
+++ b/docs/md_v2/tutorial/episode_11_3_Extraction_Strategies_Cosine.md
@@ -55,7 +55,7 @@ Here’s a structured outline for the **Cosine Similarity Strategy** video, cove
              result = await crawler.arun(
                  url=url,
                  extraction_strategy=extraction_strategy,
-                 bypass_cache=True
+                 cache_mode=CacheMode.BYPASS
              )
              print(result.extracted_content)
      ```
@@ -103,7 +103,7 @@ Here’s a structured outline for the **Cosine Similarity Strategy** video, cove
              result = await crawler.arun(
                  url=url,
                  extraction_strategy=extraction_strategy,
-                 bypass_cache=True
+                 cache_mode=CacheMode.BYPASS
              )
              print(result.extracted_content)
      ```
diff --git a/docs/md_v2/tutorial/tutorial.md b/docs/md_v2/tutorial/tutorial.md
index bf355ed0..7bead842 100644
--- a/docs/md_v2/tutorial/tutorial.md
+++ b/docs/md_v2/tutorial/tutorial.md
@@ -26,7 +26,7 @@ Here's a condensed outline of the **Installation and Setup** video content:
    - Walk through a simple test script to confirm the setup:
       ```python
       import asyncio
-      from crawl4ai import AsyncWebCrawler
+      from crawl4ai import AsyncWebCrawler, CacheMode
       
       async def main():
           async with AsyncWebCrawler(verbose=True) as crawler:
@@ -1093,7 +1093,7 @@ Here’s a comprehensive outline for the **LLM Extraction Strategy** video, cove
                      extraction_type="schema",
                      instruction="Extract model names and fees for input and output tokens from the page."
                  ),
-                 bypass_cache=True
+                 cache_mode=CacheMode.BYPASS
              )
              print(result.extracted_content)
      ```
@@ -1139,7 +1139,7 @@ Here’s a comprehensive outline for the **LLM Extraction Strategy** video, cove
              result = await crawler.arun(
                  url="https://example.com/some-article",
                  extraction_strategy=extraction_strategy,
-                 bypass_cache=True
+                 cache_mode=CacheMode.BYPASS
              )
              print(result.extracted_content)
      ```
@@ -1248,7 +1248,7 @@ Here’s a structured outline for the **Cosine Similarity Strategy** video, cove
              result = await crawler.arun(
                  url=url,
                  extraction_strategy=extraction_strategy,
-                 bypass_cache=True
+                 cache_mode=CacheMode.BYPASS
              )
              print(result.extracted_content)
      ```
@@ -1296,7 +1296,7 @@ Here’s a structured outline for the **Cosine Similarity Strategy** video, cove
              result = await crawler.arun(
                  url=url,
                  extraction_strategy=extraction_strategy,
-                 bypass_cache=True
+                 cache_mode=CacheMode.BYPASS
              )
              print(result.extracted_content)
      ```

From 152ac35bc2805610863d1f13efe8434fe2d290bd Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Sun, 17 Nov 2024 21:09:26 +0800
Subject: [PATCH 044/115] feat(docs): update README for version 0.3.74 with new
 features and improvements fix(version): update version number to 0.3.74
 refactor(async_webcrawler): enhance logging and add domain-based request
 delay

---
 README.md                          | 16 +++++------
 crawl4ai/__version__.py            |  2 +-
 crawl4ai/async_crawler_strategy.py |  4 +--
 crawl4ai/async_webcrawler.py       | 43 +++++++++++++++++++++++++-----
 crawl4ai/config.py                 |  1 +
 5 files changed, 47 insertions(+), 19 deletions(-)

diff --git a/README.md b/README.md
index 9c3796cd..f6c8dc08 100644
--- a/README.md
+++ b/README.md
@@ -13,17 +13,15 @@ Crawl4AI simplifies asynchronous web crawling and data extraction, making it acc
 
 ## New in 0.3.74 ✨
 
-- 🚀 **Blazing Fast Scraping:**  The scraping process is now significantly faster, often completing in under 100 milliseconds (excluding web fetch time)!
-- 📥 **Download Mastery:** Control downloads, specify folders, and track files within the `CrawlResult` object.
-- 🔎 **Relevance Filtering:** Extract the most important content with the new `RelevanceContentFilter` and BM25 algorithm.  Control filtering with the `fit_markdown` flag.
+- 🚀 **Blazing Fast Scraping:** The scraping process is now significantly faster, often completing in under 100 milliseconds (excluding web fetch time)!
+- 📥 **Download Manager:** Integrated file crawling and downloading capabilities, with full control over file management and tracking within the `CrawlResult` object.
+- 🔎 **Markdown Filter:** Enhanced content extraction using BM25 algorithm to create cleaner markdown with only relevant webpage content.
 - 🗂️ **Local & Raw HTML:** Crawl local files (`file://`) and raw HTML strings (`raw:`) directly.
-- 🤖 **Browser Boss:** Manage browser sessions with persistent contexts, process monitoring, and tf-playwright-stealth integration.  Configure using `use_managed_browser`, `user_data_dir`, and `use_persistent_context` parameters.
+- 🤖 **Browser Control:** Use your own browser setup for crawling, with persistent contexts and stealth integration to bypass anti-bot measures.
 - ☁️ **API & Cache Boost:** CORS support, static file serving, and a new filesystem-based cache for blazing-fast performance. Fine-tune caching with the `CacheMode` enum (ENABLED, DISABLED, READ_ONLY, WRITE_ONLY, BYPASS) and the `always_bypass_cache` parameter.
-- 🔒 **API Security:** Protect your API server with token-based authentication using the `CRAWL4AI_API_TOKEN` environment variable.
-- 🔄 **Synchronous & Direct Crawling:** Get immediate results with `/crawl_sync` or bypass the task queue with `/crawl_direct`.
-- 🛠️ **Database Migration:**  A new `crawl4ai-migrate` command ensures smooth upgrades and data integrity between versions.
-- 🐛 **Squashed Bugs:**  Fixed browser context issues in Docker, memory leaks, enhanced error handling, and improved HTML parsing.
-
+- 🐳 **API Gateway:** Run Crawl4AI as a local or cloud API service, enabling cross-platform usage through a containerized server with secure token authentication via `CRAWL4AI_API_TOKEN`.
+- 🛠️ **Database Improvements:** Enhanced database system for handling larger content sets with improved caching and faster performance.
+- 🐛 **Squashed Bugs:** Fixed browser context issues in Docker, memory leaks, enhanced error handling, and improved HTML parsing.
 
 ## Try it Now!
 
diff --git a/crawl4ai/__version__.py b/crawl4ai/__version__.py
index 7ab71c9b..65ee6e73 100644
--- a/crawl4ai/__version__.py
+++ b/crawl4ai/__version__.py
@@ -1,2 +1,2 @@
 # crawl4ai/_version.py
-__version__ = "0.3.731"
\ No newline at end of file
+__version__ = "0.3.74"
\ No newline at end of file
diff --git a/crawl4ai/async_crawler_strategy.py b/crawl4ai/async_crawler_strategy.py
index a67591af..90d5cbe8 100644
--- a/crawl4ai/async_crawler_strategy.py
+++ b/crawl4ai/async_crawler_strategy.py
@@ -605,7 +605,7 @@ class AsyncPlaywrightCrawlerStrategy(AsyncCrawlerStrategy):
                             proxy={"server": self.proxy} if self.proxy else None,
                             java_script_enabled=True,
                             accept_downloads=self.accept_downloads,
-                            downloads_path=self.downloads_path if self.accept_downloads else None
+                            # downloads_path=self.downloads_path if self.accept_downloads else None
                         )
                         await context.add_cookies([{"name": "cookiesEnabled", "value": "true", "url": url}])
                         await context.set_extra_http_headers(self.headers)
@@ -905,7 +905,7 @@ class AsyncPlaywrightCrawlerStrategy(AsyncCrawlerStrategy):
             )
             return response
         except Error as e:
-            raise Error(f"[ERROR] 🚫 crawl(): Failed to crawl {url}: {str(e)}")
+            raise Error(f"async_crawler_strategy.py:_crawleb(): {str(e)}")
         # finally:
         #     if not session_id:
         #         await page.close()
diff --git a/crawl4ai/async_webcrawler.py b/crawl4ai/async_webcrawler.py
index d22e3b1f..79a17ac4 100644
--- a/crawl4ai/async_webcrawler.py
+++ b/crawl4ai/async_webcrawler.py
@@ -15,15 +15,19 @@ from .extraction_strategy import *
 from .async_crawler_strategy import AsyncCrawlerStrategy, AsyncPlaywrightCrawlerStrategy, AsyncCrawlResponse
 from .cache_context import CacheMode, CacheContext, _legacy_to_cache_mode
 from .content_scrapping_strategy import WebScrapingStrategy
+
 from .config import (
     MIN_WORD_THRESHOLD, 
-    IMAGE_DESCRIPTION_MIN_WORD_THRESHOLD
+    IMAGE_DESCRIPTION_MIN_WORD_THRESHOLD,
+    URL_LOG_SHORTEN_LENGTH
 )
 from .utils import (
     sanitize_input_encode,
     InvalidCSSSelectorError,
     format_html
 )
+from urllib.parse import urlparse
+import random
 from .__version__ import __version__ as crawl4ai_version
 
 
@@ -51,6 +55,7 @@ class AsyncWebCrawler:
     To disable deprecation warnings:
         Pass warning=False to suppress the warning.
     """
+    _domain_last_hit = {}
 
     def __init__(
         self,
@@ -248,7 +253,7 @@ class AsyncWebCrawler:
                 screenshot_data = async_response.screenshot
                 t2 = time.perf_counter()
                 if verbose:
-                    print(f"{Fore.BLUE}{self.tag_format('FETCH')} {self.log_icons['FETCH']} Live fetch for {cache_context.display_url} | Status: {Fore.GREEN if bool(html) else Fore.RED}{bool(html)}{Style.RESET_ALL} | Time: {t2 - t1:.2f}s")
+                    print(f"{Fore.BLUE}{self.tag_format('FETCH')} {self.log_icons['FETCH']} Live fetch for {cache_context.display_url}... | Status: {Fore.GREEN if bool(html) else Fore.RED}{bool(html)}{Style.RESET_ALL} | Time: {t2 - t1:.2f}s")
 
             # Process the HTML content
             crawl_result = await self.aprocess_html(
@@ -283,7 +288,7 @@ class AsyncWebCrawler:
             crawl_result.session_id = kwargs.get("session_id", None)
 
             if verbose:
-                print(f"{Fore.GREEN}{self.tag_format('COMPLETE')} {self.log_icons['COMPLETE']} {cache_context.display_url} | Status: {Fore.GREEN if crawl_result.success else Fore.RED}{crawl_result.success} | {Fore.YELLOW}Total: {time.perf_counter() - start_time:.2f}s{Style.RESET_ALL}")
+                print(f"{Fore.GREEN}{self.tag_format('COMPLETE')} {self.log_icons['COMPLETE']} {cache_context.display_url[:URL_LOG_SHORTEN_LENGTH]}... | Status: {Fore.GREEN if crawl_result.success else Fore.RED}{crawl_result.success} | {Fore.YELLOW}Total: {time.perf_counter() - start_time:.2f}s{Style.RESET_ALL}")
 
 
             # Update cache if appropriate
@@ -295,7 +300,7 @@ class AsyncWebCrawler:
         except Exception as e:
             if not hasattr(e, "msg"):
                 e.msg = str(e)
-            print(f"{Fore.RED}{self.tag_format('ERROR')} {self.log_icons['ERROR']} Failed to crawl {cache_context.display_url} | {e.msg}{Style.RESET_ALL}")
+            print(f"{Fore.RED}{self.tag_format('ERROR')} {self.log_icons['ERROR']} Failed to crawl {cache_context.display_url[:URL_LOG_SHORTEN_LENGTH]}... | {e.msg}{Style.RESET_ALL}")
             return CrawlResult(
                 url=url, 
                 html="", 
@@ -350,10 +355,29 @@ class AsyncWebCrawler:
             if cache_mode is None:
                 cache_mode = CacheMode.BYPASS
 
-        semaphore_count = kwargs.get('semaphore_count', 5)
+        semaphore_count = kwargs.get('semaphore_count', 10)
         semaphore = asyncio.Semaphore(semaphore_count)
 
         async def crawl_with_semaphore(url):
+            domain = urlparse(url).netloc
+            current_time = time.time()
+            
+            print(f"{Fore.LIGHTBLACK_EX}{self.tag_format('PARALLEL')} Started task for {url[:50]}...{Style.RESET_ALL}")
+            
+            # Get delay settings from kwargs or use defaults
+            mean_delay = kwargs.get('mean_delay', 0.1)  # 0.5 seconds default mean delay
+            max_range = kwargs.get('max_range', 0.3)    # 1 seconds default max additional delay
+            
+            # Check if we need to wait
+            if domain in self._domain_last_hit:
+                time_since_last = current_time - self._domain_last_hit[domain]
+                if time_since_last < mean_delay:
+                    delay = mean_delay + random.uniform(0, max_range)
+                    await asyncio.sleep(delay)
+            
+            # Update last hit time
+            self._domain_last_hit[domain] = current_time    
+                    
             async with semaphore:
                 return await self.arun(
                     url,
@@ -369,8 +393,13 @@ class AsyncWebCrawler:
                     **kwargs,
                 )
 
+        # Print start message
+        print(f"{Fore.CYAN}{self.tag_format('INIT')} {self.log_icons['INIT']} Starting concurrent crawling for {len(urls)} URLs...{Style.RESET_ALL}")
+        start_time = time.perf_counter()
         tasks = [crawl_with_semaphore(url) for url in urls]
         results = await asyncio.gather(*tasks, return_exceptions=True)
+        end_time = time.perf_counter()
+        print(f"{Fore.YELLOW}{self.tag_format('COMPLETE')} {self.log_icons['COMPLETE']} Concurrent crawling completed for {len(urls)} URLs | Total time: {end_time - start_time:.2f}s{Style.RESET_ALL}")
         return [result if not isinstance(result, Exception) else str(result) for result in results]
 
 
@@ -423,7 +452,7 @@ class AsyncWebCrawler:
         metadata = result.get("metadata", {})
         
         if verbose:
-            print(f"{Fore.MAGENTA}{self.tag_format('SCRAPE')} {self.log_icons['SCRAPE']} Processed {_url}{Style.RESET_ALL} | Time: {int((time.perf_counter() - t1) * 1000)}ms")
+            print(f"{Fore.MAGENTA}{self.tag_format('SCRAPE')} {self.log_icons['SCRAPE']} Processed {_url[:URL_LOG_SHORTEN_LENGTH]}...{Style.RESET_ALL} | Time: {int((time.perf_counter() - t1) * 1000)}ms")
 
 
 
@@ -439,7 +468,7 @@ class AsyncWebCrawler:
                 extracted_content = extraction_strategy.run(url, sections)
                 extracted_content = json.dumps(extracted_content, indent=4, default=str, ensure_ascii=False)
             if verbose:
-                print(f"{Fore.YELLOW}{self.tag_format('EXTRACT')} {self.log_icons['EXTRACT']} Completed for {_url}{Style.RESET_ALL} | Time: {time.perf_counter() - t1:.2f}s{Style.RESET_ALL}")
+                print(f"{Fore.YELLOW}{self.tag_format('EXTRACT')} {self.log_icons['EXTRACT']} Completed for {_url[:URL_LOG_SHORTEN_LENGTH]}...{Style.RESET_ALL} | Time: {time.perf_counter() - t1:.2f}s{Style.RESET_ALL}")
 
                 
 
diff --git a/crawl4ai/config.py b/crawl4ai/config.py
index 6b1324dd..786ca4e5 100644
--- a/crawl4ai/config.py
+++ b/crawl4ai/config.py
@@ -55,4 +55,5 @@ IMAGE_SCORE_THRESHOLD = 2
 MAX_METRICS_HISTORY = 1000
 
 NEED_MIGRATION = True
+URL_LOG_SHORTEN_LENGTH = 30
 SHOW_DEPRECATION_WARNINGS = True
\ No newline at end of file

From 852729ff380f0568d6874bc960606ba3cce0e935 Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Mon, 18 Nov 2024 21:00:06 +0800
Subject: [PATCH 045/115] feat(docker): add Docker Compose configurations for
 local and hub deployment; enhance GPU support checks in Dockerfile
 feat(requirements): update requirements.txt to include snowballstemmer
 fix(version_manager): correct version parsing to use __version__.__version__
 feat(main): introduce chunking strategy and content filter in CrawlRequest
 model feat(content_filter): enhance BM25 algorithm with priority tag scoring
 for improved content relevance feat(logger): implement new async logger
 engine replacing print statements throughout library fix(database): resolve
 version-related deadlock and circular lock issues in database operations
 docs(docker): expand Docker deployment documentation with usage instructions
 for Docker Compose

---
 Dockerfile                             |  12 +-
 crawl4ai/async_crawler_strategy.py     | 149 ++++++++++++----
 crawl4ai/async_database.py             | 189 +++++++++++++-------
 crawl4ai/async_logger.py               | 231 +++++++++++++++++++++++++
 crawl4ai/async_webcrawler.py           | 144 +++++++++++----
 crawl4ai/content_filter_strategy.py    |  71 ++++----
 crawl4ai/content_scrapping_strategy.py |  44 ++++-
 crawl4ai/version_manager.py            |   4 +-
 docker-compose.hub.yml                 |  27 +++
 docker-compose.local.yml               |  33 ++++
 docker-compose.yml                     |  47 ++++-
 docs/examples/v0.3.74.overview.py      | 119 +++++++++----
 docs/md_v2/basic/docker-deploymeny.md  |  88 ++++++++++
 main.py                                |  23 ++-
 requirements.txt                       |   3 +-
 15 files changed, 952 insertions(+), 232 deletions(-)
 create mode 100644 crawl4ai/async_logger.py
 create mode 100644 docker-compose.hub.yml
 create mode 100644 docker-compose.local.yml

diff --git a/Dockerfile b/Dockerfile
index aac2280a..bd71deae 100644
--- a/Dockerfile
+++ b/Dockerfile
@@ -62,11 +62,13 @@ RUN apt-get update && apt-get install -y --no-install-recommends \
     libatspi2.0-0 \
     && rm -rf /var/lib/apt/lists/*
 
-# GPU support if enabled
-RUN if [ "$ENABLE_GPU" = "true" ] ; then \
-    apt-get update && apt-get install -y --no-install-recommends \
-    nvidia-cuda-toolkit \
-    && rm -rf /var/lib/apt/lists/* ; \
+# GPU support if enabled and architecture is supported
+RUN if [ "$ENABLE_GPU" = "true" ] && [ "$(dpkg --print-architecture)" != "arm64" ] ; then \
+        apt-get update && apt-get install -y --no-install-recommends \
+        nvidia-cuda-toolkit \
+        && rm -rf /var/lib/apt/lists/* ; \
+    else \
+        echo "Skipping NVIDIA CUDA Toolkit installation (unsupported architecture or GPU disabled)"; \
     fi
 
 # Create and set working directory
diff --git a/crawl4ai/async_crawler_strategy.py b/crawl4ai/async_crawler_strategy.py
index 90d5cbe8..a6ba8e50 100644
--- a/crawl4ai/async_crawler_strategy.py
+++ b/crawl4ai/async_crawler_strategy.py
@@ -35,13 +35,15 @@ stealth_config = StealthConfig(
 
 
 class ManagedBrowser:
-    def __init__(self, browser_type: str = "chromium", user_data_dir: Optional[str] = None, headless: bool = False):
+    def __init__(self, browser_type: str = "chromium", user_data_dir: Optional[str] = None, headless: bool = False, logger = None):
         self.browser_type = browser_type
         self.user_data_dir = user_data_dir
         self.headless = headless
         self.browser_process = None
         self.temp_dir = None
         self.debugging_port = 9222
+        self.logger = logger
+        self.shutting_down = False
 
     async def start(self) -> str:
         """
@@ -76,15 +78,38 @@ class ManagedBrowser:
     async def _monitor_browser_process(self):
         """Monitor the browser process for unexpected termination."""
         if self.browser_process:
-            stdout, stderr = await asyncio.gather(
-                asyncio.to_thread(self.browser_process.stdout.read),
-                asyncio.to_thread(self.browser_process.stderr.read)
-            )
-            if self.browser_process.poll() is not None:
-                print(f"Browser process terminated unexpectedly with code {self.browser_process.returncode}")
-                print(f"STDOUT: {stdout.decode()}")
-                print(f"STDERR: {stderr.decode()}")
-                await self.cleanup()
+            try:
+                stdout, stderr = await asyncio.gather(
+                    asyncio.to_thread(self.browser_process.stdout.read),
+                    asyncio.to_thread(self.browser_process.stderr.read)
+                )
+                
+                # Check shutting_down flag BEFORE logging anything
+                if self.browser_process.poll() is not None:
+                    if not self.shutting_down:
+                        self.logger.error(
+                            message="Browser process terminated unexpectedly | Code: {code} | STDOUT: {stdout} | STDERR: {stderr}",
+                            tag="ERROR",
+                            params={
+                                "code": self.browser_process.returncode,
+                                "stdout": stdout.decode(),
+                                "stderr": stderr.decode()
+                            }
+                        )                
+                        await self.cleanup()
+                    else:
+                        self.logger.info(
+                            message="Browser process terminated normally | Code: {code}",
+                            tag="INFO",
+                            params={"code": self.browser_process.returncode}
+                        )
+            except Exception as e:
+                if not self.shutting_down:
+                    self.logger.error(
+                        message="Error monitoring browser process: {error}",
+                        tag="ERROR",
+                        params={"error": str(e)}
+                    )
 
     def _get_browser_path(self) -> str:
         """Returns the browser executable path based on OS and browser type"""
@@ -134,20 +159,39 @@ class ManagedBrowser:
 
     async def cleanup(self):
         """Cleanup browser process and temporary directory"""
+        # Set shutting_down flag BEFORE any termination actions
+        self.shutting_down = True
+        
         if self.browser_process:
             try:
                 self.browser_process.terminate()
-                await asyncio.sleep(1)
+                # Wait for process to end gracefully
+                for _ in range(10):  # 10 attempts, 100ms each
+                    if self.browser_process.poll() is not None:
+                        break
+                    await asyncio.sleep(0.1)
+                
+                # Force kill if still running
                 if self.browser_process.poll() is None:
                     self.browser_process.kill()
+                    await asyncio.sleep(0.1)  # Brief wait for kill to take effect
+                    
             except Exception as e:
-                print(f"Error terminating browser: {e}")
+                self.logger.error(
+                    message="Error terminating browser: {error}",
+                    tag="ERROR",
+                    params={"error": str(e)}
+                )
 
         if self.temp_dir and os.path.exists(self.temp_dir):
             try:
                 shutil.rmtree(self.temp_dir)
             except Exception as e:
-                print(f"Error removing temporary directory: {e}")
+                self.logger.error(
+                    message="Error removing temporary directory: {error}",
+                    tag="ERROR",
+                    params={"error": str(e)}
+                )
 
 
 class AsyncCrawlerStrategy(ABC):
@@ -172,7 +216,8 @@ class AsyncCrawlerStrategy(ABC):
         pass
 
 class AsyncPlaywrightCrawlerStrategy(AsyncCrawlerStrategy):
-    def __init__(self, use_cached_html=False, js_code=None, **kwargs):
+    def __init__(self, use_cached_html=False, js_code=None, logger = None, **kwargs):
+        self.logger = logger
         self.use_cached_html = use_cached_html
         self.user_agent = kwargs.get(
             "user_agent",
@@ -231,7 +276,8 @@ class AsyncPlaywrightCrawlerStrategy(AsyncCrawlerStrategy):
                 self.managed_browser = ManagedBrowser(
                     browser_type=self.browser_type,
                     user_data_dir=self.user_data_dir,
-                    headless=self.headless
+                    headless=self.headless,
+                    logger=self.logger
                 )
                 cdp_url = await self.managed_browser.start()
                 self.browser = await self.playwright.chromium.connect_over_cdp(cdp_url)
@@ -282,6 +328,10 @@ class AsyncPlaywrightCrawlerStrategy(AsyncCrawlerStrategy):
                 # Add extra args if provided
                 if self.extra_args:
                     browser_args["args"].extend(self.extra_args)
+                    
+                # Add downloads path if downloads are enabled
+                if self.accept_downloads:
+                    browser_args["downloads_path"] = self.downloads_path
                 
                 # Add proxy settings if a proxy is specified
                 if self.proxy:
@@ -344,6 +394,7 @@ class AsyncPlaywrightCrawlerStrategy(AsyncCrawlerStrategy):
             self.browser = None
             
         if self.managed_browser:
+            await asyncio.sleep(0.5)
             await self.managed_browser.cleanup()
             self.managed_browser = None
             
@@ -491,9 +542,19 @@ class AsyncPlaywrightCrawlerStrategy(AsyncCrawlerStrategy):
                         }}
                     """)
                 else:
-                    print(f"Warning: Could not access content frame for iframe {i}")
+                    # print(f"Warning: Could not access content frame for iframe {i}")
+                    self.logger.warning(
+                        message="Could not access content frame for iframe {index}",
+                        tag="SCRAPE",
+                        params={"index": i}
+                    )                    
             except Exception as e:
-                print(f"Error processing iframe {i}: {str(e)}")
+                self.logger.error(
+                    message="Error processing iframe {index}: {error}",
+                    tag="ERROR",
+                    params={"index": i, "error": str(e)}
+                )                
+                # print(f"Error processing iframe {i}: {str(e)}")
 
         # Return the page object
         return page  
@@ -620,7 +681,8 @@ class AsyncPlaywrightCrawlerStrategy(AsyncCrawlerStrategy):
                     context = await self.browser.new_context(
                         user_agent=self.user_agent,
                         viewport={"width": 1920, "height": 1080},
-                        proxy={"server": self.proxy} if self.proxy else None
+                        proxy={"server": self.proxy} if self.proxy else None,
+                        accept_downloads=self.accept_downloads,
                     )
                     await context.set_extra_http_headers(self.headers)
                 
@@ -917,17 +979,31 @@ class AsyncPlaywrightCrawlerStrategy(AsyncCrawlerStrategy):
             suggested_filename = download.suggested_filename
             download_path = os.path.join(self.downloads_path, suggested_filename)
             
-            if self.verbose:
-                print(f"[LOG] 📥 Downloading {suggested_filename} to {download_path}")
+            self.logger.info(
+                message="Downloading {filename} to {path}",
+                tag="FETCH",
+                params={"filename": suggested_filename, "path": download_path}
+            )
                 
+            start_time = time.perf_counter()
             await download.save_as(download_path)
+            end_time = time.perf_counter()
             self._downloaded_files.append(download_path)
-            
-            if self.verbose:
-                print(f"[LOG] ✅ Downloaded {suggested_filename} successfully")
+
+            self.logger.success(
+                message="Downloaded {filename} successfully",
+                tag="COMPLETE",
+                params={"filename": suggested_filename, "path": download_path, "duration": f"{end_time - start_time:.2f}s"}
+            )            
         except Exception as e:
-            if self.verbose:
-                print(f"[ERROR] Failed to handle download: {str(e)}")
+            self.logger.error(
+                message="Failed to handle download: {error}",
+                tag="ERROR",
+                params={"error": str(e)}
+            )
+            
+            # if self.verbose:
+            #     print(f"[ERROR] Failed to handle download: {str(e)}")
     
     async def crawl_many(self, urls: List[str], **kwargs) -> List[AsyncCrawlResponse]:
         semaphore_count = kwargs.get('semaphore_count', 5)  # Adjust as needed
@@ -1070,8 +1146,13 @@ class AsyncPlaywrightCrawlerStrategy(AsyncCrawlerStrategy):
             await page.evaluate(remove_overlays_js)
             await page.wait_for_timeout(500)  # Wait for any animations to complete
         except Exception as e:
-            if self.verbose:
-                print(f"Warning: Failed to remove overlay elements: {str(e)}")
+            self.logger.warning(
+                message="Failed to remove overlay elements: {error}",
+                tag="SCRAPE",
+                params={"error": str(e)}
+            )            
+            # if self.verbose:
+            #     print(f"Warning: Failed to remove overlay elements: {str(e)}")
 
     async def take_screenshot(self, page: Page) -> str:
         """
@@ -1089,7 +1170,12 @@ class AsyncPlaywrightCrawlerStrategy(AsyncCrawlerStrategy):
             return base64.b64encode(screenshot).decode('utf-8')
         except Exception as e:
             error_message = f"Failed to take screenshot: {str(e)}"
-            print(error_message)
+            self.logger.error(
+                message="Screenshot failed: {error}",
+                tag="ERROR",
+                params={"error": error_message}
+            )
+            
 
             # Generate an error image
             img = Image.new('RGB', (800, 600), color='black')
@@ -1123,7 +1209,12 @@ class AsyncPlaywrightCrawlerStrategy(AsyncCrawlerStrategy):
             return base64.b64encode(screenshot).decode('utf-8')
         except Exception as e:
             error_message = f"Failed to take screenshot: {str(e)}"
-            print(error_message)
+            # print(error_message)
+            self.logger.error(
+                message="Screenshot failed: {error}",
+                tag="ERROR",
+                params={"error": error_message}
+            )            
 
             # Generate an error image
             img = Image.new('RGB', (800, 600), color='black')
diff --git a/crawl4ai/async_database.py b/crawl4ai/async_database.py
index 7809dfe1..19160b6e 100644
--- a/crawl4ai/async_database.py
+++ b/crawl4ai/async_database.py
@@ -12,10 +12,12 @@ import xxhash
 import aiofiles
 from .config import NEED_MIGRATION
 from .version_manager import VersionManager
+from .async_logger import AsyncLogger
 # Set up logging
 logging.basicConfig(level=logging.INFO)
 logger = logging.getLogger(__name__)
 
+base_directory = Path.home()
 DB_PATH = os.path.join(Path.home(), ".crawl4ai")
 os.makedirs(DB_PATH, exist_ok=True)
 DB_PATH = os.path.join(DB_PATH, "crawl4ai.db")
@@ -28,15 +30,21 @@ class AsyncDatabaseManager:
         self.max_retries = max_retries
         self.connection_pool: Dict[int, aiosqlite.Connection] = {}
         self.pool_lock = asyncio.Lock()
+        self.init_lock = asyncio.Lock()
         self.connection_semaphore = asyncio.Semaphore(pool_size)
         self._initialized = False  
         self.version_manager = VersionManager()
+        self.logger = AsyncLogger(
+            log_file=os.path.join(base_directory, ".crawl4ai", "crawler_db.log"),
+            verbose=False,
+            tag_width=10
+        )
         
         
     async def initialize(self):
         """Initialize the database and connection pool"""
         try:
-            logger.info("Initializing database...")
+            self.logger.info("Initializing database", tag="INIT")
             # Ensure the database file exists
             os.makedirs(os.path.dirname(self.db_path), exist_ok=True)
             
@@ -47,31 +55,39 @@ class AsyncDatabaseManager:
             await self.ainit_db()
             
             # Verify the table exists
-            async def verify_table(db):
+            async with aiosqlite.connect(self.db_path, timeout=30.0) as db:
                 async with db.execute(
                     "SELECT name FROM sqlite_master WHERE type='table' AND name='crawled_data'"
                 ) as cursor:
                     result = await cursor.fetchone()
                     if not result:
                         raise Exception("crawled_data table was not created")
-                    
-            await self.execute_with_retry(verify_table)
             
             # If version changed or fresh install, run updates
             if needs_update:
-                logger.info("New version detected, running updates...")
+                self.logger.info("New version detected, running updates", tag="INIT")
                 await self.update_db_schema()
                 from .migrations import run_migration  # Import here to avoid circular imports
                 await run_migration()
                 self.version_manager.update_version()  # Update stored version after successful migration
-                logger.info("Version update completed successfully")
+                self.logger.success("Version update completed successfully", tag="COMPLETE")
             else:
-                logger.info("Database initialization completed successfully")
+                self.logger.success("Database initialization completed successfully", tag="COMPLETE")
+
                 
         except Exception as e:
-            logger.error(f"Database initialization error: {e}")
-            logger.info("Database will be initialized on first use")
+            self.logger.error(
+                message="Database initialization error: {error}",
+                tag="ERROR",
+                params={"error": str(e)}
+            )
+            self.logger.info(
+                message="Database will be initialized on first use",
+                tag="INIT"
+            )
+                        
             raise
+
             
     async def cleanup(self):
         """Cleanup connections when shutting down"""
@@ -84,34 +100,41 @@ class AsyncDatabaseManager:
     async def get_connection(self):
         """Connection pool manager"""
         if not self._initialized:
-            async with self.pool_lock:  # Prevent multiple simultaneous initializations
-                if not self._initialized:  # Double-check after acquiring lock
+            # Use an asyncio.Lock to ensure only one initialization occurs
+            async with self.init_lock:
+                if not self._initialized:
                     await self.initialize()
                     self._initialized = True
 
-        async with self.connection_semaphore:
-            task_id = id(asyncio.current_task())
-            try:
-                async with self.pool_lock:
-                    if task_id not in self.connection_pool:
-                        conn = await aiosqlite.connect(
-                            self.db_path,
-                            timeout=30.0
-                        )
-                        await conn.execute('PRAGMA journal_mode = WAL')
-                        await conn.execute('PRAGMA busy_timeout = 5000')
-                        self.connection_pool[task_id] = conn
-                    
-                yield self.connection_pool[task_id]
-                
-            except Exception as e:
-                logger.error(f"Connection error: {e}")
-                raise
-            finally:
-                async with self.pool_lock:
-                    if task_id in self.connection_pool:
-                        await self.connection_pool[task_id].close()
-                        del self.connection_pool[task_id]
+        await self.connection_semaphore.acquire()
+        task_id = id(asyncio.current_task())
+        try:
+            async with self.pool_lock:
+                if task_id not in self.connection_pool:
+                    conn = await aiosqlite.connect(
+                        self.db_path,
+                        timeout=30.0
+                    )
+                    await conn.execute('PRAGMA journal_mode = WAL')
+                    await conn.execute('PRAGMA busy_timeout = 5000')
+                    self.connection_pool[task_id] = conn
+
+            yield self.connection_pool[task_id]
+
+        except Exception as e:
+            self.logger.error(
+                message="Connection error: {error}",
+                tag="ERROR",
+                force_verbose=True,
+                params={"error": str(e)}
+            )
+            raise
+        finally:
+            async with self.pool_lock:
+                if task_id in self.connection_pool:
+                    await self.connection_pool[task_id].close()
+                    del self.connection_pool[task_id]
+            self.connection_semaphore.release()
 
 
     async def execute_with_retry(self, operation, *args):
@@ -124,13 +147,21 @@ class AsyncDatabaseManager:
                     return result
             except Exception as e:
                 if attempt == self.max_retries - 1:
-                    logger.error(f"Operation failed after {self.max_retries} attempts: {e}")
+                    self.logger.error(
+                        message="Operation failed after {retries} attempts: {error}",
+                        tag="ERROR",
+                        force_verbose=True,
+                        params={
+                            "retries": self.max_retries,
+                            "error": str(e)
+                        }
+                    )                    
                     raise
                 await asyncio.sleep(1 * (attempt + 1))  # Exponential backoff
 
     async def ainit_db(self):
         """Initialize database schema"""
-        async def _init(db):
+        async with aiosqlite.connect(self.db_path, timeout=30.0) as db:
             await db.execute('''
                 CREATE TABLE IF NOT EXISTS crawled_data (
                     url TEXT PRIMARY KEY,
@@ -147,36 +178,37 @@ class AsyncDatabaseManager:
                     downloaded_files TEXT DEFAULT "{}"  -- New column added
                 )
             ''')
-        
-        await self.execute_with_retry(_init)
+            await db.commit()
+
         
 
     async def update_db_schema(self):
         """Update database schema if needed"""
-        async def _check_columns(db):
+        async with aiosqlite.connect(self.db_path, timeout=30.0) as db:
             cursor = await db.execute("PRAGMA table_info(crawled_data)")
             columns = await cursor.fetchall()
-            return [column[1] for column in columns]
+            column_names = [column[1] for column in columns]
+            
+            # List of new columns to add
+            new_columns = ['media', 'links', 'metadata', 'screenshot', 'response_headers', 'downloaded_files']
+            
+            for column in new_columns:
+                if column not in column_names:
+                    await self.aalter_db_add_column(column, db)
+            await db.commit()
 
-        column_names = await self.execute_with_retry(_check_columns)
-        
-        # List of new columns to add
-        new_columns = ['media', 'links', 'metadata', 'screenshot', 'response_headers', 'downloaded_files']
-        
-        for column in new_columns:
-            if column not in column_names:
-                await self.aalter_db_add_column(column)
-
-    async def aalter_db_add_column(self, new_column: str):
+    async def aalter_db_add_column(self, new_column: str, db):
         """Add new column to the database"""
-        async def _alter(db):
-            if new_column == 'response_headers':
-                await db.execute(f'ALTER TABLE crawled_data ADD COLUMN {new_column} TEXT DEFAULT "{{}}"')
-            else:
-                await db.execute(f'ALTER TABLE crawled_data ADD COLUMN {new_column} TEXT DEFAULT ""')
-            logger.info(f"Added column '{new_column}' to the database.")
+        if new_column == 'response_headers':
+            await db.execute(f'ALTER TABLE crawled_data ADD COLUMN {new_column} TEXT DEFAULT "{{}}"')
+        else:
+            await db.execute(f'ALTER TABLE crawled_data ADD COLUMN {new_column} TEXT DEFAULT ""')
+        self.logger.info(
+            message="Added column '{column}' to the database",
+            tag="INIT",
+            params={"column": new_column}
+        )        
 
-        await self.execute_with_retry(_alter)
 
     async def aget_cached_url(self, url: str) -> Optional[CrawlResult]:
         """Retrieve cached URL data as CrawlResult"""
@@ -235,7 +267,12 @@ class AsyncDatabaseManager:
         try:
             return await self.execute_with_retry(_get)
         except Exception as e:
-            logger.error(f"Error retrieving cached URL: {e}")
+            self.logger.error(
+                message="Error retrieving cached URL: {error}",
+                tag="ERROR",
+                force_verbose=True,
+                params={"error": str(e)}
+            )
             return None
 
     async def acache_url(self, result: CrawlResult):
@@ -291,7 +328,13 @@ class AsyncDatabaseManager:
         try:
             await self.execute_with_retry(_cache)
         except Exception as e:
-            logger.error(f"Error caching URL: {e}")
+            self.logger.error(
+                message="Error caching URL: {error}",
+                tag="ERROR",
+                force_verbose=True,
+                params={"error": str(e)}
+            )
+            
 
     async def aget_total_count(self) -> int:
         """Get total number of cached URLs"""
@@ -303,7 +346,12 @@ class AsyncDatabaseManager:
         try:
             return await self.execute_with_retry(_count)
         except Exception as e:
-            logger.error(f"Error getting total count: {e}")
+            self.logger.error(
+                message="Error getting total count: {error}",
+                tag="ERROR",
+                force_verbose=True,
+                params={"error": str(e)}
+            )
             return 0
 
     async def aclear_db(self):
@@ -314,7 +362,12 @@ class AsyncDatabaseManager:
         try:
             await self.execute_with_retry(_clear)
         except Exception as e:
-            logger.error(f"Error clearing database: {e}")
+            self.logger.error(
+                message="Error clearing database: {error}",
+                tag="ERROR",
+                force_verbose=True,
+                params={"error": str(e)}
+            )
 
     async def aflush_db(self):
         """Drop the entire table"""
@@ -324,7 +377,12 @@ class AsyncDatabaseManager:
         try:
             await self.execute_with_retry(_flush)
         except Exception as e:
-            logger.error(f"Error flushing database: {e}")
+            self.logger.error(
+                message="Error flushing database: {error}",
+                tag="ERROR",
+                force_verbose=True,
+                params={"error": str(e)}
+            )
             
                 
     async def _store_content(self, content: str, content_type: str) -> str:
@@ -352,7 +410,12 @@ class AsyncDatabaseManager:
             async with aiofiles.open(file_path, 'r', encoding='utf-8') as f:
                 return await f.read()
         except:
-            logger.error(f"Failed to load content: {file_path}")
+            self.logger.error(
+                message="Failed to load content: {file_path}",
+                tag="ERROR",
+                force_verbose=True,
+                params={"file_path": file_path}
+            )
             return None
 
 # Create a singleton instance
diff --git a/crawl4ai/async_logger.py b/crawl4ai/async_logger.py
new file mode 100644
index 00000000..220edd11
--- /dev/null
+++ b/crawl4ai/async_logger.py
@@ -0,0 +1,231 @@
+from enum import Enum
+from typing import Optional, Dict, Any, Union
+from colorama import Fore, Back, Style, init
+import time
+import os
+from datetime import datetime
+
+class LogLevel(Enum):
+    DEBUG = 1
+    INFO = 2
+    SUCCESS = 3
+    WARNING = 4
+    ERROR = 5
+
+class AsyncLogger:
+    """
+    Asynchronous logger with support for colored console output and file logging.
+    Supports templated messages with colored components.
+    """
+    
+    DEFAULT_ICONS = {
+        'INIT': '→',
+        'READY': '✓',
+        'FETCH': '↓',
+        'SCRAPE': '◆',
+        'EXTRACT': '■',
+        'COMPLETE': '●',
+        'ERROR': '×',
+        'DEBUG': '⋯',
+        'INFO': 'ℹ',
+        'WARNING': '⚠',
+    }
+
+    DEFAULT_COLORS = {
+        LogLevel.DEBUG: Fore.LIGHTBLACK_EX,
+        LogLevel.INFO: Fore.CYAN,
+        LogLevel.SUCCESS: Fore.GREEN,
+        LogLevel.WARNING: Fore.YELLOW,
+        LogLevel.ERROR: Fore.RED,
+    }
+
+    def __init__(
+        self,
+        log_file: Optional[str] = None,
+        log_level: LogLevel = LogLevel.INFO,
+        tag_width: int = 10,
+        icons: Optional[Dict[str, str]] = None,
+        colors: Optional[Dict[LogLevel, str]] = None,
+        verbose: bool = True
+    ):
+        """
+        Initialize the logger.
+        
+        Args:
+            log_file: Optional file path for logging
+            log_level: Minimum log level to display
+            tag_width: Width for tag formatting
+            icons: Custom icons for different tags
+            colors: Custom colors for different log levels
+            verbose: Whether to output to console
+        """
+        init()  # Initialize colorama
+        self.log_file = log_file
+        self.log_level = log_level
+        self.tag_width = tag_width
+        self.icons = icons or self.DEFAULT_ICONS
+        self.colors = colors or self.DEFAULT_COLORS
+        self.verbose = verbose
+        
+        # Create log file directory if needed
+        if log_file:
+            os.makedirs(os.path.dirname(os.path.abspath(log_file)), exist_ok=True)
+
+    def _format_tag(self, tag: str) -> str:
+        """Format a tag with consistent width."""
+        return f"[{tag}]".ljust(self.tag_width, ".")
+
+    def _get_icon(self, tag: str) -> str:
+        """Get the icon for a tag, defaulting to info icon if not found."""
+        return self.icons.get(tag, self.icons['INFO'])
+
+    def _write_to_file(self, message: str):
+        """Write a message to the log file if configured."""
+        if self.log_file:
+            timestamp = datetime.now().strftime('%Y-%m-%d %H:%M:%S.%f')[:-3]
+            with open(self.log_file, 'a', encoding='utf-8') as f:
+                # Strip ANSI color codes for file output
+                clean_message = message.replace(Fore.RESET, '').replace(Style.RESET_ALL, '')
+                for color in vars(Fore).values():
+                    if isinstance(color, str):
+                        clean_message = clean_message.replace(color, '')
+                f.write(f"[{timestamp}] {clean_message}\n")
+
+    def _log(
+        self,
+        level: LogLevel,
+        message: str,
+        tag: str,
+        params: Optional[Dict[str, Any]] = None,
+        colors: Optional[Dict[str, str]] = None,
+        base_color: Optional[str] = None,
+        **kwargs
+    ):
+        """
+        Core logging method that handles message formatting and output.
+        
+        Args:
+            level: Log level for this message
+            message: Message template string
+            tag: Tag for the message
+            params: Parameters to format into the message
+            colors: Color overrides for specific parameters
+            base_color: Base color for the entire message
+        """
+        if level.value < self.log_level.value:
+            return
+
+        # Format the message with parameters if provided
+        if params:
+            try:
+                # First format the message with raw parameters
+                formatted_message = message.format(**params)
+                
+                # Then apply colors if specified
+                if colors:
+                    for key, color in colors.items():
+                        # Find the formatted value in the message and wrap it with color
+                        if key in params:
+                            value_str = str(params[key])
+                            formatted_message = formatted_message.replace(
+                                value_str, 
+                                f"{color}{value_str}{Style.RESET_ALL}"
+                            )
+                            
+            except KeyError as e:
+                formatted_message = f"LOGGING ERROR: Missing parameter {e} in message template"
+                level = LogLevel.ERROR
+        else:
+            formatted_message = message
+
+        # Construct the full log line
+        color = base_color or self.colors[level]
+        log_line = f"{color}{self._format_tag(tag)} {self._get_icon(tag)} {formatted_message}{Style.RESET_ALL}"
+
+        # Output to console if verbose
+        if self.verbose or kwargs.get("force_verbose", False):
+            print(log_line)
+
+        # Write to file if configured
+        self._write_to_file(log_line)
+
+    def debug(self, message: str, tag: str = "DEBUG", **kwargs):
+        """Log a debug message."""
+        self._log(LogLevel.DEBUG, message, tag, **kwargs)
+
+    def info(self, message: str, tag: str = "INFO", **kwargs):
+        """Log an info message."""
+        self._log(LogLevel.INFO, message, tag, **kwargs)
+
+    def success(self, message: str, tag: str = "SUCCESS", **kwargs):
+        """Log a success message."""
+        self._log(LogLevel.SUCCESS, message, tag, **kwargs)
+
+    def warning(self, message: str, tag: str = "WARNING", **kwargs):
+        """Log a warning message."""
+        self._log(LogLevel.WARNING, message, tag, **kwargs)
+
+    def error(self, message: str, tag: str = "ERROR", **kwargs):
+        """Log an error message."""
+        self._log(LogLevel.ERROR, message, tag, **kwargs)
+
+    def url_status(
+        self,
+        url: str,
+        success: bool,
+        timing: float,
+        tag: str = "FETCH",
+        url_length: int = 50
+    ):
+        """
+        Convenience method for logging URL fetch status.
+        
+        Args:
+            url: The URL being processed
+            success: Whether the operation was successful
+            timing: Time taken for the operation
+            tag: Tag for the message
+            url_length: Maximum length for URL in log
+        """
+        self._log(
+            level=LogLevel.SUCCESS if success else LogLevel.ERROR,
+            message="{url:.{url_length}}... | Status: {status} | Time: {timing:.2f}s",
+            tag=tag,
+            params={
+                "url": url,
+                "url_length": url_length,
+                "status": success,
+                "timing": timing
+            },
+            colors={
+                "status": Fore.GREEN if success else Fore.RED,
+                "timing": Fore.YELLOW
+            }
+        )
+
+    def error_status(
+        self,
+        url: str,
+        error: str,
+        tag: str = "ERROR",
+        url_length: int = 50
+    ):
+        """
+        Convenience method for logging error status.
+        
+        Args:
+            url: The URL being processed
+            error: Error message
+            tag: Tag for the message
+            url_length: Maximum length for URL in log
+        """
+        self._log(
+            level=LogLevel.ERROR,
+            message="{url:.{url_length}}... | Error: {error}",
+            tag=tag,
+            params={
+                "url": url,
+                "url_length": url_length,
+                "error": error
+            }
+        )
\ No newline at end of file
diff --git a/crawl4ai/async_webcrawler.py b/crawl4ai/async_webcrawler.py
index 79a17ac4..5fe7822c 100644
--- a/crawl4ai/async_webcrawler.py
+++ b/crawl4ai/async_webcrawler.py
@@ -15,6 +15,7 @@ from .extraction_strategy import *
 from .async_crawler_strategy import AsyncCrawlerStrategy, AsyncPlaywrightCrawlerStrategy, AsyncCrawlResponse
 from .cache_context import CacheMode, CacheContext, _legacy_to_cache_mode
 from .content_scrapping_strategy import WebScrapingStrategy
+from .async_logger import AsyncLogger
 
 from .config import (
     MIN_WORD_THRESHOLD, 
@@ -74,19 +75,29 @@ class AsyncWebCrawler:
             always_by_pass_cache: Deprecated, use always_bypass_cache instead
             base_directory: Base directory for storing cache
         """
-        init()
-        self.log_width = 10  # Width of "[COMPLETE]" 
-        self.tag_format = lambda tag: f"[{tag}]".ljust(self.log_width, ".")
-        self.log_icons = {
-            'INIT': '→',      # Alternative: '▶' or '►'
-            'READY': '✓',     # Alternative: '√'
-            'FETCH': '↓',     # Alternative: '▼'
-            'SCRAPE': '◆',    # Alternative: '♦'
-            'EXTRACT': '■',    # Alternative: '□'
-            'COMPLETE': '●',   # Alternative: '○'
-            'ERROR': '×' 
-        }        
-        self.crawler_strategy = crawler_strategy or AsyncPlaywrightCrawlerStrategy(**kwargs)
+        # init()
+        # self.log_width = 10  # Width of "[COMPLETE]" 
+        # self.tag_format = lambda tag: f"[{tag}]".ljust(self.log_width, ".")
+        # self.log_icons = {
+        #     'INIT': '→',      # Alternative: '▶' or '►'
+        #     'READY': '✓',     # Alternative: '√'
+        #     'FETCH': '↓',     # Alternative: '▼'
+        #     'SCRAPE': '◆',    # Alternative: '♦'
+        #     'EXTRACT': '■',    # Alternative: '□'
+        #     'COMPLETE': '●',   # Alternative: '○'
+        #     'ERROR': '×' 
+        # }        
+        self.verbose = kwargs.get("verbose", False)
+        self.logger = AsyncLogger(
+            log_file=os.path.join(base_directory, ".crawl4ai", "crawler.log"),
+            verbose=self.verbose,
+            tag_width=10
+        )
+        
+        self.crawler_strategy = crawler_strategy or AsyncPlaywrightCrawlerStrategy(
+            logger = self.logger,
+            **kwargs
+        )
         
         # Handle deprecated parameter
         if always_by_pass_cache is not None:
@@ -118,12 +129,13 @@ class AsyncWebCrawler:
 
     async def awarmup(self):
         """Initialize the crawler with warm-up sequence."""
-        if self.verbose:
-            print(f"{Fore.CYAN}{self.tag_format('INIT')} {self.log_icons['INIT']} Crawl4AI {crawl4ai_version}{Style.RESET_ALL}")
-            print(f"{Fore.CYAN}{self.tag_format('INIT')} {self.log_icons['INIT']} Warming up AsyncWebCrawler{Style.RESET_ALL}")
+        self.logger.info(f"Crawl4AI {crawl4ai_version}", tag="INIT")
+        # if self.verbose:
+        #     print(f"{Fore.CYAN}{self.tag_format('INIT')} {self.log_icons['INIT']} Crawl4AI {crawl4ai_version}{Style.RESET_ALL}")
+        #     print(f"{Fore.CYAN}{self.tag_format('INIT')} {self.log_icons['INIT']} Warming up AsyncWebCrawler{Style.RESET_ALL}")
         self.ready = True
-        if self.verbose:
-            print(f"{Fore.GREEN}{self.tag_format('READY')} {self.log_icons['READY']} AsyncWebCrawler initialized{Style.RESET_ALL}")
+        # if self.verbose:
+        #     print(f"{Fore.GREEN}{self.tag_format('READY')} {self.log_icons['READY']} AsyncWebCrawler initialized{Style.RESET_ALL}")
 
     async def arun(
         self,
@@ -234,8 +246,14 @@ class AsyncWebCrawler:
                     screenshot_data = cached_result.screenshot
                     if not screenshot_data:
                         cached_result = None
-                if verbose:
-                    print(f"{Fore.BLUE}{self.tag_format('FETCH')} {self.log_icons['FETCH']} Cache hit for {cache_context.display_url} | Status: {Fore.GREEN if bool(html) else Fore.RED}{bool(html)}{Style.RESET_ALL} | Time: {time.perf_counter() - start_time:.2f}s")
+                # if verbose:
+                #     print(f"{Fore.BLUE}{self.tag_format('FETCH')} {self.log_icons['FETCH']} Cache hit for {cache_context.display_url} | Status: {Fore.GREEN if bool(html) else Fore.RED}{bool(html)}{Style.RESET_ALL} | Time: {time.perf_counter() - start_time:.2f}s")
+                self.logger.url_status(
+                        url=cache_context.display_url,
+                        success=bool(html),
+                        timing=time.perf_counter() - start_time,
+                        tag="FETCH"
+                    )                    
 
 
             # Fetch fresh content if needed
@@ -252,8 +270,14 @@ class AsyncWebCrawler:
                 html = sanitize_input_encode(async_response.html)
                 screenshot_data = async_response.screenshot
                 t2 = time.perf_counter()
-                if verbose:
-                    print(f"{Fore.BLUE}{self.tag_format('FETCH')} {self.log_icons['FETCH']} Live fetch for {cache_context.display_url}... | Status: {Fore.GREEN if bool(html) else Fore.RED}{bool(html)}{Style.RESET_ALL} | Time: {t2 - t1:.2f}s")
+                self.logger.url_status(
+                    url=cache_context.display_url,
+                    success=bool(html),
+                    timing=t2 - t1,
+                    tag="FETCH"
+                )
+                # if verbose:
+                #     print(f"{Fore.BLUE}{self.tag_format('FETCH')} {self.log_icons['FETCH']} Live fetch for {cache_context.display_url}... | Status: {Fore.GREEN if bool(html) else Fore.RED}{bool(html)}{Style.RESET_ALL} | Time: {t2 - t1:.2f}s")
 
             # Process the HTML content
             crawl_result = await self.aprocess_html(
@@ -287,9 +311,21 @@ class AsyncWebCrawler:
             crawl_result.success = bool(html)
             crawl_result.session_id = kwargs.get("session_id", None)
 
-            if verbose:
-                print(f"{Fore.GREEN}{self.tag_format('COMPLETE')} {self.log_icons['COMPLETE']} {cache_context.display_url[:URL_LOG_SHORTEN_LENGTH]}... | Status: {Fore.GREEN if crawl_result.success else Fore.RED}{crawl_result.success} | {Fore.YELLOW}Total: {time.perf_counter() - start_time:.2f}s{Style.RESET_ALL}")
-
+            # if verbose:
+            #     print(f"{Fore.GREEN}{self.tag_format('COMPLETE')} {self.log_icons['COMPLETE']} {cache_context.display_url[:URL_LOG_SHORTEN_LENGTH]}... | Status: {Fore.GREEN if crawl_result.success else Fore.RED}{crawl_result.success} | {Fore.YELLOW}Total: {time.perf_counter() - start_time:.2f}s{Style.RESET_ALL}")
+            self.logger.success(
+                    message="{url:.50}... | Status: {status} | Total: {timing}",
+                    tag="COMPLETE",
+                    params={
+                        "url": cache_context.display_url,
+                        "status": crawl_result.success,
+                        "timing": f"{time.perf_counter() - start_time:.2f}s"
+                    },
+                    colors={
+                        "status": Fore.GREEN if crawl_result.success else Fore.RED,
+                        "timing": Fore.YELLOW
+                    }
+                )
 
             # Update cache if appropriate
             if cache_context.should_write() and not bool(cached_result):
@@ -300,7 +336,12 @@ class AsyncWebCrawler:
         except Exception as e:
             if not hasattr(e, "msg"):
                 e.msg = str(e)
-            print(f"{Fore.RED}{self.tag_format('ERROR')} {self.log_icons['ERROR']} Failed to crawl {cache_context.display_url[:URL_LOG_SHORTEN_LENGTH]}... | {e.msg}{Style.RESET_ALL}")
+            # print(f"{Fore.RED}{self.tag_format('ERROR')} {self.log_icons['ERROR']} Failed to crawl {cache_context.display_url[:URL_LOG_SHORTEN_LENGTH]}... | {e.msg}{Style.RESET_ALL}")
+            self.logger.error_status(
+                url=cache_context.display_url,
+                error=e.msg,
+                tag="ERROR"
+            )            
             return CrawlResult(
                 url=url, 
                 html="", 
@@ -362,7 +403,12 @@ class AsyncWebCrawler:
             domain = urlparse(url).netloc
             current_time = time.time()
             
-            print(f"{Fore.LIGHTBLACK_EX}{self.tag_format('PARALLEL')} Started task for {url[:50]}...{Style.RESET_ALL}")
+            # print(f"{Fore.LIGHTBLACK_EX}{self.tag_format('PARALLEL')} Started task for {url[:50]}...{Style.RESET_ALL}")
+            self.logger.debug(
+                message="Started task for {url:.50}...",
+                tag="PARALLEL",
+                params={"url": url}
+            )            
             
             # Get delay settings from kwargs or use defaults
             mean_delay = kwargs.get('mean_delay', 0.1)  # 0.5 seconds default mean delay
@@ -394,12 +440,26 @@ class AsyncWebCrawler:
                 )
 
         # Print start message
-        print(f"{Fore.CYAN}{self.tag_format('INIT')} {self.log_icons['INIT']} Starting concurrent crawling for {len(urls)} URLs...{Style.RESET_ALL}")
+        # print(f"{Fore.CYAN}{self.tag_format('INIT')} {self.log_icons['INIT']} Starting concurrent crawling for {len(urls)} URLs...{Style.RESET_ALL}")
+        self.logger.info(
+            message="Starting concurrent crawling for {count} URLs...",
+            tag="INIT",
+            params={"count": len(urls)}
+        )        
         start_time = time.perf_counter()
         tasks = [crawl_with_semaphore(url) for url in urls]
         results = await asyncio.gather(*tasks, return_exceptions=True)
         end_time = time.perf_counter()
-        print(f"{Fore.YELLOW}{self.tag_format('COMPLETE')} {self.log_icons['COMPLETE']} Concurrent crawling completed for {len(urls)} URLs | Total time: {end_time - start_time:.2f}s{Style.RESET_ALL}")
+        # print(f"{Fore.YELLOW}{self.tag_format('COMPLETE')} {self.log_icons['COMPLETE']} Concurrent crawling completed for {len(urls)} URLs | Total time: {end_time - start_time:.2f}s{Style.RESET_ALL}")
+        self.logger.success(
+            message="Concurrent crawling completed for {count} URLs | " + Fore.YELLOW + " Total time: {timing}" + Style.RESET_ALL,
+            tag="COMPLETE",
+            params={
+                "count": len(urls),
+                "timing": f"{end_time - start_time:.2f}s"
+            },
+            colors={"timing": Fore.YELLOW}
+        )        
         return [result if not isinstance(result, Exception) else str(result) for result in results]
 
 
@@ -451,9 +511,16 @@ class AsyncWebCrawler:
         links = result.get("links", [])
         metadata = result.get("metadata", {})
         
-        if verbose:
-            print(f"{Fore.MAGENTA}{self.tag_format('SCRAPE')} {self.log_icons['SCRAPE']} Processed {_url[:URL_LOG_SHORTEN_LENGTH]}...{Style.RESET_ALL} | Time: {int((time.perf_counter() - t1) * 1000)}ms")
-
+        # if verbose:
+        #     print(f"{Fore.MAGENTA}{self.tag_format('SCRAPE')} {self.log_icons['SCRAPE']} Processed {_url[:URL_LOG_SHORTEN_LENGTH]}...{Style.RESET_ALL} | Time: {int((time.perf_counter() - t1) * 1000)}ms")
+        self.logger.info(
+            message="Processed {url:.50}... | Time: {timing}ms",
+            tag="SCRAPE",
+            params={
+                "url": _url,
+                "timing": int((time.perf_counter() - t1) * 1000)
+            }
+        )
 
 
         if extracted_content is None and extraction_strategy and chunking_strategy and not isinstance(extraction_strategy, NoExtractionStrategy):
@@ -467,8 +534,17 @@ class AsyncWebCrawler:
                 sections = chunking_strategy.chunk(markdown)
                 extracted_content = extraction_strategy.run(url, sections)
                 extracted_content = json.dumps(extracted_content, indent=4, default=str, ensure_ascii=False)
-            if verbose:
-                print(f"{Fore.YELLOW}{self.tag_format('EXTRACT')} {self.log_icons['EXTRACT']} Completed for {_url[:URL_LOG_SHORTEN_LENGTH]}...{Style.RESET_ALL} | Time: {time.perf_counter() - t1:.2f}s{Style.RESET_ALL}")
+            # if verbose:
+                # print(f"{Fore.YELLOW}{self.tag_format('EXTRACT')} {self.log_icons['EXTRACT']} Completed for {_url[:URL_LOG_SHORTEN_LENGTH]}...{Style.RESET_ALL} | Time: {time.perf_counter() - t1:.2f}s{Style.RESET_ALL}")
+            self.logger.info(
+                message="Completed for {url:.50}... | Time: {timing}s",
+                tag="EXTRACT",
+                params={
+                    "url": _url,
+                    "timing": f"{time.perf_counter() - t1:.2f}"  # pre-format to 2 decimals, matching the print() this call replaces
+                }
+            )
+        
 
                 
 
diff --git a/crawl4ai/content_filter_strategy.py b/crawl4ai/content_filter_strategy.py
index 88375da9..88216f7f 100644
--- a/crawl4ai/content_filter_strategy.py
+++ b/crawl4ai/content_filter_strategy.py
@@ -8,6 +8,10 @@ from bs4 import BeautifulSoup, NavigableString, Tag
 from .utils import clean_tokens
 from abc import ABC, abstractmethod
 
+from snowballstemmer import stemmer
+
+# from nltk.stem import PorterStemmer
+# ps = PorterStemmer()
 class RelevantContentFilter(ABC):
     def __init__(self, user_query: str = None):
         self.user_query = user_query
@@ -252,7 +256,7 @@ class RelevantContentFilter(ABC):
             return str(tag)  # Fallback to original if anything fails
 
 class BM25ContentFilter(RelevantContentFilter):
-    def __init__(self, user_query: str = None, bm25_threshold: float = 1.0):
+    def __init__(self, user_query: str = None, bm25_threshold: float = 1.0, language: str = 'english'):
         super().__init__(user_query=user_query)
         self.bm25_threshold = bm25_threshold
         self.priority_tags = {
@@ -268,6 +272,7 @@ class BM25ContentFilter(RelevantContentFilter):
             'pre': 1.5,
             'th': 1.5,  # Table headers
         }
+        self.stemmer = stemmer(language)
 
     def filter_content(self, html: str) -> List[str]:
         """Implements content filtering using BM25 algorithm with priority tag handling"""
@@ -282,58 +287,42 @@ class BM25ContentFilter(RelevantContentFilter):
         if not candidates:
             return []
 
-        # Split into priority and regular candidates
-        priority_candidates = []
-        regular_candidates = []
+        # Tokenize corpus
+        # tokenized_corpus = [chunk.lower().split() for _, chunk, _, _ in candidates]
+        # tokenized_query = query.lower().split()
+                
+        # tokenized_corpus = [[ps.stem(word) for word in chunk.lower().split()] 
+        #                 for _, chunk, _, _ in candidates]
+        # tokenized_query = [ps.stem(word) for word in query.lower().split()]        
         
-        for index, chunk, tag_type, tag in candidates:
-            if tag.name in self.priority_tags:
-                priority_candidates.append((index, chunk, tag_type, tag))
-            else:
-                regular_candidates.append((index, chunk, tag_type, tag))
+        tokenized_corpus = [[self.stemmer.stemWord(word) for word in chunk.lower().split()] 
+                   for _, chunk, _, _ in candidates]
+        tokenized_query = [self.stemmer.stemWord(word) for word in query.lower().split()]
 
-        # Process regular content with BM25
-        tokenized_corpus = [chunk.lower().split() for _, chunk, _, _ in regular_candidates]
-        tokenized_query = query.lower().split()
-        
         # Clean from stop words and noise
         tokenized_corpus = [clean_tokens(tokens) for tokens in tokenized_corpus]
         tokenized_query = clean_tokens(tokenized_query)
-        
+
         bm25 = BM25Okapi(tokenized_corpus)
         scores = bm25.get_scores(tokenized_query)
 
-        # Score and boost regular candidates
-        scored_candidates = [
-            (score * self.priority_tags.get(tag.name, 1.0), index, chunk, tag_type, tag)
-            for score, (index, chunk, tag_type, tag) in zip(scores, regular_candidates)
+        # Adjust scores with tag weights
+        adjusted_candidates = []
+        for score, (index, chunk, tag_type, tag) in zip(scores, candidates):
+            tag_weight = self.priority_tags.get(tag.name, 1.0)
+            adjusted_score = score * tag_weight
+            adjusted_candidates.append((adjusted_score, index, chunk, tag))
+
+        # Filter candidates by threshold
+        selected_candidates = [
+            (index, chunk, tag) for adjusted_score, index, chunk, tag in adjusted_candidates
+            if adjusted_score >= self.bm25_threshold
         ]
-        scored_candidates.sort(key=lambda x: x[0], reverse=True)
-
-        # Process scored candidates
-        selected_tags = set()
-        selected_candidates = []
-
-        # First add all priority candidates
-        for index, chunk, tag_type, tag in priority_candidates:
-            tag_id = id(tag)
-            if tag_id not in selected_tags:
-                selected_candidates.append((index, chunk, tag))
-                selected_tags.add(tag_id)
-
-        # Then add scored regular candidates that meet threshold
-        for score, index, chunk, tag_type, tag in scored_candidates:
-            if score < self.bm25_threshold:
-                continue
-            tag_id = id(tag)
-            if tag_id not in selected_tags:
-                selected_candidates.append((index, chunk, tag))
-                selected_tags.add(tag_id)
 
         if not selected_candidates:
             return []
 
-        # Sort by original document order
+        # Sort selected candidates by original document order
         selected_candidates.sort(key=lambda x: x[0])
-        return [self.clean_element(tag) for _, _, tag in selected_candidates]
 
+        return [self.clean_element(tag) for _, _, tag in selected_candidates]
diff --git a/crawl4ai/content_scrapping_strategy.py b/crawl4ai/content_scrapping_strategy.py
index d16b0680..0f470671 100644
--- a/crawl4ai/content_scrapping_strategy.py
+++ b/crawl4ai/content_scrapping_strategy.py
@@ -149,6 +149,15 @@ class ContentScrapingStrategy(ABC):
         pass
 
 class WebScrapingStrategy(ContentScrapingStrategy):
+    def __init__(self, logger=None):
+        self.logger = logger
+
+    def _log(self, level, message, tag="SCRAPE", **kwargs):
+        """Helper method to safely use logger."""
+        if self.logger:
+            log_method = getattr(self.logger, level)
+            log_method(message=message, tag=tag, **kwargs)
+                
     def scrap(self, url: str, html: str, **kwargs) -> Dict[str, Any]:
         return self._get_content_of_website_optimized(url, html, is_async=False, **kwargs)
 
@@ -167,7 +176,12 @@ class WebScrapingStrategy(ContentScrapingStrategy):
         try:
             meta = extract_metadata("", soup)
         except Exception as e:
-            print('Error extracting metadata:', str(e))
+            self._log('error', 
+                message="Error extracting metadata: {error}",
+                tag="SCRAPE",
+                params={"error": str(e)}
+            )            
+            # print('Error extracting metadata:', str(e))
             meta = {}
         
         
@@ -430,9 +444,12 @@ class WebScrapingStrategy(ContentScrapingStrategy):
                 try:
                     remove_unwanted_attributes(element, IMPORTANT_ATTRS, kwargs.get('keep_data_attributes', False))
                 except Exception as e:
-                    print('Error removing unwanted attributes:', str(e))
-                
-
+                    # print('Error removing unwanted attributes:', str(e))
+                    self._log('error',
+                        message="Error removing unwanted attributes: {error}",
+                        tag="SCRAPE",
+                        params={"error": str(e)}
+                    )
                 # Process children
                 for child in list(element.children):
                     if isinstance(child, NavigableString) and not isinstance(child, Comment):
@@ -453,7 +470,12 @@ class WebScrapingStrategy(ContentScrapingStrategy):
 
                 return keep_element
             except Exception as e:
-                print('Error processing element:', str(e))
+                # print('Error processing element:', str(e))
+                self._log('error',
+                    message="Error processing element: {error}",
+                    tag="SCRAPE",
+                    params={"error": str(e)}
+                )                
                 return False
        
         process_element(body)
@@ -516,7 +538,10 @@ class WebScrapingStrategy(ContentScrapingStrategy):
             str_body = body.encode_contents().decode('utf-8')
             
             print(f"[LOG] 😧 Error: After processing the crawled HTML and removing irrelevant tags, nothing was left in the page. Check the markdown for further details.")
-
+            self._log('error',
+                message="After processing the crawled HTML and removing irrelevant tags, nothing was left in the page. Check the markdown for further details.",
+                tag="SCRAPE"
+            )
 
         cleaned_html = str_body.replace('\n\n', '\n').replace('  ', ' ')
 
@@ -525,6 +550,13 @@ class WebScrapingStrategy(ContentScrapingStrategy):
             h.update_params(**kwargs.get('html2text', {}))            
             markdown = h.handle(cleaned_html)
         except Exception as e:
+            if not h:
+                h = CustomHTML2Text()
+            self._log('error',
+                message="Error converting HTML to markdown: {error}",
+                tag="SCRAPE",
+                params={"error": str(e)}
+            )
             markdown = h.handle(sanitize_html(cleaned_html))
         markdown = markdown.replace('    ```', '```')
 
diff --git a/crawl4ai/version_manager.py b/crawl4ai/version_manager.py
index 07e0c0e9..8ae2de2e 100644
--- a/crawl4ai/version_manager.py
+++ b/crawl4ai/version_manager.py
@@ -20,11 +20,11 @@ class VersionManager:
             
     def update_version(self):
         """Update the version file to current library version"""
-        self.version_file.write_text(__version__)
+        self.version_file.write_text(__version__.__version__)
         
     def needs_update(self):
         """Check if database needs update based on version"""
         installed = self.get_installed_version()
-        current = version.parse(__version__)
+        current = version.parse(__version__.__version__)
         return installed is None or installed < current
 
diff --git a/docker-compose.hub.yml b/docker-compose.hub.yml
new file mode 100644
index 00000000..9bcfa982
--- /dev/null
+++ b/docker-compose.hub.yml
@@ -0,0 +1,27 @@
+services:
+  crawl4ai:
+    image: unclecode/crawl4ai:basic  # Pull image from Docker Hub
+    ports:
+      - "11235:11235"  # FastAPI server
+      - "8000:8000"    # Alternative port
+      - "9222:9222"    # Browser debugging
+      - "8080:8080"    # Additional port
+    environment:
+      - CRAWL4AI_API_TOKEN=${CRAWL4AI_API_TOKEN:-}  # Optional API token
+      - OPENAI_API_KEY=${OPENAI_API_KEY:-}          # Optional OpenAI API key
+      - CLAUDE_API_KEY=${CLAUDE_API_KEY:-}          # Optional Claude API key
+    volumes:
+      - /dev/shm:/dev/shm  # Shared memory for browser operations
+    deploy:
+      resources:
+        limits:
+          memory: 4G
+        reservations:
+          memory: 1G
+    restart: unless-stopped
+    healthcheck:
+      test: ["CMD", "curl", "-f", "http://localhost:11235/health"]
+      interval: 30s
+      timeout: 10s
+      retries: 3
+      start_period: 40s
diff --git a/docker-compose.local.yml b/docker-compose.local.yml
new file mode 100644
index 00000000..7dc41b47
--- /dev/null
+++ b/docker-compose.local.yml
@@ -0,0 +1,33 @@
+services:
+  crawl4ai:
+    build:
+      context: .
+      dockerfile: Dockerfile
+      args:
+        PYTHON_VERSION: "3.10"  # quoted: a bare 3.10 is parsed as the YAML float 3.1
+        INSTALL_TYPE: all
+        ENABLE_GPU: false
+    ports:
+      - "11235:11235"  # FastAPI server
+      - "8000:8000"    # Alternative port
+      - "9222:9222"    # Browser debugging
+      - "8080:8080"    # Additional port
+    environment:
+      - CRAWL4AI_API_TOKEN=${CRAWL4AI_API_TOKEN:-}  # Optional API token
+      - OPENAI_API_KEY=${OPENAI_API_KEY:-}          # Optional OpenAI API key
+      - CLAUDE_API_KEY=${CLAUDE_API_KEY:-}          # Optional Claude API key
+    volumes:
+      - /dev/shm:/dev/shm  # Shared memory for browser operations
+    deploy:
+      resources:
+        limits:
+          memory: 4G
+        reservations:
+          memory: 1G
+    restart: unless-stopped
+    healthcheck:
+      test: ["CMD", "curl", "-f", "http://localhost:11235/health"]
+      interval: 30s
+      timeout: 10s
+      retries: 3
+      start_period: 40s
\ No newline at end of file
diff --git a/docker-compose.yml b/docker-compose.yml
index ef0dc9e4..1097ef11 100644
--- a/docker-compose.yml
+++ b/docker-compose.yml
@@ -1,5 +1,3 @@
-version: '3.8'
-
 services:
   crawl4ai:
     build:
@@ -9,15 +7,18 @@ services:
         PYTHON_VERSION: 3.10
         INSTALL_TYPE: all
         ENABLE_GPU: false
+    profiles: ["local"]
     ports:
-      - "11235:11235"  # FastAPI server
-      - "8000:8000"    # Alternative port
-      - "9222:9222"    # Browser debugging
-      - "8080:8080"    # Additional port
+      - "11235:11235"
+      - "8000:8000"
+      - "9222:9222"
+      - "8080:8080"
     environment:
-      - CRAWL4AI_API_TOKEN=${CRAWL4AI_API_TOKEN:-}  # Optional API token
+      - CRAWL4AI_API_TOKEN=${CRAWL4AI_API_TOKEN:-}
+      - OPENAI_API_KEY=${OPENAI_API_KEY:-}
+      - CLAUDE_API_KEY=${CLAUDE_API_KEY:-}
     volumes:
-      - /dev/shm:/dev/shm  # Shared memory for browser operations
+      - /dev/shm:/dev/shm
     deploy:
       resources:
         limits:
@@ -30,4 +31,32 @@ services:
       interval: 30s
       timeout: 10s
       retries: 3
-      start_period: 40s
\ No newline at end of file
+      start_period: 40s
+
+  crawl4ai-hub:
+    image: unclecode/crawl4ai:basic
+    profiles: ["hub"]
+    ports:
+      - "11235:11235"
+      - "8000:8000"
+      - "9222:9222"
+      - "8080:8080"
+    environment:
+      - CRAWL4AI_API_TOKEN=${CRAWL4AI_API_TOKEN:-}
+      - OPENAI_API_KEY=${OPENAI_API_KEY:-}
+      - CLAUDE_API_KEY=${CLAUDE_API_KEY:-}
+    volumes:
+      - /dev/shm:/dev/shm
+    deploy:
+      resources:
+        limits:
+          memory: 4G
+        reservations:
+          memory: 1G
+    restart: unless-stopped
+    healthcheck:
+      test: ["CMD", "curl", "-f", "http://localhost:11235/health"]
+      interval: 30s
+      timeout: 10s
+      retries: 3
+      start_period: 40s
diff --git a/docs/examples/v0.3.74.overview.py b/docs/examples/v0.3.74.overview.py
index ec3a7d73..00296740 100644
--- a/docs/examples/v0.3.74.overview.py
+++ b/docs/examples/v0.3.74.overview.py
@@ -1,9 +1,16 @@
+import os, sys
+# append the parent directory to the sys.path
+parent_dir = os.path.dirname(os.path.dirname(os.path.abspath(__file__)))
+sys.path.append(parent_dir)
+parent_parent_dir = os.path.dirname(parent_dir)
+sys.path.append(parent_parent_dir)
+__location__ = os.path.realpath(os.path.join(os.getcwd(), os.path.dirname(__file__)))
+__data__ = os.path.join(__location__, "__data")
 import asyncio
-import os
 from pathlib import Path
 import aiohttp
 import json
-from crawl4ai import AsyncWebCrawler
+from crawl4ai import AsyncWebCrawler, CacheMode
 from crawl4ai.content_filter_strategy import BM25ContentFilter
 
 # 1. File Download Processing Example
@@ -32,7 +39,8 @@ async def download_example():
                 console.log('No .exe download link found');
             }
             """,
-            wait_for=5  # Wait 5 seconds to ensure download starts
+            delay_before_return_html=1,  # Wait 1 second to ensure download starts
+            cache_mode=CacheMode.BYPASS
         )
         
         if result.downloaded_files:
@@ -50,22 +58,32 @@ async def content_filtering_example():
     async with AsyncWebCrawler(verbose=True) as crawler:
         # Create filter with custom query for OpenAI's blog
         content_filter = BM25ContentFilter(
-            user_query="AI language models research innovation",
+            # user_query="Investment and fundraising",
+            # user_query="Robotic",
             bm25_threshold=1.0
         )
         
         result = await crawler.arun(
-            url="https://openai.com/blog",
-            content_filter=content_filter
+            url="https://techcrunch.com/",
+            content_filter=content_filter,
+            cache_mode=CacheMode.BYPASS
         )
         
-        print(f"Filtered content: {result.extracted_content}")
+        print(f"Filtered content: {len(result.fit_markdown)}")
+        print(f"Filtered content: {result.fit_markdown}")
+        
+        # Save html 
+        with open(os.path.join(__data__, "techcrunch.html"), "w") as f:
+            f.write(result.fit_html)
+        
+        with open(os.path.join(__data__, "filtered_content.md"), "w") as f:
+            f.write(result.fit_markdown)
 
 # 3. Local File and Raw HTML Processing Example
 async def local_and_raw_html_example():
     """Example of processing local files and raw HTML"""
     # Create a sample HTML file
-    sample_file = "sample.html"
+    sample_file = os.path.join(__data__, "sample.html")
     with open(sample_file, "w") as f:
         f.write("""
         <html><body>
@@ -112,21 +130,18 @@ async def browser_management_example():
         headless=False,
         verbose=True
     ) as crawler:
+
+        result = await crawler.arun(
+            url="https://crawl4ai.com",
+            # session_id="persistent_session_1",
+            cache_mode=CacheMode.BYPASS
+        )        
         # Use GitHub as an example - it's a good test for browser management
         # because it requires proper browser handling
         result = await crawler.arun(
             url="https://github.com/trending",
-            session_id="persistent_session_1",
-            js_code="""
-            // Custom JavaScript to execute on GitHub's trending page
-            const repos = document.querySelectorAll('article.Box-row');
-            const data = Array.from(repos).map(repo => ({
-                name: repo.querySelector('h2')?.textContent?.trim(),
-                description: repo.querySelector('p')?.textContent?.trim(),
-                language: repo.querySelector('[itemprop="programmingLanguage"]')?.textContent?.trim()
-            }));
-            console.log('Trending repositories:', JSON.stringify(data, null, 2));
-            """
+            # session_id="persistent_session_1",
+            cache_mode=CacheMode.BYPASS
         )
         
         print("\nBrowser session result:", result.success)
@@ -136,6 +151,8 @@ async def browser_management_example():
 # 5. API Usage Example
 async def api_example():
     """Example of using the new API endpoints"""
+    api_token = os.getenv('CRAWL4AI_API_TOKEN') or "test_api_code"
+    headers = {'Authorization': f'Bearer {api_token}'}    
     async with aiohttp.ClientSession() as session:
         # Submit crawl job
         crawl_request = {
@@ -143,52 +160,78 @@ async def api_example():
             "extraction_config": {
                 "type": "json_css",
                 "params": {
-                    "selectors": {
-                        "titles": ".title a",
-                        "scores": ".score",
-                        "comments": ".comment-tree"
+                    "schema": {
+                        "name": "Hacker News Articles",
+                        "baseSelector": ".athing",
+                        "fields": [
+                            {
+                                "name": "title",
+                                "selector": ".title a",
+                                "type": "text"
+                            },
+                            {
+                                "name": "score",
+                                "selector": ".score",
+                                "type": "text"
+                            },
+                            {
+                                "name": "url",
+                                "selector": ".title a",
+                                "type": "attribute",
+                                "attribute": "href"
+                            }
+                        ]
                     }
                 }
             },
             "crawler_params": {
                 "headless": True,
-                "use_managed_browser": True
+                # "use_managed_browser": True
             },
-            "screenshot": True,
-            "magic": True
+            "cache_mode": "bypass",
+            # "screenshot": True,
+            # "magic": True
         }
         
         async with session.post(
             "http://localhost:11235/crawl",
-            json=crawl_request
+            json=crawl_request,
+            headers=headers
         ) as response:
             task_data = await response.json()
             task_id = task_data["task_id"]
             
             # Check task status
-            async with session.get(
-                f"http://localhost:11235/task/{task_id}"
-            ) as status_response:
-                result = await status_response.json()
-                print(f"Task result: {result}")
+            while True:
+                async with session.get(
+                    f"http://localhost:11235/task/{task_id}",
+                    headers=headers
+                ) as status_response:
+                    result = await status_response.json()
+                    print(f"Task result: {result}")
+                    
+                    if result["status"] in ("completed", "failed"):  # stop on any terminal state so a failed task cannot spin forever
+                        break
+                    else:
+                        await asyncio.sleep(1)
 
 # Main execution
 async def main():
-    print("Running Crawl4AI feature examples...")
+    # print("Running Crawl4AI feature examples...")
     
-    print("\n1. Running Download Example:")
+    # print("\n1. Running Download Example:")
     await download_example()
     
-    print("\n2. Running Content Filtering Example:")
+    # print("\n2. Running Content Filtering Example:")
     await content_filtering_example()
     
-    print("\n3. Running Local and Raw HTML Example:")
+    # print("\n3. Running Local and Raw HTML Example:")
     await local_and_raw_html_example()
     
-    print("\n4. Running Browser Management Example:")
+    # print("\n4. Running Browser Management Example:")
     await browser_management_example()
     
-    print("\n5. Running API Example:")
+    # print("\n5. Running API Example:")
     await api_example()
 
 if __name__ == "__main__":
diff --git a/docs/md_v2/basic/docker-deploymeny.md b/docs/md_v2/basic/docker-deploymeny.md
index 30555708..87e468aa 100644
--- a/docs/md_v2/basic/docker-deploymeny.md
+++ b/docs/md_v2/basic/docker-deploymeny.md
@@ -15,6 +15,94 @@ docker run -p 11235:11235 unclecode/crawl4ai:basic
 docker run -p 11235:11235 -e CRAWL4AI_API_TOKEN=your_secret_token unclecode/crawl4ai:basic
 ```
 
+## Running with Docker Compose 🐳
+
+### Use Docker Compose (From Local Dockerfile or Docker Hub)
+
+Crawl4AI provides flexibility to use Docker Compose for managing your containerized services. You can either build the image locally from the provided `Dockerfile` or use the pre-built image from Docker Hub.
+
+### **Option 1: Using Docker Compose to Build Locally**
+If you want to build the image locally, use the provided `docker-compose.local.yml` file.
+
+```bash
+docker-compose -f docker-compose.local.yml up -d
+```
+
+This will:
+1. Build the Docker image from the provided `Dockerfile`.
+2. Start the container and expose it on `http://localhost:11235`.
+
+---
+
+### **Option 2: Using Docker Compose with Pre-Built Image from Hub**
+If you prefer using the pre-built image on Docker Hub, use the `docker-compose.hub.yml` file.
+
+```bash
+docker-compose -f docker-compose.hub.yml up -d
+```
+
+This will:
+1. Pull the pre-built image `unclecode/crawl4ai:basic` (or `all`, depending on your configuration).
+2. Start the container and expose it on `http://localhost:11235`.
+
+---
+
+### **Stopping the Running Services**
+
+To stop the services started via Docker Compose, you can use:
+
+```bash
+docker-compose -f docker-compose.local.yml down
+# OR
+docker-compose -f docker-compose.hub.yml down
+```
+
+If the containers don’t stop and the application is still running, check the running containers:
+
+```bash
+docker ps
+```
+
+Find the `CONTAINER ID` of the running service and stop it forcefully:
+
+```bash
+docker stop <CONTAINER_ID>
+```
+
+---
+
+### **Debugging with Docker Compose**
+
+- **Check Logs**: To view the container logs:
+  ```bash
+  docker-compose -f docker-compose.local.yml logs -f
+  ```
+
+- **Remove Orphaned Containers**: If the service is still running unexpectedly:
+  ```bash
+  docker-compose -f docker-compose.local.yml down --remove-orphans
+  ```
+
+- **Manually Remove Network**: If the network is still in use:
+  ```bash
+  docker network ls
+  docker network rm crawl4ai_default
+  ```
+
+---
+
+### Why Use Docker Compose?
+
+Docker Compose is the recommended way to deploy Crawl4AI because:
+1. It simplifies multi-container setups.
+2. It lets you define environment variables, resources, and ports in a single file.
+3. It makes it easier to switch between local development and production-ready images.
+
+For example, your `docker-compose.yml` could include API keys, token settings, and memory limits, making deployment quick and consistent.
+
+
+
+
 ## API Security 🔒
 
 ### Understanding CRAWL4AI_API_TOKEN
diff --git a/main.py b/main.py
index ee5f7fc6..6d217410 100644
--- a/main.py
+++ b/main.py
@@ -26,6 +26,7 @@ from enum import Enum
 from dataclasses import dataclass
 import json
 from crawl4ai import AsyncWebCrawler, CrawlResult, CacheMode
+from crawl4ai.config import MIN_WORD_THRESHOLD
 from crawl4ai.extraction_strategy import (
     LLMExtractionStrategy,
     CosineStrategy,
@@ -53,12 +54,20 @@ class ExtractionConfig(BaseModel):
     type: CrawlerType
     params: Dict[str, Any] = {}
 
+class ChunkingStrategy(BaseModel):
+    type: str
+    params: Dict[str, Any] = {}
+
+class ContentFilter(BaseModel):
+    type: str = "bm25"
+    params: Dict[str, Any] = {}
+
 class CrawlRequest(BaseModel):
     urls: Union[HttpUrl, List[HttpUrl]]
+    word_count_threshold: int = MIN_WORD_THRESHOLD
     extraction_config: Optional[ExtractionConfig] = None
-    crawler_params: Dict[str, Any] = {}
-    priority: int = Field(default=5, ge=1, le=10)
-    ttl: Optional[int] = 3600
+    chunking_strategy: Optional[ChunkingStrategy] = None
+    content_filter: Optional[ContentFilter] = None
     js_code: Optional[List[str]] = None
     wait_for: Optional[str] = None
     css_selector: Optional[str] = None
@@ -66,7 +75,10 @@ class CrawlRequest(BaseModel):
     magic: bool = False
     extra: Optional[Dict[str, Any]] = {}
     session_id: Optional[str] = None
-    cache_mode: Optional[CacheMode] = None
+    cache_mode: Optional[CacheMode] = CacheMode.ENABLED
+    priority: int = Field(default=5, ge=1, le=10)
+    ttl: Optional[int] = 3600    
+    crawler_params: Dict[str, Any] = {}
 
 @dataclass
 class TaskInfo:
@@ -280,6 +292,7 @@ class CrawlerService:
                     if isinstance(request.urls, list):
                         results = await crawler.arun_many(
                             urls=[str(url) for url in request.urls],
+                            word_count_threshold=request.word_count_threshold,  # honor the per-request value (defaults to MIN_WORD_THRESHOLD)
                             extraction_strategy=extraction_strategy,
                             js_code=request.js_code,
                             wait_for=request.wait_for,
@@ -287,6 +300,7 @@ class CrawlerService:
                             screenshot=request.screenshot,
                             magic=request.magic,
                             session_id=request.session_id,
+                            cache_mode=request.cache_mode,
                             **request.extra,
                         )
                     else:
@@ -299,6 +313,7 @@ class CrawlerService:
                             screenshot=request.screenshot,
                             magic=request.magic,
                             session_id=request.session_id,
+                            cache_mode=request.cache_mode,
                             **request.extra,
                         )
 
diff --git a/requirements.txt b/requirements.txt
index e6294cc5..ed259ac9 100644
--- a/requirements.txt
+++ b/requirements.txt
@@ -12,4 +12,5 @@ tf-playwright-stealth~=1.0
 xxhash~=3.4
 rank-bm25~=0.2
 aiofiles~=24.0
-colorama~=0.4
\ No newline at end of file
+colorama~=0.4
+snowballstemmer~=2.2
\ No newline at end of file

From 73658c758affac33d1c96ce274735025012da370 Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Tue, 19 Nov 2024 16:10:43 +0800
Subject: [PATCH 046/115] chore: update .gitignore to include manage-collab.sh

---
 .gitignore | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/.gitignore b/.gitignore
index 0acec10f..da4b5f88 100644
--- a/.gitignore
+++ b/.gitignore
@@ -210,4 +210,5 @@ git_issues.md
 .issues/
 .docs/
 .issues/
-.gitboss/
\ No newline at end of file
+.gitboss/
+manage-collab.sh 
\ No newline at end of file

From 593c7ad307489edc6a12f2f594bc7827aacbc6f7 Mon Sep 17 00:00:00 2001
From: ntohidikplay <“nasrin@kplay”.team>
Date: Tue, 19 Nov 2024 11:45:26 +0100
Subject: [PATCH 047/115] test: trying to push to main

---
 test.txt | 0
 1 file changed, 0 insertions(+), 0 deletions(-)
 create mode 100644 test.txt

diff --git a/test.txt b/test.txt
new file mode 100644
index 00000000..e69de29b

From 3aae30ed2a2fdd57e1bb9b6374238247d1013974 Mon Sep 17 00:00:00 2001
From: ntohidikplay <“nasrin@kplay”.team>
Date: Tue, 19 Nov 2024 11:57:07 +0100
Subject: [PATCH 048/115] test1: trying to push to main

---
 test1.txt | 0
 1 file changed, 0 insertions(+), 0 deletions(-)
 create mode 100644 test1.txt

diff --git a/test1.txt b/test1.txt
new file mode 100644
index 00000000..e69de29b

From 2f19d386930b48f6758053dd4791b3da9e3a0f29 Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Tue, 19 Nov 2024 19:02:41 +0800
Subject: [PATCH 049/115] Update .gitignore to include .gitboss/ and
 todo_executor.md

---
 .gitignore | 4 +++-
 1 file changed, 3 insertions(+), 1 deletion(-)

diff --git a/.gitignore b/.gitignore
index 4c3e151e..b92a0b0d 100644
--- a/.gitignore
+++ b/.gitignore
@@ -208,4 +208,6 @@ git_issues.md
 .tests/
 .issues/
 .docs/
-.issues/
\ No newline at end of file
+.issues/
+.gitboss/
+todo_executor.md
\ No newline at end of file

From fbcff85ecb6d189fe77ca979017de9e3415481ce Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Tue, 19 Nov 2024 19:03:23 +0800
Subject: [PATCH 050/115] Remove test files

---
 test.txt  | 0
 test1.txt | 0
 2 files changed, 0 insertions(+), 0 deletions(-)
 delete mode 100644 test.txt
 delete mode 100644 test1.txt

diff --git a/test.txt b/test.txt
deleted file mode 100644
index e69de29b..00000000
diff --git a/test1.txt b/test1.txt
deleted file mode 100644
index e69de29b..00000000

From a6dad3fc6d436af25f65c083c0f3cb2d6f8f9fc1 Mon Sep 17 00:00:00 2001
From: ntohidikplay <“nasrin@kplay”.team>
Date: Tue, 19 Nov 2024 12:09:33 +0100
Subject: [PATCH 051/115] test: trying to push to 0.3.74

---
 test3.txt | 0
 1 file changed, 0 insertions(+), 0 deletions(-)
 create mode 100644 test3.txt

diff --git a/test3.txt b/test3.txt
new file mode 100644
index 00000000..e69de29b

From f2cb7d506dbe78bd29d6d6b32bd56f43ec44b352 Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Tue, 19 Nov 2024 19:12:14 +0800
Subject: [PATCH 052/115] Delete test3.txt

---
 test3.txt | 0
 1 file changed, 0 insertions(+), 0 deletions(-)
 delete mode 100644 test3.txt

diff --git a/test3.txt b/test3.txt
deleted file mode 100644
index e69de29b..00000000

From b654c49e55194da47945e726fe18a5fbded68062 Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Tue, 19 Nov 2024 19:32:06 +0800
Subject: [PATCH 053/115] Update .gitignore to exclude additional scripts and
 files

---
 .gitignore | 4 +++-
 1 file changed, 3 insertions(+), 1 deletion(-)

diff --git a/.gitignore b/.gitignore
index b92a0b0d..de75f544 100644
--- a/.gitignore
+++ b/.gitignore
@@ -210,4 +210,6 @@ git_issues.md
 .docs/
 .issues/
 .gitboss/
-todo_executor.md
\ No newline at end of file
+todo_executor.md
+protect-all-except-feature.sh
+manage-collab.sh
\ No newline at end of file

From 2bdec1fa5a8d13f66598e15ff37d45ef75d5e830 Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Tue, 19 Nov 2024 19:33:04 +0800
Subject: [PATCH 054/115] chore: add manage-collab.sh to .gitignore

---
 .gitignore | 1 +
 1 file changed, 1 insertion(+)

diff --git a/.gitignore b/.gitignore
index da4b5f88..0fb09933 100644
--- a/.gitignore
+++ b/.gitignore
@@ -211,4 +211,5 @@ git_issues.md
 .docs/
 .issues/
 .gitboss/
+
 manage-collab.sh 
\ No newline at end of file

From d418a04602ebe32d68d248a2995488beec768c61 Mon Sep 17 00:00:00 2001
From: Darwing Medina <darwing1210@gmail.com>
Date: Wed, 20 Nov 2024 04:52:11 -0600
Subject: [PATCH 055/115] Fix #260 prevent passing duplicated kwargs to
 scrapping_strategy (#269)

Thank you for the suggestions. It totally makes sense now. Change to pop operator.
---
 crawl4ai/async_webcrawler.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/crawl4ai/async_webcrawler.py b/crawl4ai/async_webcrawler.py
index 38e429ca..fb8c5290 100644
--- a/crawl4ai/async_webcrawler.py
+++ b/crawl4ai/async_webcrawler.py
@@ -197,8 +197,8 @@ class AsyncWebCrawler:
                 html,
                 word_count_threshold=word_count_threshold,
                 css_selector=css_selector,
-                only_text=kwargs.get("only_text", False),
-                image_description_min_word_threshold=kwargs.get(
+                only_text=kwargs.pop("only_text", False),
+                image_description_min_word_threshold=kwargs.pop(
                     "image_description_min_word_threshold", IMAGE_DESCRIPTION_MIN_WORD_THRESHOLD
                 ),
                 **kwargs,

From 3439f7886d170e05e0c97c804b1057187325c2a2 Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?=E7=A8=8B=E5=BA=8F=E5=91=98=E9=98=BF=E6=B1=9F=28Relakkes?=
 =?UTF-8?q?=29?= <relakkes@gmail.com>
Date: Wed, 20 Nov 2024 20:30:25 +0800
Subject: [PATCH 056/115] fix: crawler strategy exception handling and fixes
 (#271)

---
 crawl4ai/crawler_strategy.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/crawl4ai/crawler_strategy.py b/crawl4ai/crawler_strategy.py
index ce802e49..898dcfa8 100644
--- a/crawl4ai/crawler_strategy.py
+++ b/crawl4ai/crawler_strategy.py
@@ -283,7 +283,7 @@ class LocalSeleniumCrawlerStrategy(CrawlerStrategy):
                 print(f"[LOG] ✅ Crawled {url} successfully!")
             
             return html
-        except InvalidArgumentException:
+        except InvalidArgumentException as e:
             if not hasattr(e, 'msg'):
                 e.msg = sanitize_input_encode(str(e))
             raise InvalidArgumentException(f"Failed to crawl {url}: {e.msg}")

From dbb751c8f09f76ffce4046784c2cd2b0021de7d0 Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Thu, 21 Nov 2024 18:21:43 +0800
Subject: [PATCH 057/115] In this commit, we introduce the new concept of
 MarkdownGenerationStrategy, which allows us to expand our future strategies
 to generate better markdown. Right now, we generate raw markdown as we were
 doing before. We have a new algorithm for fitting markdown based on BM25, and
 now we add the ability to refine markdown into a citation form. Our links
 will be extracted and replaced by a citation reference number, and then we
 will have reference sections at the very end; we add all the links with the
 descriptions. This format is more suitable for large language models. In case
 we don't need to pass links, we can reduce the size of the markdown
 significantly and also attach the list of references as a separate file to a
 large language model. This commit contains changes for this direction.

---
 crawl4ai/__init__.py                          |   1 +
 crawl4ai/async_crawler_strategy.py            |  13 +-
 crawl4ai/async_database.3.73.py               | 285 ---------------
 crawl4ai/async_webcrawler.3.73.py             | 344 ------------------
 crawl4ai/async_webcrawler.py                  |   9 +-
 ...rategy.py => content_scraping_strategy.py} | 229 ++++++------
 crawl4ai/markdown_generation_strategy.py      | 115 ++++++
 crawl4ai/models.py                            |  13 +-
 crawl4ai/utils.py                             |  88 +++++
 crawl4ai/web_crawler.py                       |   2 +-
 tests/async/test_content_scraper_strategy.py  |   4 +-
 tests/async/test_markdown_genertor.py         | 165 +++++++++
 12 files changed, 506 insertions(+), 762 deletions(-)
 delete mode 100644 crawl4ai/async_database.3.73.py
 delete mode 100644 crawl4ai/async_webcrawler.3.73.py
 rename crawl4ai/{content_scrapping_strategy.py => content_scraping_strategy.py} (84%)
 create mode 100644 crawl4ai/markdown_generation_strategy.py
 create mode 100644 tests/async/test_markdown_genertor.py

diff --git a/crawl4ai/__init__.py b/crawl4ai/__init__.py
index ad9475b4..0ccf13d8 100644
--- a/crawl4ai/__init__.py
+++ b/crawl4ai/__init__.py
@@ -1,6 +1,7 @@
 # __init__.py
 
 from .async_webcrawler import AsyncWebCrawler, CacheMode
+
 from .models import CrawlResult
 from .__version__ import __version__
 # __version__ = "0.3.73"
diff --git a/crawl4ai/async_crawler_strategy.py b/crawl4ai/async_crawler_strategy.py
index e7dc9c54..3f332eb0 100644
--- a/crawl4ai/async_crawler_strategy.py
+++ b/crawl4ai/async_crawler_strategy.py
@@ -229,6 +229,7 @@ class AsyncPlaywrightCrawlerStrategy(AsyncCrawlerStrategy):
         self.headless = kwargs.get("headless", True)
         self.browser_type = kwargs.get("browser_type", "chromium")
         self.headers = kwargs.get("headers", {})
+        self.cookies = kwargs.get("cookies", [])
         self.sessions = {}
         self.session_ttl = 1800 
         self.js_code = js_code
@@ -295,6 +296,8 @@ class AsyncPlaywrightCrawlerStrategy(AsyncCrawlerStrategy):
                 # Set up the default context
                 if self.default_context:
                     await self.default_context.set_extra_http_headers(self.headers)
+                    if self.cookies:
+                        await self.default_context.add_cookies(self.cookies)                    
                     if self.accept_downloads:
                         await self.default_context.set_default_timeout(60000)
                         await self.default_context.set_default_navigation_timeout(60000)
@@ -669,6 +672,8 @@ class AsyncPlaywrightCrawlerStrategy(AsyncCrawlerStrategy):
                             # downloads_path=self.downloads_path if self.accept_downloads else None
                         )
                         await context.add_cookies([{"name": "cookiesEnabled", "value": "true", "url": url}])
+                        if self.cookies:
+                            await context.add_cookies(self.cookies)
                         await context.set_extra_http_headers(self.headers)
                         page = await context.new_page()
                     self.sessions[session_id] = (context, page, time.time())
@@ -684,6 +689,8 @@ class AsyncPlaywrightCrawlerStrategy(AsyncCrawlerStrategy):
                         proxy={"server": self.proxy} if self.proxy else None,
                         accept_downloads=self.accept_downloads,
                     )
+                    if self.cookies:
+                            await context.add_cookies(self.cookies)
                     await context.set_extra_http_headers(self.headers)
                 
                 if kwargs.get("override_navigator", False) or kwargs.get("simulate_user", False) or kwargs.get("magic", False):
@@ -828,7 +835,8 @@ class AsyncPlaywrightCrawlerStrategy(AsyncCrawlerStrategy):
                     for js in js_code:
                         await page.evaluate(js)
                 
-                await page.wait_for_load_state('networkidle')
+                # await page.wait_for_timeout(100)
+                
                 # Check for on execution event
                 await self.execute_hook('on_execution_started', page)
                 
@@ -846,6 +854,9 @@ class AsyncPlaywrightCrawlerStrategy(AsyncCrawlerStrategy):
                     await self.smart_wait(page, wait_for, timeout=kwargs.get("page_timeout", 60000))
                 except Exception as e:
                     raise RuntimeError(f"Wait condition failed: {str(e)}")
+            
+            # if not wait_for and js_code:
+            #     await page.wait_for_load_state('networkidle', timeout=5000)
 
             # Update image dimensions
             update_image_dimensions_js = """
diff --git a/crawl4ai/async_database.3.73.py b/crawl4ai/async_database.3.73.py
deleted file mode 100644
index f86c7f1d..00000000
--- a/crawl4ai/async_database.3.73.py
+++ /dev/null
@@ -1,285 +0,0 @@
-import os
-from pathlib import Path
-import aiosqlite
-import asyncio
-from typing import Optional, Tuple, Dict
-from contextlib import asynccontextmanager
-import logging
-import json  # Added for serialization/deserialization
-from .utils import ensure_content_dirs, generate_content_hash
-import xxhash
-import aiofiles
-# Set up logging
-logging.basicConfig(level=logging.INFO)
-logger = logging.getLogger(__name__)
-
-DB_PATH = os.path.join(Path.home(), ".crawl4ai")
-os.makedirs(DB_PATH, exist_ok=True)
-DB_PATH = os.path.join(DB_PATH, "crawl4ai.db")
-
-class AsyncDatabaseManager:
-    def __init__(self, pool_size: int = 10, max_retries: int = 3):
-        self.db_path = DB_PATH
-        self.content_paths = ensure_content_dirs(os.path.dirname(DB_PATH))
-        self.pool_size = pool_size
-        self.max_retries = max_retries
-        self.connection_pool: Dict[int, aiosqlite.Connection] = {}
-        self.pool_lock = asyncio.Lock()
-        self.connection_semaphore = asyncio.Semaphore(pool_size)
-        
-    async def initialize(self):
-        """Initialize the database and connection pool"""
-        await self.ainit_db()
-        
-    async def cleanup(self):
-        """Cleanup connections when shutting down"""
-        async with self.pool_lock:
-            for conn in self.connection_pool.values():
-                await conn.close()
-            self.connection_pool.clear()
-
-    @asynccontextmanager
-    async def get_connection(self):
-        """Connection pool manager"""
-        async with self.connection_semaphore:
-            task_id = id(asyncio.current_task())
-            try:
-                async with self.pool_lock:
-                    if task_id not in self.connection_pool:
-                        conn = await aiosqlite.connect(
-                            self.db_path,
-                            timeout=30.0
-                        )
-                        await conn.execute('PRAGMA journal_mode = WAL')
-                        await conn.execute('PRAGMA busy_timeout = 5000')
-                        self.connection_pool[task_id] = conn
-                    
-                yield self.connection_pool[task_id]
-                
-            except Exception as e:
-                logger.error(f"Connection error: {e}")
-                raise
-            finally:
-                async with self.pool_lock:
-                    if task_id in self.connection_pool:
-                        await self.connection_pool[task_id].close()
-                        del self.connection_pool[task_id]
-
-    async def execute_with_retry(self, operation, *args):
-        """Execute database operations with retry logic"""
-        for attempt in range(self.max_retries):
-            try:
-                async with self.get_connection() as db:
-                    result = await operation(db, *args)
-                    await db.commit()
-                    return result
-            except Exception as e:
-                if attempt == self.max_retries - 1:
-                    logger.error(f"Operation failed after {self.max_retries} attempts: {e}")
-                    raise
-                await asyncio.sleep(1 * (attempt + 1))  # Exponential backoff
-
-    async def ainit_db(self):
-        """Initialize database schema"""
-        async def _init(db):
-            await db.execute('''
-                CREATE TABLE IF NOT EXISTS crawled_data (
-                    url TEXT PRIMARY KEY,
-                    html TEXT,
-                    cleaned_html TEXT,
-                    markdown TEXT,
-                    extracted_content TEXT,
-                    success BOOLEAN,
-                    media TEXT DEFAULT "{}",
-                    links TEXT DEFAULT "{}",
-                    metadata TEXT DEFAULT "{}",
-                    screenshot TEXT DEFAULT "",
-                    response_headers TEXT DEFAULT "{}",
-                    downloaded_files TEXT DEFAULT "{}"  -- New column added
-                )
-            ''')
-        
-        await self.execute_with_retry(_init)
-        await self.update_db_schema()
-
-    async def update_db_schema(self):
-        """Update database schema if needed"""
-        async def _check_columns(db):
-            cursor = await db.execute("PRAGMA table_info(crawled_data)")
-            columns = await cursor.fetchall()
-            return [column[1] for column in columns]
-
-        column_names = await self.execute_with_retry(_check_columns)
-        
-        # List of new columns to add
-        new_columns = ['media', 'links', 'metadata', 'screenshot', 'response_headers', 'downloaded_files']
-        
-        for column in new_columns:
-            if column not in column_names:
-                await self.aalter_db_add_column(column)
-
-    async def aalter_db_add_column(self, new_column: str):
-        """Add new column to the database"""
-        async def _alter(db):
-            if new_column == 'response_headers':
-                await db.execute(f'ALTER TABLE crawled_data ADD COLUMN {new_column} TEXT DEFAULT "{{}}"')
-            else:
-                await db.execute(f'ALTER TABLE crawled_data ADD COLUMN {new_column} TEXT DEFAULT ""')
-            logger.info(f"Added column '{new_column}' to the database.")
-
-        await self.execute_with_retry(_alter)
-
-
-    async def aget_cached_url(self, url: str) -> Optional[Tuple[str, str, str, str, str, bool, str, str, str, str]]:
-        """Retrieve cached URL data"""
-        async def _get(db):
-            async with db.execute(
-                '''
-                SELECT url, html, cleaned_html, markdown, 
-                    extracted_content, success, media, links,
-                    metadata, screenshot, response_headers,
-                    downloaded_files
-                FROM crawled_data WHERE url = ?
-                ''',
-                (url,)
-            ) as cursor:
-                row = await cursor.fetchone()
-                if row:
-                    # Load content from files using stored hashes
-                    html = await self._load_content(row[1], 'html') if row[1] else ""
-                    cleaned = await self._load_content(row[2], 'cleaned') if row[2] else ""
-                    markdown = await self._load_content(row[3], 'markdown') if row[3] else ""
-                    extracted = await self._load_content(row[4], 'extracted') if row[4] else ""
-                    screenshot = await self._load_content(row[9], 'screenshots') if row[9] else ""
-                    
-                    return (
-                        row[0],  # url
-                        html or "",  # Return empty string if file not found
-                        cleaned or "",
-                        markdown or "", 
-                        extracted or "",
-                        row[5],  # success
-                        json.loads(row[6] or '{}'),  # media
-                        json.loads(row[7] or '{}'),  # links
-                        json.loads(row[8] or '{}'),  # metadata
-                        screenshot or "",
-                        json.loads(row[10] or '{}'),  # response_headers
-                        json.loads(row[11] or '[]')  # downloaded_files
-                    )
-                return None
-
-        try:
-            return await self.execute_with_retry(_get)
-        except Exception as e:
-            logger.error(f"Error retrieving cached URL: {e}")
-            return None
-
-    async def acache_url(self, url: str, html: str, cleaned_html: str, 
-                        markdown: str, extracted_content: str, success: bool,
-                        media: str = "{}", links: str = "{}", 
-                        metadata: str = "{}", screenshot: str = "",
-                        response_headers: str = "{}", downloaded_files: str = "[]"):
-        """Cache URL data with content stored in filesystem"""
-        
-        # Store content files and get hashes
-        html_hash = await self._store_content(html, 'html')
-        cleaned_hash = await self._store_content(cleaned_html, 'cleaned')
-        markdown_hash = await self._store_content(markdown, 'markdown')
-        extracted_hash = await self._store_content(extracted_content, 'extracted')
-        screenshot_hash = await self._store_content(screenshot, 'screenshots')
-
-        async def _cache(db):
-            await db.execute('''
-                INSERT INTO crawled_data (
-                    url, html, cleaned_html, markdown,
-                    extracted_content, success, media, links, metadata,
-                    screenshot, response_headers, downloaded_files
-                )
-                VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?)
-                ON CONFLICT(url) DO UPDATE SET
-                    html = excluded.html,
-                    cleaned_html = excluded.cleaned_html,
-                    markdown = excluded.markdown,
-                    extracted_content = excluded.extracted_content,
-                    success = excluded.success,
-                    media = excluded.media,      
-                    links = excluded.links,    
-                    metadata = excluded.metadata,      
-                    screenshot = excluded.screenshot,
-                    response_headers = excluded.response_headers,
-                    downloaded_files = excluded.downloaded_files
-            ''', (url, html_hash, cleaned_hash, markdown_hash, extracted_hash,
-                success, media, links, metadata, screenshot_hash,
-                response_headers, downloaded_files))
-
-        try:
-            await self.execute_with_retry(_cache)
-        except Exception as e:
-            logger.error(f"Error caching URL: {e}")
-
-
-
-    async def aget_total_count(self) -> int:
-        """Get total number of cached URLs"""
-        async def _count(db):
-            async with db.execute('SELECT COUNT(*) FROM crawled_data') as cursor:
-                result = await cursor.fetchone()
-                return result[0] if result else 0
-
-        try:
-            return await self.execute_with_retry(_count)
-        except Exception as e:
-            logger.error(f"Error getting total count: {e}")
-            return 0
-
-    async def aclear_db(self):
-        """Clear all data from the database"""
-        async def _clear(db):
-            await db.execute('DELETE FROM crawled_data')
-
-        try:
-            await self.execute_with_retry(_clear)
-        except Exception as e:
-            logger.error(f"Error clearing database: {e}")
-
-    async def aflush_db(self):
-        """Drop the entire table"""
-        async def _flush(db):
-            await db.execute('DROP TABLE IF EXISTS crawled_data')
-
-        try:
-            await self.execute_with_retry(_flush)
-        except Exception as e:
-            logger.error(f"Error flushing database: {e}")
-            
-                
-    async def _store_content(self, content: str, content_type: str) -> str:
-        """Store content in filesystem and return hash"""
-        if not content:
-            return ""
-            
-        content_hash = generate_content_hash(content)
-        file_path = os.path.join(self.content_paths[content_type], content_hash)
-        
-        # Only write if file doesn't exist
-        if not os.path.exists(file_path):
-            async with aiofiles.open(file_path, 'w', encoding='utf-8') as f:
-                await f.write(content)
-                
-        return content_hash
-
-    async def _load_content(self, content_hash: str, content_type: str) -> Optional[str]:
-        """Load content from filesystem by hash"""
-        if not content_hash:
-            return None
-            
-        file_path = os.path.join(self.content_paths[content_type], content_hash)
-        try:
-            async with aiofiles.open(file_path, 'r', encoding='utf-8') as f:
-                return await f.read()
-        except:
-            logger.error(f"Failed to load content: {file_path}")
-            return None
-
-# Create a singleton instance
-async_db_manager = AsyncDatabaseManager()
diff --git a/crawl4ai/async_webcrawler.3.73.py b/crawl4ai/async_webcrawler.3.73.py
deleted file mode 100644
index 03e7a393..00000000
--- a/crawl4ai/async_webcrawler.3.73.py
+++ /dev/null
@@ -1,344 +0,0 @@
-import os
-import time
-from pathlib import Path
-from typing import Optional
-import json
-import asyncio
-from .models import CrawlResult
-from .async_database import async_db_manager
-from .chunking_strategy import *
-from .extraction_strategy import *
-from .async_crawler_strategy import AsyncCrawlerStrategy, AsyncPlaywrightCrawlerStrategy, AsyncCrawlResponse
-from .content_scrapping_strategy import WebScrapingStrategy
-from .config import MIN_WORD_THRESHOLD, IMAGE_DESCRIPTION_MIN_WORD_THRESHOLD
-from .utils import (
-    sanitize_input_encode,
-    InvalidCSSSelectorError,
-    format_html
-)
-from .__version__ import __version__ as crawl4ai_version
-
-class AsyncWebCrawler:
-    def __init__(
-        self,
-        crawler_strategy: Optional[AsyncCrawlerStrategy] = None,
-        always_by_pass_cache: bool = False,
-        base_directory: str = str(Path.home()),
-        **kwargs,
-    ):
-        self.crawler_strategy = crawler_strategy or AsyncPlaywrightCrawlerStrategy(
-            **kwargs
-        )
-        self.always_by_pass_cache = always_by_pass_cache
-        # self.crawl4ai_folder = os.path.join(Path.home(), ".crawl4ai")
-        self.crawl4ai_folder = os.path.join(base_directory, ".crawl4ai")
-        os.makedirs(self.crawl4ai_folder, exist_ok=True)
-        os.makedirs(f"{self.crawl4ai_folder}/cache", exist_ok=True)
-        self.ready = False
-        self.verbose = kwargs.get("verbose", False)
-
-    async def __aenter__(self):
-        await self.crawler_strategy.__aenter__()
-        await self.awarmup()
-        return self
-
-    async def __aexit__(self, exc_type, exc_val, exc_tb):
-        await self.crawler_strategy.__aexit__(exc_type, exc_val, exc_tb)
-
-    async def awarmup(self):
-        # Print a message for crawl4ai and its version
-        if self.verbose:
-            print(f"[LOG] 🚀 Crawl4AI {crawl4ai_version}")
-            print("[LOG] 🌤️  Warming up the AsyncWebCrawler")
-        # await async_db_manager.ainit_db()
-        # # await async_db_manager.initialize()
-        # await self.arun(
-        #     url="https://google.com/",
-        #     word_count_threshold=5,
-        #     bypass_cache=False,
-        #     verbose=False,
-        # )
-        self.ready = True
-        if self.verbose:
-            print("[LOG] 🌞 AsyncWebCrawler is ready to crawl")
-
-    async def arun(
-        self,
-        url: str,
-        word_count_threshold=MIN_WORD_THRESHOLD,
-        extraction_strategy: ExtractionStrategy = None,
-        chunking_strategy: ChunkingStrategy = RegexChunking(),
-        bypass_cache: bool = False,
-        css_selector: str = None,
-        screenshot: bool = False,
-        user_agent: str = None,
-        verbose=True,
-        disable_cache: bool = False,
-        no_cache_read: bool = False,
-        no_cache_write: bool = False,
-        **kwargs,
-    ) -> CrawlResult:
-        """
-        Runs the crawler for a single source: URL (web, local file, or raw HTML).
-
-        Args:
-            url (str): The URL to crawl. Supported prefixes:
-                - 'http://' or 'https://': Web URL to crawl.
-                - 'file://': Local file path to process.
-                - 'raw:': Raw HTML content to process.
-            ... [other existing parameters]
-
-        Returns:
-            CrawlResult: The result of the crawling and processing.
-        """
-        try:
-            if disable_cache:
-                bypass_cache = True
-                no_cache_read = True
-                no_cache_write = True
-            
-            extraction_strategy = extraction_strategy or NoExtractionStrategy()
-            extraction_strategy.verbose = verbose
-            if not isinstance(extraction_strategy, ExtractionStrategy):
-                raise ValueError("Unsupported extraction strategy")
-            if not isinstance(chunking_strategy, ChunkingStrategy):
-                raise ValueError("Unsupported chunking strategy")
-            
-            word_count_threshold = max(word_count_threshold, MIN_WORD_THRESHOLD)
-
-            async_response: AsyncCrawlResponse = None
-            cached = None
-            screenshot_data = None
-            extracted_content = None
-            
-            is_web_url = url.startswith(('http://', 'https://'))
-            is_local_file = url.startswith("file://")
-            is_raw_html = url.startswith("raw:")
-            _url = url if not is_raw_html else "Raw HTML"
-            
-            start_time = time.perf_counter()
-            cached_result = None
-            if is_web_url and (not bypass_cache or not no_cache_read) and not self.always_by_pass_cache:
-                cached_result = await async_db_manager.aget_cached_url(url)
-                        
-            if cached_result:
-                html = sanitize_input_encode(cached_result.html)
-                extracted_content = sanitize_input_encode(cached_result.extracted_content or "")
-                if screenshot:
-                    screenshot_data = cached_result.screenshot
-                    if not screenshot_data:
-                        cached_result = None
-                if verbose:
-                    print(
-                        f"[LOG] 1️⃣  ✅ Page fetched (cache) for {_url}, success: {bool(html)}, time taken: {time.perf_counter() - start_time:.2f} seconds"
-                    )
-
-
-            if not cached or not html:
-                t1 = time.perf_counter()
-                
-                if user_agent:
-                    self.crawler_strategy.update_user_agent(user_agent)
-                async_response: AsyncCrawlResponse = await self.crawler_strategy.crawl(url, screenshot=screenshot, **kwargs)
-                html = sanitize_input_encode(async_response.html)
-                screenshot_data = async_response.screenshot
-                t2 = time.perf_counter()
-                if verbose:
-                    print(
-                        f"[LOG] 1️⃣  ✅ Page fetched (no-cache) for {_url}, success: {bool(html)}, time taken: {t2 - t1:.2f} seconds"
-                    )
-
-            t1 = time.perf_counter()
-            crawl_result = await self.aprocess_html(
-                url=url,
-                html=html,
-                extracted_content=extracted_content,
-                word_count_threshold=word_count_threshold,
-                extraction_strategy=extraction_strategy,
-                chunking_strategy=chunking_strategy,
-                css_selector=css_selector,
-                screenshot=screenshot_data,
-                verbose=verbose,
-                is_cached=bool(cached),
-                async_response=async_response,
-                bypass_cache=bypass_cache,
-                is_web_url = is_web_url,
-                is_local_file = is_local_file,
-                is_raw_html = is_raw_html,
-                **kwargs,
-            )
-            
-            if async_response:
-                crawl_result.status_code = async_response.status_code
-                crawl_result.response_headers = async_response.response_headers
-                crawl_result.downloaded_files = async_response.downloaded_files
-            else:
-                crawl_result.status_code = 200
-                crawl_result.response_headers = cached_result.response_headers if cached_result else {}
-
-            crawl_result.success = bool(html)
-            crawl_result.session_id = kwargs.get("session_id", None)
-
-            if verbose:
-                print(
-                    f"[LOG] 🔥 🚀 Crawling done for {_url}, success: {crawl_result.success}, time taken: {time.perf_counter() - start_time:.2f} seconds"
-                )
-
-            if not is_raw_html and not no_cache_write:
-                if not bool(cached_result) or kwargs.get("bypass_cache", False) or self.always_by_pass_cache:
-                    await async_db_manager.acache_url(crawl_result)
-
-
-            return crawl_result
-        
-        except Exception as e:
-            if not hasattr(e, "msg"):
-                e.msg = str(e)
-            print(f"[ERROR] 🚫 arun(): Failed to crawl {_url}, error: {e.msg}")
-            return CrawlResult(url=url, html="", markdown = f"[ERROR] 🚫 arun(): Failed to crawl {_url}, error: {e.msg}", success=False, error_message=e.msg)
-
-    async def arun_many(
-        self,
-        urls: List[str],
-        word_count_threshold=MIN_WORD_THRESHOLD,
-        extraction_strategy: ExtractionStrategy = None,
-        chunking_strategy: ChunkingStrategy = RegexChunking(),
-        bypass_cache: bool = False,
-        css_selector: str = None,
-        screenshot: bool = False,
-        user_agent: str = None,
-        verbose=True,
-        **kwargs,
-    ) -> List[CrawlResult]:
-        """
-        Runs the crawler for multiple sources: URLs (web, local files, or raw HTML).
-
-        Args:
-            urls (List[str]): A list of URLs with supported prefixes:
-                - 'http://' or 'https://': Web URL to crawl.
-                - 'file://': Local file path to process.
-                - 'raw:': Raw HTML content to process.
-            ... [other existing parameters]
-
-        Returns:
-            List[CrawlResult]: The results of the crawling and processing.
-        """
-        semaphore_count = kwargs.get('semaphore_count', 5)  # Adjust as needed
-        semaphore = asyncio.Semaphore(semaphore_count)
-
-        async def crawl_with_semaphore(url):
-            async with semaphore:
-                return await self.arun(
-                    url,
-                    word_count_threshold=word_count_threshold,
-                    extraction_strategy=extraction_strategy,
-                    chunking_strategy=chunking_strategy,
-                    bypass_cache=bypass_cache,
-                    css_selector=css_selector,
-                    screenshot=screenshot,
-                    user_agent=user_agent,
-                    verbose=verbose,
-                    **kwargs,
-                )
-
-        tasks = [crawl_with_semaphore(url) for url in urls]
-        results = await asyncio.gather(*tasks, return_exceptions=True)
-        return [result if not isinstance(result, Exception) else str(result) for result in results]
-
-    async def aprocess_html(
-        self,
-        url: str,
-        html: str,
-        extracted_content: str,
-        word_count_threshold: int,
-        extraction_strategy: ExtractionStrategy,
-        chunking_strategy: ChunkingStrategy,
-        css_selector: str,
-        screenshot: str,
-        verbose: bool,
-        **kwargs,
-    ) -> CrawlResult:
-        t = time.perf_counter()
-        # Extract content from HTML
-        try:
-            _url = url if not kwargs.get("is_raw_html", False) else "Raw HTML"
-            t1 = time.perf_counter()
-            scrapping_strategy = WebScrapingStrategy()
-            # result = await scrapping_strategy.ascrap(
-            result = scrapping_strategy.scrap(
-                url,
-                html,
-                word_count_threshold=word_count_threshold,
-                css_selector=css_selector,
-                only_text=kwargs.get("only_text", False),
-                image_description_min_word_threshold=kwargs.get(
-                    "image_description_min_word_threshold", IMAGE_DESCRIPTION_MIN_WORD_THRESHOLD
-                ),
-                **kwargs,
-            )
-
-            if result is None:
-                raise ValueError(f"Process HTML, Failed to extract content from the website: {url}")
-        except InvalidCSSSelectorError as e:
-            raise ValueError(str(e))
-        except Exception as e:
-            raise ValueError(f"Process HTML, Failed to extract content from the website: {url}, error: {str(e)}")
-
-        cleaned_html = sanitize_input_encode(result.get("cleaned_html", ""))
-        markdown = sanitize_input_encode(result.get("markdown", ""))
-        fit_markdown = sanitize_input_encode(result.get("fit_markdown", ""))
-        fit_html = sanitize_input_encode(result.get("fit_html", ""))
-        media = result.get("media", [])
-        links = result.get("links", [])
-        metadata = result.get("metadata", {})
-        
-        if verbose:
-            print(
-                f"[LOG] 2️⃣  ✅ Scraping done for {_url}, success: True, time taken: {time.perf_counter() - t1:.2f} seconds"
-            )        
-
-        if extracted_content is None and extraction_strategy and chunking_strategy and not isinstance(extraction_strategy, NoExtractionStrategy):
-            t1 = time.perf_counter()
-            # Check if extraction strategy is type of JsonCssExtractionStrategy
-            if isinstance(extraction_strategy, JsonCssExtractionStrategy) or isinstance(extraction_strategy, JsonCssExtractionStrategy):
-                extraction_strategy.verbose = verbose
-                extracted_content = extraction_strategy.run(url, [html])
-                extracted_content = json.dumps(extracted_content, indent=4, default=str, ensure_ascii=False)
-            else:
-                sections = chunking_strategy.chunk(markdown)
-                extracted_content = extraction_strategy.run(url, sections)
-                extracted_content = json.dumps(extracted_content, indent=4, default=str, ensure_ascii=False)
-            if verbose:
-                print(
-                    f"[LOG] 3️⃣  ✅ Extraction done for {_url}, time taken: {time.perf_counter() - t1:.2f} seconds"
-                )
-
-        screenshot = None if not screenshot else screenshot
-        
-        return CrawlResult(
-            url=url,
-            html=html,
-            cleaned_html=format_html(cleaned_html),
-            markdown=markdown,
-            fit_markdown=fit_markdown,
-            fit_html= fit_html,
-            media=media,
-            links=links,
-            metadata=metadata,
-            screenshot=screenshot,
-            extracted_content=extracted_content,
-            success=True,
-            error_message="",
-        )
-
-    async def aclear_cache(self):
-        # await async_db_manager.aclear_db()
-        await async_db_manager.cleanup()
-
-    async def aflush_cache(self):
-        await async_db_manager.aflush_db()
-
-    async def aget_cache_size(self):
-        return await async_db_manager.aget_total_count()
-
-
diff --git a/crawl4ai/async_webcrawler.py b/crawl4ai/async_webcrawler.py
index 7d1814b6..2ff7ce0f 100644
--- a/crawl4ai/async_webcrawler.py
+++ b/crawl4ai/async_webcrawler.py
@@ -7,14 +7,14 @@ from pathlib import Path
 from typing import Optional, List, Union
 import json
 import asyncio
-from .models import CrawlResult
+from .models import CrawlResult, MarkdownGenerationResult
 from .async_database import async_db_manager
 from .chunking_strategy import *
 from .content_filter_strategy import *
 from .extraction_strategy import *
 from .async_crawler_strategy import AsyncCrawlerStrategy, AsyncPlaywrightCrawlerStrategy, AsyncCrawlResponse
 from .cache_context import CacheMode, CacheContext, _legacy_to_cache_mode
-from .content_scrapping_strategy import WebScrapingStrategy
+from .content_scraping_strategy import WebScrapingStrategy
 from .async_logger import AsyncLogger
 
 from .config import (
@@ -476,7 +476,7 @@ class AsyncWebCrawler:
                 html,
                 word_count_threshold=word_count_threshold,
                 css_selector=css_selector,
-                only_text=kwargs.get("only_text", False),
+                only_text=kwargs.pop("only_text", False),
                 image_description_min_word_threshold=kwargs.get(
                     "image_description_min_word_threshold", IMAGE_DESCRIPTION_MIN_WORD_THRESHOLD
                 ),
@@ -491,6 +491,8 @@ class AsyncWebCrawler:
         except Exception as e:
             raise ValueError(f"Process HTML, Failed to extract content from the website: {url}, error: {str(e)}")
 
+        markdown_v2: MarkdownGenerationResult = result.get("markdown_v2", None)
+        
         cleaned_html = sanitize_input_encode(result.get("cleaned_html", ""))
         markdown = sanitize_input_encode(result.get("markdown", ""))
         fit_markdown = sanitize_input_encode(result.get("fit_markdown", ""))
@@ -542,6 +544,7 @@ class AsyncWebCrawler:
             url=url,
             html=html,
             cleaned_html=format_html(cleaned_html),
+            markdown_v2=markdown_v2,
             markdown=markdown,
             fit_markdown=fit_markdown,
             fit_html= fit_html,
diff --git a/crawl4ai/content_scrapping_strategy.py b/crawl4ai/content_scraping_strategy.py
similarity index 84%
rename from crawl4ai/content_scrapping_strategy.py
rename to crawl4ai/content_scraping_strategy.py
index 0f470671..3823a78d 100644
--- a/crawl4ai/content_scrapping_strategy.py
+++ b/crawl4ai/content_scraping_strategy.py
@@ -1,6 +1,6 @@
 import re  # Point 1: Pre-Compile Regular Expressions
 from abc import ABC, abstractmethod
-from typing import Dict, Any
+from typing import Dict, Any, Optional
 from bs4 import BeautifulSoup
 from concurrent.futures import ThreadPoolExecutor
 import asyncio, requests, re, os
@@ -10,103 +10,19 @@ from urllib.parse import urljoin
 from requests.exceptions import InvalidSchema
 # from .content_cleaning_strategy import ContentCleaningStrategy
 from .content_filter_strategy import RelevantContentFilter, BM25ContentFilter
-
+from .markdown_generation_strategy import MarkdownGenerationStrategy, DefaultMarkdownGenerationStrategy
+from .models import MarkdownGenerationResult
 from .utils import (
     sanitize_input_encode,
     sanitize_html,
     extract_metadata,
     InvalidCSSSelectorError,
-    # CustomHTML2Text,
+    CustomHTML2Text,
     normalize_url,
     is_external_url
     
 )
 
-from .html2text import HTML2Text
-class CustomHTML2Text(HTML2Text):
-    def __init__(self, *args, **kwargs):
-        super().__init__(*args, **kwargs)
-        self.inside_pre = False
-        self.inside_code = False
-        self.preserve_tags = set()  # Set of tags to preserve
-        self.current_preserved_tag = None
-        self.preserved_content = []
-        self.preserve_depth = 0
-        
-        # Configuration options
-        self.skip_internal_links = False
-        self.single_line_break = False
-        self.mark_code = False
-        self.include_sup_sub = False
-        self.body_width = 0
-        self.ignore_mailto_links = True
-        self.ignore_links = False
-        self.escape_backslash = False
-        self.escape_dot = False
-        self.escape_plus = False
-        self.escape_dash = False
-        self.escape_snob = False
-
-    def update_params(self, **kwargs):
-        """Update parameters and set preserved tags."""
-        for key, value in kwargs.items():
-            if key == 'preserve_tags':
-                self.preserve_tags = set(value)
-            else:
-                setattr(self, key, value)
-
-    def handle_tag(self, tag, attrs, start):
-        # Handle preserved tags
-        if tag in self.preserve_tags:
-            if start:
-                if self.preserve_depth == 0:
-                    self.current_preserved_tag = tag
-                    self.preserved_content = []
-                    # Format opening tag with attributes
-                    attr_str = ''.join(f' {k}="{v}"' for k, v in attrs.items() if v is not None)
-                    self.preserved_content.append(f'<{tag}{attr_str}>')
-                self.preserve_depth += 1
-                return
-            else:
-                self.preserve_depth -= 1
-                if self.preserve_depth == 0:
-                    self.preserved_content.append(f'</{tag}>')
-                    # Output the preserved HTML block with proper spacing
-                    preserved_html = ''.join(self.preserved_content)
-                    self.o('\n' + preserved_html + '\n')
-                    self.current_preserved_tag = None
-                return
-
-        # If we're inside a preserved tag, collect all content
-        if self.preserve_depth > 0:
-            if start:
-                # Format nested tags with attributes
-                attr_str = ''.join(f' {k}="{v}"' for k, v in attrs.items() if v is not None)
-                self.preserved_content.append(f'<{tag}{attr_str}>')
-            else:
-                self.preserved_content.append(f'</{tag}>')
-            return
-
-        # Handle pre tags
-        if tag == 'pre':
-            if start:
-                self.o('```\n')
-                self.inside_pre = True
-            else:
-                self.o('\n```')
-                self.inside_pre = False
-        # elif tag in ["h1", "h2", "h3", "h4", "h5", "h6"]:
-        #     pass
-        else:
-            super().handle_tag(tag, attrs, start)
-
-    def handle_data(self, data, entity_char=False):
-        """Override handle_data to capture content within preserved tags."""
-        if self.preserve_depth > 0:
-            self.preserved_content.append(data)
-            return
-        super().handle_data(data, entity_char)
-
 # Pre-compile regular expressions for Open Graph and Twitter metadata
 OG_REGEX = re.compile(r'^og:')
 TWITTER_REGEX = re.compile(r'^twitter:')
@@ -164,6 +80,98 @@ class WebScrapingStrategy(ContentScrapingStrategy):
     async def ascrap(self, url: str, html: str, **kwargs) -> Dict[str, Any]:
         return await asyncio.to_thread(self._get_content_of_website_optimized, url, html, **kwargs)
 
+
+    def _generate_markdown_content(self, 
+                                 cleaned_html: str,
+                                 html: str,
+                                 url: str,
+                                 success: bool,
+                                 **kwargs) -> Dict[str, Any]:
+        """Generate markdown content using either new strategy or legacy method.
+
+        Args:
+            cleaned_html: Sanitized HTML content
+            html: Original HTML content
+            url: Base URL of the page
+            success: Whether scraping was successful (accepted but not read here)
+            **kwargs: Additional options including:
+                - markdown_generator: Optional[MarkdownGenerationStrategy]
+                - html2text: Dict[str, Any] options for HTML2Text
+                - content_filter: Optional[RelevantContentFilter]
+                - fit_markdown: bool
+                - fit_markdown_user_query: Optional[str]
+                - fit_markdown_bm25_threshold: float
+
+        Returns:
+            Dict with 'markdown', 'fit_markdown', 'fit_html' (strings) and 'markdown_v2'
+        """
+        markdown_generator: Optional[MarkdownGenerationStrategy] = kwargs.get('markdown_generator', DefaultMarkdownGenerationStrategy())
+        placeholder = "Set flag 'fit_markdown' to True to get cleaned HTML content."
+
+        if markdown_generator:
+            try:
+                content_filter = kwargs.get('content_filter', None)
+                markdown_result = markdown_generator.generate_markdown(
+                    cleaned_html=cleaned_html,
+                    base_url=url,
+                    html2text_options=kwargs.get('html2text', {}),
+                    content_filter=content_filter
+                )
+                markdown_v2 = MarkdownGenerationResult(
+                    raw_markdown=markdown_result.raw_markdown,
+                    markdown_with_citations=markdown_result.markdown_with_citations,
+                    references_markdown=markdown_result.references_markdown,
+                    fit_markdown=markdown_result.fit_markdown
+                )
+                # Join the filter output into <div> blocks like the legacy branch, so 'fit_html' is always a str.
+                fit_html = placeholder
+                if content_filter:
+                    fit_html = '\n'.join('<div>{}</div>'.format(s) for s in content_filter.filter_content(html))
+                return {
+                    'markdown': markdown_result.raw_markdown,
+                    'fit_markdown': markdown_result.fit_markdown or placeholder,
+                    'fit_html': fit_html,
+                    'markdown_v2': markdown_v2
+                }
+            except Exception as e:
+                # Best effort: log the failure and fall through to the legacy converter.
+                self._log('error',
+                    message="Error using new markdown generation strategy: {error}",
+                    tag="SCRAPE",
+                    params={"error": str(e)}
+                )
+
+        # Legacy method
+        h = CustomHTML2Text()
+        h.update_params(**kwargs.get('html2text', {}))
+        markdown = h.handle(cleaned_html).replace('    ```', '```')
+
+        fit_markdown = placeholder
+        fit_html = placeholder
+        if kwargs.get('content_filter', None) or kwargs.get('fit_markdown', False):
+            content_filter = kwargs.get('content_filter', None)
+            if not content_filter:
+                content_filter = BM25ContentFilter(
+                    user_query=kwargs.get('fit_markdown_user_query', None),
+                    bm25_threshold=kwargs.get('fit_markdown_bm25_threshold', 1.0)
+                )
+            fit_html = '\n'.join('<div>{}</div>'.format(s) for s in content_filter.filter_content(html))
+            fit_markdown = h.handle(fit_html)
+
+        markdown_v2 = MarkdownGenerationResult(
+            raw_markdown=markdown,
+            markdown_with_citations=markdown,
+            references_markdown=markdown,
+            fit_markdown=fit_markdown
+        )
+        return {
+            'markdown': markdown,
+            'fit_markdown': fit_markdown,
+            'fit_html': fit_html,
+            'markdown_v2' : markdown_v2
+        }
+
+
     def _get_content_of_website_optimized(self, url: str, html: str, word_count_threshold: int = MIN_WORD_THRESHOLD, css_selector: str = None, **kwargs) -> Dict[str, Any]:
         success = True
         if not html:
@@ -242,8 +250,6 @@ class WebScrapingStrategy(ContentScrapingStrategy):
 
             #Score an image for it's usefulness
             def score_image_for_usefulness(img, base_url, index, images_count):
-
-
                 image_height = img.get('height')
                 height_value, height_unit = parse_dimension(image_height)
                 image_width =  img.get('width')
@@ -282,7 +288,7 @@ class WebScrapingStrategy(ContentScrapingStrategy):
             if not is_valid_image(img, img.parent, img.parent.get('class', [])):
                 return None
             score = score_image_for_usefulness(img, url, index, total_images)
-            if score <= IMAGE_SCORE_THRESHOLD:
+            if score <= kwargs.get('image_score_threshold', IMAGE_SCORE_THRESHOLD):
                 return None
             return {
                 'src': img.get('src', ''),
@@ -545,41 +551,16 @@ class WebScrapingStrategy(ContentScrapingStrategy):
 
         cleaned_html = str_body.replace('\n\n', '\n').replace('  ', ' ')
 
-        try:
-            h = CustomHTML2Text()
-            h.update_params(**kwargs.get('html2text', {}))            
-            markdown = h.handle(cleaned_html)
-        except Exception as e:
-            if not h:
-                h = CustomHTML2Text()
-            self._log('error',
-                message="Error converting HTML to markdown: {error}",
-                tag="SCRAPE",
-                params={"error": str(e)}
-            )
-            markdown = h.handle(sanitize_html(cleaned_html))
-        markdown = markdown.replace('    ```', '```')
-
+        markdown_content = self._generate_markdown_content(
+            cleaned_html=cleaned_html,
+            html=html,
+            url=url,
+            success=success,
+            **kwargs
+        )
         
-            
-        fit_markdown = "Set flag 'fit_markdown' to True to get cleaned HTML content."
-        fit_html = "Set flag 'fit_markdown' to True to get cleaned HTML content."
-        if kwargs.get('content_filter', None) or kwargs.get('fit_markdown', False):
-            content_filter = kwargs.get('content_filter', None)
-            if not content_filter:
-                content_filter = BM25ContentFilter(
-                    user_query= kwargs.get('fit_markdown_user_query', None),
-                    bm25_threshold= kwargs.get('fit_markdown_bm25_threshold', 1.0)
-                )
-            fit_html = content_filter.filter_content(html)
-            fit_html = '\n'.join('<div>{}</div>'.format(s) for s in fit_html)
-            fit_markdown = h.handle(fit_html)
-
-        cleaned_html = sanitize_html(cleaned_html)
         return {
-            'markdown': markdown,
-            'fit_markdown': fit_markdown,
-            'fit_html': fit_html,
+            **markdown_content,
             'cleaned_html': cleaned_html,
             'success': success,
             'media': media,
diff --git a/crawl4ai/markdown_generation_strategy.py b/crawl4ai/markdown_generation_strategy.py
new file mode 100644
index 00000000..1adb4c28
--- /dev/null
+++ b/crawl4ai/markdown_generation_strategy.py
@@ -0,0 +1,115 @@
+from abc import ABC, abstractmethod
+from typing import Optional, Dict, Any, Tuple
+from .models import MarkdownGenerationResult
+from .utils import CustomHTML2Text
+from .content_filter_strategy import RelevantContentFilter, BM25ContentFilter
+import re
+from urllib.parse import urljoin
+
+# Pre-compile the regex pattern
+LINK_PATTERN = re.compile(r'!?\[([^\]]+)\]\(([^)]+?)(?:\s+"([^"]*)")?\)')
+
+class MarkdownGenerationStrategy(ABC):
+    """Interface for strategies that turn cleaned HTML into a MarkdownGenerationResult."""
+    
+    @abstractmethod
+    def generate_markdown(self, 
+                         cleaned_html: str,  # HTML to convert
+                         base_url: str = "",  # default strategy resolves relative link targets against this
+                         html2text_options: Optional[Dict[str, Any]] = None,  # default strategy forwards these to CustomHTML2Text
+                         content_filter: Optional[RelevantContentFilter] = None,  # default strategy fills fit_markdown when given
+                         citations: bool = True,  # default strategy converts links to numbered references
+                         **kwargs) -> MarkdownGenerationResult:
+        """Generate markdown from cleaned HTML; concrete strategies must implement this."""
+        pass
+
+class DefaultMarkdownGenerationStrategy(MarkdownGenerationStrategy):
+    """Default strategy: CustomHTML2Text conversion plus optional link citations."""
+
+    def convert_links_to_citations(self, markdown: str, base_url: str = "") -> Tuple[str, str]:
+        """Replace inline links with ⟨n⟩ markers; return (converted text, references section)."""
+        link_map = {}
+        url_cache = {}  # Cache for URL joins
+        parts = []
+        last_end = 0
+        counter = 1
+
+        for match in LINK_PATTERN.finditer(markdown):
+            parts.append(markdown[last_end:match.start()])
+            text, url, title = match.groups()
+
+            # Use cached URL if available, otherwise compute and cache
+            if base_url and not url.startswith(('http://', 'https://', 'mailto:')):
+                if url not in url_cache:
+                    url_cache[url] = fast_urljoin(base_url, url)
+                url = url_cache[url]
+
+            # The first occurrence of a URL fixes its number and description.
+            if url not in link_map:
+                desc = []
+                if title: desc.append(title)
+                if text and text != title: desc.append(text)
+                link_map[url] = (counter, ": " + " - ".join(desc) if desc else "")
+                counter += 1
+
+            num = link_map[url][0]
+            parts.append(f"{text}⟨{num}⟩" if not match.group(0).startswith('!') else f"![{text}⟨{num}⟩]")
+            last_end = match.end()
+
+        parts.append(markdown[last_end:])
+        converted_text = ''.join(parts)
+
+        # Pre-build reference strings
+        references = ["\n\n## References\n\n"]
+        references.extend(
+            f"⟨{num}⟩ {url}{desc}\n"
+            for url, (num, desc) in sorted(link_map.items(), key=lambda x: x[1][0])
+        )
+
+        return converted_text, ''.join(references)
+
+    def generate_markdown(self, 
+                         cleaned_html: str, 
+                         base_url: str = "",
+                         html2text_options: Optional[Dict[str, Any]] = None,
+                         content_filter: Optional[RelevantContentFilter] = None,
+                         citations: bool = True,
+                         **kwargs) -> MarkdownGenerationResult:
+        """Generate markdown from cleaned HTML; links become citations only when ``citations`` is true."""
+        # Initialize HTML2Text with options
+        h = CustomHTML2Text()
+        if html2text_options:
+            h.update_params(**html2text_options)
+
+        # Generate raw markdown
+        raw_markdown = h.handle(cleaned_html).replace('    ```', '```')
+
+        # Defaults keep both result fields bound when citations are disabled (was an UnboundLocalError).
+        markdown_with_citations, references_markdown = raw_markdown, ""
+        if citations:
+            markdown_with_citations, references_markdown = self.convert_links_to_citations(raw_markdown, base_url)
+
+        # Generate fit markdown if content filter is provided
+        fit_markdown: Optional[str] = None
+        if content_filter:
+            filtered_html = content_filter.filter_content(cleaned_html)
+            filtered_html = '\n'.join('<div>{}</div>'.format(s) for s in filtered_html)
+            fit_markdown = h.handle(filtered_html)
+
+        return MarkdownGenerationResult(
+            raw_markdown=raw_markdown,
+            markdown_with_citations=markdown_with_citations,
+            references_markdown=references_markdown,
+            fit_markdown=fit_markdown
+        )
+
+def fast_urljoin(base: str, url: str) -> str:
+    """Resolve ``url`` against ``base``; already-absolute URLs are returned unchanged.
+
+    Root-relative paths ("/x") go through ``urljoin`` so they replace the path
+    of ``base`` instead of being appended to it (RFC 3986 reference resolution).
+    """
+    # Absolute and protocol-relative URLs need no resolution.
+    if url.startswith(('http://', 'https://', 'mailto:', '//')):
+        return url
+    return urljoin(base, url)
\ No newline at end of file
diff --git a/crawl4ai/models.py b/crawl4ai/models.py
index cab4c45b..122434ad 100644
--- a/crawl4ai/models.py
+++ b/crawl4ai/models.py
@@ -1,5 +1,5 @@
 from pydantic import BaseModel, HttpUrl
-from typing import List, Dict, Optional, Callable, Awaitable
+from typing import List, Dict, Optional, Callable, Awaitable, Union
 
 
 
@@ -7,6 +7,12 @@ class UrlModel(BaseModel):
     url: HttpUrl
     forced: bool = False
 
+class MarkdownGenerationResult(BaseModel):  # markdown variants generated for one page
+    raw_markdown: str  # direct HTML-to-markdown conversion
+    markdown_with_citations: str  # default strategy: raw markdown with links replaced by numbered markers
+    references_markdown: str  # default strategy: "## References" list matching those markers
+    fit_markdown: Optional[str] = None  # markdown of the content-filter output; default strategy leaves None without a filter
+
 class CrawlResult(BaseModel):
     url: str
     html: str
@@ -16,7 +22,8 @@ class CrawlResult(BaseModel):
     links: Dict[str, List[Dict]] = {}
     downloaded_files: Optional[List[str]] = None
     screenshot: Optional[str] = None
-    markdown: Optional[str] = None
+    markdown: Optional[Union[str, MarkdownGenerationResult]] = None
+    markdown_v2: Optional[MarkdownGenerationResult] = None
     fit_markdown: Optional[str] = None
     fit_html: Optional[str] = None
     extracted_content: Optional[str] = None
@@ -36,3 +43,5 @@ class AsyncCrawlResponse(BaseModel):
 
     class Config:
         arbitrary_types_allowed = True
+
+
diff --git a/crawl4ai/utils.py b/crawl4ai/utils.py
index 9abc5784..b07562df 100644
--- a/crawl4ai/utils.py
+++ b/crawl4ai/utils.py
@@ -18,6 +18,94 @@ import hashlib
 from typing import Optional, Tuple, Dict, Any
 import xxhash
 
+
+from .html2text import HTML2Text
+class CustomHTML2Text(HTML2Text):
+    """HTML2Text variant that fences <pre> blocks and re-emits configured tags as HTML."""
+    def __init__(self, *args, **kwargs):
+        super().__init__(*args, **kwargs)
+        self.inside_pre = False
+        self.inside_code = False
+        self.preserve_tags = set()  # Set of tags to preserve
+        self.current_preserved_tag = None  # outermost preserved tag currently open
+        self.preserved_content = []  # HTML pieces collected while inside that tag
+        self.preserve_depth = 0  # nesting level of open preserved tags
+        
+        # Configuration options
+        self.skip_internal_links = False
+        self.single_line_break = False
+        self.mark_code = False
+        self.include_sup_sub = False
+        self.body_width = 0
+        self.ignore_mailto_links = True
+        self.ignore_links = False
+        self.escape_backslash = False
+        self.escape_dot = False
+        self.escape_plus = False
+        self.escape_dash = False
+        self.escape_snob = False
+
+    def update_params(self, **kwargs):
+        """Update parameters and set preserved tags."""
+        for key, value in kwargs.items():
+            if key == 'preserve_tags':
+                self.preserve_tags = set(value)
+            else:
+                setattr(self, key, value)
+
+    def handle_tag(self, tag, attrs, start):
+        """Buffer preserved tags as HTML, fence <pre> with ```, otherwise defer to HTML2Text."""
+        # Handle preserved tags
+        if tag in self.preserve_tags:
+            if start:
+                if self.preserve_depth == 0:
+                    self.current_preserved_tag = tag
+                    self.preserved_content = []
+                    # Format opening tag with attributes
+                    attr_str = ''.join(f' {k}="{v}"' for k, v in attrs.items() if v is not None)
+                    self.preserved_content.append(f'<{tag}{attr_str}>')
+                self.preserve_depth += 1
+                return
+            else:
+                self.preserve_depth -= 1
+                if self.preserve_depth == 0:
+                    self.preserved_content.append(f'</{tag}>')
+                    # Output the preserved HTML block with proper spacing
+                    preserved_html = ''.join(self.preserved_content)
+                    self.o('\n' + preserved_html + '\n')
+                    self.current_preserved_tag = None
+                return
+
+        # If we're inside a preserved tag, collect all content
+        if self.preserve_depth > 0:
+            if start:
+                # Format nested tags with attributes
+                attr_str = ''.join(f' {k}="{v}"' for k, v in attrs.items() if v is not None)
+                self.preserved_content.append(f'<{tag}{attr_str}>')
+            else:
+                self.preserved_content.append(f'</{tag}>')
+            return
+
+        # Handle pre tags
+        if tag == 'pre':
+            if start:
+                self.o('```\n')
+                self.inside_pre = True
+            else:
+                self.o('\n```')
+                self.inside_pre = False
+        else:
+            super().handle_tag(tag, attrs, start)
+
+    def handle_data(self, data, entity_char=False):
+        """Override handle_data to capture content within preserved tags."""
+        if self.preserve_depth > 0:
+            self.preserved_content.append(data)
+            return
+        super().handle_data(data, entity_char)
+
+
+
 class InvalidCSSSelectorError(Exception):
     pass
 
diff --git a/crawl4ai/web_crawler.py b/crawl4ai/web_crawler.py
index 6cfef6f0..a32a988d 100644
--- a/crawl4ai/web_crawler.py
+++ b/crawl4ai/web_crawler.py
@@ -10,7 +10,7 @@ from .extraction_strategy import *
 from .crawler_strategy import *
 from typing import List
 from concurrent.futures import ThreadPoolExecutor
-from .content_scrapping_strategy import WebScrapingStrategy
+from .content_scraping_strategy import WebScrapingStrategy
 from .config import *
 import warnings
 import json
diff --git a/tests/async/test_content_scraper_strategy.py b/tests/async/test_content_scraper_strategy.py
index 5dfa6362..62c49148 100644
--- a/tests/async/test_content_scraper_strategy.py
+++ b/tests/async/test_content_scraper_strategy.py
@@ -13,8 +13,8 @@ parent_dir = os.path.dirname(os.path.dirname(os.path.dirname(os.path.abspath(__f
 sys.path.append(parent_dir)
 __location__ = os.path.realpath(os.path.join(os.getcwd(), os.path.dirname(__file__)))
 
-from crawl4ai.content_scrapping_strategy import WebScrapingStrategy
-from crawl4ai.content_scrapping_strategy import WebScrapingStrategy as WebScrapingStrategyCurrent
+from crawl4ai.content_scraping_strategy import WebScrapingStrategy
+from crawl4ai.content_scraping_strategy import WebScrapingStrategy as WebScrapingStrategyCurrent
 # from crawl4ai.content_scrapping_strategy_current import WebScrapingStrategy as WebScrapingStrategyCurrent
 
 @dataclass
diff --git a/tests/async/test_markdown_genertor.py b/tests/async/test_markdown_genertor.py
new file mode 100644
index 00000000..025a0318
--- /dev/null
+++ b/tests/async/test_markdown_genertor.py
@@ -0,0 +1,165 @@
+# ## Issue #236
+# - **Last Updated:** 2024-11-11 01:42:14
+# - **Title:** [user data crawling opens two windows, unable to control correct user browser](https://github.com/unclecode/crawl4ai/issues/236)
+# - **State:** open
+
+import asyncio
+import os
+import sys
+import time
+from typing import Dict, Any
+
+# This file lives in <repo>/tests/async/, so the repo root is three levels up.
+parent_dir = os.path.dirname(os.path.dirname(os.path.dirname(os.path.abspath(__file__))))
+sys.path.append(parent_dir)
+from crawl4ai.markdown_generation_strategy import DefaultMarkdownGenerationStrategy
+# Directory of this test file; fixture and output paths are built from it.
+__location__ = os.path.realpath(os.path.join(os.getcwd(), os.path.dirname(__file__)))
+
+def print_test_result(name: str, result: Dict[str, Any], execution_time: float):
+    """Print a timing banner for a test and save its string results as files.
+
+    Each ``str`` value in ``result`` is written to
+    ``<test dir>/output/<name.lower()>_<key>.md``; other values are skipped.
+    """
+    print(f"\n{'='*20} {name} {'='*20}")
+    print(f"Execution time: {execution_time:.4f} seconds")
+
+    # The output directory may not exist yet; create it instead of letting the
+    # first open() fail with FileNotFoundError.
+    output_dir = __location__ + "/output"
+    os.makedirs(output_dir, exist_ok=True)
+
+    for key, content in result.items():
+        if isinstance(content, str):
+            # Generated markdown can contain non-ASCII text, so pin the encoding.
+            with open(output_dir + f"/{name.lower()}_{key}.md", "w", encoding="utf-8") as f:
+                f.write(content)
+
+def test_basic_markdown_conversion():
+    """Convert the Wikipedia HTML fixture and check every markdown output is populated."""
+    # Read as UTF-8 explicitly instead of the platform default (assumes a UTF-8 fixture).
+    with open(__location__ + "/data/wikipedia.html", "r", encoding="utf-8") as f:
+        cleaned_html = f.read()
+
+    generator = DefaultMarkdownGenerationStrategy()
+    start_time = time.perf_counter()
+    result = generator.generate_markdown(
+        cleaned_html=cleaned_html,
+        base_url="https://en.wikipedia.org"
+    )
+    execution_time = time.perf_counter() - start_time
+
+    print_test_result("Basic Markdown Conversion", {
+        'raw': result.raw_markdown,
+        'with_citations': result.markdown_with_citations,
+        'references': result.references_markdown
+    }, execution_time)
+
+    # Basic assertions
+    assert result.raw_markdown, "Raw markdown should not be empty"
+    assert result.markdown_with_citations, "Markdown with citations should not be empty"
+    assert result.references_markdown, "References should not be empty"
+    assert "⟨" in result.markdown_with_citations, "Citations should use ⟨⟩ brackets"
+    assert "## References" in result.references_markdown, "Should contain references section"
+
+def test_relative_links():
+    """Relative hrefs should be resolved against base_url; absolute ones kept as-is."""
+    source_text = """
+    Here's a [relative link](/wiki/Apple) and an [absolute link](https://example.com).
+    Also an [image](/images/test.png) and another [page](/wiki/Banana).
+    """
+    references = DefaultMarkdownGenerationStrategy().generate_markdown(
+        cleaned_html=source_text,
+        base_url="https://en.wikipedia.org"
+    ).references_markdown
+
+    # Every expected absolute URL must appear in the generated reference list.
+    for expected_url in ("https://en.wikipedia.org/wiki/Apple",
+                         "https://example.com",
+                         "https://en.wikipedia.org/images/test.png"):
+        assert expected_url in references
+
+def test_duplicate_links():
+    """A URL that is linked twice should be cited under one shared number."""
+    source_text = """
+    Here's a [link](/test) and another [link](/test) and a [different link](/other).
+    """
+    strategy = DefaultMarkdownGenerationStrategy()
+    cited = strategy.generate_markdown(
+        cleaned_html=source_text,
+        base_url="https://example.com"
+    ).markdown_with_citations
+
+    # Both occurrences of /test are expected to carry the first citation marker.
+    first_marker = "⟨1⟩"
+    occurrences = cited.count(first_marker)
+    assert occurrences == 2, "Same link should use same citation number"
+
+def test_link_descriptions():
+    """Link titles and link texts should both show up in the reference list."""
+    source_text = """
+    Here's a [link with title](/test "Test Title") and a [link with description](/other) to test.
+    """
+
+    references = DefaultMarkdownGenerationStrategy().generate_markdown(
+        cleaned_html=source_text,
+        base_url="https://example.com"
+    ).references_markdown
+
+    # The quoted title and the plain link text are each expected verbatim.
+    assert "Test Title" in references, "Link title should be in references"
+    assert "link with description" in references, "Link text should be in references"
+
+def test_performance_large_document():
+    """Time five conversions of the Wikipedia markdown fixture and print the stats."""
+    # Read as UTF-8 explicitly rather than relying on the platform default
+    # (assumes the fixture is stored as UTF-8).
+    with open(__location__ + "/data/wikipedia.md", "r", encoding="utf-8") as f:
+        markdown = f.read()
+
+    iterations = 5
+    times = []
+    generator = DefaultMarkdownGenerationStrategy()
+
+    for _ in range(iterations):
+        start_time = time.perf_counter()
+        # The result is discarded on purpose; only the elapsed time is recorded.
+        generator.generate_markdown(
+            cleaned_html=markdown,
+            base_url="https://en.wikipedia.org"
+        )
+        times.append(time.perf_counter() - start_time)
+
+    avg_time = sum(times) / len(times)
+    print(f"\n{'='*20} Performance Test {'='*20}")
+    print(f"Average execution time over {iterations} iterations: {avg_time:.4f} seconds")
+    print(f"Min time: {min(times):.4f} seconds")
+    print(f"Max time: {max(times):.4f} seconds")
+
+def test_image_links():
+    """Image syntax should survive citation rewriting and image titles be referenced."""
+    source_text = """
+    Here's an ![image](/image.png "Image Title") and another ![image](/other.jpg).
+    And a regular [link](/page).
+    """
+
+    strategy = DefaultMarkdownGenerationStrategy()
+    outcome = strategy.generate_markdown(
+        cleaned_html=source_text,
+        base_url="https://example.com"
+    )
+    cited, references = outcome.markdown_with_citations, outcome.references_markdown
+    assert "![" in cited, "Image markdown syntax should be preserved"
+    assert "Image Title" in references, "Image title should be in references"
+
+if __name__ == "__main__":
+    print("Running markdown generation strategy tests...")
+    for run_test in (test_basic_markdown_conversion,
+                     test_relative_links,
+                     test_duplicate_links,
+                     test_link_descriptions,
+                     test_performance_large_document,
+                     test_image_links):
+        # Direct-run entry point: execute each test in definition order.
+        run_test()
\ No newline at end of file

From 006bee4a5a50fed10496b701ecfea350be1b7888 Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Fri, 22 Nov 2024 16:00:17 +0800
Subject: [PATCH 058/115] feat: enhance image processing capabilities -
 Enhanced image processing with srcset support and validation checks for
 better image selection.

---
 README.md                             |   4 +-
 crawl4ai/content_scraping_strategy.py | 145 ++++++++++++++++++++++++--
 crawl4ai/tools.py                     |  34 ++++++
 3 files changed, 172 insertions(+), 11 deletions(-)
 create mode 100644 crawl4ai/tools.py

diff --git a/README.md b/README.md
index af0d6610..1d3063c7 100644
--- a/README.md
+++ b/README.md
@@ -13,8 +13,10 @@ Crawl4AI simplifies asynchronous web crawling and data extraction, making it acc
 
 ## New in 0.3.74 ✨
 
-- 🚀 **Blazing Fast Scraping:** The scraping process is now significantly faster, often completing in under 100 milliseconds (excluding web fetch time)!
+- 🚀 **Blazing Fast Scraping:** The scraping process is now significantly faster!
 - 📥 **Download Manager:** Integrated file crawling and downloading capabilities, with full control over file management and tracking within the `CrawlResult` object.
+- 📝 **Markdown Generation Strategy:** Flexible markdown generation system supporting custom strategies for different use cases and output formats.
+- 🔗 **LLM-Friendly Citations:** Automatic conversion of links into numbered citations with organized reference lists, making content more digestible for large language models.
 - 🔎 **Markdown Filter:** Enhanced content extraction using BM25 algorithm to create cleaner markdown with only relevant webpage content.
 - 🗂️ **Local & Raw HTML:** Crawl local files (`file://`) and raw HTML strings (`raw:`) directly.
 - 🤖 **Browser Control:** Use your own browser setup for crawling, with persistent contexts and stealth integration to bypass anti-bot measures.
diff --git a/crawl4ai/content_scraping_strategy.py b/crawl4ai/content_scraping_strategy.py
index 3823a78d..3b41ec82 100644
--- a/crawl4ai/content_scraping_strategy.py
+++ b/crawl4ai/content_scraping_strategy.py
@@ -19,9 +19,9 @@ from .utils import (
     InvalidCSSSelectorError,
     CustomHTML2Text,
     normalize_url,
-    is_external_url
-    
+    is_external_url    
 )
+from .tools import profile_and_time
 
 # Pre-compile regular expressions for Open Graph and Twitter metadata
 OG_REGEX = re.compile(r'^og:')
@@ -234,7 +234,26 @@ class WebScrapingStrategy(ContentScrapingStrategy):
                             return text_content
                 return None
 
-        def process_image(img, url, index, total_images):
+        def process_image_old(img, url, index, total_images):
+            def parse_srcset(srcset_str):
+                """Parse srcset attribute into list of image URLs with their sizes."""
+                if not srcset_str:
+                    return []
+                
+                sources = []
+                # Split on http/https and filter empty strings
+                urls = [f"http{part}" for part in srcset_str.split("http") if part]
+                
+                for url in urls:
+                    # Remove trailing comma and whitespace, then split to get width
+                    url = url.strip().rstrip(',')
+                    parts = url.rsplit(' ', 1)
+                    img_url = parts[0].strip()
+                    width = parts[1].rstrip('w') if len(parts) > 1 else None
+                    sources.append({'url': img_url, 'width': width})
+                
+                return sources          
+            
             #Check if an image has valid display and inside undesired html elements
             def is_valid_image(img, parent, parent_classes):
                 style = img.get('style', '')
@@ -283,14 +302,14 @@ class WebScrapingStrategy(ContentScrapingStrategy):
                     score+=1
                 return score
 
-            
-            
             if not is_valid_image(img, img.parent, img.parent.get('class', [])):
                 return None
+                
             score = score_image_for_usefulness(img, url, index, total_images)
             if score <= kwargs.get('image_score_threshold', IMAGE_SCORE_THRESHOLD):
                 return None
-            return {
+
+            base_result = {
                 'src': img.get('src', ''),
                 'data-src': img.get('data-src', ''),
                 'alt': img.get('alt', ''),
@@ -299,6 +318,109 @@ class WebScrapingStrategy(ContentScrapingStrategy):
                 'type': 'image'
             }
 
+            sources = []
+            srcset = img.get('srcset', '')
+            if srcset:
+                sources = parse_srcset(srcset)
+                if sources:
+                    return [dict(base_result, src=source['url'], width=source['width']) 
+                        for source in sources]
+
+            return [base_result]  # Always return a list
+
+        def process_image(img, url, index, total_images):
+            """Validate and score one <img> tag and collect its source URL variants.
+
+            Returns a list of variant dicts, or None if filtered out, scored too low, or no URL.
+            """
+            def parse_srcset(srcset):
+                # Entries are found by splitting on "http" (absolute URLs only); the
+                # separator commas are trimmed so they cannot leak into url/width.
+                found = []
+                for part in srcset.split("http"):
+                    candidate = part.strip().rstrip(', ')
+                    if candidate:
+                        tokens = f"http{candidate}".split()
+                        descriptor = tokens[-1].rstrip('w') if len(tokens) > 1 else None
+                        found.append({'url': tokens[0], 'width': descriptor})
+                return found
+
+            classes_to_check = frozenset(['button', 'icon', 'logo'])
+            tags_to_check = frozenset(['button', 'input'])
+            style = img.get('style', '')
+            alt = img.get('alt', '')
+            src = img.get('src', '')
+            data_src = img.get('data-src', '')
+            width = img.get('width')
+            height = img.get('height')
+            parent = img.parent
+            parent_classes = parent.get('class', [])
+
+            # Reject hidden images and UI chrome; each keyword is searched *inside* the text.
+            if ('display:none' in style or
+                parent.name in tags_to_check or
+                any(kw in cls for cls in parent_classes for kw in classes_to_check) or
+                any(kw in src for kw in classes_to_check) or
+                any(kw in alt for kw in classes_to_check)):
+                return None
+
+            # +1 each: width > 150, height > 150, alt text, first half of images, known format.
+            score = 0
+            if width and width.isdigit() and int(width) > 150:
+                score += 1
+            if height and height.isdigit() and int(height) > 150:
+                score += 1
+            if alt:
+                score += 1
+            score += index/total_images < 0.5
+
+            if "data:image/" in src:
+                image_format = src.split(',')[0].split(';')[0].split('/')[1].split(';')[0]
+            else:
+                image_format = os.path.splitext(src)[1].lower().strip('.').split('?')[0]
+            if image_format in ('jpg', 'png', 'webp', 'avif'):
+                score += 1
+
+            if score <= kwargs.get('image_score_threshold', IMAGE_SCORE_THRESHOLD):
+                return None
+
+            unique_urls = set()  # URLs already emitted, for de-duplication
+            image_variants = []
+            base_info = {
+                'alt': alt,
+                'desc': find_closest_parent_with_useful_text(img),
+                'score': score,
+                'type': 'image'
+            }
+
+            def add_variant(src, width=None):
+                # Skip empty, inline data: and already-seen URLs.
+                if src and not src.startswith('data:') and src not in unique_urls:
+                    unique_urls.add(src)
+                    image_variants.append({**base_info, 'src': src, 'width': width})
+
+            add_variant(src)
+            add_variant(data_src)
+
+            for attr in ('srcset', 'data-srcset'):
+                if value := img.get(attr):
+                    for source in parse_srcset(value):
+                        add_variant(source['url'], source['width'])
+
+            # <picture> wrappers carry additional candidates on their <source> children.
+            if picture := img.find_parent('picture'):
+                for source in picture.find_all('source'):
+                    if srcset := source.get('srcset'):
+                        for candidate in parse_srcset(srcset):
+                            add_variant(candidate['url'], candidate['width'])
+
+            # Other data-* attributes whose name mentions "src" and whose value has an http URL.
+            for attr, value in img.attrs.items():
+                if attr.startswith('data-') and ('src' in attr or 'srcset' in attr) and 'http' in value:
+                    add_variant(value)
+
+            return image_variants if image_variants else None
+
         def remove_unwanted_attributes(element, important_attrs, keep_data_attributes=False):
             attrs_to_remove = []
             for attr in element.attrs:
@@ -490,13 +612,16 @@ class WebScrapingStrategy(ContentScrapingStrategy):
         links['internal'] = list(internal_links_dict.values())
         links['external'] = list(external_links_dict.values())
 
-
         # # Process images using ThreadPoolExecutor
         imgs = body.find_all('img')
         
-        with ThreadPoolExecutor() as executor:
-            image_results = list(executor.map(process_image, imgs, [url]*len(imgs), range(len(imgs)), [len(imgs)]*len(imgs)))
-        media['images'] = [result for result in image_results if result is not None]
+        # For test we use for loop instead of thread
+        media['images'] = [
+            img for result in (process_image(img, url, i, len(imgs)) 
+                            for i, img in enumerate(imgs))
+            if result is not None
+            for img in result
+        ]
 
         def flatten_nested_elements(node):
             if isinstance(node, NavigableString):
diff --git a/crawl4ai/tools.py b/crawl4ai/tools.py
new file mode 100644
index 00000000..ff36b53a
--- /dev/null
+++ b/crawl4ai/tools.py
@@ -0,0 +1,34 @@
+import time
+import cProfile
+import pstats
+from functools import wraps
+
+def profile_and_time(func):
+    """Decorate a method so every call prints its wall time and cProfile stats.
+
+    The wrapper takes ``self`` explicitly, so ``func`` is expected to be a method.
+    After a successful call it prints the elapsed time and the 20 entries with
+    the highest cumulative time, then returns the call's result unchanged.
+    """
+    @wraps(func)
+    def wrapper(self, *args, **kwargs):
+        start_time = time.perf_counter()
+
+        # Setup profiler
+        profiler = cProfile.Profile()
+        profiler.enable()
+        try:
+            result = func(self, *args, **kwargs)
+        finally:
+            # Always stop profiling; otherwise an exception in func would leave
+            # the profiler running while the exception propagates.
+            profiler.disable()
+
+        elapsed_time = time.perf_counter() - start_time
+        print(f"[PROFILER] Scraping completed in {elapsed_time:.2f} seconds")
+
+        stats = pstats.Stats(profiler)
+        stats.sort_stats('cumulative')  # Sort by cumulative time
+        stats.print_stats(20)  # Print top 20 time-consuming functions
+        return result
+    return wrapper
\ No newline at end of file

From 571dda6549da3c31a5f7566359585eefe9ad2867 Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Fri, 22 Nov 2024 18:27:43 +0800
Subject: [PATCH 059/115] Update Readme

---
 README.md | 1 +
 1 file changed, 1 insertion(+)

diff --git a/README.md b/README.md
index 1d3063c7..e3ced79e 100644
--- a/README.md
+++ b/README.md
@@ -18,6 +18,7 @@ Crawl4AI simplifies asynchronous web crawling and data extraction, making it acc
 - 📝 **Markdown Generation Strategy:** Flexible markdown generation system supporting custom strategies for different use cases and output formats.
 - 🔗 **LLM-Friendly Citations:** Automatic conversion of links into numbered citations with organized reference lists, making content more digestible for large language models.
 - 🔎 **Markdown Filter:** Enhanced content extraction using BM25 algorithm to create cleaner markdown with only relevant webpage content.
+- 🖼️ **Enhanced Image Extraction:** Supports srcset, picture elements, and responsive images. 
 - 🗂️ **Local & Raw HTML:** Crawl local files (`file://`) and raw HTML strings (`raw:`) directly.
 - 🤖 **Browser Control:** Use your own browser setup for crawling, with persistent contexts and stealth integration to bypass anti-bot measures.
 - ☁️ **API & Cache Boost:** CORS support, static file serving, and a new filesystem-based cache for blazing-fast performance. Fine-tune caching with the `CacheMode` enum (ENABLED, DISABLED, READ_ONLY, WRITE_ONLY, BYPASS) and the `always_bypass_cache` parameter.

From 24ad2fe2ddc11250bdd90d42c127a85cbfdb8fd5 Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Fri, 22 Nov 2024 18:47:17 +0800
Subject: [PATCH 060/115] feat: enhance Markdown generation to include fit_html
 attribute

---
 crawl4ai/content_scraping_strategy.py    | 13 +++----------
 crawl4ai/markdown_generation_strategy.py |  3 ++-
 crawl4ai/models.py                       |  1 +
 3 files changed, 6 insertions(+), 11 deletions(-)

diff --git a/crawl4ai/content_scraping_strategy.py b/crawl4ai/content_scraping_strategy.py
index 3b41ec82..d4b901d2 100644
--- a/crawl4ai/content_scraping_strategy.py
+++ b/crawl4ai/content_scraping_strategy.py
@@ -109,25 +109,18 @@ class WebScrapingStrategy(ContentScrapingStrategy):
         
         if markdown_generator:
             try:
-                markdown_result = markdown_generator.generate_markdown(
+                markdown_result: MarkdownGenerationResult = markdown_generator.generate_markdown(
                     cleaned_html=cleaned_html,
                     base_url=url,
                     html2text_options=kwargs.get('html2text', {}),
                     content_filter=kwargs.get('content_filter', None)
                 )
                 
-                markdown_v2 = MarkdownGenerationResult(
-                    raw_markdown=markdown_result.raw_markdown,
-                    markdown_with_citations=markdown_result.markdown_with_citations,
-                    references_markdown=markdown_result.references_markdown,
-                    fit_markdown=markdown_result.fit_markdown
-                )
-
                 return {
                     'markdown': markdown_result.raw_markdown,  
                     'fit_markdown': markdown_result.fit_markdown or "Set flag 'fit_markdown' to True to get cleaned HTML content.",
-                    'fit_html': kwargs.get('content_filter', None).filter_content(html) if kwargs.get('content_filter') else "Set flag 'fit_markdown' to True to get cleaned HTML content.",
-                    'markdown_v2': markdown_v2
+                    'fit_html': markdown_result.fit_html or "Set flag 'fit_markdown' to True to get cleaned HTML content.",
+                    'markdown_v2': markdown_result
                 }
             except Exception as e:
                 self._log('error',
diff --git a/crawl4ai/markdown_generation_strategy.py b/crawl4ai/markdown_generation_strategy.py
index 1adb4c28..7922c413 100644
--- a/crawl4ai/markdown_generation_strategy.py
+++ b/crawl4ai/markdown_generation_strategy.py
@@ -100,7 +100,8 @@ class DefaultMarkdownGenerationStrategy(MarkdownGenerationStrategy):
             raw_markdown=raw_markdown,
             markdown_with_citations=markdown_with_citations,
             references_markdown=references_markdown,
-            fit_markdown=fit_markdown
+            fit_markdown=fit_markdown,
+            fit_html=filtered_html
         )
 
 def fast_urljoin(base: str, url: str) -> str:
diff --git a/crawl4ai/models.py b/crawl4ai/models.py
index 122434ad..3a1b8bd1 100644
--- a/crawl4ai/models.py
+++ b/crawl4ai/models.py
@@ -12,6 +12,7 @@ class MarkdownGenerationResult(BaseModel):
     markdown_with_citations: str
     references_markdown: str
     fit_markdown: Optional[str] = None
+    fit_html: Optional[str] = None
 
 class CrawlResult(BaseModel):
     url: str

From e02935dc5b1fee1734f12fb60145193c2b9f5645 Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Fri, 22 Nov 2024 18:49:22 +0800
Subject: [PATCH 061/115] chore: update README to reflect new features and
 improvements in version 0.3.74

---
 README.md | 24 ++++++++++++------------
 1 file changed, 12 insertions(+), 12 deletions(-)

diff --git a/README.md b/README.md
index e3ced79e..b0f9fff9 100644
--- a/README.md
+++ b/README.md
@@ -13,18 +13,18 @@ Crawl4AI simplifies asynchronous web crawling and data extraction, making it acc
 
 ## New in 0.3.74 ✨
 
-- 🚀 **Blazing Fast Scraping:** The scraping process is now significantly faster!
-- 📥 **Download Manager:** Integrated file crawling and downloading capabilities, with full control over file management and tracking within the `CrawlResult` object.
-- 📝 **Markdown Generation Strategy:** Flexible markdown generation system supporting custom strategies for different use cases and output formats.
-- 🔗 **LLM-Friendly Citations:** Automatic conversion of links into numbered citations with organized reference lists, making content more digestible for large language models.
-- 🔎 **Markdown Filter:** Enhanced content extraction using BM25 algorithm to create cleaner markdown with only relevant webpage content.
-- 🖼️ **Enhanced Image Extraction:** Supports srcset, picture elements, and responsive images. 
-- 🗂️ **Local & Raw HTML:** Crawl local files (`file://`) and raw HTML strings (`raw:`) directly.
-- 🤖 **Browser Control:** Use your own browser setup for crawling, with persistent contexts and stealth integration to bypass anti-bot measures.
-- ☁️ **API & Cache Boost:** CORS support, static file serving, and a new filesystem-based cache for blazing-fast performance. Fine-tune caching with the `CacheMode` enum (ENABLED, DISABLED, READ_ONLY, WRITE_ONLY, BYPASS) and the `always_bypass_cache` parameter.
-- 🐳 **API Gateway:** Run Crawl4AI as a local or cloud API service, enabling cross-platform usage through a containerized server with secure token authentication via `CRAWL4AI_API_TOKEN`.
-- 🛠️ **Database Improvements:** Enhanced database system for handling larger content sets with improved caching and faster performance.
-- 🐛 **Squashed Bugs:** Fixed browser context issues in Docker, memory leaks, enhanced error handling, and improved HTML parsing.
+🚀 **Blazing Fast Scraping**: Significantly improved scraping speed.  
+📥 **Download Manager**: Integrated file crawling, downloading, and tracking within `CrawlResult`.  
+📝 **Markdown Strategy**: Flexible system for custom markdown generation and formats.  
+🔗 **LLM-Friendly Citations**: Auto-converts links to numbered citations with reference lists.  
+🔎 **Markdown Filter**: BM25-based content extraction for cleaner, relevant markdown.  
+🖼️ **Image Extraction**: Supports `srcset`, `picture`, and responsive image formats.  
+🗂️ **Local/Raw HTML**: Crawl `file://` paths and raw HTML (`raw:`) directly.  
+🤖 **Browser Control**: Custom browser setups with stealth integration to bypass bots.  
+☁️ **API & Cache Boost**: CORS, static serving, and enhanced filesystem-based caching.  
+🐳 **API Gateway**: Run as an API service with secure token authentication.  
+🛠️ **Database Upgrades**: Optimized for larger content sets with faster caching.  
+🐛 **Bug Fixes**: Resolved browser context issues, memory leaks, and improved error handling.
 
 ## Try it Now!
 

From 8dea3f470f5a496a30dada1eab1c3b23ee3560ca Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Fri, 22 Nov 2024 18:50:12 +0800
Subject: [PATCH 062/115] chore: update README to include new features and
 improvements for version 0.3.74

---
 README.md | 25 +++++++++++++------------
 1 file changed, 13 insertions(+), 12 deletions(-)

diff --git a/README.md b/README.md
index b0f9fff9..fa88a507 100644
--- a/README.md
+++ b/README.md
@@ -13,18 +13,19 @@ Crawl4AI simplifies asynchronous web crawling and data extraction, making it acc
 
 ## New in 0.3.74 ✨
 
-🚀 **Blazing Fast Scraping**: Significantly improved scraping speed.  
-📥 **Download Manager**: Integrated file crawling, downloading, and tracking within `CrawlResult`.  
-📝 **Markdown Strategy**: Flexible system for custom markdown generation and formats.  
-🔗 **LLM-Friendly Citations**: Auto-converts links to numbered citations with reference lists.  
-🔎 **Markdown Filter**: BM25-based content extraction for cleaner, relevant markdown.  
-🖼️ **Image Extraction**: Supports `srcset`, `picture`, and responsive image formats.  
-🗂️ **Local/Raw HTML**: Crawl `file://` paths and raw HTML (`raw:`) directly.  
-🤖 **Browser Control**: Custom browser setups with stealth integration to bypass bots.  
-☁️ **API & Cache Boost**: CORS, static serving, and enhanced filesystem-based caching.  
-🐳 **API Gateway**: Run as an API service with secure token authentication.  
-🛠️ **Database Upgrades**: Optimized for larger content sets with faster caching.  
-🐛 **Bug Fixes**: Resolved browser context issues, memory leaks, and improved error handling.
+- 🚀 **Blazing Fast Scraping**: Significantly improved scraping speed.  
+- 📥 **Download Manager**: Integrated file crawling, downloading, and tracking within `CrawlResult`.  
+- 📝 **Markdown Strategy**: Flexible system for custom markdown generation and formats.  
+- 🔗 **LLM-Friendly Citations**: Auto-converts links to numbered citations with reference lists.  
+- 🔎 **Markdown Filter**: BM25-based content extraction for cleaner, relevant markdown.  
+- 🖼️ **Image Extraction**: Supports `srcset`, `picture`, and responsive image formats.  
+- 🗂️ **Local/Raw HTML**: Crawl `file://` paths and raw HTML (`raw:`) directly.  
+- 🤖 **Browser Control**: Custom browser setups with stealth integration to bypass bots.  
+- ☁️ **API & Cache Boost**: CORS, static serving, and enhanced filesystem-based caching.  
+- 🐳 **API Gateway**: Run as an API service with secure token authentication.  
+- 🛠️ **Database Upgrades**: Optimized for larger content sets with faster caching.  
+- 🐛 **Bug Fixes**: Resolved browser context issues, memory leaks, and improved error handling.
+
 
 ## Try it Now!
 

From 0d0cef343842af2aa369423790e159620e717f6c Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Fri, 22 Nov 2024 20:14:58 +0800
Subject: [PATCH 063/115] feat: add enhanced markdown generation example with
 citations and file output

---
 docs/examples/v0.3.74.overview.py | 109 ++++++++++++++++++++----------
 1 file changed, 74 insertions(+), 35 deletions(-)

diff --git a/docs/examples/v0.3.74.overview.py b/docs/examples/v0.3.74.overview.py
index 00296740..362ae8fc 100644
--- a/docs/examples/v0.3.74.overview.py
+++ b/docs/examples/v0.3.74.overview.py
@@ -52,34 +52,7 @@ async def download_example():
         else:
             print("\nNo files were downloaded")
 
-# 2. Content Filtering with BM25 Example
-async def content_filtering_example():
-    """Example of using the new BM25 content filtering"""
-    async with AsyncWebCrawler(verbose=True) as crawler:
-        # Create filter with custom query for OpenAI's blog
-        content_filter = BM25ContentFilter(
-            # user_query="Investment and fundraising",
-            # user_query="Robotic",
-            bm25_threshold=1.0
-        )
-        
-        result = await crawler.arun(
-            url="https://techcrunch.com/",
-            content_filter=content_filter,
-            cache_mode=CacheMode.BYPASS
-        )
-        
-        print(f"Filtered content: {len(result.fit_markdown)}")
-        print(f"Filtered content: {result.fit_markdown}")
-        
-        # Save html 
-        with open(os.path.join(__data__, "techcrunch.html"), "w") as f:
-            f.write(result.fit_html)
-        
-        with open(os.path.join(__data__, "filtered_content.md"), "w") as f:
-            f.write(result.fit_markdown)
-
-# 3. Local File and Raw HTML Processing Example
+# 2. Local File and Raw HTML Processing Example
 async def local_and_raw_html_example():
     """Example of processing local files and raw HTML"""
     # Create a sample HTML file
@@ -115,6 +88,68 @@ async def local_and_raw_html_example():
         print("Local file content:", local_result.markdown)
         print("\nRaw HTML content:", raw_result.markdown)
 
+# 3. Enhanced Markdown Generation Example
+async def markdown_generation_example():
+    """Example of enhanced markdown generation with citations and LLM-friendly features"""
+    async with AsyncWebCrawler(verbose=True) as crawler:
+        # Create a content filter (optional)
+        content_filter = BM25ContentFilter(
+            # user_query="History and cultivation",
+            bm25_threshold=1.0
+        )
+        
+        result = await crawler.arun(
+            url="https://en.wikipedia.org/wiki/Apple",
+            css_selector="main div#bodyContent",
+            content_filter=content_filter,
+            cache_mode=CacheMode.BYPASS
+        )
+        
+        from crawl4ai import AsyncWebCrawler
+        from crawl4ai.content_filter_strategy import BM25ContentFilter
+        
+        result = await crawler.arun(
+            url="https://en.wikipedia.org/wiki/Apple",
+            css_selector="main div#bodyContent",
+            content_filter=BM25ContentFilter()
+        )
+        print(result.markdown_v2.fit_markdown)
+        
+        print("\nMarkdown Generation Results:")
+        print(f"1. Original markdown length: {len(result.markdown)}")
+        print(f"2. New markdown versions (markdown_v2):")
+        print(f"   - Raw markdown length: {len(result.markdown_v2.raw_markdown)}")
+        print(f"   - Citations markdown length: {len(result.markdown_v2.markdown_with_citations)}")
+        print(f"   - References section length: {len(result.markdown_v2.references_markdown)}")
+        if result.markdown_v2.fit_markdown:
+            print(f"   - Filtered markdown length: {len(result.markdown_v2.fit_markdown)}")
+        
+        # Save examples to files
+        output_dir = os.path.join(__data__, "markdown_examples")
+        os.makedirs(output_dir, exist_ok=True)
+        
+        # Save different versions
+        with open(os.path.join(output_dir, "1_raw_markdown.md"), "w") as f:
+            f.write(result.markdown_v2.raw_markdown)
+            
+        with open(os.path.join(output_dir, "2_citations_markdown.md"), "w") as f:
+            f.write(result.markdown_v2.markdown_with_citations)
+            
+        with open(os.path.join(output_dir, "3_references.md"), "w") as f:
+            f.write(result.markdown_v2.references_markdown)
+            
+        if result.markdown_v2.fit_markdown:
+            with open(os.path.join(output_dir, "4_filtered_markdown.md"), "w") as f:
+                f.write(result.markdown_v2.fit_markdown)
+                
+        print(f"\nMarkdown examples saved to: {output_dir}")
+        
+        # Show a sample of citations and references
+        print("\nSample of markdown with citations:")
+        print(result.markdown_v2.markdown_with_citations[:500] + "...\n")
+        print("Sample of references:")
+        print('\n'.join(result.markdown_v2.references_markdown.split('\n')[:10]) + "...")
+
 # 4. Browser Management Example
 async def browser_management_example():
     """Example of using enhanced browser management features"""
@@ -208,9 +243,13 @@ async def api_example():
                     headers=headers
                 ) as status_response:
                     result = await status_response.json()
-                    print(f"Task result: {result}")
+                    print(f"Task status: {result['status']}")
                     
                     if result["status"] == "completed":
+                        print("Task completed!")
+                        print("Results:")
+                        news = json.loads(result["results"][0]['extracted_content'])
+                        print(json.dumps(news[:4], indent=2))
                         break
                     else:
                         await asyncio.sleep(1)
@@ -220,15 +259,15 @@ async def main():
     # print("Running Crawl4AI feature examples...")
     
     # print("\n1. Running Download Example:")
-    await download_example()
+    # await download_example()
     
-    # print("\n2. Running Content Filtering Example:")
-    await content_filtering_example()
+    # print("\n2. Running Markdown Generation Example:")
+    # await markdown_generation_example()
     
-    # print("\n3. Running Local and Raw HTML Example:")
-    await local_and_raw_html_example()
+    # # print("\n3. Running Local and Raw HTML Example:")
+    # await local_and_raw_html_example()
     
-    # print("\n4. Running Browser Management Example:")
+    # # print("\n4. Running Browser Management Example:")
     await browser_management_example()
     
     # print("\n5. Running API Example:")

From d729aa7d5edf9dab069af06e0c4ade1ca997eef7 Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Sat, 23 Nov 2024 18:00:32 +0800
Subject: [PATCH 064/115] refactor: Add group ID for images extracted from
 srcset.

---
 crawl4ai/content_scraping_strategy.py | 25 ++++++-------------------
 1 file changed, 6 insertions(+), 19 deletions(-)

diff --git a/crawl4ai/content_scraping_strategy.py b/crawl4ai/content_scraping_strategy.py
index d4b901d2..70a43240 100644
--- a/crawl4ai/content_scraping_strategy.py
+++ b/crawl4ai/content_scraping_strategy.py
@@ -228,24 +228,7 @@ class WebScrapingStrategy(ContentScrapingStrategy):
                 return None
 
         def process_image_old(img, url, index, total_images):
-            def parse_srcset(srcset_str):
-                """Parse srcset attribute into list of image URLs with their sizes."""
-                if not srcset_str:
-                    return []
-                
-                sources = []
-                # Split on http/https and filter empty strings
-                urls = [f"http{part}" for part in srcset_str.split("http") if part]
-                
-                for url in urls:
-                    # Remove trailing comma and whitespace, then split to get width
-                    url = url.strip().rstrip(',')
-                    parts = url.rsplit(' ', 1)
-                    img_url = parts[0].strip()
-                    width = parts[1].rstrip('w') if len(parts) > 1 else None
-                    sources.append({'url': img_url, 'width': width})
-                
-                return sources          
+                   
             
             #Check if an image has valid display and inside undesired html elements
             def is_valid_image(img, parent, parent_classes):
@@ -376,12 +359,16 @@ class WebScrapingStrategy(ContentScrapingStrategy):
             unique_urls = set()
             image_variants = []
             
+            # Generate a unique group ID for this set of variants
+            group_id = index 
+            
             # Base image info template
             base_info = {
                 'alt': alt,
                 'desc': find_closest_parent_with_useful_text(img),
                 'score': score,
-                'type': 'image'
+                'type': 'image',
+                'group_id': group_id # Group ID for this set of variants
             }
 
             # Inline function for adding variants

From 829a1f7992703064084826e0ebfeed819988c6e7 Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Sat, 23 Nov 2024 19:45:41 +0800
Subject: [PATCH 065/115] feat: update version to 0.3.741 and enhance content
 filtering with heuristic strategy. Fix the issue that occurs when the HTML
 passed to the BM25 content filter does not have any HTML elements.

---
 crawl4ai/__version__.py               |   2 +-
 crawl4ai/content_filter_strategy.py   | 188 +++++++++++++++++++++++++-
 crawl4ai/content_scraping_strategy.py |   8 +-
 3 files changed, 189 insertions(+), 9 deletions(-)

diff --git a/crawl4ai/__version__.py b/crawl4ai/__version__.py
index 65ee6e73..05bfd336 100644
--- a/crawl4ai/__version__.py
+++ b/crawl4ai/__version__.py
@@ -1,2 +1,2 @@
 # crawl4ai/_version.py
-__version__ = "0.3.74"
\ No newline at end of file
+__version__ = "0.3.741"
\ No newline at end of file
diff --git a/crawl4ai/content_filter_strategy.py b/crawl4ai/content_filter_strategy.py
index 88216f7f..e6891a3f 100644
--- a/crawl4ai/content_filter_strategy.py
+++ b/crawl4ai/content_filter_strategy.py
@@ -10,6 +10,13 @@ from abc import ABC, abstractmethod
 
 from snowballstemmer import stemmer
 
+
+# import regex
+# def tokenize_text(text):
+#     # Regular expression to match words or CJK (Chinese, Japanese, Korean) characters
+#     pattern = r'\p{L}+|\p{N}+|[\p{Script=Han}\p{Script=Hiragana}\p{Script=Katakana}ー]|[\p{P}]'
+#     return regex.findall(pattern, text)
+
 # from nltk.stem import PorterStemmer
 # ps = PorterStemmer()
 class RelevantContentFilter(ABC):
@@ -57,9 +64,14 @@ class RelevantContentFilter(ABC):
         query_parts = []
         
         # Title
-        if soup.title:
-            query_parts.append(soup.title.string)
-        elif soup.find('h1'):
+        try:
+            title = soup.title.string
+            if title:
+                query_parts.append(title)
+        except Exception:
+            pass
+
+        if soup.find('h1'):
             query_parts.append(soup.find('h1').get_text())
             
         # Meta tags
@@ -81,7 +93,7 @@ class RelevantContentFilter(ABC):
         return ' '.join(filter(None, query_parts))
 
 
-    def extract_text_chunks(self, body: Tag) -> List[Tuple[str, str]]:
+    def extract_text_chunks(self, body: Tag, min_word_threshold: int = None) -> List[Tuple[str, str]]:
         """
         Extracts text chunks from a BeautifulSoup body element while preserving order.
         Returns list of tuples (text, tag_name) for classification.
@@ -155,6 +167,9 @@ class RelevantContentFilter(ABC):
             if text:
                 chunks.append((chunk_index, text, 'content', body))
         
+        if min_word_threshold:
+            chunks = [chunk for chunk in chunks if len(chunk[1].split()) >= min_word_threshold]
+        
         return chunks    
     
 
@@ -274,15 +289,26 @@ class BM25ContentFilter(RelevantContentFilter):
         }
         self.stemmer = stemmer(language)
 
-    def filter_content(self, html: str) -> List[str]:
+    def filter_content(self, html: str, min_word_threshold: int = None) -> List[str]:
         """Implements content filtering using BM25 algorithm with priority tag handling"""
         if not html or not isinstance(html, str):
             return []
 
         soup = BeautifulSoup(html, 'lxml')
+        
+        # Check if body is present
+        if not soup.body:
+            # Wrap in body tag if missing
+            soup = BeautifulSoup(f'<body>{html}</body>', 'lxml')        
         body = soup.find('body')
-        query = self.extract_page_query(soup.find('head'), body)
-        candidates = self.extract_text_chunks(body)
+        
+        query = self.extract_page_query(soup, body)
+        
+        if not query:
+            return []
+            # return [self.clean_element(soup)]
+            
+        candidates = self.extract_text_chunks(body, min_word_threshold)
 
         if not candidates:
             return []
@@ -299,6 +325,10 @@ class BM25ContentFilter(RelevantContentFilter):
                    for _, chunk, _, _ in candidates]
         tokenized_query = [self.stemmer.stemWord(word) for word in query.lower().split()]
 
+        # tokenized_corpus = [[self.stemmer.stemWord(word) for word in tokenize_text(chunk.lower())] 
+        #            for _, chunk, _, _ in candidates]
+        # tokenized_query = [self.stemmer.stemWord(word) for word in tokenize_text(query.lower())]
+
         # Clean from stop words and noise
         tokenized_corpus = [clean_tokens(tokens) for tokens in tokenized_corpus]
         tokenized_query = clean_tokens(tokenized_query)
@@ -326,3 +356,147 @@ class BM25ContentFilter(RelevantContentFilter):
         selected_candidates.sort(key=lambda x: x[0])
 
         return [self.clean_element(tag) for _, _, tag in selected_candidates]
+
+
+class HeuristicContentFilter(RelevantContentFilter):
+    def __init__(self):
+        super().__init__()
+        # Weights for different heuristics
+        self.tag_weights = {
+            'article': 10,
+            'main': 8,
+            'section': 5,
+            'div': 3,
+            'p': 2,
+            'pre': 2,
+            'code': 2,
+            'blockquote': 2,
+            'li': 1,
+            'span': 1,
+        }
+        self.max_depth = 5  # Maximum depth from body to consider
+
+    def filter_content(self, html: str) -> List[str]:
+        """Implements heuristic content filtering without relying on a query."""
+        if not html or not isinstance(html, str):
+            return []
+
+        soup = BeautifulSoup(html, 'lxml')
+
+        # Ensure there is a body tag
+        if not soup.body:
+            soup = BeautifulSoup(f'<body>{html}</body>', 'lxml')
+        body = soup.body
+
+        # Extract candidate text chunks
+        candidates = self.extract_text_chunks(body)
+
+        if not candidates:
+            return []
+
+        # Score each candidate
+        scored_candidates = []
+        for index, text, tag_type, tag in candidates:
+            score = self.score_element(tag, text)
+            if score > 0:
+                scored_candidates.append((score, index, text, tag))
+
+        # Sort candidates by score and then by document order
+        scored_candidates.sort(key=lambda x: (-x[0], x[1]))
+
+        # Extract the top candidates (e.g., top 5)
+        top_candidates = scored_candidates[:5]  # Adjust the number as needed
+
+        # Sort the top candidates back to their original document order
+        top_candidates.sort(key=lambda x: x[1])
+
+        # Clean and return the content
+        return [self.clean_element(tag) for _, _, _, tag in top_candidates]
+
+    def score_element(self, tag: Tag, text: str) -> float:
+        """Compute a score for an element based on heuristics."""
+        if not text or not tag:
+            return 0
+
+        # Exclude unwanted tags
+        if self.is_excluded(tag):
+            return 0
+
+        # Text density
+        text_length = len(text.strip())
+        html_length = len(str(tag))
+        text_density = text_length / html_length if html_length > 0 else 0
+
+        # Link density
+        link_text_length = sum(len(a.get_text().strip()) for a in tag.find_all('a'))
+        link_density = link_text_length / text_length if text_length > 0 else 0
+
+        # Tag weight
+        tag_weight = self.tag_weights.get(tag.name, 1)
+
+        # Depth factor (prefer elements closer to the body tag)
+        depth = self.get_depth(tag)
+        depth_weight = max(self.max_depth - depth, 1) / self.max_depth
+
+        # Compute the final score
+        score = (text_density * tag_weight * depth_weight) / (1 + link_density)
+
+        return score
+
+    def get_depth(self, tag: Tag) -> int:
+        """Compute the depth of the tag from the body tag."""
+        depth = 0
+        current = tag
+        while current and current != current.parent and current.name != 'body':
+            current = current.parent
+            depth += 1
+        return depth
+
+    def extract_text_chunks(self, body: Tag) -> List[Tuple[int, str, str, Tag]]:
+        """
+        Extracts text chunks from the body element while preserving order.
+        Returns list of tuples (index, text, tag_type, tag) for scoring.
+        """
+        chunks = []
+        index = 0
+
+        def traverse(element):
+            nonlocal index
+            if isinstance(element, NavigableString):
+                return
+            if not isinstance(element, Tag):
+                return
+            if self.is_excluded(element):
+                return
+            # Only consider included tags
+            if element.name in self.included_tags:
+                text = element.get_text(separator=' ', strip=True)
+                if len(text.split()) >= self.min_word_count:
+                    tag_type = 'header' if element.name in self.header_tags else 'content'
+                    chunks.append((index, text, tag_type, element))
+                    index += 1
+                    # Do not traverse children of this element to prevent duplication
+                    return
+            for child in element.children:
+                traverse(child)
+
+        traverse(body)
+        return chunks
+
+    def is_excluded(self, tag: Tag) -> bool:
+        """Determine if a tag should be excluded based on heuristics."""
+        if tag.name in self.excluded_tags:
+            return True
+        class_id = ' '.join(filter(None, [
+            ' '.join(tag.get('class', [])),
+            tag.get('id', '')
+        ]))
+        if self.negative_patterns.search(class_id):
+            return True
+        # Exclude tags with high link density (e.g., navigation menus)
+        text = tag.get_text(separator=' ', strip=True)
+        link_text_length = sum(len(a.get_text(strip=True)) for a in tag.find_all('a'))
+        text_length = len(text)
+        if text_length > 0 and (link_text_length / text_length) > 0.5:
+            return True
+        return False
diff --git a/crawl4ai/content_scraping_strategy.py b/crawl4ai/content_scraping_strategy.py
index 70a43240..ea6a2ef8 100644
--- a/crawl4ai/content_scraping_strategy.py
+++ b/crawl4ai/content_scraping_strategy.py
@@ -9,7 +9,7 @@ from bs4 import element, NavigableString, Comment
 from urllib.parse import urljoin
 from requests.exceptions import InvalidSchema
 # from .content_cleaning_strategy import ContentCleaningStrategy
-from .content_filter_strategy import RelevantContentFilter, BM25ContentFilter
+from .content_filter_strategy import RelevantContentFilter, BM25ContentFilter#, HeuristicContentFilter
 from .markdown_generation_strategy import MarkdownGenerationStrategy, DefaultMarkdownGenerationStrategy
 from .models import MarkdownGenerationResult
 from .utils import (
@@ -129,6 +129,12 @@ class WebScrapingStrategy(ContentScrapingStrategy):
                     params={"error": str(e)}
                 )
                 markdown_generator = None
+                return {
+                    'markdown': f"Error using new markdown generation strategy: {str(e)}",
+                    'fit_markdown': "Set flag 'fit_markdown' to True to get cleaned HTML content.",
+                    'fit_html': "Set flag 'fit_markdown' to True to get cleaned HTML content.",
+                    'markdown_v2': None                    
+                }
 
         # Legacy method
         h = CustomHTML2Text()

From edad7b6a742249f324d3baba01095f93fc05912f Mon Sep 17 00:00:00 2001
From: unclecode <unclecode@kidocode.com>
Date: Sun, 24 Nov 2024 18:48:39 +0800
Subject: [PATCH 066/115] chore: remove Railway deployment configuration and
 related documentation

---
 deploy/railway/README.md        |  19 -
 deploy/railway/button.json      |  33 --
 deploy/railway/railway.toml     |  18 -
 pages/app.css                   | 131 -----
 pages/app.js                    | 356 ------------
 pages/index copy.html           | 971 --------------------------------
 pages/index.html                |  73 ---
 pages/index_pooling.html        | 425 --------------
 pages/partial/footer.html       |  36 --
 pages/partial/how_to_guide.html | 174 ------
 pages/partial/installation.html |  65 ---
 pages/partial/try_it.html       | 217 -------
 pages/tmp.html                  | 434 --------------
 13 files changed, 2952 deletions(-)
 delete mode 100644 deploy/railway/README.md
 delete mode 100644 deploy/railway/button.json
 delete mode 100644 deploy/railway/railway.toml
 delete mode 100644 pages/app.css
 delete mode 100644 pages/app.js
 delete mode 100644 pages/index copy.html
 delete mode 100644 pages/index.html
 delete mode 100644 pages/index_pooling.html
 delete mode 100644 pages/partial/footer.html
 delete mode 100644 pages/partial/how_to_guide.html
 delete mode 100644 pages/partial/installation.html
 delete mode 100644 pages/partial/try_it.html
 delete mode 100644 pages/tmp.html

diff --git a/deploy/railway/README.md b/deploy/railway/README.md
deleted file mode 100644
index 155e7642..00000000
--- a/deploy/railway/README.md
+++ /dev/null
@@ -1,19 +0,0 @@
-# Railway Deployment
-
-## Quick Deploy
-[![Deploy on Railway](https://railway.app/button.svg)](https://railway.app/template/crawl4ai)
-
-## Manual Setup
-1. Fork this repository
-2. Create a new Railway project 
-3. Configure environment variables:
-   - `INSTALL_TYPE`: basic or all
-   - `ENABLE_GPU`: true/false
-4. Deploy!
-
-## Configuration
-See `railway.toml` for:
-- Memory limits
-- Health checks
-- Restart policies
-- Scaling options
\ No newline at end of file
diff --git a/deploy/railway/button.json b/deploy/railway/button.json
deleted file mode 100644
index 1fc52167..00000000
--- a/deploy/railway/button.json
+++ /dev/null
@@ -1,33 +0,0 @@
-{
-    "name": "Crawl4AI",
-    "description": "LLM Friendly Web Crawler & Scraper",
-    "render": {
-      "dockerfile": {
-        "path": "Dockerfile"
-      }
-    },
-    "env": [
-      {
-        "key": "INSTALL_TYPE",
-        "description": "Installation type (basic/all)",
-        "default": "basic",
-        "required": true
-      },
-      {
-        "key": "ENABLE_GPU",
-        "description": "Enable GPU support",
-        "default": "false",
-        "required": false
-      }
-    ],
-    "services": [
-      {
-        "name": "web",
-        "dockerfile": "./Dockerfile",
-        "healthcheck": {
-          "path": "/health",
-          "port": 11235
-        }
-      }
-    ]
-  }
\ No newline at end of file
diff --git a/deploy/railway/railway.toml b/deploy/railway/railway.toml
deleted file mode 100644
index f24d8fab..00000000
--- a/deploy/railway/railway.toml
+++ /dev/null
@@ -1,18 +0,0 @@
-# railway.toml
-[build]
-builder = "DOCKERFILE"
-dockerfilePath = "Dockerfile"
-
-[deploy]
-startCommand = "uvicorn main:app --host 0.0.0.0 --port $PORT"
-healthcheckPath = "/health"
-restartPolicyType = "ON_FAILURE"
-restartPolicyMaxRetries = 3
-
-[deploy.memory]
-soft = 2048 # 2GB min for Playwright
-hard = 4096 # 4GB max
-
-[deploy.scaling]
-min = 1
-max = 1
diff --git a/pages/app.css b/pages/app.css
deleted file mode 100644
index 0e94a2e5..00000000
--- a/pages/app.css
+++ /dev/null
@@ -1,131 +0,0 @@
-:root {
-    --ifm-font-size-base: 100%;
-    --ifm-line-height-base: 1.65;
-    --ifm-font-family-base: system-ui, -apple-system, Segoe UI, Roboto, Ubuntu, Cantarell, Noto Sans, sans-serif,
-        BlinkMacSystemFont, "Segoe UI", Helvetica, Arial, sans-serif, "Apple Color Emoji", "Segoe UI Emoji",
-        "Segoe UI Symbol";
-}
-html {
-    -webkit-font-smoothing: antialiased;
-    -webkit-text-size-adjust: 100%;
-    text-size-adjust: 100%;
-    font: var(--ifm-font-size-base) / var(--ifm-line-height-base) var(--ifm-font-family-base);
-}
-body {
-    background-color: #1a202c;
-    color: #fff;
-}
-.tab-content {
-    max-height: 400px;
-    overflow: auto;
-}
-pre {
-    white-space: pre-wrap;
-    font-size: 14px;
-}
-pre code {
-    width: 100%;
-}
-
-/* Custom styling for docs-item class and Markdown generated elements */
-.docs-item {
-    background-color: #2d3748; /* bg-gray-800 */
-    padding: 1rem; /* p-4 */
-    border-radius: 0.375rem; /* rounded */
-    box-shadow: 0 4px 6px rgba(0, 0, 0, 0.1); /* shadow-md */
-    margin-bottom: 1rem; /* space between items */
-    line-height: 1.5; /* leading-normal */
-}
-
-.docs-item h3,
-.docs-item h4 {
-    color: #ffffff; /* text-white */
-    font-size: 1.25rem; /* text-xl */
-    font-weight: 700; /* font-bold */
-    margin-bottom: 0.5rem; /* mb-2 */
-}
-.docs-item h4 {
-    font-size: 1rem; /* text-xl */
-}
-
-.docs-item p {
-    color: #e2e8f0; /* text-gray-300 */
-    margin-bottom: 0.5rem; /* mb-2 */
-}
-
-.docs-item code {
-    background-color: #1a202c; /* bg-gray-900 */
-    color: #e2e8f0; /* text-gray-300 */
-    padding: 0.25rem 0.5rem; /* px-2 py-1 */
-    border-radius: 0.25rem; /* rounded */
-    font-size: 0.875rem; /* text-sm */
-}
-
-.docs-item pre {
-    background-color: #1a202c; /* bg-gray-900 */
-    color: #e2e8f0; /* text-gray-300 */
-    padding: 0.5rem; /* p-2 */
-    border-radius: 0.375rem; /* rounded */
-    overflow: auto; /* overflow-auto */
-    margin-bottom: 0.5rem; /* mb-2 */
-}
-
-.docs-item div {
-    color: #e2e8f0; /* text-gray-300 */
-    font-size: 1rem; /* prose prose-sm */
-    line-height: 1.25rem; /* line-height for readability */
-}
-
-/* Adjustments to make prose class more suitable for dark mode */
-.prose {
-    max-width: none; /* max-w-none */
-}
-
-.prose p,
-.prose ul {
-    margin-bottom: 1rem; /* mb-4 */
-}
-
-.prose code {
-    /* background-color: #4a5568; */ /* bg-gray-700 */
-    color: #65a30d; /* text-white */
-    padding: 0.25rem 0.5rem; /* px-1 py-0.5 */
-    border-radius: 0.25rem; /* rounded */
-    display: inline-block; /* inline-block */
-}
-
-.prose pre {
-    background-color: #1a202c; /* bg-gray-900 */
-    color: #ffffff; /* text-white */
-    padding: 0.5rem; /* p-2 */
-    border-radius: 0.375rem; /* rounded */
-}
-
-.prose h3 {
-    color: #65a30d; /* text-white */
-    font-size: 1.25rem; /* text-xl */
-    font-weight: 700; /* font-bold */
-    margin-bottom: 0.5rem; /* mb-2 */
-}
-
-body {
-    background-color: #1a1a1a;
-    color: #b3ff00;
-}
-.sidebar {
-    color: #b3ff00;
-    border-right: 1px solid #333;
-}
-.sidebar a {
-    color: #b3ff00;
-    text-decoration: none;
-}
-.sidebar a:hover {
-    background-color: #555;
-}
-.content-section {
-    display: none;
-}
-.content-section.active {
-    display: block;
-}
diff --git a/pages/app.js b/pages/app.js
deleted file mode 100644
index 098008ab..00000000
--- a/pages/app.js
+++ /dev/null
@@ -1,356 +0,0 @@
-// JavaScript to manage dynamic form changes and logic
-document.getElementById("extraction-strategy-select").addEventListener("change", function () {
-    const strategy = this.value;
-    const providerModelSelect = document.getElementById("provider-model-select");
-    const tokenInput = document.getElementById("token-input");
-    const instruction = document.getElementById("instruction");
-    const semantic_filter = document.getElementById("semantic_filter");
-    const instruction_div = document.getElementById("instruction_div");
-    const semantic_filter_div = document.getElementById("semantic_filter_div");
-    const llm_settings = document.getElementById("llm_settings");
-
-    if (strategy === "LLMExtractionStrategy") {
-        // providerModelSelect.disabled = false;
-        // tokenInput.disabled = false;
-        // semantic_filter.disabled = true;
-        // instruction.disabled = false;
-        llm_settings.classList.remove("hidden");
-        instruction_div.classList.remove("hidden");
-        semantic_filter_div.classList.add("hidden");
-    } else if (strategy === "NoExtractionStrategy") {
-        semantic_filter_div.classList.add("hidden");
-        instruction_div.classList.add("hidden");
-        llm_settings.classList.add("hidden");
-    } else {
-        // providerModelSelect.disabled = true;
-        // tokenInput.disabled = true;
-        // semantic_filter.disabled = false;
-        // instruction.disabled = true;
-        llm_settings.classList.add("hidden");
-        instruction_div.classList.add("hidden");
-        semantic_filter_div.classList.remove("hidden");
-    }
-
-
-});
-
-// Get the selected provider model and token from local storage
-const storedProviderModel = localStorage.getItem("provider_model");
-const storedToken = localStorage.getItem(storedProviderModel);
-
-if (storedProviderModel) {
-    document.getElementById("provider-model-select").value = storedProviderModel;
-}
-
-if (storedToken) {
-    document.getElementById("token-input").value = storedToken;
-}
-
-// Handle provider model dropdown change
-document.getElementById("provider-model-select").addEventListener("change", () => {
-    const selectedProviderModel = document.getElementById("provider-model-select").value;
-    const storedToken = localStorage.getItem(selectedProviderModel);
-
-    if (storedToken) {
-        document.getElementById("token-input").value = storedToken;
-    } else {
-        document.getElementById("token-input").value = "";
-    }
-});
-
-// Fetch total count from the database
-axios
-    .get("/total-count")
-    .then((response) => {
-        document.getElementById("total-count").textContent = response.data.count;
-    })
-    .catch((error) => console.error(error));
-
-// Handle crawl button click
-document.getElementById("crawl-btn").addEventListener("click", () => {
-    // validate input to have both URL and API token
-    // if selected extraction strategy is LLMExtractionStrategy, then API token is required
-    if (document.getElementById("extraction-strategy-select").value === "LLMExtractionStrategy") {
-        if (!document.getElementById("url-input").value || !document.getElementById("token-input").value) {
-            alert("Please enter both URL(s) and API token.");
-            return;
-        }
-    }
-
-    const selectedProviderModel = document.getElementById("provider-model-select").value;
-    const apiToken = document.getElementById("token-input").value;
-    const extractBlocks = document.getElementById("extract-blocks-checkbox").checked;
-    const bypassCache = document.getElementById("bypass-cache-checkbox").checked;
-
-    // Save the selected provider model and token to local storage
-    localStorage.setItem("provider_model", selectedProviderModel);
-    localStorage.setItem(selectedProviderModel, apiToken);
-
-    const urlsInput = document.getElementById("url-input").value;
-    const urls = urlsInput.split(",").map((url) => url.trim());
-    const data = {
-        urls: urls,
-        include_raw_html: true,
-        bypass_cache: bypassCache,
-        extract_blocks: extractBlocks,
-        word_count_threshold: parseInt(document.getElementById("threshold").value),
-        extraction_strategy: document.getElementById("extraction-strategy-select").value,
-        extraction_strategy_args: {
-            provider: selectedProviderModel,
-            api_token: apiToken,
-            instruction: document.getElementById("instruction").value,
-            semantic_filter: document.getElementById("semantic_filter").value,
-        },
-        chunking_strategy: document.getElementById("chunking-strategy-select").value,
-        chunking_strategy_args: {},
-        css_selector: document.getElementById("css-selector").value,
-        screenshot: document.getElementById("screenshot-checkbox").checked,
-        // instruction: document.getElementById("instruction").value,
-        // semantic_filter: document.getElementById("semantic_filter").value,
-        verbose: true,
-    };
-
-    // import requests
-
-    // data = {
-    //   "urls": [
-    //     "https://www.nbcnews.com/business"
-    //   ],
-    //   "word_count_threshold": 10,
-    //   "extraction_strategy": "NoExtractionStrategy",
-    // }
-    
-    // response = requests.post("https://crawl4ai.com/crawl", json=data) # OR local host if your run locally 
-    // print(response.json())
-
-    // save api token to local storage
-    localStorage.setItem("api_token", document.getElementById("token-input").value);
-
-    document.getElementById("loading").classList.remove("hidden");
-    document.getElementById("result").style.visibility = "hidden";
-    document.getElementById("code_help").style.visibility = "hidden";
-
-    axios
-        .post("/crawl", data)
-        .then((response) => {
-            const result = response.data.results[0];
-            const parsedJson = JSON.parse(result.extracted_content);
-            document.getElementById("json-result").textContent = JSON.stringify(parsedJson, null, 2);
-            document.getElementById("cleaned-html-result").textContent = result.cleaned_html;
-            document.getElementById("markdown-result").textContent = result.markdown;
-            document.getElementById("media-result").textContent = JSON.stringify( result.media, null, 2);
-            if (result.screenshot){
-                const imgElement = document.createElement("img");
-                // Set the src attribute with the base64 data
-                imgElement.src = `data:image/png;base64,${result.screenshot}`;
-                document.getElementById("screenshot-result").innerHTML = "";
-                document.getElementById("screenshot-result").appendChild(imgElement);
-            }
-            
-            // Update code examples dynamically
-            const extractionStrategy = data.extraction_strategy;
-            const isLLMExtraction = extractionStrategy === "LLMExtractionStrategy";
-
-            // REMOVE API TOKEN FROM CODE EXAMPLES
-            data.extraction_strategy_args.api_token = "your_api_token";
-
-            if (data.extraction_strategy === "NoExtractionStrategy") {
-                delete data.extraction_strategy_args;
-                delete data.extrac_blocks;
-            }
-
-            if (data.chunking_strategy === "RegexChunking") {
-                delete data.chunking_strategy_args;
-            }
-
-            delete data.verbose;
-
-            if (data.css_selector === "") {
-                delete data.css_selector;
-            }
-
-            if (!data.bypass_cache) {
-                delete data.bypass_cache;
-            }
-
-            if (!data.extract_blocks) {
-                delete data.extract_blocks;
-            }
-
-            if (!data.include_raw_html) {
-                delete data.include_raw_html;
-            }
-
-            document.getElementById(
-                "curl-code"
-            ).textContent = `curl -X POST -H "Content-Type: application/json" -d '${JSON.stringify({
-                ...data,
-                api_token: isLLMExtraction ? "your_api_token" : undefined,
-            }, null, 2)}' https://crawl4ai.com/crawl`;
-
-            document.getElementById("python-code").textContent = `import requests\n\ndata = ${JSON.stringify(
-                { ...data, api_token: isLLMExtraction ? "your_api_token" : undefined },
-                null,
-                2
-            )}\n\nresponse = requests.post("https://crawl4ai.com/crawl", json=data) # OR local host if your run locally \nprint(response.json())`;
-
-            document.getElementById(
-                "nodejs-code"
-            ).textContent = `const axios = require('axios');\n\nconst data = ${JSON.stringify(
-                { ...data, api_token: isLLMExtraction ? "your_api_token" : undefined },
-                null,
-                2
-            )};\n\naxios.post("https://crawl4ai.com/crawl", data) // OR local host if your run locally \n    .then(response => console.log(response.data))\n    .catch(error => console.error(error));`;
-
-            document.getElementById(
-                "library-code"
-            ).textContent = `from crawl4ai.web_crawler import WebCrawler\nfrom crawl4ai.extraction_strategy import *\nfrom crawl4ai.chunking_strategy import *\n\ncrawler = WebCrawler()\ncrawler.warmup()\n\nresult = crawler.run(\n    url='${
-                urls[0]
-            }',\n    word_count_threshold=${data.word_count_threshold},\n    extraction_strategy=${
-                isLLMExtraction
-                    ? `${extractionStrategy}(provider="${data.provider_model}", api_token="${data.api_token}")`
-                    : extractionStrategy + "()"
-            },\n    chunking_strategy=${data.chunking_strategy}(),\n    bypass_cache=${
-                data.bypass_cache
-            },\n    css_selector="${data.css_selector}"\n)\nprint(result)`;
-
-            // Highlight code syntax
-            hljs.highlightAll();
-
-            // Select JSON tab by default
-            document.querySelector('.tab-btn[data-tab="json"]').click();
-
-            document.getElementById("loading").classList.add("hidden");
-
-            document.getElementById("result").style.visibility = "visible";
-            document.getElementById("code_help").style.visibility = "visible";
-
-            // increment the total count
-            document.getElementById("total-count").textContent =
-                parseInt(document.getElementById("total-count").textContent) + 1;
-        })
-        .catch((error) => {
-            console.error(error);
-            document.getElementById("loading").classList.add("hidden");
-        });
-});
-
-// Handle tab clicks
-document.querySelectorAll(".tab-btn").forEach((btn) => {
-    btn.addEventListener("click", () => {
-        const tab = btn.dataset.tab;
-        document.querySelectorAll(".tab-btn").forEach((b) => b.classList.remove("bg-lime-700", "text-white"));
-        btn.classList.add("bg-lime-700", "text-white");
-        document.querySelectorAll(".tab-content.code pre").forEach((el) => el.classList.add("hidden"));
-        document.getElementById(`${tab}-result`).parentElement.classList.remove("hidden");
-    });
-});
-
-// Handle code tab clicks
-document.querySelectorAll(".code-tab-btn").forEach((btn) => {
-    btn.addEventListener("click", () => {
-        const tab = btn.dataset.tab;
-        document.querySelectorAll(".code-tab-btn").forEach((b) => b.classList.remove("bg-lime-700", "text-white"));
-        btn.classList.add("bg-lime-700", "text-white");
-        document.querySelectorAll(".tab-content.result pre").forEach((el) => el.classList.add("hidden"));
-        document.getElementById(`${tab}-code`).parentElement.classList.remove("hidden");
-    });
-});
-
-// Handle copy to clipboard button clicks
-
-async function copyToClipboard(text) {
-    if (navigator.clipboard && navigator.clipboard.writeText) {
-        return navigator.clipboard.writeText(text);
-    } else {
-        return fallbackCopyTextToClipboard(text);
-    }
-}
-
-function fallbackCopyTextToClipboard(text) {
-    return new Promise((resolve, reject) => {
-        const textArea = document.createElement("textarea");
-        textArea.value = text;
-
-        // Avoid scrolling to bottom
-        textArea.style.top = "0";
-        textArea.style.left = "0";
-        textArea.style.position = "fixed";
-
-        document.body.appendChild(textArea);
-        textArea.focus();
-        textArea.select();
-
-        try {
-            const successful = document.execCommand("copy");
-            if (successful) {
-                resolve();
-            } else {
-                reject();
-            }
-        } catch (err) {
-            reject(err);
-        }
-
-        document.body.removeChild(textArea);
-    });
-}
-
-document.querySelectorAll(".copy-btn").forEach((btn) => {
-    btn.addEventListener("click", () => {
-        const target = btn.dataset.target;
-        const code = document.getElementById(target).textContent;
-        //navigator.clipboard.writeText(code).then(() => {
-        copyToClipboard(code).then(() => {
-            btn.textContent = "Copied!";
-            setTimeout(() => {
-                btn.textContent = "Copy";
-            }, 2000);
-        });
-    });
-});
-
-document.addEventListener("DOMContentLoaded", async () => {
-    try {
-        const extractionResponse = await fetch("/strategies/extraction");
-        const extractionStrategies = await extractionResponse.json();
-
-        const chunkingResponse = await fetch("/strategies/chunking");
-        const chunkingStrategies = await chunkingResponse.json();
-
-        renderStrategies("extraction-strategies", extractionStrategies);
-        renderStrategies("chunking-strategies", chunkingStrategies);
-    } catch (error) {
-        console.error("Error fetching strategies:", error);
-    }
-});
-
-function renderStrategies(containerId, strategies) {
-    const container = document.getElementById(containerId);
-    container.innerHTML = ""; // Clear any existing content
-    strategies = JSON.parse(strategies);
-    Object.entries(strategies).forEach(([strategy, description]) => {
-        const strategyElement = document.createElement("div");
-        strategyElement.classList.add("bg-zinc-800", "p-4", "rounded", "shadow-md", "docs-item");
-
-        const strategyDescription = document.createElement("div");
-        strategyDescription.classList.add("text-gray-300", "prose", "prose-sm");
-        strategyDescription.innerHTML = marked.parse(description);
-
-        strategyElement.appendChild(strategyDescription);
-
-        container.appendChild(strategyElement);
-    });
-}
-document.querySelectorAll(".sidebar a").forEach((link) => {
-    link.addEventListener("click", function (event) {
-        event.preventDefault();
-        document.querySelectorAll(".content-section").forEach((section) => {
-            section.classList.remove("active");
-        });
-        const target = event.target.getAttribute("data-target");
-        document.getElementById(target).classList.add("active");
-    });
-});
-// Highlight code syntax
-hljs.highlightAll();
diff --git a/pages/index copy.html b/pages/index copy.html
deleted file mode 100644
index b61b7298..00000000
--- a/pages/index copy.html	
+++ /dev/null
@@ -1,971 +0,0 @@
-<!DOCTYPE html>
-<html lang="en">
-    <head>
-        <meta charset="UTF-8" />
-        <meta name="viewport" content="width=device-width, initial-scale=1.0" />
-        <title>Crawl4AI</title>
-
-        <link rel="preconnect" href="https://fonts.googleapis.com" />
-        <link rel="preconnect" href="https://fonts.gstatic.com" crossorigin />
-        <link href="https://fonts.googleapis.com/css2?family=Inter:wght@100..900&display=swap" rel="stylesheet" />
-
-        <!-- <link href="https://cdn.jsdelivr.net/npm/tailwindcss@3.4.3/dist/tailwind.min.css" rel="stylesheet" /> -->
-        <script src="https://cdn.tailwindcss.com"></script>
-        <script src="https://cdn.jsdelivr.net/npm/axios/dist/axios.min.js"></script>
-        <link
-            rel="stylesheet"
-            href="https://cdnjs.cloudflare.com/ajax/libs/highlight.js/11.7.0/styles/monokai.min.css"
-        />
-        <script src="https://cdn.jsdelivr.net/npm/marked/marked.min.js"></script>
-
-        <script src="https://cdnjs.cloudflare.com/ajax/libs/highlight.js/11.7.0/highlight.min.js"></script>
-        <style>
-            :root {
-                --ifm-font-size-base: 100%;
-                --ifm-line-height-base: 1.65;
-                --ifm-font-family-base: system-ui, -apple-system, Segoe UI, Roboto, Ubuntu, Cantarell, Noto Sans,
-                    sans-serif, BlinkMacSystemFont, "Segoe UI", Helvetica, Arial, sans-serif, "Apple Color Emoji",
-                    "Segoe UI Emoji", "Segoe UI Symbol";
-            }
-            html {
-                -webkit-font-smoothing: antialiased;
-                -webkit-text-size-adjust: 100%;
-                text-size-adjust: 100%;
-                font: var(--ifm-font-size-base) / var(--ifm-line-height-base) var(--ifm-font-family-base);
-            }
-            body {
-                background-color: #1a202c;
-                color: #fff;
-            }
-            .tab-content {
-                max-height: 400px;
-                overflow: auto;
-            }
-            pre {
-                white-space: pre-wrap;
-                font-size: 14px;
-            }
-            pre code {
-                width: 100%;
-            }
-        </style>
-        <style>
-            /* Custom styling for docs-item class and Markdown generated elements */
-            .docs-item {
-                background-color: #2d3748; /* bg-gray-800 */
-                padding: 1rem; /* p-4 */
-                border-radius: 0.375rem; /* rounded */
-                box-shadow: 0 4px 6px rgba(0, 0, 0, 0.1); /* shadow-md */
-                margin-bottom: 1rem; /* space between items */
-            }
-
-            .docs-item h3,
-            .docs-item h4 {
-                color: #ffffff; /* text-white */
-                font-size: 1.25rem; /* text-xl */
-                font-weight: 700; /* font-bold */
-                margin-bottom: 0.5rem; /* mb-2 */
-            }
-
-            .docs-item p {
-                color: #e2e8f0; /* text-gray-300 */
-                margin-bottom: 0.5rem; /* mb-2 */
-            }
-
-            .docs-item code {
-                background-color: #1a202c; /* bg-gray-900 */
-                color: #e2e8f0; /* text-gray-300 */
-                padding: 0.25rem 0.5rem; /* px-2 py-1 */
-                border-radius: 0.25rem; /* rounded */
-            }
-
-            .docs-item pre {
-                background-color: #1a202c; /* bg-gray-900 */
-                color: #e2e8f0; /* text-gray-300 */
-                padding: 0.5rem; /* p-2 */
-                border-radius: 0.375rem; /* rounded */
-                overflow: auto; /* overflow-auto */
-                margin-bottom: 0.5rem; /* mb-2 */
-            }
-
-            .docs-item div {
-                color: #e2e8f0; /* text-gray-300 */
-                font-size: 1rem; /* prose prose-sm */
-                line-height: 1.25rem; /* line-height for readability */
-            }
-
-            /* Adjustments to make prose class more suitable for dark mode */
-            .prose {
-                max-width: none; /* max-w-none */
-            }
-
-            .prose p,
-            .prose ul {
-                margin-bottom: 1rem; /* mb-4 */
-            }
-
-            .prose code {
-                /* background-color: #4a5568; */ /* bg-gray-700 */
-                color: #65a30d; /* text-white */
-                padding: 0.25rem 0.5rem; /* px-1 py-0.5 */
-                border-radius: 0.25rem; /* rounded */
-                display: inline-block; /* inline-block */
-            }
-
-            .prose pre {
-                background-color: #1a202c; /* bg-gray-900 */
-                color: #ffffff; /* text-white */
-                padding: 0.5rem; /* p-2 */
-                border-radius: 0.375rem; /* rounded */
-            }
-
-            .prose h3 {
-                color: #65a30d; /* text-white */
-                font-size: 1.25rem; /* text-xl */
-                font-weight: 700; /* font-bold */
-                margin-bottom: 0.5rem; /* mb-2 */
-            }
-        </style>
-    </head>
-    <body class="bg-black text-gray-200">
-        <header class="bg-zinc-950 text-white py-4 flex">
-            <div class="mx-auto px-4">
-                <h1 class="text-2xl font-bold">🔥🕷️ Crawl4AI: Web Data for your Thoughts</h1>
-            </div>
-            <div class="mx-auto px-4 flex font-bold text-xl gap-2">
-                <span>📊 Total Website Processed</span>
-                <span id="total-count" class="text-lime-400">2</span>
-            </div>
-        </header>
-
-        <section class="try-it py-8 px-16 pb-20">
-            <div class="container mx-auto px-4">
-                <h2 class="text-2xl font-bold mb-4">Try It Now</h2>
-                <div class="grid grid-cols-1 lg:grid-cols-3 gap-4">
-                    <div class="space-y-4">
-                        <div class="flex flex-col">
-                            <label for="url-input" class="text-lime-500 font-bold text-xs">URL(s)</label>
-                            <input
-                                type="text"
-                                id="url-input"
-                                value="https://www.nbcnews.com/business"
-                                class="border border-zinc-700 rounded px-4 py-0 bg-zinc-900 text-lime-500"
-                                placeholder="Enter URL(s) separated by commas"
-                            />
-                        </div>
-                        <div class="flex flex-col">
-                            <label for="threshold" class="text-lime-500 font-bold text-xs">Min Words Threshold</label>
-                            <select
-                                id="threshold"
-                                class="border border-zinc-700 rounded px-4 py-0 bg-zinc-900 text-lime-500"
-                            >
-                                <option value="5">5</option>
-                                <option value="10" selected>10</option>
-                                <option value="15">15</option>
-                                <option value="20">20</option>
-                                <option value="25">25</option>
-                            </select>
-                        </div>
-                        <div class="flex flex-col">
-                            <label for="css-selector" class="text-lime-500 font-bold text-xs">CSS Selector</label>
-                            <input
-                                type="text"
-                                id="css-selector"
-                                class="border border-zinc-700 rounded px-4 py-0 bg-zinc-900 text-lime-500"
-                                placeholder="Enter CSS Selector"
-                            />
-                        </div>
-                        <div class="flex flex-col">
-                            <label for="extraction-strategy-select" class="text-lime-500 font-bold text-xs"
-                                >Extraction Strategy</label
-                            >
-                            <select
-                                id="extraction-strategy-select"
-                                class="border border-zinc-700 rounded px-4 py-1 bg-zinc-900 text-lime-500"
-                            >
-                                <option value="CosineStrategy">CosineStrategy</option>
-                                <option value="LLMExtractionStrategy">LLMExtractionStrategy</option>
-                                <option value="NoExtractionStrategy">NoExtractionStrategy</option>
-                            </select>
-                        </div>
-                        <div class="flex flex-col">
-                            <label for="chunking-strategy-select" class="text-lime-500 font-bold text-xs"
-                                >Chunking Strategy</label
-                            >
-                            <select
-                                id="chunking-strategy-select"
-                                class="border border-zinc-700 rounded px-4 py-1 bg-zinc-900 text-lime-500"
-                            >
-                                <option value="RegexChunking">RegexChunking</option>
-                                <option value="NlpSentenceChunking">NlpSentenceChunking</option>
-                                <option value="TopicSegmentationChunking">TopicSegmentationChunking</option>
-                                <option value="FixedLengthWordChunking">FixedLengthWordChunking</option>
-                                <option value="SlidingWindowChunking">SlidingWindowChunking</option>
-                            </select>
-                        </div>
-                        <div class="flex flex-col">
-                            <label for="provider-model-select" class="text-lime-500 font-bold text-xs"
-                                >Provider Model</label
-                            >
-                            <select
-                                id="provider-model-select"
-                                class="border border-zinc-700 rounded px-4 py-0 bg-zinc-900 text-lime-500"
-                                disabled
-                            >
-                                <option value="groq/llama3-70b-8192">groq/llama3-70b-8192</option>
-                                <option value="groq/llama3-8b-8192">groq/llama3-8b-8192</option>
-                                <option value="openai/gpt-4-turbo">gpt-4-turbo</option>
-                                <option value="openai/gpt-3.5-turbo">gpt-3.5-turbo</option>
-                                <option value="anthropic/claude-3-haiku-20240307">claude-3-haiku</option>
-                                <option value="anthropic/claude-3-opus-20240229">claude-3-opus</option>
-                                <option value="anthropic/claude-3-sonnet-20240229">claude-3-sonnet</option>
-                            </select>
-                        </div>
-                        <div class="flex flex-col">
-                            <label for="token-input" class="text-lime-500 font-bold text-xs">API Token</label>
-                            <input
-                                type="password"
-                                id="token-input"
-                                class="border border-zinc-700 rounded px-4 py-0 bg-zinc-900 text-lime-500"
-                                placeholder="Enter Groq API token"
-                                disabled
-                            />
-                        </div>
-                        <div class="flex gap-3">
-                            <div class="flex items-center gap-2">
-                                <input type="checkbox" id="bypass-cache-checkbox" />
-                                <label for="bypass-cache-checkbox" class="text-lime-500 font-bold">Bypass Cache</label>
-                            </div>
-                            <div class="flex items-center gap-2">
-                                <input type="checkbox" id="extract-blocks-checkbox" checked />
-                                <label for="extract-blocks-checkbox" class="text-lime-500 font-bold"
-                                    >Extract Blocks</label
-                                >
-                            </div>
-                            <button id="crawl-btn" class="bg-lime-600 text-black font-bold px-4 py-0 rounded">
-                                Crawl
-                            </button>
-                        </div>
-                    </div>
-
-                    <div id="result" class=" ">
-                        <div id="loading" class="hidden">
-                            <p class="text-white">Loading... Please wait.</p>
-                        </div>
-                        <div class="tab-buttons flex gap-2">
-                            <button
-                                class="tab-btn px-4 py-1 text-sm bg-zinc-700 rounded-t text-lime-500"
-                                data-tab="json"
-                            >
-                                JSON
-                            </button>
-                            <button
-                                class="tab-btn px-4 py-1 text-sm bg-zinc-700 rounded-t text-lime-500"
-                                data-tab="cleaned-html"
-                            >
-                                Cleaned HTML
-                            </button>
-                            <button
-                                class="tab-btn px-4 py-1 text-sm bg-zinc-700 rounded-t text-lime-500"
-                                data-tab="markdown"
-                            >
-                                Markdown
-                            </button>
-                        </div>
-                        <div class="tab-content code bg-zinc-900 p-2 rounded h-full border border-zinc-700 text-sm">
-                            <pre class="h-full flex"><code id="json-result" class="language-json"></code></pre>
-                            <pre
-                                class="hidden h-full flex"
-                            ><code id="cleaned-html-result" class="language-html"></code></pre>
-                            <pre
-                                class="hidden h-full flex"
-                            ><code id="markdown-result" class="language-markdown"></code></pre>
-                        </div>
-                    </div>
-
-                    <div id="code_help" class=" ">
-                        <div class="tab-buttons flex gap-2">
-                            <button
-                                class="code-tab-btn px-4 py-1 text-sm bg-zinc-700 rounded-t text-lime-500"
-                                data-tab="curl"
-                            >
-                                cURL
-                            </button>
-                            <button
-                                class="code-tab-btn px-4 py-1 text-sm bg-zinc-700 rounded-t text-lime-500"
-                                data-tab="library"
-                            >
-                                Python Library
-                            </button>
-                            <button
-                                class="code-tab-btn px-4 py-1 text-sm bg-zinc-700 rounded-t text-lime-500"
-                                data-tab="python"
-                            >
-                                Python (Request)
-                            </button>
-                            <button
-                                class="code-tab-btn px-4 py-1 text-sm bg-zinc-700 rounded-t text-lime-500"
-                                data-tab="nodejs"
-                            >
-                                Node.js
-                            </button>
-                        </div>
-                        <div class="tab-content result bg-zinc-900 p-2 rounded h-full border border-zinc-700 text-sm">
-                            <pre class="h-full flex relative">
-                                <code id="curl-code" class="language-bash"></code>
-                                <button class="absolute top-2 right-2 bg-zinc-700 text-white px-2 py-1 rounded copy-btn" data-target="curl-code">Copy</button>
-                            </pre>
-                            <pre class="hidden h-full flex relative">
-                                <code id="python-code" class="language-python"></code>
-                                <button class="absolute top-2 right-2 bg-zinc-700 text-white px-2 py-1 rounded copy-btn" data-target="python-code">Copy</button>
-                            </pre>
-                            <pre class="hidden h-full flex relative">
-                                <code id="nodejs-code" class="language-javascript"></code>
-                                <button class="absolute top-2 right-2 bg-zinc-700 text-white px-2 py-1 rounded copy-btn" data-target="nodejs-code">Copy</button>
-                            </pre>
-                            <pre class="hidden h-full flex relative">
-                                <code id="library-code" class="language-python"></code>
-                                <button class="absolute top-2 right-2 bg-zinc-700 text-white px-2 py-1 rounded copy-btn" data-target="library-code">Copy</button>
-                            </pre>
-                        </div>
-                    </div>
-                </div>
-            </div>
-        </section>
-        <section class="bg-zinc-900 text-zinc-300 p-6 px-20">
-            <div class="grid grid-cols-2 gap-4 p-4 bg-zinc-900 text-lime-500">
-                <!-- Step 1 -->
-                <div class="col-span-2 bg-yellow-500 p-2 rounded text-zinc-900">
-                    🌟 <strong>Welcome to the Crawl4ai Quickstart Guide! Let's dive into some web crawling fun!</strong>
-                </div>
-                <div class="bg-zinc-800 p-2 rounded">
-                    First Step: Create an instance of WebCrawler and call the <code>warmup()</code> function.
-                </div>
-                <div>
-                    <pre><code class="language-python">crawler = WebCrawler()
-            crawler.warmup()</code></pre>
-                </div>
-
-                <!-- Step 2 -->
-                <div class="col-span-2 bg-yellow-500 p-2 rounded text-zinc-900">
-                    🧠 <strong>Understanding 'bypass_cache' and 'include_raw_html' parameters:</strong>
-                </div>
-                <div class="bg-zinc-800 p-2 rounded">First crawl (caches the result):</div>
-                <div>
-                    <pre><code class="language-python">result = crawler.run(url="https://www.nbcnews.com/business")</code></pre>
-                </div>
-                <div class="bg-zinc-800 p-2 rounded">Second crawl (Force to crawl again):</div>
-                <div>
-                    <pre><code class="language-python">result = crawler.run(url="https://www.nbcnews.com/business", bypass_cache=True)</code></pre>
-                </div>
-                <div class="bg-zinc-800 p-2 rounded">Crawl result without raw HTML content:</div>
-                <div>
-                    <pre><code class="language-python">result = crawler.run(url="https://www.nbcnews.com/business", include_raw_html=False)</code></pre>
-                </div>
-
-                <!-- Step 3 -->
-                <div class="col-span-2 bg-yellow-500 p-2 rounded text-zinc-900">
-                    📄
-                    <strong
-                        >The 'include_raw_html' parameter, when set to True, includes the raw HTML content in the
-                        response. By default, it is set to True.</strong
-                    >
-                </div>
-                <div class="bg-zinc-800 p-2 rounded">Set <code>always_by_pass_cache</code> to True:</div>
-                <div>
-                    <pre><code class="language-python">crawler.always_by_pass_cache = True</code></pre>
-                </div>
-
-                <!-- Step 4 -->
-                <div class="col-span-2 bg-yellow-500 p-2 rounded text-zinc-900">
-                    🧩 <strong>Let's add a chunking strategy: RegexChunking!</strong>
-                </div>
-                <div class="bg-zinc-800 p-2 rounded">Using RegexChunking:</div>
-                <div>
-                    <pre><code class="language-python">result = crawler.run(
-                url="https://www.nbcnews.com/business",
-                chunking_strategy=RegexChunking(patterns=["\n\n"])
-            )</code></pre>
-                </div>
-                <div class="bg-zinc-800 p-2 rounded">Using NlpSentenceChunking:</div>
-                <div>
-                    <pre><code class="language-python">result = crawler.run(
-                url="https://www.nbcnews.com/business",
-                chunking_strategy=NlpSentenceChunking()
-            )</code></pre>
-                </div>
-
-                <!-- Step 5 -->
-                <div class="col-span-2 bg-yellow-500 p-2 rounded text-zinc-900">
-                    🧠 <strong>Let's get smarter with an extraction strategy: CosineStrategy!</strong>
-                </div>
-                <div class="bg-zinc-800 p-2 rounded">Using CosineStrategy:</div>
-                <div>
-                    <pre><code class="language-python">result = crawler.run(
-                url="https://www.nbcnews.com/business",
-                extraction_strategy=CosineStrategy(word_count_threshold=10, max_dist=0.2, linkage_method="ward", top_k=3)
-            )</code></pre>
-                </div>
-
-                <!-- Step 6 -->
-                <div class="col-span-2 bg-yellow-500 p-2 rounded text-zinc-900">
-                    🤖 <strong>Time to bring in the big guns: LLMExtractionStrategy without instructions!</strong>
-                </div>
-                <div class="bg-zinc-800 p-2 rounded">Using LLMExtractionStrategy without instructions:</div>
-                <div>
-                    <pre><code class="language-python">result = crawler.run(
-                url="https://www.nbcnews.com/business",
-                extraction_strategy=LLMExtractionStrategy(provider="openai/gpt-4o", api_token=os.getenv('OPENAI_API_KEY'))
-            )</code></pre>
-                </div>
-
-                <!-- Step 7 -->
-                <div class="col-span-2 bg-yellow-500 p-2 rounded text-zinc-900">
-                    📜 <strong>Let's make it even more interesting: LLMExtractionStrategy with instructions!</strong>
-                </div>
-                <div class="bg-zinc-800 p-2 rounded">Using LLMExtractionStrategy with instructions:</div>
-                <div>
-                    <pre><code class="language-python">result = crawler.run(
-                url="https://www.nbcnews.com/business",
-                extraction_strategy=LLMExtractionStrategy(
-                    provider="openai/gpt-4o",
-                    api_token=os.getenv('OPENAI_API_KEY'),
-                    instruction="I am interested in only financial news"
-                )
-            )</code></pre>
-                </div>
-
-                <!-- Step 8 -->
-                <div class="col-span-2 bg-yellow-500 p-2 rounded text-zinc-900">
-                    🎯 <strong>Targeted extraction: Let's use a CSS selector to extract only H2 tags!</strong>
-                </div>
-                <div class="bg-zinc-800 p-2 rounded">Using CSS selector to extract H2 tags:</div>
-                <div>
-                    <pre><code class="language-python">result = crawler.run(
-                url="https://www.nbcnews.com/business",
-                css_selector="h2"
-            )</code></pre>
-                </div>
-
-                <!-- Step 9 -->
-                <div class="col-span-2 bg-yellow-500 p-2 rounded text-zinc-900">
-                    🖱️ <strong>Let's get interactive: Passing JavaScript code to click 'Load More' button!</strong>
-                </div>
-                <div class="bg-zinc-800 p-2 rounded">Using JavaScript to click 'Load More' button:</div>
-                <div>
-                    <pre><code class="language-python">js_code = """
-            const loadMoreButton = Array.from(document.querySelectorAll('button')).find(button => button.textContent.includes('Load More'));
-            loadMoreButton && loadMoreButton.click();
-            """
-            crawler_strategy = LocalSeleniumCrawlerStrategy(js_code=js_code)
-            crawler = WebCrawler(crawler_strategy=crawler_strategy, always_by_pass_cache=True)
-            result = crawler.run(url="https://www.nbcnews.com/business")</code></pre>
-                </div>
-
-                <!-- Conclusion -->
-                <div class="col-span-2 bg-yellow-500 p-2 rounded text-zinc-900">
-                    🎉
-                    <strong
-                        >Congratulations! You've made it through the Crawl4ai Quickstart Guide! Now go forth and crawl
-                        the web like a pro! 🕸️</strong
-                    >
-                </div>
-            </div>
-        </section>
-        <section class="bg-zinc-900 text-zinc-300 p-6 px-20">
-            <h1 class="text-3xl font-bold mb-4">Installation 💻</h1>
-            <p class="mb-4">
-                There are two ways to use Crawl4AI: as a library in your Python projects or as a standalone local
-                server.
-            </p>
-
-            <p class="mb-4">
-                You can also try Crawl4AI in a Google Colab
-                <a href="https://colab.research.google.com/drive/1wz8u30rvbq6Scodye9AGCw8Qg_Z8QGsk"
-                    ><img
-                        src="https://colab.research.google.com/assets/colab-badge.svg"
-                        alt="Open In Colab"
-                        style="display: inline-block; width: 100px; height: 20px"
-                /></a>
-            </p>
-
-            <h2 class="text-2xl font-bold mb-2">Using Crawl4AI as a Library 📚</h2>
-            <p class="mb-4">To install Crawl4AI as a library, follow these steps:</p>
-
-            <ol class="list-decimal list-inside mb-4">
-                <li class="mb-2">
-                    Install the package from GitHub:
-                    <pre
-                        class="bg-zinc-800 p-4 rounded mt-2 text-zinc-100"
-                    ><code>pip install git+https://github.com/unclecode/crawl4ai.git</code></pre>
-                </li>
-                <li class="mb-2">
-                    Alternatively, you can clone the repository and install the package locally:
-                    <pre
-                        class="bg-zinc-800 p-4 rounded mt-2 text-zinc-100"
-                    ><code  class = "language-python bash">virtualenv venv
-source venv/bin/activate
-git clone https://github.com/unclecode/crawl4ai.git
-cd crawl4ai
-pip install -e .
-        </code></pre>
-                </li>
-                <li>
-                    Import the necessary modules in your Python script:
-                    <pre
-                        class="bg-zinc-800 p-4 rounded mt-2 text-zinc-100"
-                    ><code class = "language-python hljs">from crawl4ai.web_crawler import WebCrawler
-from crawl4ai.chunking_strategy import *
-from crawl4ai.extraction_strategy import *
-import os
-
-crawler = WebCrawler()
-
-# Single page crawl
-single_url = UrlModel(url='https://www.nbcnews.com/business', forced=False)
-result = crawl4ai.fetch_page(
-    url='https://www.nbcnews.com/business',
-    word_count_threshold=5, # Minimum word count for a HTML tag to be considered as a worthy block
-    chunking_strategy= RegexChunking( patterns = ["\\n\\n"]), # Default is RegexChunking
-    extraction_strategy= CosineStrategy(word_count_threshold=10, max_dist=0.2, linkage_method='ward', top_k=3) # Default is CosineStrategy
-    # extraction_strategy= LLMExtractionStrategy(provider= "openai/gpt-4o", api_token = os.getenv('OPENAI_API_KEY')),
-    bypass_cache=False,
-    extract_blocks =True, # Whether to extract semantical blocks of text from the HTML
-    css_selector = "", # Eg: "div.article-body"
-    verbose=True,
-    include_raw_html=True, # Whether to include the raw HTML content in the response
-)
-print(result.model_dump())
-        </code></pre>
-                </li>
-            </ol>
-            <p class="mb-4">
-                For more information about how to run Crawl4AI as a local server, please refer to the
-                <a href="https://github.com/unclecode/crawl4ai" class="text-blue-400">GitHub repository</a>.
-            </p>
-            
-        </section>
-
-        <section class="bg-zinc-900 text-zinc-300 p-6 px-20">
-            <h1 class="text-3xl font-bold mb-4">📖 Parameters</h1>
-            <div class="overflow-x-auto">
-                <table class="min-w-full bg-zinc-800 border border-zinc-700">
-                    <thead>
-                        <tr>
-                            <th class="py-2 px-4 border-b border-zinc-700">Parameter</th>
-                            <th class="py-2 px-4 border-b border-zinc-700">Description</th>
-                            <th class="py-2 px-4 border-b border-zinc-700">Required</th>
-                            <th class="py-2 px-4 border-b border-zinc-700">Default Value</th>
-                        </tr>
-                    </thead>
-                    <tbody>
-                        <tr>
-                            <td class="py-2 px-4 border-b border-zinc-700">urls</td>
-                            <td class="py-2 px-4 border-b border-zinc-700">
-                                A list of URLs to crawl and extract data from.
-                            </td>
-                            <td class="py-2 px-4 border-b border-zinc-700">Yes</td>
-                            <td class="py-2 px-4 border-b border-zinc-700">-</td>
-                        </tr>
-                        <tr>
-                            <td class="py-2 px-4 border-b border-zinc-700">include_raw_html</td>
-                            <td class="py-2 px-4 border-b border-zinc-700">
-                                Whether to include the raw HTML content in the response.
-                            </td>
-                            <td class="py-2 px-4 border-b border-zinc-700">No</td>
-                            <td class="py-2 px-4 border-b border-zinc-700">false</td>
-                        </tr>
-                        <tr>
-                            <td class="py-2 px-4 border-b border-zinc-700">bypass_cache</td>
-                            <td class="py-2 px-4 border-b border-zinc-700">
-                                Whether to force a fresh crawl even if the URL has been previously crawled.
-                            </td>
-                            <td class="py-2 px-4 border-b border-zinc-700">No</td>
-                            <td class="py-2 px-4 border-b border-zinc-700">false</td>
-                        </tr>
-                        <tr>
-                            <td class="py-2 px-4 border-b border-zinc-700">extract_blocks</td>
-                            <td class="py-2 px-4 border-b border-zinc-700">
-                                Whether to extract semantical blocks of text from the HTML.
-                            </td>
-                            <td class="py-2 px-4 border-b border-zinc-700">No</td>
-                            <td class="py-2 px-4 border-b border-zinc-700">true</td>
-                        </tr>
-                        <tr>
-                            <td class="py-2 px-4 border-b border-zinc-700">word_count_threshold</td>
-                            <td class="py-2 px-4 border-b border-zinc-700">
-                                The minimum number of words a block must contain to be considered meaningful (minimum
-                                value is 5).
-                            </td>
-                            <td class="py-2 px-4 border-b border-zinc-700">No</td>
-                            <td class="py-2 px-4 border-b border-zinc-700">5</td>
-                        </tr>
-                        <tr>
-                            <td class="py-2 px-4 border-b border-zinc-700">extraction_strategy</td>
-                            <td class="py-2 px-4 border-b border-zinc-700">
-                                The strategy to use for extracting content from the HTML (e.g., "CosineStrategy").
-                            </td>
-                            <td class="py-2 px-4 border-b border-zinc-700">No</td>
-                            <td class="py-2 px-4 border-b border-zinc-700">CosineStrategy</td>
-                        </tr>
-                        <tr>
-                            <td class="py-2 px-4 border-b border-zinc-700">chunking_strategy</td>
-                            <td class="py-2 px-4 border-b border-zinc-700">
-                                The strategy to use for chunking the text before processing (e.g., "RegexChunking").
-                            </td>
-                            <td class="py-2 px-4 border-b border-zinc-700">No</td>
-                            <td class="py-2 px-4 border-b border-zinc-700">RegexChunking</td>
-                        </tr>
-                        <tr>
-                            <td class="py-2 px-4 border-b border-zinc-700">css_selector</td>
-                            <td class="py-2 px-4 border-b border-zinc-700">
-                                The CSS selector to target specific parts of the HTML for extraction.
-                            </td>
-                            <td class="py-2 px-4 border-b border-zinc-700">No</td>
-                            <td class="py-2 px-4 border-b border-zinc-700">None</td>
-                        </tr>
-                        <tr>
-                            <td class="py-2 px-4">verbose</td>
-                            <td class="py-2 px-4">Whether to enable verbose logging.</td>
-                            <td class="py-2 px-4">No</td>
-                            <td class="py-2 px-4">true</td>
-                        </tr>
-                    </tbody>
-                </table>
-            </div>
-        </section>
-
-        <section id="extraction" class="py-8 px-20">
-            <div class="overflow-x-auto mx-auto px-6">
-                <h2 class="text-2xl font-bold mb-4">Extraction Strategies</h2>
-                <div id="extraction-strategies" class="space-y-4"></div>
-            </div>
-        </section>
-
-        <section id="chunking" class="py-8 px-20">
-            <div class="overflow-x-auto mx-auto px-6">
-                <h2 class="text-2xl font-bold mb-4">Chunking Strategies</h2>
-                <div id="chunking-strategies" class="space-y-4"></div>
-            </div>
-        </section>
-
-        <section class="hero bg-zinc-900 py-8 px-20">
-            <div class="container mx-auto px-4">
-                <h2 class="text-3xl font-bold mb-4">🤔 Why building this?</h2>
-                <p class="text-lg mb-4">
-                    In recent times, we've witnessed a surge of startups emerging, riding the AI hype wave and charging
-                    for services that should rightfully be accessible to everyone. 🌍💸 One such example is scraping and
-                    crawling web pages and transforming them into a format suitable for Large Language Models (LLMs).
-                    🕸️🤖 We believe that building a business around this is not the right approach; instead, it should
-                    definitely be open-source. 🆓🌟 So, if you possess the skills to build such tools and share our
-                    philosophy, we invite you to join our "Robinhood" band and help set these products free for the
-                    benefit of all. 🤝💪
-                </p>
-            </div>
-        </section>
-
-        <section class="installation py-8 px-20">
-            <div class="container mx-auto px-4">
-                <h2 class="text-2xl font-bold mb-4">⚙️ Installation</h2>
-                <p class="mb-4">
-                    To install and run Crawl4AI as a library or a local server, please refer to the 📚
-                    <a href="https://github.com/unclecode/crawl4ai" class="text-blue-400">GitHub repository</a>.
-                </p>
-            </div>
-        </section>
-
-        <footer class="bg-zinc-900 text-white py-4">
-            <div class="container mx-auto px-4">
-                <div class="flex justify-between items-center">
-                    <p>© 2024 Crawl4AI. All rights reserved.</p>
-                    <div class="social-links">
-                        <a
-                            href="https://github.com/unclecode/crawl4ai"
-                            class="text-white hover:text-gray-300 mx-2"
-                            target="_blank"
-                            >😺 GitHub</a
-                        >
-                        <a
-                            href="https://twitter.com/unclecode"
-                            class="text-white hover:text-gray-300 mx-2"
-                            target="_blank"
-                            >🐦 Twitter</a
-                        >
-                    </div>
-                </div>
-            </div>
-        </footer>
-
-        <script>
-            // JavaScript to manage dynamic form changes and logic
-            document.getElementById("extraction-strategy-select").addEventListener("change", function () {
-                const strategy = this.value;
-                const providerModelSelect = document.getElementById("provider-model-select");
-                const tokenInput = document.getElementById("token-input");
-
-                if (strategy === "LLMExtractionStrategy") {
-                    providerModelSelect.disabled = false;
-                    tokenInput.disabled = false;
-                } else {
-                    providerModelSelect.disabled = true;
-                    tokenInput.disabled = true;
-                }
-            });
-
-            // Get the selected provider model and token from local storage
-            const storedProviderModel = localStorage.getItem("provider_model");
-            const storedToken = localStorage.getItem(storedProviderModel);
-
-            if (storedProviderModel) {
-                document.getElementById("provider-model-select").value = storedProviderModel;
-            }
-
-            if (storedToken) {
-                document.getElementById("token-input").value = storedToken;
-            }
-
-            // Handle provider model dropdown change
-            document.getElementById("provider-model-select").addEventListener("change", () => {
-                const selectedProviderModel = document.getElementById("provider-model-select").value;
-                const storedToken = localStorage.getItem(selectedProviderModel);
-
-                if (storedToken) {
-                    document.getElementById("token-input").value = storedToken;
-                } else {
-                    document.getElementById("token-input").value = "";
-                }
-            });
-
-            // Fetch total count from the database
-            axios
-                .get("/total-count")
-                .then((response) => {
-                    document.getElementById("total-count").textContent = response.data.count;
-                })
-                .catch((error) => console.error(error));
-
-            // Handle crawl button click
-            document.getElementById("crawl-btn").addEventListener("click", () => {
-                // validate input to have both URL and API token
-                if (!document.getElementById("url-input").value || !document.getElementById("token-input").value) {
-                    alert("Please enter both URL(s) and API token.");
-                    return;
-                }
-
-                const selectedProviderModel = document.getElementById("provider-model-select").value;
-                const apiToken = document.getElementById("token-input").value;
-                const extractBlocks = document.getElementById("extract-blocks-checkbox").checked;
-                const bypassCache = document.getElementById("bypass-cache-checkbox").checked;
-
-                // Save the selected provider model and token to local storage
-                localStorage.setItem("provider_model", selectedProviderModel);
-                localStorage.setItem(selectedProviderModel, apiToken);
-
-                const urlsInput = document.getElementById("url-input").value;
-                const urls = urlsInput.split(",").map((url) => url.trim());
-                const data = {
-                    urls: urls,
-                    provider_model: selectedProviderModel,
-                    api_token: apiToken,
-                    include_raw_html: true,
-                    bypass_cache: bypassCache,
-                    extract_blocks: extractBlocks,
-                    word_count_threshold: parseInt(document.getElementById("threshold").value),
-                    extraction_strategy: document.getElementById("extraction-strategy-select").value,
-                    chunking_strategy: document.getElementById("chunking-strategy-select").value,
-                    css_selector: document.getElementById("css-selector").value,
-                    verbose: true,
-                };
-
-                // save api token to local storage
-                localStorage.setItem("api_token", document.getElementById("token-input").value);
-
-                document.getElementById("loading").classList.remove("hidden");
-                //document.getElementById("result").classList.add("hidden");
-                //document.getElementById("code_help").classList.add("hidden");
-
-                axios
-                    .post("/crawl", data)
-                    .then((response) => {
-                        const result = response.data.results[0];
-                        const parsedJson = JSON.parse(result.extracted_content);
-                        document.getElementById("json-result").textContent = JSON.stringify(parsedJson, null, 2);
-                        document.getElementById("cleaned-html-result").textContent = result.cleaned_html;
-                        document.getElementById("markdown-result").textContent = result.markdown;
-
-                        // Update code examples dynamically
-                        const extractionStrategy = data.extraction_strategy;
-                        const isLLMExtraction = extractionStrategy === "LLMExtractionStrategy";
-
-                        document.getElementById(
-                            "curl-code"
-                        ).textContent = `curl -X POST -H "Content-Type: application/json" -d '${JSON.stringify({
-                            ...data,
-                            api_token: isLLMExtraction ? "your_api_token" : undefined,
-                        })}' http://crawl4ai.uccode.io/crawl`;
-
-                        document.getElementById(
-                            "python-code"
-                        ).textContent = `import requests\n\ndata = ${JSON.stringify(
-                            { ...data, api_token: isLLMExtraction ? "your_api_token" : undefined },
-                            null,
-                            2
-                        )}\n\nresponse = requests.post("http://crawl4ai.uccode.io/crawl", json=data) # OR local host if your run locally \nprint(response.json())`;
-
-                        document.getElementById(
-                            "nodejs-code"
-                        ).textContent = `const axios = require('axios');\n\nconst data = ${JSON.stringify(
-                            { ...data, api_token: isLLMExtraction ? "your_api_token" : undefined },
-                            null,
-                            2
-                        )};\n\naxios.post("http://crawl4ai.uccode.io/crawl", data) // OR local host if your run locally \n    .then(response => console.log(response.data))\n    .catch(error => console.error(error));`;
-
-                        document.getElementById(
-                            "library-code"
-                        ).textContent = `from crawl4ai.web_crawler import WebCrawler\nfrom crawl4ai.extraction_strategy import *\nfrom crawl4ai.chunking_strategy import *\n\ncrawler = WebCrawler()\ncrawler.warmup()\n\nresult = crawler.run(\n    url='${
-                            urls[0]
-                        }',\n    word_count_threshold=${data.word_count_threshold},\n    extraction_strategy=${
-                            isLLMExtraction
-                                ? `${extractionStrategy}(provider="${data.provider_model}", api_token="${data.api_token}")`
-                                : extractionStrategy + "()"
-                        },\n    chunking_strategy=${data.chunking_strategy}(),\n    bypass_cache=${
-                            data.bypass_cache
-                        },\n    css_selector="${data.css_selector}"\n)\nprint(result)`;
-
-                        // Highlight code syntax
-                        hljs.highlightAll();
-
-                        // Select JSON tab by default
-                        document.querySelector('.tab-btn[data-tab="json"]').click();
-
-                        document.getElementById("loading").classList.add("hidden");
-                        document.getElementById("result").classList.remove("hidden");
-                        document.getElementById("code_help").classList.remove("hidden");
-
-                        // increment the total count
-                        document.getElementById("total-count").textContent =
-                            parseInt(document.getElementById("total-count").textContent) + 1;
-                    })
-                    .catch((error) => {
-                        console.error(error);
-                        document.getElementById("loading").classList.add("hidden");
-                    });
-            });
-
-            // Handle tab clicks
-            document.querySelectorAll(".tab-btn").forEach((btn) => {
-                btn.addEventListener("click", () => {
-                    const tab = btn.dataset.tab;
-                    document
-                        .querySelectorAll(".tab-btn")
-                        .forEach((b) => b.classList.remove("bg-lime-700", "text-white"));
-                    btn.classList.add("bg-lime-700", "text-white");
-                    document.querySelectorAll(".tab-content.code pre").forEach((el) => el.classList.add("hidden"));
-                    document.getElementById(`${tab}-result`).parentElement.classList.remove("hidden");
-                });
-            });
-
-            // Handle code tab clicks
-            document.querySelectorAll(".code-tab-btn").forEach((btn) => {
-                btn.addEventListener("click", () => {
-                    const tab = btn.dataset.tab;
-                    document
-                        .querySelectorAll(".code-tab-btn")
-                        .forEach((b) => b.classList.remove("bg-lime-700", "text-white"));
-                    btn.classList.add("bg-lime-700", "text-white");
-                    document.querySelectorAll(".tab-content.result pre").forEach((el) => el.classList.add("hidden"));
-                    document.getElementById(`${tab}-code`).parentElement.classList.remove("hidden");
-                });
-            });
-
-            // Handle copy to clipboard button clicks
-
-            async function copyToClipboard(text) {
-                if (navigator.clipboard && navigator.clipboard.writeText) {
-                    return navigator.clipboard.writeText(text);
-                } else {
-                    return fallbackCopyTextToClipboard(text);
-                }
-            }
-
-            function fallbackCopyTextToClipboard(text) {
-                return new Promise((resolve, reject) => {
-                    const textArea = document.createElement("textarea");
-                    textArea.value = text;
-
-                    // Avoid scrolling to bottom
-                    textArea.style.top = "0";
-                    textArea.style.left = "0";
-                    textArea.style.position = "fixed";
-
-                    document.body.appendChild(textArea);
-                    textArea.focus();
-                    textArea.select();
-
-                    try {
-                        const successful = document.execCommand("copy");
-                        if (successful) {
-                            resolve();
-                        } else {
-                            reject();
-                        }
-                    } catch (err) {
-                        reject(err);
-                    }
-
-                    document.body.removeChild(textArea);
-                });
-            }
-
-            document.querySelectorAll(".copy-btn").forEach((btn) => {
-                btn.addEventListener("click", () => {
-                    const target = btn.dataset.target;
-                    const code = document.getElementById(target).textContent;
-                    //navigator.clipboard.writeText(code).then(() => {
-                    copyToClipboard(code).then(() => {
-                        btn.textContent = "Copied!";
-                        setTimeout(() => {
-                            btn.textContent = "Copy";
-                        }, 2000);
-                    });
-                });
-            });
-
-            document.addEventListener("DOMContentLoaded", async () => {
-                try {
-                    const extractionResponse = await fetch("/strategies/extraction");
-                    const extractionStrategies = await extractionResponse.json();
-
-                    const chunkingResponse = await fetch("/strategies/chunking");
-                    const chunkingStrategies = await chunkingResponse.json();
-
-                    renderStrategies("extraction-strategies", extractionStrategies);
-                    renderStrategies("chunking-strategies", chunkingStrategies);
-                } catch (error) {
-                    console.error("Error fetching strategies:", error);
-                }
-            });
-
-            function renderStrategies(containerId, strategies) {
-                const container = document.getElementById(containerId);
-                container.innerHTML = ""; // Clear any existing content
-                strategies = JSON.parse(strategies);
-                Object.entries(strategies).forEach(([strategy, description]) => {
-                    const strategyElement = document.createElement("div");
-                    strategyElement.classList.add("bg-zinc-800", "p-4", "rounded", "shadow-md", "docs-item");
-
-                    const strategyDescription = document.createElement("div");
-                    strategyDescription.classList.add("text-gray-300", "prose", "prose-sm");
-                    strategyDescription.innerHTML = marked.parse(description);
-
-                    strategyElement.appendChild(strategyDescription);
-
-                    container.appendChild(strategyElement);
-                });
-            }
-
-            // Highlight code syntax
-            hljs.highlightAll();
-        </script>
-    </body>
-</html>
diff --git a/pages/index.html b/pages/index.html
deleted file mode 100644
index 2947c34a..00000000
--- a/pages/index.html
+++ /dev/null
@@ -1,73 +0,0 @@
-<!DOCTYPE html>
-<html lang="en">
-    <head>
-        <meta charset="UTF-8" />
-        <meta name="viewport" content="width=device-width, initial-scale=1.0" />
-        <title>Crawl4AI</title>
-
-        <link rel="preconnect" href="https://fonts.googleapis.com" />
-        <link rel="preconnect" href="https://fonts.gstatic.com" crossorigin />
-        <link href="https://fonts.googleapis.com/css2?family=Inter:wght@100..900&display=swap" rel="stylesheet" />
-
-        <!-- <link href="https://cdn.jsdelivr.net/npm/tailwindcss@3.4.3/dist/tailwind.min.css" rel="stylesheet" /> -->
-        <script src="https://cdn.tailwindcss.com"></script>
-        <script src="https://cdn.jsdelivr.net/npm/axios/dist/axios.min.js"></script>
-        <link rel="stylesheet" href="/pages/app.css" />
-        <link
-            rel="stylesheet"
-            href="https://cdnjs.cloudflare.com/ajax/libs/highlight.js/11.7.0/styles/monokai.min.css"
-        />
-        <script src="https://cdn.jsdelivr.net/npm/marked/marked.min.js"></script>
-
-        <script src="https://cdnjs.cloudflare.com/ajax/libs/highlight.js/11.7.0/highlight.min.js"></script>
-    </head>
-    <body class="bg-black text-gray-200">
-        <header class="bg-zinc-950 text-lime-500 py-4 flex">
-            
-            <div class="mx-auto px-4">
-                <h1 class="text-2xl font-bold">🔥🕷️ Crawl4AI: Web Data for your Thoughts</h1>
-            </div>
-            <div class="mx-auto px-4 flex font-bold text-xl gap-2">
-                <span>📊 Total Website Processed</span>
-                <span id="total-count" class="text-lime-400">2</span>
-            </div>
-        </header>
-        
-            {{ try_it | safe }}
-
-            <div class="mx-auto p-4 bg-zinc-950 text-lime-500 min-h-screen">
-                <div class="container mx-auto">
-                <div class="flex h-full px-20">
-                    <div class="sidebar w-1/4 p-4">
-                        <h2 class="text-lg font-bold mb-4">Outline</h2>
-                        <ul>
-                            <li class="mb-2"><a href="#" data-target="installation">Installation</a></li>
-                            <li class="mb-2"><a href="#" data-target="how-to-guide">How to Guide</a></li>
-                            <li class="mb-2"><a href="#" data-target="chunking-strategies">Chunking Strategies</a></li>
-                            <li class="mb-2">
-                                <a href="#" data-target="extraction-strategies">Extraction Strategies</a>
-                            </li>
-                        </ul>
-                    </div>
-
-                    <!-- Main Content -->
-                    <div class="w-3/4 p-4">
-                        {{installation | safe}} {{how_to_guide | safe}}
-
-                        <section id="chunking-strategies" class="content-section">
-                            <h1 class="text-2xl font-bold">Chunking Strategies</h1>
-                            <p>Content for chunking strategies...</p>
-                        </section>
-                        <section id="extraction-strategies" class="content-section">
-                            <h1 class="text-2xl font-bold">Extraction Strategies</h1>
-                            <p>Content for extraction strategies...</p>
-                        </section>
-                    </div>
-                </div>
-            </div>
-            </div>
-        
-        {{ footer | safe }}
-        <script script src="/pages/app.js"></script>
-    </body>
-</html>
diff --git a/pages/index_pooling.html b/pages/index_pooling.html
deleted file mode 100644
index 02128f84..00000000
--- a/pages/index_pooling.html
+++ /dev/null
@@ -1,425 +0,0 @@
-<!DOCTYPE html>
-<html lang="en">
-    <head>
-        <meta charset="UTF-8" />
-        <meta name="viewport" content="width=device-width, initial-scale=1.0" />
-        <title>Crawl4AI</title>
-
-        <link rel="preconnect" href="https://fonts.googleapis.com" />
-        <link rel="preconnect" href="https://fonts.gstatic.com" crossorigin />
-        <link href="https://fonts.googleapis.com/css2?family=Inter:wght@100..900&display=swap" rel="stylesheet" />
-
-        <link href="https://cdn.jsdelivr.net/npm/tailwindcss@2.2.19/dist/tailwind.min.css" rel="stylesheet" />
-        <script src="https://cdn.jsdelivr.net/npm/axios/dist/axios.min.js"></script>
-        <link
-            rel="stylesheet"
-            href="https://cdnjs.cloudflare.com/ajax/libs/highlight.js/11.7.0/styles/vs2015.min.css"
-        />
-        <script src="https://cdnjs.cloudflare.com/ajax/libs/highlight.js/11.7.0/highlight.min.js"></script>
-        <style>
-            :root {
-                --ifm-font-size-base: 100%;
-                --ifm-line-height-base: 1.65;
-                --ifm-font-family-base: system-ui, -apple-system, Segoe UI, Roboto, Ubuntu, Cantarell, Noto Sans,
-                    sans-serif, BlinkMacSystemFont, "Segoe UI", Helvetica, Arial, sans-serif, "Apple Color Emoji",
-                    "Segoe UI Emoji", "Segoe UI Symbol";
-            }
-            html {
-                -webkit-font-smoothing: antialiased;
-                -webkit-text-size-adjust: 100%;
-                text-size-adjust: 100%;
-                font: var(--ifm-font-size-base) / var(--ifm-line-height-base) var(--ifm-font-family-base);
-            }
-            body {
-                background-color: #1a202c;
-                color: #fff;
-            }
-            .tab-content {
-                max-height: 400px;
-                overflow: auto;
-            }
-            pre {
-                white-space: pre-wrap;
-                font-size: 14px;
-            }
-            pre code {
-                width: 100%;
-            }
-        </style>
-    </head>
-    <body>
-        <header class="bg-gray-900 text-white py-4">
-            <div class="container mx-auto px-4">
-                <h1 class="text-2xl font-bold">🔥🕷️ Crawl4AI: Open-source LLM Friendly Web scraper</h1>
-            </div>
-        </header>
-
-        <section class="try-it py-8 pb-20">
-            <div class="container mx-auto px-4">
-                <h2 class="text-2xl font-bold mb-4">Try It Now</h2>
-                <div class="mb-4 flex w-full gap-2">
-                    <input
-                        type="text"
-                        id="url-input"
-                        value="https://kidocode.com"
-                        class="border border-gray-600 rounded px-4 py-2 flex-grow bg-gray-800 text-white"
-                        placeholder="Enter URL(s) separated by commas"
-                    />
-                    <select
-                        id="provider-model-select"
-                        class="border border-gray-600 rounded px-4 py-2 bg-gray-800 text-white"
-                    >
-                        <!-- Add your option values here -->
-                        <option value="groq/llama3-70b-8192">groq/llama3-70b-8192</option>
-                        <option value="groq/llama3-8b-8192">groq/llama3-8b-8192</option>
-                        <option value="openai/gpt-4-turbo">gpt-4-turbo</option>
-                        <option value="openai/gpt-3.5-turbo">gpt-3.5-turbo</option>
-                        <option value="anthropic/claude-3-haiku-20240307">claude-3-haiku</option>
-                        <option value="anthropic/claude-3-opus-20240229">claude-3-opus</option>
-                        <option value="anthropic/claude-3-sonnet-20240229">claude-3-sonnet</option>
-                    </select>
-                    <input
-                        type="password"
-                        id="token-input"
-                        class="border border-gray-600 rounded px-4 py-2 flex-grow bg-gray-800 text-white"
-                        placeholder="Enter Groq API token"
-                    />
-                    <div class="flex items-center justify-center">
-                        <input type="checkbox" id="extract-blocks-checkbox" class="mr-2" checked>
-                        <label for="extract-blocks-checkbox" class="text-white">Extract Blocks</label>
-                    </div>
-                    <button id="crawl-btn" class="bg-blue-600 text-white px-4 py-2 rounded">Crawl</button>
-                </div>
-                <div class="grid grid-cols-1 md:grid-cols-2 gap-8">
-                    <div id="loading" class="hidden mt-4">
-                        <p>Loading...</p>
-                    </div>
-                    <div id="result" class="tab-container flex-1 h-full flex-col">
-                        <div class="tab-buttons flex gap-2">
-                            <button class="tab-btn px-4 py-2 bg-gray-700 rounded-t" data-tab="json">JSON</button>
-                            <button class="tab-btn px-4 py-2 bg-gray-700 rounded-t" data-tab="cleaned-html">
-                                Cleaned HTML
-                            </button>
-                            <button class="tab-btn px-4 py-2 bg-gray-700 rounded-t" data-tab="markdown">
-                                Markdown
-                            </button>
-                        </div>
-                        <div class="tab-content code bg-gray-800 p-2 rounded  h-full  flex-1 border border-gray-600">
-                            <pre class="h-full flex"><code id="json-result" class="language-json "></code></pre>
-                            <pre
-                                class="hidden h-full flex"
-                            ><code id="cleaned-html-result" class="language-html "></code></pre>
-                            <pre
-                                class="hidden h-full flex"
-                            ><code id="markdown-result" class="language-markdown "></code></pre>
-                        </div>
-                    </div>
-                    <div id="code_help" class="tab-container flex-1 h-full">
-                        <div class="tab-buttons flex gap-2">
-                            <button class="code-tab-btn px-4 py-2 bg-gray-700 rounded-t" data-tab="curl">cURL</button>
-                            <button class="code-tab-btn px-4 py-2 bg-gray-700 rounded-t" data-tab="python">
-                                Python
-                            </button>
-                            <button class="code-tab-btn px-4 py-2 bg-gray-700 rounded-t" data-tab="nodejs">
-                                Node.js
-                            </button>
-                        </div>
-                        <div class="tab-content result bg-gray-800 p-2 rounded h-full  flex-1 border border-gray-600">
-                            <pre class="h-full flex relative">
-                                    <code id="curl-code" class="language-bash"></code>
-                                    <button class="absolute top-2 right-2 bg-gray-700 text-white px-2 py-1 rounded copy-btn" data-target="curl-code">Copy</button>
-                                </pre>
-                            <pre class="hidden h-full flex relative">
-                                    <code id="python-code" class="language-python"></code>
-                                    <button class="absolute top-2 right-2 bg-gray-700 text-white px-2 py-1 rounded copy-btn" data-target="python-code">Copy</button>
-                                </pre>
-                            <pre class="hidden h-full flex relative">
-                                    <code id="nodejs-code" class="language-javascript"></code>
-                                    <button class="absolute top-2 right-2 bg-gray-700 text-white px-2 py-1 rounded copy-btn" data-target="nodejs-code">Copy</button>
-                                </pre>
-                        </div>
-                    </div>
-                </div>
-            </div>
-        </section>
-
-        <section class="hero bg-gray-900 py-8">
-            <div class="container mx-auto px-4">
-                <h2 class="text-3xl font-bold mb-4">🤔 Why building this?</h2>
-                <p class="text-lg mb-4">
-                    In recent times, we've seen numerous startups emerging, riding the AI hype wave and charging for
-                    services that should rightfully be accessible to everyone. 🌍💸 One for example is to scrap and crawl 
-                    a web page, and transform it o a form suitable for LLM. We don't think one should build a business
-                    out of this, but definilty should be opened source. So if you possess the skills to build such things 
-                    and you have such philosphy you should join our "Robinhood" band and help set
-                    these products free. 🆓🤝
-                </p>
-            </div>
-        </section>
-
-        <section class="installation py-8">
-            <div class="container mx-auto px-4">
-                <h2 class="text-2xl font-bold mb-4">⚙️ Installation</h2>
-                <p class="mb-4">
-                    To install and run Crawl4AI locally or on your own service, the best way is to use Docker. 🐳 Follow
-                    these steps:
-                </p>
-                <ol class="list-decimal list-inside mb-4">
-                    <li>
-                        Clone the GitHub repository: 📥
-                        <code>git clone https://github.com/unclecode/crawl4ai.git</code>
-                    </li>
-                    <li>Navigate to the project directory: 📂 <code>cd crawl4ai</code></li>
-                    <li>
-                        Build the Docker image: 🛠️ <code>docker build -t crawl4ai .</code> On Mac, follow: 🍎
-                        <code>docker build --platform linux/amd64 -t crawl4ai .</code>
-                    </li>
-                    <li>Run the Docker container: ▶️ <code>docker run -p 8000:80 crawl4ai</code></li>
-                </ol>
-                <p>
-                    For more detailed instructions and advanced configuration options, please refer to the 📚
-                    <a href="https://github.com/unclecode/crawl4ai" class="text-blue-400">GitHub repository</a>.
-                </p>
-            </div>
-        </section>
-
-        <footer class="bg-gray-900 text-white py-4">
-            <div class="container mx-auto px-4">
-                <div class="flex justify-between items-center">
-                    <p>© 2024 Crawl4AI. All rights reserved.</p>
-                    <div class="social-links">
-                        <a
-                            href="https://github.com/unclecode/crawl4ai"
-                            class="text-white hover:text-gray-300 mx-2"
-                            target="_blank"
-                            >😺 GitHub</a
-                        >
-                        <a
-                            href="https://twitter.com/unclecode"
-                            class="text-white hover:text-gray-300 mx-2"
-                            target="_blank"
-                            >🐦 Twitter</a
-                        >
-                        <a
-                            href="https://discord.gg/your-invite-link"
-                            class="text-white hover:text-gray-300 mx-2"
-                            target="_blank"
-                            >💬 Discord</a
-                        >
-                    </div>
-                </div>
-            </div>
-        </footer>
-
-        <script>
-            // Get the selected provider model and token from local storage
-            const storedProviderModel = localStorage.getItem("provider_model");
-            const storedToken = localStorage.getItem(storedProviderModel);
-
-            if (storedProviderModel) {
-                document.getElementById("provider-model-select").value = storedProviderModel;
-            }
-
-            if (storedToken) {
-                document.getElementById("token-input").value = storedToken;
-            }
-
-            // Handle provider model dropdown change
-            document.getElementById("provider-model-select").addEventListener("change", () => {
-                const selectedProviderModel = document.getElementById("provider-model-select").value;
-                const storedToken = localStorage.getItem(selectedProviderModel);
-
-                if (storedToken) {
-                    document.getElementById("token-input").value = storedToken;
-                } else {
-                    document.getElementById("token-input").value = "";
-                }
-            });
-
-            // Fetch total count from the database
-            axios
-                .get("/total-count")
-                .then((response) => {
-                    document.getElementById("total-count").textContent = response.data.count;
-                })
-                .catch((error) => console.error(error));
-
-            // Handle crawl button click
-            document.getElementById("crawl-btn").addEventListener("click", () => {
-                // validate input to have both URL and API token
-                if (!document.getElementById("url-input").value || !document.getElementById("token-input").value) {
-                    alert("Please enter both URL(s) and API token.");
-                    return;
-                }
-
-                const selectedProviderModel = document.getElementById("provider-model-select").value;
-                const apiToken = document.getElementById("token-input").value;
-                const extractBlocks = document.getElementById("extract-blocks-checkbox").checked;
-
-
-                // Save the selected provider model and token to local storage
-                localStorage.setItem("provider_model", selectedProviderModel);
-                localStorage.setItem(selectedProviderModel, apiToken);
-
-                const urlsInput = document.getElementById("url-input").value;
-                const urls = urlsInput.split(",").map((url) => url.trim());
-                const data = {
-                    urls: urls,
-                    provider_model: selectedProviderModel,
-                    api_token: apiToken,
-                    include_raw_html: true,
-                    forced: false,
-                    extract_blocks: extractBlocks,
-                };
-
-                // save api token to local storage
-                localStorage.setItem("api_token", document.getElementById("token-input").value);
-
-                document.getElementById("loading").classList.remove("hidden");
-                document.getElementById("result").classList.add("hidden");
-                document.getElementById("code_help").classList.add("hidden");
-
-                axios
-                    .post("/crawl", data)
-                    .then((response) => {
-                        const result = response.data.results[0];
-                        const parsedJson = JSON.parse(result.extracted_content);
-                        document.getElementById("json-result").textContent = JSON.stringify(parsedJson, null, 2);
-                        document.getElementById("cleaned-html-result").textContent = result.cleaned_html;
-                        document.getElementById("markdown-result").textContent = result.markdown;
-
-                        // Update code examples dynamically
-                        // Update code examples dynamically
-                        document.getElementById(
-                            "curl-code"
-                        ).textContent = `curl -X POST -H "Content-Type: application/json" -d '${JSON.stringify({
-                            ...data,
-                            api_token: "your_api_token",
-                        })}' http://localhost:8000/crawl`;
-
-                        document.getElementById(
-                            "python-code"
-                        ).textContent = `import requests\n\ndata = ${JSON.stringify(
-                            { ...data, api_token: "your_api_token" },
-                            null,
-                            2
-                        )}\n\nresponse = requests.post("http://localhost:8000/crawl", json=data)\nprint(response.json())`;
-
-                        document.getElementById(
-                            "nodejs-code"
-                        ).textContent = `const axios = require('axios');\n\nconst data = ${JSON.stringify(
-                            { ...data, api_token: "your_api_token" },
-                            null,
-                            2
-                        )};\n\naxios.post("http://localhost:8000/crawl", data)\n    .then(response => console.log(response.data))\n    .catch(error => console.error(error));`;
-                        // Highlight code syntax
-                        hljs.highlightAll();
-
-                        // Select JSON tab by default
-                        document.querySelector('.tab-btn[data-tab="json"]').click();
-
-                        document.getElementById("loading").classList.add("hidden");
-                        document.getElementById("result").classList.remove("hidden");
-                        document.getElementById("code_help").classList.remove("hidden");
-                    })
-                    .catch((error) => {
-                        console.error(error);
-                        document.getElementById("loading").classList.add("hidden");
-                    });
-            });
-
-            // Handle tab clicks
-            document.querySelectorAll(".tab-btn").forEach((btn) => {
-                btn.addEventListener("click", () => {
-                    const tab = btn.dataset.tab;
-                    document
-                        .querySelectorAll(".tab-btn")
-                        .forEach((b) => b.classList.remove("bg-blue-600", "text-white"));
-                    btn.classList.add("bg-blue-600", "text-white");
-                    document.querySelectorAll(".tab-content.code pre").forEach((el) => el.classList.add("hidden"));
-                    document.getElementById(`${tab}-result`).parentElement.classList.remove("hidden");
-                });
-            });
-
-            // Handle code tab clicks
-            document.querySelectorAll(".code-tab-btn").forEach((btn) => {
-                btn.addEventListener("click", () => {
-                    const tab = btn.dataset.tab;
-                    document
-                        .querySelectorAll(".code-tab-btn")
-                        .forEach((b) => b.classList.remove("bg-blue-600", "text-white"));
-                    btn.classList.add("bg-blue-600", "text-white");
-                    document.querySelectorAll(".tab-content.result pre").forEach((el) => el.classList.add("hidden"));
-                    document.getElementById(`${tab}-code`).parentElement.classList.remove("hidden");
-                });
-            });
-
-            // Handle copy to clipboard button clicks
-            document.querySelectorAll(".copy-btn").forEach((btn) => {
-                btn.addEventListener("click", () => {
-                    const target = btn.dataset.target;
-                    const code = document.getElementById(target).textContent;
-                    navigator.clipboard.writeText(code).then(() => {
-                        btn.textContent = "Copied!";
-                        setTimeout(() => {
-                            btn.textContent = "Copy";
-                        }, 2000);
-                    });
-                });
-            });
-
-
-            document.getElementById("crawl-btn").addEventListener("click", () => {
-                const urlsInput = document.getElementById("url-input").value;
-                const urls = urlsInput.split(",").map(url => url.trim());
-                const apiToken = document.getElementById("token-input").value;
-                const selectedProviderModel = document.getElementById("provider-model-select").value;
-                const extractBlocks = document.getElementById("extract-blocks-checkbox").checked;
-            
-                const data = {
-                    urls: urls,
-                    provider_model: selectedProviderModel,
-                    api_token: apiToken,
-                    include_raw_html: true,
-                    forced: false,
-                    extract_blocks: extractBlocks
-                };
-            
-                localStorage.setItem("api_token", apiToken);
-            
-                document.getElementById("loading").classList.remove("hidden");
-                document.getElementById("result").classList.add("hidden");
-                document.getElementById("code_help").classList.add("hidden");
-            
-                axios.post("/crawl", data)
-                    .then(response => {
-                        const taskId = response.data.task_id;
-                        pollTaskStatus(taskId);
-                    })
-                    .catch(error => {
-                        console.error('Error during fetch:', error);
-                        document.getElementById("loading").classList.add("hidden");
-                    });
-            });
-            
-            function pollTaskStatus(taskId) {
-                axios.get(`/task/${taskId}`)
-                    .then(response => {
-                        const task = response.data;
-                        if (task.status === 'done') {
-                            displayResults(task.results[0]);
-                        } else if (task.status === 'pending') {
-                            setTimeout(() => pollTaskStatus(taskId), 2000);  // Poll every 2 seconds
-                        } else {
-                            console.error('Task failed:', task.error);
-                            document.getElementById("loading").classList.add("hidden");
-                        }
-                    })
-                    .catch(error => {
-                        console.error('Error polling task status:', error);
-                        document.getElementById("loading").classList.add("hidden");
-                    });
-            }
-        </script>
-    </body>
-</html>
diff --git a/pages/partial/footer.html b/pages/partial/footer.html
deleted file mode 100644
index 3ab189e1..00000000
--- a/pages/partial/footer.html
+++ /dev/null
@@ -1,36 +0,0 @@
-<section class="hero bg-zinc-900 py-8 px-20 text-zinc-400">
-    <div class="container mx-auto px-4">
-        <h2 class="text-3xl font-bold mb-4">🤔 Why building this?</h2>
-        <p class="text-lg mb-4">
-            In recent times, we've witnessed a surge of startups emerging, riding the AI hype wave and charging
-            for services that should rightfully be accessible to everyone. 🌍💸 One such example is scraping and
-            crawling web pages and transforming them into a format suitable for Large Language Models (LLMs).
-            🕸️🤖 We believe that building a business around this is not the right approach; instead, it should
-            definitely be open-source. 🆓🌟 So, if you possess the skills to build such tools and share our
-            philosophy, we invite you to join our "Robinhood" band and help set these products free for the
-            benefit of all. 🤝💪
-        </p>
-    </div>
-</section>
-
-<footer class="bg-zinc-900 text-zinc-400 py-4">
-    <div class="container mx-auto px-4">
-        <div class="flex justify-between items-center">
-            <p>© 2024 Crawl4AI. All rights reserved.</p>
-            <div class="social-links">
-                <a
-                    href="https://github.com/unclecode/crawl4ai"
-                    class="text-zinc-400 hover:text-gray-300 mx-2"
-                    target="_blank"
-                    >😺 GitHub</a
-                >
-                <a
-                    href="https://twitter.com/unclecode"
-                    class="text-zinc-400 hover:text-gray-300 mx-2"
-                    target="_blank"
-                    >🐦 Twitter</a
-                >
-            </div>
-        </div>
-    </div>
-</footer>
\ No newline at end of file
diff --git a/pages/partial/how_to_guide.html b/pages/partial/how_to_guide.html
deleted file mode 100644
index 785915c1..00000000
--- a/pages/partial/how_to_guide.html
+++ /dev/null
@@ -1,174 +0,0 @@
-<section id="how-to-guide" class="content-section">
-    <h1 class="text-2xl font-bold">How to Guide</h1>
-    <div class="flex flex-col gap-4 p-4 bg-zinc-900 text-lime-500">
-        <!-- Step 1 -->
-        <div class="col-span-2 bg-lime-800 p-2 rounded text-zinc-50">
-            🌟
-            <strong
-                >Welcome to the Crawl4ai Quickstart Guide! Let's dive into some web crawling
-                fun!</strong
-            >
-        </div>
-        <div class="">
-            First Step: Create an instance of WebCrawler and call the
-            <code>warmup()</code> function.
-        </div>
-        <div>
-            <pre><code class="language-python">crawler = WebCrawler()
-crawler.warmup()</code></pre>
-        </div>
-
-        <!-- Step 2 -->
-        <div class="col-span-2 bg-lime-800 p-2 rounded text-zinc-50">
-            🧠 <strong>Understanding 'bypass_cache' and 'include_raw_html' parameters:</strong>
-        </div>
-        <div class="">First crawl (caches the result):</div>
-        <div>
-            <pre><code class="language-python">result = crawler.run(url="https://www.nbcnews.com/business")</code></pre>
-        </div>
-        <div class="">Second crawl (Force to crawl again):</div>
-        <div>
-            <pre><code class="language-python">result = crawler.run(url="https://www.nbcnews.com/business", bypass_cache=True)</code></pre>
-            <div class="bg-red-900 p-2 text-zinc-50">
-                ⚠️ Don't forget to set <code>`bypass_cache`</code> to True if you want to try different strategies for the same URL. Otherwise, the cached result will be returned. You can also set <code>`always_by_pass_cache`</code> in constructor to True to always bypass the cache.
-            </div>
-        </div>
-        <div class="">Crawl result without raw HTML content:</div>
-        <div>
-            <pre><code class="language-python">result = crawler.run(url="https://www.nbcnews.com/business", include_raw_html=False)</code></pre>
-        </div>
-
-        <!-- Step 3 -->
-        <div class="col-span-2 bg-lime-800 p-2 rounded text-zinc-50">
-            📄
-            <strong
-                >The 'include_raw_html' parameter, when set to True, includes the raw HTML content
-                in the response. By default, it is set to True.</strong
-            >
-        </div>
-        <div class="">Set <code>always_by_pass_cache</code> to True:</div>
-        <div>
-            <pre><code class="language-python">crawler.always_by_pass_cache = True</code></pre>
-        </div>
-        <!-- Step 3.5 Screenshot -->
-        <div class="col-span-2 bg-lime-800 p-2 rounded text-zinc-50">
-            📸
-            <strong>Let's take a screenshot of the page!</strong>
-        </div>
-        <div>
-            <pre><code class="language-python">result = crawler.run(
-    url="https://www.nbcnews.com/business",
-    screenshot=True
-)
-with open("screenshot.png", "wb") as f:
-    f.write(base64.b64decode(result.screenshot))</code></pre>
-        </div>
-
-
-        <!-- Step 4 -->
-        <div class="col-span-2 bg-lime-800 p-2 rounded text-zinc-50">
-            🧩 <strong>Let's add a chunking strategy: RegexChunking!</strong>
-        </div>
-        <div class="">Using RegexChunking:</div>
-        <div>
-            <pre><code class="language-python">result = crawler.run(
-    url="https://www.nbcnews.com/business",
-    chunking_strategy=RegexChunking(patterns=["\n\n"])
-)</code></pre>
-        </div>
-        <div class="">Using NlpSentenceChunking:</div>
-        <div>
-            <pre><code class="language-python">result = crawler.run(
-    url="https://www.nbcnews.com/business",
-    chunking_strategy=NlpSentenceChunking()
-)</code></pre>
-        </div>
-
-        <!-- Step 5 -->
-        <div class="col-span-2 bg-lime-800 p-2 rounded text-zinc-50">
-            🧠 <strong>Let's get smarter with an extraction strategy: CosineStrategy!</strong>
-        </div>
-        <div class="">Using CosineStrategy:</div>
-        <div>
-            <pre><code class="language-python">result = crawler.run(
-    url="https://www.nbcnews.com/business",
-    extraction_strategy=CosineStrategy(word_count_threshold=10, max_dist=0.2, linkage_method="ward", top_k=3)
-)</code></pre>
-        </div>
-
-        <!-- Step 6 -->
-        <div class="col-span-2 bg-lime-800 p-2 rounded text-zinc-50">
-            🤖
-            <strong
-                >Time to bring in the big guns: LLMExtractionStrategy without instructions!</strong
-            >
-        </div>
-        <div class="">Using LLMExtractionStrategy without instructions:</div>
-        <div>
-            <pre><code class="language-python">result = crawler.run(
-    url="https://www.nbcnews.com/business",
-    extraction_strategy=LLMExtractionStrategy(provider="openai/gpt-4o", api_token=os.getenv('OPENAI_API_KEY'))
-)</code></pre>
-        </div>
-
-        <!-- Step 7 -->
-        <div class="col-span-2 bg-lime-800 p-2 rounded text-zinc-50">
-            📜
-            <strong
-                >Let's make it even more interesting: LLMExtractionStrategy with
-                instructions!</strong
-            >
-        </div>
-        <div class="">Using LLMExtractionStrategy with instructions:</div>
-        <div>
-            <pre><code class="language-python">result = crawler.run(
-    url="https://www.nbcnews.com/business",
-    extraction_strategy=LLMExtractionStrategy(
-    provider="openai/gpt-4o",
-    api_token=os.getenv('OPENAI_API_KEY'),
-    instruction="I am interested in only financial news"
-)
-)</code></pre>
-        </div>
-
-        <!-- Step 8 -->
-        <div class="col-span-2 bg-lime-800 p-2 rounded text-zinc-50">
-            🎯
-            <strong>Targeted extraction: Let's use a CSS selector to extract only H2 tags!</strong>
-        </div>
-        <div class="">Using CSS selector to extract H2 tags:</div>
-        <div>
-            <pre><code class="language-python">result = crawler.run(
-    url="https://www.nbcnews.com/business",
-    css_selector="h2"
-)</code></pre>
-        </div>
-
-        <!-- Step 9 -->
-        <div class="col-span-2 bg-lime-800 p-2 rounded text-zinc-50">
-            🖱️
-            <strong
-                >Let's get interactive: Passing JavaScript code to click 'Load More' button!</strong
-            >
-        </div>
-        <div class="">Using JavaScript to click 'Load More' button:</div>
-        <div>
-            <pre><code class="language-python">js_code = ["""
-const loadMoreButton = Array.from(document.querySelectorAll('button')).find(button => button.textContent.includes('Load More'));
-loadMoreButton && loadMoreButton.click();
-"""]
-crawler = WebCrawler(verbos=crawler_strategy, always_by_pass_cache=True)
-result = crawler.run(url="https://www.nbcnews.com/business", js = js_code)</code></pre>
-        <div class="">Remember that you can pass multiple JavaScript code snippets in the list. They all will be executed in the order they are passed.</div>
-        </div>
-
-        <!-- Conclusion -->
-        <div class="col-span-2 bg-lime-800 p-2 rounded text-zinc-50">
-            🎉
-            <strong
-                >Congratulations! You've made it through the Crawl4ai Quickstart Guide! Now go forth
-                and crawl the web like a pro! 🕸️</strong
-            >
-        </div>
-    </div>
-</section>
\ No newline at end of file
diff --git a/pages/partial/installation.html b/pages/partial/installation.html
deleted file mode 100644
index 6a6561cd..00000000
--- a/pages/partial/installation.html
+++ /dev/null
@@ -1,65 +0,0 @@
-<section id="installation" class="content-section active">
-    <h1 class="text-2xl font-bold">Installation 💻</h1>
-    <p class="mb-4">
-        There are three ways to use Crawl4AI: 
-        <ol class="list-decimal list-inside mb-4">
-            <li class="">
-                As a library
-            </li>
-            <li class="">
-                As a local server (Docker)
-            </li>
-            <li class="">
-                As a Google Colab notebook. <a href="https://colab.research.google.com/drive/1wz8u30rvbq6Scodye9AGCw8Qg_Z8QGsk"
-                ><img
-                    src="https://colab.research.google.com/assets/colab-badge.svg"
-                    alt="Open In Colab"
-                    style="display: inline-block; width: 100px; height: 20px"
-            /></a>
-            </li>
-    </p>
-
-
-    <p class="my-4">To install Crawl4AI as a library, follow these steps:</p>
-
-    <ol class="list-decimal list-inside mb-4">
-        <li class="mb-4">
-            Install the package from GitHub:
-            <pre
-                class="bg-zinc-800 p-4 rounded mt-2 text-zinc-100"
-            ><code>virtualenv venv
-source venv/bin/activate
-pip install "crawl4ai[all] @ git+https://github.com/unclecode/crawl4ai.git"
-            </code></pre>
-        </li>
-        <li class="mb-4">
-            Run the following command to load the required models. This is optional, but it will boost the performance and speed of the crawler. You need to do this only once.
-            <pre
-                class="bg-zinc-800 p-4 rounded mt-2 text-zinc-100"
-            ><code>crawl4ai-download-models</code></pre>
-        </li>
-        <li class="mb-4">
-            Alternatively, you can clone the repository and install the package locally:
-            <pre
-                class="bg-zinc-800 p-4 rounded mt-2 text-zinc-100"
-            ><code  class = "language-python bash">virtualenv venv
-source venv/bin/activate
-git clone https://github.com/unclecode/crawl4ai.git
-cd crawl4ai
-pip install -e .[all]
-</code></pre>
-        </li>
-        <li class="">
-            Use docker to run the local server:
-            <pre
-                class="bg-zinc-800 p-4 rounded mt-2 text-zinc-100"
-            ><code  class = "language-python bash">docker build -t crawl4ai . 
-# docker build --platform linux/amd64 -t crawl4ai . For Mac users
-docker run -d -p 8000:80 crawl4ai</code></pre>
-        </li>
-    </ol>
-    <p class="mb-4">
-        For more information about how to run Crawl4AI as a local server, please refer to the
-        <a href="https://github.com/unclecode/crawl4ai" class="text-blue-400">GitHub repository</a>.
-    </p>
-</section>
\ No newline at end of file
diff --git a/pages/partial/try_it.html b/pages/partial/try_it.html
deleted file mode 100644
index e3033eec..00000000
--- a/pages/partial/try_it.html
+++ /dev/null
@@ -1,217 +0,0 @@
-<section class="try-it py-8 px-16 pb-20 bg-zinc-900 overflow-hidden">
-    <div class="container mx-auto ">
-        <h2 class="text-2xl font-bold mb-4 text-lime-500">Try It Now</h2>
-        <div class="flex gap-4">
-            <div class="flex flex-col flex-1 gap-2">
-                <div class="flex flex-col">
-                    <label for="url-input" class="text-lime-500 font-bold text-xs">URL(s)</label>
-                    <input
-                        type="text"
-                        id="url-input"
-                        value="https://www.nbcnews.com/business"
-                        class="border border-zinc-700 rounded px-4 py-0 bg-zinc-900 text-zinc-300"
-                        placeholder="Enter URL(s) separated by commas"
-                    />
-                </div>
-                <div class="flex gap-2">
-                    <div class="flex flex-col">
-                        <label for="threshold" class="text-lime-500 font-bold text-xs">Min Words Threshold</label>
-                        <select
-                            id="threshold"
-                            class="border border-zinc-700 rounded px-4 py-1 bg-zinc-900 text-zinc-300"
-                        >
-                            <option value="1">1</option>
-                            <option value="5">5</option>
-                            <option value="10" selected>10</option>
-                            <option value="15">15</option>
-                            <option value="20">20</option>
-                            <option value="25">25</option>
-                        </select>
-                    </div>
-                    <div class="flex flex-col flex-1">
-                        <label for="css-selector" class="text-lime-500 font-bold text-xs">CSS Selector</label>
-                        <input
-                            type="text"
-                            id="css-selector"
-                            class="border border-zinc-700 rounded px-4 py-0 bg-zinc-900 text-zinc-300 placeholder-lime-700"
-                            placeholder="CSS Selector (e.g. .content, #main, article)"
-                        />
-                    </div>
-                </div>
-                <div class="flex gap-2">
-                    <div class="flex flex-col">
-                        <label for="extraction-strategy-select" class="text-lime-500 font-bold text-xs"
-                            >Extraction Strategy</label
-                        >
-                        <select
-                            id="extraction-strategy-select"
-                            class="border border-zinc-700 rounded px-4 py-1 bg-zinc-900 text-zinc-300"
-                        >
-                            <option value="NoExtractionStrategy" selected>NoExtractionStrategy</option>
-                            <option value="CosineStrategy">CosineStrategy</option>
-                            <option value="LLMExtractionStrategy">LLMExtractionStrategy</option>
-                        </select>
-                    </div>
-                    <div class="flex flex-col">
-                        <label for="chunking-strategy-select" class="text-lime-500 font-bold text-xs"
-                            >Chunking Strategy</label
-                        >
-                        <select
-                            id="chunking-strategy-select"
-                            class="border border-zinc-700 rounded px-4 py-1 bg-zinc-900 text-zinc-300"
-                        >
-                            <option value="RegexChunking">RegexChunking</option>
-                            <option value="NlpSentenceChunking">NlpSentenceChunking</option>
-                            <option value="TopicSegmentationChunking">TopicSegmentationChunking</option>
-                            <option value="FixedLengthWordChunking">FixedLengthWordChunking</option>
-                            <option value="SlidingWindowChunking">SlidingWindowChunking</option>
-                        </select>
-                    </div>
-                </div>
-                <div id = "llm_settings" class="flex gap-2 hidden hidden">
-                    <div class="flex flex-col">
-                        <label for="provider-model-select" class="text-lime-500 font-bold text-xs"
-                            >Provider Model</label
-                        >
-                        <select
-                            id="provider-model-select"
-                            class="border border-zinc-700 rounded px-4 py-1 bg-zinc-900 text-zinc-300"
-                        >
-                            <option value="groq/llama3-70b-8192">groq/llama3-70b-8192</option>
-                            <option value="groq/llama3-8b-8192">groq/llama3-8b-8192</option>
-                            <option value="groq/mixtral-8x7b-32768">groq/mixtral-8x7b-32768</option>
-                            <option value="openai/gpt-4-turbo">gpt-4-turbo</option>
-                            <option value="openai/gpt-3.5-turbo">gpt-3.5-turbo</option>
-                            <option value="openai/gpt-4o">gpt-4o</option>
-                            <option value="anthropic/claude-3-haiku-20240307">claude-3-haiku</option>
-                            <option value="anthropic/claude-3-opus-20240229">claude-3-opus</option>
-                            <option value="anthropic/claude-3-sonnet-20240229">claude-3-sonnet</option>
-                        </select>
-                    </div>
-                    <div class="flex flex-col flex-1">
-                        <label for="token-input" class="text-lime-500 font-bold text-xs">API Token</label>
-                        <input
-                            type="password"
-                            id="token-input"
-                            class="border border-zinc-700 rounded px-4 py-0 bg-zinc-900 text-zinc-300"
-                            placeholder="Enter Groq API token"
-                        />
-                    </div>
-                </div>
-                <div  class="flex gap-2">
-                    <!-- Add two textarea one for getting Keyword Filter and another one Instruction, make both grow whole with-->
-                    <div id = "semantic_filter_div" class="flex flex-col flex-1 hidden">
-                        <label for="keyword-filter" class="text-lime-500 font-bold text-xs">Keyword Filter</label>
-                        <textarea
-                            id="semantic_filter"
-                            rows="3"
-                            class="border border-zinc-700 rounded px-4 py-0 bg-zinc-900 text-zinc-300 placeholder-zinc-700"
-                            placeholder="Enter keywords for CosineStrategy to narrow down the content."
-                        ></textarea>
-                    </div>
-                    <div id = "instruction_div" class="flex flex-col flex-1 hidden">
-                        <label for="instruction" class="text-lime-500 font-bold text-xs">Instruction</label>
-                        <textarea
-                            id="instruction"
-                            rows="3"
-                            class="border border-zinc-700 rounded px-4 py-0 bg-zinc-900 text-zinc-300 placeholder-zinc-700"
-                            placeholder="Enter instruction for the LLMEstrategy to instruct the model."
-                        ></textarea>
-                    </div>
-                </div>
-                <div class="flex gap-3">
-                    <div class="flex items-center gap-2">
-                        <input type="checkbox" id="bypass-cache-checkbox" />
-                        <label for="bypass-cache-checkbox" class="text-lime-500 font-bold">Bypass Cache</label>
-                    </div>
-                    <div class="flex items-center gap-2">
-                        <input type="checkbox" id="screenshot-checkbox" checked />
-                        <label for="screenshot-checkbox" class="text-lime-500 font-bold">Screenshot</label>
-                    </div>
-                    <div class="flex items-center gap-2 hidden">
-                        <input type="checkbox" id="extract-blocks-checkbox" />
-                        <label for="extract-blocks-checkbox" class="text-lime-500 font-bold">Extract Blocks</label>
-                    </div>
-                    <button id="crawl-btn" class="bg-lime-600 text-black font-bold px-4 py-0 rounded">Crawl</button>
-                </div>
-            </div>
-
-            <div id="loading" class="hidden">
-                <p class="text-white">Loading... Please wait.</p>
-            </div>
-            <div id="result" class="flex-1  overflow-x-auto">
-                <div class="tab-buttons flex gap-2">
-                    <button class="tab-btn px-4 py-1 text-sm bg-zinc-700 rounded-t text-lime-500" data-tab="json">
-                        JSON
-                    </button>
-                    <button
-                        class="tab-btn px-4 py-1 text-sm bg-zinc-700 rounded-t text-lime-500"
-                        data-tab="cleaned-html"
-                    >
-                        Cleaned HTML
-                    </button>
-                    <button class="tab-btn px-4 py-1 text-sm bg-zinc-700 rounded-t text-lime-500" data-tab="markdown">
-                        Markdown
-                    </button>
-                    <button class="tab-btn px-4 py-1 text-sm bg-zinc-700 rounded-t text-lime-500" data-tab="media">
-                        Medias
-                    </button>
-                    <button class="tab-btn px-4 py-1 text-sm bg-zinc-700 rounded-t text-lime-500" data-tab="screenshot">
-                        Screenshot
-                    </button>
-                </div>
-                <div class="tab-content code bg-zinc-900 p-2 rounded h-full border border-zinc-700 text-sm">
-                    <pre class="h-full flex"><code id="json-result" class="language-json"></code></pre>
-                    <pre class="hidden h-full flex"><code id="cleaned-html-result" class="language-html"></code></pre>
-                    <pre class="hidden h-full flex"><code id="markdown-result" class="language-markdown"></code></pre>
-                    <pre class="hidden h-full flex"><code id="media-result" class="language-json"></code></pre>
-                    <pre class="hidden h-full flex"><code id="screenshot-result"></code></pre>
-                </div>
-            </div>
-
-            <div id="code_help" class="flex-1  overflow-x-auto">
-                <div class="tab-buttons flex gap-2">
-                    <button class="code-tab-btn px-4 py-1 text-sm bg-zinc-700 rounded-t text-lime-500" data-tab="curl">
-                        cURL
-                    </button>
-                    <button
-                        class="code-tab-btn px-4 py-1 text-sm bg-zinc-700 rounded-t text-lime-500"
-                        data-tab="library"
-                    >
-                        Python
-                    </button>
-                    <button
-                        class="code-tab-btn px-4 py-1 text-sm bg-zinc-700 rounded-t text-lime-500"
-                        data-tab="python"
-                    >
-                        REST API
-                    </button>
-                    <!-- <button
-                        class="code-tab-btn px-4 py-1 text-sm bg-zinc-700 rounded-t text-lime-500"
-                        data-tab="nodejs"
-                    >
-                        Node.js
-                    </button> -->
-                </div>
-                <div class="tab-content result bg-zinc-900 p-2 rounded h-full border border-zinc-700 text-sm">
-                    <pre class="h-full flex relative overflow-x-auto">
-                        <code id="curl-code" class="language-bash"></code>
-                        <button class="absolute top-2 right-2 bg-zinc-700 text-white px-2 py-1 rounded copy-btn" data-target="curl-code">Copy</button>
-                    </pre>
-                    <pre class="hidden h-full flex relative overflow-x-auto">
-                        <code id="python-code" class="language-python"></code>
-                        <button class="absolute top-2 right-2 bg-zinc-700 text-white px-2 py-1 rounded copy-btn" data-target="python-code">Copy</button>
-                    </pre>
-                    <pre class="hidden h-full flex relative overflow-x-auto">
-                        <code id="nodejs-code" class="language-javascript"></code>
-                        <button class="absolute top-2 right-2 bg-zinc-700 text-white px-2 py-1 rounded copy-btn" data-target="nodejs-code">Copy</button>
-                    </pre>
-                    <pre class="hidden h-full flex relative overflow-x-auto">
-                        <code id="library-code" class="language-python"></code>
-                        <button class="absolute top-2 right-2 bg-zinc-700 text-white px-2 py-1 rounded copy-btn" data-target="library-code">Copy</button>
-                    </pre>
-                </div>
-            </div>
-        </div>
-    </div>
-</section>
diff --git a/pages/tmp.html b/pages/tmp.html
deleted file mode 100644
index 7c924676..00000000
--- a/pages/tmp.html
+++ /dev/null
@@ -1,434 +0,0 @@
-<div class="w-3/4 p-4">
-    <section id="installation" class="content-section active">
-        <h1 class="text-2xl font-bold">Installation 💻</h1>
-        <p class="mb-4">There are three ways to use Crawl4AI:</p>
-        <ol class="list-decimal list-inside mb-4">
-            <li class="">As a library</li>
-            <li class="">As a local server (Docker)</li>
-            <li class="">
-                As a Google Colab notebook.
-                <a href="https://colab.research.google.com/drive/1wz8u30rvbq6Scodye9AGCw8Qg_Z8QGsk"
-                    ><img
-                        src="https://colab.research.google.com/assets/colab-badge.svg"
-                        alt="Open In Colab"
-                        style="display: inline-block; width: 100px; height: 20px"
-                /></a>
-            </li>
-            <p></p>
-
-            <p class="my-4">To install Crawl4AI as a library, follow these steps:</p>
-
-            <ol class="list-decimal list-inside mb-4">
-                <li class="mb-4">
-                    Install the package from GitHub:
-                    <pre
-                        class="bg-zinc-800 p-4 rounded mt-2 text-zinc-100"
-                    ><code class="hljs language-bash">pip install git+https://github.com/unclecode/crawl4ai.git</code></pre>
-                </li>
-                <li class="mb-4">
-                    Alternatively, you can clone the repository and install the package locally:
-                    <pre
-                        class="bg-zinc-800 p-4 rounded mt-2 text-zinc-100"
-                    ><code class="language-python bash hljs">virtualenv venv
-source venv/<span class="hljs-built_in">bin</span>/activate
-git clone https://github.com/unclecode/crawl4ai.git
-cd crawl4ai
-pip install -e .
-</code></pre>
-                </li>
-                <li class="">
-                    Use docker to run the local server:
-                    <pre
-                        class="bg-zinc-800 p-4 rounded mt-2 text-zinc-100"
-                    ><code class="language-python bash hljs">docker build -t crawl4ai . 
-<span class="hljs-comment"># docker build --platform linux/amd64 -t crawl4ai . For Mac users</span>
-docker run -d -p <span class="hljs-number">8000</span>:<span class="hljs-number">80</span> crawl4ai</code></pre>
-                </li>
-            </ol>
-            <p class="mb-4">
-                For more information about how to run Crawl4AI as a local server, please refer to the
-                <a href="https://github.com/unclecode/crawl4ai" class="text-blue-400">GitHub repository</a>.
-            </p>
-        </ol>
-    </section>
-    <section id="how-to-guide" class="content-section">
-        <h1 class="text-2xl font-bold">How to Guide</h1>
-        <div class="flex flex-col gap-4 p-4 bg-zinc-900 text-lime-500">
-            <!-- Step 1 -->
-            <div class="col-span-2 bg-lime-800 p-2 rounded text-zinc-50">
-                🌟
-                <strong>Welcome to the Crawl4ai Quickstart Guide! Let's dive into some web crawling fun!</strong>
-            </div>
-            <div class="">
-                First Step: Create an instance of WebCrawler and call the
-                <code>warmup()</code> function.
-            </div>
-            <div>
-                <pre><code class="language-python hljs">crawler = WebCrawler()
-crawler.warmup()</code></pre>
-            </div>
-
-            <!-- Step 2 -->
-            <div class="col-span-2 bg-lime-800 p-2 rounded text-zinc-50">
-                🧠 <strong>Understanding 'bypass_cache' and 'include_raw_html' parameters:</strong>
-            </div>
-            <div class="">First crawl (caches the result):</div>
-            <div>
-                <pre><code class="language-python hljs">result = crawler.run(url=<span class="hljs-string">"https://www.nbcnews.com/business"</span>)</code></pre>
-            </div>
-            <div class="">Second crawl (Force to crawl again):</div>
-            <div>
-                <pre><code class="language-python hljs">result = crawler.run(url=<span class="hljs-string">"https://www.nbcnews.com/business"</span>, bypass_cache=<span class="hljs-literal">True</span>)</code></pre>
-                <div class="bg-red-900 p-2 text-zinc-50">
-                    ⚠️ Don't forget to set <code>`bypass_cache`</code> to True if you want to try different strategies
-                    for the same URL. Otherwise, the cached result will be returned. You can also set
-                    <code>`always_by_pass_cache`</code> in constructor to True to always bypass the cache.
-                </div>
-            </div>
-            <div class="">Crawl result without raw HTML content:</div>
-            <div>
-                <pre><code class="language-python hljs">result = crawler.run(url=<span class="hljs-string">"https://www.nbcnews.com/business"</span>, include_raw_html=<span class="hljs-literal">False</span>)</code></pre>
-            </div>
-
-            <!-- Step 3 -->
-            <div class="col-span-2 bg-lime-800 p-2 rounded text-zinc-50">
-                📄
-                <strong
-                    >The 'include_raw_html' parameter, when set to True, includes the raw HTML content in the response.
-                    By default, it is set to True.</strong
-                >
-            </div>
-            <div class="">Set <code>always_by_pass_cache</code> to True:</div>
-            <div>
-                <pre><code class="language-python hljs">crawler.always_by_pass_cache = <span class="hljs-literal">True</span></code></pre>
-            </div>
-
-            <!-- Step 4 -->
-            <div class="col-span-2 bg-lime-800 p-2 rounded text-zinc-50">
-                🧩 <strong>Let's add a chunking strategy: RegexChunking!</strong>
-            </div>
-            <div class="">Using RegexChunking:</div>
-            <div>
-                <pre><code class="language-python hljs">result = crawler.run(
-url=<span class="hljs-string">"https://www.nbcnews.com/business"</span>,
-chunking_strategy=RegexChunking(patterns=[<span class="hljs-string">"\n\n"</span>])
-)</code></pre>
-            </div>
-            <div class="">Using NlpSentenceChunking:</div>
-            <div>
-                <pre><code class="language-python hljs">result = crawler.run(
-url=<span class="hljs-string">"https://www.nbcnews.com/business"</span>,
-chunking_strategy=NlpSentenceChunking()
-)</code></pre>
-            </div>
-
-            <!-- Step 5 -->
-            <div class="col-span-2 bg-lime-800 p-2 rounded text-zinc-50">
-                🧠 <strong>Let's get smarter with an extraction strategy: CosineStrategy!</strong>
-            </div>
-            <div class="">Using CosineStrategy:</div>
-            <div>
-                <pre><code class="language-python hljs">result = crawler.run(
-url=<span class="hljs-string">"https://www.nbcnews.com/business"</span>,
-extraction_strategy=CosineStrategy(word_count_threshold=<span class="hljs-number">20</span>, max_dist=<span class="hljs-number">0.2</span>, linkage_method=<span class="hljs-string">"ward"</span>, top_k=<span class="hljs-number">3</span>)
-)</code></pre>
-            </div>
-
-            <!-- Step 6 -->
-            <div class="col-span-2 bg-lime-800 p-2 rounded text-zinc-50">
-                🤖
-                <strong>Time to bring in the big guns: LLMExtractionStrategy without instructions!</strong>
-            </div>
-            <div class="">Using LLMExtractionStrategy without instructions:</div>
-            <div>
-                <pre><code class="language-python hljs">result = crawler.run(
-url=<span class="hljs-string">"https://www.nbcnews.com/business"</span>,
-extraction_strategy=LLMExtractionStrategy(provider=<span class="hljs-string">"openai/gpt-4o"</span>, api_token=os.getenv(<span class="hljs-string">'OPENAI_API_KEY'</span>))
-)</code></pre>
-            </div>
-
-            <!-- Step 7 -->
-            <div class="col-span-2 bg-lime-800 p-2 rounded text-zinc-50">
-                📜
-                <strong>Let's make it even more interesting: LLMExtractionStrategy with instructions!</strong>
-            </div>
-            <div class="">Using LLMExtractionStrategy with instructions:</div>
-            <div>
-                <pre><code class="language-python hljs">result = crawler.run(
-url=<span class="hljs-string">"https://www.nbcnews.com/business"</span>,
-extraction_strategy=LLMExtractionStrategy(
-provider=<span class="hljs-string">"openai/gpt-4o"</span>,
-api_token=os.getenv(<span class="hljs-string">'OPENAI_API_KEY'</span>),
-instruction=<span class="hljs-string">"I am interested in only financial news"</span>
-)
-)</code></pre>
-            </div>
-
-            <!-- Step 8 -->
-            <div class="col-span-2 bg-lime-800 p-2 rounded text-zinc-50">
-                🎯
-                <strong>Targeted extraction: Let's use a CSS selector to extract only H2 tags!</strong>
-            </div>
-            <div class="">Using CSS selector to extract H2 tags:</div>
-            <div>
-                <pre><code class="language-python hljs">result = crawler.run(
-url=<span class="hljs-string">"https://www.nbcnews.com/business"</span>,
-css_selector=<span class="hljs-string">"h2"</span>
-)</code></pre>
-            </div>
-
-            <!-- Step 9 -->
-            <div class="col-span-2 bg-lime-800 p-2 rounded text-zinc-50">
-                🖱️
-                <strong>Let's get interactive: Passing JavaScript code to click 'Load More' button!</strong>
-            </div>
-            <div class="">Using JavaScript to click 'Load More' button:</div>
-            <div>
-                <pre><code class="language-python hljs">js_code = <span class="hljs-string">"""
-const loadMoreButton = Array.from(document.querySelectorAll('button')).find(button =&gt; button.textContent.includes('Load More'));
-loadMoreButton &amp;&amp; loadMoreButton.click();
-"""</span>
-crawler_strategy = LocalSeleniumCrawlerStrategy(js_code=js_code)
-crawler = WebCrawler(crawler_strategy=crawler_strategy, always_by_pass_cache=<span class="hljs-literal">True</span>)
-result = crawler.run(url=<span class="hljs-string">"https://www.nbcnews.com/business"</span>)</code></pre>
-            </div>
-
-            <!-- Conclusion -->
-            <div class="col-span-2 bg-lime-800 p-2 rounded text-zinc-50">
-                🎉
-                <strong
-                    >Congratulations! You've made it through the Crawl4ai Quickstart Guide! Now go forth and crawl the
-                    web like a pro! 🕸️</strong
-                >
-            </div>
-        </div>
-    </section>
-
-    <section id="chunking-strategies" class="content-section">
-        <div class="bg-zinc-800 p-4 rounded shadow-md docs-item">
-            <div class="text-gray-300 prose prose-sm">
-                <h3>RegexChunking</h3>
-                <p>
-                    <code>RegexChunking</code> is a text chunking strategy that splits a given text into smaller parts
-                    using regular expressions. This is useful for preparing large texts for processing by language
-                    models, ensuring they are divided into manageable segments.
-                </p>
-                <h4>Constructor Parameters:</h4>
-                <ul>
-                    <li>
-                        <code>patterns</code> (list, optional): A list of regular expression patterns used to split the
-                        text. Default is to split by double newlines (<code>['\n\n']</code>).
-                    </li>
-                </ul>
-                <h4>Example usage:</h4>
-                <pre><code class="language-python">chunker = RegexChunking(patterns=[r'\n\n', r'\. '])
-chunks = chunker.chunk("This is a sample text. It will be split into chunks.")
-</code></pre>
-            </div>
-        </div>
-        <div class="bg-zinc-800 p-4 rounded shadow-md docs-item">
-            <div class="text-gray-300 prose prose-sm">
-                <h3>NlpSentenceChunking</h3>
-                <p>
-                    <code>NlpSentenceChunking</code> uses a natural language processing model to chunk a given text into
-                    sentences. This approach leverages SpaCy to accurately split text based on sentence boundaries.
-                </p>
-                <h4>Constructor Parameters:</h4>
-                <ul>
-                    <li>
-                        None.
-                    </li>
-                </ul>
-                <h4>Example usage:</h4>
-                <pre><code class="language-python">chunker = NlpSentenceChunking()
-chunks = chunker.chunk("This is a sample text. It will be split into sentences.")
-</code></pre>
-            </div>
-        </div>
-        <div class="bg-zinc-800 p-4 rounded shadow-md docs-item">
-            <div class="text-gray-300 prose prose-sm">
-                <h3>TopicSegmentationChunking</h3>
-                <p>
-                    <code>TopicSegmentationChunking</code> uses the TextTiling algorithm to segment a given text into
-                    topic-based chunks. This method identifies thematic boundaries in the text.
-                </p>
-                <h4>Constructor Parameters:</h4>
-                <ul>
-                    <li>
-                        <code>num_keywords</code> (int, optional): The number of keywords to extract for each topic
-                        segment. Default is <code>3</code>.
-                    </li>
-                </ul>
-                <h4>Example usage:</h4>
-                <pre><code class="language-python">chunker = TopicSegmentationChunking(num_keywords=3)
-chunks = chunker.chunk("This is a sample text. It will be split into topic-based segments.")
-</code></pre>
-            </div>
-        </div>
-        <div class="bg-zinc-800 p-4 rounded shadow-md docs-item">
-            <div class="text-gray-300 prose prose-sm">
-                <h3>FixedLengthWordChunking</h3>
-                <p>
-                    <code>FixedLengthWordChunking</code> splits a given text into chunks of fixed length, based on the
-                    number of words.
-                </p>
-                <h4>Constructor Parameters:</h4>
-                <ul>
-                    <li>
-                        <code>chunk_size</code> (int, optional): The number of words in each chunk. Default is
-                        <code>100</code>.
-                    </li>
-                </ul>
-                <h4>Example usage:</h4>
-                <pre><code class="language-python">chunker = FixedLengthWordChunking(chunk_size=100)
-chunks = chunker.chunk("This is a sample text. It will be split into fixed-length word chunks.")
-</code></pre>
-            </div>
-        </div>
-        <div class="bg-zinc-800 p-4 rounded shadow-md docs-item">
-            <div class="text-gray-300 prose prose-sm">
-                <h3>SlidingWindowChunking</h3>
-                <p>
-                    <code>SlidingWindowChunking</code> uses a sliding window approach to chunk a given text. Each chunk
-                    has a fixed length, and the window slides by a specified step size.
-                </p>
-                <h4>Constructor Parameters:</h4>
-                <ul>
-                    <li>
-                        <code>window_size</code> (int, optional): The number of words in each chunk. Default is
-                        <code>100</code>.
-                    </li>
-                    <li>
-                        <code>step</code> (int, optional): The number of words to slide the window. Default is
-                        <code>50</code>.
-                    </li>
-                </ul>
-                <h4>Example usage:</h4>
-                <pre><code class="language-python">chunker = SlidingWindowChunking(window_size=100, step=50)
-chunks = chunker.chunk("This is a sample text. It will be split using a sliding window approach.")
-</code></pre>
-            </div>
-        </div>
-    </section>
-    <section id="extraction-strategies" class="content-section">
-        <div class="bg-zinc-800 p-4 rounded shadow-md docs-item">
-            <div class="text-gray-300 prose prose-sm">
-                <h3>NoExtractionStrategy</h3>
-                <p>
-                    <code>NoExtractionStrategy</code> is a basic extraction strategy that returns the entire HTML
-                    content without any modification. It is useful for cases where no specific extraction is required.
-                    Only clean html, and amrkdown.
-                </p>
-                <h4>Constructor Parameters:</h4>
-                <p>None.</p>
-                <h4>Example usage:</h4>
-                <pre><code class="language-python">extractor = NoExtractionStrategy()
-extracted_content = extractor.extract(url, html)
-</code></pre>
-            </div>
-        </div>
-        <div class="bg-zinc-800 p-4 rounded shadow-md docs-item">
-            <div class="text-gray-300 prose prose-sm">
-                <h3>LLMExtractionStrategy</h3>
-                <p>
-                    <code>LLMExtractionStrategy</code> uses a Language Model (LLM) to extract meaningful blocks or
-                    chunks from the given HTML content. This strategy leverages an external provider for language model
-                    completions.
-                </p>
-                <h4>Constructor Parameters:</h4>
-                <ul>
-                    <li>
-                        <code>provider</code> (str, optional): The provider to use for the language model completions.
-                        Default is <code>DEFAULT_PROVIDER</code> (e.g., openai/gpt-4).
-                    </li>
-                    <li>
-                        <code>api_token</code> (str, optional): The API token for the provider. If not provided, it will
-                        try to load from the environment variable <code>OPENAI_API_KEY</code>.
-                    </li>
-                    <li>
-                        <code>instruction</code> (str, optional): An instruction to guide the LLM on how to perform the
-                        extraction. This allows users to specify the type of data they are interested in or set the tone
-                        of the response. Default is <code>None</code>.
-                    </li>
-                </ul>
-                <h4>Example usage:</h4>
-                <pre><code class="language-python">extractor = LLMExtractionStrategy(provider='openai', api_token='your_api_token', instruction='Extract only news about AI.')
-extracted_content = extractor.extract(url, html)
-</code></pre>
-                <p>
-                    By providing clear instructions, users can tailor the extraction process to their specific needs,
-                    enhancing the relevance and utility of the extracted content.
-                </p>
-            </div>
-        </div>
-        <div class="bg-zinc-800 p-4 rounded shadow-md docs-item">
-            <div class="text-gray-300 prose prose-sm">
-                <h3>CosineStrategy</h3>
-                <p>
-                    <code>CosineStrategy</code> uses hierarchical clustering based on cosine similarity to extract
-                    clusters of text from the given HTML content. This strategy is suitable for identifying related
-                    content sections.
-                </p>
-                <h4>Constructor Parameters:</h4>
-                <ul>
-                    <li>
-                        <code>semantic_filter</code> (str, optional): A string containing keywords for filtering relevant
-                        documents before clustering. If provided, documents are filtered based on their cosine
-                        similarity to the keyword filter embedding. Default is <code>None</code>.
-                    </li>
-                    <li>
-                        <code>word_count_threshold</code> (int, optional): Minimum number of words per cluster. Default
-                        is <code>20</code>.
-                    </li>
-                    <li>
-                        <code>max_dist</code> (float, optional): The maximum cophenetic distance on the dendrogram to
-                        form clusters. Default is <code>0.2</code>.
-                    </li>
-                    <li>
-                        <code>linkage_method</code> (str, optional): The linkage method for hierarchical clustering.
-                        Default is <code>'ward'</code>.
-                    </li>
-                    <li>
-                        <code>top_k</code> (int, optional): Number of top categories to extract. Default is
-                        <code>3</code>.
-                    </li>
-                    <li>
-                        <code>model_name</code> (str, optional): The model name for embedding generation. Default is
-                        <code>'BAAI/bge-small-en-v1.5'</code>.
-                    </li>
-                </ul>
-                <h4>Example usage:</h4>
-                <pre><code class="language-python">extractor = CosineStrategy(semantic_filter='artificial intelligence', word_count_threshold=10, max_dist=0.2, linkage_method='ward', top_k=3, model_name='BAAI/bge-small-en-v1.5')
-extracted_content = extractor.extract(url, html)
-</code></pre>
-                <h4>Cosine Similarity Filtering</h4>
-                <p>
-                    When a <code>semantic_filter</code> is provided, the <code>CosineStrategy</code> applies an
-                    embedding-based filtering process to select relevant documents before performing hierarchical
-                    clustering.
-                </p>
-            </div>
-        </div>
-        <div class="bg-zinc-800 p-4 rounded shadow-md docs-item">
-            <div class="text-gray-300 prose prose-sm">
-                <h3>TopicExtractionStrategy</h3>
-                <p>
-                    <code>TopicExtractionStrategy</code> uses the TextTiling algorithm to segment the HTML content into
-                    topics and extracts keywords for each segment. This strategy is useful for identifying and
-                    summarizing thematic content.
-                </p>
-                <h4>Constructor Parameters:</h4>
-                <ul>
-                    <li>
-                        <code>num_keywords</code> (int, optional): Number of keywords to represent each topic segment.
-                        Default is <code>3</code>.
-                    </li>
-                </ul>
-                <h4>Example usage:</h4>
-                <pre><code class="language-python">extractor = TopicExtractionStrategy(num_keywords=3)
-extracted_content = extractor.extract(url, html)
-</code></pre>
-            </div>
-        </div>
-    </section>
-</div>

From d7c5b900b8d5d965d56417ac94681e7a11bbb1ee Mon Sep 17 00:00:00 2001
From: unclecode <unclecode@kidocode.com>
Date: Sun, 24 Nov 2024 19:35:53 +0800
Subject: [PATCH 067/115] feat: add support for arm64 platform in Docker
 commands and update INSTALL_TYPE variable in docker-compose

---
 README.md          | 9 +++++++++
 docker-compose.yml | 4 ++--
 2 files changed, 11 insertions(+), 2 deletions(-)

diff --git a/README.md b/README.md
index fa88a507..6c5e256e 100644
--- a/README.md
+++ b/README.md
@@ -142,6 +142,9 @@ docker pull unclecode/crawl4ai:gpu      # GPU-enabled version
 # Run the container
 docker run -p 11235:11235 unclecode/crawl4ai:basic  # Replace 'basic' with your chosen version
 
+# In case you want to set platform to arm64
+docker run --platform linux/arm64 -p 11235:11235 unclecode/crawl4ai:basic
+
 # In case to allocate more shared memory for the container
 docker run --shm-size=2gb -p 11235:11235 unclecode/crawl4ai:basic
 ```
@@ -158,6 +161,12 @@ docker build -t crawl4ai:local \
   --build-arg INSTALL_TYPE=basic \  # Options: basic, all
   .
 
+# In case you want to set platform to arm64 (INSTALL_TYPE options: basic, all)
+docker build -t crawl4ai:local \
+  --build-arg INSTALL_TYPE=basic \
+  --platform linux/arm64 \
+  .
+
 # Run your local build
 docker run -p 11235:11235 crawl4ai:local
 ```
diff --git a/docker-compose.yml b/docker-compose.yml
index 1097ef11..b93beda9 100644
--- a/docker-compose.yml
+++ b/docker-compose.yml
@@ -4,8 +4,8 @@ services:
       context: .
       dockerfile: Dockerfile
       args:
-        PYTHON_VERSION: 3.10
-        INSTALL_TYPE: all
+        PYTHON_VERSION: "3.10"
+        INSTALL_TYPE: ${INSTALL_TYPE:-basic}
         ENABLE_GPU: false
     profiles: ["local"]
     ports:

From de43505ae4177ddf671c8b765f2f55c28a740e47 Mon Sep 17 00:00:00 2001
From: unclecode <unclecode@kidocode.com>
Date: Sun, 24 Nov 2024 19:36:30 +0800
Subject: [PATCH 068/115] feat: update version to 0.3.742

---
 crawl4ai/__version__.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/crawl4ai/__version__.py b/crawl4ai/__version__.py
index 05bfd336..f06970ce 100644
--- a/crawl4ai/__version__.py
+++ b/crawl4ai/__version__.py
@@ -1,2 +1,2 @@
 # crawl4ai/_version.py
-__version__ = "0.3.741"
\ No newline at end of file
+__version__ = "0.3.742"
\ No newline at end of file

From b09a86c0c1bc1036ff4954da991dfbccf65534cd Mon Sep 17 00:00:00 2001
From: unclecode <unclecode@kidocode.com>
Date: Sun, 24 Nov 2024 19:40:10 +0800
Subject: [PATCH 069/115] chore: remove deprecated Docker Compose
 configurations for crawl4ai service

---
 docker-compose.hub.yml   | 27 ---------------------------
 docker-compose.local.yml | 33 ---------------------------------
 2 files changed, 60 deletions(-)
 delete mode 100644 docker-compose.hub.yml
 delete mode 100644 docker-compose.local.yml

diff --git a/docker-compose.hub.yml b/docker-compose.hub.yml
deleted file mode 100644
index 9bcfa982..00000000
--- a/docker-compose.hub.yml
+++ /dev/null
@@ -1,27 +0,0 @@
-services:
-  crawl4ai:
-    image: unclecode/crawl4ai:basic  # Pull image from Docker Hub
-    ports:
-      - "11235:11235"  # FastAPI server
-      - "8000:8000"    # Alternative port
-      - "9222:9222"    # Browser debugging
-      - "8080:8080"    # Additional port
-    environment:
-      - CRAWL4AI_API_TOKEN=${CRAWL4AI_API_TOKEN:-}  # Optional API token
-      - OPENAI_API_KEY=${OPENAI_API_KEY:-}          # Optional OpenAI API key
-      - CLAUDE_API_KEY=${CLAUDE_API_KEY:-}          # Optional Claude API key
-    volumes:
-      - /dev/shm:/dev/shm  # Shared memory for browser operations
-    deploy:
-      resources:
-        limits:
-          memory: 4G
-        reservations:
-          memory: 1G
-    restart: unless-stopped
-    healthcheck:
-      test: ["CMD", "curl", "-f", "http://localhost:11235/health"]
-      interval: 30s
-      timeout: 10s
-      retries: 3
-      start_period: 40s
diff --git a/docker-compose.local.yml b/docker-compose.local.yml
deleted file mode 100644
index 7dc41b47..00000000
--- a/docker-compose.local.yml
+++ /dev/null
@@ -1,33 +0,0 @@
-services:
-  crawl4ai:
-    build:
-      context: .
-      dockerfile: Dockerfile
-      args:
-        PYTHON_VERSION: 3.10
-        INSTALL_TYPE: all
-        ENABLE_GPU: false
-    ports:
-      - "11235:11235"  # FastAPI server
-      - "8000:8000"    # Alternative port
-      - "9222:9222"    # Browser debugging
-      - "8080:8080"    # Additional port
-    environment:
-      - CRAWL4AI_API_TOKEN=${CRAWL4AI_API_TOKEN:-}  # Optional API token
-      - OPENAI_API_KEY=${OPENAI_API_KEY:-}          # Optional OpenAI API key
-      - CLAUDE_API_KEY=${CLAUDE_API_KEY:-}          # Optional Claude API key
-    volumes:
-      - /dev/shm:/dev/shm  # Shared memory for browser operations
-    deploy:
-      resources:
-        limits:
-          memory: 4G
-        reservations:
-          memory: 1G
-    restart: unless-stopped
-    healthcheck:
-      test: ["CMD", "curl", "-f", "http://localhost:11235/health"]
-      interval: 30s
-      timeout: 10s
-      retries: 3
-      start_period: 40s
\ No newline at end of file

From 195c0ccf8aa5e0462b97bc8a7f5cff608b69b53a Mon Sep 17 00:00:00 2001
From: unclecode <unclecode@kidocode.com>
Date: Sun, 24 Nov 2024 19:40:27 +0800
Subject: [PATCH 070/115] chore: remove deprecated Docker Compose
 configurations for crawl4ai service

---
 docker-compose.hub.yml   | 27 ---------------------------
 docker-compose.local.yml | 33 ---------------------------------
 2 files changed, 60 deletions(-)
 delete mode 100644 docker-compose.hub.yml
 delete mode 100644 docker-compose.local.yml

diff --git a/docker-compose.hub.yml b/docker-compose.hub.yml
deleted file mode 100644
index 9bcfa982..00000000
--- a/docker-compose.hub.yml
+++ /dev/null
@@ -1,27 +0,0 @@
-services:
-  crawl4ai:
-    image: unclecode/crawl4ai:basic  # Pull image from Docker Hub
-    ports:
-      - "11235:11235"  # FastAPI server
-      - "8000:8000"    # Alternative port
-      - "9222:9222"    # Browser debugging
-      - "8080:8080"    # Additional port
-    environment:
-      - CRAWL4AI_API_TOKEN=${CRAWL4AI_API_TOKEN:-}  # Optional API token
-      - OPENAI_API_KEY=${OPENAI_API_KEY:-}          # Optional OpenAI API key
-      - CLAUDE_API_KEY=${CLAUDE_API_KEY:-}          # Optional Claude API key
-    volumes:
-      - /dev/shm:/dev/shm  # Shared memory for browser operations
-    deploy:
-      resources:
-        limits:
-          memory: 4G
-        reservations:
-          memory: 1G
-    restart: unless-stopped
-    healthcheck:
-      test: ["CMD", "curl", "-f", "http://localhost:11235/health"]
-      interval: 30s
-      timeout: 10s
-      retries: 3
-      start_period: 40s
diff --git a/docker-compose.local.yml b/docker-compose.local.yml
deleted file mode 100644
index 7dc41b47..00000000
--- a/docker-compose.local.yml
+++ /dev/null
@@ -1,33 +0,0 @@
-services:
-  crawl4ai:
-    build:
-      context: .
-      dockerfile: Dockerfile
-      args:
-        PYTHON_VERSION: 3.10
-        INSTALL_TYPE: all
-        ENABLE_GPU: false
-    ports:
-      - "11235:11235"  # FastAPI server
-      - "8000:8000"    # Alternative port
-      - "9222:9222"    # Browser debugging
-      - "8080:8080"    # Additional port
-    environment:
-      - CRAWL4AI_API_TOKEN=${CRAWL4AI_API_TOKEN:-}  # Optional API token
-      - OPENAI_API_KEY=${OPENAI_API_KEY:-}          # Optional OpenAI API key
-      - CLAUDE_API_KEY=${CLAUDE_API_KEY:-}          # Optional Claude API key
-    volumes:
-      - /dev/shm:/dev/shm  # Shared memory for browser operations
-    deploy:
-      resources:
-        limits:
-          memory: 4G
-        reservations:
-          memory: 1G
-    restart: unless-stopped
-    healthcheck:
-      test: ["CMD", "curl", "-f", "http://localhost:11235/health"]
-      interval: 30s
-      timeout: 10s
-      retries: 3
-      start_period: 40s
\ No newline at end of file

From c6a022132b9fff4db14586a55c95f346ac3da5f7 Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Wed, 27 Nov 2024 14:55:56 +0800
Subject: [PATCH 071/115] docs: update CONTRIBUTORS.md to acknowledge
 aadityakanjolia4 for fixing 'CustomHTML2Text' bug

---
 CONTRIBUTORS.md | 1 +
 1 file changed, 1 insertion(+)

diff --git a/CONTRIBUTORS.md b/CONTRIBUTORS.md
index 0b5dcede..81e916cb 100644
--- a/CONTRIBUTORS.md
+++ b/CONTRIBUTORS.md
@@ -10,6 +10,7 @@ We would like to thank the following people for their contributions to Crawl4AI:
 
 ## Community Contributors
 
+- [aadityakanjolia4](https://github.com/aadityakanjolia4) - Fixed the "'CustomHTML2Text' is not defined" bug in the code.
 - [FractalMind](https://github.com/FractalMind) - Created the first official Docker Hub image and fixed Dockerfile errors
 - [ketonkss4](https://github.com/ketonkss4) - Identified Selenium's new capabilities, helping reduce dependencies
 - [jonymusky](https://github.com/jonymusky) - Javascript execution documentation, and wait_for

From 73661f7d1fd37111e34e4dc9ec10f87d5a5f3afe Mon Sep 17 00:00:00 2001
From: zhounan <nelzomal@gmail.com>
Date: Wed, 27 Nov 2024 15:04:20 +0800
Subject: [PATCH 072/115] docs: enhance development installation instructions
 (#286)

Thanks for your contribution. I'm merging your changes and I'll add your name to our contributor list. Thank you so much.
---
 README.md | 10 +++++++++-
 1 file changed, 9 insertions(+), 1 deletion(-)

diff --git a/README.md b/README.md
index 6c5e256e..5ba33dea 100644
--- a/README.md
+++ b/README.md
@@ -110,7 +110,15 @@ For contributors who plan to modify the source code:
 ```bash
 git clone https://github.com/unclecode/crawl4ai.git
 cd crawl4ai
-pip install -e .
+pip install -e .                    # Basic installation in editable mode
+```
+Install optional features:
+```bash
+pip install -e ".[torch]"           # With PyTorch features
+pip install -e ".[transformer]"     # With Transformer features
+pip install -e ".[cosine]"          # With cosine similarity features
+pip install -e ".[sync]"            # With synchronous crawling (Selenium)
+pip install -e ".[all]"             # Install all optional features
 ```
 
 ## One-Click Deployment 🚀

From f998e9e94906302a4ee32cd5e581f4fa7bd22021 Mon Sep 17 00:00:00 2001
From: Hamza Farhan <thehamza96@gmail.com>
Date: Wed, 27 Nov 2024 16:20:54 +0500
Subject: [PATCH 073/115] Fix: handled the cases where markdown_with_citations,
 references_markdown, and filtered_html might not be defined. (#293)

Thanks, dear Farhan, for the changes you made in the code. I accepted and merged them into the main branch. Also, I will add your name to our contributor list. Thank you so much.
---
 crawl4ai/markdown_generation_strategy.py | 8 +++++---
 1 file changed, 5 insertions(+), 3 deletions(-)

diff --git a/crawl4ai/markdown_generation_strategy.py b/crawl4ai/markdown_generation_strategy.py
index 7922c413..249bc1ce 100644
--- a/crawl4ai/markdown_generation_strategy.py
+++ b/crawl4ai/markdown_generation_strategy.py
@@ -84,6 +84,8 @@ class DefaultMarkdownGenerationStrategy(MarkdownGenerationStrategy):
         raw_markdown = raw_markdown.replace('    ```', '```')
 
         # Convert links to citations
+        markdown_with_citations: str = ""
+        references_markdown: str = ""
         if citations:
             markdown_with_citations, references_markdown = self.convert_links_to_citations(
                 raw_markdown, base_url
@@ -91,9 +93,9 @@ class DefaultMarkdownGenerationStrategy(MarkdownGenerationStrategy):
 
         # Generate fit markdown if content filter is provided
         fit_markdown: Optional[str] = None
+        filtered_html: Optional[str] = None
         if content_filter:
-            filtered_html = content_filter.filter_content(cleaned_html)
-            filtered_html = '\n'.join('<div>{}</div>'.format(s) for s in filtered_html)
+            filtered_html = '\n'.join('<div>{}</div>'.format(s) for s in content_filter.filter_content(cleaned_html))
             fit_markdown = h.handle(filtered_html)
 
         return MarkdownGenerationResult(
@@ -101,7 +103,7 @@ class DefaultMarkdownGenerationStrategy(MarkdownGenerationStrategy):
             markdown_with_citations=markdown_with_citations,
             references_markdown=references_markdown,
             fit_markdown=fit_markdown,
-            fit_html=filtered_html
+            fit_html=filtered_html,
         )
 
 def fast_urljoin(base: str, url: str) -> str:

From 24723b2f100ed25747b1b84a833f82e17340b457 Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Thu, 28 Nov 2024 12:45:05 +0800
Subject: [PATCH 074/115] Enhance features and documentation   - Updated
 version to 0.3.743   - Improved ManagedBrowser configuration with dynamic
 host/port   - Implemented fast HTML formatting in web crawler   - Enhanced
 markdown generation with a new generator class   - Improved sanitization and
 utility functions   - Added contributor details and pull request
 acknowledgments   - Updated documentation for clearer usage scenarios   -
 Adjusted tests to reflect class name changes

---
 CONTRIBUTORS.md                          |  8 +++
 crawl4ai/__version__.py                  |  2 +-
 crawl4ai/async_crawler_strategy.py       | 24 +++++----
 crawl4ai/async_webcrawler.py             | 12 +++--
 crawl4ai/content_scraping_strategy.py    | 19 ++++---
 crawl4ai/markdown_generation_strategy.py | 14 ++++--
 crawl4ai/utils.py                        | 64 +++++++++++++++++++++---
 docs/md_v2/advanced/hooks-auth.md        |  8 ++-
 tests/async/test_markdown_genertor.py    | 14 +++---
 9 files changed, 123 insertions(+), 42 deletions(-)

diff --git a/CONTRIBUTORS.md b/CONTRIBUTORS.md
index 0b5dcede..deb46a9c 100644
--- a/CONTRIBUTORS.md
+++ b/CONTRIBUTORS.md
@@ -10,11 +10,19 @@ We would like to thank the following people for their contributions to Crawl4AI:
 
 ## Community Contributors
 
+- [aadityakanjolia4](https://github.com/aadityakanjolia4) - Fix for `CustomHTML2Text` is not defined.
 - [FractalMind](https://github.com/FractalMind) - Created the first official Docker Hub image and fixed Dockerfile errors
 - [ketonkss4](https://github.com/ketonkss4) - Identified Selenium's new capabilities, helping reduce dependencies
 - [jonymusky](https://github.com/jonymusky) - Javascript execution documentation, and wait_for
 - [datehoer](https://github.com/datehoer) - Add browser prxy support
 
+## Pull Requests
+
+- [nelzomal](https://github.com/nelzomal) - Enhance development installation instructions [#286](https://github.com/unclecode/crawl4ai/pull/286)
+- [HamzaFarhan](https://github.com/HamzaFarhan) - Handled the cases where markdown_with_citations, references_markdown, and filtered_html might not be defined [#293](https://github.com/unclecode/crawl4ai/pull/293)
+- [NanmiCoder](https://github.com/NanmiCoder) - fix: crawler strategy exception handling and fixes [#271](https://github.com/unclecode/crawl4ai/pull/271)
+
+
 ## Other Contributors
 
 - [Gokhan](https://github.com/gkhngyk) 
diff --git a/crawl4ai/__version__.py b/crawl4ai/__version__.py
index 05bfd336..37e3c08a 100644
--- a/crawl4ai/__version__.py
+++ b/crawl4ai/__version__.py
@@ -1,2 +1,2 @@
 # crawl4ai/_version.py
-__version__ = "0.3.741"
\ No newline at end of file
+__version__ = "0.3.743"
\ No newline at end of file
diff --git a/crawl4ai/async_crawler_strategy.py b/crawl4ai/async_crawler_strategy.py
index 3f332eb0..882f9a50 100644
--- a/crawl4ai/async_crawler_strategy.py
+++ b/crawl4ai/async_crawler_strategy.py
@@ -35,13 +35,14 @@ stealth_config = StealthConfig(
 
 
 class ManagedBrowser:
-    def __init__(self, browser_type: str = "chromium", user_data_dir: Optional[str] = None, headless: bool = False, logger = None):
+    def __init__(self, browser_type: str = "chromium", user_data_dir: Optional[str] = None, headless: bool = False, logger = None, host: str = "localhost", debugging_port: int = 9222):
         self.browser_type = browser_type
         self.user_data_dir = user_data_dir
         self.headless = headless
         self.browser_process = None
         self.temp_dir = None
-        self.debugging_port = 9222
+        self.debugging_port = debugging_port
+        self.host = host
         self.logger = logger
         self.shutting_down = False
 
@@ -70,7 +71,7 @@ class ManagedBrowser:
             # Monitor browser process output for errors
             asyncio.create_task(self._monitor_browser_process())
             await asyncio.sleep(2)  # Give browser time to start
-            return f"http://localhost:{self.debugging_port}"
+            return f"http://{self.host}:{self.debugging_port}"
         except Exception as e:
             await self.cleanup()
             raise Exception(f"Failed to start browser: {e}")
@@ -416,13 +417,13 @@ class AsyncPlaywrightCrawlerStrategy(AsyncCrawlerStrategy):
         else:
             raise ValueError(f"Invalid hook type: {hook_type}")
 
-    async def execute_hook(self, hook_type: str, *args):
+    async def execute_hook(self, hook_type: str, *args, **kwargs):
         hook = self.hooks.get(hook_type)
         if hook:
             if asyncio.iscoroutinefunction(hook):
-                return await hook(*args)
+                return await hook(*args, **kwargs)
             else:
-                return hook(*args)
+                return hook(*args, **kwargs)
         return args[0] if args else None
 
     def update_user_agent(self, user_agent: str):
@@ -642,6 +643,7 @@ class AsyncPlaywrightCrawlerStrategy(AsyncCrawlerStrategy):
         session_id = kwargs.get("session_id")
         
         # Handle page creation differently for managed browser
+        context = None
         if self.use_managed_browser:
             if session_id:
                 # Reuse existing session if available
@@ -760,7 +762,7 @@ class AsyncPlaywrightCrawlerStrategy(AsyncCrawlerStrategy):
                     return response
 
             if not kwargs.get("js_only", False):
-                await self.execute_hook('before_goto', page)
+                await self.execute_hook('before_goto', page, context = context)
                 
 
                 response = await page.goto(
@@ -773,7 +775,7 @@ class AsyncPlaywrightCrawlerStrategy(AsyncCrawlerStrategy):
                 # response = await page.goto("about:blank")
                 # await page.evaluate(f"window.location.href = '{url}'")
                 
-                await self.execute_hook('after_goto', page)
+                await self.execute_hook('after_goto', page, context = context)
                 
                 # Get status code and headers
                 status_code = response.status
@@ -838,7 +840,7 @@ class AsyncPlaywrightCrawlerStrategy(AsyncCrawlerStrategy):
                 # await page.wait_for_timeout(100)
                 
                 # Check for on execution event
-                await self.execute_hook('on_execution_started', page)
+                await self.execute_hook('on_execution_started', page, context = context)
                 
             if kwargs.get("simulate_user", False) or kwargs.get("magic", False):
                 # Simulate user interactions
@@ -924,7 +926,7 @@ class AsyncPlaywrightCrawlerStrategy(AsyncCrawlerStrategy):
             if kwargs.get("process_iframes", False):
                 page = await self.process_iframes(page)
             
-            await self.execute_hook('before_retrieve_html', page)
+            await self.execute_hook('before_retrieve_html', page, context = context)
             # Check if delay_before_return_html is set then wait for that time
             delay_before_return_html = kwargs.get("delay_before_return_html")
             if delay_before_return_html:
@@ -935,7 +937,7 @@ class AsyncPlaywrightCrawlerStrategy(AsyncCrawlerStrategy):
                 await self.remove_overlay_elements(page)
             
             html = await page.content()
-            await self.execute_hook('before_return_html', page, html)
+            await self.execute_hook('before_return_html', page, html, context = context)
             
             # Check if kwargs has screenshot=True then take screenshot
             screenshot_data = None
diff --git a/crawl4ai/async_webcrawler.py b/crawl4ai/async_webcrawler.py
index b8be6f35..5a46fe39 100644
--- a/crawl4ai/async_webcrawler.py
+++ b/crawl4ai/async_webcrawler.py
@@ -25,7 +25,8 @@ from .config import (
 from .utils import (
     sanitize_input_encode,
     InvalidCSSSelectorError,
-    format_html
+    format_html,
+    fast_format_html
 )
 from urllib.parse import urlparse
 import random
@@ -534,16 +535,17 @@ class AsyncWebCrawler:
                     "timing": time.perf_counter() - t1
                 }
             )
-        
-
-                
 
         screenshot = None if not screenshot else screenshot
         
+        
+        if kwargs.get("prettiify", False):
+            cleaned_html = fast_format_html(cleaned_html)
+        
         return CrawlResult(
             url=url,
             html=html,
-            cleaned_html=format_html(cleaned_html),
+            cleaned_html=cleaned_html,
             markdown_v2=markdown_v2,
             markdown=markdown,
             fit_markdown=fit_markdown,
diff --git a/crawl4ai/content_scraping_strategy.py b/crawl4ai/content_scraping_strategy.py
index ea6a2ef8..ec6c3361 100644
--- a/crawl4ai/content_scraping_strategy.py
+++ b/crawl4ai/content_scraping_strategy.py
@@ -10,7 +10,7 @@ from urllib.parse import urljoin
 from requests.exceptions import InvalidSchema
 # from .content_cleaning_strategy import ContentCleaningStrategy
 from .content_filter_strategy import RelevantContentFilter, BM25ContentFilter#, HeuristicContentFilter
-from .markdown_generation_strategy import MarkdownGenerationStrategy, DefaultMarkdownGenerationStrategy
+from .markdown_generation_strategy import MarkdownGenerationStrategy, DefaultMarkdownGenerator
 from .models import MarkdownGenerationResult
 from .utils import (
     sanitize_input_encode,
@@ -105,21 +105,28 @@ class WebScrapingStrategy(ContentScrapingStrategy):
         Returns:
             Dict containing markdown content in various formats
         """
-        markdown_generator: Optional[MarkdownGenerationStrategy] = kwargs.get('markdown_generator', DefaultMarkdownGenerationStrategy())
+        markdown_generator: Optional[MarkdownGenerationStrategy] = kwargs.get('markdown_generator', DefaultMarkdownGenerator())
         
         if markdown_generator:
             try:
+                if kwargs.get('fit_markdown', False) and not markdown_generator.content_filter:
+                        markdown_generator.content_filter = BM25ContentFilter(
+                            user_query=kwargs.get('fit_markdown_user_query', None),
+                            bm25_threshold=kwargs.get('fit_markdown_bm25_threshold', 1.0)
+                        )
+                
                 markdown_result: MarkdownGenerationResult = markdown_generator.generate_markdown(
                     cleaned_html=cleaned_html,
                     base_url=url,
-                    html2text_options=kwargs.get('html2text', {}),
-                    content_filter=kwargs.get('content_filter', None)
+                    html2text_options=kwargs.get('html2text', {})
                 )
                 
+                help_message = """"""
+                
                 return {
                     'markdown': markdown_result.raw_markdown,  
-                    'fit_markdown': markdown_result.fit_markdown or "Set flag 'fit_markdown' to True to get cleaned HTML content.",
-                    'fit_html': markdown_result.fit_html or "Set flag 'fit_markdown' to True to get cleaned HTML content.",
+                    'fit_markdown': markdown_result.fit_markdown,
+                    'fit_html': markdown_result.fit_html, 
                     'markdown_v2': markdown_result
                 }
             except Exception as e:
diff --git a/crawl4ai/markdown_generation_strategy.py b/crawl4ai/markdown_generation_strategy.py
index 7922c413..b1e43f9d 100644
--- a/crawl4ai/markdown_generation_strategy.py
+++ b/crawl4ai/markdown_generation_strategy.py
@@ -11,6 +11,8 @@ LINK_PATTERN = re.compile(r'!?\[([^\]]+)\]\(([^)]+?)(?:\s+"([^"]*)")?\)')
 
 class MarkdownGenerationStrategy(ABC):
     """Abstract base class for markdown generation strategies."""
+    def __init__(self, content_filter: Optional[RelevantContentFilter] = None):
+        self.content_filter = content_filter
     
     @abstractmethod
     def generate_markdown(self, 
@@ -23,8 +25,10 @@ class MarkdownGenerationStrategy(ABC):
         """Generate markdown from cleaned HTML."""
         pass
 
-class DefaultMarkdownGenerationStrategy(MarkdownGenerationStrategy):
+class DefaultMarkdownGenerator(MarkdownGenerationStrategy):
     """Default implementation of markdown generation strategy."""
+    def __init__(self, content_filter: Optional[RelevantContentFilter] = None):
+        super().__init__(content_filter)
     
     def convert_links_to_citations(self, markdown: str, base_url: str = "") -> Tuple[str, str]:
         link_map = {}
@@ -84,14 +88,18 @@ class DefaultMarkdownGenerationStrategy(MarkdownGenerationStrategy):
         raw_markdown = raw_markdown.replace('    ```', '```')
 
         # Convert links to citations
+        markdown_with_citations: str = ""
+        references_markdown: str = ""
         if citations:
             markdown_with_citations, references_markdown = self.convert_links_to_citations(
                 raw_markdown, base_url
             )
 
         # Generate fit markdown if content filter is provided
-        fit_markdown: Optional[str] = None
-        if content_filter:
+        fit_markdown: Optional[str] = ""
+        filtered_html: Optional[str] = ""
+        if content_filter or self.content_filter:
+            content_filter = content_filter or self.content_filter
             filtered_html = content_filter.filter_content(cleaned_html)
             filtered_html = '\n'.join('<div>{}</div>'.format(s) for s in filtered_html)
             fit_markdown = h.handle(filtered_html)
diff --git a/crawl4ai/utils.py b/crawl4ai/utils.py
index b07562df..aaf27e91 100644
--- a/crawl4ai/utils.py
+++ b/crawl4ai/utils.py
@@ -233,12 +233,17 @@ def sanitize_html(html):
 def sanitize_input_encode(text: str) -> str:
     """Sanitize input to handle potential encoding issues."""
     try:
-        # Attempt to encode and decode as UTF-8 to handle potential encoding issues
-        return text.encode('utf-8', errors='ignore').decode('utf-8')
-    except UnicodeEncodeError as e:
-        print(f"Warning: Encoding issue detected. Some characters may be lost. Error: {e}")
-        # Fall back to ASCII if UTF-8 fails
-        return text.encode('ascii', errors='ignore').decode('ascii')
+        try:
+            if not text:
+                return ''
+            # Attempt to encode and decode as UTF-8 to handle potential encoding issues
+            return text.encode('utf-8', errors='ignore').decode('utf-8')
+        except UnicodeEncodeError as e:
+            print(f"Warning: Encoding issue detected. Some characters may be lost. Error: {e}")
+            # Fall back to ASCII if UTF-8 fails
+            return text.encode('ascii', errors='ignore').decode('ascii')
+    except Exception as e:
+        raise ValueError(f"Error sanitizing input: {str(e)}") from e
 
 def escape_json_string(s):
     """
@@ -1079,9 +1084,54 @@ def wrap_text(draw, text, font, max_width):
     return '\n'.join(lines)
 
 def format_html(html_string):
-    soup = BeautifulSoup(html_string, 'html.parser')
+    soup = BeautifulSoup(html_string, 'lxml')  # bs4 registers this parser as 'lxml'; 'lxml.parser' raises FeatureNotFound
     return soup.prettify()
 
+def fast_format_html(html_string):
+    """
+    Re-indent HTML using plain string operations instead of a parser.
+
+    Best-effort: a '<' or '>' inside attribute values, scripts or
+    comments is still treated as a tag boundary.
+
+    Args:
+        html_string (str): The HTML string to format
+
+    Returns:
+        str: The formatted HTML string
+    """
+    indent = 0
+    indent_str = "  "  # Two spaces for indentation
+    formatted = []
+    # Void elements never get a closing tag, so they must not open a level
+    void_tags = ('area', 'base', 'br', 'col', 'embed', 'hr', 'img', 'input',
+                 'link', 'meta', 'source', 'track', 'wbr')
+
+    # Put every tag on its own line, then walk the pieces in order
+    parts = html_string.replace('>', '>\n').replace('<', '\n<').split('\n')
+
+    for part in parts:
+        part = part.strip()
+        if not part:
+            continue
+
+        if part.startswith('</'):
+            # Clamp at zero so a stray closing tag cannot skew later lines
+            indent = max(indent - 1, 0)
+            formatted.append(indent_str * indent + part)
+            continue
+
+        # Text and every other kind of tag are emitted at the current depth
+        formatted.append(indent_str * indent + part)
+
+        # Only a real opening tag (not <!...>, <?...?>, <x/> or void) nests
+        if part.startswith('<') and not part.startswith(('<!', '<?')) and not part.endswith('/>'):
+            name = part[1:].rstrip('>').split(None, 1)
+            if not name or name[0].lower() not in void_tags:
+                indent += 1
+
+    return '\n'.join(formatted)
+
 def normalize_url(href, base_url):
     """Normalize URLs to ensure consistent format"""
     from urllib.parse import urljoin, urlparse
diff --git a/docs/md_v2/advanced/hooks-auth.md b/docs/md_v2/advanced/hooks-auth.md
index e4b7d7ce..8da3a1cc 100644
--- a/docs/md_v2/advanced/hooks-auth.md
+++ b/docs/md_v2/advanced/hooks-auth.md
@@ -18,7 +18,7 @@ Let's see how we can customize the AsyncWebCrawler using hooks! In this example,
 import asyncio
 from crawl4ai import AsyncWebCrawler
 from crawl4ai.async_crawler_strategy import AsyncPlaywrightCrawlerStrategy
-from playwright.async_api import Page, Browser
+from playwright.async_api import Page, Browser, BrowserContext
 
 async def on_browser_created(browser: Browser):
     print("[HOOK] on_browser_created")
@@ -71,7 +71,11 @@ from crawl4ai.async_crawler_strategy import AsyncPlaywrightCrawlerStrategy
 async def main():
     print("\n🔗 Using Crawler Hooks: Let's see how we can customize the AsyncWebCrawler using hooks!")
     
-    crawler_strategy = AsyncPlaywrightCrawlerStrategy(verbose=True)
+    initial_cookies = [
+        {"name": "sessionId", "value": "abc123", "domain": ".example.com"},
+        {"name": "userId", "value": "12345", "domain": ".example.com"}
+    ]
+    crawler_strategy = AsyncPlaywrightCrawlerStrategy(verbose=True, cookies=initial_cookies)
     crawler_strategy.set_hook('on_browser_created', on_browser_created)
     crawler_strategy.set_hook('before_goto', before_goto)
     crawler_strategy.set_hook('after_goto', after_goto)
diff --git a/tests/async/test_markdown_genertor.py b/tests/async/test_markdown_genertor.py
index 025a0318..2b1102ab 100644
--- a/tests/async/test_markdown_genertor.py
+++ b/tests/async/test_markdown_genertor.py
@@ -11,7 +11,7 @@ import asyncio
 import os
 import time
 from typing import Dict, Any
-from crawl4ai.markdown_generation_strategy import DefaultMarkdownGenerationStrategy
+from crawl4ai.markdown_generation_strategy import DefaultMarkdownGenerator
 
 # Get current directory
 __location__ = os.path.realpath(os.path.join(os.getcwd(), os.path.dirname(__file__)))
@@ -41,7 +41,7 @@ def test_basic_markdown_conversion():
     with open(__location__ + "/data/wikipedia.html", "r") as f:
         cleaned_html = f.read()
 
-    generator = DefaultMarkdownGenerationStrategy()
+    generator = DefaultMarkdownGenerator()
     
     start_time = time.perf_counter()
     result = generator.generate_markdown(
@@ -70,7 +70,7 @@ def test_relative_links():
     Also an [image](/images/test.png) and another [page](/wiki/Banana).
     """
     
-    generator = DefaultMarkdownGenerationStrategy()
+    generator = DefaultMarkdownGenerator()
     result = generator.generate_markdown(
         cleaned_html=markdown,
         base_url="https://en.wikipedia.org"
@@ -86,7 +86,7 @@ def test_duplicate_links():
     Here's a [link](/test) and another [link](/test) and a [different link](/other).
     """
     
-    generator = DefaultMarkdownGenerationStrategy()
+    generator = DefaultMarkdownGenerator()
     result = generator.generate_markdown(
         cleaned_html=markdown,
         base_url="https://example.com"
@@ -102,7 +102,7 @@ def test_link_descriptions():
     Here's a [link with title](/test "Test Title") and a [link with description](/other) to test.
     """
     
-    generator = DefaultMarkdownGenerationStrategy()
+    generator = DefaultMarkdownGenerator()
     result = generator.generate_markdown(
         cleaned_html=markdown,
         base_url="https://example.com"
@@ -120,7 +120,7 @@ def test_performance_large_document():
     iterations = 5
     times = []
     
-    generator = DefaultMarkdownGenerationStrategy()
+    generator = DefaultMarkdownGenerator()
     
     for i in range(iterations):
         start_time = time.perf_counter()
@@ -144,7 +144,7 @@ def test_image_links():
     And a regular [link](/page).
     """
     
-    generator = DefaultMarkdownGenerationStrategy()
+    generator = DefaultMarkdownGenerator()
     result = generator.generate_markdown(
         cleaned_html=markdown,
         base_url="https://example.com"

From 3ff0b0b2c472f6adfd864f580a5a73de65505e5b Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Thu, 28 Nov 2024 12:48:07 +0800
Subject: [PATCH 075/115] feat: update changelog for version 0.3.743 with new
 features, improvements, and contributor acknowledgments

---
 CHANGELOG.md | 48 ++++++++++++++++++++++++++++++++++++++++++++++++
 1 file changed, 48 insertions(+)

diff --git a/CHANGELOG.md b/CHANGELOG.md
index 8e5cc91a..5ec79639 100644
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -1,5 +1,53 @@
 # Changelog
 
+## [0.3.743] November 27, 2024
+
+Enhance features and documentation
+- Updated version to 0.3.743
+- Improved ManagedBrowser configuration with dynamic host/port
+- Implemented fast HTML formatting in web crawler
+- Enhanced markdown generation with a new generator class
+- Improved sanitization and utility functions
+- Added contributor details and pull request acknowledgments
+- Updated documentation for clearer usage scenarios
+- Adjusted tests to reflect class name changes
+
+### CONTRIBUTORS.md
+Added new contributors and pull request details.
+Updated community contributions and acknowledged pull requests.
+
+### crawl4ai/__version__.py
+Version update.
+Bumped version to 0.3.743.
+
+### crawl4ai/async_crawler_strategy.py
+Improved ManagedBrowser configuration.
+Enhanced browser initialization with configurable host and debugging port; improved hook execution.
+
+### crawl4ai/async_webcrawler.py
+Optimized HTML processing.
+Implemented 'fast_format_html' for optimized HTML formatting; applied it when 'prettiify' is enabled.
+
+### crawl4ai/content_scraping_strategy.py
+Enhanced markdown generation strategy.
+Updated to use DefaultMarkdownGenerator and improved markdown generation with filters option.
+
+### crawl4ai/markdown_generation_strategy.py
+Refactored markdown generation class.
+Renamed DefaultMarkdownGenerationStrategy to DefaultMarkdownGenerator; added content filter handling.
+
+### crawl4ai/utils.py
+Enhanced utility functions.
+Improved input sanitization and enhanced HTML formatting method.
+
+### docs/md_v2/advanced/hooks-auth.md
+Improved documentation for hooks.
+Updated code examples to include cookies in crawler strategy initialization.
+
+### tests/async/test_markdown_genertor.py
+Refactored tests to match class renaming.
+Updated tests to use renamed DefaultMarkdownGenerator class.
+
 ## [0.3.74] November 17, 2024
 
 This changelog details the updates and changes introduced in Crawl4AI version 0.3.74. It's designed to inform developers about new features, modifications to existing components, removals, and other important information.

From c2d47848102138e226ab06a4e2c40c80aef2a2cd Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Thu, 28 Nov 2024 12:56:31 +0800
Subject: [PATCH 076/115] fix: resolve merge conflict in
 DefaultMarkdownGenerator affecting fit_markdown generation

---
 crawl4ai/markdown_generation_strategy.py | 3 ---
 1 file changed, 3 deletions(-)

diff --git a/crawl4ai/markdown_generation_strategy.py b/crawl4ai/markdown_generation_strategy.py
index 377f6c84..f242054d 100644
--- a/crawl4ai/markdown_generation_strategy.py
+++ b/crawl4ai/markdown_generation_strategy.py
@@ -96,7 +96,6 @@ class DefaultMarkdownGenerator(MarkdownGenerationStrategy):
             )
 
         # Generate fit markdown if content filter is provided
-<<<<<<< HEAD
         fit_markdown: Optional[str] = ""
         filtered_html: Optional[str] = ""
         if content_filter or self.content_filter:
@@ -104,8 +103,6 @@ class DefaultMarkdownGenerator(MarkdownGenerationStrategy):
             filtered_html = content_filter.filter_content(cleaned_html)
             filtered_html = '\n'.join('<div>{}</div>'.format(s) for s in filtered_html)
             fit_markdown = h.handle(filtered_html)
->>>>>>> origin/main
-            fit_markdown = h.handle(filtered_html)
 
         return MarkdownGenerationResult(
             raw_markdown=raw_markdown,

From e4acd18429cf93ae7cd454c6b433fad703dee21c Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Thu, 28 Nov 2024 13:06:30 +0800
Subject: [PATCH 077/115] docs: update README for version 0.3.743 with new
 features, enhancements, and contributor acknowledgments

---
 README.md | 125 +++++++++++++++++++++++++++++++++++++-----------------
 1 file changed, 87 insertions(+), 38 deletions(-)

diff --git a/README.md b/README.md
index 5ba33dea..16d154b5 100644
--- a/README.md
+++ b/README.md
@@ -11,20 +11,15 @@
 
 Crawl4AI simplifies asynchronous web crawling and data extraction, making it accessible for large language models (LLMs) and AI applications. 🆓🌐
 
-## New in 0.3.74 ✨
+## New in 0.3.743 ✨  
 
-- 🚀 **Blazing Fast Scraping**: Significantly improved scraping speed.  
-- 📥 **Download Manager**: Integrated file crawling, downloading, and tracking within `CrawlResult`.  
-- 📝 **Markdown Strategy**: Flexible system for custom markdown generation and formats.  
-- 🔗 **LLM-Friendly Citations**: Auto-converts links to numbered citations with reference lists.  
-- 🔎 **Markdown Filter**: BM25-based content extraction for cleaner, relevant markdown.  
-- 🖼️ **Image Extraction**: Supports `srcset`, `picture`, and responsive image formats.  
-- 🗂️ **Local/Raw HTML**: Crawl `file://` paths and raw HTML (`raw:`) directly.  
-- 🤖 **Browser Control**: Custom browser setups with stealth integration to bypass bots.  
-- ☁️ **API & Cache Boost**: CORS, static serving, and enhanced filesystem-based caching.  
-- 🐳 **API Gateway**: Run as an API service with secure token authentication.  
-- 🛠️ **Database Upgrades**: Optimized for larger content sets with faster caching.  
-- 🐛 **Bug Fixes**: Resolved browser context issues, memory leaks, and improved error handling.
+🚀 **Improved ManagedBrowser Configuration**: Dynamic host and port support for more flexible browser management.  
+📝 **Enhanced Markdown Generation**: New generator class for better formatting and customization.  
+⚡ **Fast HTML Formatting**: Significantly optimized HTML formatting in the web crawler.  
+🛠️ **Utility & Sanitization Upgrades**: Improved sanitization and expanded utility functions for streamlined workflows.  
+👥 **Acknowledgments**: Added contributor details and pull request acknowledgments for better transparency.  
+📖 **Documentation Updates**: Clearer usage scenarios and updated guidance for better user onboarding.  
+🧪 **Test Adjustments**: Refined tests to align with recent class name changes.  
 
 
 ## Try it Now!
@@ -35,31 +30,85 @@ Crawl4AI simplifies asynchronous web crawling and data extraction, making it acc
 
 ## Features ✨
 
-- 🆓 Completely free and open-source
-- 🚀 Blazing fast performance, outperforming many paid services
-- 🤖 LLM-friendly output formats (JSON, cleaned HTML, markdown)
-- 🌐 Multi-browser support (Chromium, Firefox, WebKit)
-- 🌍 Supports crawling multiple URLs simultaneously
-- 🎨 Extracts and returns all media tags (Images, Audio, and Video)
-- 🔗 Extracts all external and internal links
-- 📚 Extracts metadata from the page
-- 🔄 Custom hooks for authentication, headers, and page modifications
-- 🕵️ User-agent customization
-- 🖼️ Takes screenshots of pages with enhanced error handling
-- 📜 Executes multiple custom JavaScripts before crawling
-- 📊 Generates structured output without LLM using JsonCssExtractionStrategy
-- 📚 Various chunking strategies: topic-based, regex, sentence, and more
-- 🧠 Advanced extraction strategies: cosine clustering, LLM, and more
-- 🎯 CSS selector support for precise data extraction
-- 📝 Passes instructions/keywords to refine extraction
-- 🔒 Proxy support with authentication for enhanced access
-- 🔄 Session management for complex multi-page crawling
-- 🌐 Asynchronous architecture for improved performance
-- 🖼️ Improved image processing with lazy-loading detection
-- 🕰️ Enhanced handling of delayed content loading
-- 🔑 Custom headers support for LLM interactions
-- 🖼️ iframe content extraction for comprehensive analysis
-- ⏱️ Flexible timeout and delayed content retrieval options
+<details open>
+<summary>🚀 <strong>Performance & Scalability</strong></summary>
+
+- ⚡ **Blazing Fast Scraping**: Outperforms many paid services with cutting-edge optimization.
+- 🔄 **Asynchronous Architecture**: Enhanced performance for complex multi-page crawling.
+- ⚡ **Dynamic HTML Formatting**: New, fast HTML formatting for streamlined workflows.
+- 🗂️ **Large Dataset Optimization**: Improved caching for handling massive content sets.
+
+</details>
+
+<details>
+<summary>🔎 <strong>Extraction Capabilities</strong></summary>
+
+- 🖼️ **Comprehensive Media Support**: Extracts images, audio, video, and responsive image formats like `srcset` and `picture`.
+- 📚 **Advanced Content Chunking**: Topic-based, regex, sentence-level, and cosine clustering strategies.
+- 🎯 **Precise Data Extraction**: Supports CSS selectors and keyword-based refinements.
+- 🔗 **All-Inclusive Link Crawling**: Extracts internal and external links.
+- 📝 **Markdown Generation**: Enhanced markdown generator class for custom, clean, LLM-friendly outputs.
+- 🏷️ **Metadata Extraction**: Fetches metadata directly from pages.
+
+</details>
+
+<details>
+<summary>🌐 <strong>Browser Integration</strong></summary>
+
+- 🌍 **Multi-Browser Support**: Works with Chromium, Firefox, and WebKit.
+- 🖥️ **ManagedBrowser with Dynamic Config**: Flexible host/port control for tailored setups.
+- ⚙️ **Custom Browser Hooks**: Authentication, headers, and page modifications.
+- 🕶️ **Stealth Mode**: Bypasses bot detection with advanced techniques.
+- 📸 **Screenshots & JavaScript Execution**: Takes screenshots and executes custom JavaScript before crawling.
+
+</details>
+
+<details>
+<summary>📁 <strong>Input/Output Flexibility</strong></summary>
+
+- 📂 **Local & Raw HTML Crawling**: Directly processes `file://` paths and raw HTML.
+- 🌐 **Custom Headers for LLM**: Tailored headers for enhanced AI interactions.
+- 🛠️ **Structured Output Options**: Supports JSON, cleaned HTML, and markdown outputs.
+
+</details>
+
+<details>
+<summary>🔧 <strong>Utility & Debugging</strong></summary>
+
+- 🛡️ **Error Handling**: Robust error management for seamless execution.
+- 🔐 **Session Management**: Handles complex, multi-page interactions.
+- 🧹 **Utility Functions**: Enhanced sanitization and flexible extraction helpers.
+- 🕰️ **Delayed Content Loading**: Improved handling of lazy-loading and dynamic content.
+
+</details>
+
+<details>
+<summary>🔐 <strong>Security & Accessibility</strong></summary>
+
+- 🕵️ **Proxy Support**: Enables authenticated access for restricted pages.
+- 🚪 **API Gateway**: Deploy as an API service with secure token authentication.
+- 🌐 **CORS & Static Serving**: Enhanced support for filesystem-based caching and cross-origin requests.
+
+</details>
+
+<details>
+<summary>🌟 <strong>Community & Documentation</strong></summary>
+
+- 🙌 **Contributor Acknowledgments**: Recognition for pull requests and contributions.
+- 📖 **Clear Documentation**: Simplified and updated for better onboarding and usage.
+
+</details>
+
+<details>
+<summary>🎯 <strong>Cutting-Edge Features</strong></summary>
+
+- 🛠️ **BM25-Based Markdown Filtering**: Extracts cleaner, context-relevant markdown.
+- 📚 **LLM-Friendly Citations**: Auto-converts links to numbered citations with reference lists.
+- 📡 **IFrame Content Extraction**: Comprehensive analysis for embedded content.
+- 🕰️ **Flexible Content Retrieval**: Combines timing-based strategies for reliable extractions.
+
+</details>
+
 
 ## Installation 🛠️
 

From ce7d49484fc097a834d1eac883ecce6f444ceb1e Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Thu, 28 Nov 2024 13:06:46 +0800
Subject: [PATCH 078/115] docs: update README for version 0.3.743 with new
 features, enhancements, and contributor acknowledgments

---
 README.md | 125 +++++++++++++++++++++++++++++++++++++-----------------
 1 file changed, 87 insertions(+), 38 deletions(-)

diff --git a/README.md b/README.md
index 5ba33dea..16d154b5 100644
--- a/README.md
+++ b/README.md
@@ -11,20 +11,15 @@
 
 Crawl4AI simplifies asynchronous web crawling and data extraction, making it accessible for large language models (LLMs) and AI applications. 🆓🌐
 
-## New in 0.3.74 ✨
+## New in 0.3.743 ✨  
 
-- 🚀 **Blazing Fast Scraping**: Significantly improved scraping speed.  
-- 📥 **Download Manager**: Integrated file crawling, downloading, and tracking within `CrawlResult`.  
-- 📝 **Markdown Strategy**: Flexible system for custom markdown generation and formats.  
-- 🔗 **LLM-Friendly Citations**: Auto-converts links to numbered citations with reference lists.  
-- 🔎 **Markdown Filter**: BM25-based content extraction for cleaner, relevant markdown.  
-- 🖼️ **Image Extraction**: Supports `srcset`, `picture`, and responsive image formats.  
-- 🗂️ **Local/Raw HTML**: Crawl `file://` paths and raw HTML (`raw:`) directly.  
-- 🤖 **Browser Control**: Custom browser setups with stealth integration to bypass bots.  
-- ☁️ **API & Cache Boost**: CORS, static serving, and enhanced filesystem-based caching.  
-- 🐳 **API Gateway**: Run as an API service with secure token authentication.  
-- 🛠️ **Database Upgrades**: Optimized for larger content sets with faster caching.  
-- 🐛 **Bug Fixes**: Resolved browser context issues, memory leaks, and improved error handling.
+🚀 **Improved ManagedBrowser Configuration**: Dynamic host and port support for more flexible browser management.  
+📝 **Enhanced Markdown Generation**: New generator class for better formatting and customization.  
+⚡ **Fast HTML Formatting**: Significantly optimized HTML formatting in the web crawler.  
+🛠️ **Utility & Sanitization Upgrades**: Improved sanitization and expanded utility functions for streamlined workflows.  
+👥 **Acknowledgments**: Added contributor details and pull request acknowledgments for better transparency.  
+📖 **Documentation Updates**: Clearer usage scenarios and updated guidance for better user onboarding.  
+🧪 **Test Adjustments**: Refined tests to align with recent class name changes.  
 
 
 ## Try it Now!
@@ -35,31 +30,85 @@ Crawl4AI simplifies asynchronous web crawling and data extraction, making it acc
 
 ## Features ✨
 
-- 🆓 Completely free and open-source
-- 🚀 Blazing fast performance, outperforming many paid services
-- 🤖 LLM-friendly output formats (JSON, cleaned HTML, markdown)
-- 🌐 Multi-browser support (Chromium, Firefox, WebKit)
-- 🌍 Supports crawling multiple URLs simultaneously
-- 🎨 Extracts and returns all media tags (Images, Audio, and Video)
-- 🔗 Extracts all external and internal links
-- 📚 Extracts metadata from the page
-- 🔄 Custom hooks for authentication, headers, and page modifications
-- 🕵️ User-agent customization
-- 🖼️ Takes screenshots of pages with enhanced error handling
-- 📜 Executes multiple custom JavaScripts before crawling
-- 📊 Generates structured output without LLM using JsonCssExtractionStrategy
-- 📚 Various chunking strategies: topic-based, regex, sentence, and more
-- 🧠 Advanced extraction strategies: cosine clustering, LLM, and more
-- 🎯 CSS selector support for precise data extraction
-- 📝 Passes instructions/keywords to refine extraction
-- 🔒 Proxy support with authentication for enhanced access
-- 🔄 Session management for complex multi-page crawling
-- 🌐 Asynchronous architecture for improved performance
-- 🖼️ Improved image processing with lazy-loading detection
-- 🕰️ Enhanced handling of delayed content loading
-- 🔑 Custom headers support for LLM interactions
-- 🖼️ iframe content extraction for comprehensive analysis
-- ⏱️ Flexible timeout and delayed content retrieval options
+<details open>
+<summary>🚀 <strong>Performance & Scalability</strong></summary>
+
+- ⚡ **Blazing Fast Scraping**: Outperforms many paid services with cutting-edge optimization.
+- 🔄 **Asynchronous Architecture**: Enhanced performance for complex multi-page crawling.
+- ⚡ **Dynamic HTML Formatting**: New, fast HTML formatting for streamlined workflows.
+- 🗂️ **Large Dataset Optimization**: Improved caching for handling massive content sets.
+
+</details>
+
+<details>
+<summary>🔎 <strong>Extraction Capabilities</strong></summary>
+
+- 🖼️ **Comprehensive Media Support**: Extracts images, audio, video, and responsive image formats like `srcset` and `picture`.
+- 📚 **Advanced Content Chunking**: Topic-based, regex, sentence-level, and cosine clustering strategies.
+- 🎯 **Precise Data Extraction**: Supports CSS selectors and keyword-based refinements.
+- 🔗 **All-Inclusive Link Crawling**: Extracts internal and external links.
+- 📝 **Markdown Generation**: Enhanced markdown generator class for custom, clean, LLM-friendly outputs.
+- 🏷️ **Metadata Extraction**: Fetches metadata directly from pages.
+
+</details>
+
+<details>
+<summary>🌐 <strong>Browser Integration</strong></summary>
+
+- 🌍 **Multi-Browser Support**: Works with Chromium, Firefox, and WebKit.
+- 🖥️ **ManagedBrowser with Dynamic Config**: Flexible host/port control for tailored setups.
+- ⚙️ **Custom Browser Hooks**: Authentication, headers, and page modifications.
+- 🕶️ **Stealth Mode**: Bypasses bot detection with advanced techniques.
+- 📸 **Screenshots & JavaScript Execution**: Takes screenshots and executes custom JavaScript before crawling.
+
+</details>
+
+<details>
+<summary>📁 <strong>Input/Output Flexibility</strong></summary>
+
+- 📂 **Local & Raw HTML Crawling**: Directly processes `file://` paths and raw HTML.
+- 🌐 **Custom Headers for LLM**: Tailored headers for enhanced AI interactions.
+- 🛠️ **Structured Output Options**: Supports JSON, cleaned HTML, and markdown outputs.
+
+</details>
+
+<details>
+<summary>🔧 <strong>Utility & Debugging</strong></summary>
+
+- 🛡️ **Error Handling**: Robust error management for seamless execution.
+- 🔐 **Session Management**: Handles complex, multi-page interactions.
+- 🧹 **Utility Functions**: Enhanced sanitization and flexible extraction helpers.
+- 🕰️ **Delayed Content Loading**: Improved handling of lazy-loading and dynamic content.
+
+</details>
+
+<details>
+<summary>🔐 <strong>Security & Accessibility</strong></summary>
+
+- 🕵️ **Proxy Support**: Enables authenticated access for restricted pages.
+- 🚪 **API Gateway**: Deploy as an API service with secure token authentication.
+- 🌐 **CORS & Static Serving**: Enhanced support for filesystem-based caching and cross-origin requests.
+
+</details>
+
+<details>
+<summary>🌟 <strong>Community & Documentation</strong></summary>
+
+- 🙌 **Contributor Acknowledgments**: Recognition for pull requests and contributions.
+- 📖 **Clear Documentation**: Simplified and updated for better onboarding and usage.
+
+</details>
+
+<details>
+<summary>🎯 <strong>Cutting-Edge Features</strong></summary>
+
+- 🛠️ **BM25-Based Markdown Filtering**: Extracts cleaner, context-relevant markdown.
+- 📚 **LLM-Friendly Citations**: Auto-converts links to numbered citations with reference lists.
+- 📡 **IFrame Content Extraction**: Comprehensive analysis for embedded content.
+- 🕰️ **Flexible Content Retrieval**: Combines timing-based strategies for reliable extractions.
+
+</details>
+
 
 ## Installation 🛠️
 

From d556dada9fb4003b42cf7d619ff44feef478cf2c Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Thu, 28 Nov 2024 13:07:33 +0800
Subject: [PATCH 079/115] docs: update README to keep details open for
 extraction capabilities, browser integration, input/output flexibility,
 utility & debugging, security & accessibility, community & documentation, and
 cutting-edge features

---
 README.md | 14 +++++++-------
 1 file changed, 7 insertions(+), 7 deletions(-)

diff --git a/README.md b/README.md
index 16d154b5..cd643211 100644
--- a/README.md
+++ b/README.md
@@ -40,7 +40,7 @@ Crawl4AI simplifies asynchronous web crawling and data extraction, making it acc
 
 </details>
 
-<details>
+<details open>
 <summary>🔎 <strong>Extraction Capabilities</strong></summary>
 
 - 🖼️ **Comprehensive Media Support**: Extracts images, audio, video, and responsive image formats like `srcset` and `picture`.
@@ -52,7 +52,7 @@ Crawl4AI simplifies asynchronous web crawling and data extraction, making it acc
 
 </details>
 
-<details>
+<details open>
 <summary>🌐 <strong>Browser Integration</strong></summary>
 
 - 🌍 **Multi-Browser Support**: Works with Chromium, Firefox, and WebKit.
@@ -63,7 +63,7 @@ Crawl4AI simplifies asynchronous web crawling and data extraction, making it acc
 
 </details>
 
-<details>
+<details open>
 <summary>📁 <strong>Input/Output Flexibility</strong></summary>
 
 - 📂 **Local & Raw HTML Crawling**: Directly processes `file://` paths and raw HTML.
@@ -72,7 +72,7 @@ Crawl4AI simplifies asynchronous web crawling and data extraction, making it acc
 
 </details>
 
-<details>
+<details open>
 <summary>🔧 <strong>Utility & Debugging</strong></summary>
 
 - 🛡️ **Error Handling**: Robust error management for seamless execution.
@@ -82,7 +82,7 @@ Crawl4AI simplifies asynchronous web crawling and data extraction, making it acc
 
 </details>
 
-<details>
+<details open>
 <summary>🔐 <strong>Security & Accessibility</strong></summary>
 
 - 🕵️ **Proxy Support**: Enables authenticated access for restricted pages.
@@ -91,7 +91,7 @@ Crawl4AI simplifies asynchronous web crawling and data extraction, making it acc
 
 </details>
 
-<details>
+<details open>
 <summary>🌟 <strong>Community & Documentation</strong></summary>
 
 - 🙌 **Contributor Acknowledgments**: Recognition for pull requests and contributions.
@@ -99,7 +99,7 @@ Crawl4AI simplifies asynchronous web crawling and data extraction, making it acc
 
 </details>
 
-<details>
+<details open>
 <summary>🎯 <strong>Cutting-Edge Features</strong></summary>
 
 - 🛠️ **BM25-Based Markdown Filtering**: Extracts cleaner, context-relevant markdown.

From 3abb573142d5588a1fc5790e2731ca8641ca4a95 Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Thu, 28 Nov 2024 13:07:59 +0800
Subject: [PATCH 080/115] docs: update README for version 0.3.743 with improved
 formatting and contributor acknowledgments

---
 README.md | 12 +++++-------
 1 file changed, 5 insertions(+), 7 deletions(-)

diff --git a/README.md b/README.md
index cd643211..e02d7ef8 100644
--- a/README.md
+++ b/README.md
@@ -13,13 +13,11 @@ Crawl4AI simplifies asynchronous web crawling and data extraction, making it acc
 
 ## New in 0.3.743 ✨  
 
-🚀 **Improved ManagedBrowser Configuration**: Dynamic host and port support for more flexible browser management.  
-📝 **Enhanced Markdown Generation**: New generator class for better formatting and customization.  
-⚡ **Fast HTML Formatting**: Significantly optimized HTML formatting in the web crawler.  
-🛠️ **Utility & Sanitization Upgrades**: Improved sanitization and expanded utility functions for streamlined workflows.  
-👥 **Acknowledgments**: Added contributor details and pull request acknowledgments for better transparency.  
-📖 **Documentation Updates**: Clearer usage scenarios and updated guidance for better user onboarding.  
-🧪 **Test Adjustments**: Refined tests to align with recent class name changes.  
+- 🚀 **Improved ManagedBrowser Configuration**: Dynamic host and port support for more flexible browser management.  
+- 📝 **Enhanced Markdown Generation**: New generator class for better formatting and customization.  
+- ⚡ **Fast HTML Formatting**: Significantly optimized HTML formatting in the web crawler.  
+- 🛠️ **Utility & Sanitization Upgrades**: Improved sanitization and expanded utility functions for streamlined workflows.  
+- 👥 **Acknowledgments**: Added contributor details and pull request acknowledgments for better transparency.  
 
 
 ## Try it Now!

From d583aa43ca1404788838820ebfb90d2e8ee8680d Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Thu, 28 Nov 2024 15:53:25 +0800
Subject: [PATCH 081/115] refactor: update cache handling in quickstart_async
 example to use CacheMode enum

---
 README.md                         | 470 +++++++++++++++---------------
 docs/examples/quickstart_async.py |  95 +++---
 2 files changed, 296 insertions(+), 269 deletions(-)

diff --git a/README.md b/README.md
index e02d7ef8..5c50cdc5 100644
--- a/README.md
+++ b/README.md
@@ -29,94 +29,86 @@ Crawl4AI simplifies asynchronous web crawling and data extraction, making it acc
 ## Features ✨
 
 <details open>
-<summary>🚀 <strong>Performance & Scalability</strong></summary>
-
-- ⚡ **Blazing Fast Scraping**: Outperforms many paid services with cutting-edge optimization.
-- 🔄 **Asynchronous Architecture**: Enhanced performance for complex multi-page crawling.
-- ⚡ **Dynamic HTML Formatting**: New, fast HTML formatting for streamlined workflows.
-- 🗂️ **Large Dataset Optimization**: Improved caching for handling massive content sets.
+<summary>📝 <strong>Markdown Generation</strong></summary>
 
+- 🧹 **Clean Markdown**: Generates clean, structured Markdown with accurate formatting.
+- 🎯 **Fit Markdown**: Heuristic-based filtering to remove noise and irrelevant parts for AI-friendly processing.
+- 🔗 **Citations and References**: Converts page links into a numbered reference list with clean citations.
+- 🛠️ **Custom Strategies**: Users can create their own Markdown generation strategies tailored to specific needs.
+- 📚 **BM25 Algorithm**: Employs BM25-based filtering for extracting core information and removing irrelevant content. 
 </details>
 
 <details open>
-<summary>🔎 <strong>Extraction Capabilities</strong></summary>
+<summary>📊 <strong>Structured Data Extraction</strong></summary>
 
-- 🖼️ **Comprehensive Media Support**: Extracts images, audio, video, and responsive image formats like `srcset` and `picture`.
-- 📚 **Advanced Content Chunking**: Topic-based, regex, sentence-level, and cosine clustering strategies.
-- 🎯 **Precise Data Extraction**: Supports CSS selectors and keyword-based refinements.
-- 🔗 **All-Inclusive Link Crawling**: Extracts internal and external links.
-- 📝 **Markdown Generation**: Enhanced markdown generator class for custom, clean, LLM-friendly outputs.
-- 🏷️ **Metadata Extraction**: Fetches metadata directly from pages.
+- 🤖 **LLM-Driven Extraction**: Supports all LLMs (open-source and proprietary) for structured data extraction.
+- 🧱 **Chunking Strategies**: Implements chunking (topic-based, regex, sentence-level) for targeted content processing.
+- 🌌 **Cosine Similarity**: Find relevant content chunks based on user queries for semantic extraction.
+- 🔎 **CSS-Based Extraction**: Fast schema-based data extraction using XPath and CSS selectors.
+- 🔧 **Schema Definition**: Define custom schemas for extracting structured JSON from repetitive patterns.
 
 </details>
 
 <details open>
 <summary>🌐 <strong>Browser Integration</strong></summary>
 
-- 🌍 **Multi-Browser Support**: Works with Chromium, Firefox, and WebKit.
-- 🖥️ **ManagedBrowser with Dynamic Config**: Flexible host/port control for tailored setups.
-- ⚙️ **Custom Browser Hooks**: Authentication, headers, and page modifications.
-- 🕶️ **Stealth Mode**: Bypasses bot detection with advanced techniques.
-- 📸 **Screenshots & JavaScript Execution**: Takes screenshots and executes custom JavaScript before crawling.
+- 🖥️ **Managed Browser**: Use user-owned browsers with full control, avoiding bot detection.
+- 🔄 **Remote Browser Control**: Connect to Chrome Developer Tools Protocol for remote, large-scale data extraction.
+- 🔒 **Session Management**: Preserve browser states and reuse them for multi-step crawling.
+- 🧩 **Proxy Support**: Seamlessly connect to proxies with authentication for secure access.
+- ⚙️ **Full Browser Control**: Modify headers, cookies, user agents, and more for tailored crawling setups.
+- 🌍 **Multi-Browser Support**: Compatible with Chromium, Firefox, and WebKit.
 
 </details>
 
 <details open>
-<summary>📁 <strong>Input/Output Flexibility</strong></summary>
+<summary>🔎 <strong>Crawling & Scraping</strong></summary>
 
-- 📂 **Local & Raw HTML Crawling**: Directly processes `file://` paths and raw HTML.
-- 🌐 **Custom Headers for LLM**: Tailored headers for enhanced AI interactions.
-- 🛠️ **Structured Output Options**: Supports JSON, cleaned HTML, and markdown outputs.
+- 🖼️ **Media Support**: Extract images, audio, videos, and responsive image formats like `srcset` and `picture`.
+- 🚀 **Dynamic Crawling**: Execute JS and wait for async or sync conditions for dynamic content extraction.
+- 📸 **Screenshots**: Capture page screenshots during crawling for debugging or analysis.
+- 📂 **Raw Data Crawling**: Directly process raw HTML (`raw:`) or local files (`file://`).
+- 🔗 **Comprehensive Link Extraction**: Extracts internal and external links, as well as embedded iframe content.
+- 🛠️ **Customizable Hooks**: Define hooks at every step to customize crawling behavior.
+- 💾 **Caching**: Cache data for improved speed and to avoid redundant fetches.
+- 📄 **Metadata Extraction**: Retrieve structured metadata from web pages.
+- 📡 **IFrame Content Extraction**: Seamless extraction from embedded iframe content.
 
 </details>
 
 <details open>
-<summary>🔧 <strong>Utility & Debugging</strong></summary>
+<summary>🚀 <strong>Deployment</strong></summary>
 
+- 🐳 **Dockerized Setup**: Optimized Docker image with API server for easy deployment.
+- 🔄 **API Gateway**: One-click deployment with secure token authentication for API-based workflows.
+- 🌐 **Scalable Architecture**: Designed for mass-scale production and optimized server performance.
+- ⚙️ **DigitalOcean Deployment**: Ready-to-deploy configurations for DigitalOcean and similar platforms.
+
+</details>
+
+<details>
+<summary>🎯 <strong>Additional Features</strong></summary>
+
+- 🕶️ **Stealth Mode**: Avoid bot detection by mimicking real users.
+- 🏷️ **Tag-Based Content Extraction**: Refine crawling based on custom tags, headers, or metadata.
+- 🔗 **Link Analysis**: Extract and analyze all links for detailed data exploration.
 - 🛡️ **Error Handling**: Robust error management for seamless execution.
-- 🔐 **Session Management**: Handles complex, multi-page interactions.
-- 🧹 **Utility Functions**: Enhanced sanitization and flexible extraction helpers.
-- 🕰️ **Delayed Content Loading**: Improved handling of lazy-loading and dynamic content.
+- 🔐 **CORS & Static Serving**: Supports filesystem-based caching and cross-origin requests.
+- 📖 **Clear Documentation**: Simplified and updated guides for onboarding and advanced usage.
+- 🙌 **Community Recognition**: Acknowledges contributors and pull requests for transparency.
 
 </details>
 
-<details open>
-<summary>🔐 <strong>Security & Accessibility</strong></summary>
-
-- 🕵️ **Proxy Support**: Enables authenticated access for restricted pages.
-- 🚪 **API Gateway**: Deploy as an API service with secure token authentication.
-- 🌐 **CORS & Static Serving**: Enhanced support for filesystem-based caching and cross-origin requests.
-
-</details>
-
-<details open>
-<summary>🌟 <strong>Community & Documentation</strong></summary>
-
-- 🙌 **Contributor Acknowledgments**: Recognition for pull requests and contributions.
-- 📖 **Clear Documentation**: Simplified and updated for better onboarding and usage.
-
-</details>
-
-<details open>
-<summary>🎯 <strong>Cutting-Edge Features</strong></summary>
-
-- 🛠️ **BM25-Based Markdown Filtering**: Extracts cleaner, context-relevant markdown.
-- 📚 **LLM-Friendly Citations**: Auto-converts links to numbered citations with reference lists.
-- 📡 **IFrame Content Extraction**: Comprehensive analysis for embedded content.
-- 🕰️ **Flexible Content Retrieval**: Combines timing-based strategies for reliable extractions.
-
-</details>
-
-
 ## Installation 🛠️
 
 Crawl4AI offers flexible installation options to suit various use cases. You can install it as a Python package or use Docker.
 
-### Using pip 🐍
+<details open>
+<summary>🐍 <strong>Using pip</strong></summary>
 
 Choose the installation option that best fits your needs:
 
-#### Basic Installation
+### Basic Installation
 
 For basic web crawling and scraping tasks:
 
@@ -126,7 +118,7 @@ pip install crawl4ai
 
 By default, this will install the asynchronous version of Crawl4AI, using Playwright for web crawling.
 
-👉 Note: When you install Crawl4AI, the setup script should automatically install and set up Playwright. However, if you encounter any Playwright-related errors, you can manually install it using one of these methods:
+👉 **Note**: When you install Crawl4AI, the setup script should automatically install and set up Playwright. However, if you encounter any Playwright-related errors, you can manually install it using one of these methods:
 
 1. Through the command line:
 
@@ -142,15 +134,19 @@ By default, this will install the asynchronous version of Crawl4AI, using Playwr
 
 This second method has proven to be more reliable in some cases.
 
-#### Installation with Synchronous Version
+---
 
-If you need the synchronous version using Selenium:
+### Installation with Synchronous Version
+
+The sync version is deprecated and will be removed in future versions. If you need the synchronous version using Selenium:
 
 ```bash
 pip install crawl4ai[sync]
 ```
 
-#### Development Installation
+---
+
+### Development Installation
 
 For contributors who plan to modify the source code:
 
@@ -159,7 +155,9 @@ git clone https://github.com/unclecode/crawl4ai.git
 cd crawl4ai
 pip install -e .                    # Basic installation in editable mode
 ```
+
 Install optional features:
+
 ```bash
 pip install -e ".[torch]"           # With PyTorch features
 pip install -e ".[transformer]"     # With Transformer features
@@ -168,7 +166,10 @@ pip install -e ".[sync]"            # With synchronous crawling (Selenium)
 pip install -e ".[all]"             # Install all optional features
 ```
 
-## One-Click Deployment 🚀
+</details>
+
+<details open>
+<summary>🚀 <strong>One-Click Deployment</strong></summary>
 
 Deploy your own instance of Crawl4AI with one click:
 
@@ -179,14 +180,19 @@ Deploy your own instance of Crawl4AI with one click:
 The deploy will:
 - Set up a Docker container with Crawl4AI
 - Configure Playwright and all dependencies
-- Start the FastAPI server on port 11235
+- Start the FastAPI server on port `11235`
 - Set up health checks and auto-deployment
 
-### Using Docker 🐳
+</details>
+
+<details open>
+<summary>🐳 <strong>Using Docker</strong></summary>
 
 Crawl4AI is available as Docker images for easy deployment. You can either pull directly from Docker Hub (recommended) or build from the repository.
 
-#### Option 1: Docker Hub (Recommended)
+---
+
+### Option 1: Docker Hub (Recommended)
 
 ```bash
 # Pull and run from Docker Hub (choose one):
@@ -204,7 +210,9 @@ docker run --platform linux/arm64 -p 11235:11235 unclecode/crawl4ai:basic
 docker run --shm-size=2gb -p 11235:11235 unclecode/crawl4ai:basic
 ```
 
-#### Option 2: Build from Repository
+---
+
+### Option 2: Build from Repository
 
 ```bash
 # Clone the repository
@@ -226,7 +234,12 @@ docker build -t crawl4ai:local \
 docker run -p 11235:11235 crawl4ai:local
 ```
 
-Quick test (works for both options):
+---
+
+### Quick Test
+
+Run a quick test (works for both Docker options):
+
 ```python
 import requests
 
@@ -243,143 +256,149 @@ result = requests.get(f"http://localhost:11235/task/{task_id}")
 
 For advanced configuration, environment variables, and usage examples, see our [Docker Deployment Guide](https://crawl4ai.com/mkdocs/basic/docker-deployment/).
 
+</details>
+
 
 ## Quick Start 🚀
 
 ```python
 import asyncio
-from crawl4ai import AsyncWebCrawler
+from crawl4ai import AsyncWebCrawler, CacheMode
 
 async def main():
     async with AsyncWebCrawler(verbose=True) as crawler:
         result = await crawler.arun(url="https://www.nbcnews.com/business")
-        print(result.markdown)
+        print(result.markdown_v2.raw_markdown) # Soon will be changed to result.markdown
 
 if __name__ == "__main__":
     asyncio.run(main())
 ```
 
-## Advanced Usage 🔬
+## Advanced Usage Examples 🔬
 
-### Executing JavaScript and Using CSS Selectors
+You can check the project structure in the [docs/examples](docs/examples) directory. There you can find a variety of examples; some popular ones are shared here.
+
+<details open>
+<summary>🖥️ <strong>Heuristic Markdown Generation with Clean and Fit Markdown</strong></summary>
 
 ```python
 import asyncio
-from crawl4ai import AsyncWebCrawler
+from crawl4ai import AsyncWebCrawler, CacheMode
+from crawl4ai.content_filter_strategy import BM25ContentFilter
+from crawl4ai.markdown_generation_strategy import DefaultMarkdownGenerator
 
 async def main():
-    async with AsyncWebCrawler(verbose=True) as crawler:
-        js_code = ["const loadMoreButton = Array.from(document.querySelectorAll('button')).find(button => button.textContent.includes('Load More')); loadMoreButton && loadMoreButton.click();"]
+    async with AsyncWebCrawler(
+        headless=True,  
+        verbose=True,
+    ) as crawler:
         result = await crawler.arun(
-            url="https://www.nbcnews.com/business",
-            js_code=js_code,
-            css_selector=".wide-tease-item__description",
-            bypass_cache=True
+            url="https://docs.micronaut.io/4.7.6/guide/",
+            cache_mode=CacheMode.ENABLED,
+            markdown_generator=DefaultMarkdownGenerator(
+                content_filter=BM25ContentFilter(user_query=None, bm25_threshold=1.0)
+            ),
         )
-        print(result.extracted_content)
+        print(len(result.markdown))
+        print(len(result.fit_markdown))
+        print(len(result.markdown_v2.fit_markdown))
 
 if __name__ == "__main__":
     asyncio.run(main())
 ```
 
-### Using a Proxy
+</details>
+
+<details open>
+<summary>🖥️ <strong>Structured Data Extraction and Executing JavaScript</strong></summary>
 
 ```python
 import asyncio
-from crawl4ai import AsyncWebCrawler
-
-async def main():
-    async with AsyncWebCrawler(verbose=True, proxy="http://127.0.0.1:7890") as crawler:
-        result = await crawler.arun(
-            url="https://www.nbcnews.com/business",
-            bypass_cache=True
-        )
-        print(result.markdown)
-
-if __name__ == "__main__":
-    asyncio.run(main())
-```
-
-### Extracting Structured Data without LLM
-
-The `JsonCssExtractionStrategy` allows for precise extraction of structured data from web pages using CSS selectors.
-
-```python
-import asyncio
-import json
-from crawl4ai import AsyncWebCrawler
+from crawl4ai import AsyncWebCrawler, CacheMode
 from crawl4ai.extraction_strategy import JsonCssExtractionStrategy
+import json
 
-async def extract_news_teasers():
+async def main():
     schema = {
-        "name": "News Teaser Extractor",
-        "baseSelector": ".wide-tease-item__wrapper",
-        "fields": [
-            {
-                "name": "category",
-                "selector": ".unibrow span[data-testid='unibrow-text']",
-                "type": "text",
-            },
-            {
-                "name": "headline",
-                "selector": ".wide-tease-item__headline",
-                "type": "text",
-            },
-            {
-                "name": "summary",
-                "selector": ".wide-tease-item__description",
-                "type": "text",
-            },
-            {
-                "name": "time",
-                "selector": "[data-testid='wide-tease-date']",
-                "type": "text",
-            },
-            {
-                "name": "image",
-                "type": "nested",
-                "selector": "picture.teasePicture img",
-                "fields": [
-                    {"name": "src", "type": "attribute", "attribute": "src"},
-                    {"name": "alt", "type": "attribute", "attribute": "alt"},
-                ],
-            },
-            {
-                "name": "link",
-                "selector": "a[href]",
-                "type": "attribute",
-                "attribute": "href",
-            },
-        ],
-    }
+    "name": "KidoCode Courses",
+    "baseSelector": "section.charge-methodology .w-tab-content > div",
+    "fields": [
+        {
+            "name": "section_title",
+            "selector": "h3.heading-50",
+            "type": "text",
+        },
+        {
+            "name": "section_description",
+            "selector": ".charge-content",
+            "type": "text",
+        },
+        {
+            "name": "course_name",
+            "selector": ".text-block-93",
+            "type": "text",
+        },
+        {
+            "name": "course_description",
+            "selector": ".course-content-text",
+            "type": "text",
+        },
+        {
+            "name": "course_icon",
+            "selector": ".image-92",
+            "type": "attribute",
+            "attribute": "src"
+        }
+    ]
+}
 
     extraction_strategy = JsonCssExtractionStrategy(schema, verbose=True)
 
-    async with AsyncWebCrawler(verbose=True) as crawler:
+    async with AsyncWebCrawler(
+        headless=False,
+        verbose=True
+    ) as crawler:
+        
+        # Create the JavaScript that handles clicking multiple times
+        js_click_tabs = """
+        (async () => {
+            const tabs = document.querySelectorAll("section.charge-methodology .tabs-menu-3 > div");
+            
+            for(let tab of tabs) {
+                // scroll to the tab
+                tab.scrollIntoView();
+                tab.click();
+                // Wait for content to load and animations to complete
+                await new Promise(r => setTimeout(r, 500));
+            }
+        })();
+        """     
+
         result = await crawler.arun(
-            url="https://www.nbcnews.com/business",
-            extraction_strategy=extraction_strategy,
-            bypass_cache=True,
+            url="https://www.kidocode.com/degrees/technology",
+            extraction_strategy=JsonCssExtractionStrategy(schema, verbose=True),
+            js_code=[js_click_tabs],
+            cache_mode=CacheMode.BYPASS
         )
 
-        assert result.success, "Failed to crawl the page"
+        companies = json.loads(result.extracted_content)
+        print(f"Successfully extracted {len(companies)} companies")
+        print(json.dumps(companies[0], indent=2))
 
-        news_teasers = json.loads(result.extracted_content)
-        print(f"Successfully extracted {len(news_teasers)} news teasers")
-        print(json.dumps(news_teasers[0], indent=2))
 
 if __name__ == "__main__":
-    asyncio.run(extract_news_teasers())
+    asyncio.run(main())
 ```
 
-For more advanced usage examples, check out our [Examples](https://crawl4ai.com/mkdocs/extraction/css-advanced/) section in the documentation.
+</details>
 
-### Extracting Structured Data with OpenAI
+<details open>
+<summary>🤖 <strong>Extracting Structured Data with LLMs</strong></summary>
 
 ```python
 import os
 import asyncio
-from crawl4ai import AsyncWebCrawler
+from crawl4ai import AsyncWebCrawler, CacheMode
 from crawl4ai.extraction_strategy import LLMExtractionStrategy
 from pydantic import BaseModel, Field
 
@@ -394,6 +413,8 @@ async def main():
             url='https://openai.com/api/pricing/',
             word_count_threshold=1,
             extraction_strategy=LLMExtractionStrategy(
+                # Here you can use any provider that the LiteLLM library supports, for instance: ollama/qwen2
+                # provider="ollama/qwen2", api_token="no-token", 
                 provider="openai/gpt-4o", api_token=os.getenv('OPENAI_API_KEY'), 
                 schema=OpenAIModelFee.schema(),
                 extraction_type="schema",
@@ -401,7 +422,7 @@ async def main():
                 Do not miss any models in the entire content. One extracted model JSON format should look like this: 
                 {"model_name": "GPT-4", "input_fee": "US$10.00 / 1M tokens", "output_fee": "US$30.00 / 1M tokens"}."""
             ),            
-            bypass_cache=True,
+            cache_mode=CacheMode.BYPASS,
         )
         print(result.extracted_content)
 
@@ -409,105 +430,86 @@ if __name__ == "__main__":
     asyncio.run(main())
 ```
 
-### Session Management and Dynamic Content Crawling
+</details>
 
-Crawl4AI excels at handling complex scenarios, such as crawling multiple pages with dynamic content loaded via JavaScript. Here's an example of crawling GitHub commits across multiple pages:
+<details open>
+<summary>🤖 <strong>Using Your Own Browser with a Custom User Profile</strong></summary>
 
 ```python
-import asyncio
-import re
-from bs4 import BeautifulSoup
+import os, sys
+from pathlib import Path
+import asyncio, time
 from crawl4ai import AsyncWebCrawler
 
-async def crawl_typescript_commits():
-    first_commit = ""
-    async def on_execution_started(page):
-        nonlocal first_commit 
-        try:
-            while True:
-                await page.wait_for_selector('li.Box-sc-g0xbh4-0 h4')
-                commit = await page.query_selector('li.Box-sc-g0xbh4-0 h4')
-                commit = await commit.evaluate('(element) => element.textContent')
-                commit = re.sub(r'\s+', '', commit)
-                if commit and commit != first_commit:
-                    first_commit = commit
-                    break
-                await asyncio.sleep(0.5)
-        except Exception as e:
-            print(f"Warning: New content didn't appear after JavaScript execution: {e}")
+async def test_news_crawl():
+    # Create a persistent user data directory
+    user_data_dir = os.path.join(Path.home(), ".crawl4ai", "browser_profile")
+    os.makedirs(user_data_dir, exist_ok=True)
 
-    async with AsyncWebCrawler(verbose=True) as crawler:
-        crawler.crawler_strategy.set_hook('on_execution_started', on_execution_started)
-
-        url = "https://github.com/microsoft/TypeScript/commits/main"
-        session_id = "typescript_commits_session"
-        all_commits = []
-
-        js_next_page = """
-        const button = document.querySelector('a[data-testid="pagination-next-button"]');
-        if (button) button.click();
-        """
-
-        for page in range(3):  # Crawl 3 pages
-            result = await crawler.arun(
-                url=url,
-                session_id=session_id,
-                css_selector="li.Box-sc-g0xbh4-0",
-                js=js_next_page if page > 0 else None,
-                bypass_cache=True,
-                js_only=page > 0
-            )
-
-            assert result.success, f"Failed to crawl page {page + 1}"
-
-            soup = BeautifulSoup(result.cleaned_html, 'html.parser')
-            commits = soup.select("li")
-            all_commits.extend(commits)
-
-            print(f"Page {page + 1}: Found {len(commits)} commits")
-
-        await crawler.crawler_strategy.kill_session(session_id)
-        print(f"Successfully crawled {len(all_commits)} commits across 3 pages")
-
-if __name__ == "__main__":
-    asyncio.run(crawl_typescript_commits())
+    async with AsyncWebCrawler(
+        verbose=True,
+        headless=True,
+        user_data_dir=user_data_dir,
+        use_persistent_context=True,
+        headers={
+            "Accept": "text/html,application/xhtml+xml,application/xml;q=0.9,image/webp,*/*;q=0.8",
+            "Accept-Language": "en-US,en;q=0.5",
+            "Accept-Encoding": "gzip, deflate, br",
+            "DNT": "1",
+            "Connection": "keep-alive",
+            "Upgrade-Insecure-Requests": "1",
+            "Sec-Fetch-Dest": "document",
+            "Sec-Fetch-Mode": "navigate",
+            "Sec-Fetch-Site": "none",
+            "Sec-Fetch-User": "?1",
+            "Cache-Control": "max-age=0",
+        }
+    ) as crawler:
+        url = "ADDRESS_OF_A_CHALLENGING_WEBSITE"
+        
+        result = await crawler.arun(
+            url,
+            cache_mode=CacheMode.BYPASS,
+            magic=True,
+        )
+        
+        print(f"Successfully crawled {url}")
+        print(f"Content length: {len(result.markdown)}")
 ```
 
-This example demonstrates Crawl4AI's ability to handle complex scenarios where content is loaded asynchronously. It crawls multiple pages of GitHub commits, executing JavaScript to load new content and using custom hooks to ensure data is loaded before proceeding.
-
-For more advanced usage examples, check out our [Examples](https://crawl4ai.com/mkdocs/tutorial/episode_12_Session-Based_Crawling_for_Dynamic_Websites/) section in the documentation.
 </details>
 
 
 ## Speed Comparison 🚀
+A test was conducted on **[NBC News - Business Section](https://www.nbcnews.com/business)** to compare Crawl4AI and Firecrawl, highlighting Crawl4AI's speed, efficiency, and advanced features.
 
-Crawl4AI is designed with speed as a primary focus. Our goal is to provide the fastest possible response with high-quality data extraction, minimizing abstractions between the data and the user.
+---
 
-We've conducted a speed comparison between Crawl4AI and Firecrawl, a paid service. The results demonstrate Crawl4AI's superior performance:
+#### Results Summary  
 
-```bash
-Firecrawl:
-Time taken: 7.02 seconds
-Content length: 42074 characters
-Images found: 49
+| **Method**                     | **Time Taken** | **Markdown Length** | **Fit Markdown** | **Images Found** |
+|--------------------------------|----------------|----------------------|-------------------|------------------|
+| **Firecrawl**                  | 6.04 seconds   | 38,382 characters    | -                 | 52               |
+| **Crawl4AI (Simple Crawl)**    | 1.06 seconds   | 42,027 characters    | -                 | 52               |
+| **Crawl4AI (Markdown Plus)**   | 1.30 seconds   | 54,342 characters    | 11,119 characters | 52               |
+| **Crawl4AI (JavaScript)**      | 1.56 seconds   | 75,869 characters    | 13,406 characters | 92               |
 
-Crawl4AI (simple crawl):
-Time taken: 1.60 seconds
-Content length: 18238 characters
-Images found: 49
+---
 
-Crawl4AI (with JavaScript execution):
-Time taken: 4.64 seconds
-Content length: 40869 characters
-Images found: 89
-```
+#### Key Takeaways  
 
-As you can see, Crawl4AI outperforms Firecrawl significantly:
+1. **Superior Speed**: Crawl4AI processes even advanced crawls up to **6x faster** than Firecrawl, with times as low as **1.06 seconds**.  
+2. **Rich Content Extraction**: Crawl4AI consistently captures more comprehensive content, producing a **Markdown Plus** output of **54,342 characters**, compared to Firecrawl's **38,382 characters**.  
+3. **AI-Optimized Output**: With **Fit Markdown**, Crawl4AI removes noise to produce concise, AI-friendly outputs (**11,119–13,406 characters**) tailored for LLM workflows.  
+4. **Dynamic Content Handling**: Using JavaScript execution, Crawl4AI extracted **92 images** and enriched content dynamically loaded via “Load More” buttons—unmatched by Firecrawl.  
 
-- Simple crawl: Crawl4AI is over 4 times faster than Firecrawl.
-- With JavaScript execution: Even when executing JavaScript to load more content (doubling the number of images found), Crawl4AI is still faster than Firecrawl's simple crawl.
+---
 
-You can find the full comparison code in our repository at `docs/examples/crawl4ai_vs_firecrawl.py`.
+#### Conclusion  
+
+Crawl4AI outshines Firecrawl in speed, completeness, and flexibility. Its advanced features, including **Markdown Plus**, **Fit Markdown**, and **dynamic content handling**, make it the ideal choice for AI-ready web crawling. Whether you're targeting rich structured data or handling complex dynamic websites, Crawl4AI delivers unmatched performance and precision.
+
+You can find the full comparison code in our repository at [docs/examples/quickstart_async.py](https://github.com/unclecode/crawl4ai/blob/main/docs/examples/quickstart_async.py).
 
 ## Documentation 📚
 
diff --git a/docs/examples/quickstart_async.py b/docs/examples/quickstart_async.py
index d67a8c30..e50fe456 100644
--- a/docs/examples/quickstart_async.py
+++ b/docs/examples/quickstart_async.py
@@ -13,7 +13,9 @@ import re
 from typing import Dict, List
 from bs4 import BeautifulSoup
 from pydantic import BaseModel, Field
-from crawl4ai import AsyncWebCrawler
+from crawl4ai import AsyncWebCrawler, CacheMode
+from crawl4ai.markdown_generation_strategy import DefaultMarkdownGenerator
+from crawl4ai.content_filter_strategy import BM25ContentFilter
 from crawl4ai.extraction_strategy import (
     JsonCssExtractionStrategy,
     LLMExtractionStrategy,
@@ -51,7 +53,7 @@ async def simple_example_with_running_js_code():
             url="https://www.nbcnews.com/business",
             js_code=js_code,
             # wait_for=wait_for,
-            bypass_cache=True,
+            cache_mode=CacheMode.BYPASS,
         )
         print(result.markdown[:500])  # Print first 500 characters
 
@@ -61,7 +63,7 @@ async def simple_example_with_css_selector():
         result = await crawler.arun(
             url="https://www.nbcnews.com/business",
             css_selector=".wide-tease-item__description",
-            bypass_cache=True,
+            cache_mode=CacheMode.BYPASS,
         )
         print(result.markdown[:500])  # Print first 500 characters
 
@@ -132,7 +134,7 @@ async def extract_structured_data_using_llm(provider: str, api_token: str = None
                 {"model_name": "GPT-4", "input_fee": "US$10.00 / 1M tokens", "output_fee": "US$30.00 / 1M tokens"}.""",
                 extra_args=extra_args
             ),
-            bypass_cache=True,
+            cache_mode=CacheMode.BYPASS,
         )
         print(result.extracted_content)
 
@@ -166,7 +168,7 @@ async def extract_structured_data_using_css_extractor():
         result = await crawler.arun(
             url="https://www.coinbase.com/explore",
             extraction_strategy=extraction_strategy,
-            bypass_cache=True,
+            cache_mode=CacheMode.BYPASS,
         )
 
         assert result.success, "Failed to crawl the page"
@@ -213,7 +215,7 @@ async def crawl_dynamic_content_pages_method_1():
                 session_id=session_id,
                 css_selector="li.Box-sc-g0xbh4-0",
                 js=js_next_page if page > 0 else None,
-                bypass_cache=True,
+                cache_mode=CacheMode.BYPASS,
                 js_only=page > 0,
                 headless=False,
             )
@@ -282,7 +284,7 @@ async def crawl_dynamic_content_pages_method_2():
                 extraction_strategy=extraction_strategy,
                 js_code=js_next_page_and_wait if page > 0 else None,
                 js_only=page > 0,
-                bypass_cache=True,
+                cache_mode=CacheMode.BYPASS,
                 headless=False,
             )
 
@@ -343,7 +345,7 @@ async def crawl_dynamic_content_pages_method_3():
                 js_code=js_next_page if page > 0 else None,
                 wait_for=wait_for if page > 0 else None,
                 js_only=page > 0,
-                bypass_cache=True,
+                cache_mode=CacheMode.BYPASS,
                 headless=False,
             )
 
@@ -384,7 +386,7 @@ async def crawl_with_user_simultion():
         url = "YOUR-URL-HERE"
         result = await crawler.arun(
             url=url,            
-            bypass_cache=True,
+            cache_mode=CacheMode.BYPASS,
             magic = True, # Automatically detects and removes overlays, popups, and other elements that block content
             # simulate_user = True,# Causes a series of random mouse movements and clicks to simulate user interaction
             # override_navigator = True # Overrides the navigator object to make it look like a real user
@@ -408,7 +410,7 @@ async def speed_comparison():
     params={'formats': ['markdown', 'html']}
     )
     end = time.time()
-    print("Firecrawl (simulated):")
+    print("Firecrawl:")
     print(f"Time taken: {end - start:.2f} seconds")
     print(f"Content length: {len(scrape_status['markdown'])} characters")
     print(f"Images found: {scrape_status['markdown'].count('cldnry.s-nbcnews.com')}")
@@ -420,7 +422,7 @@ async def speed_comparison():
         result = await crawler.arun(
             url="https://www.nbcnews.com/business",
             word_count_threshold=0,
-            bypass_cache=True,
+            cache_mode=CacheMode.BYPASS,
             verbose=False,
         )
         end = time.time()
@@ -430,6 +432,25 @@ async def speed_comparison():
         print(f"Images found: {result.markdown.count('cldnry.s-nbcnews.com')}")
         print()
 
+        # Crawl4AI with advanced content filtering
+        start = time.time()
+        result = await crawler.arun(
+            url="https://www.nbcnews.com/business",
+            word_count_threshold=0,
+            markdown_generator=DefaultMarkdownGenerator(
+                content_filter=BM25ContentFilter(user_query=None, bm25_threshold=1.0)
+            ),
+            cache_mode=CacheMode.BYPASS,
+            verbose=False,
+        )
+        end = time.time()
+        print("Crawl4AI (Markdown Plus):")
+        print(f"Time taken: {end - start:.2f} seconds")
+        print(f"Content length: {len(result.markdown_v2.raw_markdown)} characters")
+        print(f"Fit Markdown: {len(result.markdown_v2.fit_markdown)} characters")
+        print(f"Images found: {result.markdown.count('cldnry.s-nbcnews.com')}")
+        print()
+
         # Crawl4AI with JavaScript execution
         start = time.time()
         result = await crawler.arun(
@@ -438,13 +459,17 @@ async def speed_comparison():
                 "const loadMoreButton = Array.from(document.querySelectorAll('button')).find(button => button.textContent.includes('Load More')); loadMoreButton && loadMoreButton.click();"
             ],
             word_count_threshold=0,
-            bypass_cache=True,
+            cache_mode=CacheMode.BYPASS,
+            markdown_generator=DefaultMarkdownGenerator(
+                content_filter=BM25ContentFilter(user_query=None, bm25_threshold=1.0)
+            ),
             verbose=False,
         )
         end = time.time()
         print("Crawl4AI (with JavaScript execution):")
         print(f"Time taken: {end - start:.2f} seconds")
         print(f"Content length: {len(result.markdown)} characters")
+        print(f"Fit Markdown: {len(result.markdown_v2.fit_markdown)} characters")
         print(f"Images found: {result.markdown.count('cldnry.s-nbcnews.com')}")
 
     print("\nNote on Speed Comparison:")
@@ -483,7 +508,7 @@ async def generate_knowledge_graph():
         url = "https://paulgraham.com/love.html"
         result = await crawler.arun(
             url=url,
-            bypass_cache=True,
+            cache_mode=CacheMode.BYPASS,
             extraction_strategy=extraction_strategy,
             # magic=True
         )
@@ -496,7 +521,7 @@ async def fit_markdown_remove_overlay():
         url = "https://janineintheworld.com/places-to-visit-in-central-mexico"
         result = await crawler.arun(
             url=url,
-            bypass_cache=True,
+            cache_mode=CacheMode.BYPASS,
             word_count_threshold = 10,
             remove_overlay_elements=True,
             screenshot = True
@@ -509,31 +534,31 @@ async def fit_markdown_remove_overlay():
 
 
 async def main():
-    await simple_crawl()
-    await simple_example_with_running_js_code()
-    await simple_example_with_css_selector()
-    await use_proxy()
-    await capture_and_save_screenshot("https://www.example.com", os.path.join(__location__, "tmp/example_screenshot.jpg"))
-    await extract_structured_data_using_css_extractor()
+    # await simple_crawl()
+    # await simple_example_with_running_js_code()
+    # await simple_example_with_css_selector()
+    # await use_proxy()
+    # await capture_and_save_screenshot("https://www.example.com", os.path.join(__location__, "tmp/example_screenshot.jpg"))
+    # await extract_structured_data_using_css_extractor()
 
-    # LLM extraction examples
-    await extract_structured_data_using_llm()
-    await extract_structured_data_using_llm("huggingface/meta-llama/Meta-Llama-3.1-8B-Instruct", os.getenv("HUGGINGFACE_API_KEY"))
-    await extract_structured_data_using_llm("openai/gpt-4o", os.getenv("OPENAI_API_KEY"))
-    await extract_structured_data_using_llm("ollama/llama3.2")    
+    # # LLM extraction examples
+    # await extract_structured_data_using_llm()
+    # await extract_structured_data_using_llm("huggingface/meta-llama/Meta-Llama-3.1-8B-Instruct", os.getenv("HUGGINGFACE_API_KEY"))
+    # await extract_structured_data_using_llm("openai/gpt-4o", os.getenv("OPENAI_API_KEY"))
+    # await extract_structured_data_using_llm("ollama/llama3.2")    
 
-    # You always can pass custom headers to the extraction strategy
-    custom_headers = {
-        "Authorization": "Bearer your-custom-token",
-        "X-Custom-Header": "Some-Value"
-    }
-    await extract_structured_data_using_llm(extra_headers=custom_headers)
+    # # You always can pass custom headers to the extraction strategy
+    # custom_headers = {
+    #     "Authorization": "Bearer your-custom-token",
+    #     "X-Custom-Header": "Some-Value"
+    # }
+    # await extract_structured_data_using_llm(extra_headers=custom_headers)
     
-    # await crawl_dynamic_content_pages_method_1()
-    # await crawl_dynamic_content_pages_method_2()
-    await crawl_dynamic_content_pages_method_3()
+    # # await crawl_dynamic_content_pages_method_1()
+    # # await crawl_dynamic_content_pages_method_2()
+    # await crawl_dynamic_content_pages_method_3()
     
-    await crawl_custom_browser_type()
+    # await crawl_custom_browser_type()
     
     await speed_comparison()
 

From a69f7a953198df1d9d93420161794aafe3fcffcb Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Thu, 28 Nov 2024 16:31:41 +0800
Subject: [PATCH 082/115] fix: correct typo in function documentation for
 clarity and accuracy

---
 README.md | 184 +++++++++++++++++++++++++++++++-----------------------
 1 file changed, 105 insertions(+), 79 deletions(-)

diff --git a/README.md b/README.md
index 5c50cdc5..c4ef1bd3 100644
--- a/README.md
+++ b/README.md
@@ -1,5 +1,7 @@
 # 🔥🕷️ Crawl4AI: LLM Friendly Web Crawler & Scraper
 
+[✨ Check out what's new in the latest update!](#new-in-03743)
+
 <a href="https://trendshift.io/repositories/11716" target="_blank"><img src="https://trendshift.io/api/badge/repositories/11716" alt="unclecode%2Fcrawl4ai | Trendshift" style="width: 250px; height: 55px;" width="250" height="55"/></a>
 
 [![GitHub Stars](https://img.shields.io/github/stars/unclecode/crawl4ai?style=social)](https://github.com/unclecode/crawl4ai/stargazers)
@@ -9,26 +11,47 @@
 [![GitHub Pull Requests](https://img.shields.io/github/issues-pr/unclecode/crawl4ai)](https://github.com/unclecode/crawl4ai/pulls)
 [![License](https://img.shields.io/github/license/unclecode/crawl4ai)](https://github.com/unclecode/crawl4ai/blob/main/LICENSE)
 
-Crawl4AI simplifies asynchronous web crawling and data extraction, making it accessible for large language models (LLMs) and AI applications. 🆓🌐
+## 🔥 Crawl4AI: Crawl Smarter, Faster, Freely. For AI.  
 
-## New in 0.3.743 ✨  
+Crawl4AI is the #1 trending GitHub repository, actively maintained by a vibrant community. It delivers blazing-fast, AI-ready web crawling tailored for LLMs, AI agents, and data pipelines. Open source, flexible, and built for real-time performance, Crawl4AI empowers developers with unmatched speed, precision, and deployment ease.  
 
-- 🚀 **Improved ManagedBrowser Configuration**: Dynamic host and port support for more flexible browser management.  
-- 📝 **Enhanced Markdown Generation**: New generator class for better formatting and customization.  
-- ⚡ **Fast HTML Formatting**: Significantly optimized HTML formatting in the web crawler.  
-- 🛠️ **Utility & Sanitization Upgrades**: Improved sanitization and expanded utility functions for streamlined workflows.  
-- 👥 **Acknowledgments**: Added contributor details and pull request acknowledgments for better transparency.  
+[✨ Check out what's new in the latest update!](#new-in-03743)
+
+## 🧐 Why Crawl4AI?
+
+1. **Built for LLMs**: Creates **smart, concise Markdown** optimized for applications like Retrieval-Augmented Generation (RAG) and fine-tuning.  
+2. **Lightning Fast**: Delivers results **6x faster** than competitors with real-time, cost-efficient performance.  
+3. **Flexible Browser Control**: Offers session management, proxies, and custom hooks for precise, seamless data access.  
+4. **Heuristic Intelligence**: Leverages **advanced algorithms** to extract data efficiently, reducing reliance on costly language models.  
+5. **Open Source & Deployable**: 100% open-source with no API keys or registration required-ready for **Docker and cloud integration**.  
+6. **Thriving Community**: Actively maintained by a vibrant developer community and the **#1 trending GitHub repository** across all languages.
 
 
-## Try it Now!
+## 🚀 Quick Start 
 
-✨ Play around with this [![Open In Colab](https://colab.research.google.com/assets/colab-badge.svg)](https://colab.research.google.com/drive/1SgRPrByQLzjRfwoRNq1wSGE9nYY_EE8C?usp=sharing)
+1. Install Crawl4AI:
+```bash
+pip install crawl4ai
+```
 
-✨ Visit our [Documentation Website](https://crawl4ai.com/mkdocs/)
+2. Run a simple web crawl:
+```python
+import asyncio
+from crawl4ai import AsyncWebCrawler, CacheMode
 
-## Features ✨
+async def main():
+    async with AsyncWebCrawler(verbose=True) as crawler:
+        result = await crawler.arun(url="https://www.nbcnews.com/business")
+        # Soon to be changed to result.markdown
+        print(result.markdown_v2.raw_markdown) 
 
-<details open>
+if __name__ == "__main__":
+    asyncio.run(main())
+```
+
+## ✨ Features 
+
+<details>
 <summary>📝 <strong>Markdown Generation</strong></summary>
 
 - 🧹 **Clean Markdown**: Generates clean, structured Markdown with accurate formatting.
@@ -38,7 +61,7 @@ Crawl4AI simplifies asynchronous web crawling and data extraction, making it acc
 - 📚 **BM25 Algorithm**: Employs BM25-based filtering for extracting core information and removing irrelevant content. 
 </details>
 
-<details open>
+<details>
 <summary>📊 <strong>Structured Data Extraction</strong></summary>
 
 - 🤖 **LLM-Driven Extraction**: Supports all LLMs (open-source and proprietary) for structured data extraction.
@@ -49,7 +72,7 @@ Crawl4AI simplifies asynchronous web crawling and data extraction, making it acc
 
 </details>
 
-<details open>
+<details>
 <summary>🌐 <strong>Browser Integration</strong></summary>
 
 - 🖥️ **Managed Browser**: Use user-owned browsers with full control, avoiding bot detection.
@@ -61,7 +84,7 @@ Crawl4AI simplifies asynchronous web crawling and data extraction, making it acc
 
 </details>
 
-<details open>
+<details>
 <summary>🔎 <strong>Crawling & Scraping</strong></summary>
 
 - 🖼️ **Media Support**: Extract images, audio, videos, and responsive image formats like `srcset` and `picture`.
@@ -76,7 +99,7 @@ Crawl4AI simplifies asynchronous web crawling and data extraction, making it acc
 
 </details>
 
-<details open>
+<details>
 <summary>🚀 <strong>Deployment</strong></summary>
 
 - 🐳 **Dockerized Setup**: Optimized Docker image with API server for easy deployment.
@@ -99,7 +122,54 @@ Crawl4AI simplifies asynchronous web crawling and data extraction, making it acc
 
 </details>
 
-## Installation 🛠️
+
+
+## Try it Now!
+
+✨ Play around with this [![Open In Colab](https://colab.research.google.com/assets/colab-badge.svg)](https://colab.research.google.com/drive/1SgRPrByQLzjRfwoRNq1wSGE9nYY_EE8C?usp=sharing)
+
+✨ Visit our [Documentation Website](https://crawl4ai.com/mkdocs/)
+
+
+## 🚀 Speed Comparison
+
+A test was conducted on **[NBC News - Business Section](https://www.nbcnews.com/business)** to compare Crawl4AI and Firecrawl, highlighting Crawl4AI's speed, efficiency, and advanced features.
+
+<details open>
+<summary>📊 <strong>Results Summary</strong></summary>
+
+#### Results Summary  
+
+| **Method**                     | **Time Taken** | **Markdown Length** | **Fit Markdown** | **Images Found** |
+|--------------------------------|----------------|----------------------|-------------------|------------------|
+| **Firecrawl**                  | 6.04 seconds   | 38,382 characters    | -                 | 52               |
+| **Crawl4AI (Simple Crawl)**    | 1.06 seconds   | 42,027 characters    | -                 | 52               |
+| **Crawl4AI (Markdown Plus)**   | 1.30 seconds   | 54,342 characters    | 11,119 characters | 52               |
+| **Crawl4AI (JavaScript)**      | 1.56 seconds   | 75,869 characters    | 13,406 characters | 92               |
+
+</details>
+
+<details open>
+<summary>⚡ <strong>Key Takeaways</strong></summary>
+
+1. **Superior Speed**: Crawl4AI processes even advanced crawls up to **6x faster** than Firecrawl, with times as low as **1.06 seconds**.  
+2. **Rich Content Extraction**: Crawl4AI consistently captures more comprehensive content, producing a **Markdown Plus** output of **54,342 characters**, compared to Firecrawl's **38,382 characters**.  
+3. **AI-Optimized Output**: With **Fit Markdown**, Crawl4AI removes noise to produce concise, AI-friendly outputs (**11,119–13,406 characters**) tailored for LLM workflows.  
+4. **Dynamic Content Handling**: Using JavaScript execution, Crawl4AI extracted **92 images** and enriched content dynamically loaded via “Load More” buttons—unmatched by Firecrawl.  
+
+</details>
+
+<details open>
+<summary>🏁 <strong>Conclusion</strong></summary>
+
+Crawl4AI outshines Firecrawl in speed, completeness, and flexibility. Its advanced features, including **Markdown Plus**, **Fit Markdown**, and **dynamic content handling**, make it the ideal choice for AI-ready web crawling. Whether you're targeting rich structured data or handling complex dynamic websites, Crawl4AI delivers unmatched performance and precision.
+
+You can find the full comparison code in our repository at [docs/examples/quickstart_async.py](https://github.com/unclecode/crawl4ai/blob/main/docs/examples/quickstart_async.py).
+
+</details>
+
+
+## 🛠️ Installation 🛠️
 
 Crawl4AI offers flexible installation options to suit various use cases. You can install it as a Python package or use Docker.
 
@@ -259,27 +329,14 @@ For advanced configuration, environment variables, and usage examples, see our [
 </details>
 
 
-## Quick Start 🚀
 
-```python
-import asyncio
-from crawl4ai import AsyncWebCrawler, CacheMode
 
-async def main():
-    async with AsyncWebCrawler(verbose=True) as crawler:
-        result = await crawler.arun(url="https://www.nbcnews.com/business")
-        print(result.markdown_v2.raw_markdown) # Soone will be change to result.markdown
-
-if __name__ == "__main__":
-    asyncio.run(main())
-```
-
-## Advanced Usage Examples 🔬
+## 🔬 Advanced Usage Examples 🔬
 
 You can check the project structure in the directory [https://github.com/unclecode/crawl4ai/docs/examples](docs/examples). Over there, you can find a variety of examples; here, some popular examples are shared.
 
 <details open>
-<summary>🖥️ <strong>Heuristic Markdown Generation with Clean and Fit Markdown</strong></summary>
+<summary>📝 <strong>Heuristic Markdown Generation with Clean and Fit Markdown</strong></summary>
 
 ```python
 import asyncio
@@ -310,7 +367,7 @@ if __name__ == "__main__":
 </details>
 
 <details open>
-<summary>🖥️ <strong>Structured Data Extraction and Executing JavaScript</strong></summary>
+<summary>🖥️ <strong>Executing JavaScript & Extract Structured Data without LLMs</strong></summary>
 
 ```python
 import asyncio
@@ -393,7 +450,7 @@ if __name__ == "__main__":
 </details>
 
 <details open>
-<summary>🤖 <strong>Extracting Structured Data with LLMs</strong></summary>
+<summary>📚 <strong>Extracting Structured Data with LLMs</strong></summary>
 
 ```python
 import os
@@ -480,74 +537,43 @@ async def test_news_crawl():
 </details>
 
 
-## Speed Comparison 🚀
-A test was conducted on **[NBC News - Business Section](https://www.nbcnews.com/business)** to compare Crawl4AI and Firecrawl, highlighting Crawl4AI's speed, efficiency, and advanced features.
+## ✨ New in 0.3.743   
 
----
+- 🚀 **Improved ManagedBrowser Configuration**: Dynamic host and port support for more flexible browser management.  
+- 📝 **Enhanced Markdown Generation**: New generator class for better formatting and customization.  
+- ⚡ **Fast HTML Formatting**: Significantly optimized HTML formatting in the web crawler.  
+- 🛠️ **Utility & Sanitization Upgrades**: Improved sanitization and expanded utility functions for streamlined workflows.  
+- 👥 **Acknowledgments**: Added contributor details and pull request acknowledgments for better transparency.  
 
-#### Results Summary  
 
-| **Method**                     | **Time Taken** | **Markdown Length** | **Fit Markdown** | **Images Found** |
-|--------------------------------|----------------|----------------------|-------------------|------------------|
-| **Firecrawl**                  | 6.04 seconds   | 38,382 characters    | -                 | 52               |
-| **Crawl4AI (Simple Crawl)**    | 1.06 seconds   | 42,027 characters    | -                 | 52               |
-| **Crawl4AI (Markdown Plus)**   | 1.30 seconds   | 54,342 characters    | 11,119 characters | 52               |
-| **Crawl4AI (JavaScript)**      | 1.56 seconds   | 75,869 characters    | 13,406 characters | 92               |
-
----
-
-#### Key Takeaways  
-
-1. **Superior Speed**: Crawl4AI processes even advanced crawls up to **6x faster** than Firecrawl, with times as low as **1.06 seconds**.  
-2. **Rich Content Extraction**: Crawl4AI consistently captures more comprehensive content, producing a **Markdown Plus** output of **54,342 characters**, compared to Firecrawl's **38,382 characters**.  
-3. **AI-Optimized Output**: With **Fit Markdown**, Crawl4AI removes noise to produce concise, AI-friendly outputs (**11,119–13,406 characters**) tailored for LLM workflows.  
-4. **Dynamic Content Handling**: Using JavaScript execution, Crawl4AI extracted **92 images** and enriched content dynamically loaded via “Load More” buttons—unmatched by Firecrawl.  
-
----
-
-#### Conclusion  
-
-Crawl4AI outshines Firecrawl in speed, completeness, and flexibility. Its advanced features, including **Markdown Plus**, **Fit Markdown**, and **dynamic content handling**, make it the ideal choice for AI-ready web crawling. Whether you're targeting rich structured data or handling complex dynamic websites, Crawl4AI delivers unmatched performance and precision.
-
-You can find the full comparison code in our repository at [docs/examples/quickstart_async.py](https://github.com/unclecode/crawl4ai/blob/main/docs/examples/quickstart_async.py).
-
-## Documentation 📚
+## 📖 Documentation & Roadmap 
 
 For detailed documentation, including installation instructions, advanced features, and API reference, visit our [Documentation Website](https://crawl4ai.com/mkdocs/).
 
-## Crawl4AI Roadmap 🗺️
+Moreover to check our development plans and upcoming features, check out our [Roadmap](https://github.com/unclecode/crawl4ai/blob/main/ROADMAP.md).
 
-For detailed information on our development plans and upcoming features, check out our [Roadmap](https://github.com/unclecode/crawl4ai/blob/main/ROADMAP.md).
-
-### Advanced Crawling Systems 🔧
 - [x] 0. Graph Crawler: Smart website traversal using graph search algorithms for comprehensive nested page extraction
 - [ ] 1. Question-Based Crawler: Natural language driven web discovery and content extraction
 - [ ] 2. Knowledge-Optimal Crawler: Smart crawling that maximizes knowledge while minimizing data extraction
 - [ ] 3. Agentic Crawler: Autonomous system for complex multi-step crawling operations
-
-### Specialized Features 🛠️
 - [ ] 4. Automated Schema Generator: Convert natural language to extraction schemas
 - [ ] 5. Domain-Specific Scrapers: Pre-configured extractors for common platforms (academic, e-commerce)
 - [ ] 6. Web Embedding Index: Semantic search infrastructure for crawled content
-
-### Development Tools 🔨
 - [ ] 7. Interactive Playground: Web UI for testing, comparing strategies with AI assistance
 - [ ] 8. Performance Monitor: Real-time insights into crawler operations
 - [ ] 9. Cloud Integration: One-click deployment solutions across cloud providers
-
-### Community & Growth 🌱
 - [ ] 10. Sponsorship Program: Structured support system with tiered benefits
 - [ ] 11. Educational Content: "How to Crawl" video series and interactive tutorials
 
-## Contributing 🤝
+## 🤝 Contributing 
 
 We welcome contributions from the open-source community. Check out our [contribution guidelines](https://github.com/unclecode/crawl4ai/blob/main/CONTRIBUTING.md) for more information.
 
-## License 📄
+## 📄 License 
 
 Crawl4AI is released under the [Apache 2.0 License](https://github.com/unclecode/crawl4ai/blob/main/LICENSE).
 
-## Contact 📧
+## 📧 Contact 
 
 For questions, suggestions, or feedback, feel free to reach out:
 
@@ -558,7 +584,7 @@ For questions, suggestions, or feedback, feel free to reach out:
 Happy Crawling! 🕸️🚀
 
 
-# Mission
+## 🗾 Mission
 
 Our mission is to unlock the untapped potential of personal and enterprise data in the digital age. In today's world, individuals and organizations generate vast amounts of valuable digital footprints, yet this data remains largely uncapitalized as a true asset. 
 
@@ -570,13 +596,13 @@ This democratization of data represents the first step toward a shared data econ
 
 For a detailed exploration of our vision, opportunities, and pathway forward, please see our [full mission statement](./MISSION.md).
 
-## Key Opportunities
+### Key Opportunities
 
 - **Data Capitalization**: Transform digital footprints into valuable assets that can appear on personal and enterprise balance sheets
 - **Authentic Data**: Unlock the vast reservoir of real human insights and knowledge for AI advancement
 - **Shared Economy**: Create new value streams where data creators directly benefit from their contributions
 
-## Development Pathway
+### Development Pathway
 
 1. **Open-Source Foundation**: Building transparent, community-driven data extraction tools
 2. **Data Capitalization Platform**: Creating tools to structure and value digital assets

From ddfb6707b47b6be786c2115cd7511b3d94d89e7c Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Thu, 28 Nov 2024 16:34:08 +0800
Subject: [PATCH 083/115] docs: update README to reflect new branding and
 improve section headings for clarity

---
 README.md | 10 +++-------
 1 file changed, 3 insertions(+), 7 deletions(-)

diff --git a/README.md b/README.md
index c4ef1bd3..ed6892ec 100644
--- a/README.md
+++ b/README.md
@@ -1,6 +1,4 @@
-# 🔥🕷️ Crawl4AI: LLM Friendly Web Crawler & Scraper
-
-[✨ Check out what's new in the latest update!](#new-in-03743)
+# 🔥🕷️ Crawl4AI: Crawl Smarter, Faster, Freely. For AI.
 
 <a href="https://trendshift.io/repositories/11716" target="_blank"><img src="https://trendshift.io/api/badge/repositories/11716" alt="unclecode%2Fcrawl4ai | Trendshift" style="width: 250px; height: 55px;" width="250" height="55"/></a>
 
@@ -11,11 +9,9 @@
 [![GitHub Pull Requests](https://img.shields.io/github/issues-pr/unclecode/crawl4ai)](https://github.com/unclecode/crawl4ai/pulls)
 [![License](https://img.shields.io/github/license/unclecode/crawl4ai)](https://github.com/unclecode/crawl4ai/blob/main/LICENSE)
 
-## 🔥 Crawl4AI: Crawl Smarter, Faster, Freely. For AI.  
-
 Crawl4AI is the #1 trending GitHub repository, actively maintained by a vibrant community. It delivers blazing-fast, AI-ready web crawling tailored for LLMs, AI agents, and data pipelines. Open source, flexible, and built for real-time performance, Crawl4AI empowers developers with unmatched speed, precision, and deployment ease.  
 
-[✨ Check out what's new in the latest update!](#new-in-03743)
+[✨ Check out what's new in the latest update!](#-recent-updates)  
 
 ## 🧐 Why Crawl4AI?
 
@@ -537,7 +533,7 @@ async def test_news_crawl():
 </details>
 
 
-## ✨ New in 0.3.743   
+## ✨ Recent Updates   
 
 - 🚀 **Improved ManagedBrowser Configuration**: Dynamic host and port support for more flexible browser management.  
 - 📝 **Enhanced Markdown Generation**: New generator class for better formatting and customization.  

From 3fda66b85b793655a92b3627599472f4d3279b0b Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Thu, 28 Nov 2024 16:36:24 +0800
Subject: [PATCH 084/115] docs: refine README content for clarity and
 conciseness, improving descriptions and formatting

---
 README.md | 33 +++++++++++++++------------------
 1 file changed, 15 insertions(+), 18 deletions(-)

diff --git a/README.md b/README.md
index ed6892ec..7bf4b4a4 100644
--- a/README.md
+++ b/README.md
@@ -15,13 +15,12 @@ Crawl4AI is the #1 trending GitHub repository, actively maintained by a vibrant
 
 ## 🧐 Why Crawl4AI?
 
-1. **Built for LLMs**: Creates **smart, concise Markdown** optimized for applications like Retrieval-Augmented Generation (RAG) and fine-tuning.  
-2. **Lightning Fast**: Delivers results **6x faster** than competitors with real-time, cost-efficient performance.  
-3. **Flexible Browser Control**: Offers session management, proxies, and custom hooks for precise, seamless data access.  
-4. **Heuristic Intelligence**: Leverages **advanced algorithms** to extract data efficiently, reducing reliance on costly language models.  
-5. **Open Source & Deployable**: 100% open-source with no API keys or registration required-ready for **Docker and cloud integration**.  
-6. **Thriving Community**: Actively maintained by a vibrant developer community and the **#1 trending GitHub repository** across all languages.
-
+1. **Built for LLMs**: Creates smart, concise Markdown optimized for RAG and fine-tuning applications.  
+2. **Lightning Fast**: Delivers results 6x faster with real-time, cost-efficient performance.  
+3. **Flexible Browser Control**: Offers session management, proxies, and custom hooks for seamless data access.  
+4. **Heuristic Intelligence**: Uses advanced algorithms for efficient extraction, reducing reliance on costly models.  
+5. **Open Source & Deployable**: Fully open-source with no API keys—ready for Docker and cloud integration.  
+6. **Thriving Community**: Actively maintained by a vibrant community and the #1 trending GitHub repository.
 
 ## 🚀 Quick Start 
 
@@ -145,7 +144,7 @@ A test was conducted on **[NBC News - Business Section](https://www.nbcnews.com/
 
 </details>
 
-<details open>
+<details>
 <summary>⚡ <strong>Key Takeaways</strong></summary>
 
 1. **Superior Speed**: Crawl4AI processes even advanced crawls up to **6x faster** than Firecrawl, with times as low as **1.06 seconds**.  
@@ -155,7 +154,7 @@ A test was conducted on **[NBC News - Business Section](https://www.nbcnews.com/
 
 </details>
 
-<details open>
+<details>
 <summary>🏁 <strong>Conclusion</strong></summary>
 
 Crawl4AI outshines Firecrawl in speed, completeness, and flexibility. Its advanced features, including **Markdown Plus**, **Fit Markdown**, and **dynamic content handling**, make it the ideal choice for AI-ready web crawling. Whether you're targeting rich structured data or handling complex dynamic websites, Crawl4AI delivers unmatched performance and precision.
@@ -169,7 +168,7 @@ You can find the full comparison code in our repository at [docs/examples/quicks
 
 Crawl4AI offers flexible installation options to suit various use cases. You can install it as a Python package or use Docker.
 
-<details open>
+<details>
 <summary>🐍 <strong>Using pip</strong></summary>
 
 Choose the installation option that best fits your needs:
@@ -234,7 +233,7 @@ pip install -e ".[all]"             # Install all optional features
 
 </details>
 
-<details open>
+<details>
 <summary>🚀 <strong>One-Click Deployment</strong></summary>
 
 Deploy your own instance of Crawl4AI with one click:
@@ -251,7 +250,7 @@ The deploy will:
 
 </details>
 
-<details open>
+<details>
 <summary>🐳 <strong>Using Docker</strong></summary>
 
 Crawl4AI is available as Docker images for easy deployment. You can either pull directly from Docker Hub (recommended) or build from the repository.
@@ -325,13 +324,11 @@ For advanced configuration, environment variables, and usage examples, see our [
 </details>
 
 
-
-
 ## 🔬 Advanced Usage Examples 🔬
 
 You can check the project structure in the directory [https://github.com/unclecode/crawl4ai/docs/examples](docs/examples). Over there, you can find a variety of examples; here, some popular examples are shared.
 
-<details open>
+<details>
 <summary>📝 <strong>Heuristic Markdown Generation with Clean and Fit Markdown</strong></summary>
 
 ```python
@@ -362,7 +359,7 @@ if __name__ == "__main__":
 
 </details>
 
-<details open>
+<details>
 <summary>🖥️ <strong>Executing JavaScript & Extract Structured Data without LLMs</strong></summary>
 
 ```python
@@ -445,7 +442,7 @@ if __name__ == "__main__":
 
 </details>
 
-<details open>
+<details>
 <summary>📚 <strong>Extracting Structured Data with LLMs</strong></summary>
 
 ```python
@@ -485,7 +482,7 @@ if __name__ == "__main__":
 
 </details>
 
-<details open>
+<details>
 <summary>🤖 <strong>Using You own Browswer with Custome User Profile</strong></summary>
 
 ```python

From efe93a5f57ebe677cc12dca90549525626a85b98 Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Thu, 28 Nov 2024 16:41:11 +0800
Subject: [PATCH 085/115] docs: enhance README with development TODOs and
 refine mission statement for clarity

---
 README.md | 37 +++++++++++++++++++++----------------
 1 file changed, 21 insertions(+), 16 deletions(-)

diff --git a/README.md b/README.md
index 7bf4b4a4..20395b58 100644
--- a/README.md
+++ b/README.md
@@ -545,6 +545,9 @@ For detailed documentation, including installation instructions, advanced featur
 
 Moreover to check our development plans and upcoming features, check out our [Roadmap](https://github.com/unclecode/crawl4ai/blob/main/ROADMAP.md).
 
+<details>
+<summary>📈 <strong>Development TODOs</strong></summary>
+
 - [x] 0. Graph Crawler: Smart website traversal using graph search algorithms for comprehensive nested page extraction
 - [ ] 1. Question-Based Crawler: Natural language driven web discovery and content extraction
 - [ ] 2. Knowledge-Optimal Crawler: Smart crawling that maximizes knowledge while minimizing data extraction
@@ -558,6 +561,8 @@ Moreover to check our development plans and upcoming features, check out our [Ro
 - [ ] 10. Sponsorship Program: Structured support system with tiered benefits
 - [ ] 11. Educational Content: "How to Crawl" video series and interactive tutorials
 
+</details>
+
 ## 🤝 Contributing 
 
 We welcome contributions from the open-source community. Check out our [contribution guidelines](https://github.com/unclecode/crawl4ai/blob/main/CONTRIBUTING.md) for more information.
@@ -576,32 +581,32 @@ For questions, suggestions, or feedback, feel free to reach out:
 
 Happy Crawling! 🕸️🚀
 
-
 ## 🗾 Mission
 
-Our mission is to unlock the untapped potential of personal and enterprise data in the digital age. In today's world, individuals and organizations generate vast amounts of valuable digital footprints, yet this data remains largely uncapitalized as a true asset. 
+Our mission is to unlock the value of personal and enterprise data by transforming digital footprints into structured, tradeable assets. Crawl4AI empowers individuals and organizations with open-source tools to extract and structure data, fostering a shared data economy.  
 
-Our open-source solution empowers developers and innovators to build tools for data extraction and structuring, laying the foundation for a new era of data ownership. By transforming personal and enterprise data into structured, tradeable assets, we're creating opportunities for individuals to capitalize on their digital footprints and for organizations to unlock the value of their collective knowledge.
+We envision a future where AI is powered by real human knowledge, ensuring data creators directly benefit from their contributions. By democratizing data and enabling ethical sharing, we are laying the foundation for authentic AI advancement.
 
-This democratization of data represents the first step toward a shared data economy, where willing participation in data sharing drives AI advancement while ensuring the benefits flow back to data creators. Through this approach, we're building a future where AI development is powered by authentic human knowledge rather than synthetic alternatives.
+<details>
+<summary>🔑 <strong>Key Opportunities</strong></summary>
+ 
+- **Data Capitalization**: Transform digital footprints into measurable, valuable assets.  
+- **Authentic AI Data**: Provide AI systems with real human insights.  
+- **Shared Economy**: Create a fair data marketplace that benefits data creators.  
 
-![Mission Diagram](./docs/assets/pitch-dark.svg)
+</details>
 
-For a detailed exploration of our vision, opportunities, and pathway forward, please see our [full mission statement](./MISSION.md).
+<details>
+<summary>🚀 <strong>Development Pathway</strong></summary>
 
-### Key Opportunities
+1. **Open-Source Tools**: Community-driven platforms for transparent data extraction.  
+2. **Digital Asset Structuring**: Tools to organize and value digital knowledge.  
+3. **Ethical Data Marketplace**: A secure, fair platform for exchanging structured data.  
 
-- **Data Capitalization**: Transform digital footprints into valuable assets that can appear on personal and enterprise balance sheets
-- **Authentic Data**: Unlock the vast reservoir of real human insights and knowledge for AI advancement
-- **Shared Economy**: Create new value streams where data creators directly benefit from their contributions
+For more details, see our [full mission statement](./MISSION.md).
+</details>
 
-### Development Pathway
 
-1. **Open-Source Foundation**: Building transparent, community-driven data extraction tools
-2. **Data Capitalization Platform**: Creating tools to structure and value digital assets
-3. **Shared Data Marketplace**: Establishing an economic platform for ethical data exchange
-
-For a detailed exploration of our vision, challenges, and solutions, please see our [full mission statement](./MISSION.md).
 
 
 ## Star History

From 0bccf23db3f90bf07342f34591c91b92eb1cdf89 Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Thu, 28 Nov 2024 18:19:42 +0800
Subject: [PATCH 086/115] docs: update quickstart_async.py to enable example
 function calls for better demonstration

---
 docs/examples/quickstart_async.py | 36 +++++++++++++++----------------
 1 file changed, 18 insertions(+), 18 deletions(-)

diff --git a/docs/examples/quickstart_async.py b/docs/examples/quickstart_async.py
index e50fe456..9f1eff53 100644
--- a/docs/examples/quickstart_async.py
+++ b/docs/examples/quickstart_async.py
@@ -534,31 +534,31 @@ async def fit_markdown_remove_overlay():
 
 
 async def main():
-    # await simple_crawl()
-    # await simple_example_with_running_js_code()
-    # await simple_example_with_css_selector()
-    # await use_proxy()
-    # await capture_and_save_screenshot("https://www.example.com", os.path.join(__location__, "tmp/example_screenshot.jpg"))
-    # await extract_structured_data_using_css_extractor()
+    await simple_crawl()
+    await simple_example_with_running_js_code()
+    await simple_example_with_css_selector()
+    await use_proxy()
+    await capture_and_save_screenshot("https://www.example.com", os.path.join(__location__, "tmp/example_screenshot.jpg"))
+    await extract_structured_data_using_css_extractor()
 
-    # # LLM extraction examples
+    # LLM extraction examples
     # await extract_structured_data_using_llm()
     # await extract_structured_data_using_llm("huggingface/meta-llama/Meta-Llama-3.1-8B-Instruct", os.getenv("HUGGINGFACE_API_KEY"))
-    # await extract_structured_data_using_llm("openai/gpt-4o", os.getenv("OPENAI_API_KEY"))
     # await extract_structured_data_using_llm("ollama/llama3.2")    
+    await extract_structured_data_using_llm("openai/gpt-4o", os.getenv("OPENAI_API_KEY"))
 
-    # # You always can pass custom headers to the extraction strategy
-    # custom_headers = {
-    #     "Authorization": "Bearer your-custom-token",
-    #     "X-Custom-Header": "Some-Value"
-    # }
-    # await extract_structured_data_using_llm(extra_headers=custom_headers)
+    # You always can pass custom headers to the extraction strategy
+    custom_headers = {
+        "Authorization": "Bearer your-custom-token",
+        "X-Custom-Header": "Some-Value"
+    }
+    await extract_structured_data_using_llm(extra_headers=custom_headers)
     
-    # # await crawl_dynamic_content_pages_method_1()
-    # # await crawl_dynamic_content_pages_method_2()
-    # await crawl_dynamic_content_pages_method_3()
+    # await crawl_dynamic_content_pages_method_1()
+    # await crawl_dynamic_content_pages_method_2()
+    await crawl_dynamic_content_pages_method_3()
     
-    # await crawl_custom_browser_type()
+    await crawl_custom_browser_type()
     
     await speed_comparison()
 

From a036b7f12224d6a424118e3d113e49ab1e2c9e13 Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Thu, 28 Nov 2024 19:24:07 +0800
Subject: [PATCH 087/115] feat: implement create_box_message utility for
 formatted error messages and enhance error logging in AsyncWebCrawler

---
 crawl4ai/async_crawler_strategy.py | 21 +++++-----
 crawl4ai/async_webcrawler.py       |  8 ++--
 crawl4ai/utils.py                  | 64 ++++++++++++++++++++++++++++--
 3 files changed, 77 insertions(+), 16 deletions(-)

diff --git a/crawl4ai/async_crawler_strategy.py b/crawl4ai/async_crawler_strategy.py
index 882f9a50..e5316187 100644
--- a/crawl4ai/async_crawler_strategy.py
+++ b/crawl4ai/async_crawler_strategy.py
@@ -15,7 +15,7 @@ import hashlib
 import json
 import uuid
 from .models import AsyncCrawlResponse
-
+from .utils import create_box_message
 from playwright_stealth import StealthConfig, stealth_async
 
 stealth_config = StealthConfig(
@@ -321,10 +321,10 @@ class AsyncPlaywrightCrawlerStrategy(AsyncCrawlerStrategy):
                         "--disable-infobars",
                         "--window-position=0,0",
                         "--ignore-certificate-errors",
-                        "--ignore-certificate-errors-spki-list",
+                        "--ignore-certificate-errors-spki-list"
                     ]
                 }
-
+                
                 # Add channel if specified (try Chrome first)
                 if self.chrome_channel:
                     browser_args["channel"] = self.chrome_channel
@@ -765,12 +765,15 @@ class AsyncPlaywrightCrawlerStrategy(AsyncCrawlerStrategy):
                 await self.execute_hook('before_goto', page, context = context)
                 
 
-                response = await page.goto(
-                    url,
-                    # wait_until=kwargs.get("wait_until", ["domcontentloaded", "networkidle"]),
-                    wait_until=kwargs.get("wait_until", "domcontentloaded"),
-                    timeout=kwargs.get("page_timeout", 60000)
-                )
+                try:
+                    response = await page.goto(
+                        url,
+                        # wait_until=kwargs.get("wait_until", ["domcontentloaded", "networkidle"]),
+                        wait_until=kwargs.get("wait_until", "domcontentloaded"),
+                        timeout=kwargs.get("page_timeout", 60000),
+                    )
+                except Error as e:
+                    raise RuntimeError(f"Failed on navigating ACS-GOTO :\n{str(e)}")
                 
                 # response = await page.goto("about:blank")
                 # await page.evaluate(f"window.location.href = '{url}'")
diff --git a/crawl4ai/async_webcrawler.py b/crawl4ai/async_webcrawler.py
index 5a46fe39..66b4c21b 100644
--- a/crawl4ai/async_webcrawler.py
+++ b/crawl4ai/async_webcrawler.py
@@ -26,8 +26,10 @@ from .utils import (
     sanitize_input_encode,
     InvalidCSSSelectorError,
     format_html,
-    fast_format_html
+    fast_format_html,
+    create_box_message
 )
+
 from urllib.parse import urlparse
 import random
 from .__version__ import __version__ as crawl4ai_version
@@ -326,15 +328,15 @@ class AsyncWebCrawler:
             if not hasattr(e, "msg"):
                 e.msg = str(e)
             # print(f"{Fore.RED}{self.tag_format('ERROR')} {self.log_icons['ERROR']} Failed to crawl {cache_context.display_url[:URL_LOG_SHORTEN_LENGTH]}... | {e.msg}{Style.RESET_ALL}")
+            
             self.logger.error_status(
                 url=cache_context.display_url,
-                error=e.msg,
+                error=create_box_message(e.msg, type = "error"),
                 tag="ERROR"
             )            
             return CrawlResult(
                 url=url, 
                 html="", 
-                markdown=f"[ERROR] 🚫 arun(): Failed to crawl {cache_context.display_url}, error: {e.msg}", 
                 success=False, 
                 error_message=e.msg
             )
diff --git a/crawl4ai/utils.py b/crawl4ai/utils.py
index aaf27e91..253ec079 100644
--- a/crawl4ai/utils.py
+++ b/crawl4ai/utils.py
@@ -17,7 +17,8 @@ from requests.exceptions import InvalidSchema
 import hashlib
 from typing import Optional, Tuple, Dict, Any
 import xxhash
-
+from colorama import Fore, Style, init
+import textwrap
 
 from .html2text import HTML2Text
 class CustomHTML2Text(HTML2Text):
@@ -103,12 +104,67 @@ class CustomHTML2Text(HTML2Text):
             self.preserved_content.append(data)
             return
         super().handle_data(data, entity_char)
-
-
-
 class InvalidCSSSelectorError(Exception):
     pass
 
+
+def create_box_message(
+   message: str, 
+   type: str = "info", 
+   width: int = 80, 
+   add_newlines: bool = True,
+   double_line: bool = False
+) -> str:
+   init()
+   
+   # Define border and text colors for different types
+   styles = {
+       "warning": (Fore.YELLOW, Fore.LIGHTYELLOW_EX, "⚠"),
+       "info": (Fore.BLUE, Fore.LIGHTBLUE_EX, "ℹ"), 
+       "success": (Fore.GREEN, Fore.LIGHTGREEN_EX, "✓"),
+       "error": (Fore.RED, Fore.LIGHTRED_EX, "×"),
+   }
+   
+   border_color, text_color, prefix = styles.get(type.lower(), styles["info"])
+   
+   # Define box characters based on line style
+   box_chars = {
+       "single": ("─", "│", "┌", "┐", "└", "┘"),
+       "double": ("═", "║", "╔", "╗", "╚", "╝")
+   }
+   line_style = "double" if double_line else "single"
+   h_line, v_line, tl, tr, bl, br = box_chars[line_style]
+   
+   # Process lines with lighter text color
+   formatted_lines = []
+   raw_lines = message.split('\n')
+   
+   if raw_lines:
+       first_line = f"{prefix} {raw_lines[0].strip()}"
+       wrapped_first = textwrap.fill(first_line, width=width-4)
+       formatted_lines.extend(wrapped_first.split('\n'))
+       
+       for line in raw_lines[1:]:
+           if line.strip():
+               wrapped = textwrap.fill(f"  {line.strip()}", width=width-4)
+               formatted_lines.extend(wrapped.split('\n'))
+           else:
+               formatted_lines.append("")
+   
+   # Create the box with colored borders and lighter text
+   horizontal_line = h_line * (width - 1)
+   box = [
+       f"{border_color}{tl}{horizontal_line}{tr}",
+       *[f"{border_color}{v_line}{text_color} {line:<{width-2}}{border_color}{v_line}" for line in formatted_lines],
+       f"{border_color}{bl}{horizontal_line}{br}{Style.RESET_ALL}"
+   ]
+   
+   result = "\n".join(box)
+   if add_newlines:
+       result = f"\n{result}\n"
+   
+   return result
+
 def calculate_semaphore_count():
     cpu_count = os.cpu_count()
     memory_gb = get_system_memory() / (1024 ** 3)  # Convert to GB

From a9b6b6523812333400fd66730ce3e3c184ad79e2 Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Thu, 28 Nov 2024 19:26:50 +0800
Subject: [PATCH 088/115] chore: update version to 0.3.744 and add publish.sh
 to .gitignore

---
 .gitignore              | 1 +
 crawl4ai/__version__.py | 2 +-
 2 files changed, 2 insertions(+), 1 deletion(-)

diff --git a/.gitignore b/.gitignore
index 8e96fa82..52e25a2a 100644
--- a/.gitignore
+++ b/.gitignore
@@ -214,3 +214,4 @@ git_issues.md
 todo_executor.md
 protect-all-except-feature.sh
 manage-collab.sh
+publish.sh
\ No newline at end of file
diff --git a/crawl4ai/__version__.py b/crawl4ai/__version__.py
index 073b371c..e38cc61b 100644
--- a/crawl4ai/__version__.py
+++ b/crawl4ai/__version__.py
@@ -1,2 +1,2 @@
 # crawl4ai/_version.py
-__version__ = "0.3.743"
+__version__ = "0.3.744"

From b14e83f49951cba097e67464546ba2b4f2787cdc Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Thu, 28 Nov 2024 19:31:09 +0800
Subject: [PATCH 089/115] docs: fix link formatting for recent updates section
 in README

---
 README.md | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/README.md b/README.md
index d22d8940..26cc9fcc 100644
--- a/README.md
+++ b/README.md
@@ -11,7 +11,7 @@
 
 Crawl4AI is the #1 trending GitHub repository, actively maintained by a vibrant community. It delivers blazing-fast, AI-ready web crawling tailored for LLMs, AI agents, and data pipelines. Open source, flexible, and built for real-time performance, Crawl4AI empowers developers with unmatched speed, precision, and deployment ease.  
 
-[✨ Check out what's new in the latest update!](#recent-updates)  
+[✨ Check out what's new in the latest update!](#-recent-updates)
 
 ## 🧐 Why Crawl4AI?
 

From 776efa74a4c9fde71377f986cc69b201632a59c0 Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Thu, 28 Nov 2024 19:32:32 +0800
Subject: [PATCH 090/115] docs: fix link formatting for recent updates section
 in README

---
 README.md | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/README.md b/README.md
index 26cc9fcc..01197868 100644
--- a/README.md
+++ b/README.md
@@ -11,7 +11,7 @@
 
 Crawl4AI is the #1 trending GitHub repository, actively maintained by a vibrant community. It delivers blazing-fast, AI-ready web crawling tailored for LLMs, AI agents, and data pipelines. Open source, flexible, and built for real-time performance, Crawl4AI empowers developers with unmatched speed, precision, and deployment ease.  
 
-[✨ Check out what's new in the latest update!](#-recent-updates)
+[✨ Check out what's new in the latest update!](#--recent-updates)
 
 ## 🧐 Why Crawl4AI?
 

From 48d43c14b1864b87866e8114f5c4fc6e415b6e51 Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Thu, 28 Nov 2024 19:33:02 +0800
Subject: [PATCH 091/115] docs: fix link formatting for recent updates section
 in README

---
 README.md | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/README.md b/README.md
index 01197868..26cc9fcc 100644
--- a/README.md
+++ b/README.md
@@ -11,7 +11,7 @@
 
 Crawl4AI is the #1 trending GitHub repository, actively maintained by a vibrant community. It delivers blazing-fast, AI-ready web crawling tailored for LLMs, AI agents, and data pipelines. Open source, flexible, and built for real-time performance, Crawl4AI empowers developers with unmatched speed, precision, and deployment ease.  
 
-[✨ Check out what's new in the latest update!](#--recent-updates)
+[✨ Check out what's new in the latest update!](#-recent-updates)
 
 ## 🧐 Why Crawl4AI?
 

From 9221c08418bbfaa0d0cf48b4f933e3a2ae722f3a Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Thu, 28 Nov 2024 19:33:36 +0800
Subject: [PATCH 092/115] docs: fix link formatting for recent updates section
 in README

---
 README.md | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/README.md b/README.md
index d22d8940..26cc9fcc 100644
--- a/README.md
+++ b/README.md
@@ -11,7 +11,7 @@
 
 Crawl4AI is the #1 trending GitHub repository, actively maintained by a vibrant community. It delivers blazing-fast, AI-ready web crawling tailored for LLMs, AI agents, and data pipelines. Open source, flexible, and built for real-time performance, Crawl4AI empowers developers with unmatched speed, precision, and deployment ease.  
 
-[✨ Check out what's new in the latest update!](#recent-updates)  
+[✨ Check out what's new in the latest update!](#-recent-updates)
 
 ## 🧐 Why Crawl4AI?
 

From cf35cbe59e39222b8e3c76ffadc67a7fea55df7a Mon Sep 17 00:00:00 2001
From: Paulo Kuong <pkuong80@gmail.com>
Date: Thu, 28 Nov 2024 06:46:36 -0500
Subject: [PATCH 093/115] CRAWL4_AI_BASE_DIRECTORY should be Path object
 instead of string (#298)

Thank you so much for pointing this out. Yes, that's correct. I accept your pull request, and I will add your name to the contributors list. Thank you again.
---
 setup.py | 50 +++++++++++++++++++++++++++++++++++---------------
 1 file changed, 35 insertions(+), 15 deletions(-)

diff --git a/setup.py b/setup.py
index f5f3cf2d..796c3bf9 100644
--- a/setup.py
+++ b/setup.py
@@ -9,10 +9,16 @@ import asyncio
 
 # Create the .crawl4ai folder in the user's home directory if it doesn't exist
 # If the folder already exists, remove the cache folder
-crawl4ai_folder = os.getenv("CRAWL4_AI_BASE_DIRECTORY", Path.home()) / ".crawl4ai"
+crawl4ai_folder = Path(os.getenv("CRAWL4_AI_BASE_DIRECTORY")) or Path.home()
+crawl4ai_folder = crawl4ai_folder / ".crawl4ai"
 cache_folder = crawl4ai_folder / "cache"
-content_folders = ['html_content', 'cleaned_html', 'markdown_content', 
-                  'extracted_content', 'screenshots']
+content_folders = [
+    "html_content",
+    "cleaned_html",
+    "markdown_content",
+    "extracted_content",
+    "screenshots",
+]
 
 # Clean up old cache if exists
 if cache_folder.exists():
@@ -28,7 +34,7 @@ for folder in content_folders:
 __location__ = os.path.realpath(os.path.join(os.getcwd(), os.path.dirname(__file__)))
 with open(os.path.join(__location__, "requirements.txt")) as f:
     requirements = f.read().splitlines()
-    
+
 with open("crawl4ai/__version__.py") as f:
     for line in f:
         if line.startswith("__version__"):
@@ -37,11 +43,12 @@ with open("crawl4ai/__version__.py") as f:
 
 # Define requirements
 default_requirements = requirements
-torch_requirements = ["torch", "nltk",  "scikit-learn"]
+torch_requirements = ["torch", "nltk", "scikit-learn"]
 transformer_requirements = ["transformers", "tokenizers"]
-cosine_similarity_requirements = ["torch", "transformers", "nltk" ]
+cosine_similarity_requirements = ["torch", "transformers", "nltk"]
 sync_requirements = ["selenium"]
 
+
 def install_playwright():
     print("Installing Playwright browsers...")
     try:
@@ -49,16 +56,22 @@ def install_playwright():
         print("Playwright installation completed successfully.")
     except subprocess.CalledProcessError as e:
         print(f"Error during Playwright installation: {e}")
-        print("Please run 'python -m playwright install' manually after the installation.")
+        print(
+            "Please run 'python -m playwright install' manually after the installation."
+        )
     except Exception as e:
         print(f"Unexpected error during Playwright installation: {e}")
-        print("Please run 'python -m playwright install' manually after the installation.")
+        print(
+            "Please run 'python -m playwright install' manually after the installation."
+        )
+
 
 def run_migration():
     """Initialize database during installation"""
     try:
         print("Starting database initialization...")
         from crawl4ai.async_database import async_db_manager
+
         asyncio.run(async_db_manager.initialize())
         print("Database initialization completed successfully.")
     except ImportError:
@@ -67,12 +80,14 @@ def run_migration():
         print(f"Warning: Database initialization failed: {e}")
         print("Database will be initialized on first use")
 
+
 class PostInstallCommand(install):
     def run(self):
         install.run(self)
         install_playwright()
         # run_migration()
 
+
 setup(
     name="Crawl4AI",
     version=version,
@@ -84,18 +99,23 @@ setup(
     author_email="unclecode@kidocode.com",
     license="MIT",
     packages=find_packages(),
-    install_requires=default_requirements + ["playwright", "aiofiles"],  # Added aiofiles
+    install_requires=default_requirements
+    + ["playwright", "aiofiles"],  # Added aiofiles
     extras_require={
         "torch": torch_requirements,
         "transformer": transformer_requirements,
         "cosine": cosine_similarity_requirements,
         "sync": sync_requirements,
-        "all": default_requirements + torch_requirements + transformer_requirements + cosine_similarity_requirements + sync_requirements,
+        "all": default_requirements
+        + torch_requirements
+        + transformer_requirements
+        + cosine_similarity_requirements
+        + sync_requirements,
     },
     entry_points={
-        'console_scripts': [
-            'crawl4ai-download-models=crawl4ai.model_loader:main',
-            'crawl4ai-migrate=crawl4ai.migrations:main',  # Added migration command
+        "console_scripts": [
+            "crawl4ai-download-models=crawl4ai.model_loader:main",
+            "crawl4ai-migrate=crawl4ai.migrations:main",  # Added migration command
         ],
     },
     classifiers=[
@@ -110,6 +130,6 @@ setup(
     ],
     python_requires=">=3.7",
     cmdclass={
-        'install': PostInstallCommand,
+        "install": PostInstallCommand,
     },
-)
\ No newline at end of file
+)

From 1d83c493aff8672c9da471c222f60c5c72145b71 Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Thu, 28 Nov 2024 19:58:40 +0800
Subject: [PATCH 094/115]   Enhance setup process and update contributors list 
  - Acknowledge contributor paulokuong for fixing CRAWL4_AI_BASE_DIRECTORY
 issue   - Refine base directory handling in `setup.py`   - Clarify Playwright
 installation instructions and improve error handling

---
 CONTRIBUTORS.md |  1 +
 setup.py        | 48 ++++++++++++++++++++++++++++++++++--------------
 2 files changed, 35 insertions(+), 14 deletions(-)

diff --git a/CONTRIBUTORS.md b/CONTRIBUTORS.md
index deb46a9c..663e5541 100644
--- a/CONTRIBUTORS.md
+++ b/CONTRIBUTORS.md
@@ -21,6 +21,7 @@ We would like to thank the following people for their contributions to Crawl4AI:
 - [nelzomal](https://github.com/nelzomal) - Enhance development installation instructions [#286](https://github.com/unclecode/crawl4ai/pull/286)
 - [HamzaFarhan](https://github.com/HamzaFarhan) - Handled the cases where markdown_with_citations, references_markdown, and filtered_html might not be defined [#293](https://github.com/unclecode/crawl4ai/pull/293)
 - [NanmiCoder](https://github.com/NanmiCoder) - fix: crawler strategy exception handling and fixes [#271](https://github.com/unclecode/crawl4ai/pull/271)
+- [paulokuong](https://github.com/paulokuong) - fix: RAWL4_AI_BASE_DIRECTORY should be Path object instead of string [#298](https://github.com/unclecode/crawl4ai/pull/298)
 
 
 ## Other Contributors
diff --git a/setup.py b/setup.py
index f5f3cf2d..dbb07410 100644
--- a/setup.py
+++ b/setup.py
@@ -9,10 +9,16 @@ import asyncio
 
 # Create the .crawl4ai folder in the user's home directory if it doesn't exist
 # If the folder already exists, remove the cache folder
-crawl4ai_folder = os.getenv("CRAWL4_AI_BASE_DIRECTORY", Path.home()) / ".crawl4ai"
+crawl4ai_folder = Path(os.getenv("CRAWL4_AI_BASE_DIRECTORY")) or Path.home()
+crawl4ai_folder = crawl4ai_folder / ".crawl4ai"
 cache_folder = crawl4ai_folder / "cache"
-content_folders = ['html_content', 'cleaned_html', 'markdown_content', 
-                  'extracted_content', 'screenshots']
+content_folders = [
+    "html_content",
+    "cleaned_html",
+    "markdown_content",
+    "extracted_content",
+    "screenshots",
+]
 
 # Clean up old cache if exists
 if cache_folder.exists():
@@ -28,7 +34,7 @@ for folder in content_folders:
 __location__ = os.path.realpath(os.path.join(os.getcwd(), os.path.dirname(__file__)))
 with open(os.path.join(__location__, "requirements.txt")) as f:
     requirements = f.read().splitlines()
-    
+
 with open("crawl4ai/__version__.py") as f:
     for line in f:
         if line.startswith("__version__"):
@@ -37,11 +43,12 @@ with open("crawl4ai/__version__.py") as f:
 
 # Define requirements
 default_requirements = requirements
-torch_requirements = ["torch", "nltk",  "scikit-learn"]
+torch_requirements = ["torch", "nltk", "scikit-learn"]
 transformer_requirements = ["transformers", "tokenizers"]
-cosine_similarity_requirements = ["torch", "transformers", "nltk" ]
+cosine_similarity_requirements = ["torch", "transformers", "nltk"]
 sync_requirements = ["selenium"]
 
+
 def install_playwright():
     print("Installing Playwright browsers...")
     try:
@@ -49,16 +56,22 @@ def install_playwright():
         print("Playwright installation completed successfully.")
     except subprocess.CalledProcessError as e:
         print(f"Error during Playwright installation: {e}")
-        print("Please run 'python -m playwright install' manually after the installation.")
+        print(
+            "Please run 'python -m playwright install' manually after the installation."
+        )
     except Exception as e:
         print(f"Unexpected error during Playwright installation: {e}")
-        print("Please run 'python -m playwright install' manually after the installation.")
+        print(
+            "Please run 'python -m playwright install' manually after the installation."
+        )
+
 
 def run_migration():
     """Initialize database during installation"""
     try:
         print("Starting database initialization...")
         from crawl4ai.async_database import async_db_manager
+
         asyncio.run(async_db_manager.initialize())
         print("Database initialization completed successfully.")
     except ImportError:
@@ -67,12 +80,14 @@ def run_migration():
         print(f"Warning: Database initialization failed: {e}")
         print("Database will be initialized on first use")
 
+
 class PostInstallCommand(install):
     def run(self):
         install.run(self)
         install_playwright()
         # run_migration()
 
+
 setup(
     name="Crawl4AI",
     version=version,
@@ -84,18 +99,23 @@ setup(
     author_email="unclecode@kidocode.com",
     license="MIT",
     packages=find_packages(),
-    install_requires=default_requirements + ["playwright", "aiofiles"],  # Added aiofiles
+    install_requires=default_requirements
+    + ["playwright", "aiofiles"],  # Added aiofiles
     extras_require={
         "torch": torch_requirements,
         "transformer": transformer_requirements,
         "cosine": cosine_similarity_requirements,
         "sync": sync_requirements,
-        "all": default_requirements + torch_requirements + transformer_requirements + cosine_similarity_requirements + sync_requirements,
+        "all": default_requirements
+        + torch_requirements
+        + transformer_requirements
+        + cosine_similarity_requirements
+        + sync_requirements,
     },
     entry_points={
-        'console_scripts': [
-            'crawl4ai-download-models=crawl4ai.model_loader:main',
-            'crawl4ai-migrate=crawl4ai.migrations:main',  # Added migration command
+        "console_scripts": [
+            "crawl4ai-download-models=crawl4ai.model_loader:main",
+            "crawl4ai-migrate=crawl4ai.migrations:main",  # Added migration command
         ],
     },
     classifiers=[
@@ -110,6 +130,6 @@ setup(
     ],
     python_requires=">=3.7",
     cmdclass={
-        'install': PostInstallCommand,
+        "install": PostInstallCommand,
     },
 )
\ No newline at end of file

From 652d396a818a01d9673920da8c1a2d166f0d23f1 Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Thu, 28 Nov 2024 20:00:29 +0800
Subject: [PATCH 095/115] chore: update version to 0.3.745

---
 crawl4ai/__version__.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/crawl4ai/__version__.py b/crawl4ai/__version__.py
index e38cc61b..8b69d491 100644
--- a/crawl4ai/__version__.py
+++ b/crawl4ai/__version__.py
@@ -1,2 +1,2 @@
 # crawl4ai/_version.py
-__version__ = "0.3.744"
+__version__ = "0.3.745"

From 7d81c17cca98b720d06743d6398d1184350ccc75 Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Thu, 28 Nov 2024 20:02:39 +0800
Subject: [PATCH 096/115] fix: improve handling of CRAWL4_AI_BASE_DIRECTORY
 environment variable in setup.py

---
 setup.py | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/setup.py b/setup.py
index dbb07410..d891ff9f 100644
--- a/setup.py
+++ b/setup.py
@@ -9,7 +9,8 @@ import asyncio
 
 # Create the .crawl4ai folder in the user's home directory if it doesn't exist
 # If the folder already exists, remove the cache folder
-crawl4ai_folder = Path(os.getenv("CRAWL4_AI_BASE_DIRECTORY")) or Path.home()
+base_dir = os.getenv("CRAWL4_AI_BASE_DIRECTORY")
+crawl4ai_folder = Path(base_dir) if base_dir else Path.home()
 crawl4ai_folder = crawl4ai_folder / ".crawl4ai"
 cache_folder = crawl4ai_folder / "cache"
 content_folders = [

From c8485776fe2e475bbba1f8ee513679999283441c Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Thu, 28 Nov 2024 20:04:16 +0800
Subject: [PATCH 097/115] docs: update README to reflect latest version
 v0.3.745

---
 README.md | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/README.md b/README.md
index 26cc9fcc..e8e6cddf 100644
--- a/README.md
+++ b/README.md
@@ -11,7 +11,7 @@
 
 Crawl4AI is the #1 trending GitHub repository, actively maintained by a vibrant community. It delivers blazing-fast, AI-ready web crawling tailored for LLMs, AI agents, and data pipelines. Open source, flexible, and built for real-time performance, Crawl4AI empowers developers with unmatched speed, precision, and deployment ease.  
 
-[✨ Check out what's new in the latest update!](#-recent-updates)
+[✨ Check out latest update v0.3.745](#-recent-updates)
 
 ## 🧐 Why Crawl4AI?
 

From c0e87abaee97e9e206eb787f8939fdf8790f4a2b Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Thu, 28 Nov 2024 21:43:08 +0800
Subject: [PATCH 098/115] fix: update package versions in requirements.txt for
 compatibility

---
 requirements.txt | 8 ++++----
 1 file changed, 4 insertions(+), 4 deletions(-)

diff --git a/requirements.txt b/requirements.txt
index ed259ac9..c0f6f183 100644
--- a/requirements.txt
+++ b/requirements.txt
@@ -1,16 +1,16 @@
 aiosqlite~=0.20
 html2text~=2024.2
 lxml~=5.3
-litellm~=1.48
+litellm>=1.53.1
 numpy>=1.26.0,<3
 pillow~=10.4
-playwright>=1.47,<1.48
+playwright>=1.49.0
 python-dotenv~=1.0
 requests~=2.26
 beautifulsoup4~=4.12
-tf-playwright-stealth~=1.0
+tf-playwright-stealth>=1.1.0
 xxhash~=3.4
 rank-bm25~=0.2
-aiofiles~=24.0
+aiofiles>=24.1.0
 colorama~=0.4
 snowballstemmer~=2.2
\ No newline at end of file

From b0419edda6c0a25da82f65f557beee4e0a3daf02 Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Fri, 29 Nov 2024 02:31:17 +0800
Subject: [PATCH 099/115] Update README.md (#300)

---
 README.md | 28 ----------------------------
 1 file changed, 28 deletions(-)

diff --git a/README.md b/README.md
index e8e6cddf..c9d92e17 100644
--- a/README.md
+++ b/README.md
@@ -125,34 +125,6 @@ if __name__ == "__main__":
 
 ✨ Visit our [Documentation Website](https://crawl4ai.com/mkdocs/)
 
-## Features ✨
-
-- 🆓 Completely free and open-source
-- 🚀 Blazing fast performance, outperforming many paid services
-- 🤖 LLM-friendly output formats (JSON, cleaned HTML, markdown)
-- 🌐 Multi-browser support (Chromium, Firefox, WebKit)
-- 🌍 Supports crawling multiple URLs simultaneously
-- 🎨 Extracts and returns all media tags (Images, Audio, and Video)
-- 🔗 Extracts all external and internal links
-- 📚 Extracts metadata from the page
-- 🔄 Custom hooks for authentication, headers, and page modifications
-- 🕵️ User-agent customization
-- 🖼️ Takes screenshots of pages with enhanced error handling
-- 📜 Executes multiple custom JavaScripts before crawling
-- 📊 Generates structured output without LLM using JsonCssExtractionStrategy
-- 📚 Various chunking strategies: topic-based, regex, sentence, and more
-- 🧠 Advanced extraction strategies: cosine clustering, LLM, and more
-- 🎯 CSS selector support for precise data extraction
-- 📝 Passes instructions/keywords to refine extraction
-- 🔒 Proxy support with authentication for enhanced access
-- 🔄 Session management for complex multi-page crawling
-- 🌐 Asynchronous architecture for improved performance
-- 🖼️ Improved image processing with lazy-loading detection
-- 🕰️ Enhanced handling of delayed content loading
-- 🔑 Custom headers support for LLM interactions
-- 🖼️ iframe content extraction for comprehensive analysis
-- ⏱️ Flexible timeout and delayed content retrieval options
-
 ## Installation 🛠️
 
 Crawl4AI offers flexible installation options to suit various use cases. You can install it as a Python package or use Docker.

From 449dd7cc0b9d81e0f602b3868b478c8515a45bf1 Mon Sep 17 00:00:00 2001
From: unclecode <unclecode@kidocode.com>
Date: Fri, 29 Nov 2024 14:45:04 +0800
Subject: [PATCH 100/115] Migrating from the classic setup.py to a
 PyProject approach.

---
 MANIFEST.in                       |   1 -
 build_hooks.py                    |  48 +++++++++++
 docs/examples/quickstart_async.py | 128 +++++++++++++++++-----------
 plugin.py                         |   9 ++
 post_install.py                   |  19 +++++
 pyproject.toml                    |  75 ++++++++++++++++
 requirements.txt                  |  16 ----
 setup.cfg                         |   2 -
 setup.py                          | 136 ------------------------------
 9 files changed, 229 insertions(+), 205 deletions(-)
 delete mode 100644 MANIFEST.in
 create mode 100644 build_hooks.py
 create mode 100644 plugin.py
 create mode 100644 post_install.py
 create mode 100644 pyproject.toml
 delete mode 100644 requirements.txt
 delete mode 100644 setup.cfg
 delete mode 100644 setup.py

diff --git a/MANIFEST.in b/MANIFEST.in
deleted file mode 100644
index 540b7204..00000000
--- a/MANIFEST.in
+++ /dev/null
@@ -1 +0,0 @@
-include requirements.txt
\ No newline at end of file
diff --git a/build_hooks.py b/build_hooks.py
new file mode 100644
index 00000000..e59b5910
--- /dev/null
+++ b/build_hooks.py
@@ -0,0 +1,48 @@
+import os
+import shutil
+from pathlib import Path
+import subprocess
+import sys
+from hatchling.builders.hooks.plugin.interface import BuildHookInterface
+PLUGIN = "CustomBuildHook" 
+
+class CustomBuildHook(BuildHookInterface):
+    def initialize(self, version, build_data):
+        # Create the .crawl4ai folder structure
+        base_dir = os.getenv("CRAWL4_AI_BASE_DIRECTORY")
+        crawl4ai_folder = Path(base_dir) if base_dir else Path.home()
+        crawl4ai_folder = crawl4ai_folder / ".crawl4ai"
+        cache_folder = crawl4ai_folder / "cache"
+        content_folders = [
+            "html_content",
+            "cleaned_html",
+            "markdown_content",
+            "extracted_content",
+            "screenshots",
+        ]
+
+        # Clean up old cache if exists
+        if cache_folder.exists():
+            shutil.rmtree(cache_folder)
+
+        # Create new folder structure
+        crawl4ai_folder.mkdir(exist_ok=True)
+        cache_folder.mkdir(exist_ok=True)
+        for folder in content_folders:
+            (crawl4ai_folder / folder).mkdir(exist_ok=True)
+
+        # Install Playwright browsers
+        try:
+            subprocess.check_call([sys.executable, "-m", "playwright", "install"])
+        except Exception as e:
+            print(f"Warning: Playwright installation failed: {e}")
+            print("Please run 'python -m playwright install' manually after installation")
+
+        # Initialize database
+        try:
+            from crawl4ai.async_database import async_db_manager
+            import asyncio
+            asyncio.run(async_db_manager.initialize())
+        except Exception as e:
+            print(f"Warning: Database initialization failed: {e}")
+            print("Database will be initialized on first use")
\ No newline at end of file
diff --git a/docs/examples/quickstart_async.py b/docs/examples/quickstart_async.py
index 9f1eff53..01f7677c 100644
--- a/docs/examples/quickstart_async.py
+++ b/docs/examples/quickstart_async.py
@@ -32,7 +32,7 @@ print("Website: https://crawl4ai.com")
 async def simple_crawl():
     print("\n--- Basic Usage ---")
     async with AsyncWebCrawler(verbose=True) as crawler:
-        result = await crawler.arun(url="https://www.nbcnews.com/business")
+        result = await crawler.arun(url="https://www.nbcnews.com/business", cache_mode= CacheMode.BYPASS)
         print(result.markdown[:500])  # Print first 500 characters
 
 async def simple_example_with_running_js_code():
@@ -76,16 +76,17 @@ async def use_proxy():
     async with AsyncWebCrawler(verbose=True, proxy="http://your-proxy-url:port") as crawler:
         result = await crawler.arun(
             url="https://www.nbcnews.com/business",
-            bypass_cache=True
+            cache_mode= CacheMode.BYPASS
         )
-        print(result.markdown[:500])  # Print first 500 characters
+        if result.success:
+            print(result.markdown[:500])  # Print first 500 characters
 
 async def capture_and_save_screenshot(url: str, output_path: str):
     async with AsyncWebCrawler(verbose=True) as crawler:
         result = await crawler.arun(
             url=url,
             screenshot=True,
-            bypass_cache=True
+            cache_mode= CacheMode.BYPASS
         )
         
         if result.success and result.screenshot:
@@ -141,41 +142,68 @@ async def extract_structured_data_using_llm(provider: str, api_token: str = None
 async def extract_structured_data_using_css_extractor():
     print("\n--- Using JsonCssExtractionStrategy for Fast Structured Output ---")
     schema = {
-        "name": "Coinbase Crypto Prices",
-        "baseSelector": ".cds-tableRow-t45thuk",
-        "fields": [
-            {
-                "name": "crypto",
-                "selector": "td:nth-child(1) h2",
-                "type": "text",
-            },
-            {
-                "name": "symbol",
-                "selector": "td:nth-child(1) p",
-                "type": "text",
-            },
-            {
-                "name": "price",
-                "selector": "td:nth-child(2)",
-                "type": "text",
+    "name": "KidoCode Courses",
+    "baseSelector": "section.charge-methodology .w-tab-content > div",
+    "fields": [
+        {
+            "name": "section_title",
+            "selector": "h3.heading-50",
+            "type": "text",
+        },
+        {
+            "name": "section_description",
+            "selector": ".charge-content",
+            "type": "text",
+        },
+        {
+            "name": "course_name",
+            "selector": ".text-block-93",
+            "type": "text",
+        },
+        {
+            "name": "course_description",
+            "selector": ".course-content-text",
+            "type": "text",
+        },
+        {
+            "name": "course_icon",
+            "selector": ".image-92",
+            "type": "attribute",
+            "attribute": "src"
+        }
+    ]
+}
+
+    async with AsyncWebCrawler(
+        headless=True,
+        verbose=True
+    ) as crawler:
+        
+        # Create the JavaScript that handles clicking multiple times
+        js_click_tabs = """
+        (async () => {
+            const tabs = document.querySelectorAll("section.charge-methodology .tabs-menu-3 > div");
+            
+            for(let tab of tabs) {
+                // scroll to the tab
+                tab.scrollIntoView();
+                tab.click();
+                // Wait for content to load and animations to complete
+                await new Promise(r => setTimeout(r, 500));
             }
-        ],
-    }
+        })();
+        """     
 
-    extraction_strategy = JsonCssExtractionStrategy(schema, verbose=True)
-
-    async with AsyncWebCrawler(verbose=True) as crawler:
         result = await crawler.arun(
-            url="https://www.coinbase.com/explore",
-            extraction_strategy=extraction_strategy,
-            cache_mode=CacheMode.BYPASS,
+            url="https://www.kidocode.com/degrees/technology",
+            extraction_strategy=JsonCssExtractionStrategy(schema, verbose=True),
+            js_code=[js_click_tabs],
+            cache_mode=CacheMode.BYPASS
         )
 
-        assert result.success, "Failed to crawl the page"
-
-        news_teasers = json.loads(result.extracted_content)
-        print(f"Successfully extracted {len(news_teasers)} news teasers")
-        print(json.dumps(news_teasers[0], indent=2))
+        companies = json.loads(result.extracted_content)
+        print(f"Successfully extracted {len(companies)} companies")
+        print(json.dumps(companies[0], indent=2))
 
 # Advanced Session-Based Crawling with Dynamic Content 🔄
 async def crawl_dynamic_content_pages_method_1():
@@ -363,21 +391,21 @@ async def crawl_custom_browser_type():
     # Use Firefox
     start = time.time()
     async with AsyncWebCrawler(browser_type="firefox", verbose=True, headless = True) as crawler:
-        result = await crawler.arun(url="https://www.example.com", bypass_cache=True)
+        result = await crawler.arun(url="https://www.example.com", cache_mode= CacheMode.BYPASS)
         print(result.markdown[:500])
         print("Time taken: ", time.time() - start)
 
     # Use WebKit
     start = time.time()
     async with AsyncWebCrawler(browser_type="webkit", verbose=True, headless = True) as crawler:
-        result = await crawler.arun(url="https://www.example.com", bypass_cache=True)
+        result = await crawler.arun(url="https://www.example.com", cache_mode= CacheMode.BYPASS)
         print(result.markdown[:500])
         print("Time taken: ", time.time() - start)
 
     # Use Chromium (default)
     start = time.time()
     async with AsyncWebCrawler(verbose=True, headless = True) as crawler:
-        result = await crawler.arun(url="https://www.example.com", bypass_cache=True)
+        result = await crawler.arun(url="https://www.example.com", cache_mode= CacheMode.BYPASS)
         print(result.markdown[:500])
         print("Time taken: ", time.time() - start)
 
@@ -534,29 +562,29 @@ async def fit_markdown_remove_overlay():
 
 
 async def main():
-    await simple_crawl()
-    await simple_example_with_running_js_code()
-    await simple_example_with_css_selector()
-    await use_proxy()
-    await capture_and_save_screenshot("https://www.example.com", os.path.join(__location__, "tmp/example_screenshot.jpg"))
-    await extract_structured_data_using_css_extractor()
+    # await simple_crawl()
+    # await simple_example_with_running_js_code()
+    # await simple_example_with_css_selector()
+    # await use_proxy()
+    # await capture_and_save_screenshot("https://www.example.com", os.path.join(__location__, "tmp/example_screenshot.jpg"))
+    # await extract_structured_data_using_css_extractor()
 
     # LLM extraction examples
     # await extract_structured_data_using_llm()
     # await extract_structured_data_using_llm("huggingface/meta-llama/Meta-Llama-3.1-8B-Instruct", os.getenv("HUGGINGFACE_API_KEY"))
     # await extract_structured_data_using_llm("ollama/llama3.2")    
-    await extract_structured_data_using_llm("openai/gpt-4o", os.getenv("OPENAI_API_KEY"))
+    # await extract_structured_data_using_llm("openai/gpt-4o", os.getenv("OPENAI_API_KEY"))
 
     # You always can pass custom headers to the extraction strategy
-    custom_headers = {
-        "Authorization": "Bearer your-custom-token",
-        "X-Custom-Header": "Some-Value"
-    }
-    await extract_structured_data_using_llm(extra_headers=custom_headers)
+    # custom_headers = {
+    #     "Authorization": "Bearer your-custom-token",
+    #     "X-Custom-Header": "Some-Value"
+    # }
+    # await extract_structured_data_using_llm(extra_headers=custom_headers)
     
     # await crawl_dynamic_content_pages_method_1()
     # await crawl_dynamic_content_pages_method_2()
-    await crawl_dynamic_content_pages_method_3()
+    # await crawl_dynamic_content_pages_method_3()
     
     await crawl_custom_browser_type()
     
diff --git a/plugin.py b/plugin.py
new file mode 100644
index 00000000..1e1b11bf
--- /dev/null
+++ b/plugin.py
@@ -0,0 +1,9 @@
+from colorama import Fore, Style
+import subprocess
+import sys
+
+def post_install():
+    print(f"\n{Fore.YELLOW}{'='*40}")
+    print(f"{Fore.RED}IMPORTANT: Run this command now:")
+    print(f"{Fore.GREEN}python -m playwright install")
+    print(f"{Fore.YELLOW}{'='*40}{Style.RESET_ALL}\n")
\ No newline at end of file
diff --git a/post_install.py b/post_install.py
new file mode 100644
index 00000000..e536e547
--- /dev/null
+++ b/post_install.py
@@ -0,0 +1,19 @@
+from colorama import Fore, Style
+import subprocess
+import sys
+import distutils.log as log
+from pathlib import Path
+
+def main():
+    try:
+        subprocess.check_call([sys.executable, "-m", "playwright", "install"], 
+                            stdout=subprocess.DEVNULL, 
+                            stderr=subprocess.DEVNULL)
+    except:
+        print(f"\n{Fore.YELLOW}{'='*40}")
+        print(f"{Fore.RED}IMPORTANT: Run this command now:")
+        print(f"{Fore.GREEN}python -m playwright install")
+        print(f"{Fore.YELLOW}{'='*40}{Style.RESET_ALL}\n")
+
+if __name__ == "__main__":
+    main()
\ No newline at end of file
diff --git a/pyproject.toml b/pyproject.toml
new file mode 100644
index 00000000..cfef8101
--- /dev/null
+++ b/pyproject.toml
@@ -0,0 +1,75 @@
+[build-system]
+requires = ["hatchling", "hatch-fancy-pypi-readme>=22.5.0"]
+build-backend = "hatchling.build"
+
+[project]
+name = "Crawl4AI"
+dynamic = ["version"]
+description = "🔥🕷️ Crawl4AI: Open-source LLM Friendly Web Crawler & scraper"
+readme = "README.md"
+license = "Apache-2.0"
+requires-python = ">=3.7"
+authors = [
+    { name = "Unclecode", email = "unclecode@kidocode.com" },
+]
+classifiers = [
+    "Development Status :: 3 - Alpha",
+    "Intended Audience :: Developers",
+    "License :: OSI Approved :: Apache Software License",
+    "Programming Language :: Python :: 3",
+    "Programming Language :: Python :: 3.7",
+    "Programming Language :: Python :: 3.8",
+    "Programming Language :: Python :: 3.9",
+    "Programming Language :: Python :: 3.10",
+]
+dependencies = [
+    "aiosqlite~=0.20",
+    "html2text~=2024.2",
+    "lxml~=5.3",
+    "litellm>=1.53.1",
+    "numpy>=1.26.0,<3",
+    "pillow~=10.4",
+    "playwright>=1.49.0",
+    "python-dotenv~=1.0",
+    "requests~=2.26",
+    "beautifulsoup4~=4.12",
+    "tf-playwright-stealth>=1.1.0",
+    "xxhash~=3.4",
+    "rank-bm25~=0.2", 
+    "aiofiles>=24.1.0",
+    "colorama~=0.4",
+    "snowballstemmer~=2.2",
+]
+
+[project.optional-dependencies]
+torch = ["torch", "nltk", "scikit-learn"]
+transformer = ["transformers", "tokenizers"]
+cosine = ["torch", "transformers", "nltk"]
+sync = ["selenium"]
+all = [
+    "torch",
+    "nltk",
+    "scikit-learn",
+    "transformers",
+    "tokenizers",
+    "selenium",
+]
+
+[project.urls]
+Homepage = "https://github.com/unclecode/crawl4ai"
+Documentation = "https://crawl4ai.com/mkdocs/"
+
+[project.scripts]
+crawl4ai-download-models = "crawl4ai.model_loader:main"
+crawl4ai-migrate = "crawl4ai.migrations:main"
+crawl4ai-post-install = "crawl4ai.post_install:main"
+
+[tool.hatch.version]
+path = "crawl4ai/__version__.py"
+
+[tool.hatch.build.hooks.custom]
+dependencies = ["hatch-fancy-pypi-readme>=22.5.0"]
+path = "build_hooks.py"
+
+[project.entry-points.hatch]
+crawl4ai = "crawl4ai.plugin:post_install"
diff --git a/requirements.txt b/requirements.txt
deleted file mode 100644
index c0f6f183..00000000
--- a/requirements.txt
+++ /dev/null
@@ -1,16 +0,0 @@
-aiosqlite~=0.20
-html2text~=2024.2
-lxml~=5.3
-litellm>=1.53.1
-numpy>=1.26.0,<3
-pillow~=10.4
-playwright>=1.49.0
-python-dotenv~=1.0
-requests~=2.26
-beautifulsoup4~=4.12
-tf-playwright-stealth>=1.1.0
-xxhash~=3.4
-rank-bm25~=0.2
-aiofiles>=24.1.0
-colorama~=0.4
-snowballstemmer~=2.2
\ No newline at end of file
diff --git a/setup.cfg b/setup.cfg
deleted file mode 100644
index 56490d6a..00000000
--- a/setup.cfg
+++ /dev/null
@@ -1,2 +0,0 @@
-[options]
-include_package_data = True
\ No newline at end of file
diff --git a/setup.py b/setup.py
deleted file mode 100644
index d44169bf..00000000
--- a/setup.py
+++ /dev/null
@@ -1,136 +0,0 @@
-from setuptools import setup, find_packages
-from setuptools.command.install import install
-import os
-from pathlib import Path
-import shutil
-import subprocess
-import sys
-import asyncio
-
-# Create the .crawl4ai folder in the user's home directory if it doesn't exist
-# If the folder already exists, remove the cache folder
-base_dir = os.getenv("CRAWL4_AI_BASE_DIRECTORY")
-crawl4ai_folder = Path(base_dir) if base_dir else Path.home()
-crawl4ai_folder = crawl4ai_folder / ".crawl4ai"
-cache_folder = crawl4ai_folder / "cache"
-content_folders = [
-    "html_content",
-    "cleaned_html",
-    "markdown_content",
-    "extracted_content",
-    "screenshots",
-]
-
-# Clean up old cache if exists
-if cache_folder.exists():
-    shutil.rmtree(cache_folder)
-
-# Create new folder structure
-crawl4ai_folder.mkdir(exist_ok=True)
-cache_folder.mkdir(exist_ok=True)
-for folder in content_folders:
-    (crawl4ai_folder / folder).mkdir(exist_ok=True)
-
-# Read requirements and version
-__location__ = os.path.realpath(os.path.join(os.getcwd(), os.path.dirname(__file__)))
-with open(os.path.join(__location__, "requirements.txt")) as f:
-    requirements = f.read().splitlines()
-
-with open("crawl4ai/__version__.py") as f:
-    for line in f:
-        if line.startswith("__version__"):
-            version = line.split("=")[1].strip().strip('"')
-            break
-
-# Define requirements
-default_requirements = requirements
-torch_requirements = ["torch", "nltk", "scikit-learn"]
-transformer_requirements = ["transformers", "tokenizers"]
-cosine_similarity_requirements = ["torch", "transformers", "nltk"]
-sync_requirements = ["selenium"]
-
-
-def install_playwright():
-    print("Installing Playwright browsers...")
-    try:
-        subprocess.check_call([sys.executable, "-m", "playwright", "install"])
-        print("Playwright installation completed successfully.")
-    except subprocess.CalledProcessError as e:
-        print(f"Error during Playwright installation: {e}")
-        print(
-            "Please run 'python -m playwright install' manually after the installation."
-        )
-    except Exception as e:
-        print(f"Unexpected error during Playwright installation: {e}")
-        print(
-            "Please run 'python -m playwright install' manually after the installation."
-        )
-
-
-def run_migration():
-    """Initialize database during installation"""
-    try:
-        print("Starting database initialization...")
-        from crawl4ai.async_database import async_db_manager
-
-        asyncio.run(async_db_manager.initialize())
-        print("Database initialization completed successfully.")
-    except ImportError:
-        print("Warning: Database module not found. Will initialize on first use.")
-    except Exception as e:
-        print(f"Warning: Database initialization failed: {e}")
-        print("Database will be initialized on first use")
-
-
-class PostInstallCommand(install):
-    def run(self):
-        install.run(self)
-        install_playwright()
-        # run_migration()
-
-
-setup(
-    name="Crawl4AI",
-    version=version,
-    description="🔥🕷️ Crawl4AI: Open-source LLM Friendly Web Crawler & scraper",
-    long_description=open("README.md", encoding="utf-8").read(),
-    long_description_content_type="text/markdown",
-    url="https://github.com/unclecode/crawl4ai",
-    author="Unclecode",
-    author_email="unclecode@kidocode.com",
-    license="MIT",
-    packages=find_packages(),
-    install_requires=default_requirements
-    + ["playwright", "aiofiles"],  # Added aiofiles
-    extras_require={
-        "torch": torch_requirements,
-        "transformer": transformer_requirements,
-        "cosine": cosine_similarity_requirements,
-        "sync": sync_requirements,
-        "all": default_requirements
-        + torch_requirements
-        + transformer_requirements
-        + cosine_similarity_requirements
-        + sync_requirements,
-    },
-    entry_points={
-        "console_scripts": [
-            "crawl4ai-download-models=crawl4ai.model_loader:main",
-            "crawl4ai-migrate=crawl4ai.migrations:main",  # Added migration command
-        ],
-    },
-    classifiers=[
-        "Development Status :: 3 - Alpha",
-        "Intended Audience :: Developers",
-        "License :: OSI Approved :: Apache Software License",
-        "Programming Language :: Python :: 3",
-        "Programming Language :: Python :: 3.7",
-        "Programming Language :: Python :: 3.8",
-        "Programming Language :: Python :: 3.9",
-        "Programming Language :: Python :: 3.10",
-    ],
-    python_requires=">=3.7",
-    cmdclass={
-        "install": PostInstallCommand,
-    },
-)

From 12e73d489846dc83c29347bf84646ad8daef6cfc Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Fri, 29 Nov 2024 16:01:19 +0800
Subject: [PATCH 101/115] refactor: remove legacy build hooks and setup files,
 migrate to setup.cfg and pyproject.toml

---
 MANIFEST.in      |   1 +
 build_hooks.py   |  48 -----------------
 plugin.py        |   9 ----
 post_install.py  |  19 -------
 pyproject.toml   |  75 --------------------------
 requirements.txt |  16 ++++++
 setup.cfg        |   2 +
 setup.py         | 136 +++++++++++++++++++++++++++++++++++++++++++++++
 8 files changed, 155 insertions(+), 151 deletions(-)
 create mode 100644 MANIFEST.in
 delete mode 100644 build_hooks.py
 delete mode 100644 plugin.py
 delete mode 100644 post_install.py
 delete mode 100644 pyproject.toml
 create mode 100644 requirements.txt
 create mode 100644 setup.cfg
 create mode 100644 setup.py

diff --git a/MANIFEST.in b/MANIFEST.in
new file mode 100644
index 00000000..540b7204
--- /dev/null
+++ b/MANIFEST.in
@@ -0,0 +1 @@
+include requirements.txt
\ No newline at end of file
diff --git a/build_hooks.py b/build_hooks.py
deleted file mode 100644
index e59b5910..00000000
--- a/build_hooks.py
+++ /dev/null
@@ -1,48 +0,0 @@
-import os
-import shutil
-from pathlib import Path
-import subprocess
-import sys
-from hatchling.builders.hooks.plugin.interface import BuildHookInterface
-PLUGIN = "CustomBuildHook" 
-
-class CustomBuildHook(BuildHookInterface):
-    def initialize(self, version, build_data):
-        # Create the .crawl4ai folder structure
-        base_dir = os.getenv("CRAWL4_AI_BASE_DIRECTORY")
-        crawl4ai_folder = Path(base_dir) if base_dir else Path.home()
-        crawl4ai_folder = crawl4ai_folder / ".crawl4ai"
-        cache_folder = crawl4ai_folder / "cache"
-        content_folders = [
-            "html_content",
-            "cleaned_html",
-            "markdown_content",
-            "extracted_content",
-            "screenshots",
-        ]
-
-        # Clean up old cache if exists
-        if cache_folder.exists():
-            shutil.rmtree(cache_folder)
-
-        # Create new folder structure
-        crawl4ai_folder.mkdir(exist_ok=True)
-        cache_folder.mkdir(exist_ok=True)
-        for folder in content_folders:
-            (crawl4ai_folder / folder).mkdir(exist_ok=True)
-
-        # Install Playwright browsers
-        try:
-            subprocess.check_call([sys.executable, "-m", "playwright", "install"])
-        except Exception as e:
-            print(f"Warning: Playwright installation failed: {e}")
-            print("Please run 'python -m playwright install' manually after installation")
-
-        # Initialize database
-        try:
-            from crawl4ai.async_database import async_db_manager
-            import asyncio
-            asyncio.run(async_db_manager.initialize())
-        except Exception as e:
-            print(f"Warning: Database initialization failed: {e}")
-            print("Database will be initialized on first use")
\ No newline at end of file
diff --git a/plugin.py b/plugin.py
deleted file mode 100644
index 1e1b11bf..00000000
--- a/plugin.py
+++ /dev/null
@@ -1,9 +0,0 @@
-from colorama import Fore, Style
-import subprocess
-import sys
-
-def post_install():
-    print(f"\n{Fore.YELLOW}{'='*40}")
-    print(f"{Fore.RED}IMPORTANT: Run this command now:")
-    print(f"{Fore.GREEN}python -m playwright install")
-    print(f"{Fore.YELLOW}{'='*40}{Style.RESET_ALL}\n")
\ No newline at end of file
diff --git a/post_install.py b/post_install.py
deleted file mode 100644
index e536e547..00000000
--- a/post_install.py
+++ /dev/null
@@ -1,19 +0,0 @@
-from colorama import Fore, Style
-import subprocess
-import sys
-import distutils.log as log
-from pathlib import Path
-
-def main():
-    try:
-        subprocess.check_call([sys.executable, "-m", "playwright", "install"], 
-                            stdout=subprocess.DEVNULL, 
-                            stderr=subprocess.DEVNULL)
-    except:
-        print(f"\n{Fore.YELLOW}{'='*40}")
-        print(f"{Fore.RED}IMPORTANT: Run this command now:")
-        print(f"{Fore.GREEN}python -m playwright install")
-        print(f"{Fore.YELLOW}{'='*40}{Style.RESET_ALL}\n")
-
-if __name__ == "__main__":
-    main()
\ No newline at end of file
diff --git a/pyproject.toml b/pyproject.toml
deleted file mode 100644
index cfef8101..00000000
--- a/pyproject.toml
+++ /dev/null
@@ -1,75 +0,0 @@
-[build-system]
-requires = ["hatchling", "hatch-fancy-pypi-readme>=22.5.0"]
-build-backend = "hatchling.build"
-
-[project]
-name = "Crawl4AI"
-dynamic = ["version"]
-description = "🔥🕷️ Crawl4AI: Open-source LLM Friendly Web Crawler & scraper"
-readme = "README.md"
-license = "Apache-2.0"
-requires-python = ">=3.7"
-authors = [
-    { name = "Unclecode", email = "unclecode@kidocode.com" },
-]
-classifiers = [
-    "Development Status :: 3 - Alpha",
-    "Intended Audience :: Developers",
-    "License :: OSI Approved :: Apache Software License",
-    "Programming Language :: Python :: 3",
-    "Programming Language :: Python :: 3.7",
-    "Programming Language :: Python :: 3.8",
-    "Programming Language :: Python :: 3.9",
-    "Programming Language :: Python :: 3.10",
-]
-dependencies = [
-    "aiosqlite~=0.20",
-    "html2text~=2024.2",
-    "lxml~=5.3",
-    "litellm>=1.53.1",
-    "numpy>=1.26.0,<3",
-    "pillow~=10.4",
-    "playwright>=1.49.0",
-    "python-dotenv~=1.0",
-    "requests~=2.26",
-    "beautifulsoup4~=4.12",
-    "tf-playwright-stealth>=1.1.0",
-    "xxhash~=3.4",
-    "rank-bm25~=0.2", 
-    "aiofiles>=24.1.0",
-    "colorama~=0.4",
-    "snowballstemmer~=2.2",
-]
-
-[project.optional-dependencies]
-torch = ["torch", "nltk", "scikit-learn"]
-transformer = ["transformers", "tokenizers"]
-cosine = ["torch", "transformers", "nltk"]
-sync = ["selenium"]
-all = [
-    "torch",
-    "nltk",
-    "scikit-learn",
-    "transformers",
-    "tokenizers",
-    "selenium",
-]
-
-[project.urls]
-Homepage = "https://github.com/unclecode/crawl4ai"
-Documentation = "https://crawl4ai.com/mkdocs/"
-
-[project.scripts]
-crawl4ai-download-models = "crawl4ai.model_loader:main"
-crawl4ai-migrate = "crawl4ai.migrations:main"
-crawl4ai-post-install = "crawl4ai.post_install:main"
-
-[tool.hatch.version]
-path = "crawl4ai/__version__.py"
-
-[tool.hatch.build.hooks.custom]
-dependencies = ["hatch-fancy-pypi-readme>=22.5.0"]
-path = "build_hooks.py"
-
-[project.entry-points.hatch]
-crawl4ai = "crawl4ai.plugin:post_install"
diff --git a/requirements.txt b/requirements.txt
new file mode 100644
index 00000000..c0f6f183
--- /dev/null
+++ b/requirements.txt
@@ -0,0 +1,16 @@
+aiosqlite~=0.20
+html2text~=2024.2
+lxml~=5.3
+litellm>=1.53.1
+numpy>=1.26.0,<3
+pillow~=10.4
+playwright>=1.49.0
+python-dotenv~=1.0
+requests~=2.26
+beautifulsoup4~=4.12
+tf-playwright-stealth>=1.1.0
+xxhash~=3.4
+rank-bm25~=0.2
+aiofiles>=24.1.0
+colorama~=0.4
+snowballstemmer~=2.2
\ No newline at end of file
diff --git a/setup.cfg b/setup.cfg
new file mode 100644
index 00000000..56490d6a
--- /dev/null
+++ b/setup.cfg
@@ -0,0 +1,2 @@
+[options]
+include_package_data = True
\ No newline at end of file
diff --git a/setup.py b/setup.py
new file mode 100644
index 00000000..d44169bf
--- /dev/null
+++ b/setup.py
@@ -0,0 +1,136 @@
+from setuptools import setup, find_packages
+from setuptools.command.install import install
+import os
+from pathlib import Path
+import shutil
+import subprocess
+import sys
+import asyncio
+
+# Create the .crawl4ai folder in the user's home directory if it doesn't exist
+# If the folder already exists, remove the cache folder
+base_dir = os.getenv("CRAWL4_AI_BASE_DIRECTORY")
+crawl4ai_folder = Path(base_dir) if base_dir else Path.home()
+crawl4ai_folder = crawl4ai_folder / ".crawl4ai"
+cache_folder = crawl4ai_folder / "cache"
+content_folders = [
+    "html_content",
+    "cleaned_html",
+    "markdown_content",
+    "extracted_content",
+    "screenshots",
+]
+
+# Clean up old cache if exists
+if cache_folder.exists():
+    shutil.rmtree(cache_folder)
+
+# Create new folder structure
+crawl4ai_folder.mkdir(exist_ok=True)
+cache_folder.mkdir(exist_ok=True)
+for folder in content_folders:
+    (crawl4ai_folder / folder).mkdir(exist_ok=True)
+
+# Read requirements and version
+__location__ = os.path.realpath(os.path.join(os.getcwd(), os.path.dirname(__file__)))
+with open(os.path.join(__location__, "requirements.txt")) as f:
+    requirements = f.read().splitlines()
+
+with open("crawl4ai/__version__.py") as f:
+    for line in f:
+        if line.startswith("__version__"):
+            version = line.split("=")[1].strip().strip('"')
+            break
+
+# Define requirements
+default_requirements = requirements
+torch_requirements = ["torch", "nltk", "scikit-learn"]
+transformer_requirements = ["transformers", "tokenizers"]
+cosine_similarity_requirements = ["torch", "transformers", "nltk"]
+sync_requirements = ["selenium"]
+
+
+def install_playwright():
+    print("Installing Playwright browsers...")
+    try:
+        subprocess.check_call([sys.executable, "-m", "playwright", "install"])
+        print("Playwright installation completed successfully.")
+    except subprocess.CalledProcessError as e:
+        print(f"Error during Playwright installation: {e}")
+        print(
+            "Please run 'python -m playwright install' manually after the installation."
+        )
+    except Exception as e:
+        print(f"Unexpected error during Playwright installation: {e}")
+        print(
+            "Please run 'python -m playwright install' manually after the installation."
+        )
+
+
+def run_migration():
+    """Initialize database during installation"""
+    try:
+        print("Starting database initialization...")
+        from crawl4ai.async_database import async_db_manager
+
+        asyncio.run(async_db_manager.initialize())
+        print("Database initialization completed successfully.")
+    except ImportError:
+        print("Warning: Database module not found. Will initialize on first use.")
+    except Exception as e:
+        print(f"Warning: Database initialization failed: {e}")
+        print("Database will be initialized on first use")
+
+
+class PostInstallCommand(install):
+    def run(self):
+        install.run(self)
+        install_playwright()
+        # run_migration()
+
+
+setup(
+    name="Crawl4AI",
+    version=version,
+    description="🔥🕷️ Crawl4AI: Open-source LLM Friendly Web Crawler & scraper",
+    long_description=open("README.md", encoding="utf-8").read(),
+    long_description_content_type="text/markdown",
+    url="https://github.com/unclecode/crawl4ai",
+    author="Unclecode",
+    author_email="unclecode@kidocode.com",
+    license="MIT",
+    packages=find_packages(),
+    install_requires=default_requirements
+    + ["playwright", "aiofiles"],  # Added aiofiles
+    extras_require={
+        "torch": torch_requirements,
+        "transformer": transformer_requirements,
+        "cosine": cosine_similarity_requirements,
+        "sync": sync_requirements,
+        "all": default_requirements
+        + torch_requirements
+        + transformer_requirements
+        + cosine_similarity_requirements
+        + sync_requirements,
+    },
+    entry_points={
+        "console_scripts": [
+            "crawl4ai-download-models=crawl4ai.model_loader:main",
+            "crawl4ai-migrate=crawl4ai.migrations:main",  # Added migration command
+        ],
+    },
+    classifiers=[
+        "Development Status :: 3 - Alpha",
+        "Intended Audience :: Developers",
+        "License :: OSI Approved :: Apache Software License",
+        "Programming Language :: Python :: 3",
+        "Programming Language :: Python :: 3.7",
+        "Programming Language :: Python :: 3.8",
+        "Programming Language :: Python :: 3.9",
+        "Programming Language :: Python :: 3.10",
+    ],
+    python_requires=">=3.7",
+    cmdclass={
+        "install": PostInstallCommand,
+    },
+)

From d202f3539bf7447f7594f7f1897c3062c337ae52 Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Fri, 29 Nov 2024 18:48:44 +0800
Subject: [PATCH 102/115]   Enhance installation and migration processes   -
 Added a post-installation setup script for initialization.   - Updated README
 with installation notes for Playwright setup.   - Enhanced migration logging
 for better error visibility.   - Added 'pydantic' to requirements.   - Bumped
 version to 0.3.746.

---
 README.md                         | 32 ++-----------------
 crawl4ai/__init__.py              |  1 -
 crawl4ai/__version__.py           |  2 +-
 crawl4ai/install.py               | 44 ++++++++++++++++++++++++++
 crawl4ai/migrations.py            | 40 ++++++++++++++++--------
 docs/examples/quickstart_async.py | 18 +++++------
 requirements.txt                  |  4 +--
 setup.py                          | 51 ++-----------------------------
 8 files changed, 90 insertions(+), 102 deletions(-)
 create mode 100644 crawl4ai/install.py

diff --git a/README.md b/README.md
index e8e6cddf..bbfa5858 100644
--- a/README.md
+++ b/README.md
@@ -27,6 +27,7 @@ Crawl4AI is the #1 trending GitHub repository, actively maintained by a vibrant
 1. Install Crawl4AI:
 ```bash
 pip install crawl4ai
+crawl4ai-setup # Setup the browser
 ```
 
 2. Run a simple web crawl:
@@ -125,34 +126,6 @@ if __name__ == "__main__":
 
 ✨ Visit our [Documentation Website](https://crawl4ai.com/mkdocs/)
 
-## Features ✨
-
-- 🆓 Completely free and open-source
-- 🚀 Blazing fast performance, outperforming many paid services
-- 🤖 LLM-friendly output formats (JSON, cleaned HTML, markdown)
-- 🌐 Multi-browser support (Chromium, Firefox, WebKit)
-- 🌍 Supports crawling multiple URLs simultaneously
-- 🎨 Extracts and returns all media tags (Images, Audio, and Video)
-- 🔗 Extracts all external and internal links
-- 📚 Extracts metadata from the page
-- 🔄 Custom hooks for authentication, headers, and page modifications
-- 🕵️ User-agent customization
-- 🖼️ Takes screenshots of pages with enhanced error handling
-- 📜 Executes multiple custom JavaScripts before crawling
-- 📊 Generates structured output without LLM using JsonCssExtractionStrategy
-- 📚 Various chunking strategies: topic-based, regex, sentence, and more
-- 🧠 Advanced extraction strategies: cosine clustering, LLM, and more
-- 🎯 CSS selector support for precise data extraction
-- 📝 Passes instructions/keywords to refine extraction
-- 🔒 Proxy support with authentication for enhanced access
-- 🔄 Session management for complex multi-page crawling
-- 🌐 Asynchronous architecture for improved performance
-- 🖼️ Improved image processing with lazy-loading detection
-- 🕰️ Enhanced handling of delayed content loading
-- 🔑 Custom headers support for LLM interactions
-- 🖼️ iframe content extraction for comprehensive analysis
-- ⏱️ Flexible timeout and delayed content retrieval options
-
 ## Installation 🛠️
 
 Crawl4AI offers flexible installation options to suit various use cases. You can install it as a Python package or use Docker.
@@ -168,11 +141,12 @@ For basic web crawling and scraping tasks:
 
 ```bash
 pip install crawl4ai
+crawl4ai-setup # Setup the browser
 ```
 
 By default, this will install the asynchronous version of Crawl4AI, using Playwright for web crawling.
 
-👉 **Note**: When you install Crawl4AI, the setup script should automatically install and set up Playwright. However, if you encounter any Playwright-related errors, you can manually install it using one of these methods:
+👉 **Note**: Running `crawl4ai-setup` after installing Crawl4AI should automatically install and set up Playwright. However, if you encounter any Playwright-related errors, you can manually install it using one of these methods:
 
 1. Through the command line:
 
diff --git a/crawl4ai/__init__.py b/crawl4ai/__init__.py
index 0ccf13d8..cee7c25b 100644
--- a/crawl4ai/__init__.py
+++ b/crawl4ai/__init__.py
@@ -4,7 +4,6 @@ from .async_webcrawler import AsyncWebCrawler, CacheMode
 
 from .models import CrawlResult
 from .__version__ import __version__
-# __version__ = "0.3.73"
 
 __all__ = [
     "AsyncWebCrawler",
diff --git a/crawl4ai/__version__.py b/crawl4ai/__version__.py
index 8b69d491..4a938b75 100644
--- a/crawl4ai/__version__.py
+++ b/crawl4ai/__version__.py
@@ -1,2 +1,2 @@
 # crawl4ai/_version.py
-__version__ = "0.3.745"
+__version__ = "0.3.746"
diff --git a/crawl4ai/install.py b/crawl4ai/install.py
new file mode 100644
index 00000000..71fe30ea
--- /dev/null
+++ b/crawl4ai/install.py
@@ -0,0 +1,44 @@
+import subprocess
+import sys
+import asyncio
+from .async_logger import AsyncLogger, LogLevel
+
+# Initialize logger
+logger = AsyncLogger(log_level=LogLevel.DEBUG, verbose=True)
+
+def post_install():
+    """Run all post-installation tasks"""
+    logger.info("Running post-installation setup...", tag="INIT")
+    install_playwright()
+    run_migration()
+    logger.success("Post-installation setup completed!", tag="COMPLETE")
+    
+def install_playwright():
+    logger.info("Installing Playwright browsers...", tag="INIT")
+    try:
+        subprocess.check_call([sys.executable, "-m", "playwright", "install"])
+        logger.success("Playwright installation completed successfully.", tag="COMPLETE")
+    except subprocess.CalledProcessError as e:
+        logger.error(f"Error during Playwright installation: {e}", tag="ERROR")
+        logger.warning(
+            "Please run 'python -m playwright install' manually after the installation."
+        )
+    except Exception as e:
+        logger.error(f"Unexpected error during Playwright installation: {e}", tag="ERROR")
+        logger.warning(
+            "Please run 'python -m playwright install' manually after the installation."
+        )
+
+def run_migration():
+    """Initialize database during installation"""
+    try:
+        logger.info("Starting database initialization...", tag="INIT")
+        from crawl4ai.async_database import async_db_manager
+
+        asyncio.run(async_db_manager.initialize())
+        logger.success("Database initialization completed successfully.", tag="COMPLETE")
+    except ImportError:
+        logger.warning("Database module not found. Will initialize on first use.")
+    except Exception as e:
+        logger.warning(f"Database initialization failed: {e}")
+        logger.warning("Database will be initialized on first use")
\ No newline at end of file
diff --git a/crawl4ai/migrations.py b/crawl4ai/migrations.py
index 77616086..3386b0fb 100644
--- a/crawl4ai/migrations.py
+++ b/crawl4ai/migrations.py
@@ -9,9 +9,13 @@ import aiofiles
 import shutil
 import time
 from datetime import datetime
+from .async_logger import AsyncLogger, LogLevel
 
-logging.basicConfig(level=logging.INFO)
-logger = logging.getLogger(__name__)
+# Initialize logger
+logger = AsyncLogger(log_level=LogLevel.DEBUG, verbose=True)
+
+# logging.basicConfig(level=logging.INFO)
+# logger = logging.getLogger(__name__)
 
 class DatabaseMigration:
     def __init__(self, db_path: str):
@@ -55,7 +59,8 @@ class DatabaseMigration:
 
     async def migrate_database(self):
         """Migrate existing database to file-based storage"""
-        logger.info("Starting database migration...")
+        # logger.info("Starting database migration...")
+        logger.info("Starting database migration...", tag="INIT")
         
         try:
             async with aiosqlite.connect(self.db_path) as db:
@@ -91,19 +96,25 @@ class DatabaseMigration:
                     
                     migrated_count += 1
                     if migrated_count % 100 == 0:
-                        logger.info(f"Migrated {migrated_count} records...")
+                        logger.info(f"Migrated {migrated_count} records...", tag="INIT")
+                        
 
                 await db.commit()
-                logger.info(f"Migration completed. {migrated_count} records processed.")
+                logger.success(f"Migration completed. {migrated_count} records processed.", tag="COMPLETE")
 
         except Exception as e:
-            logger.error(f"Migration failed: {e}")
-            raise
+            # logger.error(f"Migration failed: {e}")
+            logger.error(
+                message="Migration failed: {error}",
+                tag="ERROR",
+                params={"error": str(e)}
+            )
+            raise e
 
 async def backup_database(db_path: str) -> str:
     """Create backup of existing database"""
     if not os.path.exists(db_path):
-        logger.info("No existing database found. Skipping backup.")
+        logger.info("No existing database found. Skipping backup.", tag="INIT")
         return None
         
     # Create backup with timestamp
@@ -116,11 +127,16 @@ async def backup_database(db_path: str) -> str:
         
         # Create backup
         shutil.copy2(db_path, backup_path)
-        logger.info(f"Database backup created at: {backup_path}")
+        logger.info(f"Database backup created at: {backup_path}", tag="COMPLETE")
         return backup_path
     except Exception as e:
-        logger.error(f"Backup failed: {e}")
-        raise
+        # Report this as a backup failure so the log is not mistaken for a migration error.
+        logger.error(
+            message="Backup failed: {error}",
+            tag="ERROR",
+            params={"error": str(e)}
+        )
+        raise e
     
 async def run_migration(db_path: Optional[str] = None):
     """Run database migration"""
@@ -128,7 +144,7 @@ async def run_migration(db_path: Optional[str] = None):
         db_path = os.path.join(Path.home(), ".crawl4ai", "crawl4ai.db")
     
     if not os.path.exists(db_path):
-        logger.info("No existing database found. Skipping migration.")
+        logger.info("No existing database found. Skipping migration.", tag="INIT")
         return
         
     # Create backup first
diff --git a/docs/examples/quickstart_async.py b/docs/examples/quickstart_async.py
index 01f7677c..679a9bc2 100644
--- a/docs/examples/quickstart_async.py
+++ b/docs/examples/quickstart_async.py
@@ -562,18 +562,18 @@ async def fit_markdown_remove_overlay():
 
 
 async def main():
-    # await simple_crawl()
-    # await simple_example_with_running_js_code()
-    # await simple_example_with_css_selector()
+    await simple_crawl()
+    await simple_example_with_running_js_code()
+    await simple_example_with_css_selector()
     # await use_proxy()
-    # await capture_and_save_screenshot("https://www.example.com", os.path.join(__location__, "tmp/example_screenshot.jpg"))
-    # await extract_structured_data_using_css_extractor()
+    await capture_and_save_screenshot("https://www.example.com", os.path.join(__location__, "tmp/example_screenshot.jpg"))
+    await extract_structured_data_using_css_extractor()
 
     # LLM extraction examples
     # await extract_structured_data_using_llm()
     # await extract_structured_data_using_llm("huggingface/meta-llama/Meta-Llama-3.1-8B-Instruct", os.getenv("HUGGINGFACE_API_KEY"))
     # await extract_structured_data_using_llm("ollama/llama3.2")    
-    # await extract_structured_data_using_llm("openai/gpt-4o", os.getenv("OPENAI_API_KEY"))
+    await extract_structured_data_using_llm("openai/gpt-4o", os.getenv("OPENAI_API_KEY"))
 
     # You always can pass custom headers to the extraction strategy
     # custom_headers = {
@@ -582,9 +582,9 @@ async def main():
     # }
     # await extract_structured_data_using_llm(extra_headers=custom_headers)
     
-    # await crawl_dynamic_content_pages_method_1()
-    # await crawl_dynamic_content_pages_method_2()
-    # await crawl_dynamic_content_pages_method_3()
+    await crawl_dynamic_content_pages_method_1()
+    await crawl_dynamic_content_pages_method_2()
+    await crawl_dynamic_content_pages_method_3()
     
     await crawl_custom_browser_type()
     
diff --git a/requirements.txt b/requirements.txt
index c0f6f183..741e12ef 100644
--- a/requirements.txt
+++ b/requirements.txt
@@ -1,5 +1,4 @@
 aiosqlite~=0.20
-html2text~=2024.2
 lxml~=5.3
 litellm>=1.53.1
 numpy>=1.26.0,<3
@@ -13,4 +12,5 @@ xxhash~=3.4
 rank-bm25~=0.2
 aiofiles>=24.1.0
 colorama~=0.4
-snowballstemmer~=2.2
\ No newline at end of file
+snowballstemmer~=2.2
+pydantic>=2.10
\ No newline at end of file
diff --git a/setup.py b/setup.py
index d44169bf..e6840cd0 100644
--- a/setup.py
+++ b/setup.py
@@ -1,11 +1,8 @@
 from setuptools import setup, find_packages
-from setuptools.command.install import install
 import os
 from pathlib import Path
 import shutil
-import subprocess
-import sys
-import asyncio
+
 
 # Create the .crawl4ai folder in the user's home directory if it doesn't exist
 # If the folder already exists, remove the cache folder
@@ -49,46 +46,6 @@ transformer_requirements = ["transformers", "tokenizers"]
 cosine_similarity_requirements = ["torch", "transformers", "nltk"]
 sync_requirements = ["selenium"]
 
-
-def install_playwright():
-    print("Installing Playwright browsers...")
-    try:
-        subprocess.check_call([sys.executable, "-m", "playwright", "install"])
-        print("Playwright installation completed successfully.")
-    except subprocess.CalledProcessError as e:
-        print(f"Error during Playwright installation: {e}")
-        print(
-            "Please run 'python -m playwright install' manually after the installation."
-        )
-    except Exception as e:
-        print(f"Unexpected error during Playwright installation: {e}")
-        print(
-            "Please run 'python -m playwright install' manually after the installation."
-        )
-
-
-def run_migration():
-    """Initialize database during installation"""
-    try:
-        print("Starting database initialization...")
-        from crawl4ai.async_database import async_db_manager
-
-        asyncio.run(async_db_manager.initialize())
-        print("Database initialization completed successfully.")
-    except ImportError:
-        print("Warning: Database module not found. Will initialize on first use.")
-    except Exception as e:
-        print(f"Warning: Database initialization failed: {e}")
-        print("Database will be initialized on first use")
-
-
-class PostInstallCommand(install):
-    def run(self):
-        install.run(self)
-        install_playwright()
-        # run_migration()
-
-
 setup(
     name="Crawl4AI",
     version=version,
@@ -116,7 +73,8 @@ setup(
     entry_points={
         "console_scripts": [
             "crawl4ai-download-models=crawl4ai.model_loader:main",
-            "crawl4ai-migrate=crawl4ai.migrations:main",  # Added migration command
+            "crawl4ai-migrate=crawl4ai.migrations:main",  
+            'crawl4ai-setup=crawl4ai.install:post_install', 
         ],
     },
     classifiers=[
@@ -130,7 +88,4 @@ setup(
         "Programming Language :: Python :: 3.10",
     ],
     python_requires=">=3.7",
-    cmdclass={
-        "install": PostInstallCommand,
-    },
 )

From 93bf3e8a1f87760e04d6a18b2e27bae0f5d5da0e Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Fri, 29 Nov 2024 20:08:09 +0800
Subject: [PATCH 103/115]   Refactor Dockerfile and clean up main.py   -
 Enhanced Dockerfile for platform-specific installations     - Added ARG for
 TARGETPLATFORM and BUILDPLATFORM     - Improved GPU support conditional on
 TARGETPLATFORM   - Removed static pages mounting in main.py   - Streamlined
 code structure to improve maintainability

---
 Dockerfile | 25 ++++++++++++++++---------
 main.py    |  4 ----
 2 files changed, 16 insertions(+), 13 deletions(-)

diff --git a/Dockerfile b/Dockerfile
index bd71deae..2997590a 100644
--- a/Dockerfile
+++ b/Dockerfile
@@ -1,6 +1,9 @@
 # syntax=docker/dockerfile:1.4
 
-# Build arguments
+ARG TARGETPLATFORM
+ARG BUILDPLATFORM
+
+# Other build arguments
 ARG PYTHON_VERSION=3.10
 
 # Base stage with system dependencies
@@ -63,13 +66,13 @@ RUN apt-get update && apt-get install -y --no-install-recommends \
     && rm -rf /var/lib/apt/lists/*
 
 # GPU support if enabled and architecture is supported
-RUN if [ "$ENABLE_GPU" = "true" ] && [ "$(dpkg --print-architecture)" != "arm64" ] ; then \
-        apt-get update && apt-get install -y --no-install-recommends \
-        nvidia-cuda-toolkit \
-        && rm -rf /var/lib/apt/lists/* ; \
-    else \
-        echo "Skipping NVIDIA CUDA Toolkit installation (unsupported architecture or GPU disabled)"; \
-    fi
+RUN if [ "$ENABLE_GPU" = "true" ] && [ "$TARGETPLATFORM" = "linux/amd64" ] ; then \
+    apt-get update && apt-get install -y --no-install-recommends \
+    nvidia-cuda-toolkit \
+    && rm -rf /var/lib/apt/lists/* ; \
+else \
+    echo "Skipping NVIDIA CUDA Toolkit installation (unsupported platform or GPU disabled)"; \
+fi
 
 # Create and set working directory
 WORKDIR /app
@@ -120,7 +123,11 @@ RUN pip install --no-cache-dir \
 RUN mkdocs build
 
 # Install Playwright and browsers
-RUN playwright install
+RUN if [ "$TARGETPLATFORM" = "linux/amd64" ]; then \
+    playwright install chromium; \
+    elif [ "$TARGETPLATFORM" = "linux/arm64" ]; then \
+    playwright install chromium; \
+    fi
 
 # Expose port
 EXPOSE 8000 11235 9222 8080
diff --git a/main.py b/main.py
index 6d217410..d6c792e8 100644
--- a/main.py
+++ b/main.py
@@ -340,9 +340,6 @@ app.add_middleware(
     allow_headers=["*"],  # Allows all headers
 )
 
-# Mount the pages directory as a static directory
-app.mount("/pages", StaticFiles(directory=__location__ + "/pages"), name="pages")
-
 # API token security
 security = HTTPBearer()
 CRAWL4AI_API_TOKEN = os.getenv("CRAWL4AI_API_TOKEN") or "test_api_code"
@@ -364,7 +361,6 @@ if os.path.exists(__location__ + "/site"):
     app.mount("/mkdocs", StaticFiles(directory="site", html=True), name="mkdocs")
 
 site_templates = Jinja2Templates(directory=__location__ + "/site")
-templates = Jinja2Templates(directory=__location__ + "/pages")
 
 crawler_service = CrawlerService()
 

From f9c98a377dd1dda28f88cd5ab4e801535a88abcc Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Fri, 29 Nov 2024 20:52:51 +0800
Subject: [PATCH 104/115]   Enhance Docker support and improve installation
 process   - Added new Docker commands for platform-specific builds.   -
 Updated README with comprehensive installation and setup instructions.   -
 Introduced `post_install` method in setup script for automation.   - Refined
 migration processes with enhanced error logging.   - Bump version to 0.3.746
 and updated dependencies.

---
 CHANGELOG.md                    |  59 +++++++++++
 README.md                       | 177 +++++++++++++++++++++++++++-----
 docker-compose.yml              |  65 ++++++------
 docs/examples/docker_example.py |  22 ++--
 4 files changed, 256 insertions(+), 67 deletions(-)

diff --git a/CHANGELOG.md b/CHANGELOG.md
index 5ec79639..309218dc 100644
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -1,5 +1,64 @@
 # Changelog
 
+## [0.3.746] November 29, 2024
+
+### Major Features
+1. Enhanced Docker Support (Nov 29, 2024)
+   - Improved GPU support in Docker images.
+   - Dockerfile refactored for better platform-specific installations.
+   - Introduced new Docker commands for different platforms:
+     - `basic-amd64`, `all-amd64`, `gpu-amd64` for AMD64.
+     - `basic-arm64`, `all-arm64`, `gpu-arm64` for ARM64.
+
+### Infrastructure & Documentation
+- Enhanced README.md to improve user guidance and installation instructions.
+- Added installation instructions for Playwright setup in README.
+- Created and updated examples in `docs/examples/quickstart_async.py` to be more useful and user-friendly.
+- Updated `requirements.txt` with a new `pydantic` dependency.
+- Bumped version number in `crawl4ai/__version__.py` to 0.3.746.
+
+### Breaking Changes
+- Streamlined application structure:
+  - Removed static pages and related code from `main.py` which might affect existing deployments relying on static content.
+
+### Development Updates
+- Developed `post_install` method in `crawl4ai/install.py` to streamline post-installation setup tasks.
+- Refined migration processes in `crawl4ai/migrations.py` with enhanced logging for better error visibility.
+- Updated `docker-compose.yml` to support local and hub services for different architectures, enhancing build and deploy capabilities.
+- Refactored example test cases in `docs/examples/docker_example.py` to facilitate comprehensive testing.
+
+### README.md
+Updated README with new docker commands and setup instructions.
+Enhanced installation instructions and guidance.
+
+### crawl4ai/install.py
+Added post-install script functionality.
+Introduced `post_install` method for automation of post-installation tasks.
+
+### crawl4ai/migrations.py
+Improved migration logging.
+Refined migration processes and added better logging.
+
+### docker-compose.yml
+Refactored docker-compose for better service management.
+Updated to define services for different platforms and versions.
+
+### requirements.txt
+Updated dependencies.
+Added `pydantic` to requirements file.
+
+### crawl4ai/__version__.py
+Updated version number.
+Bumped version number to 0.3.746.
+
+### docs/examples/quickstart_async.py
+Enhanced example scripts.
+Re-enabled most of the previously commented-out example calls in `main()` so they run by default.
+
+### main.py
+Refactored code to improve maintainability.
+Streamlined app structure by removing static pages code.
+
 ## [0.3.743] November 27, 2024
 
 Enhance features and documentation
diff --git a/README.md b/README.md
index bbfa5858..3d89ee19 100644
--- a/README.md
+++ b/README.md
@@ -220,48 +220,173 @@ Crawl4AI is available as Docker images for easy deployment. You can either pull
 
 ---
 
-### Option 1: Docker Hub (Recommended)
+<details>
+<summary>🐳 <strong>Option 1: Docker Hub (Recommended)</strong></summary>
 
+Choose the appropriate image based on your platform and needs:
+
+### For AMD64 (Regular Linux/Windows):
 ```bash
-# Pull and run from Docker Hub (choose one):
-docker pull unclecode/crawl4ai:basic    # Basic crawling features
-docker pull unclecode/crawl4ai:all      # Full installation (ML, LLM support)
-docker pull unclecode/crawl4ai:gpu      # GPU-enabled version
+# Basic version (recommended)
+docker pull unclecode/crawl4ai:basic-amd64
+docker run -p 11235:11235 unclecode/crawl4ai:basic-amd64
 
-# Run the container
-docker run -p 11235:11235 unclecode/crawl4ai:basic  # Replace 'basic' with your chosen version
+# Full ML/LLM support
+docker pull unclecode/crawl4ai:all-amd64
+docker run -p 11235:11235 unclecode/crawl4ai:all-amd64
 
-# In case you want to set platform to arm64
-docker run --platform linux/arm64 -p 11235:11235 unclecode/crawl4ai:basic
-
-# In case to allocate more shared memory for the container
-docker run --shm-size=2gb -p 11235:11235 unclecode/crawl4ai:basic
+# With GPU support
+docker pull unclecode/crawl4ai:gpu-amd64
+docker run -p 11235:11235 unclecode/crawl4ai:gpu-amd64
 ```
 
----
+### For ARM64 (M1/M2 Macs, ARM servers):
+```bash
+# Basic version (recommended)
+docker pull unclecode/crawl4ai:basic-arm64
+docker run -p 11235:11235 unclecode/crawl4ai:basic-arm64
 
-### Option 2: Build from Repository
+# Full ML/LLM support
+docker pull unclecode/crawl4ai:all-arm64
+docker run -p 11235:11235 unclecode/crawl4ai:all-arm64
+
+# With GPU support
+docker pull unclecode/crawl4ai:gpu-arm64
+docker run -p 11235:11235 unclecode/crawl4ai:gpu-arm64
+```
+
+Need more memory? Add `--shm-size`:
+```bash
+docker run --shm-size=2gb -p 11235:11235 unclecode/crawl4ai:basic-amd64
+```
+
+Test the installation:
+```bash
+curl http://localhost:11235/health
+```
+
+### For Raspberry Pi (32-bit) (Experimental)
+```bash
+# Pull and run basic version (recommended for Raspberry Pi)
+docker pull unclecode/crawl4ai:basic-armv7
+docker run -p 11235:11235 unclecode/crawl4ai:basic-armv7
+
+# With increased shared memory if needed
+docker run --shm-size=2gb -p 11235:11235 unclecode/crawl4ai:basic-armv7
+```
+
+Note: Due to hardware constraints, only the basic version is recommended for Raspberry Pi.
+
+</details>
+
+<details>
+<summary>🐳 <strong>Option 2: Build from Repository</strong></summary>
+
+Build the image locally based on your platform:
 
 ```bash
 # Clone the repository
 git clone https://github.com/unclecode/crawl4ai.git
 cd crawl4ai
 
-# Build the image
-docker build -t crawl4ai:local \
-  --build-arg INSTALL_TYPE=basic \  # Options: basic, all
+# For AMD64 (Regular Linux/Windows)
+docker build --platform linux/amd64 \
+  --tag crawl4ai:local \
+  --build-arg INSTALL_TYPE=basic \
   .
 
-# In case you want to set platform to arm64
-docker build -t crawl4ai:local \
-  --build-arg INSTALL_TYPE=basic \  # Options: basic, all
-  --platform linux/arm64 \
+# For ARM64 (M1/M2 Macs, ARM servers)
+docker build --platform linux/arm64 \
+  --tag crawl4ai:local \
+  --build-arg INSTALL_TYPE=basic \
   .
-
-# Run your local build
-docker run -p 11235:11235 crawl4ai:local
 ```
 
+Build options:
+- INSTALL_TYPE=basic (default): Basic crawling features
+- INSTALL_TYPE=all: Full ML/LLM support
+- ENABLE_GPU=true: Add GPU support
+
+Example with all options:
+```bash
+docker build --platform linux/amd64 \
+  --tag crawl4ai:local \
+  --build-arg INSTALL_TYPE=all \
+  --build-arg ENABLE_GPU=true \
+  .
+```
+
+Run your local build:
+```bash
+# Regular run
+docker run -p 11235:11235 crawl4ai:local
+
+# With increased shared memory
+docker run --shm-size=2gb -p 11235:11235 crawl4ai:local
+```
+
+Test the installation:
+```bash
+curl http://localhost:11235/health
+```
+
+</details>
+
+<details>
+<summary>🐳 <strong>Option 3: Using Docker Compose</strong></summary>
+
+Docker Compose provides a more structured way to run Crawl4AI, especially when dealing with environment variables and multiple configurations.
+
+```bash
+# Clone the repository
+git clone https://github.com/unclecode/crawl4ai.git
+cd crawl4ai
+```
+
+### For AMD64 (Regular Linux/Windows):
+```bash
+# Build and run locally
+docker-compose --profile local-amd64 up
+
+# Run from Docker Hub
+VERSION=basic docker-compose --profile hub-amd64 up   # Basic version
+VERSION=all docker-compose --profile hub-amd64 up     # Full ML/LLM support
+VERSION=gpu docker-compose --profile hub-amd64 up     # GPU support
+```
+
+### For ARM64 (M1/M2 Macs, ARM servers):
+```bash
+# Build and run locally
+docker-compose --profile local-arm64 up
+
+# Run from Docker Hub
+VERSION=basic docker-compose --profile hub-arm64 up   # Basic version
+VERSION=all docker-compose --profile hub-arm64 up     # Full ML/LLM support
+VERSION=gpu docker-compose --profile hub-arm64 up     # GPU support
+```
+
+Environment variables (optional):
+```bash
+# Create a .env file
+CRAWL4AI_API_TOKEN=your_token
+OPENAI_API_KEY=your_openai_key
+CLAUDE_API_KEY=your_claude_key
+```
+
+The compose file includes:
+- Memory management (4GB limit, 1GB reserved)
+- Shared memory volume for browser support
+- Health checks
+- Auto-restart policy
+- All necessary port mappings
+
+Test the installation:
+```bash
+curl http://localhost:11235/health
+```
+
+</details>
+
 ---
 
 ### Quick Test
@@ -278,11 +403,11 @@ response = requests.post(
 )
 task_id = response.json()["task_id"]
 
-# Get results
+# Continue polling until the task is complete (status="completed")
 result = requests.get(f"http://localhost:11235/task/{task_id}")
 ```
 
-For advanced configuration, environment variables, and usage examples, see our [Docker Deployment Guide](https://crawl4ai.com/mkdocs/basic/docker-deployment/).
+For more examples, see our [Docker Examples](https://github.com/unclecode/crawl4ai/blob/main/docs/examples/docker_example.py). For advanced configuration, environment variables, and usage examples, see our [Docker Deployment Guide](https://crawl4ai.com/mkdocs/basic/docker-deployment/).
 
 </details>
 
diff --git a/docker-compose.yml b/docker-compose.yml
index b93beda9..4b22fd98 100644
--- a/docker-compose.yml
+++ b/docker-compose.yml
@@ -1,5 +1,6 @@
 services:
-  crawl4ai:
+  # Local build services for different platforms
+  crawl4ai-amd64:
     build:
       context: .
       dockerfile: Dockerfile
@@ -7,35 +8,39 @@ services:
         PYTHON_VERSION: "3.10"
         INSTALL_TYPE: ${INSTALL_TYPE:-basic}
         ENABLE_GPU: false
-    profiles: ["local"]
-    ports:
-      - "11235:11235"
-      - "8000:8000"
-      - "9222:9222"
-      - "8080:8080"
-    environment:
-      - CRAWL4AI_API_TOKEN=${CRAWL4AI_API_TOKEN:-}
-      - OPENAI_API_KEY=${OPENAI_API_KEY:-}
-      - CLAUDE_API_KEY=${CLAUDE_API_KEY:-}
-    volumes:
-      - /dev/shm:/dev/shm
-    deploy:
-      resources:
-        limits:
-          memory: 4G
-        reservations:
-          memory: 1G
-    restart: unless-stopped
-    healthcheck:
-      test: ["CMD", "curl", "-f", "http://localhost:11235/health"]
-      interval: 30s
-      timeout: 10s
-      retries: 3
-      start_period: 40s
+      platforms:
+        - linux/amd64
+    profiles: ["local-amd64"]
+    extends: &base-config
+      file: docker-compose.yml
+      service: base-config
 
-  crawl4ai-hub:
-    image: unclecode/crawl4ai:basic
-    profiles: ["hub"]
+  crawl4ai-arm64:
+    build:
+      context: .
+      dockerfile: Dockerfile
+      args:
+        PYTHON_VERSION: "3.10"
+        INSTALL_TYPE: ${INSTALL_TYPE:-basic}
+        ENABLE_GPU: false
+      platforms:
+        - linux/arm64
+    profiles: ["local-arm64"]
+    extends: *base-config
+
+  # Hub services for different platforms and versions
+  crawl4ai-hub-amd64:
+    image: unclecode/crawl4ai:${VERSION:-basic}-amd64
+    profiles: ["hub-amd64"]
+    extends: *base-config
+
+  crawl4ai-hub-arm64:
+    image: unclecode/crawl4ai:${VERSION:-basic}-arm64
+    profiles: ["hub-arm64"]
+    extends: *base-config
+
+  # Base configuration to be extended
+  base-config:
     ports:
       - "11235:11235"
       - "8000:8000"
@@ -59,4 +64,4 @@ services:
       interval: 30s
       timeout: 10s
       retries: 3
-      start_period: 40s
+      start_period: 40s
\ No newline at end of file
diff --git a/docs/examples/docker_example.py b/docs/examples/docker_example.py
index 17ef9f04..48acc809 100644
--- a/docs/examples/docker_example.py
+++ b/docs/examples/docker_example.py
@@ -78,20 +78,20 @@ def test_docker_deployment(version="basic"):
             time.sleep(5)
     
     # Test cases based on version
-    # test_basic_crawl(tester)
-    # test_basic_crawl(tester)
-    # test_basic_crawl_sync(tester)
     test_basic_crawl_direct(tester)
+    test_basic_crawl(tester)
+    test_basic_crawl(tester)
+    test_basic_crawl_sync(tester)
     
-    # if version in ["full", "transformer"]:
-    #     test_cosine_extraction(tester)
+    if version in ["full", "transformer"]:
+        test_cosine_extraction(tester)
 
-    # test_js_execution(tester)
-    # test_css_selector(tester)
-    # test_structured_extraction(tester)
-    # test_llm_extraction(tester)
-    # test_llm_with_ollama(tester)
-    # test_screenshot(tester)
+    test_js_execution(tester)
+    test_css_selector(tester)
+    test_structured_extraction(tester)
+    test_llm_extraction(tester)
+    test_llm_with_ollama(tester)
+    test_screenshot(tester)
     
 
 def test_basic_crawl(tester: Crawl4AiTester):

From 1def53b7fe60267d5bc1f492f50b5f53f8858eee Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Fri, 29 Nov 2024 20:53:43 +0800
Subject: [PATCH 105/115] docs: update Raspberry Pi section to indicate
 upcoming support

---
 README.md | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/README.md b/README.md
index 3d89ee19..405c1002 100644
--- a/README.md
+++ b/README.md
@@ -265,7 +265,7 @@ Test the installation:
 curl http://localhost:11235/health
 ```
 
-### For Raspberry Pi (32-bit) (Experimental)
+### For Raspberry Pi (32-bit) (coming soon):
 ```bash
 # Pull and run basic version (recommended for Raspberry Pi)
 docker pull unclecode/crawl4ai:basic-armv7

From 1ed7c15118fc81427fa29afe6368eb2a47720fd4 Mon Sep 17 00:00:00 2001
From: dvschuyl <125589423+dvschuyl@users.noreply.github.com>
Date: Fri, 29 Nov 2024 14:06:04 +0100
Subject: [PATCH 106/115] :adhesive_bandage: Page-evaluate navigation destroyed
 error (#304)

Thanks for your contribution and such a nice approach. Now that I think of it, I guess I can make good use of this for some other part of the code. By the way, thank you so much; I will add your name to the new list of contributors.
---
 crawl4ai/async_crawler_strategy.py | 1 +
 1 file changed, 1 insertion(+)

diff --git a/crawl4ai/async_crawler_strategy.py b/crawl4ai/async_crawler_strategy.py
index e5316187..a41d29a8 100644
--- a/crawl4ai/async_crawler_strategy.py
+++ b/crawl4ai/async_crawler_strategy.py
@@ -920,6 +920,7 @@ class AsyncPlaywrightCrawlerStrategy(AsyncCrawlerStrategy):
                 });
             }
             """
+            await page.wait_for_load_state()
             await page.evaluate(update_image_dimensions_js)
 
             # Wait a bit for any onload events to complete

From 0780db55e1298e73178077ec0bdc65cd534faa8d Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Fri, 29 Nov 2024 21:12:19 +0800
Subject: [PATCH 107/115] fix: handle errors during image dimension updates in
 AsyncPlaywrightCrawlerStrategy

---
 crawl4ai/async_crawler_strategy.py | 6 +++++-
 1 file changed, 5 insertions(+), 1 deletion(-)

diff --git a/crawl4ai/async_crawler_strategy.py b/crawl4ai/async_crawler_strategy.py
index e5316187..cc7f3993 100644
--- a/crawl4ai/async_crawler_strategy.py
+++ b/crawl4ai/async_crawler_strategy.py
@@ -920,7 +920,11 @@ class AsyncPlaywrightCrawlerStrategy(AsyncCrawlerStrategy):
                 });
             }
             """
-            await page.evaluate(update_image_dimensions_js)
+            try:
+                await page.wait_for_load_state()
+                await page.evaluate(update_image_dimensions_js)
+            except Exception as e:
+                raise RuntimeError(f"Error updating image dimensions ACS-UPDATE_IMAGE_DIMENSIONS_JS: {str(e)}")
 
             # Wait a bit for any onload events to complete
             await page.wait_for_timeout(100)

From 8c76a8c7dcb2820a351eeb5696db2fc04fce7805 Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Fri, 29 Nov 2024 21:14:49 +0800
Subject: [PATCH 108/115] docs: add contributor entry for dvschuyl regarding
 AsyncPlaywrightCrawlerStrategy issue

---
 CONTRIBUTORS.md | 1 +
 1 file changed, 1 insertion(+)

diff --git a/CONTRIBUTORS.md b/CONTRIBUTORS.md
index 663e5541..79038bdd 100644
--- a/CONTRIBUTORS.md
+++ b/CONTRIBUTORS.md
@@ -18,6 +18,7 @@ We would like to thank the following people for their contributions to Crawl4AI:
 
 ## Pull Requests
 
+- [dvschuyl](https://github.com/dvschuyl) - AsyncPlaywrightCrawlerStrategy page-evaluate context destroyed by navigation [#304](https://github.com/unclecode/crawl4ai/pull/304)
 - [nelzomal](https://github.com/nelzomal) - Enhance development installation instructions [#286](https://github.com/unclecode/crawl4ai/pull/286)
 - [HamzaFarhan](https://github.com/HamzaFarhan) - Handled the cases where markdown_with_citations, references_markdown, and filtered_html might not be defined [#293](https://github.com/unclecode/crawl4ai/pull/293)
 - [NanmiCoder](https://github.com/NanmiCoder) - fix: crawler strategy exception handling and fixes [#271](https://github.com/unclecode/crawl4ai/pull/271)

From 3e83893b3f41b7176f6ec0beaccab9f2b159785d Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Sat, 30 Nov 2024 18:13:12 +0800
Subject: [PATCH 109/115]   Enhance User-Agent Handling

  - Added a new UserAgentGenerator class for generating random User-Agents.
  - Integrated User-Agent generation in AsyncPlaywrightCrawlerStrategy for randomization.
  - Enhanced HTTP headers with generated Client Hints.
---
 crawl4ai/async_crawler_strategy.py |  33 +++-
 crawl4ai/user_agent_generator.py   | 262 +++++++++++++++++++++++++++++
 2 files changed, 289 insertions(+), 6 deletions(-)
 create mode 100644 crawl4ai/user_agent_generator.py

diff --git a/crawl4ai/async_crawler_strategy.py b/crawl4ai/async_crawler_strategy.py
index cc7f3993..3d24bd84 100644
--- a/crawl4ai/async_crawler_strategy.py
+++ b/crawl4ai/async_crawler_strategy.py
@@ -16,6 +16,7 @@ import json
 import uuid
 from .models import AsyncCrawlResponse
 from .utils import create_box_message
+from .user_agent_generator import UserAgentGenerator
 from playwright_stealth import StealthConfig, stealth_async
 
 stealth_config = StealthConfig(
@@ -222,14 +223,20 @@ class AsyncPlaywrightCrawlerStrategy(AsyncCrawlerStrategy):
         self.use_cached_html = use_cached_html
         self.user_agent = kwargs.get(
             "user_agent",
-            "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 "
-            "(KHTML, like Gecko) Chrome/91.0.4472.124 Safari/537.36"
+            "Mozilla/5.0 (Linux; Android 11; SM-G973F) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/91.0.4472.120 Mobile Safari/537.36"
         )
+        user_agenr_generator = UserAgentGenerator()
+        if kwargs.get("user_agent_mode") == "random":
+            self.user_agent = user_agenr_generator.generate(
+                 **kwargs.get("user_agent_generator_config", {})
+            )
         self.proxy = kwargs.get("proxy")
         self.proxy_config = kwargs.get("proxy_config")
         self.headless = kwargs.get("headless", True)
         self.browser_type = kwargs.get("browser_type", "chromium")
         self.headers = kwargs.get("headers", {})
+        self.browser_hint = user_agenr_generator.generate_client_hints(self.user_agent)
+        self.headers.setdefault("sec-ch-ua", self.browser_hint)
         self.cookies = kwargs.get("cookies", [])
         self.sessions = {}
         self.session_ttl = 1800 
@@ -307,7 +314,9 @@ class AsyncPlaywrightCrawlerStrategy(AsyncCrawlerStrategy):
                         
                     if self.user_agent:
                         await self.default_context.set_extra_http_headers({
-                            "User-Agent": self.user_agent
+                            "User-Agent": self.user_agent,
+                            "sec-ch-ua": self.browser_hint,
+                            # **self.headers
                         })
             else:
                 # Base browser arguments
@@ -321,7 +330,9 @@ class AsyncPlaywrightCrawlerStrategy(AsyncCrawlerStrategy):
                         "--disable-infobars",
                         "--window-position=0,0",
                         "--ignore-certificate-errors",
-                        "--ignore-certificate-errors-spki-list"
+                        "--ignore-certificate-errors-spki-list",
+                        "--disable-blink-features=AutomationControlled",
+                        
                     ]
                 }
                 
@@ -642,6 +653,15 @@ class AsyncPlaywrightCrawlerStrategy(AsyncCrawlerStrategy):
         self._cleanup_expired_sessions()
         session_id = kwargs.get("session_id")
         
+        # Check if in kwargs we have user_agent that will override the default user_agent
+        user_agent = kwargs.get("user_agent", self.user_agent)
+        
+        # Generate random user agent if magic mode is enabled and user_agent_mode is not random
+        if kwargs.get("user_agent_mode") != "random" and kwargs.get("magic", False):
+            user_agent = UserAgentGenerator().generate(
+                **kwargs.get("user_agent_generator_config", {})
+            )
+        
         # Handle page creation differently for managed browser
         context = None
         if self.use_managed_browser:
@@ -666,7 +686,7 @@ class AsyncPlaywrightCrawlerStrategy(AsyncCrawlerStrategy):
                     else:
                         # Normal context creation for non-persistent or non-Chrome browsers
                         context = await self.browser.new_context(
-                            user_agent=self.user_agent,
+                            user_agent=user_agent,
                             viewport={"width": 1200, "height": 800},
                             proxy={"server": self.proxy} if self.proxy else None,
                             java_script_enabled=True,
@@ -686,10 +706,11 @@ class AsyncPlaywrightCrawlerStrategy(AsyncCrawlerStrategy):
                 else:
                     # Normal context creation
                     context = await self.browser.new_context(
-                        user_agent=self.user_agent,
+                        user_agent=user_agent,
                         viewport={"width": 1920, "height": 1080},
                         proxy={"server": self.proxy} if self.proxy else None,
                         accept_downloads=self.accept_downloads,
+                        ignore_https_errors=True  # Add this line
                     )
                     if self.cookies:
                             await context.add_cookies(self.cookies)
diff --git a/crawl4ai/user_agent_generator.py b/crawl4ai/user_agent_generator.py
new file mode 100644
index 00000000..0a4df0bb
--- /dev/null
+++ b/crawl4ai/user_agent_generator.py
@@ -0,0 +1,262 @@
+import random
+from typing import Optional, Literal, List, Dict, Tuple
+import re
+
+
+class UserAgentGenerator:
+    def __init__(self):
+        # Previous platform definitions remain the same...
+        self.desktop_platforms = {
+            "windows": {
+                "10_64": "(Windows NT 10.0; Win64; x64)",
+                "10_32": "(Windows NT 10.0; WOW64)",
+            },
+            "macos": {
+                "intel": "(Macintosh; Intel Mac OS X 10_15_7)",
+                "newer": "(Macintosh; Intel Mac OS X 10.15; rv:109.0)",
+            },
+            "linux": {
+                "generic": "(X11; Linux x86_64)",
+                "ubuntu": "(X11; Ubuntu; Linux x86_64)",
+                "chrome_os": "(X11; CrOS x86_64 14541.0.0)",
+            }
+        }
+
+        self.mobile_platforms = {
+            "android": {
+                "samsung": "(Linux; Android 13; SM-S901B)",
+                "pixel": "(Linux; Android 12; Pixel 6)",
+                "oneplus": "(Linux; Android 13; OnePlus 9 Pro)",
+                "xiaomi": "(Linux; Android 12; M2102J20SG)",
+            },
+            "ios": {
+                "iphone": "(iPhone; CPU iPhone OS 16_5 like Mac OS X)",
+                "ipad": "(iPad; CPU OS 16_5 like Mac OS X)",
+            }
+        }
+
+        # Browser Combinations
+        self.browser_combinations = {
+            1: [
+                ["chrome"],
+                ["firefox"],
+                ["safari"],
+                ["edge"]
+            ],
+            2: [
+                ["gecko", "firefox"],
+                ["chrome", "safari"],
+                ["webkit", "safari"]
+            ],
+            3: [
+                ["chrome", "safari", "edge"],
+                ["webkit", "chrome", "safari"]
+            ]
+        }
+
+        # Rendering Engines with versions
+        self.rendering_engines = {
+            "chrome_webkit": "AppleWebKit/537.36",
+            "safari_webkit": "AppleWebKit/605.1.15",
+            "gecko": [  # Added Gecko versions
+                "Gecko/20100101",
+                "Gecko/20100101",  # Firefox usually uses this constant version
+                "Gecko/2010010",
+            ]
+        }
+
+        # Browser Versions
+        self.chrome_versions = [
+            "Chrome/119.0.6045.199",
+            "Chrome/118.0.5993.117",
+            "Chrome/117.0.5938.149",
+            "Chrome/116.0.5845.187",
+            "Chrome/115.0.5790.171",
+        ]
+
+        self.edge_versions = [
+            "Edg/119.0.2151.97",
+            "Edg/118.0.2088.76",
+            "Edg/117.0.2045.47",
+            "Edg/116.0.1938.81",
+            "Edg/115.0.1901.203",
+        ]
+
+        self.safari_versions = [
+            "Safari/537.36",  # For Chrome-based
+            "Safari/605.1.15",
+            "Safari/604.1",
+            "Safari/602.1",
+            "Safari/601.5.17",
+        ]
+
+        # Added Firefox versions
+        self.firefox_versions = [
+            "Firefox/119.0",
+            "Firefox/118.0.2",
+            "Firefox/117.0.1",
+            "Firefox/116.0",
+            "Firefox/115.0.3",
+            "Firefox/114.0.2",
+            "Firefox/113.0.1",
+            "Firefox/112.0",
+            "Firefox/111.0.1",
+            "Firefox/110.0",
+        ]
+
+    def get_browser_stack(self, num_browsers: int = 1) -> List[str]:
+        """Get a valid combination of browser versions"""
+        if num_browsers not in self.browser_combinations:
+            raise ValueError(f"Unsupported number of browsers: {num_browsers}")
+        
+        combination = random.choice(self.browser_combinations[num_browsers])
+        browser_stack = []
+        
+        for browser in combination:
+            if browser == "chrome":
+                browser_stack.append(random.choice(self.chrome_versions))
+            elif browser == "firefox":
+                browser_stack.append(random.choice(self.firefox_versions))
+            elif browser == "safari":
+                browser_stack.append(random.choice(self.safari_versions))
+            elif browser == "edge":
+                browser_stack.append(random.choice(self.edge_versions))
+            elif browser == "gecko":
+                browser_stack.append(random.choice(self.rendering_engines["gecko"]))
+            elif browser == "webkit":
+                browser_stack.append(self.rendering_engines["chrome_webkit"])
+        
+        return browser_stack
+
+    def generate(self, 
+                device_type: Optional[Literal['desktop', 'mobile']] = None,
+                os_type: Optional[str] = None,
+                device_brand: Optional[str] = None,
+                browser_type: Optional[Literal['chrome', 'edge', 'safari', 'firefox']] = None,
+                num_browsers: int = 3) -> str:
+        """
+        Generate a random user agent with specified constraints.
+        
+        Args:
+            device_type: 'desktop' or 'mobile'
+            os_type: 'windows', 'macos', 'linux', 'android', 'ios'
+            device_brand: Specific device brand
+            browser_type: 'chrome', 'edge', 'safari', or 'firefox'
+            num_browsers: Number of browser specifications (1-3)
+        """
+        # Get platform string
+        platform = self.get_random_platform(device_type, os_type, device_brand)
+        
+        # Start with Mozilla
+        components = ["Mozilla/5.0", platform]
+        
+        # Add browser stack
+        browser_stack = self.get_browser_stack(num_browsers)
+        
+        # Add appropriate legacy token based on browser stack
+        if "Firefox" in str(browser_stack):
+            components.append(random.choice(self.rendering_engines["gecko"]))
+        elif "Chrome" in str(browser_stack) or "Safari" in str(browser_stack):
+            components.append(self.rendering_engines["chrome_webkit"])
+            components.append("(KHTML, like Gecko)")
+        
+        # Add browser versions
+        components.extend(browser_stack)
+        
+        return " ".join(components)
+
+    def generate_with_client_hints(self, **kwargs) -> Tuple[str, str]:
+        """Generate both user agent and matching client hints"""
+        user_agent = self.generate(**kwargs)
+        client_hints = self.generate_client_hints(user_agent)
+        return user_agent, client_hints
+
+    def get_random_platform(self, device_type, os_type, device_brand):
+        """Helper method to get random platform based on constraints"""
+        platforms = self.desktop_platforms if device_type == 'desktop' else \
+                   self.mobile_platforms if device_type == 'mobile' else \
+                   {**self.desktop_platforms, **self.mobile_platforms}
+        
+        if os_type:
+            for platform_group in [self.desktop_platforms, self.mobile_platforms]:
+                if os_type in platform_group:
+                    platforms = {os_type: platform_group[os_type]}
+                    break
+        
+        os_key = random.choice(list(platforms.keys()))
+        if device_brand and device_brand in platforms[os_key]:
+            return platforms[os_key][device_brand]
+        return random.choice(list(platforms[os_key].values()))
+
+    def parse_user_agent(self, user_agent: str) -> Dict[str, str]:
+        """Parse a user agent string to extract browser and version information"""
+        browsers = {
+            'chrome': r'Chrome/(\d+)',
+            'edge': r'Edg/(\d+)',
+            'safari': r'Version/(\d+)',
+            'firefox': r'Firefox/(\d+)'
+        }
+        
+        result = {}
+        for browser, pattern in browsers.items():
+            match = re.search(pattern, user_agent)
+            if match:
+                result[browser] = match.group(1)
+        
+        return result
+
+    def generate_client_hints(self, user_agent: str) -> str:
+        """Generate Sec-CH-UA header value based on user agent string"""
+        browsers = self.parse_user_agent(user_agent)
+        
+        # Client hints components
+        hints = []
+        
+        # Handle different browser combinations
+        if 'chrome' in browsers:
+            hints.append(f'"Chromium";v="{browsers["chrome"]}"')
+            hints.append('"Not_A Brand";v="8"')
+            
+            if 'edge' in browsers:
+                hints.append(f'"Microsoft Edge";v="{browsers["edge"]}"')
+            else:
+                hints.append(f'"Google Chrome";v="{browsers["chrome"]}"')
+                
+        elif 'firefox' in browsers:
+            # Firefox doesn't typically send Sec-CH-UA
+            return '""'
+            
+        elif 'safari' in browsers:
+            # Safari's format for client hints
+            hints.append(f'"Safari";v="{browsers["safari"]}"')
+            hints.append('"Not_A Brand";v="8"')
+        
+        return ', '.join(hints)
+
+# Example usage:
+if __name__ == "__main__":
+    generator = UserAgentGenerator()
+    
+    print("\nSingle browser (Chrome):")
+    print(generator.generate(num_browsers=1, browser_type='chrome'))
+    
+    print("\nTwo browsers (Gecko/Firefox):")
+    print(generator.generate(num_browsers=2))
+    
+    print("\nThree browsers (Chrome/Safari/Edge):")
+    print(generator.generate(num_browsers=3))
+    
+    print("\nFirefox on Linux:")
+    print(generator.generate(
+        device_type='desktop',
+        os_type='linux',
+        browser_type='firefox',
+        num_browsers=2
+    ))
+    
+    print("\nChrome/Safari/Edge on Windows:")
+    print(generator.generate(
+        device_type='desktop',
+        os_type='windows',
+        num_browsers=3
+    ))
\ No newline at end of file

From 80d58ad24c64e30ab0c037496de89952516b772e Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Sat, 30 Nov 2024 22:00:15 +0800
Subject: [PATCH 110/115] bump version to 0.3.747

---
 crawl4ai/__version__.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/crawl4ai/__version__.py b/crawl4ai/__version__.py
index 4a938b75..189a2955 100644
--- a/crawl4ai/__version__.py
+++ b/crawl4ai/__version__.py
@@ -1,2 +1,2 @@
 # crawl4ai/_version.py
-__version__ = "0.3.746"
+__version__ = "0.3.747"

From 293f299c083aab97aa06e8a06045caa7273aae15 Mon Sep 17 00:00:00 2001
From: unclecode <unclecode@kidocode.com>
Date: Sun, 1 Dec 2024 19:17:33 +0800
Subject: [PATCH 111/115]   Add PruningContentFilter with unit tests and update
 documentation

  - Introduced the PruningContentFilter for better content relevance.
  - Implemented comprehensive unit tests for verification of functionality.
  - Enhanced existing BM25ContentFilter tests for edge case coverage.
  - Updated documentation to include usage examples for new filter.
---
 CHANGELOG.md                                  |  50 +++
 README.md                                     |   7 +-
 crawl4ai/content_filter_strategy.py           | 285 ++++++++++--------
 crawl4ai/content_scraping_strategy.py         |  13 +-
 docs/examples/quickstart_async.py             |   8 +-
 docs/md_v2/advanced/managed_browser.md        |  54 +++-
 docs/md_v2/basic/content_filtering.md         |  58 +++-
 ..._filter.py => test_content_filter_bm25.py} |   0
 tests/async/test_content_filter_prune.py      | 159 ++++++++++
 9 files changed, 499 insertions(+), 135 deletions(-)
 rename tests/async/{test_content_filter.py => test_content_filter_bm25.py} (100%)
 create mode 100644 tests/async/test_content_filter_prune.py

diff --git a/CHANGELOG.md b/CHANGELOG.md
index 309218dc..03a7afb0 100644
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -1,5 +1,55 @@
 # Changelog
 
+## [0.3.75] December 1, 2024
+
+### PruningContentFilter
+
+#### 1. Introduced PruningContentFilter (Dec 01, 2024)
+A new content filtering strategy that removes less relevant nodes based on metrics like text and link density.
+
+**Affected Files:**
+- `crawl4ai/content_filter_strategy.py`: Enhancement of content filtering capabilities.
+```diff
+Implemented effective pruning algorithm with comprehensive scoring.
+```
+- `README.md`: Improved documentation regarding new features.
+```diff
+Updated to include usage and explanation for the PruningContentFilter.
+```
+- `docs/md_v2/basic/content_filtering.md`: Expanded documentation for users.
+```diff
+Added detailed section explaining the PruningContentFilter.
+```
+
+#### 2. Added Unit Tests for PruningContentFilter (Dec 01, 2024)
+Comprehensive tests added to ensure correct functionality of PruningContentFilter.
+
+**Affected Files:**
+- `tests/async/test_content_filter_prune.py`: Increased test coverage for content filtering strategies.
+```diff
+Created test cases for various scenarios using the PruningContentFilter.
+```
+
+### Development Updates
+
+#### 3. Enhanced BM25ContentFilter tests (Dec 01, 2024)
+Extended testing to cover additional edge cases and performance metrics.
+
+**Affected Files:**
+- `tests/async/test_content_filter_bm25.py`: Improved reliability and performance assurance.
+```diff
+Added tests for new extraction scenarios including malformed HTML.
+```
+
+### Infrastructure & Documentation
+
+#### 4. Updated Examples (Dec 01, 2024)
+Altered examples in documentation to promote the use of PruningContentFilter alongside existing strategies.
+
+**Affected Files:**
+- `docs/examples/quickstart_async.py`: Enhanced usability and clarity for new users.
+- Revised example to illustrate usage of PruningContentFilter.
+
 ## [0.3.746] November 29, 2024
 
 ### Major Features
diff --git a/README.md b/README.md
index 405c1002..d70af8ad 100644
--- a/README.md
+++ b/README.md
@@ -422,7 +422,7 @@ You can check the project structure in the directory [https://github.com/uncleco
 ```python
 import asyncio
 from crawl4ai import AsyncWebCrawler, CacheMode
-from crawl4ai.content_filter_strategy import BM25ContentFilter
+from crawl4ai.content_filter_strategy import PruningContentFilter, BM25ContentFilter
 from crawl4ai.markdown_generation_strategy import DefaultMarkdownGenerator
 
 async def main():
@@ -434,8 +434,11 @@ async def main():
             url="https://docs.micronaut.io/4.7.6/guide/",
             cache_mode=CacheMode.ENABLED,
             markdown_generator=DefaultMarkdownGenerator(
-                content_filter=BM25ContentFilter(user_query=None, bm25_threshold=1.0)
+                content_filter=PruningContentFilter(threshold=0.48, threshold_type="fixed", min_word_threshold=0)
             ),
+            # markdown_generator=DefaultMarkdownGenerator(
+            #     content_filter=BM25ContentFilter(user_query="WHEN_WE_FOCUS_BASED_ON_A_USER_QUERY", bm25_threshold=1.0)
+            # ),
         )
         print(len(result.markdown))
         print(len(result.fit_markdown))
diff --git a/crawl4ai/content_filter_strategy.py b/crawl4ai/content_filter_strategy.py
index e6891a3f..ca3868bb 100644
--- a/crawl4ai/content_filter_strategy.py
+++ b/crawl4ai/content_filter_strategy.py
@@ -4,10 +4,10 @@ from typing import List, Tuple, Dict
 from rank_bm25 import BM25Okapi
 from time import perf_counter
 from collections import deque
-from bs4 import BeautifulSoup, NavigableString, Tag
+from bs4 import BeautifulSoup, NavigableString, Tag, Comment
 from .utils import clean_tokens
 from abc import ABC, abstractmethod
-
+import math
 from snowballstemmer import stemmer
 
 
@@ -358,145 +358,186 @@ class BM25ContentFilter(RelevantContentFilter):
         return [self.clean_element(tag) for _, _, tag in selected_candidates]
 
 
-class HeuristicContentFilter(RelevantContentFilter):
-    def __init__(self):
-        super().__init__()
-        # Weights for different heuristics
-        self.tag_weights = {
-            'article': 10,
-            'main': 8,
-            'section': 5,
-            'div': 3,
-            'p': 2,
-            'pre': 2,
-            'code': 2,
-            'blockquote': 2,
-            'li': 1,
-            'span': 1,
-        }
-        self.max_depth = 5  # Maximum depth from body to consider
 
-    def filter_content(self, html: str) -> List[str]:
-        """Implements heuristic content filtering without relying on a query."""
+
+
+
+class PruningContentFilter(RelevantContentFilter):
+    def __init__(self, user_query: str = None, min_word_threshold: int = None, 
+                 threshold_type: str = 'fixed', threshold: float = 0.48):
+        super().__init__(user_query)
+        self.min_word_threshold = min_word_threshold
+        self.threshold_type = threshold_type
+        self.threshold = threshold
+        
+        # Add tag importance for dynamic threshold
+        self.tag_importance = {
+            'article': 1.5,
+            'main': 1.4,
+            'section': 1.3,
+            'p': 1.2,
+            'h1': 1.4,
+            'h2': 1.3,
+            'h3': 1.2,
+            'div': 0.7,
+            'span': 0.6
+        }
+        
+        # Metric configuration
+        self.metric_config = {
+            'text_density': True,
+            'link_density': True,
+            'tag_weight': True,
+            'class_id_weight': True,
+            'text_length': True,
+        }
+        
+        self.metric_weights = {
+            'text_density': 0.4,
+            'link_density': 0.2,
+            'tag_weight': 0.2,
+            'class_id_weight': 0.1,
+            'text_length': 0.1,
+        }
+        
+        self.tag_weights = {
+            'div': 0.5,
+            'p': 1.0,
+            'article': 1.5,
+            'section': 1.0,
+            'span': 0.3,
+            'li': 0.5,
+            'ul': 0.5,
+            'ol': 0.5,
+            'h1': 1.2,
+            'h2': 1.1,
+            'h3': 1.0,
+            'h4': 0.9,
+            'h5': 0.8,
+            'h6': 0.7,
+        }
+
+    def filter_content(self, html: str, min_word_threshold: int = None) -> List[str]:
         if not html or not isinstance(html, str):
             return []
-
+            
         soup = BeautifulSoup(html, 'lxml')
-
-        # Ensure there is a body tag
         if not soup.body:
             soup = BeautifulSoup(f'<body>{html}</body>', 'lxml')
-        body = soup.body
+        
+        # Remove comments and unwanted tags
+        self._remove_comments(soup)
+        self._remove_unwanted_tags(soup)
+        
+        # Prune tree starting from body
+        body = soup.find('body')
+        self._prune_tree(body)
+        
+        # Extract remaining content as list of HTML strings
+        content_blocks = []
+        for element in body.children:
+            if isinstance(element, str) or not hasattr(element, 'name'):
+                continue
+            if len(element.get_text(strip=True)) > 0:
+                content_blocks.append(str(element))
+                
+        return content_blocks
 
-        # Extract candidate text chunks
-        candidates = self.extract_text_chunks(body)
+    def _remove_comments(self, soup):
+        for element in soup(text=lambda text: isinstance(text, Comment)):
+            element.extract()
 
-        if not candidates:
-            return []
+    def _remove_unwanted_tags(self, soup):
+        for tag in self.excluded_tags:
+            for element in soup.find_all(tag):
+                element.decompose()
 
-        # Score each candidate
-        scored_candidates = []
-        for index, text, tag_type, tag in candidates:
-            score = self.score_element(tag, text)
-            if score > 0:
-                scored_candidates.append((score, index, text, tag))
+    def _prune_tree(self, node):
+        if not node or not hasattr(node, 'name') or node.name is None:
+            return
 
-        # Sort candidates by score and then by document order
-        scored_candidates.sort(key=lambda x: (-x[0], x[1]))
+        text_len = len(node.get_text(strip=True))
+        tag_len = len(node.encode_contents().decode('utf-8'))
+        link_text_len = sum(len(s.strip()) for s in (a.string for a in node.find_all('a', recursive=False)) if s)
 
-        # Extract the top candidates (e.g., top 5)
-        top_candidates = scored_candidates[:5]  # Adjust the number as needed
+        metrics = {
+            'node': node,
+            'tag_name': node.name,
+            'text_len': text_len,
+            'tag_len': tag_len,
+            'link_text_len': link_text_len
+        }
 
-        # Sort the top candidates back to their original document order
-        top_candidates.sort(key=lambda x: x[1])
+        score = self._compute_composite_score(metrics)
 
-        # Clean and return the content
-        return [self.clean_element(tag) for _, _, _, tag in top_candidates]
+        if self.threshold_type == 'fixed':
+            should_remove = score < self.threshold
+        else:  # dynamic
+            tag_importance = self.tag_importance.get(node.name, 0.7)
+            text_ratio = text_len / tag_len if tag_len > 0 else 0
+            link_ratio = link_text_len / text_len if text_len > 0 else 1
+            
+            threshold = self.threshold  # base threshold
+            if tag_importance > 1:
+                threshold *= 0.8
+            if text_ratio > 0.4:
+                threshold *= 0.9
+            if link_ratio > 0.6:
+                threshold *= 1.2
+                
+            should_remove = score < threshold
 
-    def score_element(self, tag: Tag, text: str) -> float:
-        """Compute a score for an element based on heuristics."""
-        if not text or not tag:
-            return 0
+        if should_remove:
+            node.decompose()
+        else:
+            children = [child for child in node.children if hasattr(child, 'name')]
+            for child in children:
+                self._prune_tree(child)
 
-        # Exclude unwanted tags
-        if self.is_excluded(tag):
-            return 0
+    def _compute_composite_score(self, metrics, text_len, tag_len, link_text_len):
+        if self.min_word_threshold:
+            # Get raw text from metrics node - avoid extra processing
+            text = metrics['node'].get_text(strip=True)
+            word_count = text.count(' ') + 1
+            if word_count < self.min_word_threshold:
+                return -1.0  # Guaranteed removal
+        score = 0.0
+        total_weight = 0.0
 
-        # Text density
-        text_length = len(text.strip())
-        html_length = len(str(tag))
-        text_density = text_length / html_length if html_length > 0 else 0
+        if self.metric_config['text_density']:
+            density = text_len / tag_len if tag_len > 0 else 0
+            score += self.metric_weights['text_density'] * density
+            total_weight += self.metric_weights['text_density']
 
-        # Link density
-        link_text_length = sum(len(a.get_text().strip()) for a in tag.find_all('a'))
-        link_density = link_text_length / text_length if text_length > 0 else 0
+        if self.metric_config['link_density']:
+            density = 1 - (link_text_len / text_len if text_len > 0 else 0)
+            score += self.metric_weights['link_density'] * density
+            total_weight += self.metric_weights['link_density']
 
-        # Tag weight
-        tag_weight = self.tag_weights.get(tag.name, 1)
+        if self.metric_config['tag_weight']:
+            tag_score = self.tag_weights.get(metrics['tag_name'], 0.5)
+            score += self.metric_weights['tag_weight'] * tag_score
+            total_weight += self.metric_weights['tag_weight']
 
-        # Depth factor (prefer elements closer to the body tag)
-        depth = self.get_depth(tag)
-        depth_weight = max(self.max_depth - depth, 1) / self.max_depth
+        if self.metric_config['class_id_weight']:
+            class_score = self._compute_class_id_weight(metrics['node'])
+            score += self.metric_weights['class_id_weight'] * max(0, class_score)
+            total_weight += self.metric_weights['class_id_weight']
 
-        # Compute the final score
-        score = (text_density * tag_weight * depth_weight) / (1 + link_density)
+        if self.metric_config['text_length']:
+            score += self.metric_weights['text_length'] * math.log(text_len + 1)
+            total_weight += self.metric_weights['text_length']
 
-        return score
+        return score / total_weight if total_weight > 0 else 0
 
-    def get_depth(self, tag: Tag) -> int:
-        """Compute the depth of the tag from the body tag."""
-        depth = 0
-        current = tag
-        while current and current != current.parent and current.name != 'body':
-            current = current.parent
-            depth += 1
-        return depth
-
-    def extract_text_chunks(self, body: Tag) -> List[Tuple[int, str, str, Tag]]:
-        """
-        Extracts text chunks from the body element while preserving order.
-        Returns list of tuples (index, text, tag_type, tag) for scoring.
-        """
-        chunks = []
-        index = 0
-
-        def traverse(element):
-            nonlocal index
-            if isinstance(element, NavigableString):
-                return
-            if not isinstance(element, Tag):
-                return
-            if self.is_excluded(element):
-                return
-            # Only consider included tags
-            if element.name in self.included_tags:
-                text = element.get_text(separator=' ', strip=True)
-                if len(text.split()) >= self.min_word_count:
-                    tag_type = 'header' if element.name in self.header_tags else 'content'
-                    chunks.append((index, text, tag_type, element))
-                    index += 1
-                    # Do not traverse children of this element to prevent duplication
-                    return
-            for child in element.children:
-                traverse(child)
-
-        traverse(body)
-        return chunks
-
-    def is_excluded(self, tag: Tag) -> bool:
-        """Determine if a tag should be excluded based on heuristics."""
-        if tag.name in self.excluded_tags:
-            return True
-        class_id = ' '.join(filter(None, [
-            ' '.join(tag.get('class', [])),
-            tag.get('id', '')
-        ]))
-        if self.negative_patterns.search(class_id):
-            return True
-        # Exclude tags with high link density (e.g., navigation menus)
-        text = tag.get_text(separator=' ', strip=True)
-        link_text_length = sum(len(a.get_text(strip=True)) for a in tag.find_all('a'))
-        text_length = len(text)
-        if text_length > 0 and (link_text_length / text_length) > 0.5:
-            return True
-        return False
+    def _compute_class_id_weight(self, node):
+        class_id_score = 0
+        if 'class' in node.attrs:
+            classes = ' '.join(node['class'])
+            if self.negative_patterns.match(classes):
+                class_id_score -= 0.5
+        if 'id' in node.attrs:
+            element_id = node['id']
+            if self.negative_patterns.match(element_id):
+                class_id_score -= 0.5
+        return class_id_score
\ No newline at end of file
diff --git a/crawl4ai/content_scraping_strategy.py b/crawl4ai/content_scraping_strategy.py
index ec6c3361..de8894b7 100644
--- a/crawl4ai/content_scraping_strategy.py
+++ b/crawl4ai/content_scraping_strategy.py
@@ -9,7 +9,7 @@ from bs4 import element, NavigableString, Comment
 from urllib.parse import urljoin
 from requests.exceptions import InvalidSchema
 # from .content_cleaning_strategy import ContentCleaningStrategy
-from .content_filter_strategy import RelevantContentFilter, BM25ContentFilter#, HeuristicContentFilter
+from .content_filter_strategy import RelevantContentFilter, BM25ContentFilter, PruningContentFilter
 from .markdown_generation_strategy import MarkdownGenerationStrategy, DefaultMarkdownGenerator
 from .models import MarkdownGenerationResult
 from .utils import (
@@ -110,10 +110,15 @@ class WebScrapingStrategy(ContentScrapingStrategy):
         if markdown_generator:
             try:
                 if kwargs.get('fit_markdown', False) and not markdown_generator.content_filter:
-                        markdown_generator.content_filter = BM25ContentFilter(
-                            user_query=kwargs.get('fit_markdown_user_query', None),
-                            bm25_threshold=kwargs.get('fit_markdown_bm25_threshold', 1.0)
+                        markdown_generator.content_filter = PruningContentFilter(
+                            threshold_type=kwargs.get('fit_markdown_treshold_type', 'fixed'),
+                            threshold=kwargs.get('fit_markdown_treshold', 0.48),
+                            min_word_threshold=kwargs.get('fit_markdown_min_word_threshold', ),
                         )
+                        # markdown_generator.content_filter = BM25ContentFilter(
+                        #     user_query=kwargs.get('fit_markdown_user_query', None),
+                        #     bm25_threshold=kwargs.get('fit_markdown_bm25_threshold', 1.0)
+                        # )
                 
                 markdown_result: MarkdownGenerationResult = markdown_generator.generate_markdown(
                     cleaned_html=cleaned_html,
diff --git a/docs/examples/quickstart_async.py b/docs/examples/quickstart_async.py
index 679a9bc2..73d695c3 100644
--- a/docs/examples/quickstart_async.py
+++ b/docs/examples/quickstart_async.py
@@ -15,7 +15,7 @@ from bs4 import BeautifulSoup
 from pydantic import BaseModel, Field
 from crawl4ai import AsyncWebCrawler, CacheMode
 from crawl4ai.markdown_generation_strategy import DefaultMarkdownGenerator
-from crawl4ai.content_filter_strategy import BM25ContentFilter
+from crawl4ai.content_filter_strategy import BM25ContentFilter, PruningContentFilter
 from crawl4ai.extraction_strategy import (
     JsonCssExtractionStrategy,
     LLMExtractionStrategy,
@@ -466,7 +466,8 @@ async def speed_comparison():
             url="https://www.nbcnews.com/business",
             word_count_threshold=0,
             markdown_generator=DefaultMarkdownGenerator(
-                content_filter=BM25ContentFilter(user_query=None, bm25_threshold=1.0)
+                content_filter = PruningContentFilter(threshold=0.48, threshold_type="fixed", min_word_threshold=0)
+                # content_filter=BM25ContentFilter(user_query=None, bm25_threshold=1.0)
             ),
             cache_mode=CacheMode.BYPASS,
             verbose=False,
@@ -489,7 +490,8 @@ async def speed_comparison():
             word_count_threshold=0,
             cache_mode=CacheMode.BYPASS,
             markdown_generator=DefaultMarkdownGenerator(
-                content_filter=BM25ContentFilter(user_query=None, bm25_threshold=1.0)
+                content_filter = PruningContentFilter(threshold=0.48, threshold_type="fixed", min_word_threshold=0)
+                # content_filter=BM25ContentFilter(user_query=None, bm25_threshold=1.0)
             ),
             verbose=False,
         )
diff --git a/docs/md_v2/advanced/managed_browser.md b/docs/md_v2/advanced/managed_browser.md
index 80d6fc1a..0d327f2e 100644
--- a/docs/md_v2/advanced/managed_browser.md
+++ b/docs/md_v2/advanced/managed_browser.md
@@ -4,7 +4,59 @@ This guide explains how to use content filtering strategies in Crawl4AI to extra
 
 ## Relevance Content Filter
 
-The `RelevanceContentFilter` is an abstract class that provides a common interface for content filtering strategies. Specific filtering algorithms, like `BM25ContentFilter`, inherit from this class and implement the `filter_content` method. This method takes the HTML content as input and returns a list of filtered text blocks.
+The `RelevantContentFilter` is an abstract class that provides a common interface for content filtering strategies. Specific filtering algorithms, like `PruningContentFilter` or `BM25ContentFilter`, inherit from this class and implement the `filter_content` method. This method takes the HTML content as input and returns a list of filtered text blocks.
+
+
+## Pruning Content Filter
+
+The `PruningContentFilter` is a tree-shaking algorithm that analyzes the HTML DOM structure and removes less relevant nodes based on various metrics like text density, link density, and tag importance. It evaluates each node using a composite scoring system and "prunes" nodes that fall below a certain threshold.
+
+### Usage
+
+```python
+from crawl4ai import AsyncWebCrawler
+from crawl4ai.content_filter_strategy import PruningContentFilter
+
+async def filter_content(url):
+    async with AsyncWebCrawler() as crawler:
+        content_filter = PruningContentFilter(
+            min_word_threshold=5,
+            threshold_type='dynamic',
+            threshold=0.45
+        )
+        result = await crawler.arun(url=url, extraction_strategy=content_filter, fit_markdown=True)
+        if result.success:
+            print(f"Cleaned Markdown:\n{result.fit_markdown}")
+```
+
+### Parameters
+
+- **`min_word_threshold`**: (Optional) Minimum number of words a node must contain to be considered relevant. Nodes with fewer words are automatically pruned.
+
+- **`threshold_type`**: (Optional, default 'fixed') Controls how pruning thresholds are calculated:
+  - `'fixed'`: Uses a constant threshold value for all nodes
+  - `'dynamic'`: Adjusts threshold based on node characteristics like tag importance and text/link ratios
+
+- **`threshold`**: (Optional, default 0.48) Base threshold value for node pruning:
+  - For fixed threshold: Nodes scoring below this value are removed
+  - For dynamic threshold: This value is adjusted based on node properties
+
+### How It Works
+
+The pruning algorithm evaluates each node using multiple metrics:
+- Text density: Ratio of actual text to overall node content
+- Link density: Proportion of text within links
+- Tag importance: Weight based on HTML tag type (e.g., article, p, div)
+- Content quality: Metrics like text length and structural importance
+
+Nodes scoring below the threshold are removed, effectively "shaking" less relevant content from the DOM tree. This results in a cleaner document containing only the most relevant content blocks.
+
+The algorithm is particularly effective for:
+- Removing boilerplate content
+- Eliminating navigation menus and sidebars
+- Preserving main article content
+- Maintaining document structure while removing noise
+
 
 ## BM25 Algorithm
 
diff --git a/docs/md_v2/basic/content_filtering.md b/docs/md_v2/basic/content_filtering.md
index 9506c075..0d327f2e 100644
--- a/docs/md_v2/basic/content_filtering.md
+++ b/docs/md_v2/basic/content_filtering.md
@@ -4,7 +4,59 @@ This guide explains how to use content filtering strategies in Crawl4AI to extra
 
 ## Relevance Content Filter
 
-The `RelevanceContentFilter` is an abstract class that provides a common interface for content filtering strategies. Specific filtering algorithms, like `BM25ContentFilter`, inherit from this class and implement the `filter_content` method. This method takes the HTML content as input and returns a list of filtered text blocks.
+The `RelevantContentFilter` is an abstract class that provides a common interface for content filtering strategies. Specific filtering algorithms, like `PruningContentFilter` or `BM25ContentFilter`, inherit from this class and implement the `filter_content` method. This method takes the HTML content as input and returns a list of filtered text blocks.
+
+
+## Pruning Content Filter
+
+The `PruningContentFilter` is a tree-shaking algorithm that analyzes the HTML DOM structure and removes less relevant nodes based on various metrics like text density, link density, and tag importance. It evaluates each node using a composite scoring system and "prunes" nodes that fall below a certain threshold.
+
+### Usage
+
+```python
+from crawl4ai import AsyncWebCrawler
+from crawl4ai.content_filter_strategy import PruningContentFilter
+
+async def filter_content(url):
+    async with AsyncWebCrawler() as crawler:
+        content_filter = PruningContentFilter(
+            min_word_threshold=5,
+            threshold_type='dynamic',
+            threshold=0.45
+        )
+        result = await crawler.arun(url=url, extraction_strategy=content_filter, fit_markdown=True)
+        if result.success:
+            print(f"Cleaned Markdown:\n{result.fit_markdown}")
+```
+
+### Parameters
+
+- **`min_word_threshold`**: (Optional) Minimum number of words a node must contain to be considered relevant. Nodes with fewer words are automatically pruned.
+
+- **`threshold_type`**: (Optional, default 'fixed') Controls how pruning thresholds are calculated:
+  - `'fixed'`: Uses a constant threshold value for all nodes
+  - `'dynamic'`: Adjusts threshold based on node characteristics like tag importance and text/link ratios
+
+- **`threshold`**: (Optional, default 0.48) Base threshold value for node pruning:
+  - For fixed threshold: Nodes scoring below this value are removed
+  - For dynamic threshold: This value is adjusted based on node properties
+
+### How It Works
+
+The pruning algorithm evaluates each node using multiple metrics:
+- Text density: Ratio of actual text to overall node content
+- Link density: Proportion of text within links
+- Tag importance: Weight based on HTML tag type (e.g., article, p, div)
+- Content quality: Metrics like text length and structural importance
+
+Nodes scoring below the threshold are removed, effectively "shaking" less relevant content from the DOM tree. This results in a cleaner document containing only the most relevant content blocks.
+
+The algorithm is particularly effective for:
+- Removing boilerplate content
+- Eliminating navigation menus and sidebars
+- Preserving main article content
+- Maintaining document structure while removing noise
+
 
 ## BM25 Algorithm
 
@@ -21,7 +73,7 @@ from crawl4ai.content_filter_strategy import BM25ContentFilter
 async def filter_content(url, query=None):
     async with AsyncWebCrawler() as crawler:
         content_filter = BM25ContentFilter(user_query=query)
-        result = await crawler.arun(url=url, content_filter=content_filter, fit_markdown=True) # Set fit_markdown flag to True to trigger BM25 filtering
+        result = await crawler.arun(url=url, extraction_strategy=content_filter, fit_markdown=True) # Set fit_markdown flag to True to trigger BM25 filtering
         if result.success:
             print(f"Filtered Content (JSON):\n{result.extracted_content}")
             print(f"\nFiltered Markdown:\n{result.fit_markdown}") # New field in CrawlResult object
@@ -71,7 +123,7 @@ class MyCustomFilter(RelevantContentFilter):
 async def custom_filter_demo(url: str):
     async with AsyncWebCrawler() as crawler:
         custom_filter = MyCustomFilter()
-        result = await crawler.arun(url, content_filter=custom_filter)
+        result = await crawler.arun(url, extraction_strategy=custom_filter)
         if result.success:
             print(result.extracted_content)
 
diff --git a/tests/async/test_content_filter.py b/tests/async/test_content_filter_bm25.py
similarity index 100%
rename from tests/async/test_content_filter.py
rename to tests/async/test_content_filter_bm25.py
diff --git a/tests/async/test_content_filter_prune.py b/tests/async/test_content_filter_prune.py
new file mode 100644
index 00000000..23b0fa3a
--- /dev/null
+++ b/tests/async/test_content_filter_prune.py
@@ -0,0 +1,159 @@
+import os, sys
+import pytest
+from bs4 import BeautifulSoup
+
+parent_dir = os.path.dirname(os.path.dirname(os.path.abspath(__file__)))
+sys.path.append(parent_dir)
+
+from crawl4ai.content_filter_strategy import PruningContentFilter
+
+@pytest.fixture
+def basic_html():
+    return """
+    <html>
+        <body>
+            <article>
+                <h1>Main Article</h1>
+                <p>This is a high-quality paragraph with substantial text content. It contains enough words to pass the threshold and has good text density without too many links. This kind of content should survive the pruning process.</p>
+                <div class="sidebar">Low quality sidebar content</div>
+                <div class="social-share">Share buttons</div>
+            </article>
+        </body>
+    </html>
+    """
+
+@pytest.fixture
+def link_heavy_html():
+    return """
+    <html>
+        <body>
+            <div class="content">
+                <p>Good content paragraph that should remain.</p>
+                <div class="links">
+                    <a href="#">Link 1</a>
+                    <a href="#">Link 2</a>
+                    <a href="#">Link 3</a>
+                    <a href="#">Link 4</a>
+                </div>
+            </div>
+        </body>
+    </html>
+    """
+
+@pytest.fixture
+def mixed_content_html():
+    return """
+    <html>
+        <body>
+            <article>
+                <h1>Article Title</h1>
+                <p class="summary">Short summary.</p>
+                <div class="content">
+                    <p>Long high-quality paragraph with substantial content that should definitely survive the pruning process. This content has good text density and proper formatting which makes it valuable for retention.</p>
+                </div>
+                <div class="comments">
+                    <p>Short comment 1</p>
+                    <p>Short comment 2</p>
+                </div>
+            </article>
+        </body>
+    </html>
+    """
+
+class TestPruningContentFilter:
+    def test_basic_pruning(self, basic_html):
+        """Test basic content pruning functionality"""
+        filter = PruningContentFilter(min_word_threshold=5)
+        contents = filter.filter_content(basic_html)
+        
+        combined_content = ' '.join(contents).lower()
+        assert "high-quality paragraph" in combined_content
+        assert "sidebar content" not in combined_content
+        assert "share buttons" not in combined_content
+
+    def test_min_word_threshold(self, mixed_content_html):
+        """Test minimum word threshold filtering"""
+        filter = PruningContentFilter(min_word_threshold=10)
+        contents = filter.filter_content(mixed_content_html)
+        
+        combined_content = ' '.join(contents).lower()
+        assert "short summary" not in combined_content
+        assert "long high-quality paragraph" in combined_content
+        assert "short comment" not in combined_content
+
+    def test_threshold_types(self, basic_html):
+        """Test fixed vs dynamic thresholds"""
+        fixed_filter = PruningContentFilter(threshold_type='fixed', threshold=0.48)
+        dynamic_filter = PruningContentFilter(threshold_type='dynamic', threshold=0.45)
+        
+        fixed_contents = fixed_filter.filter_content(basic_html)
+        dynamic_contents = dynamic_filter.filter_content(basic_html)
+        
+        assert len(fixed_contents) != len(dynamic_contents), \
+            "Fixed and dynamic thresholds should yield different results"
+
+    def test_link_density_impact(self, link_heavy_html):
+        """Test handling of link-heavy content"""
+        filter = PruningContentFilter(threshold_type='dynamic')
+        contents = filter.filter_content(link_heavy_html)
+        
+        combined_content = ' '.join(contents).lower()
+        assert "good content paragraph" in combined_content
+        assert len([c for c in contents if 'href' in c]) < 2, \
+            "Should prune link-heavy sections"
+
+    def test_tag_importance(self, mixed_content_html):
+        """Test tag importance in scoring"""
+        filter = PruningContentFilter(threshold_type='dynamic')
+        contents = filter.filter_content(mixed_content_html)
+        
+        has_article = any('article' in c.lower() for c in contents)
+        has_h1 = any('h1' in c.lower() for c in contents)
+        assert has_article or has_h1, "Should retain important tags"
+
+    def test_empty_input(self):
+        """Test handling of empty input"""
+        filter = PruningContentFilter()
+        assert filter.filter_content("") == []
+        assert filter.filter_content(None) == []
+
+    def test_malformed_html(self):
+        """Test handling of malformed HTML"""
+        malformed_html = "<div>Unclosed div<p>Nested<span>content</div>"
+        filter = PruningContentFilter()
+        contents = filter.filter_content(malformed_html)
+        assert isinstance(contents, list)
+
+    def test_performance(self, basic_html):
+        """Test performance with timer"""
+        filter = PruningContentFilter()
+        
+        import time
+        start = time.perf_counter()
+        filter.filter_content(basic_html)
+        duration = time.perf_counter() - start
+        
+        # Extra strict on performance since you mentioned milliseconds matter
+        assert duration < 0.1, f"Processing took too long: {duration:.3f} seconds"
+
+    @pytest.mark.parametrize("threshold,expected_count", [
+        (0.3, 4),  # Very lenient
+        (0.48, 2), # Default
+        (0.7, 1),  # Very strict
+    ])
+    def test_threshold_levels(self, mixed_content_html, threshold, expected_count):
+        """Test different threshold levels"""
+        filter = PruningContentFilter(threshold_type='fixed', threshold=threshold)
+        contents = filter.filter_content(mixed_content_html)
+        assert len(contents) <= expected_count, \
+            f"Expected {expected_count} or fewer elements with threshold {threshold}"
+
+    def test_consistent_output(self, basic_html):
+        """Test output consistency across multiple runs"""
+        filter = PruningContentFilter()
+        first_run = filter.filter_content(basic_html)
+        second_run = filter.filter_content(basic_html)
+        assert first_run == second_run, "Output should be consistent"
+
+if __name__ == "__main__":
+    pytest.main([__file__])
\ No newline at end of file

From 95a4f74d2a9c0ae8c6f727cce6f6d0c17694aeb4 Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Mon, 2 Dec 2024 20:37:28 +0800
Subject: [PATCH 112/115] fix: pass logger to WebScrapingStrategy and update
 score computation in PruningContentFilter

---
 crawl4ai/async_webcrawler.py        | 4 +++-
 crawl4ai/content_filter_strategy.py | 2 +-
 2 files changed, 4 insertions(+), 2 deletions(-)

diff --git a/crawl4ai/async_webcrawler.py b/crawl4ai/async_webcrawler.py
index 66b4c21b..8db69333 100644
--- a/crawl4ai/async_webcrawler.py
+++ b/crawl4ai/async_webcrawler.py
@@ -472,7 +472,9 @@ class AsyncWebCrawler:
         try:
             _url = url if not kwargs.get("is_raw_html", False) else "Raw HTML"
             t1 = time.perf_counter()
-            scrapping_strategy = WebScrapingStrategy()
+            scrapping_strategy = WebScrapingStrategy(
+                logger=self.logger,
+            )
             # result = await scrapping_strategy.ascrap(
             result = scrapping_strategy.scrap(
                 url,
diff --git a/crawl4ai/content_filter_strategy.py b/crawl4ai/content_filter_strategy.py
index ca3868bb..f05b92fa 100644
--- a/crawl4ai/content_filter_strategy.py
+++ b/crawl4ai/content_filter_strategy.py
@@ -468,7 +468,7 @@ class PruningContentFilter(RelevantContentFilter):
             'link_text_len': link_text_len
         }
 
-        score = self._compute_composite_score(metrics)
+        score = self._compute_composite_score(metrics, text_len, tag_len, link_text_len)
 
         if self.threshold_type == 'fixed':
             should_remove = score < self.threshold

From e9639ad18972d11929823ff9b1bb9794ad938750 Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Tue, 3 Dec 2024 19:44:38 +0800
Subject: [PATCH 113/115] refactor: improve error handling in DataProcessor and
 optimize data parsing logic

---
 crawl4ai/async_webcrawler.py | 305 ++++++++++++++++++-----------------
 1 file changed, 155 insertions(+), 150 deletions(-)

diff --git a/crawl4ai/async_webcrawler.py b/crawl4ai/async_webcrawler.py
index 8db69333..2c17602d 100644
--- a/crawl4ai/async_webcrawler.py
+++ b/crawl4ai/async_webcrawler.py
@@ -7,6 +7,7 @@ from pathlib import Path
 from typing import Optional, List, Union
 import json
 import asyncio
+from contextlib import nullcontext
 from .models import CrawlResult, MarkdownGenerationResult
 from .async_database import async_db_manager
 from .chunking_strategy import *
@@ -67,6 +68,7 @@ class AsyncWebCrawler:
         always_bypass_cache: bool = False,
         always_by_pass_cache: Optional[bool] = None,  # Deprecated parameter
         base_directory: str = str(os.getenv("CRAWL4_AI_BASE_DIRECTORY", Path.home())),
+        thread_safe: bool = False,
         **kwargs,
     ):
         """
@@ -104,6 +106,8 @@ class AsyncWebCrawler:
         else:
             self.always_bypass_cache = always_bypass_cache
 
+        self._lock = asyncio.Lock() if thread_safe else None
+        
         self.crawl4ai_folder = os.path.join(base_directory, ".crawl4ai")
         os.makedirs(self.crawl4ai_folder, exist_ok=True)
         os.makedirs(f"{self.crawl4ai_folder}/cache", exist_ok=True)
@@ -178,169 +182,170 @@ class AsyncWebCrawler:
         Returns:
             CrawlResult: The result of crawling and processing
         """
-        try:
-            # Handle deprecated parameters
-            if any([bypass_cache, disable_cache, no_cache_read, no_cache_write]):
-                if kwargs.get("warning", True):
-                    warnings.warn(
-                        "Cache control boolean flags are deprecated and will be removed in version X.X.X. "
-                        "Use 'cache_mode' parameter instead. Examples:\n"
-                        "- For bypass_cache=True, use cache_mode=CacheMode.BYPASS\n"
-                        "- For disable_cache=True, use cache_mode=CacheMode.DISABLED\n"
-                        "- For no_cache_read=True, use cache_mode=CacheMode.WRITE_ONLY\n"
-                        "- For no_cache_write=True, use cache_mode=CacheMode.READ_ONLY\n"
-                        "Pass warning=False to suppress this warning.",
-                        DeprecationWarning,
-                        stacklevel=2
-                    )
+        async with self._lock or nullcontext():
+            try:
+                # Handle deprecated parameters
+                if any([bypass_cache, disable_cache, no_cache_read, no_cache_write]):
+                    if kwargs.get("warning", True):
+                        warnings.warn(
+                            "Cache control boolean flags are deprecated and will be removed in version X.X.X. "
+                            "Use 'cache_mode' parameter instead. Examples:\n"
+                            "- For bypass_cache=True, use cache_mode=CacheMode.BYPASS\n"
+                            "- For disable_cache=True, use cache_mode=CacheMode.DISABLED\n"
+                            "- For no_cache_read=True, use cache_mode=CacheMode.WRITE_ONLY\n"
+                            "- For no_cache_write=True, use cache_mode=CacheMode.READ_ONLY\n"
+                            "Pass warning=False to suppress this warning.",
+                            DeprecationWarning,
+                            stacklevel=2
+                        )
+                    
+                    # Convert legacy parameters if cache_mode not provided
+                    if cache_mode is None:
+                        cache_mode = _legacy_to_cache_mode(
+                            disable_cache=disable_cache,
+                            bypass_cache=bypass_cache,
+                            no_cache_read=no_cache_read,
+                            no_cache_write=no_cache_write
+                        )
                 
-                # Convert legacy parameters if cache_mode not provided
+                # Default to ENABLED if no cache mode specified
                 if cache_mode is None:
-                    cache_mode = _legacy_to_cache_mode(
-                        disable_cache=disable_cache,
-                        bypass_cache=bypass_cache,
-                        no_cache_read=no_cache_read,
-                        no_cache_write=no_cache_write
+                    cache_mode = CacheMode.ENABLED
+
+                # Create cache context
+                cache_context = CacheContext(url, cache_mode, self.always_bypass_cache)
+
+                extraction_strategy = extraction_strategy or NoExtractionStrategy()
+                extraction_strategy.verbose = verbose
+                if not isinstance(extraction_strategy, ExtractionStrategy):
+                    raise ValueError("Unsupported extraction strategy")
+                if not isinstance(chunking_strategy, ChunkingStrategy):
+                    raise ValueError("Unsupported chunking strategy")
+                
+                word_count_threshold = max(word_count_threshold, MIN_WORD_THRESHOLD)
+
+                async_response: AsyncCrawlResponse = None
+                cached_result = None
+                screenshot_data = None
+                extracted_content = None
+                
+                start_time = time.perf_counter()
+                
+                # Try to get cached result if appropriate
+                if cache_context.should_read():
+                    cached_result = await async_db_manager.aget_cached_url(url)
+                            
+                if cached_result:
+                    html = sanitize_input_encode(cached_result.html)
+                    extracted_content = sanitize_input_encode(cached_result.extracted_content or "")
+                    if screenshot:
+                        screenshot_data = cached_result.screenshot
+                        if not screenshot_data:
+                            cached_result = None
+                    # if verbose:
+                    #     print(f"{Fore.BLUE}{self.tag_format('FETCH')} {self.log_icons['FETCH']} Cache hit for {cache_context.display_url} | Status: {Fore.GREEN if bool(html) else Fore.RED}{bool(html)}{Style.RESET_ALL} | Time: {time.perf_counter() - start_time:.2f}s")
+                    self.logger.url_status(
+                            url=cache_context.display_url,
+                            success=bool(html),
+                            timing=time.perf_counter() - start_time,
+                            tag="FETCH"
+                        )                    
+
+
+                # Fetch fresh content if needed
+                if not cached_result or not html:
+                    t1 = time.perf_counter()
+                    
+                    if user_agent:
+                        self.crawler_strategy.update_user_agent(user_agent)
+                    async_response: AsyncCrawlResponse = await self.crawler_strategy.crawl(
+                        url, 
+                        screenshot=screenshot, 
+                        **kwargs
                     )
-            
-            # Default to ENABLED if no cache mode specified
-            if cache_mode is None:
-                cache_mode = CacheMode.ENABLED
-
-            # Create cache context
-            cache_context = CacheContext(url, cache_mode, self.always_bypass_cache)
-
-            extraction_strategy = extraction_strategy or NoExtractionStrategy()
-            extraction_strategy.verbose = verbose
-            if not isinstance(extraction_strategy, ExtractionStrategy):
-                raise ValueError("Unsupported extraction strategy")
-            if not isinstance(chunking_strategy, ChunkingStrategy):
-                raise ValueError("Unsupported chunking strategy")
-            
-            word_count_threshold = max(word_count_threshold, MIN_WORD_THRESHOLD)
-
-            async_response: AsyncCrawlResponse = None
-            cached_result = None
-            screenshot_data = None
-            extracted_content = None
-            
-            start_time = time.perf_counter()
-            
-            # Try to get cached result if appropriate
-            if cache_context.should_read():
-                cached_result = await async_db_manager.aget_cached_url(url)
-                        
-            if cached_result:
-                html = sanitize_input_encode(cached_result.html)
-                extracted_content = sanitize_input_encode(cached_result.extracted_content or "")
-                if screenshot:
-                    screenshot_data = cached_result.screenshot
-                    if not screenshot_data:
-                        cached_result = None
-                # if verbose:
-                #     print(f"{Fore.BLUE}{self.tag_format('FETCH')} {self.log_icons['FETCH']} Cache hit for {cache_context.display_url} | Status: {Fore.GREEN if bool(html) else Fore.RED}{bool(html)}{Style.RESET_ALL} | Time: {time.perf_counter() - start_time:.2f}s")
-                self.logger.url_status(
+                    html = sanitize_input_encode(async_response.html)
+                    screenshot_data = async_response.screenshot
+                    t2 = time.perf_counter()
+                    self.logger.url_status(
                         url=cache_context.display_url,
                         success=bool(html),
-                        timing=time.perf_counter() - start_time,
+                        timing=t2 - t1,
                         tag="FETCH"
-                    )                    
+                    )
+                    # if verbose:
+                    #     print(f"{Fore.BLUE}{self.tag_format('FETCH')} {self.log_icons['FETCH']} Live fetch for {cache_context.display_url}... | Status: {Fore.GREEN if bool(html) else Fore.RED}{bool(html)}{Style.RESET_ALL} | Time: {t2 - t1:.2f}s")
 
-
-            # Fetch fresh content if needed
-            if not cached_result or not html:
-                t1 = time.perf_counter()
+                # Process the HTML content
+                crawl_result = await self.aprocess_html(
+                    url=url,
+                    html=html,
+                    extracted_content=extracted_content,
+                    word_count_threshold=word_count_threshold,
+                    extraction_strategy=extraction_strategy,
+                    chunking_strategy=chunking_strategy,
+                    content_filter=content_filter,
+                    css_selector=css_selector,
+                    screenshot=screenshot_data,
+                    verbose=verbose,
+                    is_cached=bool(cached_result),
+                    async_response=async_response,
+                    is_web_url=cache_context.is_web_url,
+                    is_local_file=cache_context.is_local_file,
+                    is_raw_html=cache_context.is_raw_html,
+                    **kwargs,
+                )
                 
-                if user_agent:
-                    self.crawler_strategy.update_user_agent(user_agent)
-                async_response: AsyncCrawlResponse = await self.crawler_strategy.crawl(
-                    url, 
-                    screenshot=screenshot, 
-                    **kwargs
-                )
-                html = sanitize_input_encode(async_response.html)
-                screenshot_data = async_response.screenshot
-                t2 = time.perf_counter()
-                self.logger.url_status(
-                    url=cache_context.display_url,
-                    success=bool(html),
-                    timing=t2 - t1,
-                    tag="FETCH"
-                )
+                # Set response data
+                if async_response:
+                    crawl_result.status_code = async_response.status_code
+                    crawl_result.response_headers = async_response.response_headers
+                    crawl_result.downloaded_files = async_response.downloaded_files
+                else:
+                    crawl_result.status_code = 200
+                    crawl_result.response_headers = cached_result.response_headers if cached_result else {}
+
+                crawl_result.success = bool(html)
+                crawl_result.session_id = kwargs.get("session_id", None)
+
                 # if verbose:
-                #     print(f"{Fore.BLUE}{self.tag_format('FETCH')} {self.log_icons['FETCH']} Live fetch for {cache_context.display_url}... | Status: {Fore.GREEN if bool(html) else Fore.RED}{bool(html)}{Style.RESET_ALL} | Time: {t2 - t1:.2f}s")
+                #     print(f"{Fore.GREEN}{self.tag_format('COMPLETE')} {self.log_icons['COMPLETE']} {cache_context.display_url[:URL_LOG_SHORTEN_LENGTH]}... | Status: {Fore.GREEN if crawl_result.success else Fore.RED}{crawl_result.success} | {Fore.YELLOW}Total: {time.perf_counter() - start_time:.2f}s{Style.RESET_ALL}")
+                self.logger.success(
+                        message="{url:.50}... | Status: {status} | Total: {timing}",
+                        tag="COMPLETE",
+                        params={
+                            "url": cache_context.display_url,
+                            "status": crawl_result.success,
+                            "timing": f"{time.perf_counter() - start_time:.2f}s"
+                        },
+                        colors={
+                            "status": Fore.GREEN if crawl_result.success else Fore.RED,
+                            "timing": Fore.YELLOW
+                        }
+                    )
 
-            # Process the HTML content
-            crawl_result = await self.aprocess_html(
-                url=url,
-                html=html,
-                extracted_content=extracted_content,
-                word_count_threshold=word_count_threshold,
-                extraction_strategy=extraction_strategy,
-                chunking_strategy=chunking_strategy,
-                content_filter=content_filter,
-                css_selector=css_selector,
-                screenshot=screenshot_data,
-                verbose=verbose,
-                is_cached=bool(cached_result),
-                async_response=async_response,
-                is_web_url=cache_context.is_web_url,
-                is_local_file=cache_context.is_local_file,
-                is_raw_html=cache_context.is_raw_html,
-                **kwargs,
-            )
+                # Update cache if appropriate
+                if cache_context.should_write() and not bool(cached_result):
+                    await async_db_manager.acache_url(crawl_result)
+
+                return crawl_result
             
-            # Set response data
-            if async_response:
-                crawl_result.status_code = async_response.status_code
-                crawl_result.response_headers = async_response.response_headers
-                crawl_result.downloaded_files = async_response.downloaded_files
-            else:
-                crawl_result.status_code = 200
-                crawl_result.response_headers = cached_result.response_headers if cached_result else {}
-
-            crawl_result.success = bool(html)
-            crawl_result.session_id = kwargs.get("session_id", None)
-
-            # if verbose:
-            #     print(f"{Fore.GREEN}{self.tag_format('COMPLETE')} {self.log_icons['COMPLETE']} {cache_context.display_url[:URL_LOG_SHORTEN_LENGTH]}... | Status: {Fore.GREEN if crawl_result.success else Fore.RED}{crawl_result.success} | {Fore.YELLOW}Total: {time.perf_counter() - start_time:.2f}s{Style.RESET_ALL}")
-            self.logger.success(
-                    message="{url:.50}... | Status: {status} | Total: {timing}",
-                    tag="COMPLETE",
-                    params={
-                        "url": cache_context.display_url,
-                        "status": crawl_result.success,
-                        "timing": f"{time.perf_counter() - start_time:.2f}s"
-                    },
-                    colors={
-                        "status": Fore.GREEN if crawl_result.success else Fore.RED,
-                        "timing": Fore.YELLOW
-                    }
+            except Exception as e:
+                if not hasattr(e, "msg"):
+                    e.msg = str(e)
+                # print(f"{Fore.RED}{self.tag_format('ERROR')} {self.log_icons['ERROR']} Failed to crawl {cache_context.display_url[:URL_LOG_SHORTEN_LENGTH]}... | {e.msg}{Style.RESET_ALL}")
+                
+                self.logger.error_status(
+                    url=cache_context.display_url,
+                    error=create_box_message(e.msg, type = "error"),
+                    tag="ERROR"
+                )            
+                return CrawlResult(
+                    url=url, 
+                    html="", 
+                    success=False, 
+                    error_message=e.msg
                 )
 
-            # Update cache if appropriate
-            if cache_context.should_write() and not bool(cached_result):
-                await async_db_manager.acache_url(crawl_result)
-
-            return crawl_result
-        
-        except Exception as e:
-            if not hasattr(e, "msg"):
-                e.msg = str(e)
-            # print(f"{Fore.RED}{self.tag_format('ERROR')} {self.log_icons['ERROR']} Failed to crawl {cache_context.display_url[:URL_LOG_SHORTEN_LENGTH]}... | {e.msg}{Style.RESET_ALL}")
-            
-            self.logger.error_status(
-                url=cache_context.display_url,
-                error=create_box_message(e.msg, type = "error"),
-                tag="ERROR"
-            )            
-            return CrawlResult(
-                url=url, 
-                html="", 
-                success=False, 
-                error_message=e.msg
-            )
-
     async def arun_many(
         self,
         urls: List[str],

From b02544bc0bf1dac897adec6bb0de730e5b7f3ccd Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Tue, 3 Dec 2024 21:28:52 +0800
Subject: [PATCH 114/115] docs: update README and blog for version 0.4.0
 release, highlighting new features and improvements

---
 README.md                         | 22 +++++++----
 docs/md_v2/blog/index.md          | 28 ++++++++++++++
 docs/md_v2/blog/releases/0.4.0.md | 62 +++++++++++++++++++++++++++++++
 mkdocs.yml                        | 14 ++++---
 4 files changed, 113 insertions(+), 13 deletions(-)
 create mode 100644 docs/md_v2/blog/index.md
 create mode 100644 docs/md_v2/blog/releases/0.4.0.md

diff --git a/README.md b/README.md
index d70af8ad..cbeb4067 100644
--- a/README.md
+++ b/README.md
@@ -11,7 +11,10 @@
 
 Crawl4AI is the #1 trending GitHub repository, actively maintained by a vibrant community. It delivers blazing-fast, AI-ready web crawling tailored for LLMs, AI agents, and data pipelines. Open source, flexible, and built for real-time performance, Crawl4AI empowers developers with unmatched speed, precision, and deployment ease.  
 
-[✨ Check out latest update v0.3.745](#-recent-updates)
+
+🎉 **Version 0.4.0 is out!** Introducing our experimental PruningContentFilter - a powerful new algorithm for smarter Markdown generation. Test it out and [share your feedback](https://github.com/unclecode/crawl4ai/issues)! [Read the release notes →](https://github.com/unclecode/crawl4ai/blob/main/docs/md_v2/blog/releases/0.4.0.md)
+
+[✨ Check out latest update v0.4.0](#-recent-updates)
 
 ## 🧐 Why Crawl4AI?
 
@@ -623,18 +626,21 @@ async def test_news_crawl():
 
 ## ✨ Recent Updates   
 
-- 🚀 **Improved ManagedBrowser Configuration**: Dynamic host and port support for more flexible browser management.  
-- 📝 **Enhanced Markdown Generation**: New generator class for better formatting and customization.  
-- ⚡ **Fast HTML Formatting**: Significantly optimized HTML formatting in the web crawler.  
-- 🛠️ **Utility & Sanitization Upgrades**: Improved sanitization and expanded utility functions for streamlined workflows.  
-- 👥 **Acknowledgments**: Added contributor details and pull request acknowledgments for better transparency.  
+- 🔬 **PruningContentFilter**: New unsupervised filtering strategy for intelligent content extraction based on text density and relevance scoring.
+- 🧵 **Enhanced Thread Safety**: Improved multi-threaded environment handling with better locks and parallel processing support.
+- 🤖 **Smart User-Agent Generation**: Advanced user-agent generator with customization options and randomization capabilities.
+- 📝 **New Blog Launch**: Stay updated with our detailed release notes and technical deep dives at [crawl4ai.com/blog](https://crawl4ai.com/blog).
+- 🧪 **Expanded Test Coverage**: Comprehensive test suite for both PruningContentFilter and BM25ContentFilter with edge case handling.
 
+Read the full details of this release in our [0.4.0 Release Notes](https://github.com/unclecode/crawl4ai/blob/main/docs/md_v2/blog/releases/0.4.0.md).
 
 ## 📖 Documentation & Roadmap 
 
-For detailed documentation, including installation instructions, advanced features, and API reference, visit our [Documentation Website](https://crawl4ai.com/mkdocs/).
+> 🚨 **Documentation Update Alert**: We're undertaking a major documentation overhaul next week to reflect recent updates and improvements. Stay tuned for a more comprehensive and up-to-date guide!
 
-Moreover to check our development plans and upcoming features, check out our [Roadmap](https://github.com/unclecode/crawl4ai/blob/main/ROADMAP.md).
+For current documentation, including installation instructions, advanced features, and API reference, visit our [Documentation Website](https://crawl4ai.com/mkdocs/).
+
+To check our development plans and upcoming features, visit our [Roadmap](https://github.com/unclecode/crawl4ai/blob/main/ROADMAP.md).
 
 <details>
 <summary>📈 <strong>Development TODOs</strong></summary>
diff --git a/docs/md_v2/blog/index.md b/docs/md_v2/blog/index.md
new file mode 100644
index 00000000..054b12f8
--- /dev/null
+++ b/docs/md_v2/blog/index.md
@@ -0,0 +1,28 @@
+# Crawl4AI Blog
+
+Welcome to the Crawl4AI blog! Here you'll find detailed release notes, technical deep dives, and news about the project.
+
+## Latest Release
+
+### [0.4.0 - Major Content Filtering Update](releases/0.4.0.md)
+*December 1, 2024*
+
+Introducing significant improvements to content filtering, multi-threaded environment handling, and user-agent generation. This release features the new PruningContentFilter, enhanced thread safety, and improved test coverage.
+
+[Read full release notes →](releases/0.4.0.md)
+
+## Project History
+
+Want to see how we got here? Check out our [complete changelog](https://github.com/unclecode/crawl4ai/blob/main/CHANGELOG.md) covering all previous versions and the evolution of Crawl4AI.
+
+## Categories
+
+- [Technical Deep Dives](/blog/technical) - Coming soon
+- [Tutorials & Guides](/blog/tutorials) - Coming soon
+- [Community Updates](/blog/community) - Coming soon
+
+## Stay Updated
+
+- Star us on [GitHub](https://github.com/unclecode/crawl4ai)
+- Follow [@unclecode](https://twitter.com/unclecode) on Twitter
+- Join our community discussions on GitHub
diff --git a/docs/md_v2/blog/releases/0.4.0.md b/docs/md_v2/blog/releases/0.4.0.md
new file mode 100644
index 00000000..0e7ee5df
--- /dev/null
+++ b/docs/md_v2/blog/releases/0.4.0.md
@@ -0,0 +1,62 @@
+# Release Summary for Version 0.4.0 (December 1, 2024)
+
+## Overview
+The 0.4.0 release introduces significant improvements to content filtering, multi-threaded environment handling, user-agent generation, and test coverage. Key highlights include the introduction of the PruningContentFilter, designed to automatically identify and extract the most valuable parts of an HTML document, as well as enhancements to the BM25ContentFilter to extend its versatility and effectiveness.
+
+## Major Features and Enhancements
+
+### 1. PruningContentFilter
+- Introduced a new unsupervised content filtering strategy that scores and prunes less relevant nodes in an HTML document based on metrics like text and link density.
+- Focuses on retaining the most valuable parts of the content, making it highly effective for extracting relevant information from complex web pages.
+- Fully documented with updated README and expanded user guides.
+
+### 2. User-Agent Generator
+- Added a user-agent generator utility that resolves compatibility issues and supports customizable user-agent strings.
+- By default, the generator randomizes user agents for each request, adding diversity, but users can customize it for tailored scenarios.
+
+### 3. Enhanced Thread Safety
+- Improved handling of multi-threaded environments by adding better thread locks for parallel processing, ensuring consistency and stability when running multiple threads.
+
+### 4. Extended Content Filtering Strategies
+- Users now have access to both the PruningContentFilter for unsupervised extraction and the BM25ContentFilter for supervised filtering based on user queries.
+- Enhanced BM25ContentFilter with improved capabilities to process page titles, meta tags, and descriptions, allowing for more effective classification and clustering of text chunks.
+
+### 5. Documentation Updates
+- Updated examples and tutorials to promote the use of the PruningContentFilter alongside the BM25ContentFilter, providing clear instructions for selecting the appropriate filter for each use case.
+
+### 6. Unit Test Enhancements
+- Added unit tests for PruningContentFilter to ensure accuracy and reliability.
+- Enhanced BM25ContentFilter tests to cover additional edge cases and performance metrics, particularly for malformed HTML inputs.
+
+## Revised Change Logs for Version 0.4.0
+
+### PruningContentFilter (Dec 01, 2024)
+- Introduced the PruningContentFilter to optimize content extraction by pruning less relevant HTML nodes.
+  - **Affected Files:**
+    - **crawl4ai/content_filter_strategy.py**: Added a scoring-based pruning algorithm.
+    - **README.md**: Updated to include PruningContentFilter usage.
+    - **docs/md_v2/basic/content_filtering.md**: Expanded user documentation, detailing the use and benefits of PruningContentFilter.
+
+### Unit Tests for PruningContentFilter (Dec 01, 2024)
+- Added comprehensive unit tests for PruningContentFilter to ensure correctness and efficiency.
+  - **Affected Files:**
+    - **tests/async/test_content_filter_prune.py**: Created tests covering different pruning scenarios to ensure stability and correctness.
+
+### Enhanced BM25ContentFilter Tests (Dec 01, 2024)
+- Expanded tests to cover additional extraction scenarios and performance metrics, improving robustness.
+  - **Affected Files:**
+    - **tests/async/test_content_filter_bm25.py**: Added tests for edge cases, including malformed HTML inputs.
+
+### Documentation and Example Updates (Dec 01, 2024)
+- Revised examples to illustrate the use of PruningContentFilter alongside existing content filtering methods.
+  - **Affected Files:**
+    - **docs/examples/quickstart_async.py**: Enhanced example clarity and usability for new users.
+
+## Experimental Features
+- The PruningContentFilter is still under experimental development, and we continue to gather feedback for further refinements.
+
+## Conclusion
+This release significantly enhances the content extraction capabilities of Crawl4AI with the introduction of the PruningContentFilter, improved supervised filtering with BM25ContentFilter, and robust multi-threaded handling. Additionally, the user-agent generator provides much-needed versatility, resolving compatibility issues faced by many users.
+
+Users are encouraged to experiment with the new content filtering methods to determine which best suits their needs.
+
diff --git a/mkdocs.yml b/mkdocs.yml
index 1b26b9df..4ba7c2a7 100644
--- a/mkdocs.yml
+++ b/mkdocs.yml
@@ -10,7 +10,11 @@ nav:
   - 'Installation': 'basic/installation.md'
   - 'Docker Deplotment': 'basic/docker-deploymeny.md'
   - 'Quick Start': 'basic/quickstart.md'
-  
+  - Changelog & Blog:
+    - 'Blog Home': 'blog/index.md'
+    - 'Latest (0.4.0)': 'blog/releases/0.4.0.md'
+    - 'Changelog': 'https://github.com/unclecode/crawl4ai/blob/main/CHANGELOG.md'
+
   - Basic:
     - 'Simple Crawling': 'basic/simple-crawling.md'
     - 'Output Formats': 'basic/output-formats.md'
@@ -50,12 +54,12 @@ nav:
     - '5. Dynamic Content': 'tutorial/episode_05_JavaScript_Execution_and_Dynamic_Content_Handling.md'
     - '6. Magic Mode': 'tutorial/episode_06_Magic_Mode_and_Anti-Bot_Protection.md'
     - '7. Content Cleaning': 'tutorial/episode_07_Content_Cleaning_and_Fit_Markdown.md'
-    - '8. Media Handling': 'tutorial/episode_08_Media_Handling:_Images,_Videos,_and_Audio.md'
+    - '8. Media Handling': 'tutorial/episode_08_Media_Handling_Images_Videos_and_Audio.md'
     - '9. Link Analysis': 'tutorial/episode_09_Link_Analysis_and_Smart_Filtering.md'
     - '10. User Simulation': 'tutorial/episode_10_Custom_Headers,_Identity,_and_User_Simulation.md'
-    - '11.1. JSON CSS': 'tutorial/episode_11_1_Extraction_Strategies:_JSON_CSS.md'
-    - '11.2. LLM Strategy': 'tutorial/episode_11_2_Extraction_Strategies:_LLM.md'
-    - '11.3. Cosine Strategy': 'tutorial/episode_11_3_Extraction_Strategies:_Cosine.md'
+    - '11.1. JSON CSS': 'tutorial/episode_11_1_Extraction_Strategies_JSON_CSS.md'
+    - '11.2. LLM Strategy': 'tutorial/episode_11_2_Extraction_Strategies_LLM.md'
+    - '11.3. Cosine Strategy': 'tutorial/episode_11_3_Extraction_Strategies_Cosine.md'
     - '12. Session Crawling': 'tutorial/episode_12_Session-Based_Crawling_for_Dynamic_Websites.md'
     - '13. Text Chunking': 'tutorial/episode_13_Chunking_Strategies_for_Large_Text_Processing.md'
     - '14. Custom Workflows': 'tutorial/episode_14_Hooks_and_Custom_Workflow_with_AsyncWebCrawler.md'

From 486db3a7713e6ffb22dc378c989b67bdc57fff74 Mon Sep 17 00:00:00 2001
From: UncleCode <unclecode@kidocode.com>
Date: Wed, 4 Dec 2024 20:26:39 +0800
Subject: [PATCH 115/115] Updated to version 0.4.0 with new features

- Enhanced error handling in async crawler.
- Added flexible options in Markdown generation.
- Updated user agent settings for improved reliability.
- Reflected changes in documentation and examples.

---
 crawl4ai/__version__.py                  |  2 +-
 crawl4ai/async_crawler_strategy.py       | 19 ++++++++-
 crawl4ai/markdown_generation_strategy.py | 12 ++++--
 crawl4ai/user_agent_generator.py         |  1 +
 docs/examples/quickstart_async.py        | 51 +++++++++++++++++++-----
 5 files changed, 69 insertions(+), 16 deletions(-)

diff --git a/crawl4ai/__version__.py b/crawl4ai/__version__.py
index 189a2955..6f8b06f4 100644
--- a/crawl4ai/__version__.py
+++ b/crawl4ai/__version__.py
@@ -1,2 +1,2 @@
 # crawl4ai/_version.py
-__version__ = "0.3.747"
+__version__ = "0.4.0"
diff --git a/crawl4ai/async_crawler_strategy.py b/crawl4ai/async_crawler_strategy.py
index 3d24bd84..493597ea 100644
--- a/crawl4ai/async_crawler_strategy.py
+++ b/crawl4ai/async_crawler_strategy.py
@@ -6,6 +6,7 @@ from typing import Callable, Dict, Any, List, Optional, Awaitable
 import os, sys, shutil
 import tempfile, subprocess
 from playwright.async_api import async_playwright, Page, Browser, Error
+from playwright.async_api import TimeoutError as PlaywrightTimeoutError
 from io import BytesIO
 from PIL import Image, ImageDraw, ImageFont
 from pathlib import Path
@@ -223,6 +224,7 @@ class AsyncPlaywrightCrawlerStrategy(AsyncCrawlerStrategy):
         self.use_cached_html = use_cached_html
         self.user_agent = kwargs.get(
             "user_agent",
+            # "Mozilla/5.0 (Macintosh; Intel Mac OS X 10.15; rv:109.0) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/116.0.5845.187 Safari/604.1 Edg/117.0.2045.47"
             "Mozilla/5.0 (Linux; Android 11; SM-G973F) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/91.0.4472.120 Mobile Safari/537.36"
         )
         user_agenr_generator = UserAgentGenerator()
@@ -941,11 +943,24 @@ class AsyncPlaywrightCrawlerStrategy(AsyncCrawlerStrategy):
                 });
             }
             """
+            
             try:
-                await page.wait_for_load_state()
+                try:
+                    await page.wait_for_load_state(
+                        # state="load",
+                        state="domcontentloaded",
+                        timeout=5
+                    )
+                except PlaywrightTimeoutError:
+                    pass
                 await page.evaluate(update_image_dimensions_js)
             except Exception as e:
-                raise RuntimeError(f"Error updating image dimensions ACS-UPDATE_IMAGE_DIMENSIONS_JS: {str(e)}")
+                self.logger.error(
+                    message="Error updating image dimensions ACS-UPDATE_IMAGE_DIMENSIONS_JS: {error}",
+                    tag="ERROR",
+                    params={"error": str(e)}
+                )
+                # raise RuntimeError(f"Error updating image dimensions ACS-UPDATE_IMAGE_DIMENSIONS_JS: {str(e)}")
 
             # Wait a bit for any onload events to complete
             await page.wait_for_timeout(100)
diff --git a/crawl4ai/markdown_generation_strategy.py b/crawl4ai/markdown_generation_strategy.py
index f242054d..1e0ca664 100644
--- a/crawl4ai/markdown_generation_strategy.py
+++ b/crawl4ai/markdown_generation_strategy.py
@@ -11,8 +11,9 @@ LINK_PATTERN = re.compile(r'!?\[([^\]]+)\]\(([^)]+?)(?:\s+"([^"]*)")?\)')
 
 class MarkdownGenerationStrategy(ABC):
     """Abstract base class for markdown generation strategies."""
-    def __init__(self, content_filter: Optional[RelevantContentFilter] = None):
+    def __init__(self, content_filter: Optional[RelevantContentFilter] = None, options: Optional[Dict[str, Any]] = None):
         self.content_filter = content_filter
+        self.options = options or {}
     
     @abstractmethod
     def generate_markdown(self, 
@@ -27,8 +28,8 @@ class MarkdownGenerationStrategy(ABC):
 
 class DefaultMarkdownGenerator(MarkdownGenerationStrategy):
     """Default implementation of markdown generation strategy."""
-    def __init__(self, content_filter: Optional[RelevantContentFilter] = None):
-        super().__init__(content_filter)
+    def __init__(self, content_filter: Optional[RelevantContentFilter] = None, options: Optional[Dict[str, Any]] = None):
+        super().__init__(content_filter, options)
     
     def convert_links_to_citations(self, markdown: str, base_url: str = "") -> Tuple[str, str]:
         link_map = {}
@@ -74,6 +75,7 @@ class DefaultMarkdownGenerator(MarkdownGenerationStrategy):
                          cleaned_html: str, 
                          base_url: str = "",
                          html2text_options: Optional[Dict[str, Any]] = None,
+                         options: Optional[Dict[str, Any]] = None,
                          content_filter: Optional[RelevantContentFilter] = None,
                          citations: bool = True,
                          **kwargs) -> MarkdownGenerationResult:
@@ -82,6 +84,10 @@ class DefaultMarkdownGenerator(MarkdownGenerationStrategy):
         h = CustomHTML2Text()
         if html2text_options:
             h.update_params(**html2text_options)
+        elif options:
+            h.update_params(**options)
+        elif self.options:
+            h.update_params(**self.options)
 
         # Generate raw markdown
         raw_markdown = h.handle(cleaned_html)
diff --git a/crawl4ai/user_agent_generator.py b/crawl4ai/user_agent_generator.py
index 0a4df0bb..a1f3a49e 100644
--- a/crawl4ai/user_agent_generator.py
+++ b/crawl4ai/user_agent_generator.py
@@ -236,6 +236,7 @@ class UserAgentGenerator:
 # Example usage:
 if __name__ == "__main__":
     generator = UserAgentGenerator()
+    print(generator.generate())
     
     print("\nSingle browser (Chrome):")
     print(generator.generate(num_browsers=1, browser_type='chrome'))
diff --git a/docs/examples/quickstart_async.py b/docs/examples/quickstart_async.py
index 73d695c3..176b0ba7 100644
--- a/docs/examples/quickstart_async.py
+++ b/docs/examples/quickstart_async.py
@@ -547,19 +547,50 @@ async def generate_knowledge_graph():
             f.write(result.extracted_content)
 
 async def fit_markdown_remove_overlay():
-    async with AsyncWebCrawler(headless = False) as crawler:
-        url = "https://janineintheworld.com/places-to-visit-in-central-mexico"
+    async with AsyncWebCrawler(
+            headless=True,  # Set to False to see what is happening
+            verbose=True,
+            user_agent_mode="random",
+            user_agent_generator_config={
+                "device_type": "mobile",
+                "os_type": "android"
+            },
+    ) as crawler:
         result = await crawler.arun(
-            url=url,
+            url='https://www.kidocode.com/degrees/technology',
             cache_mode=CacheMode.BYPASS,
-            word_count_threshold = 10,
-            remove_overlay_elements=True,
-            screenshot = True
+            markdown_generator=DefaultMarkdownGenerator(
+                content_filter=PruningContentFilter(threshold=0.48, threshold_type="fixed", min_word_threshold=0),
+                options={
+                    "ignore_links": True
+                }
+            ),
+            # markdown_generator=DefaultMarkdownGenerator(
+            #     content_filter=BM25ContentFilter(user_query=None, bm25_threshold=1.0),
+            #     options={
+            #         "ignore_links": True
+            #     }
+            # ),
         )
-        # Save markdown to file
-        with open(os.path.join(__location__, "mexico_places.md"), "w") as f:
-            f.write(result.fit_markdown)
-
+        
+        if result.success:
+            print(len(result.markdown_v2.raw_markdown))
+            print(len(result.markdown_v2.markdown_with_citations))
+            print(len(result.markdown_v2.fit_markdown))
+            
+            # Save clean html
+            with open(os.path.join(__location__, "output/cleaned_html.html"), "w") as f:
+                f.write(result.cleaned_html)
+            
+            with open(os.path.join(__location__, "output/output_raw_markdown.md"), "w") as f:
+                f.write(result.markdown_v2.raw_markdown)
+                
+            with open(os.path.join(__location__, "output/output_markdown_with_citations.md"), "w") as f:
+                f.write(result.markdown_v2.markdown_with_citations) 
+                
+            with open(os.path.join(__location__, "output/output_fit_markdown.md"), "w") as f:   
+                f.write(result.markdown_v2.fit_markdown)
+        
     print("Done")