Apply Ruff Corrections

2025-01-13 19:19:58 +08:00
parent c3370ec5da
commit 8ec12d7d68
84 changed files with 6861 additions and 5076 deletions
--- a/docs/examples/rest_call.py
+++ b/docs/examples/rest_call.py
@@ -1,4 +1,3 @@
-
 import requests, base64, os

 data = {
@@ -6,59 +5,50 @@ data = {
    "screenshot": True,
 }

-response = requests.post("https://crawl4ai.com/crawl", json=data) 
-result = response.json()['results'][0]
+response = requests.post("https://crawl4ai.com/crawl", json=data)
+result = response.json()["results"][0]
 print(result.keys())
-# dict_keys(['url', 'html', 'success', 'cleaned_html', 'media', 
-# 'links', 'screenshot', 'markdown', 'extracted_content', 
+# dict_keys(['url', 'html', 'success', 'cleaned_html', 'media',
+# 'links', 'screenshot', 'markdown', 'extracted_content',
 # 'metadata', 'error_message'])
 with open("screenshot.png", "wb") as f:
-    f.write(base64.b64decode(result['screenshot']))
-    
+    f.write(base64.b64decode(result["screenshot"]))
+
 # Example of filtering the content using CSS selectors
 data = {
-    "urls": [
-        "https://www.nbcnews.com/business"
-    ],
+    "urls": ["https://www.nbcnews.com/business"],
    "css_selector": "article",
    "screenshot": True,
 }

 # Example of executing a JS script on the page before extracting the content
 data = {
-    "urls": [
-        "https://www.nbcnews.com/business"
-    ],
+    "urls": ["https://www.nbcnews.com/business"],
    "screenshot": True,
-    'js' : ["""
+    "js": [
+        """
    const loadMoreButton = Array.from(document.querySelectorAll('button')).
    find(button => button.textContent.includes('Load More'));
    loadMoreButton && loadMoreButton.click();
-    """]
+    """
+    ],
 }

 # Example of using a custom extraction strategy
 data = {
-    "urls": [
-        "https://www.nbcnews.com/business"
-    ],
+    "urls": ["https://www.nbcnews.com/business"],
    "extraction_strategy": "CosineStrategy",
-    "extraction_strategy_args": {
-        "semantic_filter": "inflation rent prices"
-    },
+    "extraction_strategy_args": {"semantic_filter": "inflation rent prices"},
 }

 # Example of using LLM to extract content
 data = {
-    "urls": [
-        "https://www.nbcnews.com/business"
-    ],
+    "urls": ["https://www.nbcnews.com/business"],
    "extraction_strategy": "LLMExtractionStrategy",
    "extraction_strategy_args": {
        "provider": "groq/llama3-8b-8192",
        "api_token": os.environ.get("GROQ_API_KEY"),
        "instruction": """I am interested in only financial news, 
-        and translate them in French."""
+        and translate them in French.""",
    },
 }
-