Apply Ruff Corrections

2025-01-13 19:19:58 +08:00
parent c3370ec5da
commit 8ec12d7d68
84 changed files with 6861 additions and 5076 deletions
--- a/tests/async/test_content_extraction.py
+++ b/tests/async/test_content_extraction.py
@@ -1,8 +1,6 @@
 import os
 import sys
 import pytest
-import asyncio
-import json

 # Add the parent directory to the Python path
 parent_dir = os.path.dirname(os.path.dirname(os.path.abspath(__file__)))
@@ -10,6 +8,7 @@ sys.path.append(parent_dir)

 from crawl4ai.async_webcrawler import AsyncWebCrawler

+
@pytest.mark.asyncio
 async def test_extract_markdown():
    async with AsyncWebCrawler(verbose=True) as crawler:
@@ -20,6 +19,7 @@ async def test_extract_markdown():
        assert isinstance(result.markdown, str)
        assert len(result.markdown) > 0

+
@pytest.mark.asyncio
 async def test_extract_cleaned_html():
    async with AsyncWebCrawler(verbose=True) as crawler:
@@ -30,6 +30,7 @@ async def test_extract_cleaned_html():
        assert isinstance(result.cleaned_html, str)
        assert len(result.cleaned_html) > 0

+
@pytest.mark.asyncio
 async def test_extract_media():
    async with AsyncWebCrawler(verbose=True) as crawler:
@@ -46,6 +47,7 @@ async def test_extract_media():
            assert "alt" in image
            assert "type" in image

+
@pytest.mark.asyncio
 async def test_extract_links():
    async with AsyncWebCrawler(verbose=True) as crawler:
@@ -63,6 +65,7 @@ async def test_extract_links():
            assert "href" in link
            assert "text" in link

+
@pytest.mark.asyncio
 async def test_extract_metadata():
    async with AsyncWebCrawler(verbose=True) as crawler:
@@ -75,16 +78,20 @@ async def test_extract_metadata():
        assert "title" in metadata
        assert isinstance(metadata["title"], str)

+
@pytest.mark.asyncio
 async def test_css_selector_extraction():
    async with AsyncWebCrawler(verbose=True) as crawler:
        url = "https://www.nbcnews.com/business"
        css_selector = "h1, h2, h3"
-        result = await crawler.arun(url=url, bypass_cache=True, css_selector=css_selector)
+        result = await crawler.arun(
+            url=url, bypass_cache=True, css_selector=css_selector
+        )
        assert result.success
        assert result.markdown
        assert all(heading in result.markdown for heading in ["#", "##", "###"])

+
 # Entry point for debugging
 if __name__ == "__main__":
-    pytest.main([__file__, "-v"])
+    pytest.main([__file__, "-v"])