refactor(cli): improve CLI default command handling

Make 'crawl' the default command when no command is specified. This improves user experience by allowing direct URL input without explicitly specifying the 'crawl' command. Also removes unnecessary blank lines in example code for better readability.
2025-03-04 20:28:16 +08:00
parent cbef406f9b
commit 56bc3c6e45
3 changed files with 9 additions and 9 deletions
--- a/crawl4ai/cli.py
+++ b/crawl4ai/cli.py
@@ -712,7 +712,7 @@ def profiles_cmd():
    # Run interactive profile manager
    anyio.run(manage_profiles)

-@cli.command()
+@cli.command(name="")
@click.argument("url", required=False)
@click.option("--example", is_flag=True, help="Show usage examples")
@click.option("--browser-config", "-B", type=click.Path(exists=True), help="Browser config file (YAML/JSON)")
@@ -772,5 +772,11 @@ def default(url: str, example: bool, browser_config: str, crawler_config: str, f
        profile=profile
    )

+def main():
+    import sys
+    if len(sys.argv) < 2 or sys.argv[1] not in cli.commands:
+        sys.argv.insert(1, "crawl")
+    cli()
+
 if __name__ == "__main__":
-    cli()
+    main()
--- a/docs/examples/deepcrawl_example.py
+++ b/docs/examples/deepcrawl_example.py
@@ -65,7 +65,6 @@ async def basic_deep_crawl():
            f"\n✅ Performance: {len(results)} pages in {time.perf_counter() - start_time:.2f} seconds"
        )

-
 # 2️⃣ Stream vs. Non-Stream Execution
 async def stream_vs_nonstream():
    """
@@ -127,7 +126,6 @@ async def stream_vs_nonstream():
        print(f"  ✅ All results: {time.perf_counter() - start_time:.2f} seconds")
        print("\n🔍 Key Takeaway: Streaming allows processing results immediately")

-
 # 3️⃣ Introduce Filters & Scorers
 async def filters_and_scorers():
    """
@@ -236,7 +234,6 @@ async def filters_and_scorers():
        print(f"  ✅ Crawler prioritized {len(results)} pages by relevance score")
        print("  🔍 Note: BestFirstCrawlingStrategy visits highest-scoring pages first")

-
 # 4️⃣ Wrap-Up and Key Takeaways
 async def wrap_up():
    """
@@ -307,7 +304,6 @@ async def wrap_up():
    for depth, count in sorted(depth_counts.items()):
        print(f"  Depth {depth}: {count} pages")

-
 # 5️⃣ Advanced Filters
 async def advanced_filters():
    """
@@ -371,7 +367,6 @@ async def advanced_filters():
            relevance_score = result.metadata.get("relevance_score", 0)
            print(f"  → Score: {relevance_score:.2f} | {result.url}")

-
 # Main function to run the entire tutorial
 async def max_pages_and_thresholds():
    """
@@ -497,7 +492,6 @@ async def run_tutorial():
    print("You now have a comprehensive understanding of deep crawling with Crawl4AI.")
    print("For more information, check out https://docs.crawl4ai.com")

-
 # Execute the tutorial when run directly
 if __name__ == "__main__":
    asyncio.run(run_tutorial())
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -78,7 +78,7 @@ crawl4ai-download-models = "crawl4ai.model_loader:main"
 crawl4ai-migrate = "crawl4ai.migrations:main"
 crawl4ai-setup = "crawl4ai.install:post_install"
 crawl4ai-doctor = "crawl4ai.install:doctor"
-crwl = "crawl4ai.cli:cli"
+crwl = "crawl4ai.cli:main"

 [tool.setuptools]
 packages = {find = {where = ["."], include = ["crawl4ai*"]}}