From 5cc58f9bb3ac049df3cb7a2ee31680b3aec30a41 Mon Sep 17 00:00:00 2001 From: Aravind Karnam Date: Fri, 2 May 2025 16:40:58 +0530 Subject: [PATCH] fix: 1. duplicate verbose flag 2. inconsistency in argument name --profile-name 3. duplicate initialisation of env_defaults --- docs/apps/linkdin/c4ai_discover.py | 10 ++++------ 1 file changed, 4 insertions(+), 6 deletions(-) diff --git a/docs/apps/linkdin/c4ai_discover.py b/docs/apps/linkdin/c4ai_discover.py index 82874568..dca2fa69 100644 --- a/docs/apps/linkdin/c4ai_discover.py +++ b/docs/apps/linkdin/c4ai_discover.py @@ -272,7 +272,7 @@ def build_arg_parser() -> argparse.ArgumentParser: parser.add_argument("--title-filters", default="Product,Engineering", help="comma list of job keywords") parser.add_argument("--max-companies", type=int, default=1000) parser.add_argument("--max-people", type=int, default=500) - parser.add_argument("--profile-path", default=str(pathlib.Path.home() / ".crawl4ai/profiles/profile_linkedin_uc")) + parser.add_argument("--profile-name", default=str(pathlib.Path.home() / ".crawl4ai/profiles/profile_linkedin_uc")) parser.add_argument("--outdir", default="./output") parser.add_argument("--concurrency", type=int, default=4) parser.add_argument("--log-level", default="info", choices=["debug", "info", "warn", "error"]) @@ -355,8 +355,7 @@ async def async_main(opts): user_agent_generator_config= { "platforms": "mobile", "os": "Android" - }, - verbose=False, + } ) crawler = AsyncWebCrawler(config=bc) @@ -366,7 +365,7 @@ async def async_main(opts): # crawler = await next_crawler().start() try: # Build LinkedIn search URL - search_url = f"https://www.linkedin.com/search/results/companies/?keywords={quote(opts.query)}&geoUrn={opts.geo}" + search_url = f'https://www.linkedin.com/search/results/companies/?keywords={quote(opts.query)}&companyHqGeo="{opts.geo}"' logging.info("Seed URL => %s", search_url) companies: List[Dict] = [] @@ -425,14 +424,13 @@ def main(): if cli_opts.debug: opts = 
detect_debug_defaults(force=True) else: - env_defaults = detect_debug_defaults() env_defaults = detect_debug_defaults() opts = env_defaults if env_defaults else cli_opts if not getattr(opts, "cmd", None): opts.cmd = "full" - exit_code = asyncio.run(async_main(opts)) + exit_code = asyncio.run(async_main(cli_opts)) sys.exit(exit_code)