Feat/llm config (#724)

* feature: Add LlmConfig to easily configure and pass LLM configs to different strategies * pulled in next branch and resolved conflicts * feat: Add gemini and deepseek providers. Make ignore_cache in llm content filter to true by default to avoid confusions * Refactor: Update LlmConfig in LLMExtractionStrategy class and deprecate old params * updated tests, docs and readme
2025-02-21 13:11:37 +05:30
parent 3cb28875c3
commit 2af958e12c
25 changed files with 420 additions and 240 deletions
--- a/tests/docker/test_docker.py
+++ b/tests/docker/test_docker.py
@@ -7,6 +7,7 @@ from crawl4ai import (
    BrowserConfig, CrawlerRunConfig, DefaultMarkdownGenerator,
    PruningContentFilter, JsonCssExtractionStrategy, LLMContentFilter, CacheMode
 )
+from crawl4ai.async_configs import LlmConfig
 from crawl4ai.docker_client import Crawl4aiDockerClient

 class Crawl4AiTester:
@@ -142,7 +143,7 @@ async def test_with_client():
            cache_mode=CacheMode.BYPASS,
            markdown_generator=DefaultMarkdownGenerator(
                content_filter=LLMContentFilter(
-                    provider="openai/gpt-40",
+                    llmConfig=LlmConfig(provider="openai/gpt-40"),
                    instruction="Extract key technical concepts"
                )
            ),