Profiling/monitoring: Add interactive monitoring dashboard and integration tests for monitoring endpoints

- Implemented an interactive monitoring dashboard in `demo_monitoring_dashboard.py` for real-time statistics, profiling session management, and system resource monitoring.
- Created a quick test script `test_monitoring_quick.py` to verify the functionality of monitoring endpoints.
- Developed comprehensive integration tests in `test_monitoring_endpoints.py` covering health checks, statistics, profiling sessions, and real-time streaming.
- Added error handling and user-friendly output for better usability in the dashboard.
This commit is contained in:
AHMET YILMAZ
2025-10-16 16:48:13 +08:00
parent 74eeff4c51
commit 3877335d89
7 changed files with 2363 additions and 1 deletions

View File

@@ -58,6 +58,9 @@ from crawl4ai.markdown_generation_strategy import DefaultMarkdownGenerator
from crawl4ai.async_crawler_strategy import AsyncHTTPCrawlerStrategy
from crawl4ai.utils import perform_completion_with_backoff
# Import monitoring/tracking functions
from routers.monitoring import track_crawl_start, track_crawl_end
# Import missing utility functions and types
try:
from utils import (
@@ -665,6 +668,8 @@ async def stream_results(
from utils import datetime_handler
start_time = time.time()
try:
async for result in results_gen:
try:
@@ -681,6 +686,14 @@ async def stream_results(
if result_dict.get("pdf") is not None:
result_dict["pdf"] = b64encode(result_dict["pdf"]).decode("utf-8")
logger.info(f"Streaming result for {result_dict.get('url', 'unknown')}")
# Track each streamed result for monitoring
duration_ms = int((time.time() - start_time) * 1000)
url = result_dict.get('url', 'unknown')
success = result_dict.get('success', False)
bytes_processed = len(str(result_dict.get("markdown", ""))) + len(str(result_dict.get("html", "")))
track_crawl_end(url, success, duration_ms, bytes_processed)
data = json.dumps(result_dict, default=datetime_handler) + "\n"
yield data.encode("utf-8")
except Exception as e:
@@ -721,6 +734,9 @@ async def handle_crawl_request(
dispatcher = None,
) -> dict:
"""Handle non-streaming crawl requests with optional hooks."""
# Track crawl start for monitoring
track_crawl_start()
start_mem_mb = _get_memory_mb() # <--- Get memory before
start_time = time.time()
mem_delta_mb = None
@@ -872,6 +888,15 @@ async def handle_crawl_request(
"server_peak_memory_mb": peak_mem_mb,
}
# Track successful crawl completion for monitoring
duration_ms = int((end_time - start_time) * 1000)
for result in processed_results:
url = result.get("url", "unknown")
success = result.get("success", False)
# Estimate bytes processed (rough approximation based on content length)
bytes_processed = len(str(result.get("markdown", ""))) + len(str(result.get("html", "")))
track_crawl_end(url, success, duration_ms, bytes_processed)
# Add hooks information if hooks were used
if hooks_config and hook_manager:
from hook_manager import UserHookManager
@@ -918,6 +943,11 @@ async def handle_crawl_request(
if start_mem_mb is not None and end_mem_mb_error is not None:
mem_delta_mb = end_mem_mb_error - start_mem_mb
# Track failed crawl for monitoring
duration_ms = int((time.time() - start_time) * 1000)
for url in urls:
track_crawl_end(url, success=False, duration_ms=duration_ms, bytes_processed=0)
raise HTTPException(
status_code=status.HTTP_500_INTERNAL_SERVER_ERROR,
detail=json.dumps(
@@ -947,6 +977,9 @@ async def handle_stream_crawl_request(
dispatcher = None,
) -> Tuple[AsyncWebCrawler, AsyncGenerator, Optional[Dict]]:
"""Handle streaming crawl requests with optional hooks."""
# Track crawl start for monitoring
track_crawl_start()
hooks_info = None
try:
browser_config = BrowserConfig.load(browser_config)

View File

@@ -0,0 +1,746 @@
"""
Monitoring and Profiling Router
Provides endpoints for:
- Browser performance profiling
- Real-time crawler statistics
- System resource monitoring
- Session management
"""
from fastapi import APIRouter, HTTPException, BackgroundTasks, Query
from fastapi.responses import StreamingResponse
from pydantic import BaseModel, Field
from typing import Dict, List, Optional, Any, AsyncGenerator
from datetime import datetime, timedelta
import uuid
import asyncio
import json
import time
import psutil
import logging
from collections import defaultdict
# Module-level logger for this router.
logger = logging.getLogger(__name__)

# All endpoints below are mounted under the /monitoring prefix.
router = APIRouter(
    prefix="/monitoring",
    tags=["Monitoring & Profiling"],
    responses={
        404: {"description": "Session not found"},
        500: {"description": "Internal server error"}
    }
)
# ============================================================================
# Data Structures
# ============================================================================
# In-memory storage for profiling sessions, keyed by session_id.
# NOTE(review): all state below is process-local — it resets on restart and
# is not shared between workers; confirm the server runs a single worker if
# these numbers must be accurate.
PROFILING_SESSIONS: Dict[str, Dict[str, Any]] = {}
# Real-time crawler statistics, mutated by track_crawl_start/track_crawl_end.
CRAWLER_STATS = {
    "active_crawls": 0,
    "total_crawls": 0,
    "successful_crawls": 0,
    "failed_crawls": 0,
    "total_bytes_processed": 0,
    "average_response_time_ms": 0.0,
    "last_updated": datetime.now().isoformat(),
}
# Per-URL statistics; defaultdict so an unseen URL starts from a zeroed record.
URL_STATS: Dict[str, Dict[str, Any]] = defaultdict(lambda: {
    "total_requests": 0,
    "success_count": 0,
    "failure_count": 0,
    "average_time_ms": 0.0,
    "last_accessed": None,
})
# ============================================================================
# Pydantic Models
# ============================================================================
class ProfilingStartRequest(BaseModel):
    """Request body for POST /monitoring/profile/start."""
    url: str = Field(..., description="URL to profile")
    browser_config: Optional[Dict[str, Any]] = Field(
        default_factory=dict,
        description="Browser configuration"
    )
    crawler_config: Optional[Dict[str, Any]] = Field(
        default_factory=dict,
        description="Crawler configuration"
    )
    # Also used as the hard timeout for the crawl itself in
    # run_profiling_session.
    profile_duration: Optional[int] = Field(
        default=30,
        ge=5,
        le=300,
        description="Maximum profiling duration in seconds"
    )
    collect_network: bool = Field(
        default=True,
        description="Collect network performance data"
    )
    collect_memory: bool = Field(
        default=True,
        description="Collect memory usage data"
    )
    collect_cpu: bool = Field(
        default=True,
        description="Collect CPU usage data"
    )

    class Config:
        # NOTE(review): `schema_extra` is pydantic v1 configuration; pydantic
        # v2 expects `json_schema_extra` — confirm the pinned pydantic version.
        schema_extra = {
            "example": {
                "url": "https://example.com",
                "profile_duration": 30,
                "collect_network": True,
                "collect_memory": True,
                "collect_cpu": True
            }
        }
class ProfilingSession(BaseModel):
    """Profiling session information; mirrors the dicts in PROFILING_SESSIONS."""
    session_id: str = Field(..., description="Unique session identifier")
    status: str = Field(..., description="Session status: running, completed, failed")
    url: str = Field(..., description="URL being profiled")
    start_time: str = Field(..., description="Session start time (ISO format)")
    end_time: Optional[str] = Field(None, description="Session end time (ISO format)")
    duration_seconds: Optional[float] = Field(None, description="Total duration in seconds")
    results: Optional[Dict[str, Any]] = Field(None, description="Profiling results")
    error: Optional[str] = Field(None, description="Error message if failed")

    class Config:
        # NOTE(review): pydantic v1 style config; v2 uses json_schema_extra.
        schema_extra = {
            "example": {
                "session_id": "abc123",
                "status": "completed",
                "url": "https://example.com",
                "start_time": "2025-10-16T10:30:00",
                "end_time": "2025-10-16T10:30:30",
                "duration_seconds": 30.5,
                "results": {
                    "performance": {
                        "page_load_time_ms": 1234,
                        "dom_content_loaded_ms": 890,
                        "first_paint_ms": 567
                    }
                }
            }
        }
class CrawlerStats(BaseModel):
    """Current crawler statistics.

    Response model for GET /monitoring/stats, combining the CRAWLER_STATS
    counters with a live system-resource snapshot.
    """
    active_crawls: int = Field(..., description="Number of currently active crawls")
    total_crawls: int = Field(..., description="Total crawls since server start")
    successful_crawls: int = Field(..., description="Number of successful crawls")
    failed_crawls: int = Field(..., description="Number of failed crawls")
    success_rate: float = Field(..., description="Success rate percentage")
    total_bytes_processed: int = Field(..., description="Total bytes processed")
    average_response_time_ms: float = Field(..., description="Average response time")
    uptime_seconds: float = Field(..., description="Server uptime in seconds")
    memory_usage_mb: float = Field(..., description="Current memory usage in MB")
    cpu_percent: float = Field(..., description="Current CPU usage percentage")
    last_updated: str = Field(..., description="Last update timestamp")
class URLStatistics(BaseModel):
    """Statistics for a specific URL pattern.

    Response item for GET /monitoring/stats/urls.
    """
    url_pattern: str
    total_requests: int
    success_count: int
    failure_count: int
    success_rate: float           # percentage in [0, 100]
    average_time_ms: float        # running average of crawl durations
    last_accessed: Optional[str]  # ISO timestamp of the most recent crawl
class SessionListResponse(BaseModel):
    """List of profiling sessions returned by GET /monitoring/profile."""
    total: int  # count of sessions in `sessions`
    sessions: List[ProfilingSession]
# ============================================================================
# Helper Functions
# ============================================================================
def get_system_stats() -> Dict[str, Any]:
    """Return resource usage for the current process.

    Returns:
        Dict with memory usage (MB), CPU percent, thread count, open-file
        count, and socket-connection count.  On any psutil failure the error
        is logged and an all-zero dict with the same keys is returned, so
        callers never need to handle exceptions.
    """
    try:
        process = psutil.Process()
        # psutil renamed Process.connections() to net_connections() in 5.9
        # and deprecated the old name; prefer the new API but fall back so
        # older psutil installs keep working.
        get_connections = getattr(process, "net_connections", process.connections)
        return {
            "memory_usage_mb": process.memory_info().rss / 1024 / 1024,
            # interval=0.1 blocks for 100 ms per call — fine for occasional
            # stats requests, but avoid calling this in tight loops.
            "cpu_percent": process.cpu_percent(interval=0.1),
            "num_threads": process.num_threads(),
            "open_files": len(process.open_files()),
            "connections": len(get_connections()),
        }
    except Exception as e:
        logger.error(f"Error getting system stats: {e}")
        return {
            "memory_usage_mb": 0.0,
            "cpu_percent": 0.0,
            "num_threads": 0,
            "open_files": 0,
            "connections": 0,
        }
def cleanup_old_sessions(max_age_hours: int = 24):
    """Drop profiling sessions older than *max_age_hours* hours.

    Returns:
        The number of sessions removed.
    """
    cutoff = datetime.now() - timedelta(hours=max_age_hours)

    def _expired(session: Dict[str, Any]) -> bool:
        # Sessions with a missing or unparseable start_time are kept.
        try:
            return datetime.fromisoformat(session["start_time"]) < cutoff
        except (ValueError, KeyError):
            return False

    stale_ids = [sid for sid, sess in PROFILING_SESSIONS.items() if _expired(sess)]
    for sid in stale_ids:
        del PROFILING_SESSIONS[sid]
        logger.info(f"Cleaned up old session: {sid}")
    return len(stale_ids)
# ============================================================================
# Profiling Endpoints
# ============================================================================
@router.post(
    "/profile/start",
    response_model=ProfilingSession,
    summary="Start profiling session",
    description="Start a new browser profiling session for performance analysis"
)
async def start_profiling_session(
    request: ProfilingStartRequest,
    background_tasks: BackgroundTasks
):
    """
    Create a profiling session and schedule it to run in the background.

    Responds immediately with a session record whose status is "running";
    poll GET /monitoring/profile/{session_id} for results.  The background
    task collects page-load performance, network timing, and memory/CPU
    usage according to the request's collect_* flags.
    """
    session_id = str(uuid.uuid4())

    record = {
        "session_id": session_id,
        "status": "running",
        "url": request.url,
        "start_time": datetime.now().isoformat(),
        "end_time": None,
        "duration_seconds": None,
        "results": None,
        "error": None,
        # Snapshot of the requested options for later inspection.
        "config": {
            "profile_duration": request.profile_duration,
            "collect_network": request.collect_network,
            "collect_memory": request.collect_memory,
            "collect_cpu": request.collect_cpu,
        },
    }
    PROFILING_SESSIONS[session_id] = record

    # The actual profiling work happens after the response is sent.
    background_tasks.add_task(run_profiling_session, session_id, request)
    logger.info(f"Started profiling session {session_id} for {request.url}")
    return ProfilingSession(**record)
@router.get(
    "/profile/{session_id}",
    response_model=ProfilingSession,
    summary="Get profiling results",
    description="Retrieve results from a profiling session"
)
async def get_profiling_results(session_id: str):
    """
    Return the current state of a profiling session.

    While the session is still running, `results` is None; once finished it
    holds the collected metrics.  Unknown session ids produce a 404.
    """
    try:
        session = PROFILING_SESSIONS[session_id]
    except KeyError:
        raise HTTPException(
            status_code=404,
            detail=f"Profiling session '{session_id}' not found"
        ) from None
    return ProfilingSession(**session)
@router.get(
    "/profile",
    response_model=SessionListResponse,
    summary="List profiling sessions",
    description="List all profiling sessions with optional filtering"
)
async def list_profiling_sessions(
    status: Optional[str] = Query(None, description="Filter by status: running, completed, failed"),
    limit: int = Query(50, ge=1, le=500, description="Maximum number of sessions to return")
):
    """
    List profiling sessions, newest first.

    Args:
        status: Optional status filter (running/completed/failed).
        limit: Maximum number of sessions to return.

    Returns:
        SessionListResponse where `total` is the number of sessions matching
        the filter BEFORE `limit` is applied, so clients can detect
        truncation.
    """
    sessions = list(PROFILING_SESSIONS.values())
    # Filter by status if provided
    if status:
        sessions = [s for s in sessions if s["status"] == status]
    # Sort by start time (newest first)
    sessions.sort(key=lambda x: x["start_time"], reverse=True)
    # Bug fix: count before truncating — previously `total` was computed
    # after the slice and therefore always equalled len(sessions) returned,
    # carrying no extra information.
    total = len(sessions)
    sessions = sessions[:limit]
    return SessionListResponse(
        total=total,
        sessions=[ProfilingSession(**s) for s in sessions]
    )
@router.delete(
    "/profile/{session_id}",
    summary="Delete profiling session",
    description="Delete a profiling session and its results"
)
async def delete_profiling_session(session_id: str):
    """
    Remove a profiling session and all of its stored data.

    Returns the deleted session so the caller keeps a final copy; unknown
    session ids produce a 404.
    """
    removed = PROFILING_SESSIONS.pop(session_id, None)
    if removed is None:
        raise HTTPException(
            status_code=404,
            detail=f"Profiling session '{session_id}' not found"
        )
    logger.info(f"Deleted profiling session {session_id}")
    return {
        "success": True,
        "message": f"Session {session_id} deleted",
        "session": ProfilingSession(**removed)
    }
@router.post(
    "/profile/cleanup",
    summary="Cleanup old sessions",
    description="Remove old profiling sessions to free memory"
)
async def cleanup_sessions(
    max_age_hours: int = Query(24, ge=1, le=168, description="Maximum age in hours")
):
    """
    Delete profiling sessions older than `max_age_hours`.

    Returns how many sessions were removed and how many remain.
    """
    removed_count = cleanup_old_sessions(max_age_hours)
    remaining = len(PROFILING_SESSIONS)
    return {
        "success": True,
        "removed_count": removed_count,
        "remaining_count": remaining,
        "message": f"Removed {removed_count} sessions older than {max_age_hours} hours"
    }
# ============================================================================
# Statistics Endpoints
# ============================================================================
@router.get(
    "/stats",
    response_model=CrawlerStats,
    summary="Get crawler statistics",
    description="Get current crawler statistics and system metrics"
)
async def get_crawler_stats():
    """
    Get current crawler statistics.

    Returns real-time metrics about:
    - Active and total crawls
    - Success/failure rates
    - Response times
    - Process uptime and system resource usage
    """
    system_stats = get_system_stats()
    total = CRAWLER_STATS["successful_crawls"] + CRAWLER_STATS["failed_crawls"]
    success_rate = (
        (CRAWLER_STATS["successful_crawls"] / total * 100)
        if total > 0 else 0.0
    )
    # Fix: the original returned a hard-coded 0.0 placeholder here.  The
    # psutil process create time gives real uptime without needing a
    # module-level start timestamp.
    try:
        uptime_seconds = time.time() - psutil.Process().create_time()
    except Exception as e:
        logger.error(f"Error getting process uptime: {e}")
        uptime_seconds = 0.0  # best effort: keep the endpoint healthy
    stats = CrawlerStats(
        active_crawls=CRAWLER_STATS["active_crawls"],
        total_crawls=CRAWLER_STATS["total_crawls"],
        successful_crawls=CRAWLER_STATS["successful_crawls"],
        failed_crawls=CRAWLER_STATS["failed_crawls"],
        success_rate=success_rate,
        total_bytes_processed=CRAWLER_STATS["total_bytes_processed"],
        average_response_time_ms=CRAWLER_STATS["average_response_time_ms"],
        uptime_seconds=uptime_seconds,
        memory_usage_mb=system_stats["memory_usage_mb"],
        cpu_percent=system_stats["cpu_percent"],
        last_updated=datetime.now().isoformat()
    )
    return stats
@router.get(
    "/stats/stream",
    summary="Stream crawler statistics",
    description="Server-Sent Events stream of real-time crawler statistics"
)
async def stream_crawler_stats(
    interval: int = Query(2, ge=1, le=60, description="Update interval in seconds")
):
    """
    Stream real-time crawler statistics.

    Returns an SSE (Server-Sent Events) stream that pushes
    statistics updates at the specified interval.

    Example:
    ```javascript
    const eventSource = new EventSource('/monitoring/stats/stream?interval=2');
    eventSource.onmessage = (event) => {
        const stats = JSON.parse(event.data);
        console.log('Stats:', stats);
    };
    ```
    """
    async def generate_stats() -> AsyncGenerator[str, None]:
        """Yield SSE-formatted stats frames until the client disconnects."""
        try:
            while True:
                # Get current stats (reuses the /stats endpoint handler).
                stats = await get_crawler_stats()
                # Format as SSE
                # NOTE(review): .dict() is the pydantic v1 API; v2 renamed it
                # to model_dump() — confirm the pinned pydantic version.
                data = json.dumps(stats.dict())
                yield f"data: {data}\n\n"
                # Wait for next interval
                await asyncio.sleep(interval)
        except asyncio.CancelledError:
            # Client disconnected; end the stream quietly.
            logger.info("Stats stream cancelled by client")
        except Exception as e:
            # Surface the failure to the client as an SSE error event.
            logger.error(f"Error in stats stream: {e}")
            yield f"event: error\ndata: {json.dumps({'error': str(e)})}\n\n"
    return StreamingResponse(
        generate_stats(),
        media_type="text/event-stream",
        headers={
            "Cache-Control": "no-cache",
            "Connection": "keep-alive",
            # Disable reverse-proxy buffering (nginx) so events flush at once.
            "X-Accel-Buffering": "no",
        }
    )
@router.get(
    "/stats/urls",
    response_model=List[URLStatistics],
    summary="Get URL statistics",
    description="Get statistics for crawled URLs"
)
async def get_url_statistics(
    limit: int = Query(100, ge=1, le=1000, description="Maximum number of URLs to return"),
    sort_by: str = Query("total_requests", description="Sort field: total_requests, success_rate, average_time_ms")
):
    """
    Get per-URL crawl statistics.

    Returns request counts, success rates, and timing for every URL seen so
    far, sorted by the requested field and truncated to `limit` entries.
    """
    def _as_model(pattern: str, record: Dict[str, Any]) -> URLStatistics:
        requests_seen = record["total_requests"]
        rate = (record["success_count"] / requests_seen * 100) if requests_seen > 0 else 0.0
        return URLStatistics(
            url_pattern=pattern,
            total_requests=record["total_requests"],
            success_count=record["success_count"],
            failure_count=record["failure_count"],
            success_rate=rate,
            average_time_ms=record["average_time_ms"],
            last_accessed=record["last_accessed"]
        )

    entries = [_as_model(u, rec) for u, rec in URL_STATS.items()]
    # Sort order per field; note average_time_ms sorts ascending (fastest
    # first) while the count/rate fields sort descending.
    if sort_by == "success_rate":
        entries.sort(key=lambda x: x.success_rate, reverse=True)
    elif sort_by == "average_time_ms":
        entries.sort(key=lambda x: x.average_time_ms)
    else:  # total_requests (default)
        entries.sort(key=lambda x: x.total_requests, reverse=True)
    return entries[:limit]
@router.post(
    "/stats/reset",
    summary="Reset statistics",
    description="Reset all crawler statistics to zero"
)
async def reset_statistics():
    """
    Reset all accumulated crawler statistics.

    Clears the global and per-URL counters while the server keeps running.
    Useful for testing or starting fresh measurements.
    """
    # Fix: mutate the existing dict instead of rebinding the module global.
    # Rebinding (`CRAWLER_STATS = {...}`) silently detaches any module that
    # imported the dict object directly; in-place update keeps every holder
    # observing the live counters.  The `global` statement is no longer
    # needed since nothing is rebound.
    CRAWLER_STATS.update({
        "active_crawls": 0,
        "total_crawls": 0,
        "successful_crawls": 0,
        "failed_crawls": 0,
        "total_bytes_processed": 0,
        "average_response_time_ms": 0.0,
        "last_updated": datetime.now().isoformat(),
    })
    URL_STATS.clear()
    logger.info("All statistics reset")
    return {
        "success": True,
        "message": "All statistics have been reset",
        "timestamp": datetime.now().isoformat()
    }
# ============================================================================
# Background Tasks
# ============================================================================
async def run_profiling_session(session_id: str, request: ProfilingStartRequest):
    """
    Background task to run profiling session.

    This performs the actual profiling work:
    1. Creates a crawler with profiling enabled
    2. Crawls the target URL
    3. Collects performance metrics
    4. Stores results in the session

    On any failure the session record is marked "failed" with the error
    message; exceptions never propagate out of the background task.
    """
    start_time = time.time()
    try:
        # Imported lazily so this router can be mounted even if crawl4ai is
        # unavailable or slow to import.
        from crawl4ai import AsyncWebCrawler, BrowserConfig, CrawlerRunConfig
        from crawl4ai.browser_profiler import BrowserProfiler
        logger.info(f"Starting profiling for session {session_id}")
        # Create profiler
        # NOTE(review): the BrowserProfiler.start()/stop() API is assumed
        # here — confirm against crawl4ai.browser_profiler.
        profiler = BrowserProfiler()
        # Configure browser and crawler
        browser_config = BrowserConfig.load(request.browser_config)
        crawler_config = CrawlerRunConfig.load(request.crawler_config)
        # Enable profiling options
        browser_config.profiling_enabled = True
        results = {}
        async with AsyncWebCrawler(config=browser_config) as crawler:
            # Start profiling
            profiler.start()
            # Collect system stats before
            stats_before = get_system_stats()
            # Crawl with timeout: profile_duration doubles as the hard
            # timeout for the crawl itself.
            try:
                result = await asyncio.wait_for(
                    crawler.arun(request.url, config=crawler_config),
                    timeout=request.profile_duration
                )
                crawl_success = result.success
            except asyncio.TimeoutError:
                logger.warning(f"Profiling session {session_id} timed out")
                crawl_success = False
                result = None
            # Stop profiling (also runs on the timeout path above)
            profiler_results = profiler.stop()
            # Collect system stats after
            stats_after = get_system_stats()
            # Build results
            results = {
                "crawl_success": crawl_success,
                "url": request.url,
                "performance": profiler_results if profiler_results else {},
                "system": {
                    "before": stats_before,
                    "after": stats_after,
                    # Rough resource cost of the crawl itself.
                    "delta": {
                        "memory_mb": stats_after["memory_usage_mb"] - stats_before["memory_usage_mb"],
                        "cpu_percent": stats_after["cpu_percent"] - stats_before["cpu_percent"],
                    }
                }
            }
        if result:
            # Content-size summary.  NOTE(review): assumes the crawl result
            # exposes markdown, html, links{internal,external} and
            # media{images,videos} in this shape — confirm with crawl4ai.
            results["content"] = {
                "markdown_length": len(result.markdown) if result.markdown else 0,
                "html_length": len(result.html) if result.html else 0,
                "links_count": len(result.links["internal"]) + len(result.links["external"]),
                "media_count": len(result.media["images"]) + len(result.media["videos"]),
            }
        # Update session with results
        end_time = time.time()
        duration = end_time - start_time
        PROFILING_SESSIONS[session_id].update({
            "status": "completed",
            "end_time": datetime.now().isoformat(),
            "duration_seconds": duration,
            "results": results
        })
        logger.info(f"Profiling session {session_id} completed in {duration:.2f}s")
    except Exception as e:
        logger.error(f"Profiling session {session_id} failed: {str(e)}")
        PROFILING_SESSIONS[session_id].update({
            "status": "failed",
            "end_time": datetime.now().isoformat(),
            "duration_seconds": time.time() - start_time,
            "error": str(e)
        })
# ============================================================================
# Middleware Integration Points
# ============================================================================
def track_crawl_start():
    """Record the start of a crawl in the global counters."""
    now = datetime.now().isoformat()
    CRAWLER_STATS["active_crawls"] += 1
    CRAWLER_STATS["total_crawls"] += 1
    CRAWLER_STATS["last_updated"] = now
def track_crawl_end(url: str, success: bool, duration_ms: float, bytes_processed: int = 0):
    """Record the completion of a crawl in global and per-URL statistics.

    Args:
        url: The crawled URL (used as the per-URL stats key).
        success: Whether the crawl succeeded.
        duration_ms: Crawl duration in milliseconds.
        bytes_processed: Approximate content size handled.
    """
    now = datetime.now().isoformat()

    # Never let the active counter go negative.
    if CRAWLER_STATS["active_crawls"] > 0:
        CRAWLER_STATS["active_crawls"] -= 1

    outcome_key = "successful_crawls" if success else "failed_crawls"
    CRAWLER_STATS[outcome_key] += 1
    CRAWLER_STATS["total_bytes_processed"] += bytes_processed

    # Running average over all finished crawls (>= 1 after the increment
    # above, so the division is safe).
    finished = CRAWLER_STATS["successful_crawls"] + CRAWLER_STATS["failed_crawls"]
    prev_avg = CRAWLER_STATS["average_response_time_ms"]
    CRAWLER_STATS["average_response_time_ms"] = (
        (prev_avg * (finished - 1) + duration_ms) / finished
    )

    # Per-URL bookkeeping (defaultdict creates a zeroed record on first use).
    record = URL_STATS[url]
    record["total_requests"] += 1
    record["success_count" if success else "failure_count"] += 1
    requests_seen = record["total_requests"]
    prev_url_avg = record["average_time_ms"]
    record["average_time_ms"] = (
        (prev_url_avg * (requests_seen - 1) + duration_ms) / requests_seen
    )
    record["last_accessed"] = now
    CRAWLER_STATS["last_updated"] = now
# ============================================================================
# Health Check
# ============================================================================
@router.get(
    "/health",
    summary="Health check",
    description="Check if monitoring system is operational"
)
async def health_check():
    """
    Report monitoring-subsystem health.

    Includes counts of running and total profiling sessions plus a snapshot
    of process resource usage.
    """
    system_stats = get_system_stats()
    running = sum(
        1 for s in PROFILING_SESSIONS.values() if s["status"] == "running"
    )
    return {
        "status": "healthy",
        "timestamp": datetime.now().isoformat(),
        "active_sessions": running,
        "total_sessions": len(PROFILING_SESSIONS),
        "system": system_stats
    }

View File

@@ -87,7 +87,7 @@ from prometheus_fastapi_instrumentator import Instrumentator
from pydantic import BaseModel, Field
from rank_bm25 import BM25Okapi
from redis import asyncio as aioredis
from routers import adaptive, dispatchers, scripts
from routers import adaptive, dispatchers, scripts, monitoring
from schemas import (
CrawlRequest,
CrawlRequestWithHooks,
@@ -297,6 +297,7 @@ app.include_router(init_job_router(redis, config, token_dep))
app.include_router(adaptive.router)
app.include_router(dispatchers.router)
app.include_router(scripts.router)
app.include_router(monitoring.router)
# ──────────────────────── Endpoints ──────────────────────────

View File

@@ -48,6 +48,18 @@ Visit `http://localhost:11235/docs` for interactive Swagger UI documentation.
- [POST /adaptive/crawl](#post-adaptivecrawl) - Adaptive crawl with auto-discovery
- [GET /adaptive/status/{task_id}](#get-adaptivestatustask_id) - Check adaptive crawl status
### Monitoring & Profiling
- [GET /monitoring/health](#get-monitoringhealth) - Health check endpoint
- [GET /monitoring/stats](#get-monitoringstats) - Get current statistics
- [GET /monitoring/stats/stream](#get-monitoringstatsstream) - Real-time statistics stream (SSE)
- [GET /monitoring/stats/urls](#get-monitoringstatsurls) - URL-specific statistics
- [POST /monitoring/stats/reset](#post-monitoringstatsreset) - Reset statistics
- [POST /monitoring/profile/start](#post-monitoringprofilestart) - Start profiling session
- [GET /monitoring/profile/{session_id}](#get-monitoringprofilesession_id) - Get profiling results
- [GET /monitoring/profile](#get-monitoringprofile) - List profiling sessions
- [DELETE /monitoring/profile/{session_id}](#delete-monitoringprofilesession_id) - Delete session
- [POST /monitoring/profile/cleanup](#post-monitoringprofilecleanup) - Cleanup old sessions
### Utility Endpoints
- [POST /token](#post-token) - Get authentication token
- [GET /health](#get-health) - Health check
@@ -1013,6 +1025,487 @@ Check status of adaptive crawl task.
---
## Monitoring & Profiling
The monitoring endpoints provide real-time statistics, profiling capabilities, and health monitoring for your Crawl4AI instance.
### GET /monitoring/health
Health check endpoint for monitoring integration.
#### Response
```json
{
"status": "healthy",
"uptime_seconds": 3600,
"timestamp": "2025-01-07T12:00:00Z"
}
```
#### Examples
=== "Python"
```python
response = requests.get("http://localhost:11235/monitoring/health")
health = response.json()
print(f"Status: {health['status']}")
print(f"Uptime: {health['uptime_seconds']}s")
```
=== "cURL"
```bash
curl http://localhost:11235/monitoring/health
```
---
### GET /monitoring/stats
Get current crawler statistics and system metrics.
#### Response
```json
{
"active_crawls": 2,
"total_crawls": 150,
"successful_crawls": 142,
"failed_crawls": 8,
"success_rate": 94.67,
"avg_duration_ms": 1250.5,
"total_bytes_processed": 15728640,
"system_stats": {
"cpu_percent": 45.2,
"memory_percent": 62.8,
"memory_used_mb": 2048,
"memory_available_mb": 8192,
"disk_usage_percent": 55.3,
"active_processes": 127
}
}
```
#### Examples
=== "Python"
```python
response = requests.get("http://localhost:11235/monitoring/stats")
stats = response.json()
print(f"Active crawls: {stats['active_crawls']}")
print(f"Success rate: {stats['success_rate']:.2f}%")
print(f"CPU usage: {stats['system_stats']['cpu_percent']:.1f}%")
print(f"Memory usage: {stats['system_stats']['memory_percent']:.1f}%")
```
=== "cURL"
```bash
curl http://localhost:11235/monitoring/stats
```
---
### GET /monitoring/stats/stream
Server-Sent Events (SSE) stream of real-time statistics. Updates every 2 seconds.
#### Response
```
data: {"active_crawls": 2, "total_crawls": 150, ...}
data: {"active_crawls": 3, "total_crawls": 151, ...}
data: {"active_crawls": 2, "total_crawls": 151, ...}
```
#### Examples
=== "Python"
```python
import requests
import json
# Stream real-time stats
response = requests.get(
"http://localhost:11235/monitoring/stats/stream",
stream=True
)
for line in response.iter_lines():
if line.startswith(b"data: "):
data = json.loads(line[6:]) # Remove "data: " prefix
print(f"Active: {data['active_crawls']}, "
f"Total: {data['total_crawls']}, "
f"CPU: {data['system_stats']['cpu_percent']:.1f}%")
```
=== "JavaScript"
```javascript
const eventSource = new EventSource('http://localhost:11235/monitoring/stats/stream');
eventSource.onmessage = (event) => {
const stats = JSON.parse(event.data);
console.log('Active crawls:', stats.active_crawls);
console.log('CPU:', stats.system_stats.cpu_percent);
};
```
---
### GET /monitoring/stats/urls
Get URL-specific statistics showing per-URL performance metrics.
#### Response
```json
[
{
"url": "https://example.com",
"total_requests": 45,
"successful_requests": 42,
"failed_requests": 3,
"avg_duration_ms": 850.3,
"total_bytes_processed": 2621440,
"last_request_time": "2025-01-07T12:00:00Z"
},
{
"url": "https://python.org",
"total_requests": 32,
"successful_requests": 32,
"failed_requests": 0,
"avg_duration_ms": 1120.7,
"total_bytes_processed": 1835008,
"last_request_time": "2025-01-07T11:55:00Z"
}
]
```
#### Examples
=== "Python"
```python
response = requests.get("http://localhost:11235/monitoring/stats/urls")
url_stats = response.json()
for stat in url_stats:
success_rate = (stat['successful_requests'] / stat['total_requests']) * 100
print(f"\nURL: {stat['url']}")
print(f" Requests: {stat['total_requests']}")
print(f" Success rate: {success_rate:.1f}%")
print(f" Avg time: {stat['avg_duration_ms']:.1f}ms")
print(f" Data processed: {stat['total_bytes_processed'] / 1024:.1f}KB")
```
---
### POST /monitoring/stats/reset
Reset all statistics counters. Useful for testing or starting fresh monitoring sessions.
#### Response
```json
{
"status": "reset",
"previous_stats": {
"total_crawls": 150,
"successful_crawls": 142,
"failed_crawls": 8
}
}
```
#### Examples
=== "Python"
```python
response = requests.post("http://localhost:11235/monitoring/stats/reset")
result = response.json()
print(f"Stats reset. Previous total: {result['previous_stats']['total_crawls']}")
```
=== "cURL"
```bash
curl -X POST http://localhost:11235/monitoring/stats/reset
```
---
### POST /monitoring/profile/start
Start a profiling session to monitor crawler performance over time.
#### Request
```json
{
  "url": "https://example.com",
  "profile_duration": 60,
  "browser_config": {
    "headless": true
  },
  "crawler_config": {
    "word_count_threshold": 10
  }
}
```
#### Response
```json
{
"session_id": "prof_abc123xyz",
"status": "running",
"started_at": "2025-01-07T12:00:00Z",
"urls": [
"https://example.com",
"https://python.org"
],
"duration_seconds": 60
}
```
#### Examples
=== "Python"
```python
# Start a profiling session
response = requests.post(
    "http://localhost:11235/monitoring/profile/start",
    json={
        "url": "https://example.com",
        "profile_duration": 60,
        "crawler_config": {
            "word_count_threshold": 10
        }
    }
)
session = response.json()
session_id = session["session_id"]
print(f"Profiling session started: {session_id}")
print(f"Status: {session['status']}")
```
---
### GET /monitoring/profile/{session_id}
Get profiling session details and results.
#### Response
```json
{
"session_id": "prof_abc123xyz",
"status": "completed",
"started_at": "2025-01-07T12:00:00Z",
"completed_at": "2025-01-07T12:01:00Z",
"duration_seconds": 60,
"urls": ["https://example.com", "https://python.org"],
"results": {
"total_requests": 120,
"successful_requests": 115,
"failed_requests": 5,
"avg_response_time_ms": 950.3,
"system_metrics": {
"avg_cpu_percent": 48.5,
"peak_cpu_percent": 72.3,
"avg_memory_percent": 55.2,
"peak_memory_percent": 68.9,
"total_bytes_processed": 5242880
}
}
}
```
#### Examples
=== "Python"
```python
import time
# Start session
start_response = requests.post(
"http://localhost:11235/monitoring/profile/start",
json={
"urls": ["https://example.com"],
"duration_seconds": 30
}
)
session_id = start_response.json()["session_id"]
# Wait for completion
time.sleep(32)
# Get results
result_response = requests.get(
f"http://localhost:11235/monitoring/profile/{session_id}"
)
session = result_response.json()
print(f"Session: {session_id}")
print(f"Status: {session['status']}")
if session['status'] == 'completed':
results = session['results']
print(f"\nResults:")
print(f" Total requests: {results['total_requests']}")
print(f" Success rate: {results['successful_requests'] / results['total_requests'] * 100:.1f}%")
print(f" Avg response time: {results['avg_response_time_ms']:.1f}ms")
print(f"\nSystem Metrics:")
print(f" Avg CPU: {results['system_metrics']['avg_cpu_percent']:.1f}%")
print(f" Peak CPU: {results['system_metrics']['peak_cpu_percent']:.1f}%")
print(f" Avg Memory: {results['system_metrics']['avg_memory_percent']:.1f}%")
```
---
### GET /monitoring/profile
List all profiling sessions.
#### Response
```json
{
"sessions": [
{
"session_id": "prof_abc123xyz",
"status": "completed",
"started_at": "2025-01-07T12:00:00Z",
"completed_at": "2025-01-07T12:01:00Z",
"duration_seconds": 60,
"urls": ["https://example.com"]
},
{
"session_id": "prof_def456uvw",
"status": "running",
"started_at": "2025-01-07T12:05:00Z",
"duration_seconds": 120,
"urls": ["https://python.org", "https://github.com"]
}
]
}
```
#### Examples
=== "Python"
```python
response = requests.get("http://localhost:11235/monitoring/profile")
data = response.json()
print(f"Total sessions: {len(data['sessions'])}")
for session in data['sessions']:
print(f"\n{session['session_id']}")
print(f" Status: {session['status']}")
print(f" URLs: {', '.join(session['urls'])}")
print(f" Duration: {session['duration_seconds']}s")
```
---
### DELETE /monitoring/profile/{session_id}
Delete a profiling session.
#### Response
```json
{
"status": "deleted",
"session_id": "prof_abc123xyz"
}
```
#### Examples
=== "Python"
```python
response = requests.delete(
f"http://localhost:11235/monitoring/profile/{session_id}"
)
if response.status_code == 200:
print(f"Session {session_id} deleted")
```
---
### POST /monitoring/profile/cleanup
Clean up old profiling sessions.
#### Request
```json
{
"max_age_seconds": 3600
}
```
#### Response
```json
{
"deleted_count": 5,
"remaining_count": 3
}
```
#### Examples
=== "Python"
```python
# Delete sessions older than 1 hour
response = requests.post(
"http://localhost:11235/monitoring/profile/cleanup",
json={"max_age_seconds": 3600}
)
result = response.json()
print(f"Deleted {result['deleted_count']} old sessions")
print(f"Remaining: {result['remaining_count']}")
```
---
### Monitoring Dashboard Demo
We provide an interactive terminal-based dashboard for monitoring. Run it with:
```bash
python tests/docker/extended_features/demo_monitoring_dashboard.py --url http://localhost:11235
```
**Features:**
- Real-time statistics with auto-refresh
- System resource monitoring (CPU, Memory, Disk)
- URL-specific performance metrics
- Profiling session management
- Interactive commands (view, create, delete sessions)
- Color-coded status indicators
**Dashboard Commands:**
- `[D]` - Dashboard view (default)
- `[S]` - Profiling sessions view
- `[U]` - URL statistics view
- `[R]` - Reset statistics
- `[N]` - Create new profiling session (from sessions view)
- `[V]` - View session details (from sessions view)
- `[X]` - Delete session (from sessions view)
- `[Q]` - Quit
---
## Utility Endpoints
### POST /token

View File

@@ -0,0 +1,479 @@
"""
Interactive Monitoring Dashboard Demo
This demo showcases the monitoring and profiling capabilities of Crawl4AI's Docker server.
It provides:
- Real-time statistics dashboard with auto-refresh
- Profiling session management
- System resource monitoring
- URL-specific statistics
- Interactive terminal UI
Usage:
python demo_monitoring_dashboard.py [--url BASE_URL]
"""
import argparse
import asyncio
import json
import sys
import time
from datetime import datetime
from typing import Dict, List, Optional
import httpx
class Colors:
    """ANSI color codes for terminal output."""
    HEADER = '\033[95m'     # bright magenta — page headers
    OKBLUE = '\033[94m'     # blue — section titles
    OKCYAN = '\033[96m'     # cyan — interactive prompts
    OKGREEN = '\033[92m'    # green — success / healthy thresholds
    WARNING = '\033[93m'    # yellow — warnings / mid thresholds
    FAIL = '\033[91m'       # red — errors / high thresholds
    ENDC = '\033[0m'        # reset all attributes
    BOLD = '\033[1m'        # bold text
    UNDERLINE = '\033[4m'   # underlined text
class MonitoringDashboard:
    """Interactive monitoring dashboard for Crawl4AI.

    Polls the Docker server's ``/monitoring/*`` endpoints and renders an
    auto-refreshing terminal UI with three views (dashboard, profiling
    sessions, URL stats) plus interactive profiling-session management.

    All sleeps inside coroutines use ``await asyncio.sleep`` so the event
    loop is never blocked while waiting.
    """

    def __init__(self, base_url: str = "http://localhost:11235"):
        # 11235 is the documented default port of the Crawl4AI Docker server
        # (see the monitoring docs in this repo); pass a different base_url
        # to target another instance.
        self.base_url = base_url
        self.client = httpx.AsyncClient(base_url=base_url, timeout=60.0)
        self.running = True  # cleared by the [Q] command to exit the main loop
        self.current_view = "dashboard"  # dashboard, sessions, urls
        self.profiling_sessions: List[Dict] = []

    async def close(self):
        """Close the HTTP client and release its connection pool."""
        await self.client.aclose()

    def clear_screen(self):
        """Clear the terminal screen (ANSI: erase display + home cursor)."""
        print("\033[2J\033[H", end="")

    def print_header(self, title: str):
        """Print a formatted 80-column header with *title* centered."""
        width = 80
        print(f"\n{Colors.HEADER}{Colors.BOLD}")
        print("=" * width)
        print(f"{title.center(width)}")
        print("=" * width)
        print(f"{Colors.ENDC}")

    def print_section(self, title: str):
        """Print a section header followed by a rule."""
        print(f"\n{Colors.OKBLUE}{Colors.BOLD}{title}{Colors.ENDC}")
        print("-" * 80)

    async def check_health(self) -> Dict:
        """Check server health; returns an error dict instead of raising."""
        try:
            response = await self.client.get("/monitoring/health")
            response.raise_for_status()
            return response.json()
        except Exception as e:
            return {"status": "error", "error": str(e)}

    async def get_stats(self) -> Dict:
        """Get current statistics; returns ``{"error": ...}`` on failure."""
        try:
            response = await self.client.get("/monitoring/stats")
            response.raise_for_status()
            return response.json()
        except Exception as e:
            return {"error": str(e)}

    async def get_url_stats(self) -> List[Dict]:
        """Get URL-specific statistics; empty list on any failure."""
        try:
            response = await self.client.get("/monitoring/stats/urls")
            response.raise_for_status()
            return response.json()
        except Exception:
            return []

    async def list_profiling_sessions(self) -> List[Dict]:
        """List all profiling sessions; empty list on any failure."""
        try:
            response = await self.client.get("/monitoring/profile")
            response.raise_for_status()
            data = response.json()
            return data.get("sessions", [])
        except Exception:
            return []

    async def start_profiling_session(self, urls: List[str], duration: int = 30) -> Dict:
        """Start a new profiling session for *urls* lasting *duration* seconds."""
        try:
            request_data = {
                "urls": urls,
                "duration_seconds": duration,
                "crawler_config": {
                    "word_count_threshold": 10
                }
            }
            response = await self.client.post("/monitoring/profile/start", json=request_data)
            response.raise_for_status()
            return response.json()
        except Exception as e:
            return {"error": str(e)}

    async def get_profiling_session(self, session_id: str) -> Dict:
        """Get profiling session details; ``{"error": ...}`` on failure."""
        try:
            response = await self.client.get(f"/monitoring/profile/{session_id}")
            response.raise_for_status()
            return response.json()
        except Exception as e:
            return {"error": str(e)}

    async def delete_profiling_session(self, session_id: str) -> Dict:
        """Delete a profiling session; ``{"error": ...}`` on failure."""
        try:
            response = await self.client.delete(f"/monitoring/profile/{session_id}")
            response.raise_for_status()
            return response.json()
        except Exception as e:
            return {"error": str(e)}

    async def reset_stats(self) -> Dict:
        """Reset all server-side statistics; ``{"error": ...}`` on failure."""
        try:
            response = await self.client.post("/monitoring/stats/reset")
            response.raise_for_status()
            return response.json()
        except Exception as e:
            return {"error": str(e)}

    def display_dashboard(self, stats: Dict):
        """Render the main statistics dashboard view from a stats payload."""
        self.clear_screen()
        self.print_header("Crawl4AI Monitoring Dashboard")
        # Health Status
        print(f"\n{Colors.OKGREEN}● Server Status: ONLINE{Colors.ENDC}")
        print(f"Base URL: {self.base_url}")
        print(f"Last Updated: {datetime.now().strftime('%Y-%m-%d %H:%M:%S')}")
        # Crawler Statistics
        self.print_section("Crawler Statistics")
        if "error" in stats:
            print(f"{Colors.FAIL}Error fetching stats: {stats['error']}{Colors.ENDC}")
        else:
            print(f"Active Crawls: {Colors.BOLD}{stats.get('active_crawls', 0)}{Colors.ENDC}")
            print(f"Total Crawls: {stats.get('total_crawls', 0)}")
            print(f"Successful: {Colors.OKGREEN}{stats.get('successful_crawls', 0)}{Colors.ENDC}")
            print(f"Failed: {Colors.FAIL}{stats.get('failed_crawls', 0)}{Colors.ENDC}")
            print(f"Success Rate: {stats.get('success_rate', 0):.2f}%")
            print(f"Avg Duration: {stats.get('avg_duration_ms', 0):.2f} ms")
            # Format byte counts into a human-readable unit (MB/KB/bytes)
            total_bytes = stats.get('total_bytes_processed', 0)
            if total_bytes > 1024 * 1024:
                bytes_str = f"{total_bytes / (1024 * 1024):.2f} MB"
            elif total_bytes > 1024:
                bytes_str = f"{total_bytes / 1024:.2f} KB"
            else:
                bytes_str = f"{total_bytes} bytes"
            print(f"Total Data Processed: {bytes_str}")
        # System Statistics — color thresholds: green/yellow/red bands
        if "system_stats" in stats:
            self.print_section("System Resources")
            sys_stats = stats["system_stats"]
            cpu = sys_stats.get("cpu_percent", 0)
            cpu_color = Colors.OKGREEN if cpu < 50 else Colors.WARNING if cpu < 80 else Colors.FAIL
            print(f"CPU Usage: {cpu_color}{cpu:.1f}%{Colors.ENDC}")
            mem = sys_stats.get("memory_percent", 0)
            mem_color = Colors.OKGREEN if mem < 50 else Colors.WARNING if mem < 80 else Colors.FAIL
            print(f"Memory Usage: {mem_color}{mem:.1f}%{Colors.ENDC}")
            mem_used = sys_stats.get("memory_used_mb", 0)
            mem_available = sys_stats.get("memory_available_mb", 0)
            print(f"Memory Used: {mem_used:.0f} MB / {mem_available:.0f} MB")
            disk = sys_stats.get("disk_usage_percent", 0)
            disk_color = Colors.OKGREEN if disk < 70 else Colors.WARNING if disk < 90 else Colors.FAIL
            print(f"Disk Usage: {disk_color}{disk:.1f}%{Colors.ENDC}")
            print(f"Active Processes: {sys_stats.get('active_processes', 0)}")
        # Navigation
        self.print_section("Navigation")
        print(f"[D] Dashboard [S] Profiling Sessions [U] URL Stats [R] Reset Stats [Q] Quit")

    def display_url_stats(self, url_stats: List[Dict]):
        """Render the per-URL statistics table (top 20 by request count)."""
        self.clear_screen()
        self.print_header("URL Statistics")
        if not url_stats:
            print(f"\n{Colors.WARNING}No URL statistics available yet.{Colors.ENDC}")
        else:
            print(f"\nTotal URLs tracked: {len(url_stats)}")
            print()
            # Table header
            print(f"{Colors.BOLD}{'URL':<50} {'Requests':<10} {'Success':<10} {'Avg Time':<12} {'Data':<12}{Colors.ENDC}")
            print("-" * 94)
            # Sort by total requests, busiest first
            sorted_stats = sorted(url_stats, key=lambda x: x.get('total_requests', 0), reverse=True)
            for stat in sorted_stats[:20]:  # Show top 20
                url = stat.get('url', 'unknown')
                if len(url) > 47:
                    url = url[:44] + "..."
                total = stat.get('total_requests', 0)
                success = stat.get('successful_requests', 0)
                success_pct = f"{(success/total*100):.0f}%" if total > 0 else "N/A"
                avg_time = stat.get('avg_duration_ms', 0)
                time_str = f"{avg_time:.0f} ms"
                bytes_processed = stat.get('total_bytes_processed', 0)
                if bytes_processed > 1024 * 1024:
                    data_str = f"{bytes_processed / (1024 * 1024):.2f} MB"
                elif bytes_processed > 1024:
                    data_str = f"{bytes_processed / 1024:.2f} KB"
                else:
                    data_str = f"{bytes_processed} B"
                print(f"{url:<50} {total:<10} {success_pct:<10} {time_str:<12} {data_str:<12}")
        # Navigation
        self.print_section("Navigation")
        print(f"[D] Dashboard [S] Profiling Sessions [U] URL Stats [R] Reset Stats [Q] Quit")

    def display_profiling_sessions(self, sessions: List[Dict]):
        """Render the profiling-sessions table (15 most recent)."""
        self.clear_screen()
        self.print_header("Profiling Sessions")
        if not sessions:
            print(f"\n{Colors.WARNING}No profiling sessions found.{Colors.ENDC}")
        else:
            print(f"\nTotal sessions: {len(sessions)}")
            print()
            # Table header
            print(f"{Colors.BOLD}{'ID':<25} {'Status':<12} {'URLs':<6} {'Duration':<12} {'Started':<20}{Colors.ENDC}")
            print("-" * 85)
            # Sort by started time (newest first)
            sorted_sessions = sorted(sessions, key=lambda x: x.get('started_at', ''), reverse=True)
            for session in sorted_sessions[:15]:  # Show top 15
                session_id = session.get('session_id', 'unknown')
                if len(session_id) > 22:
                    session_id = session_id[:19] + "..."
                status = session.get('status', 'unknown')
                status_color = Colors.OKGREEN if status == 'completed' else Colors.WARNING if status == 'running' else Colors.FAIL
                url_count = len(session.get('urls', []))
                duration = session.get('duration_seconds', 0)
                duration_str = f"{duration}s" if duration else "N/A"
                started = session.get('started_at', 'N/A')
                if started != 'N/A':
                    # Best effort: reformat ISO timestamps, leave others as-is
                    try:
                        dt = datetime.fromisoformat(started.replace('Z', '+00:00'))
                        started = dt.strftime('%Y-%m-%d %H:%M:%S')
                    except ValueError:
                        pass
                print(f"{session_id:<25} {status_color}{status:<12}{Colors.ENDC} {url_count:<6} {duration_str:<12} {started:<20}")
        # Navigation
        self.print_section("Navigation & Actions")
        print(f"[D] Dashboard [S] Profiling Sessions [U] URL Stats")
        print(f"[N] New Session [V] View Session [X] Delete Session")
        print(f"[R] Reset Stats [Q] Quit")

    async def interactive_session_view(self, session_id: str):
        """Fetch and display the detailed view of one profiling session.

        NOTE(review): the trailing ``input()`` blocks the event loop while
        waiting for a keypress; acceptable here because nothing else is
        scheduled, but confirm before reusing in a concurrent context.
        """
        session = await self.get_profiling_session(session_id)
        self.clear_screen()
        self.print_header(f"Profiling Session: {session_id}")
        if "error" in session:
            print(f"\n{Colors.FAIL}Error: {session['error']}{Colors.ENDC}")
        else:
            print(f"\n{Colors.BOLD}Session ID:{Colors.ENDC} {session.get('session_id', 'N/A')}")
            status = session.get('status', 'unknown')
            status_color = Colors.OKGREEN if status == 'completed' else Colors.WARNING
            print(f"{Colors.BOLD}Status:{Colors.ENDC} {status_color}{status}{Colors.ENDC}")
            print(f"{Colors.BOLD}URLs:{Colors.ENDC}")
            for url in session.get('urls', []):
                print(f" - {url}")
            started = session.get('started_at', 'N/A')
            print(f"{Colors.BOLD}Started:{Colors.ENDC} {started}")
            if 'completed_at' in session:
                print(f"{Colors.BOLD}Completed:{Colors.ENDC} {session['completed_at']}")
            if 'results' in session:
                self.print_section("Profiling Results")
                results = session['results']
                print(f"Total Requests: {results.get('total_requests', 0)}")
                print(f"Successful: {Colors.OKGREEN}{results.get('successful_requests', 0)}{Colors.ENDC}")
                print(f"Failed: {Colors.FAIL}{results.get('failed_requests', 0)}{Colors.ENDC}")
                print(f"Avg Response Time: {results.get('avg_response_time_ms', 0):.2f} ms")
                if 'system_metrics' in results:
                    self.print_section("System Metrics During Profiling")
                    metrics = results['system_metrics']
                    print(f"Avg CPU: {metrics.get('avg_cpu_percent', 0):.1f}%")
                    print(f"Peak CPU: {metrics.get('peak_cpu_percent', 0):.1f}%")
                    print(f"Avg Memory: {metrics.get('avg_memory_percent', 0):.1f}%")
                    print(f"Peak Memory: {metrics.get('peak_memory_percent', 0):.1f}%")
        print(f"\n{Colors.OKCYAN}Press any key to return...{Colors.ENDC}")
        input()

    async def create_new_session(self):
        """Interactively prompt for URLs/duration and start a session."""
        self.clear_screen()
        self.print_header("Create New Profiling Session")
        print(f"\n{Colors.BOLD}Enter URLs to profile (one per line, empty line to finish):{Colors.ENDC}")
        urls = []
        while True:
            url = input(f"{Colors.OKCYAN}URL {len(urls) + 1}:{Colors.ENDC} ").strip()
            if not url:
                break
            urls.append(url)
        if not urls:
            print(f"{Colors.FAIL}No URLs provided. Cancelled.{Colors.ENDC}")
            # await, not time.sleep: don't block the event loop
            await asyncio.sleep(2)
            return
        duration = input(f"{Colors.OKCYAN}Duration (seconds, default 30):{Colors.ENDC} ").strip()
        try:
            duration = int(duration) if duration else 30
        except ValueError:
            # Non-numeric input falls back to the default duration
            duration = 30
        print(f"\n{Colors.WARNING}Starting profiling session for {len(urls)} URL(s), {duration}s...{Colors.ENDC}")
        result = await self.start_profiling_session(urls, duration)
        if "error" in result:
            print(f"{Colors.FAIL}Error: {result['error']}{Colors.ENDC}")
        else:
            print(f"{Colors.OKGREEN}✓ Session started successfully!{Colors.ENDC}")
            print(f"Session ID: {result.get('session_id', 'N/A')}")
        await asyncio.sleep(3)

    async def run_dashboard(self):
        """Run the interactive dashboard loop until the user quits.

        Refreshes the active view, then waits up to 5 seconds for a
        single-letter command (auto-refreshing on timeout).
        """
        print(f"{Colors.OKGREEN}Starting Crawl4AI Monitoring Dashboard...{Colors.ENDC}")
        print(f"Connecting to {self.base_url}...")
        # Bail out early if the server is unreachable or unhealthy
        health = await self.check_health()
        if health.get("status") != "healthy":
            print(f"{Colors.FAIL}Error: Server not responding or unhealthy{Colors.ENDC}")
            print(f"Health check result: {health}")
            return
        print(f"{Colors.OKGREEN}✓ Connected successfully!{Colors.ENDC}")
        await asyncio.sleep(1)
        # Main loop: render current view, then read a command
        while self.running:
            if self.current_view == "dashboard":
                stats = await self.get_stats()
                self.display_dashboard(stats)
            elif self.current_view == "urls":
                url_stats = await self.get_url_stats()
                self.display_url_stats(url_stats)
            elif self.current_view == "sessions":
                sessions = await self.list_profiling_sessions()
                self.display_profiling_sessions(sessions)
            # Get user input (non-blocking with timeout where supported)
            print(f"\n{Colors.OKCYAN}Enter command (or wait 5s for auto-refresh):{Colors.ENDC} ", end="", flush=True)
            try:
                # select() on stdin gives a 5s timeout on POSIX platforms
                import select
                if sys.platform != 'win32':
                    i, _, _ = select.select([sys.stdin], [], [], 5.0)
                    if i:
                        command = sys.stdin.readline().strip().lower()
                    else:
                        command = ""
                else:
                    # Windows doesn't support select on stdin; block instead
                    command = input()
            except Exception:
                # Treat any read failure as "no command" so Ctrl-C still
                # propagates out of the loop rather than being swallowed.
                command = ""
            # Process command
            if command == 'q':
                self.running = False
            elif command == 'd':
                self.current_view = "dashboard"
            elif command == 's':
                self.current_view = "sessions"
            elif command == 'u':
                self.current_view = "urls"
            elif command == 'r':
                print(f"\n{Colors.WARNING}Resetting statistics...{Colors.ENDC}")
                await self.reset_stats()
                await asyncio.sleep(1)
            elif command == 'n' and self.current_view == "sessions":
                await self.create_new_session()
            elif command == 'v' and self.current_view == "sessions":
                session_id = input(f"{Colors.OKCYAN}Enter session ID:{Colors.ENDC} ").strip()
                if session_id:
                    await self.interactive_session_view(session_id)
            elif command == 'x' and self.current_view == "sessions":
                session_id = input(f"{Colors.OKCYAN}Enter session ID to delete:{Colors.ENDC} ").strip()
                if session_id:
                    result = await self.delete_profiling_session(session_id)
                    if "error" in result:
                        print(f"{Colors.FAIL}Error: {result['error']}{Colors.ENDC}")
                    else:
                        print(f"{Colors.OKGREEN}✓ Session deleted{Colors.ENDC}")
                    await asyncio.sleep(2)
        self.clear_screen()
        print(f"\n{Colors.OKGREEN}Dashboard closed. Goodbye!{Colors.ENDC}\n")
async def main():
    """Parse CLI arguments and run the dashboard until the user quits."""
    parser = argparse.ArgumentParser(description="Crawl4AI Monitoring Dashboard")
    parser.add_argument(
        "--url",
        # 11235 matches the documented default port of the Docker server
        # (all monitoring docs and integration tests in this repo use it).
        default="http://localhost:11235",
        help="Base URL of the Crawl4AI Docker server (default: http://localhost:11235)"
    )
    args = parser.parse_args()
    dashboard = MonitoringDashboard(base_url=args.url)
    try:
        await dashboard.run_dashboard()
    finally:
        # Always release the HTTP connection pool, even on error/Ctrl-C.
        await dashboard.close()
# Script entry point: run the interactive dashboard until the user quits.
if __name__ == "__main__":
    asyncio.run(main())

View File

@@ -0,0 +1,88 @@
#!/usr/bin/env python3
"""
Quick test to verify monitoring endpoints are working
"""
import requests
import sys
BASE_URL = "http://localhost:11234"
def test_health():
    """Check that /monitoring/health answers with HTTP 200 and print the outcome."""
    try:
        resp = requests.get(f"{BASE_URL}/monitoring/health", timeout=5)
        if resp.status_code != 200:
            print(f"❌ Health check: FAILED (status {resp.status_code})")
            return False
        print("✅ Health check: PASSED")
        print(f" Response: {resp.json()}")
        return True
    except Exception as exc:
        print(f"❌ Health check: ERROR - {exc}")
        return False
def test_stats():
    """Exercise /monitoring/stats and report a pass/fail line plus key counters."""
    try:
        resp = requests.get(f"{BASE_URL}/monitoring/stats", timeout=5)
        if resp.status_code != 200:
            print(f"❌ Stats endpoint: FAILED (status {resp.status_code})")
            return False
        summary = resp.json()
        print("✅ Stats endpoint: PASSED")
        print(f" Active crawls: {summary.get('active_crawls', 'N/A')}")
        print(f" Total crawls: {summary.get('total_crawls', 'N/A')}")
        return True
    except Exception as exc:
        print(f"❌ Stats endpoint: ERROR - {exc}")
        return False
def test_url_stats():
    """Exercise /monitoring/stats/urls and report how many URLs are tracked."""
    try:
        resp = requests.get(f"{BASE_URL}/monitoring/stats/urls", timeout=5)
        if resp.status_code != 200:
            print(f"❌ URL stats endpoint: FAILED (status {resp.status_code})")
            return False
        print("✅ URL stats endpoint: PASSED")
        tracked = resp.json()
        print(f" URLs tracked: {len(tracked)}")
        return True
    except Exception as exc:
        print(f"❌ URL stats endpoint: ERROR - {exc}")
        return False
def main():
    """Run the quick endpoint checks in order and print a summary.

    Returns 0 when every check passed, 1 otherwise (used as exit code).
    """
    banner = "=" * 60
    print(banner)
    print("Monitoring Endpoints Quick Test")
    print(banner)
    print(f"\nTesting server at: {BASE_URL}")
    print("\nMake sure the server is running:")
    print(" cd deploy/docker && python server.py")
    print("\n" + "-" * 60 + "\n")
    checks = (test_health, test_stats, test_url_stats)
    outcomes = []
    for index, check in enumerate(checks):
        outcomes.append(check())
        # Blank line between checks, but not after the last one
        if index < len(checks) - 1:
            print()
    print("\n" + "=" * 60)
    passed = sum(outcomes)
    total = len(outcomes)
    if passed == total:
        print(f"✅ All tests passed! ({passed}/{total})")
        print("\nMonitoring endpoints are working correctly! 🎉")
        return 0
    print(f"❌ Some tests failed ({passed}/{total} passed)")
    print("\nPlease check the server logs for errors.")
    return 1
# Run the quick checks; exit code 0 on success, 1 on any failure.
if __name__ == "__main__":
    sys.exit(main())

View File

@@ -0,0 +1,522 @@
"""
Integration tests for monitoring and profiling endpoints.
Tests all monitoring endpoints including profiling sessions, statistics,
health checks, and real-time streaming.
"""
import asyncio
import json
import time
from typing import Dict, List
import pytest
from httpx import AsyncClient
# Base URL for the Docker API server under test (11235 is the documented
# default port of the Crawl4AI Docker server).
BASE_URL = "http://localhost:11235"
@pytest.fixture(scope="module")
def event_loop():
    """Provide one module-scoped event loop shared by all async tests."""
    policy = asyncio.get_event_loop_policy()
    new_loop = policy.new_event_loop()
    yield new_loop
    new_loop.close()
@pytest.fixture(scope="module")
async def client():
    """Yield a shared AsyncClient pointed at the Docker API server."""
    async with AsyncClient(base_url=BASE_URL, timeout=60.0) as http_client:
        yield http_client
class TestHealthEndpoint:
    """Tests for /monitoring/health endpoint."""

    @pytest.mark.asyncio
    async def test_health_check(self, client: AsyncClient):
        """The health endpoint reports a healthy server with a non-negative uptime."""
        resp = await client.get("/monitoring/health")
        assert resp.status_code == 200
        payload = resp.json()
        assert payload["status"] == "healthy"
        assert "uptime_seconds" in payload
        assert payload["uptime_seconds"] >= 0
class TestStatsEndpoints:
    """Tests for /monitoring/stats/* endpoints."""

    @pytest.mark.asyncio
    async def test_get_stats_empty(self, client: AsyncClient):
        """After a reset, the stats payload still carries every expected field."""
        # Start from a clean slate so counters are well-defined.
        await client.post("/monitoring/stats/reset")
        resp = await client.get("/monitoring/stats")
        assert resp.status_code == 200
        payload = resp.json()
        # Top-level crawl counters and aggregates.
        for field in (
            "active_crawls",
            "total_crawls",
            "successful_crawls",
            "failed_crawls",
            "success_rate",
            "avg_duration_ms",
            "total_bytes_processed",
            "system_stats",
        ):
            assert field in payload
        # Nested system resource snapshot.
        system = payload["system_stats"]
        for field in (
            "cpu_percent",
            "memory_percent",
            "memory_used_mb",
            "memory_available_mb",
            "disk_usage_percent",
            "active_processes",
        ):
            assert field in system

    @pytest.mark.asyncio
    async def test_stats_after_crawl(self, client: AsyncClient):
        """Counters move after a crawl and stay internally consistent."""
        await client.post("/monitoring/stats/reset")
        crawl_payload = {
            "urls": ["https://www.example.com"],
            "crawler_config": {
                "word_count_threshold": 10
            },
        }
        crawl_resp = await client.post("/crawl", json=crawl_payload)
        assert crawl_resp.status_code == 200
        stats_resp = await client.get("/monitoring/stats")
        assert stats_resp.status_code == 200
        stats = stats_resp.json()
        # Totals must add up and be non-negative.
        assert stats["total_crawls"] >= 1
        assert stats["successful_crawls"] >= 0
        assert stats["failed_crawls"] >= 0
        assert stats["total_crawls"] == stats["successful_crawls"] + stats["failed_crawls"]
        # Success rate must match the counter-derived percentage.
        if stats["total_crawls"] > 0:
            expected_rate = (stats["successful_crawls"] / stats["total_crawls"]) * 100
            assert abs(stats["success_rate"] - expected_rate) < 0.01

    @pytest.mark.asyncio
    async def test_stats_reset(self, client: AsyncClient):
        """Resetting statistics zeroes every counter and echoes the old values."""
        # Make sure at least one crawl has been recorded first.
        crawl_payload = {
            "urls": ["https://www.example.com"],
            "crawler_config": {"word_count_threshold": 10},
        }
        await client.post("/crawl", json=crawl_payload)
        reset_resp = await client.post("/monitoring/stats/reset")
        assert reset_resp.status_code == 200
        reset_body = reset_resp.json()
        assert reset_body["status"] == "reset"
        assert "previous_stats" in reset_body
        # All counters must read zero afterwards.
        stats_resp = await client.get("/monitoring/stats")
        stats = stats_resp.json()
        assert stats["total_crawls"] == 0
        assert stats["successful_crawls"] == 0
        assert stats["failed_crawls"] == 0
        assert stats["active_crawls"] == 0

    @pytest.mark.asyncio
    async def test_url_specific_stats(self, client: AsyncClient):
        """Per-URL statistics expose the expected fields for crawled URLs."""
        await client.post("/monitoring/stats/reset")
        crawl_payload = {
            "urls": ["https://www.example.com"],
            "crawler_config": {"word_count_threshold": 10},
        }
        await client.post("/crawl", json=crawl_payload)
        resp = await client.get("/monitoring/stats/urls")
        assert resp.status_code == 200
        url_stats = resp.json()
        assert isinstance(url_stats, list)
        if len(url_stats) > 0:
            first = url_stats[0]
            for field in (
                "url",
                "total_requests",
                "successful_requests",
                "failed_requests",
                "avg_duration_ms",
                "total_bytes_processed",
                "last_request_time",
            ):
                assert field in first
class TestStatsStreaming:
    """Tests for /monitoring/stats/stream SSE endpoint."""

    @pytest.mark.asyncio
    async def test_stats_stream_basic(self, client: AsyncClient):
        """The SSE stream emits well-formed statistics events."""
        collected = []
        async with client.stream("GET", "/monitoring/stats/stream") as resp:
            assert resp.status_code == 200
            assert "text/event-stream" in resp.headers.get("content-type", "")
            # Read lines until we have three "data: ..." events.
            async for raw_line in resp.aiter_lines():
                if not raw_line.startswith("data: "):
                    continue
                collected.append(json.loads(raw_line[6:]))  # strip "data: "
                if len(collected) >= 3:
                    break
        assert len(collected) >= 3
        # Every event carries the core counters plus system stats.
        for event in collected:
            assert "active_crawls" in event
            assert "total_crawls" in event
            assert "successful_crawls" in event
            assert "system_stats" in event

    @pytest.mark.asyncio
    async def test_stats_stream_during_crawl(self, client: AsyncClient):
        """The stream keeps producing events while a crawl is in flight."""
        captured = []

        async def drain_stream():
            # Collect up to five parsed SSE events, then stop reading.
            async with client.stream("GET", "/monitoring/stats/stream") as resp:
                async for raw_line in resp.aiter_lines():
                    if raw_line.startswith("data: "):
                        captured.append(json.loads(raw_line[6:]))
                        if len(captured) >= 5:
                            break

        consumer = asyncio.create_task(drain_stream())
        # Give the stream a moment to connect, then fire a crawl alongside it.
        await asyncio.sleep(1)
        crawl_payload = {
            "urls": ["https://www.example.com"],
            "crawler_config": {"word_count_threshold": 10},
        }
        asyncio.create_task(client.post("/crawl", json=crawl_payload))
        try:
            await asyncio.wait_for(consumer, timeout=15.0)
        except asyncio.TimeoutError:
            consumer.cancel()
        # Regardless of timing, at least one event must have arrived.
        assert len(captured) > 0
class TestProfilingEndpoints:
    """Tests for /monitoring/profile/* endpoints.

    Covers the full session lifecycle: list, start, fetch, completion,
    404 handling, delete, and bulk cleanup.
    """

    @pytest.mark.asyncio
    async def test_list_profiling_sessions_empty(self, client: AsyncClient):
        """Listing sessions always returns an object with a 'sessions' list."""
        response = await client.get("/monitoring/profile")
        assert response.status_code == 200
        data = response.json()
        assert "sessions" in data
        assert isinstance(data["sessions"], list)

    @pytest.mark.asyncio
    async def test_start_profiling_session(self, client: AsyncClient):
        """Starting a session returns its id, running status, and echoed URLs."""
        request_data = {
            "urls": ["https://www.example.com", "https://www.python.org"],
            "duration_seconds": 2,
            "crawler_config": {
                "word_count_threshold": 10
            }
        }
        response = await client.post("/monitoring/profile/start", json=request_data)
        assert response.status_code == 200
        data = response.json()
        assert "session_id" in data
        assert "status" in data
        assert data["status"] == "running"
        assert "started_at" in data
        assert "urls" in data
        assert len(data["urls"]) == 2
        # Fix: the original returned data["session_id"] here. Returning a
        # value from a pytest test triggers PytestReturnNotNoneWarning and
        # the value is never consumed, so the return was removed.

    @pytest.mark.asyncio
    async def test_get_profiling_session(self, client: AsyncClient):
        """A freshly started session can be retrieved by its id."""
        # Start a session
        request_data = {
            "urls": ["https://www.example.com"],
            "duration_seconds": 2,
            "crawler_config": {"word_count_threshold": 10}
        }
        start_response = await client.post("/monitoring/profile/start", json=request_data)
        session_id = start_response.json()["session_id"]
        # Get session immediately (may already have completed on a fast box)
        response = await client.get(f"/monitoring/profile/{session_id}")
        assert response.status_code == 200
        data = response.json()
        assert data["session_id"] == session_id
        assert data["status"] in ["running", "completed"]
        assert "started_at" in data
        assert "urls" in data

    @pytest.mark.asyncio
    async def test_profiling_session_completion(self, client: AsyncClient):
        """A short session completes and produces a full results payload."""
        # Start a short session
        request_data = {
            "urls": ["https://www.example.com"],
            "duration_seconds": 3,
            "crawler_config": {"word_count_threshold": 10}
        }
        start_response = await client.post("/monitoring/profile/start", json=request_data)
        session_id = start_response.json()["session_id"]
        # Wait past the session duration so it can finish
        await asyncio.sleep(5)
        # Get completed session
        response = await client.get(f"/monitoring/profile/{session_id}")
        assert response.status_code == 200
        data = response.json()
        assert data["status"] == "completed"
        assert "completed_at" in data
        assert "duration_seconds" in data
        assert "results" in data
        # Verify results structure
        results = data["results"]
        assert "total_requests" in results
        assert "successful_requests" in results
        assert "failed_requests" in results
        assert "avg_response_time_ms" in results
        assert "system_metrics" in results

    @pytest.mark.asyncio
    async def test_profiling_session_not_found(self, client: AsyncClient):
        """Retrieving a non-existent session id returns 404 with a detail."""
        response = await client.get("/monitoring/profile/nonexistent-id-12345")
        assert response.status_code == 404
        data = response.json()
        assert "detail" in data

    @pytest.mark.asyncio
    async def test_delete_profiling_session(self, client: AsyncClient):
        """A deleted session reports 'deleted' and is no longer retrievable."""
        # Start a session
        request_data = {
            "urls": ["https://www.example.com"],
            "duration_seconds": 1,
            "crawler_config": {"word_count_threshold": 10}
        }
        start_response = await client.post("/monitoring/profile/start", json=request_data)
        session_id = start_response.json()["session_id"]
        # Wait for completion before deleting
        await asyncio.sleep(2)
        # Delete session
        delete_response = await client.delete(f"/monitoring/profile/{session_id}")
        assert delete_response.status_code == 200
        data = delete_response.json()
        assert data["status"] == "deleted"
        assert data["session_id"] == session_id
        # Verify it's gone
        get_response = await client.get(f"/monitoring/profile/{session_id}")
        assert get_response.status_code == 404

    @pytest.mark.asyncio
    async def test_cleanup_old_sessions(self, client: AsyncClient):
        """Bulk cleanup removes completed sessions past the age threshold."""
        # Start a few short sessions (loop index intentionally unused)
        for _ in range(3):
            request_data = {
                "urls": ["https://www.example.com"],
                "duration_seconds": 1,
                "crawler_config": {"word_count_threshold": 10}
            }
            await client.post("/monitoring/profile/start", json=request_data)
        # Wait for completion
        await asyncio.sleep(2)
        # Cleanup sessions older than 0 seconds (all completed ones)
        cleanup_response = await client.post(
            "/monitoring/profile/cleanup",
            json={"max_age_seconds": 0}
        )
        assert cleanup_response.status_code == 200
        data = cleanup_response.json()
        assert "deleted_count" in data
        assert data["deleted_count"] >= 0

    @pytest.mark.asyncio
    async def test_list_sessions_after_operations(self, client: AsyncClient):
        """The session list reflects a newly started session's state."""
        # Start a session
        request_data = {
            "urls": ["https://www.example.com"],
            "duration_seconds": 5,
            "crawler_config": {"word_count_threshold": 10}
        }
        start_response = await client.post("/monitoring/profile/start", json=request_data)
        session_id = start_response.json()["session_id"]
        # List sessions
        list_response = await client.get("/monitoring/profile")
        assert list_response.status_code == 200
        data = list_response.json()
        # Should have at least one session
        sessions = data["sessions"]
        assert len(sessions) >= 1
        # Find our session and check its state
        our_session = next((s for s in sessions if s["session_id"] == session_id), None)
        assert our_session is not None
        assert our_session["status"] in ["running", "completed"]
class TestProfilingWithCrawlConfig:
    """Tests for profiling with various crawler configurations."""

    @pytest.mark.asyncio
    async def test_profiling_with_extraction_strategy(self, client: AsyncClient):
        """A session configured with an extraction strategy starts successfully."""
        payload = {
            "urls": ["https://www.example.com"],
            "duration_seconds": 2,
            "crawler_config": {
                "word_count_threshold": 10,
                "extraction_strategy": "NoExtractionStrategy",
            },
        }
        resp = await client.post("/monitoring/profile/start", json=payload)
        assert resp.status_code == 200
        assert resp.json()["status"] == "running"

    @pytest.mark.asyncio
    async def test_profiling_with_browser_config(self, client: AsyncClient):
        """A session with a custom browser configuration starts successfully."""
        payload = {
            "urls": ["https://www.example.com"],
            "duration_seconds": 2,
            "browser_config": {
                "headless": True,
                "verbose": False,
            },
            "crawler_config": {
                "word_count_threshold": 10,
            },
        }
        resp = await client.post("/monitoring/profile/start", json=payload)
        assert resp.status_code == 200
        assert resp.json()["status"] == "running"
class TestIntegrationScenarios:
    """Integration tests for real-world monitoring scenarios."""

    @pytest.mark.asyncio
    async def test_concurrent_crawls_and_monitoring(self, client: AsyncClient):
        """Statistics must account for several crawls fired concurrently."""
        # Start from a clean slate so the final count is meaningful.
        await client.post("/monitoring/stats/reset")

        target_urls = [
            "https://www.example.com",
            "https://www.python.org",
            "https://www.github.com",
        ]
        # Fire one /crawl request per URL and run them all at once; individual
        # failures are tolerated (return_exceptions=True) — only the aggregate
        # tracking count is asserted below.
        pending = [
            client.post(
                "/crawl",
                json={"urls": [u], "crawler_config": {"word_count_threshold": 10}},
            )
            for u in target_urls
        ]
        await asyncio.gather(*pending, return_exceptions=True)

        await asyncio.sleep(1)  # give tracking time to update
        stats = (await client.get("/monitoring/stats")).json()
        assert stats["total_crawls"] >= len(target_urls)

    @pytest.mark.asyncio
    async def test_profiling_and_stats_correlation(self, client: AsyncClient):
        """Aggregate stats cover at least the requests made by a profiling run."""
        await client.post("/monitoring/stats/reset")

        profile_payload = {
            "urls": ["https://www.example.com"],
            "duration_seconds": 3,
            "crawler_config": {"word_count_threshold": 10},
        }
        started = await client.post("/monitoring/profile/start", json=profile_payload)
        sid = started.json()["session_id"]

        # Let the 3-second session run to completion before reading results.
        await asyncio.sleep(5)

        profile = (await client.get(f"/monitoring/profile/{sid}")).json()
        stats = (await client.get("/monitoring/stats")).json()

        # Every request made during profiling should be reflected in the stats.
        assert stats["total_crawls"] >= profile["results"]["total_requests"]
if __name__ == "__main__":
    # Propagate pytest's exit status so CI/scripts can detect failures;
    # previously the return value was discarded and the script always exited 0.
    raise SystemExit(pytest.main([__file__, "-v", "-s"]))