feat: implement advanced rate limiter with circuit breaker and metric… (#31)

betmoar · web-flow · commit 290ffe8a025d · 2025-09-16T15:17:48.000+02:00
This pull request introduces significant improvements to the rate limiting system, configuration, and utility imports for the track identification service. The main focus is on making rate limiting more robust and configurable, tightening default limits, and updating legacy support. Below are the most important changes grouped by theme:

Rate Limiting System Overhaul:

Introduced a new RateLimiter class in tracklistify/utils/rate_limiter.py that supports provider-specific limits, circuit breaker functionality, metrics collection, and asynchronous concurrency control. This replaces the previous simpler implementation and adds support for registering providers, alert callbacks, and global rate limiter access.
Added a global singleton accessor get_global_rate_limiter and updated legacy support with get_simple_rate_limiter for backward compatibility. The legacy function get_rate_limiter was removed.
Configuration Updates:

Added global rate limiting configuration options (max_requests_per_minute, max_concurrent_requests) to the TrackIdentificationConfig class in tracklistify/config/base.py, with new defaults set to 25 requests per minute and 2 concurrent requests.
Updated .env.example to reflect stricter default values: minimum confidence threshold increased to 0.8, max requests per minute reduced to 25, and max concurrent requests reduced to 2. [1] [2]
Utility Imports and Refactoring:

Updated tracklistify/utils/__init__.py to use get_simple_rate_limiter instead of the old get_rate_limiter, ensuring all imports match the new rate limiting implementation.
These changes collectively enhance the reliability and configurability of rate limiting, improve error handling with circuit breakers, and ensure the codebase uses the latest utility interfaces.
diff --git a/.env.example b/.env.example
@@ -5,13 +5,13 @@
 TRACKLISTIFY_OUTPUT_DIR=.tracklistify/output       # Directory for output files
 TRACKLISTIFY_CACHE_DIR=.tracklistify/cache         # Directory for caching processed audio segments
 TRACKLISTIFY_TEMP_DIR=.tracklistify/temp           # Directory for temporary files
-TRACKLISTIFY_LOG_DIR=.tracklistify/log             # Directory for log files 
+TRACKLISTIFY_LOG_DIR=.tracklistify/log             # Directory for log files
 TRACKLISTIFY_VERBOSE=false                         # Enable verbose logging
 TRACKLISTIFY_DEBUG=false                           # Enable debug mode
 
 # Track Identification Settings
 TRACKLISTIFY_SEGMENT_LENGTH=60                      # Length of audio segments in seconds (10 to 300)
-TRACKLISTIFY_MIN_CONFIDENCE=0.0                     # Minimum confidence threshold (0.0 to 1.0)
+TRACKLISTIFY_MIN_CONFIDENCE=0.8                     # Minimum confidence threshold (0.0 to 1.0)
 TRACKLISTIFY_TIME_THRESHOLD=30.0                    # Time threshold between tracks in seconds (0.0 to 300.0)
 TRACKLISTIFY_MAX_DUPLICATES=2                       # Maximum number of duplicate tracks (0 to 10)
 TRACKLISTIFY_OVERLAP_DURATION=10                    # Overlap duration between segments in seconds (0 to 30)
@@ -50,8 +50,8 @@ TRACKLISTIFY_RETRY_MAX_DELAY=30.0                   # Maximum retry delay (1.0 t
 
 # Rate Limiting Settings
 TRACKLISTIFY_RATE_LIMIT_ENABLED=true                # Enable rate limiting
-TRACKLISTIFY_MAX_REQUESTS_PER_MINUTE=60             # Global maximum requests per minute (1 to 1000)
-TRACKLISTIFY_MAX_CONCURRENT_REQUESTS=10             # Global maximum concurrent requests (1 to 100)
+TRACKLISTIFY_MAX_REQUESTS_PER_MINUTE=25             # Global maximum requests per minute (1 to 1000)
+TRACKLISTIFY_MAX_CONCURRENT_REQUESTS=2             # Global maximum concurrent requests (1 to 100)
 
 # Circuit Breaker Settings
 TRACKLISTIFY_CIRCUIT_BREAKER_ENABLED=true          # Enable circuit breaker
diff --git a/tracklistify/config/base.py b/tracklistify/config/base.py
@@ -109,6 +109,11 @@ class TrackIdentificationConfig(BaseConfig):
     primary_provider: str = field(default="shazam")
     fallback_enabled: bool = field(default=True)
     fallback_providers: List[str] = field(default_factory=list)
+
+    # Global rate limiting settings
+    max_requests_per_minute: int = field(default=25)
+    max_concurrent_requests: int = field(default=2)
+
     cache_enabled: bool = field(default=True)
     cache_ttl: int = field(default=86400)
     cache_max_size: int = field(default=1000000)
diff --git a/tracklistify/utils/__init__.py b/tracklistify/utils/__init__.py
@@ -5,16 +5,16 @@
 """
 
 from .decorators import memoize
+from .identification import IdentificationManager
 from .logger import get_logger, set_logger
-from .rate_limiter import get_rate_limiter
+from .rate_limiter import get_simple_rate_limiter
 from .validation import validate_input
-from .identification import IdentificationManager
 
 __all__ = [
     "memoize",
     "get_logger",
     "set_logger",
-    "get_rate_limiter",
+    "get_simple_rate_limiter",
     "validate_input",
     "IdentificationManager",
 ]
diff --git a/tracklistify/utils/rate_limiter.py b/tracklistify/utils/rate_limiter.py
@@ -3,13 +3,19 @@
 """
 
 # Standard library imports
+import asyncio
 import time
 from dataclasses import dataclass, field
 from enum import Enum
 from threading import Lock, Semaphore
-from typing import List, Optional, Tuple
+from typing import Any, Callable, Dict, List, Optional, Tuple
 
 # Local/package imports
+from ..config import get_config
+
+# Rate limiting constants
+# 1ms threshold to detect actual rate limit
+RATE_LIMIT_DETECTION_THRESHOLD_SECONDS = 0.001
 
 
 class CircuitState(Enum):
@@ -37,21 +43,234 @@ class RateLimitMetrics:
 class ProviderLimits:
     """Rate limits for a specific provider."""
 
-    max_requests_per_minute: int = 60
-    max_concurrent_requests: int = 10
-    tokens: int = field(default_factory=lambda: 60)
+    max_requests_per_minute: int = 25  # Default fallback (matches Shazam default)
+    max_concurrent_requests: int = 1  # Default fallback (matches Shazam default)
+    tokens: int = field(init=False)
     last_update: float = field(default_factory=time.time)
-    semaphore: Semaphore = field(default_factory=lambda: Semaphore(10))
+    semaphore: asyncio.Semaphore = field(init=False)
     lock: Lock = field(default_factory=Lock)
     metrics: RateLimitMetrics = field(default_factory=RateLimitMetrics)
     circuit_state: CircuitState = field(default=CircuitState.CLOSED)
     circuit_open_time: Optional[float] = None
     consecutive_failures: int = 0
 
+    def __post_init__(self):
+        self.tokens = self.max_requests_per_minute
+        self.semaphore = asyncio.Semaphore(self.max_concurrent_requests)
+
 
-@dataclass
 class RateLimiter:
-    """Rate limiter implementation."""
+    """Advanced rate limiter with provider management, circuit breaker, metrics."""
+
+    def __init__(self, config=None):
+        self._provider_limits: Dict[Any, ProviderLimits] = {}
+        self._alert_callbacks: List[Callable[[str], None]] = []
+        # Use provided config or get global config
+        self._config = config or get_config()
+
+    def register_provider(
+        self,
+        provider: Any,
+        max_requests_per_minute: int = None,
+        max_concurrent_requests: int = None,
+    ):
+        """Register a provider with specific rate limits."""
+        # Use provided values, or fall back to config values based on provider
+        if max_requests_per_minute is None or max_concurrent_requests is None:
+            provider_str = str(provider).lower()
+
+            # Get provider-specific limits from config
+            if provider_str == "shazam":
+                rpm = max_requests_per_minute or getattr(
+                    self._config, "shazam_max_rpm", 25
+                )
+                concurrent = max_concurrent_requests or getattr(
+                    self._config, "shazam_max_concurrent", 1
+                )
+            elif provider_str == "acrcloud":
+                rpm = max_requests_per_minute or getattr(
+                    self._config, "acrcloud_max_rpm", 30
+                )
+                concurrent = max_concurrent_requests or getattr(
+                    self._config, "acrcloud_max_concurrent", 5
+                )
+            elif provider_str == "spotify":
+                rpm = max_requests_per_minute or getattr(
+                    self._config, "spotify_max_rpm", 120
+                )
+                concurrent = max_concurrent_requests or getattr(
+                    self._config, "spotify_max_concurrent", 20
+                )
+            else:
+                # Fall back to global config or defaults
+                rpm = max_requests_per_minute or getattr(
+                    self._config, "max_requests_per_minute", 25
+                )
+                concurrent = max_concurrent_requests or getattr(
+                    self._config, "max_concurrent_requests", 2
+                )
+        else:
+            rpm = max_requests_per_minute
+            concurrent = max_concurrent_requests
+
+        self._provider_limits[provider] = ProviderLimits(
+            max_requests_per_minute=rpm,
+            max_concurrent_requests=concurrent,
+        )
+
+    def register_alert_callback(self, callback: Callable[[str], None]):
+        """Register a callback for rate limiting alerts."""
+        self._alert_callbacks.append(callback)
+
+    def _send_alert(self, message: str):
+        """Send alert to all registered callbacks."""
+        for callback in self._alert_callbacks:
+            callback(message)
+
+    async def acquire(self, provider: Any, timeout: float = 30.0) -> bool:
+        """Acquire permission to make a request."""
+        if provider not in self._provider_limits:
+            self.register_provider(provider)
+
+        limits = self._provider_limits[provider]
+
+        # Check circuit breaker first (don't count rejected requests)
+        circuit_breaker_enabled = getattr(self._config, "circuit_breaker_enabled", True)
+        if circuit_breaker_enabled and limits.circuit_state == CircuitState.OPEN:
+            circuit_reset_timeout = getattr(
+                self._config, "circuit_breaker_reset_timeout", 60.0
+            )
+            if (
+                limits.circuit_open_time
+                and time.time() - limits.circuit_open_time > circuit_reset_timeout
+            ):
+                limits.circuit_state = CircuitState.HALF_OPEN
+            else:
+                return False
+
+        # Try to acquire semaphore for concurrent requests
+        try:
+            # Always attempt to acquire the semaphore with a timeout
+            start_time = time.time()
+            await asyncio.wait_for(limits.semaphore.acquire(), timeout=timeout)
+            wait_time = time.time() - start_time
+            limits.metrics.total_wait_time += wait_time
+            # Note: Don't record semaphore waits as rate limit windows
+            # This is concurrency control, not rate limiting
+        except asyncio.TimeoutError:
+            return False
+
+        # At this point, we have semaphore access and will process the request
+        limits.metrics.total_requests += 1
+
+        # Check if rate limiting is enabled
+        rate_limit_enabled = getattr(self._config, "rate_limit_enabled", True)
+        if not rate_limit_enabled:
+            return True
+
+        # Check rate limiting tokens
+        token_wait_start = time.time()
+
+        while time.time() - token_wait_start < timeout:
+            with limits.lock:
+                self._refill_tokens(limits)
+                if limits.tokens > 0:
+                    limits.tokens -= 1
+                    # Record metrics only if we had to wait for tokens (rate limiting)
+                    wait_time = time.time() - token_wait_start
+                    if wait_time >= RATE_LIMIT_DETECTION_THRESHOLD_SECONDS:
+                        # Count successful requests that were rate-limited
+                        limits.metrics.rate_limited_requests += 1
+                        limits.metrics.last_rate_limit = time.time()
+                        limits.metrics.rate_limit_windows.append(
+                            (token_wait_start, time.time())
+                        )
+                    return True
+
+            # Wait a short time before checking again
+            await asyncio.sleep(0.01)
+
+        # Timeout exceeded - this is a rate limiting failure
+        # Record the window and update last_rate_limit but don't increment
+        # rate_limited_requests (that's only for successful requests that waited)
+        limits.metrics.last_rate_limit = time.time()
+        limits.metrics.rate_limit_windows.append((token_wait_start, time.time()))
+
+        limits.semaphore.release()
+        return False
+
+    def release(self, provider: Any):
+        """Release a concurrent request slot."""
+        if provider in self._provider_limits:
+            limits = self._provider_limits[provider]
+            limits.semaphore.release()
+
+    def _refill_tokens(self, limits: ProviderLimits):
+        """Refill rate limiting tokens."""
+        now = time.time()
+        elapsed = now - limits.last_update
+        if elapsed >= 1.0:  # Refill every second
+            tokens_to_add = int(elapsed * (limits.max_requests_per_minute / 60))
+            if tokens_to_add > 0:
+                limits.tokens = min(
+                    limits.max_requests_per_minute, limits.tokens + tokens_to_add
+                )
+                limits.last_update = now
+
+    def _update_circuit_breaker(self, provider: Any, success: bool):
+        """Update circuit breaker state based on request success."""
+        if provider not in self._provider_limits:
+            return
+
+        limits = self._provider_limits[provider]
+        circuit_breaker_enabled = getattr(self._config, "circuit_breaker_enabled", True)
+
+        if not circuit_breaker_enabled:
+            return
+
+        if success:
+            limits.consecutive_failures = 0
+            if limits.circuit_state == CircuitState.HALF_OPEN:
+                limits.circuit_state = CircuitState.CLOSED
+        else:
+            limits.consecutive_failures += 1
+            circuit_threshold = getattr(self._config, "circuit_breaker_threshold", 5)
+            if (
+                limits.consecutive_failures >= circuit_threshold
+                and limits.circuit_state == CircuitState.CLOSED
+            ):
+                limits.circuit_state = CircuitState.OPEN
+                limits.circuit_open_time = time.time()
+                limits.metrics.circuit_trips += 1
+                limits.metrics.last_circuit_trip = time.time()
+                self._send_alert(
+                    message=f"Circuit breaker opened for provider {provider} "
+                    f"after {limits.consecutive_failures} failures"
+                )
+
+    def get_metrics(self, provider: Any) -> Dict[str, Any]:
+        """Get metrics for a provider."""
+        if provider not in self._provider_limits:
+            return {}
+
+        limits = self._provider_limits[provider]
+        return {
+            "total_requests": limits.metrics.total_requests,
+            "rate_limited_requests": limits.metrics.rate_limited_requests,
+            "total_wait_time": limits.metrics.total_wait_time,
+            "last_rate_limit": limits.metrics.last_rate_limit,
+            "rate_limit_windows": limits.metrics.rate_limit_windows,
+            "circuit_trips": limits.metrics.circuit_trips,
+            "last_circuit_trip": limits.metrics.last_circuit_trip,
+            "circuit_state": limits.circuit_state.value,
+            "current_tokens": limits.tokens,
+        }
+
+
+# Legacy support for the simple RateLimiter
+@dataclass
+class SimpleLimiter:
+    """Simple rate limiter implementation."""
 
     max_requests_per_minute: int
     max_concurrent_requests: int
@@ -84,20 +303,36 @@ def _refill(self):
 
 
 # Singleton instance
-_rate_limiter_instance = None
+_global_rate_limiter = None
 
 
-def get_rate_limiter(provider: str, config) -> RateLimiter:
-    """Get rate limiter for the specified provider."""
+def get_global_rate_limiter() -> RateLimiter:
+    """Get the global rate limiter instance."""
+    global _global_rate_limiter
+    if _global_rate_limiter is None:
+        _global_rate_limiter = RateLimiter()
+    return _global_rate_limiter
+
+
+def get_simple_rate_limiter(provider: str, config=None) -> SimpleLimiter:
+    """Get legacy rate limiter for the specified provider."""
+    if config is None:
+        config = get_config()
+
     if provider == "shazam":
-        return RateLimiter(
+        return SimpleLimiter(
             max_requests_per_minute=config.shazam_max_rpm,
             max_concurrent_requests=config.shazam_max_concurrent,
         )
     elif provider == "acrcloud":
-        return RateLimiter(
+        return SimpleLimiter(
             max_requests_per_minute=config.acrcloud_max_rpm,
             max_concurrent_requests=config.acrcloud_max_concurrent,
         )
+    elif provider == "spotify":
+        return SimpleLimiter(
+            max_requests_per_minute=getattr(config, "spotify_max_rpm", 120),
+            max_concurrent_requests=getattr(config, "spotify_max_concurrent", 20),
+        )
     else:
         raise ValueError(f"Unknown provider: {provider}")