MMIRAGE/src/mmirage/config/batch_provider.py at 71f9d6f355b4fc21d2a6b251432ad2bc2f83860f · EPFLiGHT/MMIRAGE · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
"""Provider-agnostic batch configuration contracts.

This module defines the shared configuration shape used by any future batch
submission provider (OpenAI, Anthropic, etc.).
"""

from dataclasses import dataclass, field
from typing import Any, Dict, Literal, Optional


@dataclass
class BatchRetryPolicy:
    """Retry behavior used by provider-neutral batch submission orchestration.

    Attributes:
        max_attempts: Maximum number of submission attempts for retryable errors.
        initial_backoff_seconds: Delay before the first retry attempt.
        backoff_multiplier: Multiplicative factor for subsequent retry delays.
    """

    max_attempts: int = 3
    initial_backoff_seconds: float = 2.0
    backoff_multiplier: float = 2.0

    def __post_init__(self) -> None:
        if self.max_attempts < 1:
            raise ValueError("max_attempts must be >= 1")
        if self.initial_backoff_seconds < 0:
            raise ValueError("initial_backoff_seconds must be >= 0")
        if self.backoff_multiplier < 1:
            raise ValueError("backoff_multiplier must be >= 1")


@dataclass
class BatchProviderConfig:
    """Shared contract for provider-specific batch configuration.

    Concrete provider configs should inherit from this dataclass and extend it
    with provider-specific settings. The fields here are intentionally provider
    neutral so chunking/submission orchestration can run through one typed path.

    Attributes:
        provider: Provider identifier (for example, "openai" or "anthropic").
        enabled: Whether batch submission mode is enabled.
        max_chunk_bytes: Maximum serialized request bytes per chunk.
            Defaults to 50 MB.
        max_requests_per_chunk: Optional hard cap on number of requests in a
            chunk. If None, no request-count cap is enforced.
        metadata_output_path: Path where submission metadata artifacts are saved.
        retry_policy: Retry policy used by the shared batch layer.
        oversized_request_policy: Handling policy when a single request exceeds
            ``max_chunk_bytes``. ``isolate`` creates a dedicated oversized
            chunk, while ``reject`` fails fast.
        extras: Provider-specific knobs that do not belong in the shared fields.
        credentials: Provider credentials required to submit chunks.
    """

    provider: str
    enabled: bool = True
    max_chunk_bytes: int = 50 * 1024 * 1024
    max_requests_per_chunk: Optional[int] = None
    metadata_output_path: str = ""
    retry_policy: BatchRetryPolicy = field(default_factory=BatchRetryPolicy)
    oversized_request_policy: Literal["isolate", "reject"] = "isolate"
    extras: Dict[str, Any] = field(default_factory=dict)
    credentials: Dict[str, str] = field(default_factory=dict)

    def __post_init__(self) -> None:
        self.provider = self.provider.strip().lower()

        if not self.provider:
            raise ValueError("provider must be a non-empty string")
        if self.max_chunk_bytes < 1:
            raise ValueError("max_chunk_bytes must be >= 1")
        if self.max_requests_per_chunk is not None and self.max_requests_per_chunk < 1:
            raise ValueError("max_requests_per_chunk must be >= 1 when provided")
        if self.oversized_request_policy not in {"isolate", "reject"}:
            raise ValueError("oversized_request_policy must be either 'isolate' or 'reject'")