deepeval/config/settings.py: 7 additions & 1 deletion
@@ -51,7 +51,6 @@
)
from deepeval.constants import SUPPORTED_PROVIDER_SLUGS, slugify


logger = logging.getLogger(__name__)
_SAVE_RE = re.compile(r"^(?P<scheme>dotenv)(?::(?P<path>.+))?$")

Expand Down Expand Up @@ -534,6 +533,12 @@ def __setattr__(self, name: str, value):
    GROK_COST_PER_OUTPUT_TOKEN: Optional[float] = Field(
        None, description="Grok output token cost (used for cost reporting)."
    )
    # Groq
    USE_GROQ_MODEL: Optional[bool] = Field(
        None, description="Select Groq as the active LLM provider."
    )
    GROQ_API_KEY: Optional[SecretStr] = Field(None, description="Groq API key.")
    GROQ_MODEL_NAME: Optional[str] = Field(None, description="Groq model name.")
    # LiteLLM
    USE_LITELLM: Optional[bool] = Field(
        None, description="Select LiteLLM as the active LLM provider."
@@ -1014,6 +1019,7 @@ def DEEPEVAL_TASK_GATHER_BUFFER_SECONDS(self) -> float:
"USE_GEMINI_MODEL",
"USE_MOONSHOT_MODEL",
"USE_GROK_MODEL",
"USE_GROQ_MODEL",
"USE_DEEPSEEK_MODEL",
"USE_LITELLM",
"USE_AZURE_OPENAI_EMBEDDING",
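For context, a minimal sketch of how the new Groq settings could be exercised, assuming these fields are read from the environment the same way the other USE_&lt;PROVIDER&gt;_MODEL flags are (the key value is a placeholder):

```python
import os

# Assumption: env vars map 1:1 onto the Settings fields added above.
os.environ["USE_GROQ_MODEL"] = "1"
os.environ["GROQ_API_KEY"] = "gsk_..."  # placeholder, not a real key
os.environ["GROQ_MODEL_NAME"] = "llama3-70b-8192"

from deepeval.config.settings import get_settings

settings = get_settings()
print(settings.USE_GROQ_MODEL, settings.GROQ_MODEL_NAME)
```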
deepeval/constants.py: 1 addition & 0 deletions
@@ -37,6 +37,7 @@ class ProviderSlug(str, Enum):
LOCAL = "local"
OLLAMA = "ollama"
OPENROUTER = "openrouter"
GROQ = "groq"


def slugify(value: Union[str, ProviderSlug]) -> str:
2 changes: 2 additions & 0 deletions deepeval/models/__init__.py
Original file line number Diff line number Diff line change
Expand Up @@ -14,6 +14,7 @@
    LiteLLMModel,
    KimiModel,
    GrokModel,
    GroqModel,
    DeepSeekModel,
    PortkeyModel,
    OpenRouterModel,
@@ -39,6 +40,7 @@
"LiteLLMModel",
"KimiModel",
"GrokModel",
"GroqModel",
"DeepSeekModel",
"OpenAIEmbeddingModel",
"AzureOpenAIEmbeddingModel",
deepeval/models/llms/__init__.py: 2 additions & 0 deletions
@@ -11,6 +11,7 @@
from .deepseek_model import DeepSeekModel
from .portkey_model import PortkeyModel
from .openrouter_model import OpenRouterModel
from .groq_model import GroqModel

__all__ = [
"AzureOpenAIModel",
@@ -26,4 +27,5 @@
"DeepSeekModel",
"PortkeyModel",
"OpenRouterModel",
"GroqModel",
]
deepeval/models/llms/constants.py: 29 additions & 1 deletion
@@ -2,7 +2,6 @@

from deepeval.models.base_model import DeepEvalModelData


DEFAULT_GPT_MODEL = "gpt-4.1"
# OpenRouter uses provider/model format (e.g., "openai/gpt-4", "anthropic/claude-3-opus")
# DeepEval does not validate OpenRouter model strings.
@@ -2053,3 +2052,32 @@ def make_model_data(**kwargs: Any) -> ModelDataFactory:
        ),
    }
)

GROQ_MODELS_DATA = ModelDataRegistry(
    {
        "llama3-8b-8192": make_model_data(
            supports_log_probs=False,
            supports_multimodal=False,
            supports_structured_outputs=True,
            supports_json=True,
            input_price=0.05 / 1e6,
            output_price=0.08 / 1e6,
        ),
        "llama3-70b-8192": make_model_data(
            supports_log_probs=False,
            supports_multimodal=False,
            supports_structured_outputs=True,
            supports_json=True,
            input_price=0.59 / 1e6,
            output_price=0.79 / 1e6,
        ),
        "mixtral-8x7b-32768": make_model_data(
            supports_log_probs=False,
            supports_multimodal=False,
            supports_structured_outputs=True,
            supports_json=True,
            input_price=0.24 / 1e6,
            output_price=0.24 / 1e6,
        ),
    }
)
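For reference, the registered per-token prices imply cost arithmetic like the following sketch (the token counts are invented, and the actual cost-reporting hook is outside this diff):

```python
# Hypothetical cost estimate for llama3-70b-8192 using the prices above.
input_price = 0.59 / 1e6   # USD per input token
output_price = 0.79 / 1e6  # USD per output token

prompt_tokens, completion_tokens = 1_200, 300  # example usage numbers
cost = prompt_tokens * input_price + completion_tokens * output_price
print(f"${cost:.6f}")  # -> $0.000945
```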
deepeval/models/llms/groq_model.py: 221 additions & 0 deletions (new file)
@@ -0,0 +1,221 @@
import os
from typing import TYPE_CHECKING, Optional, Tuple, Type, Union

from pydantic import BaseModel, SecretStr

from deepeval.errors import DeepEvalError
from deepeval.config.settings import get_settings
from deepeval.models.utils import require_secret_api_key
from deepeval.models.retry_policy import create_retry_decorator
from deepeval.utils import require_dependency
from deepeval.models.base_model import DeepEvalBaseLLM
from deepeval.constants import ProviderSlug
from deepeval.models.llms.constants import GROQ_MODELS_DATA, make_model_data

if TYPE_CHECKING:
    from groq import Groq, AsyncGroq

# -----------------------------------------------------------------------------
# Constants & Defaults
# -----------------------------------------------------------------------------
default_groq_model = "llama3-8b-8192"

# ProviderSlug.GROQ is added in deepeval/constants.py as part of this PR.
retry_groq = create_retry_decorator(ProviderSlug.GROQ)


# -----------------------------------------------------------------------------
# Model Implementation
# -----------------------------------------------------------------------------
class GroqModel(DeepEvalBaseLLM):
    """LLM wrapper for Groq's LPU-backed inference API, for high-speed evaluation.

    This class provides native integration with Groq's API, supporting both
    plain-text generation and structured JSON outputs validated against
    Pydantic schemas.

    Attributes:
        model: Name of the Groq model to use (e.g., 'llama3-8b-8192',
            'mixtral-8x7b-32768').
        api_key: Groq API key for authentication.
        temperature: Sampling temperature for generation.

    Example:
        ```python
        from deepeval.models import GroqModel

        # Initialize the model
        model = GroqModel(
            model="llama3-70b-8192",
            api_key="gsk_...",
        )

        # Generate text (returns a (response, cost) tuple)
        response, cost = model.generate("What is the capital of France?")
        ```
    """

    def __init__(
        self,
        model: Optional[str] = None,
        api_key: Optional[Union[str, SecretStr]] = None,
        temperature: Optional[float] = None,
        **kwargs,
    ):
        settings = get_settings()
        self.model_name = model or default_groq_model

        # API key resolution order: explicit param -> settings -> environment.
        if api_key is not None:
            self.api_key = (
                api_key
                if isinstance(api_key, SecretStr)
                else SecretStr(api_key)
            )
        else:
            env_key = getattr(settings, "GROQ_API_KEY", None) or os.environ.get(
                "GROQ_API_KEY"
            )
            self.api_key = (
                env_key
                if isinstance(env_key, SecretStr)
                else (SecretStr(env_key) if env_key else None)
            )

        # Temperature handling
        if temperature is not None:
            self.temperature = float(temperature)
        elif settings.TEMPERATURE is not None:
            self.temperature = settings.TEMPERATURE
        else:
            self.temperature = 0.0

        if self.temperature < 0:
            raise DeepEvalError("Temperature must be >= 0.")

        self.kwargs = kwargs
        # Unknown model names fall back to permissive defaults with no pricing.
        self.model_data = GROQ_MODELS_DATA.get(
            self.model_name,
            make_model_data(
                supports_log_probs=False,
                supports_multimodal=False,
                supports_structured_outputs=True,
                supports_json=True,
                input_price=None,
                output_price=None,
            ),
        )
        self._module = self._require_module()

        # Clients are created lazily and cached for reuse.
        self._client: Optional["Groq"] = None
        self._async_client: Optional["AsyncGroq"] = None
        super().__init__(self.model_name)

    def _require_module(self):
        """Lazily imports the groq library so non-Groq users don't need it installed."""
        return require_dependency(
            "groq",
            provider_label="GroqModel",
            install_hint="Install it with `pip install groq`.",
        )

    def load_model(self, async_mode: bool = False):
        """Initializes and caches the Groq client."""
        if async_mode:
            if self._async_client is not None:
                return self._async_client
        else:
            if self._client is not None:
                return self._client

        api_key = require_secret_api_key(
            self.api_key,
            provider_label="Groq",
            env_var_name="GROQ_API_KEY",
            param_hint="`api_key` to GroqModel(...)",
        )

        if hasattr(api_key, "get_secret_value"):
            api_key = api_key.get_secret_value()

        if async_mode:
            self._async_client = self._module.AsyncGroq(
                api_key=api_key, **self.kwargs
            )
            return self._async_client
        else:
            self._client = self._module.Groq(api_key=api_key, **self.kwargs)
            return self._client

    # -------------------------------------------------------------------------
    # Generation Methods
    # -------------------------------------------------------------------------
    @retry_groq
    def generate(
        self, prompt: str, schema: Optional[Type[BaseModel]] = None
    ) -> Tuple[Union[str, BaseModel], float]:
        """Generates text or structured output from a prompt."""
        client = self.load_model(async_mode=False)

        chat_args = {
            "model": self.model_name,
            "messages": [{"role": "user", "content": prompt}],
            "temperature": self.temperature,
        }

        if schema is not None:
            # Groq's json_object mode (like OpenAI's) expects the prompt itself
            # to instruct the model to produce JSON.
            chat_args["response_format"] = {"type": "json_object"}

        response = client.chat.completions.create(**chat_args)
        content = response.choices[0].message.content

        if schema is not None:
            return schema.model_validate_json(content), 0.0

        return content, 0.0

    @retry_groq
    async def a_generate(
        self, prompt: str, schema: Optional[Type[BaseModel]] = None
    ) -> Tuple[Union[str, BaseModel], float]:
        """Asynchronously generates text or structured output from a prompt."""
        async_client = self.load_model(async_mode=True)

        chat_args = {
            "model": self.model_name,
            "messages": [{"role": "user", "content": prompt}],
            "temperature": self.temperature,
        }

        if schema is not None:
            chat_args["response_format"] = {"type": "json_object"}

        response = await async_client.chat.completions.create(**chat_args)
        content = response.choices[0].message.content

        if schema is not None:
            return schema.model_validate_json(content), 0.0

        return content, 0.0

    # -------------------------------------------------------------------------
    # Capabilities
    # -------------------------------------------------------------------------

    def supports_log_probs(self) -> Union[bool, None]:
        return self.model_data.supports_log_probs

    def supports_temperature(self) -> Union[bool, None]:
        # getattr fallback: supports_temperature is not set by make_model_data.
        return getattr(self.model_data, "supports_temperature", True)

    def supports_multimodal(self) -> Union[bool, None]:
        return self.model_data.supports_multimodal

    def supports_structured_outputs(self) -> Union[bool, None]:
        return self.model_data.supports_structured_outputs

    def supports_json_mode(self) -> Union[bool, None]:
        # Note: the field on make_model_data is named 'supports_json'.
        return self.model_data.supports_json

    def get_model_name(self) -> str:
        return f"{self.name} (Groq)"

Review thread on `generate` / `a_generate`:

**Collaborator:** For the `generate` and `a_generate` methods, if you look at the other model implementations, we have a way to support images inside them as well; an example is here: https://github.com/confident-ai/deepeval/blob/main/deepeval/models/llms/openai_model.py#L154

I've looked through the official docs to see how to pass images: https://console.groq.com/docs/vision#how-to-pass-images-from-urls-as-input

The API is mostly similar to OpenAI's, so the example above should help you implement this. Don't worry about supporting images if it's too hard; you can safely ignore this comment :)

**Author:** Thank you for sharing the Groq vision docs! I will safely ignore this one for now to keep the initial integration focused and stable, but we can definitely add multimodal support in a future PR.
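Finally, an end-to-end sketch of the structured-output path this PR adds (placeholder API key; note the prompt mentions JSON, which Groq's json_object mode expects):

```python
from pydantic import BaseModel

from deepeval.models import GroqModel

class Capital(BaseModel):
    country: str
    city: str

model = GroqModel(model="llama3-70b-8192", api_key="gsk_...")  # placeholder key

# generate() returns a (result, cost) tuple; with a schema, the raw JSON
# response is validated into the Pydantic model.
result, cost = model.generate(
    "Return a JSON object with keys 'country' and 'city' for France.",
    schema=Capital,
)
print(result.city)  # Paris
```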