feat: add gemini-3-flash-preview to cost registry (#5424)

replicas-connector[bot] · connortbot · web-flow · commit 877298823c11 · 2025-12-17T16:31:44.000-08:00
* feat: add gemini-3-flash-preview to cost registry

Add pricing for gemini-3-flash-preview model with support for Google AI
Studio, Vertex AI, and OpenRouter providers.

Pricing:
- Input: $0.50/1M tokens
- Cached input: $0.05/1M tokens (10% of input)
- Output: $3/1M tokens
- Audio input: $1/1M tokens
- Cached audio input: $0.10/1M tokens (10% of audio input)

* feat: add gemini-3-flash-preview to legacy cost registry

- Add model pricing to legacy providers/google/index.ts
- Update test snapshots to include new model
- Fix jest config to work without preset
- Add jest dependencies to root package.json

Pricing:
- Input: $0.50/1M tokens
- Cached input: $0.05/1M tokens
- Output: $3/1M tokens

* chore: revert changes to yarn.lock, package.json, and jest.config.ts

* fix

---------

Co-authored-by: replicas-connector[bot] <replicas-connector[bot]@users.noreply.github.com>
Co-authored-by: connortbot <loiconnor8@gmail.com>
diff --git a/packages/__tests__/cost/__snapshots__/registrySnapshots.test.ts.snap b/packages/__tests__/cost/__snapshots__/registrySnapshots.test.ts.snap
@@ -2323,6 +2323,77 @@ exports[`Registry Snapshots endpoint configurations snapshot 1`] = `
       ],
     },
   },
+  "google/gemini-3-flash-preview": {
+    "gemini-3-flash-preview:google-ai-studio": {
+      "context": 1048576,
+      "crossRegion": false,
+      "maxTokens": 65536,
+      "modelId": "gemini-3-flash-preview",
+      "parameters": [
+        "include_reasoning",
+        "max_tokens",
+        "reasoning",
+        "response_format",
+        "seed",
+        "stop",
+        "structured_outputs",
+        "temperature",
+        "tool_choice",
+        "tools",
+        "top_p",
+      ],
+      "provider": "google-ai-studio",
+      "ptbEnabled": true,
+      "regions": [
+        "*",
+      ],
+    },
+    "gemini-3-flash-preview:openrouter": {
+      "context": 1048576,
+      "crossRegion": false,
+      "maxTokens": 65536,
+      "modelId": "google/gemini-3-flash-preview",
+      "parameters": [
+        "max_tokens",
+        "response_format",
+        "seed",
+        "stop",
+        "temperature",
+        "tool_choice",
+        "tools",
+        "top_p",
+      ],
+      "provider": "openrouter",
+      "ptbEnabled": true,
+      "regions": [
+        "*",
+      ],
+    },
+    "gemini-3-flash-preview:vertex": {
+      "context": 1048576,
+      "crossRegion": true,
+      "maxTokens": 65536,
+      "modelId": "gemini-3-flash-preview",
+      "parameters": [
+        "include_reasoning",
+        "max_tokens",
+        "reasoning",
+        "response_format",
+        "seed",
+        "stop",
+        "structured_outputs",
+        "temperature",
+        "tool_choice",
+        "tools",
+        "top_p",
+      ],
+      "provider": "vertex",
+      "ptbEnabled": true,
+      "regions": [
+        "global",
+      ],
+    },
+  },
   "google/gemini-3-pro-image": {
     "gemini-3-pro-image-preview:google-ai-studio": {
       "context": 65536,
@@ -5934,6 +6005,11 @@ exports[`Registry Snapshots model coverage snapshot 1`] = `
     "openrouter",
     "vertex",
   ],
+  "google/gemini-3-flash-preview": [
+    "google-ai-studio",
+    "openrouter",
+    "vertex",
+  ],
   "google/gemini-3-pro-image": [
     "google-ai-studio",
     "openrouter",
@@ -7286,6 +7362,43 @@ exports[`Registry Snapshots pricing snapshot 1`] = `
       },
     ],
   },
+  "google/gemini-3-flash-preview": {
+    "google-ai-studio": [
+      {
+        "audio": {
+          "cachedInputMultiplier": 0.1,
+          "input": 0.000001,
+        },
+        "cacheMultipliers": {
+          "cachedInput": 0.1,
+        },
+        "input": 5e-7,
+        "output": 0.000003,
+        "threshold": 0,
+      },
+    ],
+    "openrouter": [
+      {
+        "input": 5.275e-7,
+        "output": 0.000003165,
+        "threshold": 0,
+      },
+    ],
+    "vertex": [
+      {
+        "audio": {
+          "cachedInputMultiplier": 0.1,
+          "input": 0.000001,
+        },
+        "cacheMultipliers": {
+          "cachedInput": 0.1,
+        },
+        "input": 5e-7,
+        "output": 0.000003,
+        "threshold": 0,
+      },
+    ],
+  },
   "google/gemini-3-pro-image": {
     "google-ai-studio": [
       {
@@ -8075,6 +8188,14 @@ exports[`Registry Snapshots verify registry state 1`] = `
         "vertex",
       ],
     },
+    {
+      "model": "gemini-3-flash-preview",
+      "providers": [
+        "google-ai-studio",
+        "openrouter",
+        "vertex",
+      ],
+    },
     {
       "model": "gemini-3-pro-image-preview",
       "providers": [
@@ -8632,7 +8753,7 @@ exports[`Registry Snapshots verify registry state 1`] = `
       "provider": "fireworks",
     },
     {
-      "modelCount": 5,
+      "modelCount": 6,
       "provider": "google-ai-studio",
     },
     {
@@ -8660,15 +8781,15 @@ exports[`Registry Snapshots verify registry state 1`] = `
       "provider": "openai",
     },
     {
-      "modelCount": 59,
+      "modelCount": 60,
       "provider": "openrouter",
     },
     {
       "modelCount": 5,
       "provider": "perplexity",
     },
     {
-      "modelCount": 17,
+      "modelCount": 18,
       "provider": "vertex",
     },
     {
@@ -8702,6 +8823,7 @@ exports[`Registry Snapshots verify registry state 1`] = `
     "gemini-2.5-flash",
     "gemini-2.5-flash-lite",
     "gemini-2.5-pro",
+    "gemini-3-flash-preview",
     "gemini-3-pro-image-preview",
     "gemini-3-pro-preview",
     "gemma-3-12b-it",
@@ -8782,9 +8904,9 @@ exports[`Registry Snapshots verify registry state 1`] = `
     "claude-3.5-haiku:anthropic:*",
   ],
   "totalArchivedConfigs": 0,
-  "totalEndpoints": 257,
-  "totalModelProviderConfigs": 257,
-  "totalModelsWithPtb": 95,
+  "totalEndpoints": 259,
+  "totalModelProviderConfigs": 259,
+  "totalModelsWithPtb": 96,
   "totalProviders": 21,
 }
 `;
diff --git a/packages/cost/models/authors/google/gemini-3-flash-preview/endpoints.ts b/packages/cost/models/authors/google/gemini-3-flash-preview/endpoints.ts
@@ -0,0 +1,121 @@
+import { ModelProviderName } from "../../../providers";
+import type { ModelProviderConfig } from "../../../types";
+import { Gemini3FlashPreviewModelName } from "./model";
+
+export const endpoints = { // per-provider endpoint configs for gemini-3-flash-preview, keyed "<model>:<provider>"
+  "gemini-3-flash-preview:google-ai-studio": {
+    providerModelId: "gemini-3-flash-preview",
+    provider: "google-ai-studio",
+    author: "google",
+    pricing: [
+      {
+        threshold: 0,
+        input: 0.0000005, // $0.50/1M tokens
+        output: 0.000003, // $3/1M tokens
+        cacheMultipliers: {
+          cachedInput: 0.1, // $0.05/1M = 10% of input
+        },
+        audio: {
+          input: 0.000001, // $1/1M audio tokens
+          cachedInputMultiplier: 0.1, // $0.10/1M = 10% of audio input
+        },
+      },
+    ],
+    contextLength: 1_048_576, // 2^20
+    maxCompletionTokens: 65_536, // 2^16
+    supportedParameters: [
+      "include_reasoning",
+      "max_tokens",
+      "reasoning",
+      "response_format",
+      "seed",
+      "stop",
+      "structured_outputs",
+      "temperature",
+      "tool_choice",
+      "tools",
+      "top_p",
+    ],
+    rateLimits: {
+      rpm: 2_000,
+      tpm: 8_000_000,
+    },
+    ptbEnabled: true,
+    responseFormat: "GOOGLE",
+    endpointConfigs: {
+      "*": {},
+    },
+  },
+  "gemini-3-flash-preview:vertex": {
+    providerModelId: "gemini-3-flash-preview",
+    provider: "vertex",
+    author: "google",
+    crossRegion: true,
+    pricing: [ // same rates as the google-ai-studio entry above
+      {
+        threshold: 0,
+        input: 0.0000005, // $0.50/1M tokens
+        output: 0.000003, // $3/1M tokens
+        cacheMultipliers: {
+          cachedInput: 0.1, // $0.05/1M = 10% of input
+        },
+        audio: {
+          input: 0.000001, // $1/1M audio tokens
+          cachedInputMultiplier: 0.1, // $0.10/1M = 10% of audio input
+        },
+      },
+    ],
+    contextLength: 1_048_576, // 2^20
+    maxCompletionTokens: 65_536, // 2^16
+    supportedParameters: [
+      "include_reasoning",
+      "max_tokens",
+      "reasoning",
+      "response_format",
+      "seed",
+      "stop",
+      "structured_outputs",
+      "temperature",
+      "tool_choice",
+      "tools",
+      "top_p",
+    ],
+    responseFormat: "GOOGLE",
+    ptbEnabled: true,
+    endpointConfigs: {
+      global: {
+        providerModelId: "gemini-3-flash-preview", // same value as the endpoint-level providerModelId above
+      },
+    },
+  },
+  "gemini-3-flash-preview:openrouter": {
+    provider: "openrouter",
+    author: "google",
+    providerModelId: "google/gemini-3-flash-preview", // author-prefixed id, unlike the two entries above
+    pricing: [ // flat input/output rates only; no cacheMultipliers or audio tier is declared here
+      {
+        threshold: 0,
+        input: 0.0000005275, // $0.5275/1M = $0.50/1M * 1.055
+        output: 0.000003165, // $3.165/1M = $3.00/1M * 1.055
+      },
+    ],
+    contextLength: 1_048_576, // 2^20
+    maxCompletionTokens: 65_536, // 2^16
+    supportedParameters: [ // subset of the list above: no include_reasoning, reasoning, or structured_outputs
+      "max_tokens",
+      "response_format",
+      "seed",
+      "stop",
+      "temperature",
+      "tool_choice",
+      "tools",
+      "top_p",
+    ],
+    ptbEnabled: true,
+    endpointConfigs: {
+      "*": {},
+    },
+  },
+} satisfies Partial<
+  Record<`${Gemini3FlashPreviewModelName}:${ModelProviderName}`, ModelProviderConfig>
+>;
diff --git a/packages/cost/models/authors/google/gemini-3-flash-preview/model.ts b/packages/cost/models/authors/google/gemini-3-flash-preview/model.ts
@@ -0,0 +1,17 @@
+import { ModelConfig } from "../../../types";
+
+export const model = { // model metadata for gemini-3-flash-preview, keyed by model name
+  "gemini-3-flash-preview": {
+    name: "Google Gemini 3 Flash Preview",
+    author: "google",
+    description:
+      "Gemini 3 Flash Preview is Google's latest fast and efficient AI model optimized for quick response times while maintaining high quality. This preview version offers excellent performance for everyday tasks including text generation, code assistance, and multimodal understanding at a lower cost than Pro variants.",
+    contextLength: 1_048_576, // 2^20
+    maxOutputTokens: 65_536, // 2^16
+    created: "2025-12-17T00:00:00", // date-time string with no timezone offset
+    modality: { inputs: ["text", "image", "audio", "video"], outputs: ["text"] },
+    tokenizer: "Gemini",
+  },
+} satisfies Record<string, ModelConfig>;
+
+export type Gemini3FlashPreviewModelName = keyof typeof model; // the literal key(s) of `model`: "gemini-3-flash-preview"
diff --git a/packages/cost/models/authors/google/index.ts b/packages/cost/models/authors/google/index.ts
@@ -11,6 +11,8 @@ import { model as gemini25FlashLiteModel } from "./gemini-2.5-flash-lite/model";
 import { endpoints as gemini25FlashLiteEndpoints } from "./gemini-2.5-flash-lite/endpoints";
 import { model as gemini3ProPreviewModel } from "./gemini-3/model";
 import { endpoints as gemini3ProPreviewEndpoints } from "./gemini-3/endpoints";
+import { model as gemini3FlashPreviewModel } from "./gemini-3-flash-preview/model";
+import { endpoints as gemini3FlashPreviewEndpoints } from "./gemini-3-flash-preview/endpoints";
 import { model as gemini3ProImagePreviewModel } from "./gemini-3-pro-image/model";
 import { endpoints as gemini3ProImagePreviewEndpoints } from "./gemini-3-pro-image/endpoints";
 import { model as gemma29bModel } from "./gemma/model";
@@ -24,6 +26,7 @@ export const googleModels = {
   ...gemini25FlashModel,
   ...gemini25FlashLiteModel,
   ...gemini3ProPreviewModel,
+  ...gemini3FlashPreviewModel,
   ...gemini3ProImagePreviewModel,
   ...gemma29bModel,
   ...gemma3Model,
@@ -34,6 +37,7 @@ export const googleEndpointConfig = {
   ...gemini25FlashEndpoints,
   ...gemini25FlashLiteEndpoints,
   ...gemini3ProPreviewEndpoints,
+  ...gemini3FlashPreviewEndpoints,
   ...gemini3ProImagePreviewEndpoints,
   ...gemma29bEndpoints,
   ...gemma3Endpoints,
diff --git a/packages/cost/providers/google/index.ts b/packages/cost/providers/google/index.ts
@@ -219,6 +219,17 @@ export const costs: ModelRow[] = [
       prompt_cache_read_token: 0.0000002,
     },
   },
+  {
+    model: {
+      operator: "includes",
+      value: "gemini-3-flash-preview",
+    },
+    cost: {
+      prompt_token: 0.0000005, // $0.50/1M tokens
+      completion_token: 0.000003, // $3/1M tokens
+      prompt_cache_read_token: 0.00000005, // $0.05/1M tokens (10% of prompt_token)
+    },
+  },
 ];
 
 export const modelDetails: ModelDetailsMap = {