feat(cost): add Gemini 3.1 Pro Preview model support (#5595)

colegottdank · web-flow · commit 23f8419328cc · 2026-02-19T22:20:53.000-08:00
diff --git a/packages/__tests__/cost/__snapshots__/registrySnapshots.test.ts.snap b/packages/__tests__/cost/__snapshots__/registrySnapshots.test.ts.snap
@@ -2847,6 +2847,77 @@ exports[`Registry Snapshots endpoint configurations snapshot 1`] = `
       ],
     },
   },
+  "google/gemini-3.1-pro-preview": {
+    "gemini-3.1-pro-preview:helicone": {
+      "context": 1048576,
+      "crossRegion": false,
+      "maxTokens": 65536,
+      "modelId": "pa/gemini-3.1-pro-preview",
+      "parameters": [
+        "include_reasoning",
+        "max_tokens",
+        "reasoning",
+        "response_format",
+        "seed",
+        "stop",
+        "structured_outputs",
+        "temperature",
+        "tool_choice",
+        "tools",
+        "top_p",
+      ],
+      "provider": "helicone",
+      "ptbEnabled": true,
+      "regions": [
+        "*",
+      ],
+    },
+    "gemini-3.1-pro-preview:openrouter": {
+      "context": 1048576,
+      "crossRegion": false,
+      "maxTokens": 65536,
+      "modelId": "google/gemini-3.1-pro-preview",
+      "parameters": [
+        "max_tokens",
+        "response_format",
+        "seed",
+        "stop",
+        "temperature",
+        "tool_choice",
+        "tools",
+        "top_p",
+      ],
+      "provider": "openrouter",
+      "ptbEnabled": true,
+      "regions": [
+        "*",
+      ],
+    },
+    "gemini-3.1-pro-preview:vertex": {
+      "context": 1048576,
+      "crossRegion": true,
+      "maxTokens": 65536,
+      "modelId": "gemini-3.1-pro-preview",
+      "parameters": [
+        "include_reasoning",
+        "max_tokens",
+        "reasoning",
+        "response_format",
+        "seed",
+        "stop",
+        "structured_outputs",
+        "temperature",
+        "tool_choice",
+        "tools",
+        "top_p",
+      ],
+      "provider": "vertex",
+      "ptbEnabled": true,
+      "regions": [
+        "global",
+      ],
+    },
+  },
   "google/gemma": {
     "gemma2-9b-it:chutes": {
       "context": 8192,
@@ -7230,6 +7301,11 @@ exports[`Registry Snapshots model coverage snapshot 1`] = `
     "openrouter",
     "vertex",
   ],
+  "google/gemini-3.1-pro-preview": [
+    "helicone",
+    "openrouter",
+    "vertex",
+  ],
   "google/gemma": [
     "chutes",
     "openrouter",
@@ -8957,6 +9033,51 @@ exports[`Registry Snapshots pricing snapshot 1`] = `
       },
     ],
   },
+  "google/gemini-3.1-pro-preview": {
+    "helicone": [
+      {
+        "input": 0.000002,
+        "output": 0.000012,
+        "threshold": 0,
+      },
+      {
+        "input": 0.000004,
+        "output": 0.000018,
+        "threshold": 200000,
+      },
+    ],
+    "openrouter": [
+      {
+        "input": 0.00000211,
+        "output": 0.00001266,
+        "threshold": 0,
+      },
+      {
+        "input": 0.00000422,
+        "output": 0.00001899,
+        "threshold": 200000,
+      },
+    ],
+    "vertex": [
+      {
+        "cacheMultipliers": {
+          "cachedInput": 0.1,
+        },
+        "cacheStoragePerHour": 0.0000045,
+        "input": 0.000002,
+        "output": 0.000012,
+        "threshold": 0,
+      },
+      {
+        "cacheMultipliers": {
+          "cachedInput": 0.1,
+        },
+        "input": 0.000004,
+        "output": 0.000018,
+        "threshold": 200000,
+      },
+    ],
+  },
   "google/gemma": {
     "chutes": [
       {
diff --git a/packages/cost/models/authors/google/gemini-3.1-pro-preview/endpoints.ts b/packages/cost/models/authors/google/gemini-3.1-pro-preview/endpoints.ts
@@ -0,0 +1,126 @@
+import { ModelProviderName } from "../../../providers";
+import type { ModelProviderConfig } from "../../../types";
+import { Gemini31ProPreviewModelName } from "./model";
+
+export const endpoints = { // Endpoint configs for gemini-3.1-pro-preview; keys are `<model>:<provider>` (checked by the `satisfies` clause at the end)
+  "gemini-3.1-pro-preview:vertex": {
+    providerModelId: "gemini-3.1-pro-preview",
+    provider: "vertex",
+    author: "google",
+    crossRegion: true, // only this entry sets crossRegion; the registry snapshot records false for the other two
+    pricing: [
+      {
+        threshold: 0, // base tier
+        input: 0.000002, // $2/1M tokens
+        output: 0.000012, // $12/1M tokens (including thinking tokens)
+        cacheMultipliers: {
+          cachedInput: 0.1, // $0.20/1M = 10% of input
+        },
+        cacheStoragePerHour: 0.0000045, // $4.50/1M tokens per hour
+      },
+      {
+        threshold: 200000, // long-context tier (over 200K, per the price comments below)
+        input: 0.000004, // $4/1M tokens (over 200K context)
+        output: 0.000018, // $18/1M tokens (over 200K context)
+        cacheMultipliers: {
+          cachedInput: 0.1, // $0.40/1M = 10% of $4
+        },
+      }, // NOTE(review): no cacheStoragePerHour on this tier, unlike the base tier — confirm this is intentional
+    ],
+    contextLength: 1_048_576, // 2^20
+    maxCompletionTokens: 65_536, // 2^16
+    supportedParameters: [
+      "include_reasoning",
+      "max_tokens",
+      "reasoning",
+      "response_format",
+      "seed",
+      "stop",
+      "structured_outputs",
+      "temperature",
+      "tool_choice",
+      "tools",
+      "top_p",
+    ],
+    responseFormat: "GOOGLE", // set only on the vertex entry; the openrouter and helicone entries omit responseFormat
+    ptbEnabled: true,
+    endpointConfigs: {
+      global: { // single "global" key; the registry snapshot lists regions ["global"] for this endpoint
+        providerModelId: "gemini-3.1-pro-preview",
+      },
+    },
+  },
+
+  "gemini-3.1-pro-preview:openrouter": {
+    provider: "openrouter",
+    author: "google",
+    providerModelId: "google/gemini-3.1-pro-preview",
+    pricing: [ // NOTE(review): no cacheMultipliers here, while the legacy providers/openrouter cost row sets prompt_cache_read_token — confirm which is intended
+      {
+        threshold: 0, // base tier
+        input: 0.00000211, // $2.11/1M = $2.00/1M * 1.055 (OpenRouter markup)
+        output: 0.00001266, // $12.66/1M = $12.00/1M * 1.055
+      },
+      {
+        threshold: 200000, // long-context tier (over 200K, per the price comments below)
+        input: 0.00000422, // $4.22/1M = $4.00/1M * 1.055 (over 200K context)
+        output: 0.00001899, // $18.99/1M = $18.00/1M * 1.055 (over 200K context)
+      },
+    ],
+    contextLength: 1_048_576, // 2^20
+    maxCompletionTokens: 65_536, // 2^16
+    supportedParameters: [ // omits include_reasoning, reasoning and structured_outputs, which the vertex and helicone entries list
+      "max_tokens",
+      "response_format",
+      "seed",
+      "stop",
+      "temperature",
+      "tool_choice",
+      "tools",
+      "top_p",
+    ],
+    ptbEnabled: true,
+    endpointConfigs: {
+      "*": {}, // "*" key with an empty config; the registry snapshot lists regions ["*"] for this endpoint
+    },
+  },
+
+  "gemini-3.1-pro-preview:helicone": {
+    provider: "helicone",
+    author: "google",
+    providerModelId: "pa/gemini-3.1-pro-preview",
+    pricing: [ // same input/output rates as the vertex entry, but without any cache pricing fields
+      {
+        threshold: 0, // base tier
+        input: 0.000002, // $2/1M tokens (Google's standard pricing)
+        output: 0.000012, // $12/1M tokens (Google's standard pricing)
+      },
+      {
+        threshold: 200000, // long-context tier (over 200K, per the price comments below)
+        input: 0.000004, // $4/1M tokens (over 200K context)
+        output: 0.000018, // $18/1M tokens (over 200K context)
+      },
+    ],
+    contextLength: 1_048_576, // 2^20
+    maxCompletionTokens: 65_536, // 2^16
+    supportedParameters: [ // same list as the vertex entry
+      "include_reasoning",
+      "max_tokens",
+      "reasoning",
+      "response_format",
+      "seed",
+      "stop",
+      "structured_outputs",
+      "temperature",
+      "tool_choice",
+      "tools",
+      "top_p",
+    ],
+    ptbEnabled: true,
+    endpointConfigs: {
+      "*": {}, // "*" key with an empty config; the registry snapshot lists regions ["*"] for this endpoint
+    },
+  },
+} satisfies Partial<
+  Record<`${Gemini31ProPreviewModelName}:${ModelProviderName}`, ModelProviderConfig>
+>; // Partial: not every provider needs an entry; `satisfies` validates the shape without widening the literal keys
diff --git a/packages/cost/models/authors/google/gemini-3.1-pro-preview/model.ts b/packages/cost/models/authors/google/gemini-3.1-pro-preview/model.ts
@@ -0,0 +1,17 @@
+import { ModelConfig } from "../../../types";
+
+export const model = { // Registry metadata for the Gemini 3.1 Pro Preview model, keyed by model name
+  "gemini-3.1-pro-preview": {
+    name: "Google Gemini 3.1 Pro Preview",
+    author: "google",
+    description:
+      "Gemini 3.1 Pro Preview is Google's most advanced reasoning model, released February 2026. It uses extended thinking/chain-of-thought reasoning to work through complex problems. Scores 77.1% on ARC-AGI-2 (more than doubling Gemini 3 Pro's 31.1%), and tops the Artificial Analysis Intelligence Index v4.0 at half the cost of competitors. Features enhanced accuracy for ambitious agentic workflows, complex problem-solving, and scientific reasoning.",
+    contextLength: 1_048_576, // 2^20; same value as contextLength on every endpoint in endpoints.ts
+    maxOutputTokens: 65_536, // 2^16; same value as maxCompletionTokens on every endpoint in endpoints.ts
+    created: "2026-02-09T00:00:00", // NOTE(review): timestamp has no timezone suffix; confirm the exact release date
+    modality: { inputs: ["text", "image", "audio", "video"], outputs: ["text"] }, // multimodal input, text-only output
+    tokenizer: "Gemini",
+  },
+} satisfies Record<string, ModelConfig>; // `satisfies` checks the shape while keeping the literal key type
+
+export type Gemini31ProPreviewModelName = keyof typeof model; // resolves to the literal "gemini-3.1-pro-preview"
diff --git a/packages/cost/models/authors/google/index.ts b/packages/cost/models/authors/google/index.ts
@@ -13,6 +13,8 @@ import { model as gemini25FlashLiteModel } from "./gemini-2.5-flash-lite/model";
 import { endpoints as gemini25FlashLiteEndpoints } from "./gemini-2.5-flash-lite/endpoints";
 import { model as gemini3ProPreviewModel } from "./gemini-3/model";
 import { endpoints as gemini3ProPreviewEndpoints } from "./gemini-3/endpoints";
+import { model as gemini31ProPreviewModel } from "./gemini-3.1-pro-preview/model";
+import { endpoints as gemini31ProPreviewEndpoints } from "./gemini-3.1-pro-preview/endpoints";
 import { model as gemini3FlashPreviewModel } from "./gemini-3-flash-preview/model";
 import { endpoints as gemini3FlashPreviewEndpoints } from "./gemini-3-flash-preview/endpoints";
 import { model as gemini3ProImagePreviewModel } from "./gemini-3-pro-image/model";
@@ -31,6 +33,7 @@ export const googleModels = {
   ...gemini25FlashModel,
   ...gemini25FlashLiteModel,
   ...gemini3ProPreviewModel,
+  ...gemini31ProPreviewModel,
   ...gemini3FlashPreviewModel,
   ...gemini3ProImagePreviewModel,
   ...gemini31ProPreviewModel,
@@ -44,6 +47,7 @@ export const googleEndpointConfig = {
   ...gemini25FlashEndpoints,
   ...gemini25FlashLiteEndpoints,
   ...gemini3ProPreviewEndpoints,
+  ...gemini31ProPreviewEndpoints,
   ...gemini3FlashPreviewEndpoints,
   ...gemini3ProImagePreviewEndpoints,
   ...gemini31ProPreviewEndpoints,
diff --git a/packages/cost/providers/google/index.ts b/packages/cost/providers/google/index.ts
@@ -263,6 +263,17 @@ export const costs: ModelRow[] = [
       prompt_cache_read_token: 0.00000005,
     },
   },
+  {
+    model: {
+      operator: "includes",
+      value: "gemini-3.1-pro-preview",
+    },
+    cost: {
+      prompt_token: 0.000002, // $2/1M tokens
+      completion_token: 0.000012, // $12/1M tokens (including thinking)
+      prompt_cache_read_token: 0.0000002, // $0.20/1M = 10% of input
+    },
+  },
 ];
 
 export const modelDetails: ModelDetailsMap = {
diff --git a/packages/cost/providers/openrouter/index.ts b/packages/cost/providers/openrouter/index.ts
@@ -1157,6 +1157,17 @@ export const costs: ModelRow[] = [
       prompt_cache_read_token: 2e-7, // $0.2/1M tokens
     },
   },
+  {
+    model: {
+      operator: "equals",
+      value: "google/gemini-3.1-pro-preview",
+    },
+    cost: {
+      prompt_token: 2.11e-6, // $2.11/1M tokens (OpenRouter markup)
+      completion_token: 1.266e-5, // $12.66/1M tokens
+      prompt_cache_read_token: 2.11e-7, // $0.211/1M tokens
+    },
+  },
   {
     model: {
       operator: "equals",