Skip to content

Commit ec8a6db

Browse files
authored
Merge pull request #64 from get-convex/jordan/add-gemini-pro
Add gemini pro to evals
2 parents f1b70a3 + b411bc6 commit ec8a6db

File tree

File tree: 3 files changed, +10 −1 lines changed

.github/workflows/daily_google_evals.yml

+1-1
Original file line numberDiff line numberDiff line change
@@ -46,7 +46,7 @@ jobs:
       - name: Set Google models
         run: |
-          echo "MODELS=gemini-2.0-flash-lite,gemini-2.0-flash,gemini-1.5-flash" >> $GITHUB_ENV
+          echo "MODELS=gemini-2.0-flash-lite,gemini-2.0-flash,gemini-1.5-flash,gemini-2.5-pro-exp-03-25" >> $GITHUB_ENV
       - name: Run evaluations
         env:

runner/eval_convex_coding.py

+1
Original file line numberDiff line numberDiff line change
@@ -206,6 +206,7 @@ def convex_coding_task(model: ModelTemplate, input: str):
     "o3-mini",
     "gemini-2.0-flash-lite",
     "meta-llama/Meta-Llama-3.1-405B-Instruct-Turbo",
+    "gemini-2.5-pro-exp-03-25",
 ]

 if os.getenv("MODELS") is not None:

runner/models/__init__.py

+8
Original file line numberDiff line numberDiff line change
@@ -132,6 +132,14 @@ class ModelTemplate(BaseModel):
         uses_system_prompt=False,
         provider=ModelProvider.GOOGLE,
     ),
+    ModelTemplate(
+        name="gemini-2.5-pro-exp-03-25",
+        formatted_name="Gemini 2.5 Pro (Experimental)",
+        max_concurrency=int(os.getenv("GOOGLE_CONCURRENCY", "4")),
+        requires_chain_of_thought=False,
+        uses_system_prompt=False,
+        provider=ModelProvider.GOOGLE,
+    ),
 ]
 MODELS_BY_NAME = {model.name: model for model in ALL_MODELS}
137145

0 commit comments

Comments
 (0)