Skip to content

Commit 57cc004

Browse files
vertex-mg-bot authored and copybara-github committed
Update the HF TGI and pytorch-inference notebooks, with the latest container image version.
PiperOrigin-RevId: 704421485
1 parent b9549cc commit 57cc004

File tree

2 files changed

+2
-2
lines changed

2 files changed

+2
-2
lines changed

notebooks/community/model_garden/model_garden_huggingface_pytorch_inference_deployment.ipynb

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -153,7 +153,7 @@
153153
"TASK = \"text-classification\" # @param {type: \"string\", isTemplate: true}\n",
154154
"\n",
155155
"# The pre-built serving docker images for Hugging Face Pytorch Inference.\n",
156-
"SERVE_DOCKER_URI = \"us-docker.pkg.dev/deeplearning-platform-release/gcr.io/huggingface-pytorch-inference-cu121.2-2.transformers.4-44.ubuntu2204.py311\"\n",
156+
"SERVE_DOCKER_URI = \"us-docker.pkg.dev/deeplearning-platform-release/gcr.io/huggingface-pytorch-inference-cu121.2-3.transformers.4-46.ubuntu2204.py311\"\n",
157157
"\n",
158158
"machine_type = \"g2-standard-8\" # @param {type: \"string\", isTemplate: true}\n",
159159
"accelerator_type = \"NVIDIA_L4\" # @param [\"NVIDIA_L4\", \"None\"] {isTemplate: true}\n",

notebooks/community/model_garden/model_garden_huggingface_tgi_deployment.ipynb

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -154,7 +154,7 @@
154154
"MODEL_ID = \"google/gemma-2-2b-it\" # @param {type: \"string\", isTemplate: true}\n",
155155
"\n",
156156
"# The pre-built serving docker image for TGI.\n",
157-
"TGI_DOCKER_URI = \"us-docker.pkg.dev/deeplearning-platform-release/gcr.io/huggingface-text-generation-inference-cu124.2-3.ubuntu2204.py311\"\n",
157+
"TGI_DOCKER_URI = \"us-docker.pkg.dev/deeplearning-platform-release/gcr.io/huggingface-text-generation-inference-cu124.2-4.ubuntu2204.py311\"\n",
158158
"\n",
159159
"# @markdown Set use_dedicated_endpoint to False if you don't want to use [dedicated endpoint](https://cloud.google.com/vertex-ai/docs/general/deployment#create-dedicated-endpoint).\n",
160160
"use_dedicated_endpoint = True # @param {type:\"boolean\"}\n",

0 commit comments

Comments (0)