Skip to content

Commit 964c481

Browse files
vertex-mg-bot and copybara-github
authored and committed
Enable dedicated endpoint for TimesFM deployment
PiperOrigin-RevId: 700190957
1 parent 454a90b commit 964c481

File tree

1 file changed

+19
-4
lines changed

1 file changed

+19
-4
lines changed

notebooks/community/model_garden/model_garden_timesfm_deployment_on_vertex.ipynb

Lines changed: 19 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -306,6 +306,8 @@
306306
"print(\"Creating endpoint.\")\n",
307307
"\n",
308308
"SERVE_DOCKER_URI = \"us-docker.pkg.dev/vertex-ai/vertex-vision-model-garden-dockers/jax-timesfm-serve:20240828_1036_RC00\"\n",
309+
"# @markdown Set use_dedicated_endpoint to False if you don't want to use [dedicated endpoint](https://cloud.google.com/vertex-ai/docs/general/deployment#create-dedicated-endpoint).\n",
310+
"use_dedicated_endpoint = True # @param {type:\"boolean\"}\n",
309311
"\n",
310312
"\n",
311313
"def deploy_model(\n",
@@ -317,12 +319,14 @@
317319
" accelerator_type: str = \"NVIDIA_L4\",\n",
318320
" accelerator_count: int = 1,\n",
319321
" deploy_source: str = \"notebook\",\n",
322+
" use_dedicated_endpoint: bool = False,\n",
320323
") -> Tuple[aiplatform.Model, aiplatform.Endpoint]:\n",
321324
" \"\"\"Creates a Vertex AI Endpoint and deploys TimesFM to the endpoint.\"\"\"\n",
322325
" model_name_with_time = common_util.get_job_name_with_datetime(model_name)\n",
323326
" endpoint = aiplatform.Endpoint.create(\n",
324327
" display_name=f\"{model_name_with_time}-endpoint\",\n",
325328
" credentials=aiplatform.initializer.global_config.credentials,\n",
329+
" dedicated_endpoint_enabled=use_dedicated_endpoint,\n",
326330
" )\n",
327331
"\n",
328332
" if accelerator_type == \"ACCELERATOR_TYPE_UNSPECIFIED\":\n",
@@ -374,6 +378,7 @@
374378
" machine_type=machine_type,\n",
375379
" accelerator_type=accelerator_type,\n",
376380
" accelerator_count=accelerator_count,\n",
381+
" use_dedicated_endpoint=use_dedicated_endpoint,\n",
377382
")"
378383
]
379384
},
@@ -538,7 +543,10 @@
538543
"]\n",
539544
"\n",
540545
"# Query the endpoint.\n",
541-
"results = endpoints[\"timesfm\"].predict(instances=instances)\n",
546+
"results = endpoints[\"timesfm\"].predict(\n",
547+
" instances=instances,\n",
548+
" use_dedicated_endpoint=use_dedicated_endpoint,\n",
549+
")\n",
542550
"\n",
543551
"viz = Visualizer(nrows=1, ncols=3)\n",
544552
"viz.visualize_forecast(\n",
@@ -616,7 +624,8 @@
616624
" \"timestamp_format\": \"%Y-%m-%d\",\n",
617625
" }\n",
618626
" for each_input, each_timestamp in zip(inputs, timestamps)\n",
619-
" ]\n",
627+
" ],\n",
628+
" use_dedicated_endpoint=use_dedicated_endpoint,\n",
620629
")\n",
621630
"\n",
622631
"viz = Visualizer(nrows=1, ncols=3)\n",
@@ -788,10 +797,16 @@
788797
" },\n",
789798
"]\n",
790799
"\n",
791-
"response = endpoints[\"timesfm\"].predict(instances=cov_instances)\n",
800+
"response = endpoints[\"timesfm\"].predict(\n",
801+
" instances=cov_instances,\n",
802+
" use_dedicated_endpoint=use_dedicated_endpoint,\n",
803+
")\n",
792804
"\n",
793805
"no_cov_instances = [{\"input\": task[\"input\"], \"horizon\": 40} for task in cov_instances]\n",
794-
"no_cov_response = endpoints[\"timesfm\"].predict(instances=no_cov_instances)\n",
806+
"no_cov_response = endpoints[\"timesfm\"].predict(\n",
807+
" instances=no_cov_instances,\n",
808+
" use_dedicated_endpoint=use_dedicated_endpoint,\n",
809+
")\n",
795810
"\n",
796811
"viz = Visualizer(nrows=3, ncols=2)\n",
797812
"for task_i, (per_input, per_gt) in enumerate(\n",

0 commit comments

Comments
 (0)