@@ -30,8 +30,9 @@ aws iam attach-role-policy --role-name SageMakerExecutionRole --policy-arn arn:a
3030### 1. Set Environment Variables
3131
3232``` bash
33- # Check available images: https://gallery.ecr.aws/deep-learning-containers/vllm
34- export CONTAINER_URI=" public.ecr.aws/deep-learning-containers/0.11-gpu-py312"
33+
34+ # Note: Using a Public Gallery image to create an SM endpoint is currently not supported
35+ export CONTAINER_URI="763104351884.dkr.ecr.us-east-1.amazonaws.com/vllm:0.11.2-gpu-py312"
3536export IAM_ROLE="SageMakerExecutionRole"
3637export HF_TOKEN="your-huggingface-token"
3738```
@@ -76,13 +77,18 @@ Recommended GPU instances:
7677Test NixlConnector locally - [NixlConnector Documentation](https://docs.vllm.ai/en/latest/features/nixl_connector_usage.html#transport-configuration)
7778
7879``` bash
80+ # Login to aws ecr
81+ aws ecr get-login-password --region us-east-1 | docker login \
82+ --username AWS --password-stdin 763104351884.dkr.ecr.us-east-1.amazonaws.com
83+
7984# Pull latest vLLM DLC for EC2
80- docker pull public.ecr.aws/deep-learning-containers/vllm:0.11-gpu-py312
85+ # Note: Using a Public Gallery image to create an SM endpoint is currently not supported
86+ docker pull 763104351884.dkr.ecr.us-east-1.amazonaws.com/vllm:0.11.2-gpu-py312
8187
8288# Run container with GPU access
8389docker run -it --entrypoint=/bin/bash --gpus=all \
8490 -v $( pwd) :/workspace \
85- public. ecr.aws/deep-learning-containers /vllm:0.11-gpu-py312
91+ 763104351884.dkr.ecr.us-east-1.amazonaws.com/vllm:0.11.2-gpu-py312
8692
8793# Inside container, run the NixlConnector test
8894export HF_TOKEN="<TOKEN>"
0 commit comments