This repository was archived by the owner on Sep 20, 2025. It is now read-only.
Merged
2 changes: 1 addition & 1 deletion src/emd/cfn/shared/ecs_cluster.yaml
@@ -10,7 +10,7 @@ Parameters:
   APIRouterImageURI:
     Type: String
     Description: The URI of the OpenAI-compatible API router image. If provided, the router will be deployed.
-    Default: "public.ecr.aws/aws-gcr-solutions/dmaa/api-router:latest"
+    Default: "quay.io/dmaa/api-router:latest"
   UseSpot:
     Type: String
     Description: Use Fargate Spot capacity?
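Because the router image is now just a parameter default, any deployment that still needs the old ECR mirror has to override it explicitly at deploy time. A minimal sketch with the AWS CLI — the stack name is a made-up placeholder; the parameter name comes from the template above:

# Hypothetical stack name; APIRouterImageURI is the parameter defined above.
# Override it to keep pulling the router image from the old ECR path.
aws cloudformation deploy \
  --stack-name my-emd-ecs-cluster \
  --template-file src/emd/cfn/shared/ecs_cluster.yaml \
  --parameter-overrides APIRouterImageURI=public.ecr.aws/aws-gcr-solutions/dmaa/api-router:latest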
2 changes: 1 addition & 1 deletion src/pipeline/backend/huggingface/embedding/Dockerfile
@@ -1,4 +1,4 @@
-FROM public.ecr.aws/aws-gcr-solutions/dmaa/huggingface/transformers-pytorch-gpu:{{VERSION}} AS huggingface-base
+FROM quay.io/dmaa/huggingface/transformers-pytorch-gpu:{{VERSION}} AS huggingface-base
 
 # Create a new stage based on huggingface-base
 FROM huggingface-base AS sagemaker-serving
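Note that {{VERSION}} is a template placeholder the build pipeline fills in before docker build runs, so these Dockerfiles are not directly buildable as checked in. A minimal sketch of rendering and building one by hand — the sed substitution, the tag value, and the image name are assumptions for illustration, not the pipeline's actual mechanism:

# Substitute the placeholder (tag value is hypothetical), then build only
# the final sagemaker-serving stage on top of the new quay.io base image.
sed 's/{{VERSION}}/latest/g' src/pipeline/backend/huggingface/embedding/Dockerfile > Dockerfile.rendered
docker build -f Dockerfile.rendered --target sagemaker-serving -t emd-embedding:dev .

The same substitute-then-build pattern applies to the rest of the backend Dockerfiles changed below.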
2 changes: 1 addition & 1 deletion src/pipeline/backend/huggingface/llm/Dockerfile
@@ -1,4 +1,4 @@
-FROM public.ecr.aws/aws-gcr-solutions/dmaa/huggingface/transformers-pytorch-gpu:{{VERSION}} AS huggingface-base
+FROM quay.io/dmaa/huggingface/transformers-pytorch-gpu:{{VERSION}} AS huggingface-base
 
 # Create a new stage based on huggingface-base
 FROM huggingface-base AS sagemaker-serving
2 changes: 1 addition & 1 deletion src/pipeline/backend/huggingface/llm/Dockerfile_baichuan
@@ -1,4 +1,4 @@
-FROM public.ecr.aws/aws-gcr-solutions/dmaa/huggingface/transformers-pytorch-gpu:{{VERSION}} AS huggingface-base
+FROM quay.io/dmaa/huggingface/transformers-pytorch-gpu:{{VERSION}} AS huggingface-base
 
 # Create a new stage based on huggingface-base
 FROM huggingface-base AS sagemaker-serving
2 changes: 1 addition & 1 deletion src/pipeline/backend/huggingface/rerank/Dockerfile
@@ -1,4 +1,4 @@
-FROM public.ecr.aws/aws-gcr-solutions/dmaa/huggingface/transformers-pytorch-gpu:{{VERSION}} AS huggingface-base
+FROM quay.io/dmaa/huggingface/transformers-pytorch-gpu:{{VERSION}} AS huggingface-base
 
 # Create a new stage based on huggingface-base
 FROM huggingface-base AS sagemaker-serving
2 changes: 1 addition & 1 deletion src/pipeline/backend/llama_cpp/Dockerfile
@@ -1,4 +1,4 @@
-FROM public.ecr.aws/aws-gcr-solutions/dmaa/llama-cpp:{{VERSION}}
+FROM quay.io/dmaa/llama-cpp:{{VERSION}}
 
 # Ensure the serve script has executable permissions
 # RUN chmod +x /usr/bin/serve
2 changes: 1 addition & 1 deletion src/pipeline/backend/lmdeploy/Dockerfile
@@ -1,4 +1,4 @@
-FROM public.ecr.aws/aws-gcr-solutions/dmaa/openmmlab/lmdeploy:{{VERSION}} AS lmdeploy-base
+FROM quay.io/dmaa/openmmlab/lmdeploy:{{VERSION}} AS lmdeploy-base
 
 # Create a new stage based on lmdeploy-base
 FROM lmdeploy-base AS sagemaker-serving
2 changes: 1 addition & 1 deletion src/pipeline/backend/lmdeploy/Dockerfile_internvl2
@@ -1,4 +1,4 @@
-FROM public.ecr.aws/aws-gcr-solutions/dmaa/openmmlab/lmdeploy:{{VERSION}} AS lmdeploy-base
+FROM quay.io/dmaa/openmmlab/lmdeploy:{{VERSION}} AS lmdeploy-base
 
 # Create a new stage based on lmdeploy-base
 FROM lmdeploy-base AS sagemaker-serving
2 changes: 1 addition & 1 deletion src/pipeline/backend/ollama/Dockerfile
@@ -1,4 +1,4 @@
-FROM public.ecr.aws/aws-gcr-solutions/dmaa/ollama:{{VERSION}} AS ollama-base
+FROM quay.io/dmaa/ollama:{{VERSION}} AS ollama-base
 
 # Ensure the serve script has executable permissions
 # RUN chmod +x /usr/bin/serve
2 changes: 1 addition & 1 deletion src/pipeline/backend/tgi/Dockerfile
@@ -1,4 +1,4 @@
-FROM public.ecr.aws/aws-gcr-solutions/dmaa/huggingface/text-generation-inference:{{VERSION}} AS tgi-base
+FROM quay.io/dmaa/huggingface/text-generation-inference:{{VERSION}} AS tgi-base
 
 # Create a new stage based on tgi-base
 FROM tgi-base AS sagemaker-serving
2 changes: 1 addition & 1 deletion src/pipeline/backend/vllm/Dockerfile
@@ -1,4 +1,4 @@
-FROM public.ecr.aws/aws-gcr-solutions/dmaa-vllm/vllm-openai:{{VERSION}} AS vllm-base
+FROM quay.io/dmaa/vllm-openai:{{VERSION}} AS vllm-base
 
 # Create a new stage based on vllm-base
 FROM vllm-base AS sagemaker-serving
2 changes: 1 addition & 1 deletion src/pipeline/backend/vllm/Dockerfile_baichuan_m1
@@ -1,4 +1,4 @@
-FROM public.ecr.aws/aws-gcr-solutions/dmaa-vllm/vllm-openai:{{VERSION}} AS vllm-base
+FROM quay.io/dmaa/vllm-openai:{{VERSION}} AS vllm-base
 
 # Create a new stage based on vllm-base
 FROM vllm-base AS sagemaker-serving
2 changes: 1 addition & 1 deletion src/pipeline/backend/vllm/Dockerfile_dots_ocr
@@ -1,4 +1,4 @@
-FROM public.ecr.aws/aws-gcr-solutions/dmaa-vllm/vllm-openai:{{VERSION}} AS vllm-base
+FROM quay.io/dmaa/vllm-openai:{{VERSION}} AS vllm-base
 
 WORKDIR /opt/ml/code
 
2 changes: 1 addition & 1 deletion src/pipeline/backend/vllm/Dockerfile_gemma3
@@ -1,4 +1,4 @@
-FROM public.ecr.aws/aws-gcr-solutions/dmaa-vllm/vllm-openai:{{VERSION}} AS vllm-base
+FROM quay.io/dmaa/vllm-openai:{{VERSION}} AS vllm-base
 
 FROM vllm-base AS sagemaker-serving
 
2 changes: 1 addition & 1 deletion src/pipeline/backend/vllm/Dockerfile_higgs_audio
@@ -1,4 +1,4 @@
-FROM public.ecr.aws/aws-gcr-solutions/dmaa/higgs-audio-vllm:latest AS base
+FROM quay.io/dmaa/higgs-audio-vllm:latest AS base
 
 WORKDIR /opt/ml/code
 
2 changes: 1 addition & 1 deletion src/pipeline/backend/vllm/Dockerfile_qwen25_vl
@@ -1,4 +1,4 @@
-FROM public.ecr.aws/aws-gcr-solutions/dmaa-vllm/vllm-openai:{{VERSION}} AS vllm-base
+FROM quay.io/dmaa/vllm-openai:{{VERSION}} AS vllm-base
 
 # Create a new stage based on vllm-base
 FROM vllm-base AS sagemaker-serving