From c012dc6d8aba21c5b87e37fb9c1345a7dbac8113 Mon Sep 17 00:00:00 2001 From: Ratnopam Chakrabarti Date: Sun, 7 Apr 2024 13:45:57 -0700 Subject: [PATCH 1/2] update stable-diffusion-neuron docker image --- .../stable-diffusion-inf2/ray-service-stablediffusion.yaml | 7 +++---- .../stable-diffusion-inf2/ray_serve_stablediffusion.py | 4 ++-- 2 files changed, 5 insertions(+), 6 deletions(-) diff --git a/ai-ml/trainium-inferentia/examples/inference/ray-serve/stable-diffusion-inf2/ray-service-stablediffusion.yaml b/ai-ml/trainium-inferentia/examples/inference/ray-serve/stable-diffusion-inf2/ray-service-stablediffusion.yaml index 3865b07c9..6523b0bbb 100644 --- a/ai-ml/trainium-inferentia/examples/inference/ray-serve/stable-diffusion-inf2/ray-service-stablediffusion.yaml +++ b/ai-ml/trainium-inferentia/examples/inference/ray-serve/stable-diffusion-inf2/ray-service-stablediffusion.yaml @@ -1,7 +1,6 @@ #---------------------------------------------------------------------- # NOTE: For deployment instructions, refer to the DoEKS website. #---------------------------------------------------------------------- ---- apiVersion: v1 kind: Namespace metadata: @@ -29,7 +28,7 @@ spec: - name: stable-diffusion-v2 autoscaling_config: metrics_interval_s: 0.2 - min_replicas: 8 + min_replicas: 2 max_replicas: 12 look_back_period_s: 2 downscale_delay_s: 30 @@ -55,7 +54,7 @@ spec: spec: containers: - name: ray-head - image: public.ecr.aws/data-on-eks/ray2.9.0-py310-stablediffusion-neuron:v1.0 + image: public.ecr.aws/data-on-eks/ray2.9.0-py310-stablediffusion-neuron:latest imagePullPolicy: Always # Ensure the image is always pulled when updated lifecycle: preStop: @@ -98,7 +97,7 @@ spec: spec: containers: - name: ray-worker - image: public.ecr.aws/data-on-eks/ray2.9.0-py310-stablediffusion-neuron:v1.0 + image: public.ecr.aws/data-on-eks/ray2.9.0-py310-stablediffusion-neuron:latest imagePullPolicy: Always # Ensure the image is always pulled when updated lifecycle: preStop: diff --git a/ai-ml/trainium-inferentia/examples/inference/ray-serve/stable-diffusion-inf2/ray_serve_stablediffusion.py b/ai-ml/trainium-inferentia/examples/inference/ray-serve/stable-diffusion-inf2/ray_serve_stablediffusion.py index acb8d07e1..4c1edcb9e 100644 --- a/ai-ml/trainium-inferentia/examples/inference/ray-serve/stable-diffusion-inf2/ray_serve_stablediffusion.py +++ b/ai-ml/trainium-inferentia/examples/inference/ray-serve/stable-diffusion-inf2/ray_serve_stablediffusion.py @@ -38,10 +38,10 @@ class StableDiffusionV2: def __init__(self): from optimum.neuron import NeuronStableDiffusionXLPipeline - compiled_model_id = "aws-neuron/stable-diffusion-xl-base-1-0-1024x1024" + model_id = os.getenv('MODEL_ID') # To avoid saving the model locally, we can use the pre-compiled model directly from HF - self.pipe = NeuronStableDiffusionXLPipeline.from_pretrained(compiled_model_id, device_ids=[0, 1]) + self.pipe = NeuronStableDiffusionXLPipeline.from_pretrained(model_id, device_ids=[0, 1]) async def generate(self, prompt: str): assert len(prompt), "prompt parameter cannot be empty" From e2fe0fd0a026b3913a6d2735f7ff47ea6400f13b Mon Sep 17 00:00:00 2001 From: Ratnopam Chakrabarti Date: Tue, 14 May 2024 13:12:38 -0700 Subject: [PATCH 2/2] fix install.sh to remove incorrect region value --- ai-ml/jark-stack/terraform/install.sh | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/ai-ml/jark-stack/terraform/install.sh b/ai-ml/jark-stack/terraform/install.sh index 4c8f21c48..1814a9044 100755 --- a/ai-ml/jark-stack/terraform/install.sh +++ b/ai-ml/jark-stack/terraform/install.sh @@ -13,7 +13,7 @@ terraform init -upgrade for target in "${targets[@]}" do echo "Applying module $target..." - apply_output=$(terraform apply -target="$target" -var="region=$region" -auto-approve 2>&1 | tee /dev/tty) + apply_output=$(terraform apply -target="$target" -auto-approve 2>&1 | tee /dev/tty) if [[ ${PIPESTATUS[0]} -eq 0 && $apply_output == *"Apply complete"* ]]; then echo "SUCCESS: Terraform apply of $target completed successfully" else @@ -24,7 +24,7 @@ done # Final apply to catch any remaining resources echo "Applying remaining resources..." -apply_output=$(terraform apply -var="region=$region" -auto-approve 2>&1 | tee /dev/tty) +apply_output=$(terraform apply -auto-approve 2>&1 | tee /dev/tty) if [[ ${PIPESTATUS[0]} -eq 0 && $apply_output == *"Apply complete"* ]]; then echo "SUCCESS: Terraform apply of all modules completed successfully" else