From 30c5387a1912849f2b8add82ba716554337a1803 Mon Sep 17 00:00:00 2001 From: Harish Rao Date: Sun, 25 Feb 2024 23:08:20 -0800 Subject: [PATCH] fix: For issue 429 "Unable to deploy llama2 on Eks/Ray Serve/inf2" (#430) --- .gitignore | 4 ++++ ai-ml/trainium-inferentia/eks.tf | 2 +- 2 files changed, 5 insertions(+), 1 deletion(-) diff --git a/.gitignore b/.gitignore index 5a15f96df..095c4d90c 100755 --- a/.gitignore +++ b/.gitignore @@ -51,3 +51,7 @@ site .tfsec examples/gradio-ui/* +ai-ml/trainium-inferentia/examples/gradio-ui/gradio_cached_examples/* + +# venv +**/.venv/* diff --git a/ai-ml/trainium-inferentia/eks.tf b/ai-ml/trainium-inferentia/eks.tf index 0aede3240..9a28b1b92 100644 --- a/ai-ml/trainium-inferentia/eks.tf +++ b/ai-ml/trainium-inferentia/eks.tf @@ -116,7 +116,7 @@ module "eks" { max_size = 8 desired_size = 3 - instance_types = ["m5.xlarge"] + instance_types = ["m5.2xlarge"] labels = { WorkerType = "ON_DEMAND"