From cba0d17f0f78d41291bd8f7bbf95991ea763b40e Mon Sep 17 00:00:00 2001 From: Albert Villanova del Moral <8515462+albertvillanova@users.noreply.github.com> Date: Thu, 21 Nov 2024 09:32:40 +0100 Subject: [PATCH] Update instance type/size in endpoint model_config example --- examples/model_configs/endpoint_model.yaml | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/examples/model_configs/endpoint_model.yaml b/examples/model_configs/endpoint_model.yaml index 2834cdd28..4bf2f0602 100644 --- a/examples/model_configs/endpoint_model.yaml +++ b/examples/model_configs/endpoint_model.yaml @@ -10,8 +10,8 @@ model: accelerator: "gpu" region: "eu-west-1" vendor: "aws" - instance_size: "medium" - instance_type: "g5.2xlarge" + instance_size: "x1" + instance_type: "nvidia-a10g" framework: "pytorch" endpoint_type: "protected" namespace: null # The namespace under which to launch the endopint. Defaults to the current user's namespace