From e4d153ab8b49821a02ca73dc5cd946e0d9ab736d Mon Sep 17 00:00:00 2001 From: Matt McClean <124083747+mmcclean-aws@users.noreply.github.com> Date: Wed, 22 Feb 2023 09:26:06 -0800 Subject: [PATCH] Added support for the AWS Inferentia 2 instance types based on the NeuronCore v2 chip architecture --- .../cloudprovider/aws/ec2_instance_types.go | 28 +++++++++++++++++++ 1 file changed, 28 insertions(+) diff --git a/cluster-autoscaler/cloudprovider/aws/ec2_instance_types.go b/cluster-autoscaler/cloudprovider/aws/ec2_instance_types.go index a8a269c1393c..186c810922b3 100644 --- a/cluster-autoscaler/cloudprovider/aws/ec2_instance_types.go +++ b/cluster-autoscaler/cloudprovider/aws/ec2_instance_types.go @@ -1607,6 +1607,34 @@ var InstanceTypes = map[string]*InstanceType{ GPU: 0, Architecture: "amd64", }, + "inf2.48xlarge": { + InstanceType: "inf2.48xlarge", + VCPU: 192, + MemoryMb: 786432, + GPU: 0, + Architecture: "amd64", + }, + "inf2.24xlarge": { + InstanceType: "inf2.24xlarge", + VCPU: 96, + MemoryMb: 393216, + GPU: 0, + Architecture: "amd64", + }, + "inf2.8xlarge": { + InstanceType: "inf2.8xlarge", + VCPU: 32, + MemoryMb: 131072, + GPU: 0, + Architecture: "amd64", + }, + "inf2.xlarge": { + InstanceType: "inf2.xlarge", + VCPU: 4, + MemoryMb: 16384, + GPU: 0, + Architecture: "amd64", + }, "is4gen.2xlarge": { InstanceType: "is4gen.2xlarge", VCPU: 8,