# EC2NodeClass named gpu-nodeclass: pins the AMI, instance profile, network
# discovery tags and root volume used for nodes that reference it.
apiVersion: karpenter.k8s.aws/v1
kind: EC2NodeClass
metadata:
  name: gpu-nodeclass
spec:
  amiFamily: AL2
  # The AMI is selected by explicit ID, so the image only changes when this
  # value is edited.
  amiSelectorTerms:
    - id: 'ami-09386b29276181ea6'
  instanceProfile: KarpenterNodeInstanceProfile
  # Subnets and security groups are both discovered through the same tag.
  subnetSelectorTerms:
    - tags:
        karpenter.sh/discovery: 'gpu-autoscaling-cluster7'
  securityGroupSelectorTerms:
    - tags:
        karpenter.sh/discovery: 'gpu-autoscaling-cluster7'
  # Root volume: 300Gi gp3 on /dev/xvda.
  blockDeviceMappings:
    - deviceName: /dev/xvda
      ebs:
        volumeType: gp3
        volumeSize: 300Gi
---
# NodePool ng-t4-xlarge: on-demand g4dn.xlarge nodes built from gpu-nodeclass.
apiVersion: karpenter.sh/v1
kind: NodePool
metadata:
  name: ng-t4-xlarge
spec:
  template:
    metadata:
      labels:
        role: gpu
        gpu-type: t4-xlarge
    spec:
      nodeClassRef:
        group: karpenter.k8s.aws
        kind: EC2NodeClass
        name: gpu-nodeclass
      # Only pods that tolerate gpu=true:NoSchedule are scheduled on these nodes.
      taints:
        - key: gpu
          value: 'true'
          effect: NoSchedule
      requirements:
        - key: node.kubernetes.io/instance-type
          operator: In
          values:
            - g4dn.xlarge
        - key: karpenter.sh/capacity-type
          operator: In
          values:
            - on-demand
  # `limits` and `disruption` are sibling keys under `spec`; each must start on
  # its own line or the document does not parse as intended.
  # Upper bound on the nvidia.com/gpu resources this pool may provision.
  limits:
    nvidia.com/gpu: 5
  # Only empty nodes are consolidated, 15 minutes after they become empty.
  disruption:
    consolidationPolicy: WhenEmpty
    consolidateAfter: 15m
---
# NodePool ng-t4-2xlarge: on-demand g4dn.2xlarge nodes built from gpu-nodeclass.
apiVersion: karpenter.sh/v1
kind: NodePool
metadata:
  name: ng-t4-2xlarge
spec:
  # Only empty nodes are consolidated, 15 minutes after they become empty.
  disruption:
    consolidationPolicy: WhenEmpty
    consolidateAfter: 15m
  # Upper bound on the nvidia.com/gpu resources this pool may provision.
  limits:
    nvidia.com/gpu: 5
  template:
    metadata:
      labels:
        role: gpu
        gpu-type: t4-2xlarge
    spec:
      nodeClassRef:
        group: karpenter.k8s.aws
        kind: EC2NodeClass
        name: gpu-nodeclass
      # Only pods that tolerate gpu=true:NoSchedule are scheduled on these nodes.
      taints:
        - key: gpu
          value: 'true'
          effect: NoSchedule
      requirements:
        - key: node.kubernetes.io/instance-type
          operator: In
          values:
            - g4dn.2xlarge
        - key: karpenter.sh/capacity-type
          operator: In
          values:
            - on-demand
---
# NodePool ng-l4-xlarge: on-demand g6.xlarge nodes built from gpu-nodeclass.
apiVersion: karpenter.sh/v1
kind: NodePool
metadata:
  name: ng-l4-xlarge
spec:
  # Only empty nodes are consolidated, 15 minutes after they become empty.
  disruption:
    consolidationPolicy: WhenEmpty
    consolidateAfter: 15m
  # Upper bound on the nvidia.com/gpu resources this pool may provision.
  limits:
    nvidia.com/gpu: 5
  template:
    metadata:
      labels:
        role: gpu
        gpu-type: l4-xlarge
    spec:
      nodeClassRef:
        group: karpenter.k8s.aws
        kind: EC2NodeClass
        name: gpu-nodeclass
      # Only pods that tolerate gpu=true:NoSchedule are scheduled on these nodes.
      taints:
        - key: gpu
          value: 'true'
          effect: NoSchedule
      requirements:
        - key: node.kubernetes.io/instance-type
          operator: In
          values:
            - g6.xlarge
        - key: karpenter.sh/capacity-type
          operator: In
          values:
            - on-demand
---
# NodePool ng-l4-2xlarge: on-demand g6.2xlarge nodes built from gpu-nodeclass.
apiVersion: karpenter.sh/v1
kind: NodePool
metadata:
  name: ng-l4-2xlarge
spec:
  # Only empty nodes are consolidated, 15 minutes after they become empty.
  disruption:
    consolidationPolicy: WhenEmpty
    consolidateAfter: 15m
  # Upper bound on the nvidia.com/gpu resources this pool may provision.
  limits:
    nvidia.com/gpu: 5
  template:
    metadata:
      labels:
        role: gpu
        gpu-type: l4-2xlarge
    spec:
      nodeClassRef:
        group: karpenter.k8s.aws
        kind: EC2NodeClass
        name: gpu-nodeclass
      # Only pods that tolerate gpu=true:NoSchedule are scheduled on these nodes.
      taints:
        - key: gpu
          value: 'true'
          effect: NoSchedule
      requirements:
        - key: node.kubernetes.io/instance-type
          operator: In
          values:
            - g6.2xlarge
        - key: karpenter.sh/capacity-type
          operator: In
          values:
            - on-demand
---
# NodePool ng-l4-12xlarge: on-demand g6.12xlarge nodes built from gpu-nodeclass.
apiVersion: karpenter.sh/v1
kind: NodePool
metadata:
  name: ng-l4-12xlarge
spec:
  # Only empty nodes are consolidated, 15 minutes after they become empty.
  disruption:
    consolidationPolicy: WhenEmpty
    consolidateAfter: 15m
  # Upper bound on the nvidia.com/gpu resources this pool may provision.
  # NOTE(review): g6.12xlarge presumably exposes 4 GPUs per node, so a limit of
  # 5 would effectively cap this pool at a single node - confirm that is intended.
  limits:
    nvidia.com/gpu: 5
  template:
    metadata:
      labels:
        role: gpu
        gpu-type: l4-12xlarge
    spec:
      nodeClassRef:
        group: karpenter.k8s.aws
        kind: EC2NodeClass
        name: gpu-nodeclass
      # Only pods that tolerate gpu=true:NoSchedule are scheduled on these nodes.
      taints:
        - key: gpu
          value: 'true'
          effect: NoSchedule
      requirements:
        - key: node.kubernetes.io/instance-type
          operator: In
          values:
            - g6.12xlarge
        - key: karpenter.sh/capacity-type
          operator: In
          values:
            - on-demand
---
# NodePool ng-l4-48xlarge: on-demand g6.48xlarge nodes built from gpu-nodeclass.
apiVersion: karpenter.sh/v1
kind: NodePool
metadata:
  name: ng-l4-48xlarge
spec:
  template:
    metadata:
      labels:
        role: gpu
        gpu-type: l4-48xlarge
    spec:
      nodeClassRef:
        group: karpenter.k8s.aws
        kind: EC2NodeClass
        name: gpu-nodeclass
      # Only pods that tolerate gpu=true:NoSchedule are scheduled on these nodes.
      taints:
        - key: gpu
          value: 'true'
          effect: NoSchedule
      requirements:
        - key: node.kubernetes.io/instance-type
          operator: In
          values:
            - g6.48xlarge
        - key: karpenter.sh/capacity-type
          operator: In
          values:
            - on-demand
  # Upper bound on the nvidia.com/gpu resources this pool may provision.
  # g6.48xlarge carries 8 GPUs per node, and Karpenter skips any instance type
  # whose capacity exceeds the remaining limit, so a value below 8 prevents the
  # pool from ever launching a node. 8 allows exactly one node; raise it in
  # multiples of 8 to allow more.
  limits:
    nvidia.com/gpu: 8
  # Only empty nodes are consolidated, 15 minutes after they become empty.
  disruption:
    consolidationPolicy: WhenEmpty
    consolidateAfter: 15m
---
# NodePool ng-l40s-xlarge: on-demand g6e.xlarge nodes built from gpu-nodeclass.
apiVersion: karpenter.sh/v1
kind: NodePool
metadata:
  name: ng-l40s-xlarge
spec:
  # Only empty nodes are consolidated, 15 minutes after they become empty.
  disruption:
    consolidationPolicy: WhenEmpty
    consolidateAfter: 15m
  # Upper bound on the nvidia.com/gpu resources this pool may provision.
  limits:
    nvidia.com/gpu: 5
  template:
    metadata:
      labels:
        role: gpu
        gpu-type: l40s-xlarge
    spec:
      nodeClassRef:
        group: karpenter.k8s.aws
        kind: EC2NodeClass
        name: gpu-nodeclass
      # Only pods that tolerate gpu=true:NoSchedule are scheduled on these nodes.
      taints:
        - key: gpu
          value: 'true'
          effect: NoSchedule
      requirements:
        - key: node.kubernetes.io/instance-type
          operator: In
          values:
            - g6e.xlarge
        - key: karpenter.sh/capacity-type
          operator: In
          values:
            - on-demand
---
# NodePool ng-l40s-2xlarge: on-demand g6e.2xlarge nodes built from gpu-nodeclass.
apiVersion: karpenter.sh/v1
kind: NodePool
metadata:
  name: ng-l40s-2xlarge
spec:
  # Only empty nodes are consolidated, 15 minutes after they become empty.
  disruption:
    consolidationPolicy: WhenEmpty
    consolidateAfter: 15m
  # Upper bound on the nvidia.com/gpu resources this pool may provision.
  limits:
    nvidia.com/gpu: 5
  template:
    metadata:
      labels:
        role: gpu
        gpu-type: l40s-2xlarge
    spec:
      nodeClassRef:
        group: karpenter.k8s.aws
        kind: EC2NodeClass
        name: gpu-nodeclass
      # Only pods that tolerate gpu=true:NoSchedule are scheduled on these nodes.
      taints:
        - key: gpu
          value: 'true'
          effect: NoSchedule
      requirements:
        - key: node.kubernetes.io/instance-type
          operator: In
          values:
            - g6e.2xlarge
        - key: karpenter.sh/capacity-type
          operator: In
          values:
            - on-demand
---
# NodePool ng-l40s-12xlarge: on-demand g6e.12xlarge nodes built from gpu-nodeclass.
apiVersion: karpenter.sh/v1
kind: NodePool
metadata:
  name: ng-l40s-12xlarge
spec:
  # Only empty nodes are consolidated, 15 minutes after they become empty.
  disruption:
    consolidationPolicy: WhenEmpty
    consolidateAfter: 15m
  # Upper bound on the nvidia.com/gpu resources this pool may provision.
  # NOTE(review): g6e.12xlarge presumably exposes 4 GPUs per node, so a limit of
  # 5 would effectively cap this pool at a single node - confirm that is intended.
  limits:
    nvidia.com/gpu: 5
  template:
    metadata:
      labels:
        role: gpu
        gpu-type: l40s-12xlarge
    spec:
      nodeClassRef:
        group: karpenter.k8s.aws
        kind: EC2NodeClass
        name: gpu-nodeclass
      # Only pods that tolerate gpu=true:NoSchedule are scheduled on these nodes.
      taints:
        - key: gpu
          value: 'true'
          effect: NoSchedule
      requirements:
        - key: node.kubernetes.io/instance-type
          operator: In
          values:
            - g6e.12xlarge
        - key: karpenter.sh/capacity-type
          operator: In
          values:
            - on-demand
---
# NodePool ng-l40s-48xlarge: on-demand g6e.48xlarge nodes built from gpu-nodeclass.
apiVersion: karpenter.sh/v1
kind: NodePool
metadata:
  name: ng-l40s-48xlarge
spec:
  template:
    metadata:
      labels:
        role: gpu
        gpu-type: l40s-48xlarge
    spec:
      nodeClassRef:
        group: karpenter.k8s.aws
        kind: EC2NodeClass
        name: gpu-nodeclass
      # Only pods that tolerate gpu=true:NoSchedule are scheduled on these nodes.
      taints:
        - key: gpu
          value: 'true'
          effect: NoSchedule
      requirements:
        - key: node.kubernetes.io/instance-type
          operator: In
          values:
            - g6e.48xlarge
        - key: karpenter.sh/capacity-type
          operator: In
          values:
            - on-demand
  # Upper bound on the nvidia.com/gpu resources this pool may provision.
  # g6e.48xlarge carries 8 GPUs per node, and Karpenter skips any instance type
  # whose capacity exceeds the remaining limit, so a value below 8 prevents the
  # pool from ever launching a node. 8 allows exactly one node; raise it in
  # multiples of 8 to allow more.
  limits:
    nvidia.com/gpu: 8
  # Only empty nodes are consolidated, 15 minutes after they become empty.
  disruption:
    consolidationPolicy: WhenEmpty
    consolidateAfter: 15m
---
# NodePool ng-a10g-xlarge: on-demand g5.xlarge nodes built from gpu-nodeclass.
apiVersion: karpenter.sh/v1
kind: NodePool
metadata:
  name: ng-a10g-xlarge
spec:
  # Only empty nodes are consolidated, 15 minutes after they become empty.
  disruption:
    consolidationPolicy: WhenEmpty
    consolidateAfter: 15m
  # Upper bound on the nvidia.com/gpu resources this pool may provision.
  limits:
    nvidia.com/gpu: 5
  template:
    metadata:
      labels:
        role: gpu
        gpu-type: a10g-xlarge
    spec:
      nodeClassRef:
        group: karpenter.k8s.aws
        kind: EC2NodeClass
        name: gpu-nodeclass
      # Only pods that tolerate gpu=true:NoSchedule are scheduled on these nodes.
      taints:
        - key: gpu
          value: 'true'
          effect: NoSchedule
      requirements:
        - key: node.kubernetes.io/instance-type
          operator: In
          values:
            - g5.xlarge
        - key: karpenter.sh/capacity-type
          operator: In
          values:
            - on-demand
---
# NodePool ng-a10g-2xlarge: on-demand g5.2xlarge nodes built from gpu-nodeclass.
apiVersion: karpenter.sh/v1
kind: NodePool
metadata:
  name: ng-a10g-2xlarge
spec:
  # Only empty nodes are consolidated, 15 minutes after they become empty.
  disruption:
    consolidationPolicy: WhenEmpty
    consolidateAfter: 15m
  # Upper bound on the nvidia.com/gpu resources this pool may provision.
  limits:
    nvidia.com/gpu: 5
  template:
    metadata:
      labels:
        role: gpu
        gpu-type: a10g-2xlarge
    spec:
      nodeClassRef:
        group: karpenter.k8s.aws
        kind: EC2NodeClass
        name: gpu-nodeclass
      # Only pods that tolerate gpu=true:NoSchedule are scheduled on these nodes.
      taints:
        - key: gpu
          value: 'true'
          effect: NoSchedule
      requirements:
        - key: node.kubernetes.io/instance-type
          operator: In
          values:
            - g5.2xlarge
        - key: karpenter.sh/capacity-type
          operator: In
          values:
            - on-demand
---
# NodePool ng-a10g-12xlarge: on-demand g5.12xlarge nodes built from gpu-nodeclass.
apiVersion: karpenter.sh/v1
kind: NodePool
metadata:
  name: ng-a10g-12xlarge
spec:
  # Only empty nodes are consolidated, 15 minutes after they become empty.
  disruption:
    consolidationPolicy: WhenEmpty
    consolidateAfter: 15m
  # Upper bound on the nvidia.com/gpu resources this pool may provision.
  # NOTE(review): g5.12xlarge presumably exposes 4 GPUs per node, so a limit of
  # 5 would effectively cap this pool at a single node - confirm that is intended.
  limits:
    nvidia.com/gpu: 5
  template:
    metadata:
      labels:
        role: gpu
        gpu-type: a10g-12xlarge
    spec:
      nodeClassRef:
        group: karpenter.k8s.aws
        kind: EC2NodeClass
        name: gpu-nodeclass
      # Only pods that tolerate gpu=true:NoSchedule are scheduled on these nodes.
      taints:
        - key: gpu
          value: 'true'
          effect: NoSchedule
      requirements:
        - key: node.kubernetes.io/instance-type
          operator: In
          values:
            - g5.12xlarge
        - key: karpenter.sh/capacity-type
          operator: In
          values:
            - on-demand
---
# NodePool ng-a10g-48xlarge: on-demand g5.48xlarge nodes built from gpu-nodeclass.
apiVersion: karpenter.sh/v1
kind: NodePool
metadata:
  name: ng-a10g-48xlarge
spec:
  template:
    metadata:
      labels:
        role: gpu
        gpu-type: a10g-48xlarge
    spec:
      nodeClassRef:
        group: karpenter.k8s.aws
        kind: EC2NodeClass
        name: gpu-nodeclass
      # Only pods that tolerate gpu=true:NoSchedule are scheduled on these nodes.
      taints:
        - key: gpu
          value: 'true'
          effect: NoSchedule
      requirements:
        - key: node.kubernetes.io/instance-type
          operator: In
          values:
            - g5.48xlarge
        - key: karpenter.sh/capacity-type
          operator: In
          values:
            - on-demand
  # Upper bound on the nvidia.com/gpu resources this pool may provision.
  # g5.48xlarge carries 8 GPUs per node, and Karpenter skips any instance type
  # whose capacity exceeds the remaining limit, so a value below 8 prevents the
  # pool from ever launching a node. 8 allows exactly one node; raise it in
  # multiples of 8 to allow more.
  limits:
    nvidia.com/gpu: 8
  # Only empty nodes are consolidated, 15 minutes after they become empty.
  disruption:
    consolidationPolicy: WhenEmpty
    consolidateAfter: 15m
---