Skip to content

Commit bc0162f

Browse files
authored
Incremental cluster growth (#769)
1 parent 2f4bbf7 commit bc0162f

File tree

4 files changed

+30
-0
lines changed

4 files changed

+30
-0
lines changed

manager/manifests/cluster-autoscaler.yaml.j2

Lines changed: 3 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -170,7 +170,10 @@ spec:
170170
- --expander=least-waste
171171
{% endif %}
172172
- --max-nodes-total={{ config['max_instances'] + 1 }}
173+
- --max-total-unready-percentage=5
174+
- --ok-total-unready-count=30
173175
- --max-node-provision-time=5m
176+
- --scan-interval=20s
174177
- --node-group-auto-discovery=asg:tag=k8s.io/cluster-autoscaler/enabled,k8s.io/cluster-autoscaler/{{ config['cluster_name'] }}
175178
volumeMounts:
176179
- name: ssl-certs

manager/manifests/fluentd.yaml

Lines changed: 9 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -47,7 +47,15 @@ roleRef:
4747
name: fluentd
4848
apiGroup: rbac.authorization.k8s.io
4949
---
50+
apiVersion: scheduling.k8s.io/v1
51+
kind: PriorityClass
52+
metadata:
53+
name: fluentd
54+
value: 1000
55+
globalDefault: false
56+
description: "This priority class should be used for fluentd daemonset only."
5057

58+
---
5159
apiVersion: v1
5260
kind: ConfigMap
5361
metadata:
@@ -166,6 +174,7 @@ spec:
166174
app: fluentd
167175
spec:
168176
serviceAccountName: fluentd
177+
priorityClassName: fluentd
169178
initContainers:
170179
- name: copy-fluentd-config
171180
image: busybox

manager/manifests/nvidia.yaml

Lines changed: 9 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -14,6 +14,14 @@
1414

1515
# Source: https://github.com/NVIDIA/k8s-device-plugin/blob/1.0.0-beta4/nvidia-device-plugin.yml
1616

17+
apiVersion: scheduling.k8s.io/v1
18+
kind: PriorityClass
19+
metadata:
20+
name: nvidia
21+
value: 1000
22+
globalDefault: false
23+
description: "This priority class should be used for nvidia daemonset only."
24+
---
1725
apiVersion: apps/v1
1826
kind: DaemonSet
1927
metadata:
@@ -34,6 +42,7 @@ spec:
3442
labels:
3543
name: nvidia-device-plugin-ds
3644
spec:
45+
priorityClassName: nvidia
3746
tolerations:
3847
# This toleration is deprecated. Kept here for backward compatibility
3948
# See https://kubernetes.io/docs/tasks/administer-cluster/guaranteed-scheduling-critical-addon-pods/

manager/manifests/statsd.yaml

Lines changed: 9 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -41,6 +41,14 @@ metadata:
4141
name: cwagentstatsdconfig
4242
namespace: default
4343
---
44+
apiVersion: scheduling.k8s.io/v1
45+
kind: PriorityClass
46+
metadata:
47+
name: statsd
48+
value: 1000
49+
globalDefault: false
50+
description: "This priority class should be used for statsd daemonset only."
51+
---
4452
apiVersion: apps/v1
4553
kind: DaemonSet
4654
metadata:
@@ -55,6 +63,7 @@ spec:
5563
labels:
5664
name: cloudwatch-agent-statsd
5765
spec:
66+
priorityClassName: statsd
5867
containers:
5968
- name: cloudwatch-agent
6069
image: $CORTEX_IMAGE_STATSD

0 commit comments

Comments
 (0)