Skip to content

Commit

Permalink
feat: support autoscaling on broker and bookie (#1183)
Browse files Browse the repository at this point in the history
* feat: add autoscaling on chart

Signed-off-by: ericsyh <[email protected]>

* apply autoscaling on sn-platform

Signed-off-by: ericsyh <[email protected]>

* add autoscaling examples

Signed-off-by: ericsyh <[email protected]>

* fix name

Signed-off-by: ericsyh <[email protected]>

---------

Signed-off-by: ericsyh <[email protected]>
(cherry picked from commit 7a08d15)
  • Loading branch information
ericsyh committed Oct 22, 2024
1 parent 226769f commit c3a373f
Show file tree
Hide file tree
Showing 9 changed files with 241 additions and 0 deletions.
Original file line number Diff line number Diff line change
Expand Up @@ -48,6 +48,17 @@ spec:
replicas: {{ .Values.bookkeeper.replicaCount }}
image: "{{ .Values.images.bookie.repository }}:{{ .Values.images.bookie.tag }}"
imagePullPolicy: {{ .Values.images.bookie.pullPolicy }}
{{- /* Emit autoScalingPolicy only when bookkeeper.autoScaling.enabled is truthy; the metrics key is emitted only when bookkeeper.autoScaling.metrics is non-empty. */}}
{{- if .Values.bookkeeper.autoScaling.enabled }}
autoScalingPolicy:
minReplicas: {{ .Values.bookkeeper.autoScaling.minReplicas }}
maxReplicas: {{ .Values.bookkeeper.autoScaling.maxReplicas }}
{{- if .Values.bookkeeper.autoScaling.metrics }}
metrics:
{{- with .Values.bookkeeper.autoScaling.metrics }}
{{ toYaml . | indent 4 }}
{{- end }}
{{- end }}
{{- end }}
logConfig:
level: {{ .Values.bookkeeper.logConfig.level }}
format: {{ .Values.bookkeeper.logConfig.format }}
Expand Down
11 changes: 11 additions & 0 deletions charts/sn-platform-slim/templates/broker/broker-cluster.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -50,6 +50,17 @@ spec:
replicas: {{ .Values.broker.replicaCount }}
image: "{{ .Values.images.broker.repository }}:{{ .Values.images.broker.tag }}"
imagePullPolicy: {{ .Values.images.broker.pullPolicy }}
{{- /* Emit autoScalingPolicy only when broker.autoScaling.enabled is truthy; the metrics key is emitted only when broker.autoScaling.metrics is non-empty. */}}
{{- if .Values.broker.autoScaling.enabled }}
autoScalingPolicy:
minReplicas: {{ .Values.broker.autoScaling.minReplicas }}
maxReplicas: {{ .Values.broker.autoScaling.maxReplicas }}
{{- if .Values.broker.autoScaling.metrics }}
metrics:
{{- with .Values.broker.autoScaling.metrics }}
{{ toYaml . | indent 4 }}
{{- end }}
{{- end }}
{{- end }}
logConfig:
level: {{ .Values.broker.logConfig.level }}
format: {{ .Values.broker.logConfig.format }}
Expand Down
14 changes: 14 additions & 0 deletions charts/sn-platform-slim/values.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -803,6 +803,13 @@ bookkeeper:
# annotations that will be added on the BookKeeperCluster CR only.
annotations: {}

# autoScaling tracks the average metric usage of the Pulsar nodes and adjusts the number of nodes to keep usage at the target level.
# When the average is above the target, the scaling controller scales out (adds nodes); when it is below the target, it scales in to save resources.
autoScaling:
  enabled: false
  minReplicas: 1
  maxReplicas: 4
  # List of metric specs to scale on, e.g. the entries in examples/sn-platform/autoscaling-custom-metrics.yaml.
  # Left empty, the chart template renders no metrics section.
  metrics: []
# The field logConfig can be used to change the log level and log format of pods.
# The logConfig field is optional. If it is not specified, the component will use the default log configuration /pulsar/conf/log4j2.yaml.
# If it is specified will dynamically change the log level and log format of the component by changing the CR.
Expand Down Expand Up @@ -1040,6 +1047,13 @@ broker:
# annotations that will be added on the PulsarBroker CR only.
annotations: {}

# autoScaling tracks the average metric usage of the Pulsar nodes and adjusts the number of nodes to keep usage at the target level.
# When the average is above the target, the scaling controller scales out (adds nodes); when it is below the target, it scales in to save resources.
autoScaling:
  enabled: false
  minReplicas: 1
  maxReplicas: 4
  # List of metric specs to scale on, e.g. the entries in examples/sn-platform/autoscaling-custom-metrics.yaml.
  # Left empty, the chart template renders no metrics section.
  metrics: []
# The field logConfig can be used to change the log level and log format of pods.
# The logConfig field is optional. If it is not specified, the component will use the default log configuration /pulsar/conf/log4j2.yaml.
# If it is specified will dynamically change the log level and log format of the component by changing the CR.
Expand Down
11 changes: 11 additions & 0 deletions charts/sn-platform/templates/bookkeeper/bookkeeper-cluster.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -48,6 +48,17 @@ spec:
replicas: {{ .Values.bookkeeper.replicaCount }}
image: "{{ .Values.images.bookie.repository }}:{{ .Values.images.bookie.tag }}"
imagePullPolicy: {{ .Values.images.bookie.pullPolicy }}
{{- /* Emit autoScalingPolicy only when bookkeeper.autoScaling.enabled is truthy; the metrics key is emitted only when bookkeeper.autoScaling.metrics is non-empty. */}}
{{- if .Values.bookkeeper.autoScaling.enabled }}
autoScalingPolicy:
minReplicas: {{ .Values.bookkeeper.autoScaling.minReplicas }}
maxReplicas: {{ .Values.bookkeeper.autoScaling.maxReplicas }}
{{- if .Values.bookkeeper.autoScaling.metrics }}
metrics:
{{- with .Values.bookkeeper.autoScaling.metrics }}
{{ toYaml . | indent 4 }}
{{- end }}
{{- end }}
{{- end }}
logConfig:
level: {{ .Values.bookkeeper.logConfig.level }}
format: {{ .Values.bookkeeper.logConfig.format }}
Expand Down
11 changes: 11 additions & 0 deletions charts/sn-platform/templates/broker/broker-cluster.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -50,6 +50,17 @@ spec:
replicas: {{ .Values.broker.replicaCount }}
image: "{{ .Values.images.broker.repository }}:{{ .Values.images.broker.tag }}"
imagePullPolicy: {{ .Values.images.broker.pullPolicy }}
{{- /* Emit autoScalingPolicy only when broker.autoScaling.enabled is truthy; the metrics key is emitted only when broker.autoScaling.metrics is non-empty. */}}
{{- if .Values.broker.autoScaling.enabled }}
autoScalingPolicy:
minReplicas: {{ .Values.broker.autoScaling.minReplicas }}
maxReplicas: {{ .Values.broker.autoScaling.maxReplicas }}
{{- if .Values.broker.autoScaling.metrics }}
metrics:
{{- with .Values.broker.autoScaling.metrics }}
{{ toYaml . | indent 4 }}
{{- end }}
{{- end }}
{{- end }}
logConfig:
level: {{ .Values.broker.logConfig.level }}
format: {{ .Values.broker.logConfig.format }}
Expand Down
16 changes: 16 additions & 0 deletions charts/sn-platform/values.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -878,6 +878,14 @@ bookkeeper:
# annotations that will be added on the BookKeeperCluster CR only.
annotations: {}

# autoScaling tracks the average metric usage of the Pulsar nodes and adjusts the number of nodes to keep usage at the target level.
# When the average is above the target, the scaling controller scales out (adds nodes); when it is below the target, it scales in to save resources.
autoScaling:
  enabled: false
  minReplicas: 1
  maxReplicas: 4
  # List of metric specs to scale on, e.g. the entries in examples/sn-platform/autoscaling-custom-metrics.yaml.
  # Left empty, the chart template renders no metrics section.
  metrics: []

# The field logConfig can be used to change the log level and log format of pods.
# The logConfig field is optional. If it is not specified, the component will use the default log configuration /pulsar/conf/log4j2.yaml.
# If it is specified will dynamically change the log level and log format of the component by changing the CR.
Expand Down Expand Up @@ -1115,6 +1123,14 @@ broker:
# annotations that will be added on the PulsarBroker CR only.
annotations: {}

# autoScaling tracks the average metric usage of the Pulsar nodes and adjusts the number of nodes to keep usage at the target level.
# When the average is above the target, the scaling controller scales out (adds nodes); when it is below the target, it scales in to save resources.
autoScaling:
  enabled: false
  minReplicas: 1
  maxReplicas: 4
  # List of metric specs to scale on, e.g. the entries in examples/sn-platform/autoscaling-custom-metrics.yaml.
  # Left empty, the chart template renders no metrics section.
  metrics: []

# The field logConfig can be used to change the log level and log format of pods.
# The logConfig field is optional. If it is not specified, the component will use the default log configuration /pulsar/conf/log4j2.yaml.
# If it is specified will dynamically change the log level and log format of the component by changing the CR.
Expand Down
59 changes: 59 additions & 0 deletions examples/sn-platform/autoscaling-custom-metrics.yaml
Original file line number Diff line number Diff line change
@@ -0,0 +1,59 @@
broker:
  autoScaling:
    enabled: true
    minReplicas: 1
    maxReplicas: 4
    # Custom metrics require Prometheus (https://prometheus.io/) and
    # prometheus-adapter (https://github.com/kubernetes-sigs/prometheus-adapter) to be deployed.
    # See prometheus-adapter.yaml for how to set up the custom metrics used below.
    metrics:
      - type: Pods
        pods:
          metric:
            name: cpu_usage
          target:
            type: AverageValue
            averageValue: "75"
      - type: Pods
        pods:
          metric:
            name: network_in_rate_kb
          target:
            type: AverageValue
            averageValue: "204800"
      - type: Pods
        pods:
          metric:
            name: network_out_rate_kb
          target:
            type: AverageValue
            averageValue: "204800"

bookkeeper:
  autoScaling:
    enabled: true
    minReplicas: 1
    maxReplicas: 4
    # Custom metrics require Prometheus (https://prometheus.io/) and
    # prometheus-adapter (https://github.com/kubernetes-sigs/prometheus-adapter) to be deployed.
    # See prometheus-adapter.yaml for how to set up the custom metrics used below.
    metrics:
      - type: Pods
        pods:
          metric:
            name: cpu_usage
          target:
            type: AverageValue
            averageValue: "75"
      - type: Pods
        pods:
          metric:
            name: network_in_rate_kb
          target:
            type: AverageValue
            averageValue: "204800"
      - type: Pods
        pods:
          metric:
            name: network_out_rate_kb
          target:
            type: AverageValue
            averageValue: "204800"
29 changes: 29 additions & 0 deletions examples/sn-platform/autoscaling-resource-metrics.yaml
Original file line number Diff line number Diff line change
@@ -0,0 +1,29 @@
broker:
  autoScaling:
    enabled: true
    minReplicas: 1
    maxReplicas: 4
    # Resource metrics require https://github.com/kubernetes-sigs/metrics-server to be deployed.
    # Metrics server supports the cpu and memory PodMetrics.
    # metrics is a list of metric specs (one "- type: ..." entry per metric),
    # the same shape as in autoscaling-custom-metrics.yaml.
    metrics:
      - type: Resource
        resource:
          name: cpu
          target:
            type: Utilization
            averageUtilization: 70

bookkeeper:
  autoScaling:
    enabled: true
    minReplicas: 1
    maxReplicas: 4
    # Resource metrics require https://github.com/kubernetes-sigs/metrics-server to be deployed.
    # Metrics server supports the cpu and memory PodMetrics.
    # metrics is a list of metric specs (one "- type: ..." entry per metric),
    # the same shape as in autoscaling-custom-metrics.yaml.
    metrics:
      - type: Resource
        resource:
          name: cpu
          target:
            type: Utilization
            averageUtilization: 70
79 changes: 79 additions & 0 deletions examples/sn-platform/prometheus-adapter.yaml
Original file line number Diff line number Diff line change
@@ -0,0 +1,79 @@
# Prometheus endpoint settings (presumably the server the adapter queries; confirm against the prometheus-adapter chart values).
prometheus:
  url: http://prometheus-server.monitor.svc
  port: 80

# NOTE(review): looks like the port the adapter itself listens on; confirm against the chart.
listenPort: 8443
# Metric discovery rules. Each custom rule selects Prometheus series (seriesQuery),
# maps their labels to Kubernetes resources (resources), renames the metric (name)
# and defines the query used to fetch its value (metricsQuery).
rules:
  # NOTE(review): presumably disables the chart's built-in default rules so only
  # the custom rules below are installed; confirm against the chart values.
  default: false
  custom:
    # Generic rule: every non-container "*_total" series, exposed under its name
    # without the "_total" suffix as a per-resource instantaneous rate.
    - seriesQuery: '{namespace!="",__name__!~"^container_.*"}'
      resources:
        template: "<<.Resource>>"
      name:
        matches: "^(.*)_total"
        as: ""
      metricsQuery: |
        sum by (<<.GroupBy>>) (
          irate (
            <<.Series>>{<<.LabelMatchers>>}[1m]
          )
        )
    # cpu_usage: CPU seconds consumed per second relative to the container CPU shares, times 100.
    - seriesQuery: 'container_cpu_usage_seconds_total{namespace!~"(sn-system|kube-system|olm|cert-manager)"}'
      seriesFilters: []
      resources:
        overrides:
          pod:
            resource: pod
          namespace:
            resource: namespace
      name:
        matches: "container_cpu_usage_seconds_total"
        as: "cpu_usage"
      metricsQuery: sum(rate(container_cpu_usage_seconds_total{<<.LabelMatchers>>}[5m])) by (<<.GroupBy>>) / (sum(container_spec_cpu_shares{<<.LabelMatchers>>}/1000) by (<<.GroupBy>>)) * 100
    # network_in_rate_kb: received bytes per second / 1024.
    # Aggregated by <<.GroupBy>> like the other rules so that exactly one series
    # is returned per requested object, even if several series match one pod.
    - seriesQuery: 'container_network_receive_bytes_total{namespace!~"(sn-system|kube-system|olm|cert-manager)"}'
      seriesFilters: []
      resources:
        overrides:
          pod:
            resource: pod
          namespace:
            resource: namespace
      name:
        matches: "container_network_receive_bytes_total"
        as: "network_in_rate_kb"
      metricsQuery: sum(rate(container_network_receive_bytes_total{<<.LabelMatchers>>}[5m])) by (<<.GroupBy>>) / 1024
    # network_out_rate_kb: transmitted bytes per second / 1024, aggregated per object as above.
    - seriesQuery: 'container_network_transmit_bytes_total{namespace!~"(sn-system|kube-system|olm|cert-manager)"}'
      seriesFilters: []
      resources:
        overrides:
          pod:
            resource: pod
          namespace:
            resource: namespace
      name:
        matches: "container_network_transmit_bytes_total"
        as: "network_out_rate_kb"
      metricsQuery: sum(rate(container_network_transmit_bytes_total{<<.LabelMatchers>>}[5m])) by (<<.GroupBy>>) / 1024
    # disk_read_rate_kb: filesystem bytes read per second / 1024.
    - seriesQuery: 'container_fs_reads_bytes_total{namespace!~"(sn-system|kube-system|olm|cert-manager)"}'
      seriesFilters: []
      resources:
        overrides:
          pod:
            resource: pod
          namespace:
            resource: namespace
      name:
        matches: "container_fs_reads_bytes_total"
        as: "disk_read_rate_kb"
      metricsQuery: sum(rate(container_fs_reads_bytes_total{<<.LabelMatchers>>}[5m])) by (<<.GroupBy>>) / 1024
    # disk_write_rate_kb: filesystem bytes written per second / 1024.
    - seriesQuery: 'container_fs_writes_bytes_total{namespace!~"(sn-system|kube-system|olm|cert-manager)"}'
      seriesFilters: []
      resources:
        overrides:
          pod:
            resource: pod
          namespace:
            resource: namespace
      name:
        matches: "container_fs_writes_bytes_total"
        as: "disk_write_rate_kb"
      metricsQuery: sum(rate(container_fs_writes_bytes_total{<<.LabelMatchers>>}[5m])) by (<<.GroupBy>>) / 1024

0 comments on commit c3a373f

Please sign in to comment.