Skip to content

Commit

Permalink
Add leader election to the scheduler server
Browse files Browse the repository at this point in the history
Signed-off-by: rongfu.leng <[email protected]>
  • Loading branch information
lengrongfu committed Apr 12, 2024
1 parent 8381474 commit a55741e
Show file tree
Hide file tree
Showing 3 changed files with 10 additions and 3 deletions.
6 changes: 6 additions & 0 deletions charts/hami/templates/scheduler/deployment.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -47,6 +47,9 @@ spec:
- {{ . }}
{{- end }}
{{- end }}
- --leader-elect={{ .Values.scheduler.leaderElect }}
- --leader-elect-resource-name={{ .Values.schedulerName }}
- --leader-elect-resource-namespace={{ .Release.Namespace }}
volumeMounts:
- name: scheduler-config
mountPath: /config
Expand All @@ -71,6 +74,9 @@ spec:
- --default-cores={{ .Values.scheduler.defaultCores }}
- --iluvatar-memory={{ .Values.iluvatarResourceMem }}
- --iluvatar-cores={{ .Values.iluvatarResourceCore }}
- --leader-elect={{ .Values.scheduler.leaderElect }}
- --leader-elect-resource-name={{ .Values.schedulerName }}
- --leader-elect-resource-namespace={{ .Release.Namespace }}
{{- range .Values.scheduler.extender.extraArgs }}
- {{ . }}
{{- end }}
Expand Down
4 changes: 2 additions & 2 deletions charts/hami/values.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -2,7 +2,7 @@

nameOverride: ""
fullnameOverride: ""
imagePullSecrets: []
imagePullSecrets: [ ]
version: "v2.3.9"

# NVIDIA GPU Parameters
Expand Down Expand Up @@ -45,6 +45,7 @@ scheduler:
defaultCores: 0
defaultGPUNum: 1
metricsBindAddress: ":9395"
leaderElect: true
kubeScheduler:
# @param enabled indicates whether to run the kube-scheduler container in the scheduler pod; it is true by default.
enabled: true
Expand All @@ -56,7 +57,6 @@ scheduler:
- -v=4
extraArgs:
- --policy-config-file=/config/config.json
- --leader-elect=false
- -v=4
extender:
image: "projecthami/hami"
Expand Down
3 changes: 2 additions & 1 deletion cmd/scheduler/main.go
Original file line number Diff line number Diff line change
Expand Up @@ -57,6 +57,7 @@ func init() {
rootCmd.Flags().Int32Var(&config.DefaultCores, "default-cores", 0, "default gpu core percentage to allocate")
rootCmd.Flags().Int32Var(&config.DefaultResourceNum, "default-gpu", 1, "default gpu to allocate")
rootCmd.Flags().StringVar(&config.MetricsBindAddress, "metrics-bind-address", ":9395", "The TCP address that the scheduler should bind to for serving prometheus metrics(e.g. 127.0.0.1:9395, :9395)")

rootCmd.PersistentFlags().AddGoFlagSet(device.GlobalFlagSet())
rootCmd.AddCommand(version.VersionCmd)
rootCmd.Flags().AddGoFlagSet(util.InitKlogFlags())
Expand All @@ -65,7 +66,7 @@ func init() {
func start() {
sher = scheduler.NewScheduler()
sher.Start()
defer sher.Stop()
go sher.Stop()

// start monitor metrics
go sher.RegisterFromNodeAnnotations()
Expand Down

0 comments on commit a55741e

Please sign in to comment.