138 lines
3.6 KiB
Go
138 lines
3.6 KiB
Go
/*
|
|
Copyright 2017 The Kubernetes Authors.
|
|
|
|
Licensed under the Apache License, Version 2.0 (the "License");
|
|
you may not use this file except in compliance with the License.
|
|
You may obtain a copy of the License at
|
|
|
|
http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
Unless required by applicable law or agreed to in writing, software
|
|
distributed under the License is distributed on an "AS IS" BASIS,
|
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
See the License for the specific language governing permissions and
|
|
limitations under the License.
|
|
*/
|
|
|
|
package app
|
|
|
|
import (
|
|
"context"
|
|
"fmt"
|
|
"net/http"
|
|
"os"
|
|
"time"
|
|
|
|
"github.com/prometheus/client_golang/prometheus/promhttp"
|
|
|
|
"volcano.sh/volcano/cmd/scheduler/app/options"
|
|
"volcano.sh/volcano/pkg/apis/helpers"
|
|
"volcano.sh/volcano/pkg/kube"
|
|
"volcano.sh/volcano/pkg/scheduler"
|
|
"volcano.sh/volcano/pkg/version"
|
|
|
|
v1 "k8s.io/api/core/v1"
|
|
"k8s.io/apimachinery/pkg/util/uuid"
|
|
clientset "k8s.io/client-go/kubernetes"
|
|
"k8s.io/client-go/kubernetes/scheme"
|
|
corev1 "k8s.io/client-go/kubernetes/typed/core/v1"
|
|
"k8s.io/klog"
|
|
|
|
// Register gcp auth
|
|
_ "k8s.io/client-go/plugin/pkg/client/auth/gcp"
|
|
restclient "k8s.io/client-go/rest"
|
|
"k8s.io/client-go/tools/leaderelection"
|
|
"k8s.io/client-go/tools/leaderelection/resourcelock"
|
|
"k8s.io/client-go/tools/record"
|
|
)
|
|
|
|
// Leader election timings. Run passes these values unchanged to
// leaderelection.LeaderElectionConfig; see the client-go leaderelection
// package for the exact meaning of each field.
const (
	// leaseDuration is used as LeaderElectionConfig.LeaseDuration.
	leaseDuration = time.Second * 15
	// renewDeadline is used as LeaderElectionConfig.RenewDeadline.
	renewDeadline = time.Second * 10
	// retryPeriod is used as LeaderElectionConfig.RetryPeriod.
	retryPeriod = time.Second * 5
)
|
|
|
|
// Run the volcano scheduler
|
|
func Run(opt *options.ServerOption) error {
|
|
if opt.PrintVersion {
|
|
version.PrintVersionAndExit()
|
|
}
|
|
|
|
config, err := kube.BuildConfig(opt.KubeClientOptions)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
|
|
sched, err := scheduler.NewScheduler(config,
|
|
opt.SchedulerName,
|
|
opt.SchedulerConf,
|
|
opt.SchedulePeriod,
|
|
opt.DefaultQueue)
|
|
if err != nil {
|
|
panic(err)
|
|
}
|
|
|
|
go func() {
|
|
http.Handle("/metrics", promhttp.Handler())
|
|
klog.Fatalf("Prometheus Http Server failed %s", http.ListenAndServe(opt.ListenAddress, nil))
|
|
}()
|
|
|
|
if err := helpers.StartHealthz(opt.HealthzBindAddress, "volcano-scheduler"); err != nil {
|
|
return err
|
|
}
|
|
|
|
run := func(ctx context.Context) {
|
|
sched.Run(ctx.Done())
|
|
<-ctx.Done()
|
|
}
|
|
|
|
if !opt.EnableLeaderElection {
|
|
run(context.TODO())
|
|
return fmt.Errorf("finished without leader elect")
|
|
}
|
|
|
|
leaderElectionClient, err := clientset.NewForConfig(restclient.AddUserAgent(config, "leader-election"))
|
|
if err != nil {
|
|
return err
|
|
}
|
|
|
|
// Prepare event clients.
|
|
broadcaster := record.NewBroadcaster()
|
|
broadcaster.StartRecordingToSink(&corev1.EventSinkImpl{Interface: leaderElectionClient.CoreV1().Events(opt.LockObjectNamespace)})
|
|
eventRecorder := broadcaster.NewRecorder(scheme.Scheme, v1.EventSource{Component: opt.SchedulerName})
|
|
|
|
hostname, err := os.Hostname()
|
|
if err != nil {
|
|
return fmt.Errorf("unable to get hostname: %v", err)
|
|
}
|
|
// add a uniquifier so that two processes on the same host don't accidentally both become active
|
|
id := hostname + "_" + string(uuid.NewUUID())
|
|
|
|
rl, err := resourcelock.New(resourcelock.ConfigMapsResourceLock,
|
|
opt.LockObjectNamespace,
|
|
opt.SchedulerName,
|
|
leaderElectionClient.CoreV1(),
|
|
leaderElectionClient.CoordinationV1(),
|
|
resourcelock.ResourceLockConfig{
|
|
Identity: id,
|
|
EventRecorder: eventRecorder,
|
|
})
|
|
if err != nil {
|
|
return fmt.Errorf("couldn't create resource lock: %v", err)
|
|
}
|
|
|
|
leaderelection.RunOrDie(context.TODO(), leaderelection.LeaderElectionConfig{
|
|
Lock: rl,
|
|
LeaseDuration: leaseDuration,
|
|
RenewDeadline: renewDeadline,
|
|
RetryPeriod: retryPeriod,
|
|
Callbacks: leaderelection.LeaderCallbacks{
|
|
OnStartedLeading: run,
|
|
OnStoppedLeading: func() {
|
|
klog.Fatalf("leaderelection lost")
|
|
},
|
|
},
|
|
})
|
|
return fmt.Errorf("lost lease")
|
|
}
|