/* * Copyright 2020 The Dragonfly Authors * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. * You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ package scheduler import ( "context" "net/http" "time" "go.opentelemetry.io/contrib/instrumentation/google.golang.org/grpc/otelgrpc" "google.golang.org/grpc" "d7y.io/dragonfly/v2/cmd/dependency" logger "d7y.io/dragonfly/v2/internal/dflog" "d7y.io/dragonfly/v2/internal/dynconfig" "d7y.io/dragonfly/v2/pkg/dfpath" "d7y.io/dragonfly/v2/pkg/gc" "d7y.io/dragonfly/v2/pkg/rpc" "d7y.io/dragonfly/v2/pkg/rpc/manager" managerclient "d7y.io/dragonfly/v2/pkg/rpc/manager/client" "d7y.io/dragonfly/v2/scheduler/config" "d7y.io/dragonfly/v2/scheduler/core" "d7y.io/dragonfly/v2/scheduler/job" "d7y.io/dragonfly/v2/scheduler/metrics" "d7y.io/dragonfly/v2/scheduler/rpcserver" ) const ( gracefulStopTimeout = 10 * time.Second ) type Server struct { // Server configuration config *config.Config // GRPC server grpcServer *grpc.Server // Metrics server metricsServer *http.Server // Scheduler service service *core.SchedulerService // Manager client managerClient managerclient.Client // Dynamic config dynconfig config.DynconfigInterface // Async job job job.Job // GC server gc gc.GC } func New(cfg *config.Config, d dfpath.Dfpath) (*Server, error) { s := &Server{config: cfg} // Initialize manager client if cfg.Manager.Addr != "" { managerClient, err := managerclient.New(cfg.Manager.Addr) if err != nil { return nil, err } s.managerClient = managerClient // Register to manager if _, err := s.managerClient.UpdateScheduler(&manager.UpdateSchedulerRequest{ SourceType: manager.SourceType_SCHEDULER_SOURCE, HostName: s.config.Server.Host, Ip: s.config.Server.IP, Port: int32(s.config.Server.Port), Idc: s.config.Host.IDC, Location: s.config.Host.Location, SchedulerClusterId: uint64(s.config.Manager.SchedulerClusterID), }); err != nil { return nil, err } } // Initialize dynconfig client options := []dynconfig.Option{dynconfig.WithLocalConfigPath(dependency.GetConfigPath("scheduler"))} if s.managerClient != nil && cfg.DynConfig.Type == dynconfig.ManagerSourceType { options = append(options, dynconfig.WithManagerClient(config.NewManagerClient(s.managerClient, cfg)), dynconfig.WithExpireTime(cfg.DynConfig.ExpireTime), ) } dynConfig, err := config.NewDynconfig(cfg.DynConfig.Type, d.CacheDir(), cfg.DynConfig.CDNDirPath, options...) if err != nil { return nil, err } s.dynconfig = dynConfig // Initialize GC s.gc = gc.New(gc.WithLogger(logger.MetaGCLogger)) // Initialize scheduler service var openTel bool if cfg.Options.Telemetry.Jaeger != "" { openTel = true } service, err := core.NewSchedulerService(cfg.Scheduler, d.PluginDir(), cfg.Metrics, dynConfig, s.gc, core.WithDisableCDN(cfg.DisableCDN), core.WithOpenTel(openTel)) if err != nil { return nil, err } s.service = service // Initialize grpc service var opts []grpc.ServerOption if s.config.Options.Telemetry.Jaeger != "" { opts = append(opts, grpc.ChainUnaryInterceptor(otelgrpc.UnaryServerInterceptor()), grpc.ChainStreamInterceptor(otelgrpc.StreamServerInterceptor())) } grpcServer, err := rpcserver.New(s.service, opts...) if err != nil { return nil, err } s.grpcServer = grpcServer // Initialize prometheus if cfg.Metrics != nil { s.metricsServer = metrics.New(cfg.Metrics, grpcServer) } // Initialize job service if cfg.Job.Redis.Host != "" { s.job, err = job.New(context.Background(), cfg.Job, cfg.Manager.SchedulerClusterID, cfg.Server.Host, s.service) if err != nil { return nil, err } } return s, nil } func (s *Server) Serve() error { // Serve dynConfig go func() { if err := s.dynconfig.Serve(); err != nil { logger.Fatalf("dynconfig start failed %v", err) } logger.Info("dynconfig start successfully") }() // Serve GC s.gc.Serve() logger.Info("gc start successfully") // Serve service go func() { s.service.Serve() logger.Info("scheduler service start successfully") }() // Serve Job if s.job != nil { go func() { if err := s.job.Serve(); err != nil { logger.Fatalf("job start failed %v", err) } logger.Info("job start successfully") }() } // Started metrics server if s.metricsServer != nil { go func() { logger.Infof("started metrics server at %s", s.metricsServer.Addr) if err := s.metricsServer.ListenAndServe(); err != nil { if err == http.ErrServerClosed { return } logger.Fatalf("metrics server closed unexpect: %v", err) } }() } // Serve Keepalive if s.managerClient != nil { go func() { logger.Info("start keepalive to manager") s.managerClient.KeepAlive(s.config.Manager.KeepAlive.Interval, &manager.KeepAliveRequest{ HostName: s.config.Server.Host, SourceType: manager.SourceType_SCHEDULER_SOURCE, ClusterId: uint64(s.config.Manager.SchedulerClusterID), }) }() } // Generate GRPC listener lis, _, err := rpc.ListenWithPortRange(s.config.Server.IP, s.config.Server.Port, s.config.Server.Port) if err != nil { logger.Fatalf("net listener failed to start: %v", err) } defer lis.Close() // Started GRPC server logger.Infof("started grpc server at %s://%s", lis.Addr().Network(), lis.Addr().String()) if err := s.grpcServer.Serve(lis); err != nil { logger.Errorf("stoped grpc server: %v", err) return err } return nil } func (s *Server) Stop() { // Stop dynconfig server if err := s.dynconfig.Stop(); err != nil { logger.Errorf("dynconfig client closed failed %v", err) } logger.Info("dynconfig client closed") // Stop manager client if s.managerClient != nil { if err := s.managerClient.Close(); err != nil { logger.Errorf("manager client failed to stop: %v", err) } logger.Info("manager client closed") } // Stop GC s.gc.Stop() logger.Info("gc closed") // Stop scheduler service s.service.Stop() logger.Info("scheduler service closed") // Stop metrics server if s.metricsServer != nil { if err := s.metricsServer.Shutdown(context.Background()); err != nil { logger.Errorf("metrics server failed to stop: %v", err) } logger.Info("metrics server closed under request") } // Stop GRPC server stopped := make(chan struct{}) go func() { s.grpcServer.GracefulStop() logger.Info("grpc server closed under request") close(stopped) }() t := time.NewTimer(gracefulStopTimeout) select { case <-t.C: s.grpcServer.Stop() case <-stopped: t.Stop() } }