karmada/pkg/estimator/client/accurate.go

145 lines
5.1 KiB
Go

package client
import (
"context"
"fmt"
"time"
"google.golang.org/grpc/metadata"
utilerrors "k8s.io/apimachinery/pkg/util/errors"
clusterv1alpha1 "github.com/karmada-io/karmada/pkg/apis/cluster/v1alpha1"
workv1alpha2 "github.com/karmada-io/karmada/pkg/apis/work/v1alpha2"
"github.com/karmada-io/karmada/pkg/estimator/pb"
"github.com/karmada-io/karmada/pkg/util"
)
// RegisterSchedulerEstimator will register a SchedulerEstimator.
func RegisterSchedulerEstimator(se *SchedulerEstimator) {
replicaEstimators["scheduler-estimator"] = se
unschedulableReplicaEstimators["scheduler-estimator"] = se
}
type getClusterReplicasFunc func(ctx context.Context, cluster string) (int32, error)
// SchedulerEstimator is an estimator that calls karmada-scheduler-estimator for estimation.
type SchedulerEstimator struct {
cache *SchedulerEstimatorCache
timeout time.Duration
}
// NewSchedulerEstimator builds a new SchedulerEstimator.
func NewSchedulerEstimator(cache *SchedulerEstimatorCache, timeout time.Duration) *SchedulerEstimator {
return &SchedulerEstimator{
cache: cache,
timeout: timeout,
}
}
// MaxAvailableReplicas estimates the maximum replicas that can be applied to the target cluster by calling karmada-scheduler-estimator.
func (se *SchedulerEstimator) MaxAvailableReplicas(
parentCtx context.Context,
clusters []*clusterv1alpha1.Cluster,
replicaRequirements *workv1alpha2.ReplicaRequirements,
) ([]workv1alpha2.TargetCluster, error) {
clusterNames := make([]string, len(clusters))
for i, cluster := range clusters {
clusterNames[i] = cluster.Name
}
return getClusterReplicasConcurrently(parentCtx, clusterNames, se.timeout, func(ctx context.Context, cluster string) (int32, error) {
return se.maxAvailableReplicas(ctx, cluster, replicaRequirements.DeepCopy())
})
}
// GetUnschedulableReplicas gets the unschedulable replicas which belong to a specified workload by calling karmada-scheduler-estimator.
func (se *SchedulerEstimator) GetUnschedulableReplicas(
parentCtx context.Context,
clusters []string,
reference *workv1alpha2.ObjectReference,
unscheduableThreshold time.Duration,
) ([]workv1alpha2.TargetCluster, error) {
return getClusterReplicasConcurrently(parentCtx, clusters, se.timeout, func(ctx context.Context, cluster string) (int32, error) {
return se.maxUnscheduableReplicas(ctx, cluster, reference.DeepCopy(), unscheduableThreshold)
})
}
func (se *SchedulerEstimator) maxAvailableReplicas(ctx context.Context, cluster string, replicaRequirements *workv1alpha2.ReplicaRequirements) (int32, error) {
client, err := se.cache.GetClient(cluster)
if err != nil {
return UnauthenticReplica, err
}
req := &pb.MaxAvailableReplicasRequest{
Cluster: cluster,
ReplicaRequirements: pb.ReplicaRequirements{},
}
if replicaRequirements != nil {
req.ReplicaRequirements.ResourceRequest = replicaRequirements.ResourceRequest
if replicaRequirements.NodeClaim != nil {
req.ReplicaRequirements.NodeClaim = &pb.NodeClaim{
NodeAffinity: replicaRequirements.NodeClaim.HardNodeAffinity,
NodeSelector: replicaRequirements.NodeClaim.NodeSelector,
Tolerations: replicaRequirements.NodeClaim.Tolerations,
}
}
}
res, err := client.MaxAvailableReplicas(ctx, req)
if err != nil {
return UnauthenticReplica, fmt.Errorf("gRPC request cluster(%s) estimator error when calling MaxAvailableReplicas: %v", cluster, err)
}
return res.MaxReplicas, nil
}
func (se *SchedulerEstimator) maxUnscheduableReplicas(
ctx context.Context,
cluster string,
reference *workv1alpha2.ObjectReference,
threshold time.Duration,
) (int32, error) {
client, err := se.cache.GetClient(cluster)
if err != nil {
return UnauthenticReplica, err
}
req := &pb.UnschedulableReplicasRequest{
Cluster: cluster,
Resource: pb.ObjectReference{
APIVersion: reference.APIVersion,
Kind: reference.Kind,
Namespace: reference.Namespace,
Name: reference.Name,
},
UnschedulableThreshold: threshold,
}
res, err := client.GetUnschedulableReplicas(ctx, req)
if err != nil {
return UnauthenticReplica, fmt.Errorf("gRPC request cluster(%s) estimator error when calling UnschedulableReplicas: %v", cluster, err)
}
return res.UnschedulableReplicas, nil
}
func getClusterReplicasConcurrently(parentCtx context.Context, clusters []string,
timeout time.Duration, getClusterReplicas getClusterReplicasFunc) ([]workv1alpha2.TargetCluster, error) {
// add object information into gRPC metadata
if u, ok := parentCtx.Value(util.ContextKeyObject).(string); ok {
parentCtx = metadata.AppendToOutgoingContext(parentCtx, string(util.ContextKeyObject), u)
}
ctx, cancel := context.WithTimeout(parentCtx, timeout)
defer cancel()
clusterReplicas := make([]workv1alpha2.TargetCluster, len(clusters))
funcs := make([]func() error, len(clusters))
for index, cluster := range clusters {
localIndex, localCluster := index, cluster
funcs[index] = func() error {
replicas, err := getClusterReplicas(ctx, localCluster)
if err != nil {
return err
}
clusterReplicas[localIndex] = workv1alpha2.TargetCluster{Name: localCluster, Replicas: replicas}
return nil
}
}
return clusterReplicas, utilerrors.AggregateGoroutines(funcs...)
}