1169 lines
47 KiB
Go
1169 lines
47 KiB
Go
package detector
|
|
|
|
import (
|
|
"context"
|
|
"fmt"
|
|
"regexp"
|
|
"sync"
|
|
"time"
|
|
|
|
corev1 "k8s.io/api/core/v1"
|
|
apierrors "k8s.io/apimachinery/pkg/api/errors"
|
|
"k8s.io/apimachinery/pkg/api/meta"
|
|
metav1 "k8s.io/apimachinery/pkg/apis/meta/v1"
|
|
"k8s.io/apimachinery/pkg/apis/meta/v1/unstructured"
|
|
"k8s.io/apimachinery/pkg/labels"
|
|
"k8s.io/apimachinery/pkg/runtime"
|
|
"k8s.io/apimachinery/pkg/runtime/schema"
|
|
"k8s.io/apimachinery/pkg/util/errors"
|
|
"k8s.io/apimachinery/pkg/util/wait"
|
|
"k8s.io/client-go/discovery"
|
|
"k8s.io/client-go/dynamic"
|
|
"k8s.io/client-go/tools/cache"
|
|
"k8s.io/client-go/tools/record"
|
|
"k8s.io/client-go/util/retry"
|
|
"k8s.io/klog/v2"
|
|
"sigs.k8s.io/controller-runtime/pkg/client"
|
|
"sigs.k8s.io/controller-runtime/pkg/controller/controllerutil"
|
|
"sigs.k8s.io/controller-runtime/pkg/manager"
|
|
|
|
configv1alpha1 "github.com/karmada-io/karmada/pkg/apis/config/v1alpha1"
|
|
policyv1alpha1 "github.com/karmada-io/karmada/pkg/apis/policy/v1alpha1"
|
|
workv1alpha2 "github.com/karmada-io/karmada/pkg/apis/work/v1alpha2"
|
|
"github.com/karmada-io/karmada/pkg/events"
|
|
"github.com/karmada-io/karmada/pkg/metrics"
|
|
"github.com/karmada-io/karmada/pkg/resourceinterpreter"
|
|
"github.com/karmada-io/karmada/pkg/sharedcli/ratelimiterflag"
|
|
"github.com/karmada-io/karmada/pkg/util"
|
|
"github.com/karmada-io/karmada/pkg/util/fedinformer"
|
|
"github.com/karmada-io/karmada/pkg/util/fedinformer/genericmanager"
|
|
"github.com/karmada-io/karmada/pkg/util/fedinformer/keys"
|
|
"github.com/karmada-io/karmada/pkg/util/helper"
|
|
"github.com/karmada-io/karmada/pkg/util/lifted"
|
|
"github.com/karmada-io/karmada/pkg/util/names"
|
|
"github.com/karmada-io/karmada/pkg/util/restmapper"
|
|
)
|
|
|
|
// ResourceDetector is a resource watcher which watches all resources and reconcile the events.
|
|
type ResourceDetector struct {
|
|
// DiscoveryClientSet is used to resource discovery.
|
|
DiscoveryClientSet *discovery.DiscoveryClient
|
|
// Client is used to retrieve objects, it is often more convenient than lister.
|
|
Client client.Client
|
|
// DynamicClient used to fetch arbitrary resources.
|
|
DynamicClient dynamic.Interface
|
|
InformerManager genericmanager.SingleClusterInformerManager
|
|
EventHandler cache.ResourceEventHandler
|
|
Processor util.AsyncWorker
|
|
SkippedResourceConfig *util.SkippedResourceConfig
|
|
SkippedPropagatingNamespaces []*regexp.Regexp
|
|
// ResourceInterpreter knows the details of resource structure.
|
|
ResourceInterpreter resourceinterpreter.ResourceInterpreter
|
|
EventRecorder record.EventRecorder
|
|
// policyReconcileWorker maintains a rate limited queue which used to store PropagationPolicy's key and
|
|
// a reconcile function to consume the items in queue.
|
|
policyReconcileWorker util.AsyncWorker
|
|
propagationPolicyLister cache.GenericLister
|
|
|
|
// clusterPolicyReconcileWorker maintains a rate limited queue which used to store ClusterPropagationPolicy's key and
|
|
// a reconcile function to consume the items in queue.
|
|
clusterPolicyReconcileWorker util.AsyncWorker
|
|
clusterPropagationPolicyLister cache.GenericLister
|
|
|
|
RESTMapper meta.RESTMapper
|
|
|
|
// waitingObjects tracks of objects which haven't be propagated yet as lack of appropriate policies.
|
|
waitingObjects map[keys.ClusterWideKey]struct{}
|
|
// waitingLock is the lock for waitingObjects operation.
|
|
waitingLock sync.RWMutex
|
|
// ConcurrentResourceTemplateSyncs is the number of resource templates that are allowed to sync concurrently.
|
|
// Larger number means responsive resource template syncing but more CPU(and network) load.
|
|
ConcurrentResourceTemplateSyncs int
|
|
|
|
// RateLimiterOptions is the configuration for rate limiter which may significantly influence the performance of
|
|
// the controller.
|
|
RateLimiterOptions ratelimiterflag.Options
|
|
|
|
stopCh <-chan struct{}
|
|
}
|
|
|
|
// Start runs the detector, never stop until stopCh closed.
|
|
func (d *ResourceDetector) Start(ctx context.Context) error {
|
|
klog.Infof("Starting resource detector.")
|
|
d.waitingObjects = make(map[keys.ClusterWideKey]struct{})
|
|
d.stopCh = ctx.Done()
|
|
|
|
// setup policy reconcile worker
|
|
policyWorkerOptions := util.Options{
|
|
Name: "propagationPolicy reconciler",
|
|
KeyFunc: ClusterWideKeyFunc,
|
|
ReconcileFunc: d.ReconcilePropagationPolicy,
|
|
}
|
|
d.policyReconcileWorker = util.NewAsyncWorker(policyWorkerOptions)
|
|
d.policyReconcileWorker.Run(1, d.stopCh)
|
|
clusterPolicyWorkerOptions := util.Options{
|
|
Name: "clusterPropagationPolicy reconciler",
|
|
KeyFunc: ClusterWideKeyFunc,
|
|
ReconcileFunc: d.ReconcileClusterPropagationPolicy,
|
|
}
|
|
d.clusterPolicyReconcileWorker = util.NewAsyncWorker(clusterPolicyWorkerOptions)
|
|
d.clusterPolicyReconcileWorker.Run(1, d.stopCh)
|
|
|
|
// watch and enqueue PropagationPolicy changes.
|
|
propagationPolicyGVR := schema.GroupVersionResource{
|
|
Group: policyv1alpha1.GroupVersion.Group,
|
|
Version: policyv1alpha1.GroupVersion.Version,
|
|
Resource: "propagationpolicies",
|
|
}
|
|
policyHandler := fedinformer.NewHandlerOnEvents(d.OnPropagationPolicyAdd, d.OnPropagationPolicyUpdate, d.OnPropagationPolicyDelete)
|
|
d.InformerManager.ForResource(propagationPolicyGVR, policyHandler)
|
|
d.propagationPolicyLister = d.InformerManager.Lister(propagationPolicyGVR)
|
|
|
|
// watch and enqueue ClusterPropagationPolicy changes.
|
|
clusterPropagationPolicyGVR := schema.GroupVersionResource{
|
|
Group: policyv1alpha1.GroupVersion.Group,
|
|
Version: policyv1alpha1.GroupVersion.Version,
|
|
Resource: "clusterpropagationpolicies",
|
|
}
|
|
clusterPolicyHandler := fedinformer.NewHandlerOnEvents(d.OnClusterPropagationPolicyAdd, d.OnClusterPropagationPolicyUpdate, d.OnClusterPropagationPolicyDelete)
|
|
d.InformerManager.ForResource(clusterPropagationPolicyGVR, clusterPolicyHandler)
|
|
d.clusterPropagationPolicyLister = d.InformerManager.Lister(clusterPropagationPolicyGVR)
|
|
|
|
detectorWorkerOptions := util.Options{
|
|
Name: "resource detector",
|
|
KeyFunc: ClusterWideKeyFunc,
|
|
ReconcileFunc: d.Reconcile,
|
|
RateLimiterOptions: d.RateLimiterOptions,
|
|
}
|
|
|
|
d.EventHandler = fedinformer.NewFilteringHandlerOnAllEvents(d.EventFilter, d.OnAdd, d.OnUpdate, d.OnDelete)
|
|
d.Processor = util.NewAsyncWorker(detectorWorkerOptions)
|
|
d.Processor.Run(d.ConcurrentResourceTemplateSyncs, d.stopCh)
|
|
go d.discoverResources(30 * time.Second)
|
|
|
|
<-d.stopCh
|
|
klog.Infof("Stopped as stopCh closed.")
|
|
return nil
|
|
}
|
|
|
|
// Check if our ResourceDetector implements necessary interfaces
|
|
var (
|
|
_ manager.Runnable = &ResourceDetector{}
|
|
_ manager.LeaderElectionRunnable = &ResourceDetector{}
|
|
)
|
|
|
|
func (d *ResourceDetector) discoverResources(period time.Duration) {
|
|
wait.Until(func() {
|
|
newResources := lifted.GetDeletableResources(d.DiscoveryClientSet)
|
|
for r := range newResources {
|
|
if d.InformerManager.IsHandlerExist(r, d.EventHandler) || d.gvrDisabled(r) {
|
|
continue
|
|
}
|
|
klog.Infof("Setup informer for %s", r.String())
|
|
d.InformerManager.ForResource(r, d.EventHandler)
|
|
}
|
|
d.InformerManager.Start()
|
|
}, period, d.stopCh)
|
|
}
|
|
|
|
// gvrDisabled returns whether GroupVersionResource is disabled.
|
|
func (d *ResourceDetector) gvrDisabled(gvr schema.GroupVersionResource) bool {
|
|
if d.SkippedResourceConfig == nil {
|
|
return false
|
|
}
|
|
|
|
if d.SkippedResourceConfig.GroupVersionDisabled(gvr.GroupVersion()) {
|
|
return true
|
|
}
|
|
if d.SkippedResourceConfig.GroupDisabled(gvr.Group) {
|
|
return true
|
|
}
|
|
|
|
gvks, err := d.RESTMapper.KindsFor(gvr)
|
|
if err != nil {
|
|
klog.Errorf("gvr(%s) transform failed: %v", gvr.String(), err)
|
|
return false
|
|
}
|
|
|
|
for _, gvk := range gvks {
|
|
if d.SkippedResourceConfig.GroupVersionKindDisabled(gvk) {
|
|
return true
|
|
}
|
|
}
|
|
|
|
return false
|
|
}
|
|
|
|
// NeedLeaderElection implements LeaderElectionRunnable interface.
|
|
// So that the detector could run in the leader election mode.
|
|
func (d *ResourceDetector) NeedLeaderElection() bool {
|
|
return true
|
|
}
|
|
|
|
// Reconcile performs a full reconciliation for the object referred to by the key.
|
|
// The key will be re-queued if an error is non-nil.
|
|
func (d *ResourceDetector) Reconcile(key util.QueueKey) error {
|
|
clusterWideKey, ok := key.(keys.ClusterWideKey)
|
|
if !ok {
|
|
klog.Error("Invalid key")
|
|
return fmt.Errorf("invalid key")
|
|
}
|
|
klog.Infof("Reconciling object: %s", clusterWideKey)
|
|
|
|
object, err := d.GetUnstructuredObject(clusterWideKey)
|
|
if err != nil {
|
|
if apierrors.IsNotFound(err) {
|
|
// The resource may no longer exist, in which case we try (may not exist in waiting list) remove it from waiting list and stop processing.
|
|
d.RemoveWaiting(clusterWideKey)
|
|
|
|
// Once resource be deleted, the derived ResourceBinding or ClusterResourceBinding also need to be cleaned up,
|
|
// currently we do that by setting owner reference to derived objects.
|
|
return nil
|
|
}
|
|
klog.Errorf("Failed to get unstructured object(%s), error: %v", clusterWideKey, err)
|
|
return err
|
|
}
|
|
|
|
return d.propagateResource(object, clusterWideKey)
|
|
}
|
|
|
|
// EventFilter tells if an object should be take care of.
|
|
//
|
|
// All objects under Kubernetes reserved namespace should be ignored:
|
|
// - kube-*
|
|
// All objects under Karmada reserved namespace should be ignored:
|
|
// - karmada-system
|
|
// - karmada-cluster
|
|
// - karmada-es-*
|
|
//
|
|
// If '--skipped-propagating-namespaces' is specified, all APIs in the skipped-propagating-namespaces will be ignored.
|
|
func (d *ResourceDetector) EventFilter(obj interface{}) bool {
|
|
key, err := ClusterWideKeyFunc(obj)
|
|
if err != nil {
|
|
return false
|
|
}
|
|
|
|
clusterWideKey, ok := key.(keys.ClusterWideKey)
|
|
if !ok {
|
|
klog.Errorf("Invalid key")
|
|
return false
|
|
}
|
|
|
|
if names.IsReservedNamespace(clusterWideKey.Namespace) {
|
|
return false
|
|
}
|
|
|
|
// if SkippedPropagatingNamespaces is set, skip object events in these namespaces.
|
|
for _, nsRegexp := range d.SkippedPropagatingNamespaces {
|
|
if match := nsRegexp.MatchString(clusterWideKey.Namespace); match {
|
|
return false
|
|
}
|
|
}
|
|
|
|
if unstructObj, ok := obj.(*unstructured.Unstructured); ok {
|
|
switch unstructObj.GroupVersionKind() {
|
|
// The secret, with type 'kubernetes.io/service-account-token', is created along with `ServiceAccount` should be
|
|
// prevented from propagating.
|
|
// Refer to https://github.com/karmada-io/karmada/pull/1525#issuecomment-1091030659 for more details.
|
|
case corev1.SchemeGroupVersion.WithKind("Secret"):
|
|
secretType, found, _ := unstructured.NestedString(unstructObj.Object, "type")
|
|
if found && secretType == string(corev1.SecretTypeServiceAccountToken) {
|
|
return false
|
|
}
|
|
}
|
|
}
|
|
|
|
return true
|
|
}
|
|
|
|
// OnAdd handles object add event and push the object to queue.
|
|
func (d *ResourceDetector) OnAdd(obj interface{}) {
|
|
runtimeObj, ok := obj.(runtime.Object)
|
|
if !ok {
|
|
return
|
|
}
|
|
d.Processor.Enqueue(runtimeObj)
|
|
}
|
|
|
|
// OnUpdate handles object update event and push the object to queue.
|
|
func (d *ResourceDetector) OnUpdate(oldObj, newObj interface{}) {
|
|
unstructuredOldObj, err := helper.ToUnstructured(oldObj)
|
|
if err != nil {
|
|
klog.Errorf("Failed to transform oldObj, error: %v", err)
|
|
return
|
|
}
|
|
|
|
unstructuredNewObj, err := helper.ToUnstructured(newObj)
|
|
if err != nil {
|
|
klog.Errorf("Failed to transform newObj, error: %v", err)
|
|
return
|
|
}
|
|
|
|
if !SpecificationChanged(unstructuredOldObj, unstructuredNewObj) {
|
|
klog.V(4).Infof("Ignore update event of object (kind=%s, %s/%s) as specification no change", unstructuredOldObj.GetKind(), unstructuredOldObj.GetNamespace(), unstructuredOldObj.GetName())
|
|
return
|
|
}
|
|
|
|
d.OnAdd(newObj)
|
|
}
|
|
|
|
// OnDelete handles object delete event and push the object to queue.
|
|
func (d *ResourceDetector) OnDelete(obj interface{}) {
|
|
d.OnAdd(obj)
|
|
}
|
|
|
|
// LookForMatchedPolicy tries to find a policy for object referenced by object key.
|
|
func (d *ResourceDetector) LookForMatchedPolicy(object *unstructured.Unstructured, objectKey keys.ClusterWideKey) (*policyv1alpha1.PropagationPolicy, error) {
|
|
if len(objectKey.Namespace) == 0 {
|
|
return nil, nil
|
|
}
|
|
|
|
klog.V(2).Infof("Attempts to match policy for resource(%s)", objectKey)
|
|
policyObjects, err := d.propagationPolicyLister.ByNamespace(objectKey.Namespace).List(labels.Everything())
|
|
if err != nil {
|
|
klog.Errorf("Failed to list propagation policy: %v", err)
|
|
return nil, err
|
|
}
|
|
if len(policyObjects) == 0 {
|
|
klog.V(2).Infof("No propagationpolicy find in namespace(%s).", objectKey.Namespace)
|
|
return nil, nil
|
|
}
|
|
|
|
policyList := make([]*policyv1alpha1.PropagationPolicy, 0)
|
|
for index := range policyObjects {
|
|
policy := &policyv1alpha1.PropagationPolicy{}
|
|
if err = helper.ConvertToTypedObject(policyObjects[index], policy); err != nil {
|
|
klog.Errorf("Failed to convert PropagationPolicy from unstructured object: %v", err)
|
|
return nil, err
|
|
}
|
|
policyList = append(policyList, policy)
|
|
}
|
|
|
|
return getHighestPriorityPropagationPolicy(policyList, object, objectKey), nil
|
|
}
|
|
|
|
// LookForMatchedClusterPolicy tries to find a ClusterPropagationPolicy for object referenced by object key.
|
|
func (d *ResourceDetector) LookForMatchedClusterPolicy(object *unstructured.Unstructured, objectKey keys.ClusterWideKey) (*policyv1alpha1.ClusterPropagationPolicy, error) {
|
|
klog.V(2).Infof("Attempts to match cluster policy for resource(%s)", objectKey)
|
|
policyObjects, err := d.clusterPropagationPolicyLister.List(labels.Everything())
|
|
if err != nil {
|
|
klog.Errorf("Failed to list cluster propagation policy: %v", err)
|
|
return nil, err
|
|
}
|
|
if len(policyObjects) == 0 {
|
|
klog.V(2).Infof("No clusterpropagationpolicy find.")
|
|
return nil, nil
|
|
}
|
|
|
|
policyList := make([]*policyv1alpha1.ClusterPropagationPolicy, 0)
|
|
for index := range policyObjects {
|
|
policy := &policyv1alpha1.ClusterPropagationPolicy{}
|
|
if err = helper.ConvertToTypedObject(policyObjects[index], policy); err != nil {
|
|
klog.Errorf("Failed to convert ClusterPropagationPolicy from unstructured object: %v", err)
|
|
return nil, err
|
|
}
|
|
policyList = append(policyList, policy)
|
|
}
|
|
|
|
return getHighestPriorityClusterPropagationPolicy(policyList, object, objectKey), nil
|
|
}
|
|
|
|
// ApplyPolicy starts propagate the object referenced by object key according to PropagationPolicy.
|
|
func (d *ResourceDetector) ApplyPolicy(object *unstructured.Unstructured, objectKey keys.ClusterWideKey, policy *policyv1alpha1.PropagationPolicy) (err error) {
|
|
start := time.Now()
|
|
klog.Infof("Applying policy(%s/%s) for object: %s", policy.Namespace, policy.Name, objectKey)
|
|
var operationResult controllerutil.OperationResult
|
|
defer func() {
|
|
metrics.ObserveApplyPolicyAttemptAndLatency(object, policy.ObjectMeta, err, start)
|
|
if err != nil {
|
|
d.EventRecorder.Eventf(object, corev1.EventTypeWarning, events.EventReasonApplyPolicyFailed, "Apply policy(%s/%s) failed: %v", policy.Namespace, policy.Name, err)
|
|
} else if operationResult != controllerutil.OperationResultNone {
|
|
d.EventRecorder.Eventf(object, corev1.EventTypeNormal, events.EventReasonApplyPolicySucceed, "Apply policy(%s/%s) succeed", policy.Namespace, policy.Name)
|
|
}
|
|
}()
|
|
|
|
if err := d.ClaimPolicyForObject(object, policy.Namespace, policy.Name); err != nil {
|
|
klog.Errorf("Failed to claim policy(%s) for object: %s", policy.Name, object)
|
|
return err
|
|
}
|
|
|
|
policyLabels := map[string]string{
|
|
policyv1alpha1.PropagationPolicyNamespaceLabel: policy.GetNamespace(),
|
|
policyv1alpha1.PropagationPolicyNameLabel: policy.GetName(),
|
|
}
|
|
|
|
binding, err := d.BuildResourceBinding(object, objectKey, policyLabels, &policy.Spec)
|
|
if err != nil {
|
|
klog.Errorf("Failed to build resourceBinding for object: %s. error: %v", objectKey, err)
|
|
return err
|
|
}
|
|
bindingCopy := binding.DeepCopy()
|
|
err = retry.RetryOnConflict(retry.DefaultRetry, func() (err error) {
|
|
operationResult, err = controllerutil.CreateOrUpdate(context.TODO(), d.Client, bindingCopy, func() error {
|
|
// If this binding exists and its owner is not the input object, return error and let garbage collector
|
|
// delete this binding and try again later. See https://github.com/karmada-io/karmada/issues/2090.
|
|
if ownerRef := metav1.GetControllerOfNoCopy(bindingCopy); ownerRef != nil && ownerRef.UID != object.GetUID() {
|
|
return fmt.Errorf("failed to update binding due to different owner reference UID, will " +
|
|
"try again later after binding is garbage collected, see https://github.com/karmada-io/karmada/issues/2090")
|
|
}
|
|
// Just update necessary fields, especially avoid modifying Spec.Clusters which is scheduling result, if already exists.
|
|
bindingCopy.Labels = util.DedupeAndMergeLabels(bindingCopy.Labels, binding.Labels)
|
|
bindingCopy.OwnerReferences = binding.OwnerReferences
|
|
bindingCopy.Finalizers = binding.Finalizers
|
|
bindingCopy.Spec.Resource = binding.Spec.Resource
|
|
bindingCopy.Spec.ReplicaRequirements = binding.Spec.ReplicaRequirements
|
|
bindingCopy.Spec.Replicas = binding.Spec.Replicas
|
|
bindingCopy.Spec.PropagateDeps = binding.Spec.PropagateDeps
|
|
bindingCopy.Spec.SchedulerName = binding.Spec.SchedulerName
|
|
bindingCopy.Spec.Placement = binding.Spec.Placement
|
|
bindingCopy.Spec.Failover = binding.Spec.Failover
|
|
return nil
|
|
})
|
|
if err != nil {
|
|
return err
|
|
}
|
|
return nil
|
|
})
|
|
if err != nil {
|
|
klog.Errorf("Failed to apply policy(%s) for object: %s. error: %v", policy.Name, objectKey, err)
|
|
return err
|
|
}
|
|
|
|
if operationResult == controllerutil.OperationResultCreated {
|
|
klog.Infof("Create ResourceBinding(%s/%s) successfully.", binding.GetNamespace(), binding.GetName())
|
|
} else if operationResult == controllerutil.OperationResultUpdated {
|
|
klog.Infof("Update ResourceBinding(%s/%s) successfully.", binding.GetNamespace(), binding.GetName())
|
|
} else {
|
|
klog.V(2).Infof("ResourceBinding(%s/%s) is up to date.", binding.GetNamespace(), binding.GetName())
|
|
}
|
|
|
|
return nil
|
|
}
|
|
|
|
// ApplyClusterPolicy starts propagate the object referenced by object key according to ClusterPropagationPolicy.
|
|
// nolint:gocyclo
|
|
func (d *ResourceDetector) ApplyClusterPolicy(object *unstructured.Unstructured, objectKey keys.ClusterWideKey, policy *policyv1alpha1.ClusterPropagationPolicy) (err error) {
|
|
start := time.Now()
|
|
klog.Infof("Applying cluster policy(%s) for object: %s", policy.Name, objectKey)
|
|
var operationResult controllerutil.OperationResult
|
|
defer func() {
|
|
metrics.ObserveApplyPolicyAttemptAndLatency(object, policy.ObjectMeta, err, start)
|
|
if err != nil {
|
|
d.EventRecorder.Eventf(object, corev1.EventTypeWarning, events.EventReasonApplyPolicyFailed, "Apply cluster policy(%s) failed: %v", policy.Name, err)
|
|
} else if operationResult != controllerutil.OperationResultNone {
|
|
d.EventRecorder.Eventf(object, corev1.EventTypeNormal, events.EventReasonApplyPolicySucceed, "Apply cluster policy(%s) succeed", policy.Name)
|
|
}
|
|
}()
|
|
|
|
if err := d.ClaimClusterPolicyForObject(object, policy.Name); err != nil {
|
|
klog.Errorf("Failed to claim cluster policy(%s) for object: %s", policy.Name, object)
|
|
return err
|
|
}
|
|
|
|
policyLabels := map[string]string{
|
|
policyv1alpha1.ClusterPropagationPolicyLabel: policy.GetName(),
|
|
}
|
|
|
|
// Build `ResourceBinding` or `ClusterResourceBinding` according to the resource template's scope.
|
|
// For namespace-scoped resources, which namespace is not empty, building `ResourceBinding`.
|
|
// For cluster-scoped resources, which namespace is empty, building `ClusterResourceBinding`.
|
|
if object.GetNamespace() != "" {
|
|
binding, err := d.BuildResourceBinding(object, objectKey, policyLabels, &policy.Spec)
|
|
if err != nil {
|
|
klog.Errorf("Failed to build resourceBinding for object: %s. error: %v", objectKey, err)
|
|
return err
|
|
}
|
|
bindingCopy := binding.DeepCopy()
|
|
err = retry.RetryOnConflict(retry.DefaultRetry, func() (err error) {
|
|
operationResult, err = controllerutil.CreateOrUpdate(context.TODO(), d.Client, bindingCopy, func() error {
|
|
// If this binding exists and its owner is not the input object, return error and let garbage collector
|
|
// delete this binding and try again later. See https://github.com/karmada-io/karmada/issues/2090.
|
|
if ownerRef := metav1.GetControllerOfNoCopy(bindingCopy); ownerRef != nil && ownerRef.UID != object.GetUID() {
|
|
return fmt.Errorf("failed to update binding due to different owner reference UID, will " +
|
|
"try again later after binding is garbage collected, see https://github.com/karmada-io/karmada/issues/2090")
|
|
}
|
|
// Just update necessary fields, especially avoid modifying Spec.Clusters which is scheduling result, if already exists.
|
|
bindingCopy.Labels = util.DedupeAndMergeLabels(bindingCopy.Labels, binding.Labels)
|
|
bindingCopy.OwnerReferences = binding.OwnerReferences
|
|
bindingCopy.Finalizers = binding.Finalizers
|
|
bindingCopy.Spec.Resource = binding.Spec.Resource
|
|
bindingCopy.Spec.ReplicaRequirements = binding.Spec.ReplicaRequirements
|
|
bindingCopy.Spec.Replicas = binding.Spec.Replicas
|
|
bindingCopy.Spec.PropagateDeps = binding.Spec.PropagateDeps
|
|
bindingCopy.Spec.SchedulerName = binding.Spec.SchedulerName
|
|
bindingCopy.Spec.Placement = binding.Spec.Placement
|
|
bindingCopy.Spec.Failover = binding.Spec.Failover
|
|
return nil
|
|
})
|
|
if err != nil {
|
|
return err
|
|
}
|
|
return nil
|
|
})
|
|
|
|
if err != nil {
|
|
klog.Errorf("Failed to apply cluster policy(%s) for object: %s. error: %v", policy.Name, objectKey, err)
|
|
return err
|
|
}
|
|
|
|
if operationResult == controllerutil.OperationResultCreated {
|
|
klog.Infof("Create ResourceBinding(%s) successfully.", binding.GetName())
|
|
} else if operationResult == controllerutil.OperationResultUpdated {
|
|
klog.Infof("Update ResourceBinding(%s) successfully.", binding.GetName())
|
|
} else {
|
|
klog.V(2).Infof("ResourceBinding(%s) is up to date.", binding.GetName())
|
|
}
|
|
} else {
|
|
binding, err := d.BuildClusterResourceBinding(object, objectKey, policyLabels, &policy.Spec)
|
|
if err != nil {
|
|
klog.Errorf("Failed to build clusterResourceBinding for object: %s. error: %v", objectKey, err)
|
|
return err
|
|
}
|
|
bindingCopy := binding.DeepCopy()
|
|
operationResult, err = controllerutil.CreateOrUpdate(context.TODO(), d.Client, bindingCopy, func() error {
|
|
// If this binding exists and its owner is not the input object, return error and let garbage collector
|
|
// delete this binding and try again later. See https://github.com/karmada-io/karmada/issues/2090.
|
|
if ownerRef := metav1.GetControllerOfNoCopy(bindingCopy); ownerRef != nil && ownerRef.UID != object.GetUID() {
|
|
return fmt.Errorf("failed to update binding due to different owner reference UID, will " +
|
|
"try again later after binding is garbage collected, see https://github.com/karmada-io/karmada/issues/2090")
|
|
}
|
|
// Just update necessary fields, especially avoid modifying Spec.Clusters which is scheduling result, if already exists.
|
|
bindingCopy.Labels = util.DedupeAndMergeLabels(bindingCopy.Labels, binding.Labels)
|
|
bindingCopy.OwnerReferences = binding.OwnerReferences
|
|
bindingCopy.Finalizers = binding.Finalizers
|
|
bindingCopy.Spec.Resource = binding.Spec.Resource
|
|
bindingCopy.Spec.ReplicaRequirements = binding.Spec.ReplicaRequirements
|
|
bindingCopy.Spec.Replicas = binding.Spec.Replicas
|
|
bindingCopy.Spec.SchedulerName = binding.Spec.SchedulerName
|
|
bindingCopy.Spec.Placement = binding.Spec.Placement
|
|
bindingCopy.Spec.Failover = binding.Spec.Failover
|
|
return nil
|
|
})
|
|
if err != nil {
|
|
klog.Errorf("Failed to apply cluster policy(%s) for object: %s. error: %v", policy.Name, objectKey, err)
|
|
return err
|
|
}
|
|
|
|
if operationResult == controllerutil.OperationResultCreated {
|
|
klog.Infof("Create ClusterResourceBinding(%s) successfully.", binding.GetName())
|
|
} else if operationResult == controllerutil.OperationResultUpdated {
|
|
klog.Infof("Update ClusterResourceBinding(%s) successfully.", binding.GetName())
|
|
} else {
|
|
klog.V(2).Infof("ClusterResourceBinding(%s) is up to date.", binding.GetName())
|
|
}
|
|
}
|
|
|
|
return nil
|
|
}
|
|
|
|
// GetUnstructuredObject retrieves object by key and returned its unstructured.
|
|
func (d *ResourceDetector) GetUnstructuredObject(objectKey keys.ClusterWideKey) (*unstructured.Unstructured, error) {
|
|
objectGVR, err := restmapper.GetGroupVersionResource(d.RESTMapper, objectKey.GroupVersionKind())
|
|
if err != nil {
|
|
klog.Errorf("Failed to get GVR of object: %s, error: %v", objectKey, err)
|
|
return nil, err
|
|
}
|
|
|
|
object, err := d.InformerManager.Lister(objectGVR).Get(objectKey.NamespaceKey())
|
|
if err != nil {
|
|
if apierrors.IsNotFound(err) {
|
|
// If the target object is not found in the informer cache,
|
|
// use the DynamicClient to get the target object again.
|
|
var object *unstructured.Unstructured
|
|
object, err = d.DynamicClient.Resource(objectGVR).Namespace(objectKey.Namespace).
|
|
Get(context.TODO(), objectKey.Name, metav1.GetOptions{})
|
|
if err == nil {
|
|
return object, nil
|
|
}
|
|
}
|
|
klog.Errorf("Failed to get object(%s), error: %v", objectKey, err)
|
|
return nil, err
|
|
}
|
|
|
|
unstructuredObj, err := helper.ToUnstructured(object)
|
|
if err != nil {
|
|
klog.Errorf("Failed to transform object(%s), error: %v", objectKey, err)
|
|
return nil, err
|
|
}
|
|
|
|
return unstructuredObj, nil
|
|
}
|
|
|
|
// ClaimPolicyForObject set policy identifier which the object associated with.
|
|
func (d *ResourceDetector) ClaimPolicyForObject(object *unstructured.Unstructured, policyNamespace string, policyName string) error {
|
|
claimedNS := util.GetLabelValue(object.GetLabels(), policyv1alpha1.PropagationPolicyNamespaceLabel)
|
|
claimedName := util.GetLabelValue(object.GetLabels(), policyv1alpha1.PropagationPolicyNameLabel)
|
|
|
|
// object has been claimed, don't need to claim again
|
|
if claimedNS == policyNamespace && claimedName == policyName {
|
|
return nil
|
|
}
|
|
|
|
util.MergeLabel(object, policyv1alpha1.PropagationPolicyNamespaceLabel, policyNamespace)
|
|
util.MergeLabel(object, policyv1alpha1.PropagationPolicyNameLabel, policyName)
|
|
|
|
return d.Client.Update(context.TODO(), object)
|
|
}
|
|
|
|
// ClaimClusterPolicyForObject set cluster identifier which the object associated with.
|
|
func (d *ResourceDetector) ClaimClusterPolicyForObject(object *unstructured.Unstructured, policyName string) error {
|
|
claimedName := util.GetLabelValue(object.GetLabels(), policyv1alpha1.ClusterPropagationPolicyLabel)
|
|
|
|
// object has been claimed, don't need to claim again
|
|
if claimedName == policyName {
|
|
return nil
|
|
}
|
|
|
|
util.MergeLabel(object, policyv1alpha1.ClusterPropagationPolicyLabel, policyName)
|
|
return d.Client.Update(context.TODO(), object)
|
|
}
|
|
|
|
// BuildResourceBinding builds a desired ResourceBinding for object.
|
|
func (d *ResourceDetector) BuildResourceBinding(object *unstructured.Unstructured, objectKey keys.ClusterWideKey, labels map[string]string, policySpec *policyv1alpha1.PropagationSpec) (*workv1alpha2.ResourceBinding, error) {
|
|
bindingName := names.GenerateBindingName(object.GetKind(), object.GetName())
|
|
propagationBinding := &workv1alpha2.ResourceBinding{
|
|
ObjectMeta: metav1.ObjectMeta{
|
|
Name: bindingName,
|
|
Namespace: object.GetNamespace(),
|
|
OwnerReferences: []metav1.OwnerReference{
|
|
*metav1.NewControllerRef(object, objectKey.GroupVersionKind()),
|
|
},
|
|
Labels: labels,
|
|
Finalizers: []string{util.BindingControllerFinalizer},
|
|
},
|
|
Spec: workv1alpha2.ResourceBindingSpec{
|
|
PropagateDeps: policySpec.PropagateDeps,
|
|
SchedulerName: policySpec.SchedulerName,
|
|
Placement: &policySpec.Placement,
|
|
Failover: policySpec.Failover,
|
|
Resource: workv1alpha2.ObjectReference{
|
|
APIVersion: object.GetAPIVersion(),
|
|
Kind: object.GetKind(),
|
|
Namespace: object.GetNamespace(),
|
|
Name: object.GetName(),
|
|
UID: object.GetUID(),
|
|
ResourceVersion: object.GetResourceVersion(),
|
|
},
|
|
},
|
|
}
|
|
|
|
if d.ResourceInterpreter.HookEnabled(object.GroupVersionKind(), configv1alpha1.InterpreterOperationInterpretReplica) {
|
|
replicas, replicaRequirements, err := d.ResourceInterpreter.GetReplicas(object)
|
|
if err != nil {
|
|
klog.Errorf("Failed to customize replicas for %s(%s), %v", object.GroupVersionKind(), object.GetName(), err)
|
|
return nil, err
|
|
}
|
|
propagationBinding.Spec.Replicas = replicas
|
|
propagationBinding.Spec.ReplicaRequirements = replicaRequirements
|
|
}
|
|
|
|
return propagationBinding, nil
|
|
}
|
|
|
|
// BuildClusterResourceBinding builds a desired ClusterResourceBinding for object.
|
|
func (d *ResourceDetector) BuildClusterResourceBinding(object *unstructured.Unstructured, objectKey keys.ClusterWideKey, labels map[string]string, policySpec *policyv1alpha1.PropagationSpec) (*workv1alpha2.ClusterResourceBinding, error) {
|
|
bindingName := names.GenerateBindingName(object.GetKind(), object.GetName())
|
|
binding := &workv1alpha2.ClusterResourceBinding{
|
|
ObjectMeta: metav1.ObjectMeta{
|
|
Name: bindingName,
|
|
OwnerReferences: []metav1.OwnerReference{
|
|
*metav1.NewControllerRef(object, objectKey.GroupVersionKind()),
|
|
},
|
|
Labels: labels,
|
|
Finalizers: []string{util.ClusterResourceBindingControllerFinalizer},
|
|
},
|
|
Spec: workv1alpha2.ResourceBindingSpec{
|
|
PropagateDeps: policySpec.PropagateDeps,
|
|
SchedulerName: policySpec.SchedulerName,
|
|
Placement: &policySpec.Placement,
|
|
Failover: policySpec.Failover,
|
|
Resource: workv1alpha2.ObjectReference{
|
|
APIVersion: object.GetAPIVersion(),
|
|
Kind: object.GetKind(),
|
|
Name: object.GetName(),
|
|
UID: object.GetUID(),
|
|
ResourceVersion: object.GetResourceVersion(),
|
|
},
|
|
},
|
|
}
|
|
|
|
if d.ResourceInterpreter.HookEnabled(object.GroupVersionKind(), configv1alpha1.InterpreterOperationInterpretReplica) {
|
|
replicas, replicaRequirements, err := d.ResourceInterpreter.GetReplicas(object)
|
|
if err != nil {
|
|
klog.Errorf("Failed to customize replicas for %s(%s), %v", object.GroupVersionKind(), object.GetName(), err)
|
|
return nil, err
|
|
}
|
|
binding.Spec.Replicas = replicas
|
|
binding.Spec.ReplicaRequirements = replicaRequirements
|
|
}
|
|
|
|
return binding, nil
|
|
}
|
|
|
|
// isWaiting indicates if the object is in waiting list.
|
|
func (d *ResourceDetector) isWaiting(objectKey keys.ClusterWideKey) bool {
|
|
d.waitingLock.RLock()
|
|
_, ok := d.waitingObjects[objectKey]
|
|
d.waitingLock.RUnlock()
|
|
return ok
|
|
}
|
|
|
|
// AddWaiting adds object's key to waiting list.
|
|
func (d *ResourceDetector) AddWaiting(objectKey keys.ClusterWideKey) {
|
|
d.waitingLock.Lock()
|
|
defer d.waitingLock.Unlock()
|
|
|
|
d.waitingObjects[objectKey] = struct{}{}
|
|
klog.V(1).Infof("Add object(%s) to waiting list, length of list is: %d", objectKey.String(), len(d.waitingObjects))
|
|
}
|
|
|
|
// RemoveWaiting removes object's key from waiting list.
|
|
func (d *ResourceDetector) RemoveWaiting(objectKey keys.ClusterWideKey) {
|
|
d.waitingLock.Lock()
|
|
defer d.waitingLock.Unlock()
|
|
|
|
delete(d.waitingObjects, objectKey)
|
|
}
|
|
|
|
// GetMatching gets objects keys in waiting list that matches one of resource selectors.
|
|
func (d *ResourceDetector) GetMatching(resourceSelectors []policyv1alpha1.ResourceSelector) []keys.ClusterWideKey {
|
|
d.waitingLock.RLock()
|
|
defer d.waitingLock.RUnlock()
|
|
|
|
var matchedResult []keys.ClusterWideKey
|
|
|
|
for waitKey := range d.waitingObjects {
|
|
waitObj, err := d.GetUnstructuredObject(waitKey)
|
|
if err != nil {
|
|
// all object in waiting list should exist. Just print a log to trace.
|
|
klog.Errorf("Failed to get object(%s), error: %v", waitKey.String(), err)
|
|
continue
|
|
}
|
|
|
|
for _, rs := range resourceSelectors {
|
|
if util.ResourceMatches(waitObj, rs) {
|
|
matchedResult = append(matchedResult, waitKey)
|
|
break
|
|
}
|
|
}
|
|
}
|
|
|
|
return matchedResult
|
|
}
|
|
|
|
// OnPropagationPolicyAdd handles object add event and push the object to queue.
|
|
func (d *ResourceDetector) OnPropagationPolicyAdd(obj interface{}) {
|
|
key, err := ClusterWideKeyFunc(obj)
|
|
if err != nil {
|
|
return
|
|
}
|
|
|
|
klog.V(2).Infof("Create PropagationPolicy(%s)", key)
|
|
d.policyReconcileWorker.Add(key)
|
|
}
|
|
|
|
// OnPropagationPolicyUpdate handles object update event and push the object to queue.
|
|
func (d *ResourceDetector) OnPropagationPolicyUpdate(oldObj, newObj interface{}) {
|
|
key, err := ClusterWideKeyFunc(newObj)
|
|
if err != nil {
|
|
return
|
|
}
|
|
|
|
klog.V(2).Infof("Update PropagationPolicy(%s)", key)
|
|
d.policyReconcileWorker.Add(key)
|
|
}
|
|
|
|
// OnPropagationPolicyDelete handles object delete event and push the object to queue.
|
|
func (d *ResourceDetector) OnPropagationPolicyDelete(obj interface{}) {
|
|
key, err := ClusterWideKeyFunc(obj)
|
|
if err != nil {
|
|
return
|
|
}
|
|
|
|
klog.V(2).Infof("Delete PropagationPolicy(%s)", key)
|
|
d.policyReconcileWorker.Add(key)
|
|
}
|
|
|
|
// ReconcilePropagationPolicy handles PropagationPolicy resource changes.
|
|
// When adding a PropagationPolicy, the detector will pick the objects in waitingObjects list that matches the policy and
|
|
// put the object to queue.
|
|
// When removing a PropagationPolicy, the relevant ResourceBinding will be removed and
|
|
// the relevant objects will be put into queue again to try another policy.
|
|
func (d *ResourceDetector) ReconcilePropagationPolicy(key util.QueueKey) error {
|
|
ckey, ok := key.(keys.ClusterWideKey)
|
|
if !ok { // should not happen
|
|
klog.Error("Found invalid key when reconciling propagation policy.")
|
|
return fmt.Errorf("invalid key")
|
|
}
|
|
|
|
unstructuredObj, err := d.propagationPolicyLister.Get(ckey.NamespaceKey())
|
|
if err != nil {
|
|
if apierrors.IsNotFound(err) {
|
|
klog.Infof("PropagationPolicy(%s) has been removed.", ckey.NamespaceKey())
|
|
return d.HandlePropagationPolicyDeletion(ckey.Namespace, ckey.Name)
|
|
}
|
|
klog.Errorf("Failed to get PropagationPolicy(%s): %v", ckey.NamespaceKey(), err)
|
|
return err
|
|
}
|
|
|
|
klog.Infof("PropagationPolicy(%s) has been added.", ckey.NamespaceKey())
|
|
propagationObject := &policyv1alpha1.PropagationPolicy{}
|
|
if err = helper.ConvertToTypedObject(unstructuredObj, propagationObject); err != nil {
|
|
klog.Errorf("Failed to convert PropagationPolicy(%s) from unstructured object: %v", ckey.NamespaceKey(), err)
|
|
return err
|
|
}
|
|
return d.HandlePropagationPolicyCreationOrUpdate(propagationObject)
|
|
}
|
|
|
|
// OnClusterPropagationPolicyAdd handles object add event and push the object to queue.
|
|
func (d *ResourceDetector) OnClusterPropagationPolicyAdd(obj interface{}) {
|
|
key, err := ClusterWideKeyFunc(obj)
|
|
if err != nil {
|
|
return
|
|
}
|
|
|
|
klog.V(2).Infof("Create ClusterPropagationPolicy(%s)", key)
|
|
d.clusterPolicyReconcileWorker.Add(key)
|
|
}
|
|
|
|
// OnClusterPropagationPolicyUpdate handles object update event and push the object to queue.
|
|
func (d *ResourceDetector) OnClusterPropagationPolicyUpdate(oldObj, newObj interface{}) {
|
|
key, err := ClusterWideKeyFunc(newObj)
|
|
if err != nil {
|
|
return
|
|
}
|
|
|
|
klog.V(2).Infof("Update ClusterPropagationPolicy(%s)", key)
|
|
d.clusterPolicyReconcileWorker.Add(key)
|
|
}
|
|
|
|
// OnClusterPropagationPolicyDelete handles object delete event and push the object to queue.
|
|
func (d *ResourceDetector) OnClusterPropagationPolicyDelete(obj interface{}) {
|
|
key, err := ClusterWideKeyFunc(obj)
|
|
if err != nil {
|
|
return
|
|
}
|
|
|
|
klog.V(2).Infof("Delete ClusterPropagationPolicy(%s)", key)
|
|
d.clusterPolicyReconcileWorker.Add(key)
|
|
}
|
|
|
|
// ReconcileClusterPropagationPolicy handles ClusterPropagationPolicy resource changes.
|
|
// When adding a ClusterPropagationPolicy, the detector will pick the objects in waitingObjects list that matches the policy and
|
|
// put the object to queue.
|
|
// When removing a ClusterPropagationPolicy, the relevant ClusterResourceBinding will be removed and
|
|
// the relevant objects will be put into queue again to try another policy.
|
|
func (d *ResourceDetector) ReconcileClusterPropagationPolicy(key util.QueueKey) error {
|
|
ckey, ok := key.(keys.ClusterWideKey)
|
|
if !ok { // should not happen
|
|
klog.Error("Found invalid key when reconciling cluster propagation policy.")
|
|
return fmt.Errorf("invalid key")
|
|
}
|
|
|
|
unstructuredObj, err := d.clusterPropagationPolicyLister.Get(ckey.NamespaceKey())
|
|
if err != nil {
|
|
if apierrors.IsNotFound(err) {
|
|
klog.Infof("ClusterPropagationPolicy(%s) has been removed.", ckey.NamespaceKey())
|
|
return d.HandleClusterPropagationPolicyDeletion(ckey.Name)
|
|
}
|
|
|
|
klog.Errorf("Failed to get ClusterPropagationPolicy(%s): %v", ckey.NamespaceKey(), err)
|
|
return err
|
|
}
|
|
|
|
klog.Infof("Policy(%s) has been added", ckey.NamespaceKey())
|
|
propagationObject := &policyv1alpha1.ClusterPropagationPolicy{}
|
|
if err = helper.ConvertToTypedObject(unstructuredObj, propagationObject); err != nil {
|
|
klog.Errorf("Failed to convert ClusterPropagationPolicy(%s) from unstructured object: %v", ckey.NamespaceKey(), err)
|
|
return err
|
|
}
|
|
return d.HandleClusterPropagationPolicyCreationOrUpdate(propagationObject)
|
|
}
|
|
|
|
// HandlePropagationPolicyDeletion handles PropagationPolicy delete event.
|
|
// After a policy is removed, the label marked on relevant resource template will be removed(which gives
|
|
// the resource template a change to match another policy).
|
|
//
|
|
// Note: The relevant ResourceBinding will continue to exist until the resource template is gone.
|
|
func (d *ResourceDetector) HandlePropagationPolicyDeletion(policyNS string, policyName string) error {
|
|
labelSet := labels.Set{
|
|
policyv1alpha1.PropagationPolicyNamespaceLabel: policyNS,
|
|
policyv1alpha1.PropagationPolicyNameLabel: policyName,
|
|
}
|
|
|
|
rbs, err := helper.GetResourceBindings(d.Client, labelSet)
|
|
if err != nil {
|
|
klog.Errorf("Failed to list propagation bindings: %v", err)
|
|
return err
|
|
}
|
|
|
|
for index, binding := range rbs.Items {
|
|
// Cleanup the labels from the reference binding so that the karmada scheduler won't reschedule the binding.
|
|
if err := d.CleanupResourceBindingLabels(&rbs.Items[index], policyv1alpha1.PropagationPolicyNamespaceLabel, policyv1alpha1.PropagationPolicyNameLabel); err != nil {
|
|
klog.Errorf("Failed to cleanup label from resource binding(%s/%s) when propagation policy(%s/%s) removing, error: %v",
|
|
binding.Namespace, binding.Name, policyNS, policyName, err)
|
|
return err
|
|
}
|
|
|
|
// Cleanup the labels from the object referencing by binding.
|
|
// In addition, this will give the object a chance to match another policy.
|
|
if err := d.CleanupLabels(binding.Spec.Resource, policyv1alpha1.PropagationPolicyNamespaceLabel, policyv1alpha1.PropagationPolicyNameLabel); err != nil {
|
|
klog.Errorf("Failed to cleanup label from resource(%s-%s/%s) when propagation policy(%s/%s) removing, error: %v",
|
|
binding.Spec.Resource.Kind, binding.Spec.Resource.Namespace, binding.Spec.Resource.Name, policyNS, policyName, err)
|
|
return err
|
|
}
|
|
}
|
|
return nil
|
|
}
|
|
|
|
// HandleClusterPropagationPolicyDeletion handles ClusterPropagationPolicy delete event.
|
|
// After a policy is removed, the label marked on relevant resource template will be removed(which gives
|
|
// the resource template a change to match another policy).
|
|
//
|
|
// Note: The relevant ClusterResourceBinding or ResourceBinding will continue to exist until the resource template is gone.
|
|
func (d *ResourceDetector) HandleClusterPropagationPolicyDeletion(policyName string) error {
|
|
var errs []error
|
|
labelSet := labels.Set{
|
|
policyv1alpha1.ClusterPropagationPolicyLabel: policyName,
|
|
}
|
|
|
|
// load the ClusterResourceBindings which labeled with current policy
|
|
crbs, err := helper.GetClusterResourceBindings(d.Client, labelSet)
|
|
if err != nil {
|
|
klog.Errorf("Failed to load cluster resource binding by policy(%s), error: %v", policyName, err)
|
|
errs = append(errs, err)
|
|
} else if len(crbs.Items) > 0 {
|
|
for index, binding := range crbs.Items {
|
|
// Cleanup the labels from the reference binding so that the karmada scheduler won't reschedule the binding.
|
|
if err := d.CleanupClusterResourceBindingLabels(&crbs.Items[index], policyv1alpha1.ClusterPropagationPolicyLabel); err != nil {
|
|
klog.Errorf("Failed to cleanup label from cluster resource binding(%s) when cluster propagation policy(%s) removing, error: %v",
|
|
binding.Name, policyName, err)
|
|
errs = append(errs, err)
|
|
}
|
|
|
|
// Cleanup the labels from the object referencing by binding.
|
|
// In addition, this will give the object a chance to match another policy.
|
|
if err := d.CleanupLabels(binding.Spec.Resource, policyv1alpha1.ClusterPropagationPolicyLabel); err != nil {
|
|
klog.Errorf("Failed to cleanup label from resource(%s-%s/%s) when cluster resource binding(%s) removing, error: %v",
|
|
binding.Spec.Resource.Kind, binding.Spec.Resource.Namespace, binding.Spec.Resource.Name, binding.Name, err)
|
|
errs = append(errs, err)
|
|
}
|
|
}
|
|
}
|
|
|
|
// load the ResourceBindings which labeled with current policy
|
|
rbs, err := helper.GetResourceBindings(d.Client, labelSet)
|
|
if err != nil {
|
|
klog.Errorf("Failed to load resource binding by policy(%s), error: %v", policyName, err)
|
|
errs = append(errs, err)
|
|
} else if len(rbs.Items) > 0 {
|
|
for index, binding := range rbs.Items {
|
|
// Cleanup the labels from the reference binding so that the karmada scheduler won't reschedule the binding.
|
|
if err := d.CleanupResourceBindingLabels(&rbs.Items[index], policyv1alpha1.ClusterPropagationPolicyLabel); err != nil {
|
|
klog.Errorf("Failed to cleanup label from resource binding(%s/%s) when cluster propagation policy(%s) removing, error: %v",
|
|
binding.Namespace, binding.Name, policyName, err)
|
|
errs = append(errs, err)
|
|
}
|
|
|
|
// Cleanup the labels from the object referencing by binding.
|
|
// In addition, this will give the object a chance to match another policy.
|
|
if err := d.CleanupLabels(binding.Spec.Resource, policyv1alpha1.ClusterPropagationPolicyLabel); err != nil {
|
|
klog.Errorf("Failed to cleanup label from resource binding(%s/%s), error: %v", binding.Namespace, binding.Name, err)
|
|
errs = append(errs, err)
|
|
}
|
|
}
|
|
}
|
|
return errors.NewAggregate(errs)
|
|
}
|
|
|
|
// HandlePropagationPolicyCreationOrUpdate handles PropagationPolicy add and update event.
|
|
// When a new policy arrives, should first check whether existing objects are no longer
|
|
// matched by the current policy, if yes, clean the labels on the object.
|
|
// And then check if object in waiting list matches the policy, if yes remove the object
|
|
// from waiting list and throw the object to it's reconcile queue. If not, do nothing.
|
|
func (d *ResourceDetector) HandlePropagationPolicyCreationOrUpdate(policy *policyv1alpha1.PropagationPolicy) error {
|
|
err := d.cleanPPUnmatchedResourceBindings(policy.Namespace, policy.Name, policy.Spec.ResourceSelectors)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
|
|
// When updating fields other than ResourceSelector, should first find the corresponding ResourceBinding
|
|
// and add the bound object to the processor's queue for reconciliation to make sure that
|
|
// PropagationPolicy's updates can be synchronized to ResourceBinding.
|
|
resourceBindings, err := d.listPPDerivedRB(policy.Namespace, policy.Name)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
for _, rb := range resourceBindings.Items {
|
|
resourceKey, err := helper.ConstructClusterWideKey(rb.Spec.Resource)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
d.Processor.Add(resourceKey)
|
|
}
|
|
|
|
matchedKeys := d.GetMatching(policy.Spec.ResourceSelectors)
|
|
klog.Infof("Matched %d resources by policy(%s/%s)", len(matchedKeys), policy.Namespace, policy.Name)
|
|
|
|
// check dependents only when there at least a real match.
|
|
if len(matchedKeys) > 0 {
|
|
// return err when dependents not present, that we can retry at next reconcile.
|
|
if present, err := helper.IsDependentOverridesPresent(d.Client, policy); err != nil || !present {
|
|
klog.Infof("Waiting for dependent overrides present for policy(%s/%s)", policy.Namespace, policy.Name)
|
|
return fmt.Errorf("waiting for dependent overrides")
|
|
}
|
|
}
|
|
|
|
for _, key := range matchedKeys {
|
|
d.RemoveWaiting(key)
|
|
d.Processor.Add(key)
|
|
}
|
|
|
|
return nil
|
|
}
|
|
|
|
// HandleClusterPropagationPolicyCreationOrUpdate handles ClusterPropagationPolicy add and update event.
|
|
// When a new policy arrives, should first check whether existing objects are no longer
|
|
// matched by the current policy, if yes, clean the labels on the object.
|
|
// And then check if object in waiting list matches the policy, if yes remove the object
|
|
// from waiting list and throw the object to it's reconcile queue. If not, do nothing.
|
|
func (d *ResourceDetector) HandleClusterPropagationPolicyCreationOrUpdate(policy *policyv1alpha1.ClusterPropagationPolicy) error {
|
|
err := d.cleanCPPUnmatchedResourceBindings(policy.Name, policy.Spec.ResourceSelectors)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
|
|
err = d.cleanUnmatchedClusterResourceBinding(policy.Name, policy.Spec.ResourceSelectors)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
|
|
// When updating fields other than ResourceSelector, should first find the corresponding ResourceBinding/ClusterResourceBinding
|
|
// and add the bound object to the processor's queue for reconciliation to make sure that
|
|
// ClusterPropagationPolicy's updates can be synchronized to ResourceBinding/ClusterResourceBinding.
|
|
resourceBindings, err := d.listCPPDerivedRB(policy.Name)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
clusterResourceBindings, err := d.listCPPDerivedCRB(policy.Name)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
for _, rb := range resourceBindings.Items {
|
|
resourceKey, err := helper.ConstructClusterWideKey(rb.Spec.Resource)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
d.Processor.Add(resourceKey)
|
|
}
|
|
for _, crb := range clusterResourceBindings.Items {
|
|
resourceKey, err := helper.ConstructClusterWideKey(crb.Spec.Resource)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
d.Processor.Add(resourceKey)
|
|
}
|
|
|
|
matchedKeys := d.GetMatching(policy.Spec.ResourceSelectors)
|
|
klog.Infof("Matched %d resources by policy(%s)", len(matchedKeys), policy.Name)
|
|
|
|
// check dependents only when there at least a real match.
|
|
if len(matchedKeys) > 0 {
|
|
// return err when dependents not present, that we can retry at next reconcile.
|
|
if present, err := helper.IsDependentClusterOverridesPresent(d.Client, policy); err != nil || !present {
|
|
klog.Infof("Waiting for dependent overrides present for policy(%s)", policy.Name)
|
|
return fmt.Errorf("waiting for dependent overrides")
|
|
}
|
|
}
|
|
|
|
for _, key := range matchedKeys {
|
|
d.RemoveWaiting(key)
|
|
d.Processor.Add(key)
|
|
}
|
|
|
|
return nil
|
|
}
|
|
|
|
// CleanupLabels removes labels from object referencing by objRef.
|
|
func (d *ResourceDetector) CleanupLabels(objRef workv1alpha2.ObjectReference, labels ...string) error {
|
|
workload, err := helper.FetchResourceTemplate(d.DynamicClient, d.InformerManager, d.RESTMapper, objRef)
|
|
if err != nil {
|
|
// do nothing if resource template not exist, it might has been removed.
|
|
if apierrors.IsNotFound(err) {
|
|
return nil
|
|
}
|
|
klog.Errorf("Failed to fetch resource(kind=%s, %s/%s): %v", objRef.Kind, objRef.Namespace, objRef.Name, err)
|
|
return err
|
|
}
|
|
|
|
workloadLabels := workload.GetLabels()
|
|
for _, l := range labels {
|
|
delete(workloadLabels, l)
|
|
}
|
|
workload.SetLabels(workloadLabels)
|
|
|
|
gvr, err := restmapper.GetGroupVersionResource(d.RESTMapper, workload.GroupVersionKind())
|
|
if err != nil {
|
|
klog.Errorf("Failed to delete resource(%s/%s) labels as mapping GVK to GVR failed: %v", workload.GetNamespace(), workload.GetName(), err)
|
|
return err
|
|
}
|
|
|
|
newWorkload, err := d.DynamicClient.Resource(gvr).Namespace(workload.GetNamespace()).Update(context.TODO(), workload, metav1.UpdateOptions{})
|
|
if err != nil {
|
|
klog.Errorf("Failed to update resource %v/%v, err is %v ", workload.GetNamespace(), workload.GetName(), err)
|
|
return err
|
|
}
|
|
klog.V(2).Infof("Updated resource template(kind=%s, %s/%s) successfully", newWorkload.GetKind(), newWorkload.GetNamespace(), newWorkload.GetName())
|
|
return nil
|
|
}
|
|
|
|
// CleanupResourceBindingLabels removes labels from resource binding.
|
|
func (d *ResourceDetector) CleanupResourceBindingLabels(rb *workv1alpha2.ResourceBinding, labels ...string) error {
|
|
bindingLabels := rb.GetLabels()
|
|
for _, l := range labels {
|
|
delete(bindingLabels, l)
|
|
}
|
|
|
|
return retry.RetryOnConflict(retry.DefaultRetry, func() (err error) {
|
|
rb.SetLabels(bindingLabels)
|
|
updateErr := d.Client.Update(context.TODO(), rb)
|
|
if updateErr == nil {
|
|
return nil
|
|
}
|
|
|
|
updated := &workv1alpha2.ResourceBinding{}
|
|
if err = d.Client.Get(context.TODO(), client.ObjectKey{Namespace: rb.GetNamespace(), Name: rb.GetName()}, updated); err == nil {
|
|
//make a copy, so we don't mutate the shared cache
|
|
rb = updated.DeepCopy()
|
|
} else {
|
|
klog.Errorf("Failed to get updated resource binding %s/%s: %v", rb.GetNamespace(), rb.GetName(), err)
|
|
}
|
|
return updateErr
|
|
})
|
|
}
|
|
|
|
// CleanupClusterResourceBindingLabels removes labels from cluster resource binding.
|
|
func (d *ResourceDetector) CleanupClusterResourceBindingLabels(crb *workv1alpha2.ClusterResourceBinding, labels ...string) error {
|
|
bindingLabels := crb.GetLabels()
|
|
for _, l := range labels {
|
|
delete(bindingLabels, l)
|
|
}
|
|
|
|
return retry.RetryOnConflict(retry.DefaultRetry, func() (err error) {
|
|
crb.SetLabels(bindingLabels)
|
|
updateErr := d.Client.Update(context.TODO(), crb)
|
|
if updateErr == nil {
|
|
return nil
|
|
}
|
|
|
|
updated := &workv1alpha2.ClusterResourceBinding{}
|
|
if err = d.Client.Get(context.TODO(), client.ObjectKey{Name: crb.GetName()}, updated); err == nil {
|
|
//make a copy, so we don't mutate the shared cache
|
|
crb = updated.DeepCopy()
|
|
} else {
|
|
klog.Errorf("Failed to get updated cluster resource binding %s: %v", crb.GetName(), err)
|
|
}
|
|
return updateErr
|
|
})
|
|
}
|