/*
Copyright 2019 The Kubernetes Authors.

Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

    http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
*/

package flowcontrol

import (
	"context"
	"crypto/sha256"
	"encoding/binary"
	"encoding/json"
	"errors"
	"fmt"
	"math"
	"math/rand"
	"sort"
	"sync"
	"time"

	"github.com/google/go-cmp/cmp"
	apiequality "k8s.io/apimachinery/pkg/api/equality"
	apierrors "k8s.io/apimachinery/pkg/api/errors"
	metav1 "k8s.io/apimachinery/pkg/apis/meta/v1"
	"k8s.io/apimachinery/pkg/labels"
	apitypes "k8s.io/apimachinery/pkg/types"
	utilerrors "k8s.io/apimachinery/pkg/util/errors"
	utilruntime "k8s.io/apimachinery/pkg/util/runtime"
	"k8s.io/apimachinery/pkg/util/sets"
	"k8s.io/apimachinery/pkg/util/wait"
	fcboot "k8s.io/apiserver/pkg/apis/flowcontrol/bootstrap"
	"k8s.io/apiserver/pkg/authentication/user"
	"k8s.io/apiserver/pkg/endpoints/request"
	"k8s.io/apiserver/pkg/util/apihelpers"
	fq "k8s.io/apiserver/pkg/util/flowcontrol/fairqueuing"
	fcfmt "k8s.io/apiserver/pkg/util/flowcontrol/format"
	"k8s.io/apiserver/pkg/util/flowcontrol/metrics"
	fcrequest "k8s.io/apiserver/pkg/util/flowcontrol/request"
	"k8s.io/client-go/tools/cache"
	"k8s.io/client-go/util/workqueue"
	"k8s.io/klog/v2"
	"k8s.io/utils/clock"

	flowcontrol "k8s.io/api/flowcontrol/v1beta2"
	flowcontrolclient "k8s.io/client-go/kubernetes/typed/flowcontrol/v1beta2"
	flowcontrollister "k8s.io/client-go/listers/flowcontrol/v1beta2"
)

const timeFmt = "2006-01-02T15:04:05.999"

// This file contains a simple local (to the apiserver) controller
// that digests API Priority and Fairness config objects (FlowSchema
// and PriorityLevelConfiguration) into the data structure that the
// filter uses.  At this first level of development this controller
// takes the simplest possible approach: whenever notified of any
// change to any config object, or when any priority level that is
// undesired becomes completely unused, all the config objects are
// read and processed as a whole.

// The funcs in this package follow the naming convention that the suffix
// "Locked" means the relevant mutex must be locked at the start of each
// call and will be locked upon return.  For a configController, the
// suffix "ReadLocked" stipulates a read lock while just "Locked"
// stipulates a full lock.  Absence of either suffix means that either
// (a) the lock must NOT be held at call time and will not be held
// upon return or (b) locking is irrelevant.

// StartFunction begins the process of handling a request.  If the
// request gets queued then this function uses the given hashValue as
// the source of entropy as it shuffle-shards the request into a
// queue.  The descr1 and descr2 values play no role in the logic but
// appear in log messages.  This method does not return until the
// queuing, if any, for this request is done.  If `execute` is false
// then `afterExecution` is irrelevant and the request should be
// rejected.  Otherwise the request should be executed and
// `afterExecution` must be called exactly once.
type StartFunction func(ctx context.Context, hashValue uint64) (execute bool, afterExecution func())
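
// Illustrative only (not part of this package's API surface): a caller that
// obtains a StartFunction would use it roughly like this, where `start`,
// `ctx`, and `hashValue` are hypothetical local values:
//
//	execute, afterExecution := start(ctx, hashValue)
//	if !execute {
//		return // reject the request
//	}
//	defer afterExecution() // report completion exactly once
//	// ... serve the request ...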

// RequestDigest holds necessary info from request for flow-control
type RequestDigest struct {
	RequestInfo  *request.RequestInfo
	User         user.Info
	WorkEstimate fcrequest.WorkEstimate
}

// `*configController` maintains eventual consistency with the API
// objects that configure API Priority and Fairness, and provides a
// procedural interface to the configured behavior.  The methods of
// this type and cfgMeal follow the convention that the suffix
// "Locked" means that the caller must hold the configController lock.
type configController struct {
	name                  string // varies in tests of fighting controllers
	clock                 clock.PassiveClock
	queueSetFactory       fq.QueueSetFactory
	reqsObsPairGenerator  metrics.TimedObserverPairGenerator
	execSeatsObsGenerator metrics.TimedObserverGenerator

	// How this controller appears in an ObjectMeta ManagedFieldsEntry.Manager
	asFieldManager string

	// Given a boolean indicating whether a FlowSchema's referenced
	// PriorityLevelConfig exists, return a boolean indicating whether
	// the reference is dangling
	foundToDangling func(bool) bool

	// configQueue holds `(interface{})(0)` when the configuration
	// objects need to be reprocessed.
	configQueue workqueue.RateLimitingInterface

	plLister         flowcontrollister.PriorityLevelConfigurationLister
	plInformerSynced cache.InformerSynced

	fsLister         flowcontrollister.FlowSchemaLister
	fsInformerSynced cache.InformerSynced

	flowcontrolClient flowcontrolclient.FlowcontrolV1beta2Interface

	// serverConcurrencyLimit is the limit on the server's total
	// number of non-exempt requests being served at once.  This comes
	// from server configuration.
	serverConcurrencyLimit int

	// requestWaitLimit comes from server configuration.
	requestWaitLimit time.Duration

	// watchTracker implements the necessary WatchTracker interface.
	WatchTracker

	// the most recent update attempts, ordered by increasing age.
	// Consumer trims to keep only the last minute's worth of entries.
	// The controller uses this to limit itself to at most six updates
	// to a given FlowSchema in any minute.
	// This may only be accessed from the one and only worker goroutine.
	mostRecentUpdates []updateAttempt

	// This must be locked while accessing flowSchemas or
	// priorityLevelStates.  A write lock is needed for writing
	// to any of the following:
	// - the flowSchemas field
	// - the slice held in the flowSchemas field
	// - the priorityLevelStates field
	// - the map held in the priorityLevelStates field
	// - any field of a priorityLevelState held in that map
	lock sync.RWMutex

	// flowSchemas holds the flow schema objects, sorted by increasing
	// numerical (decreasing logical) matching precedence.  Every
	// FlowSchema in this slice is immutable.
	flowSchemas apihelpers.FlowSchemaSequence

	// priorityLevelStates maps the PriorityLevelConfiguration object
	// name to the state for that level.  Every name referenced from a
	// member of `flowSchemas` has an entry here.
	priorityLevelStates map[string]*priorityLevelState
}

type updateAttempt struct {
	timeUpdated  time.Time
	updatedItems sets.String // FlowSchema names
}

// priorityLevelState holds the state specific to a priority level.
type priorityLevelState struct {
	// the API object or prototype prescribing this level.  Nothing
	// reached through this pointer is mutable.
	pl *flowcontrol.PriorityLevelConfiguration

	// qsCompleter holds the QueueSetCompleter derived from `pl` and
	// `queues` if the priority level is not exempt, nil otherwise.
	qsCompleter fq.QueueSetCompleter

	// The QueueSet for this priority level.  This is nil if and only
	// if the priority level is exempt.
	queues fq.QueueSet

	// quiescing==true indicates that this priority level should be
	// removed when its queues have all drained.  May be true only if
	// queues is non-nil.
	quiescing bool

	// number of goroutines between Controller::Match and calling the
	// returned StartFunction
	numPending int

	// Observers tracking number of requests waiting, executing
	reqsObsPair metrics.TimedObserverPair

	// Observer of number of seats occupied throughout execution
	execSeatsObs metrics.TimedObserver
}

// newTestableController is extra flexible to facilitate testing
func newTestableController(config TestableConfig) *configController {
	cfgCtlr := &configController{
		name:                   config.Name,
		clock:                  config.Clock,
		queueSetFactory:        config.QueueSetFactory,
		reqsObsPairGenerator:   config.ReqsObsPairGenerator,
		execSeatsObsGenerator:  config.ExecSeatsObsGenerator,
		asFieldManager:         config.AsFieldManager,
		foundToDangling:        config.FoundToDangling,
		serverConcurrencyLimit: config.ServerConcurrencyLimit,
		requestWaitLimit:       config.RequestWaitLimit,
		flowcontrolClient:      config.FlowcontrolClient,
		priorityLevelStates:    make(map[string]*priorityLevelState),
		WatchTracker:           NewWatchTracker(),
	}
	klog.V(2).Infof("NewTestableController %q with serverConcurrencyLimit=%d, requestWaitLimit=%s, name=%s, asFieldManager=%q", cfgCtlr.name, cfgCtlr.serverConcurrencyLimit, cfgCtlr.requestWaitLimit, cfgCtlr.name, cfgCtlr.asFieldManager)
	// Start with a longish delay because conflicts will be between
	// different processes, which take some time to go away.
	cfgCtlr.configQueue = workqueue.NewNamedRateLimitingQueue(workqueue.NewItemExponentialFailureRateLimiter(200*time.Millisecond, 8*time.Hour), "priority_and_fairness_config_queue")
	// ensure the data structure reflects the mandatory config
	cfgCtlr.lockAndDigestConfigObjects(nil, nil)
	fci := config.InformerFactory.Flowcontrol().V1beta2()
	pli := fci.PriorityLevelConfigurations()
	fsi := fci.FlowSchemas()
	cfgCtlr.plLister = pli.Lister()
	cfgCtlr.plInformerSynced = pli.Informer().HasSynced
	cfgCtlr.fsLister = fsi.Lister()
	cfgCtlr.fsInformerSynced = fsi.Informer().HasSynced
	pli.Informer().AddEventHandler(cache.ResourceEventHandlerFuncs{
		AddFunc: func(obj interface{}) {
			pl := obj.(*flowcontrol.PriorityLevelConfiguration)
			klog.V(7).Infof("Triggered API priority and fairness config reloading in %s due to creation of PLC %s", cfgCtlr.name, pl.Name)
			cfgCtlr.configQueue.Add(0)
		},
		UpdateFunc: func(oldObj, newObj interface{}) {
			newPL := newObj.(*flowcontrol.PriorityLevelConfiguration)
			oldPL := oldObj.(*flowcontrol.PriorityLevelConfiguration)
			if !apiequality.Semantic.DeepEqual(oldPL.Spec, newPL.Spec) {
				klog.V(7).Infof("Triggered API priority and fairness config reloading in %s due to spec update of PLC %s", cfgCtlr.name, newPL.Name)
				cfgCtlr.configQueue.Add(0)
			} else {
				klog.V(7).Infof("No trigger of API priority and fairness config reloading in %s due to spec non-change of PLC %s", cfgCtlr.name, newPL.Name)
			}
		},
		DeleteFunc: func(obj interface{}) {
			name, _ := cache.DeletionHandlingMetaNamespaceKeyFunc(obj)
			klog.V(7).Infof("Triggered API priority and fairness config reloading in %s due to deletion of PLC %s", cfgCtlr.name, name)
			cfgCtlr.configQueue.Add(0)
		}})
	fsi.Informer().AddEventHandler(cache.ResourceEventHandlerFuncs{
		AddFunc: func(obj interface{}) {
			fs := obj.(*flowcontrol.FlowSchema)
			klog.V(7).Infof("Triggered API priority and fairness config reloading in %s due to creation of FS %s", cfgCtlr.name, fs.Name)
			cfgCtlr.configQueue.Add(0)
		},
		UpdateFunc: func(oldObj, newObj interface{}) {
			newFS := newObj.(*flowcontrol.FlowSchema)
			oldFS := oldObj.(*flowcontrol.FlowSchema)
			// Changes to either Spec or Status are relevant.  The
			// concern is that we might, in some future release, want
			// different behavior than is implemented now. One of the
			// hardest questions is how does an operator roll out the
			// new release in a cluster with multiple kube-apiservers
			// --- in a way that works no matter what servers crash
			// and restart when. If this handler reacts only to
			// changes in Spec then we have a scenario in which the
			// rollout leaves the old Status in place. The scenario
			// ends with this subsequence: deploy the last new server
			// before deleting the last old server, and in between
			// those two operations the last old server crashes and
			// recovers. The chosen solution is making this controller
			// insist on maintaining the particular state that it
			// establishes.
			if !(apiequality.Semantic.DeepEqual(oldFS.Spec, newFS.Spec) &&
				apiequality.Semantic.DeepEqual(oldFS.Status, newFS.Status)) {
				klog.V(7).Infof("Triggered API priority and fairness config reloading in %s due to spec and/or status update of FS %s", cfgCtlr.name, newFS.Name)
				cfgCtlr.configQueue.Add(0)
			} else {
				klog.V(7).Infof("No trigger of API priority and fairness config reloading in %s due to spec and status non-change of FS %s", cfgCtlr.name, newFS.Name)
			}
		},
		DeleteFunc: func(obj interface{}) {
			name, _ := cache.DeletionHandlingMetaNamespaceKeyFunc(obj)
			klog.V(7).Infof("Triggered API priority and fairness config reloading in %s due to deletion of FS %s", cfgCtlr.name, name)
			cfgCtlr.configQueue.Add(0)
		}})
	return cfgCtlr
}
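
// For illustration only: a test might wire this controller along these lines.
// The field set is inferred from the references in newTestableController above
// (TestableConfig is defined elsewhere in this package); the values shown are
// hypothetical.
//
//	ctlr := newTestableController(TestableConfig{
//		Name:                   "Controller",
//		Clock:                  clock.RealClock{},
//		AsFieldManager:         "test-config-consumer",
//		FoundToDangling:        func(found bool) bool { return !found },
//		ServerConcurrencyLimit: 600,
//		RequestWaitLimit:       15 * time.Second,
//		// QueueSetFactory, ReqsObsPairGenerator, ExecSeatsObsGenerator,
//		// FlowcontrolClient, and InformerFactory must also be supplied.
//	})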

// MaintainObservations keeps the observers from
// metrics.PriorityLevelConcurrencyObserverPairGenerator from falling
// too far behind
func (cfgCtlr *configController) MaintainObservations(stopCh <-chan struct{}) {
	wait.Until(cfgCtlr.updateObservations, 10*time.Second, stopCh)
}

func (cfgCtlr *configController) updateObservations() {
	cfgCtlr.lock.RLock()
	defer cfgCtlr.lock.RUnlock()
	for _, plc := range cfgCtlr.priorityLevelStates {
		if plc.queues != nil {
			plc.queues.UpdateObservations()
		}
	}
}

func (cfgCtlr *configController) Run(stopCh <-chan struct{}) error {
	defer utilruntime.HandleCrash()

	// Let the config worker stop when we are done
	defer cfgCtlr.configQueue.ShutDown()

	klog.Info("Starting API Priority and Fairness config controller")
	if ok := cache.WaitForCacheSync(stopCh, cfgCtlr.plInformerSynced, cfgCtlr.fsInformerSynced); !ok {
		return fmt.Errorf("never achieved initial sync")
	}

	klog.Info("Running API Priority and Fairness config worker")
	go wait.Until(cfgCtlr.runWorker, time.Second, stopCh)

	<-stopCh
	klog.Info("Shutting down API Priority and Fairness config worker")
	return nil
}

// runWorker is the logic of the one and only worker goroutine.  We
// limit the number to one in order to obviate explicit
// synchronization around access to `cfgCtlr.mostRecentUpdates`.
func (cfgCtlr *configController) runWorker() {
	for cfgCtlr.processNextWorkItem() {
	}
}

// processNextWorkItem works on one entry from the work queue.
// Only invoke this in the one and only worker goroutine.
func (cfgCtlr *configController) processNextWorkItem() bool {
	obj, shutdown := cfgCtlr.configQueue.Get()
	if shutdown {
		return false
	}

	func(obj interface{}) {
		defer cfgCtlr.configQueue.Done(obj)
		specificDelay, err := cfgCtlr.syncOne()
		switch {
		case err != nil:
			klog.Error(err)
			cfgCtlr.configQueue.AddRateLimited(obj)
		case specificDelay > 0:
			cfgCtlr.configQueue.AddAfter(obj, specificDelay)
		default:
			cfgCtlr.configQueue.Forget(obj)
		}
	}(obj)

	return true
}

// syncOne does one full synchronization.  It reads all the API
// objects that configure API Priority and Fairness and updates the
// local configController accordingly.
// Only invoke this in the one and only worker goroutine
func (cfgCtlr *configController) syncOne() (specificDelay time.Duration, err error) {
	klog.V(5).Infof("%s syncOne at %s", cfgCtlr.name, cfgCtlr.clock.Now().Format(timeFmt))
	all := labels.Everything()
	newPLs, err := cfgCtlr.plLister.List(all)
	if err != nil {
		return 0, fmt.Errorf("unable to list PriorityLevelConfiguration objects: %w", err)
	}
	newFSs, err := cfgCtlr.fsLister.List(all)
	if err != nil {
		return 0, fmt.Errorf("unable to list FlowSchema objects: %w", err)
	}
	return cfgCtlr.digestConfigObjects(newPLs, newFSs)
}

// cfgMeal is the data involved in the process of digesting the API
// objects that configure API Priority and Fairness.  All the config
// objects are digested together, because this is the simplest way to
// cope with the various dependencies between objects.  The process of
// digestion is done in four passes over config objects --- three
// passes over PriorityLevelConfigurations and one pass over the
// FlowSchemas --- with the work divided among the passes according to
// those dependencies.
type cfgMeal struct {
	cfgCtlr *configController

	newPLStates map[string]*priorityLevelState

	// The sum of the concurrency shares of the priority levels in the
	// new configuration
	shareSum float64

	// These keep track of which mandatory priority level config
	// objects have been digested
	haveExemptPL, haveCatchAllPL bool

	// Buffered FlowSchema status updates to do.  Do them when the
	// lock is not held, to avoid a deadlock due to such a request
	// provoking a call into this controller while the lock is held
	// waiting on that request to complete.
	fsStatusUpdates []fsStatusUpdate
}

// A buffered set of status updates for FlowSchemas
type fsStatusUpdate struct {
	flowSchema *flowcontrol.FlowSchema
	condition  flowcontrol.FlowSchemaCondition
	oldValue   flowcontrol.FlowSchemaCondition
}

// digestConfigObjects is given all the API objects that configure
// cfgCtlr and writes its consequent new configState.
// Only invoke this in the one and only worker goroutine
func (cfgCtlr *configController) digestConfigObjects(newPLs []*flowcontrol.PriorityLevelConfiguration, newFSs []*flowcontrol.FlowSchema) (time.Duration, error) {
	fsStatusUpdates := cfgCtlr.lockAndDigestConfigObjects(newPLs, newFSs)
	var errs []error
	currResult := updateAttempt{
		timeUpdated:  cfgCtlr.clock.Now(),
		updatedItems: sets.String{},
	}
	var suggestedDelay time.Duration
	for _, fsu := range fsStatusUpdates {
		// if we should skip this name, indicate we will need a delay, but continue with other entries
		if cfgCtlr.shouldDelayUpdate(fsu.flowSchema.Name) {
			if suggestedDelay == 0 {
				suggestedDelay = time.Duration(30+rand.Intn(45)) * time.Second
			}
			continue
		}

		// if we are going to issue an update, be sure we track every name we update so we know if we update it too often.
		currResult.updatedItems.Insert(fsu.flowSchema.Name)
		patchBytes, err := makeFlowSchemaConditionPatch(fsu.condition)
		if err != nil {
			// should never happen because these conditions are created here and well formed
			panic(fmt.Sprintf("Failed to json.Marshal(%#+v): %s", fsu.condition, err.Error()))
		}
		if klog.V(4).Enabled() {
			klog.V(4).Infof("%s writing Condition %s to FlowSchema %s, which had ResourceVersion=%s, because its previous value was %s, diff: %s",
				cfgCtlr.name, fsu.condition, fsu.flowSchema.Name, fsu.flowSchema.ResourceVersion, fcfmt.Fmt(fsu.oldValue), cmp.Diff(fsu.oldValue, fsu.condition))
		}
		fsIfc := cfgCtlr.flowcontrolClient.FlowSchemas()
		patchOptions := metav1.PatchOptions{FieldManager: cfgCtlr.asFieldManager}
		_, err = fsIfc.Patch(context.TODO(), fsu.flowSchema.Name, apitypes.StrategicMergePatchType, patchBytes, patchOptions, "status")
		if err != nil {
			if apierrors.IsNotFound(err) {
				// This object has been deleted.  A notification is coming
				// and nothing more needs to be done here.
				klog.V(5).Infof("%s at %s: attempted update of concurrently deleted FlowSchema %s; nothing more needs to be done", cfgCtlr.name, cfgCtlr.clock.Now().Format(timeFmt), fsu.flowSchema.Name)
			} else {
				errs = append(errs, fmt.Errorf("failed to set a status.condition for FlowSchema %s: %w", fsu.flowSchema.Name, err))
			}
		}
	}
	cfgCtlr.addUpdateResult(currResult)

	return suggestedDelay, utilerrors.NewAggregate(errs)
}

// makeFlowSchemaConditionPatch takes in a condition and returns the status patch as JSON.
func makeFlowSchemaConditionPatch(condition flowcontrol.FlowSchemaCondition) ([]byte, error) {
	o := struct {
		Status flowcontrol.FlowSchemaStatus `json:"status"`
	}{
		Status: flowcontrol.FlowSchemaStatus{
			Conditions: []flowcontrol.FlowSchemaCondition{
				condition,
			},
		},
	}
	return json.Marshal(o)
}
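
// For reference, the patch produced above has this shape (field values are
// illustrative):
//
//	{"status":{"conditions":[{"type":"Dangling","status":"False","reason":"Found", ...}]}}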

// shouldDelayUpdate checks to see if a flowschema has been updated too often and returns true if a delay is needed.
// Only invoke this in the one and only worker goroutine
func (cfgCtlr *configController) shouldDelayUpdate(flowSchemaName string) bool {
	numUpdatesInPastMinute := 0
	oneMinuteAgo := cfgCtlr.clock.Now().Add(-1 * time.Minute)
	for idx, update := range cfgCtlr.mostRecentUpdates {
		if oneMinuteAgo.After(update.timeUpdated) {
			// this and the remaining items are no longer relevant
			cfgCtlr.mostRecentUpdates = cfgCtlr.mostRecentUpdates[:idx]
			return false
		}
		if update.updatedItems.Has(flowSchemaName) {
			numUpdatesInPastMinute++
			if numUpdatesInPastMinute > 5 {
				return true
			}
		}
	}
	return false
}
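
// Informal sketch of the logic above: mostRecentUpdates is ordered newest
// first, so the loop counts how many updates issued within the past minute
// touched this FlowSchema; a sixth attempt within that minute is delayed.
// Entries older than a minute are trimmed off the tail as soon as the first
// one is encountered.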

// addUpdateResult adds the result. It isn't a ring buffer because
// this is small and rate limited.
// Only invoke this in the one and only worker goroutine
func (cfgCtlr *configController) addUpdateResult(result updateAttempt) {
	cfgCtlr.mostRecentUpdates = append([]updateAttempt{result}, cfgCtlr.mostRecentUpdates...)
}

func (cfgCtlr *configController) lockAndDigestConfigObjects(newPLs []*flowcontrol.PriorityLevelConfiguration, newFSs []*flowcontrol.FlowSchema) []fsStatusUpdate {
	cfgCtlr.lock.Lock()
	defer cfgCtlr.lock.Unlock()
	meal := cfgMeal{
		cfgCtlr:     cfgCtlr,
		newPLStates: make(map[string]*priorityLevelState),
	}

	meal.digestNewPLsLocked(newPLs)
	meal.digestFlowSchemasLocked(newFSs)
	meal.processOldPLsLocked()

	// Supply missing mandatory PriorityLevelConfiguration objects
	if !meal.haveExemptPL {
		meal.imaginePL(fcboot.MandatoryPriorityLevelConfigurationExempt, cfgCtlr.requestWaitLimit)
	}
	if !meal.haveCatchAllPL {
		meal.imaginePL(fcboot.MandatoryPriorityLevelConfigurationCatchAll, cfgCtlr.requestWaitLimit)
	}

	meal.finishQueueSetReconfigsLocked()

	// The new config has been constructed
	cfgCtlr.priorityLevelStates = meal.newPLStates
	klog.V(5).Infof("Switched to new API Priority and Fairness configuration")
	return meal.fsStatusUpdates
}

// Digest the new set of PriorityLevelConfiguration objects.
// Pretend broken ones do not exist.
func (meal *cfgMeal) digestNewPLsLocked(newPLs []*flowcontrol.PriorityLevelConfiguration) {
	for _, pl := range newPLs {
		state := meal.cfgCtlr.priorityLevelStates[pl.Name]
		if state == nil {
			labelValues := []string{pl.Name}
			state = &priorityLevelState{reqsObsPair: meal.cfgCtlr.reqsObsPairGenerator.Generate(1, 1, labelValues), execSeatsObs: meal.cfgCtlr.execSeatsObsGenerator.Generate(1, 1, labelValues)}
		}
		qsCompleter, err := queueSetCompleterForPL(meal.cfgCtlr.queueSetFactory, state.queues, pl, meal.cfgCtlr.requestWaitLimit, state.reqsObsPair, state.execSeatsObs)
		if err != nil {
			klog.Warningf("Ignoring PriorityLevelConfiguration object %s because its spec (%s) is broken: %s", pl.Name, fcfmt.Fmt(pl.Spec), err)
			continue
		}
		meal.newPLStates[pl.Name] = state
		state.pl = pl
		state.qsCompleter = qsCompleter
		if state.quiescing { // it was undesired, but no longer
			klog.V(3).Infof("Priority level %q was undesired and has become desired again", pl.Name)
			state.quiescing = false
		}
		if state.pl.Spec.Limited != nil {
			meal.shareSum += float64(state.pl.Spec.Limited.AssuredConcurrencyShares)
		}
		meal.haveExemptPL = meal.haveExemptPL || pl.Name == flowcontrol.PriorityLevelConfigurationNameExempt
		meal.haveCatchAllPL = meal.haveCatchAllPL || pl.Name == flowcontrol.PriorityLevelConfigurationNameCatchAll
	}
}

// Digest the given FlowSchema objects.  Ones that reference a missing
// or broken priority level are not to be passed on to the filter for
// use.  We do this before holding over old priority levels so that
// requests stop going to those levels and FlowSchemaStatus values
// reflect this.  This function also adds any missing mandatory
// FlowSchema objects.  The given objects must all have distinct
// names.
func (meal *cfgMeal) digestFlowSchemasLocked(newFSs []*flowcontrol.FlowSchema) {
	fsSeq := make(apihelpers.FlowSchemaSequence, 0, len(newFSs))
	fsMap := make(map[string]*flowcontrol.FlowSchema, len(newFSs))
	var haveExemptFS, haveCatchAllFS bool
	for i, fs := range newFSs {
		otherFS := fsMap[fs.Name]
		if otherFS != nil {
			// This client is forbidden to do this.
			panic(fmt.Sprintf("Given two FlowSchema objects with the same name: %s and %s", fcfmt.Fmt(otherFS), fcfmt.Fmt(fs)))
		}
		fsMap[fs.Name] = fs
		_, goodPriorityRef := meal.newPLStates[fs.Spec.PriorityLevelConfiguration.Name]

		// Ensure the object's status reflects whether its priority
		// level reference is broken.
		//
		// TODO: consider not even trying if server is not handling
		// requests yet.
		meal.presyncFlowSchemaStatus(fs, meal.cfgCtlr.foundToDangling(goodPriorityRef), fs.Spec.PriorityLevelConfiguration.Name)

		if !goodPriorityRef {
			klog.V(6).Infof("Ignoring FlowSchema %s because of bad priority level reference %q", fs.Name, fs.Spec.PriorityLevelConfiguration.Name)
			continue
		}
		fsSeq = append(fsSeq, newFSs[i])
		haveExemptFS = haveExemptFS || fs.Name == flowcontrol.FlowSchemaNameExempt
		haveCatchAllFS = haveCatchAllFS || fs.Name == flowcontrol.FlowSchemaNameCatchAll
	}
	// sort into the order to be used for matching
	sort.Sort(fsSeq)

	// Supply missing mandatory FlowSchemas, in correct position
	if !haveExemptFS {
		fsSeq = append(apihelpers.FlowSchemaSequence{fcboot.MandatoryFlowSchemaExempt}, fsSeq...)
	}
	if !haveCatchAllFS {
		fsSeq = append(fsSeq, fcboot.MandatoryFlowSchemaCatchAll)
	}

	meal.cfgCtlr.flowSchemas = fsSeq
	if klog.V(5).Enabled() {
		for _, fs := range fsSeq {
			klog.Infof("Using FlowSchema %s", fcfmt.Fmt(fs))
		}
	}
}

// Consider all the priority levels in the previous configuration.
// Keep the ones that are in the new config, supply mandatory
// behavior, or are still busy; for the rest, drop the level if it has
// no queues, otherwise start the quiescing process if that has not
// already been started.
func (meal *cfgMeal) processOldPLsLocked() {
	for plName, plState := range meal.cfgCtlr.priorityLevelStates {
		if meal.newPLStates[plName] != nil {
			// Still desired and already updated
			continue
		}
		if plName == flowcontrol.PriorityLevelConfigurationNameExempt && !meal.haveExemptPL || plName == flowcontrol.PriorityLevelConfigurationNameCatchAll && !meal.haveCatchAllPL {
			// BTW, we know the Spec has not changed because the
			// mandatory objects have immutable Specs
			klog.V(3).Infof("Retaining mandatory priority level %q despite lack of API object", plName)
		} else {
			if plState.queues == nil || plState.numPending == 0 && plState.queues.IsIdle() {
				// Either there are no queues or they are done
				// draining and no use is coming from another
				// goroutine
				klog.V(3).Infof("Removing undesired priority level %q (nilQueues=%v), Type=%v", plName, plState.queues == nil, plState.pl.Spec.Type)
				continue
			}
			if !plState.quiescing {
				klog.V(3).Infof("Priority level %q became undesired", plName)
				plState.quiescing = true
			}
		}
		var err error
		plState.qsCompleter, err = queueSetCompleterForPL(meal.cfgCtlr.queueSetFactory, plState.queues, plState.pl, meal.cfgCtlr.requestWaitLimit, plState.reqsObsPair, plState.execSeatsObs)
		if err != nil {
			// This cannot happen because queueSetCompleterForPL already approved this config
			panic(fmt.Sprintf("%s from name=%q spec=%s", err, plName, fcfmt.Fmt(plState.pl.Spec)))
		}
		if plState.pl.Spec.Limited != nil {
			// We deliberately include the lingering priority levels
			// here so that their queues get some concurrency and they
			// continue to drain.  During this interim a lingering
			// priority level continues to get a concurrency
			// allocation determined by all the share values in the
			// regular way.
			meal.shareSum += float64(plState.pl.Spec.Limited.AssuredConcurrencyShares)
		}
		meal.haveExemptPL = meal.haveExemptPL || plName == flowcontrol.PriorityLevelConfigurationNameExempt
		meal.haveCatchAllPL = meal.haveCatchAllPL || plName == flowcontrol.PriorityLevelConfigurationNameCatchAll
		meal.newPLStates[plName] = plState
	}
}

// For all the priority levels of the new config, divide up the
// server's total concurrency limit among them and create/update their
// QueueSets.
func (meal *cfgMeal) finishQueueSetReconfigsLocked() {
	for plName, plState := range meal.newPLStates {
		if plState.pl.Spec.Limited == nil {
			klog.V(5).Infof("Using exempt priority level %q: quiescing=%v", plName, plState.quiescing)
			continue
		}

		// The use of math.Ceil here means that the results might sum
		// to a little more than serverConcurrencyLimit but the
		// difference will be negligible.
		concurrencyLimit := int(math.Ceil(float64(meal.cfgCtlr.serverConcurrencyLimit) * float64(plState.pl.Spec.Limited.AssuredConcurrencyShares) / meal.shareSum))
		metrics.UpdateSharedConcurrencyLimit(plName, concurrencyLimit)

		if plState.queues == nil {
			klog.V(5).Infof("Introducing queues for priority level %q: config=%s, concurrencyLimit=%d, quiescing=%v (shares=%v, shareSum=%v)", plName, fcfmt.Fmt(plState.pl.Spec), concurrencyLimit, plState.quiescing, plState.pl.Spec.Limited.AssuredConcurrencyShares, meal.shareSum)
		} else {
			klog.V(5).Infof("Retaining queues for priority level %q: config=%s, concurrencyLimit=%d, quiescing=%v, numPending=%d (shares=%v, shareSum=%v)", plName, fcfmt.Fmt(plState.pl.Spec), concurrencyLimit, plState.quiescing, plState.numPending, plState.pl.Spec.Limited.AssuredConcurrencyShares, meal.shareSum)
		}
		plState.queues = plState.qsCompleter.Complete(fq.DispatchingConfig{ConcurrencyLimit: concurrencyLimit})
	}
}
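
// Worked example (numbers are illustrative): with serverConcurrencyLimit=600
// and three limited levels whose AssuredConcurrencyShares are 30, 40, and 100
// (shareSum=170), the levels get ceil(600*30/170)=106, ceil(600*40/170)=142,
// and ceil(600*100/170)=353 seats respectively; the ceilings make the total
// (601) slightly exceed 600, which is the negligible overshoot noted above.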

// queueSetCompleterForPL returns an appropriate QueueSetCompleter for the
// given priority level configuration.  Returns nil if that config
// does not call for limiting.  Returns nil and an error if the given
// object is malformed in a way that is a problem for this package.
func queueSetCompleterForPL(qsf fq.QueueSetFactory, queues fq.QueueSet, pl *flowcontrol.PriorityLevelConfiguration, requestWaitLimit time.Duration, reqsIntPair metrics.TimedObserverPair, execSeatsObs metrics.TimedObserver) (fq.QueueSetCompleter, error) {
	if (pl.Spec.Type == flowcontrol.PriorityLevelEnablementExempt) != (pl.Spec.Limited == nil) {
		return nil, errors.New("broken union structure at the top")
	}
	if (pl.Spec.Type == flowcontrol.PriorityLevelEnablementExempt) != (pl.Name == flowcontrol.PriorityLevelConfigurationNameExempt) {
		// This package does not attempt to cope with a priority level dynamically switching between exempt and not.
		return nil, errors.New("non-alignment between name and type")
	}
	if pl.Spec.Limited == nil {
		return nil, nil
	}
	if (pl.Spec.Limited.LimitResponse.Type == flowcontrol.LimitResponseTypeReject) != (pl.Spec.Limited.LimitResponse.Queuing == nil) {
		return nil, errors.New("broken union structure for limit response")
	}
	qcAPI := pl.Spec.Limited.LimitResponse.Queuing
	qcQS := fq.QueuingConfig{Name: pl.Name}
	if qcAPI != nil {
		qcQS = fq.QueuingConfig{Name: pl.Name,
			DesiredNumQueues: int(qcAPI.Queues),
			QueueLengthLimit: int(qcAPI.QueueLengthLimit),
			HandSize:         int(qcAPI.HandSize),
			RequestWaitLimit: requestWaitLimit,
		}
	}
	var qsc fq.QueueSetCompleter
	var err error
	if queues != nil {
		qsc, err = queues.BeginConfigChange(qcQS)
	} else {
		qsc, err = qsf.BeginConstruction(qcQS, reqsIntPair, execSeatsObs)
	}
	if err != nil {
		err = fmt.Errorf("priority level %q has QueuingConfiguration %#+v, which is invalid: %w", pl.Name, qcAPI, err)
	}
	return qsc, err
}

func (meal *cfgMeal) presyncFlowSchemaStatus(fs *flowcontrol.FlowSchema, isDangling bool, plName string) {
	danglingCondition := apihelpers.GetFlowSchemaConditionByType(fs, flowcontrol.FlowSchemaConditionDangling)
	if danglingCondition == nil {
		danglingCondition = &flowcontrol.FlowSchemaCondition{
			Type: flowcontrol.FlowSchemaConditionDangling,
		}
	}
	desiredStatus := flowcontrol.ConditionFalse
	var desiredReason, desiredMessage string
	if isDangling {
		desiredStatus = flowcontrol.ConditionTrue
		desiredReason = "NotFound"
		desiredMessage = fmt.Sprintf("This FlowSchema references the PriorityLevelConfiguration object named %q but there is no such object", plName)
	} else {
		desiredReason = "Found"
		desiredMessage = fmt.Sprintf("This FlowSchema references the PriorityLevelConfiguration object named %q and it exists", plName)
	}
	if danglingCondition.Status == desiredStatus && danglingCondition.Reason == desiredReason && danglingCondition.Message == desiredMessage {
		return
	}
	now := meal.cfgCtlr.clock.Now()
	meal.fsStatusUpdates = append(meal.fsStatusUpdates, fsStatusUpdate{
		flowSchema: fs,
		condition: flowcontrol.FlowSchemaCondition{
			Type:               flowcontrol.FlowSchemaConditionDangling,
			Status:             desiredStatus,
			LastTransitionTime: metav1.NewTime(now),
			Reason:             desiredReason,
			Message:            desiredMessage,
		},
		oldValue: *danglingCondition})
}

// imaginePL adds a priority level based on one of the mandatory ones
// that does not actually exist (right now) as a real API object.
func (meal *cfgMeal) imaginePL(proto *flowcontrol.PriorityLevelConfiguration, requestWaitLimit time.Duration) {
	klog.V(3).Infof("No %s PriorityLevelConfiguration found, imagining one", proto.Name)
	labelValues := []string{proto.Name}
	reqsObsPair := meal.cfgCtlr.reqsObsPairGenerator.Generate(1, 1, labelValues)
	execSeatsObs := meal.cfgCtlr.execSeatsObsGenerator.Generate(1, 1, labelValues)
	qsCompleter, err := queueSetCompleterForPL(meal.cfgCtlr.queueSetFactory, nil, proto, requestWaitLimit, reqsObsPair, execSeatsObs)
	if err != nil {
		// This cannot happen because proto is one of the mandatory
		// objects and these are not erroneous
		panic(err)
	}
	meal.newPLStates[proto.Name] = &priorityLevelState{
		pl:           proto,
		qsCompleter:  qsCompleter,
		reqsObsPair:  reqsObsPair,
		execSeatsObs: execSeatsObs,
	}
	if proto.Spec.Limited != nil {
		meal.shareSum += float64(proto.Spec.Limited.AssuredConcurrencyShares)
	}
}

type immediateRequest struct{}

func (immediateRequest) Finish(execute func()) bool {
	execute()
	return false
}

// startRequest classifies and, if appropriate, enqueues the request.
// Returns a nil Request if and only if the request is to be rejected.
// The returned bool indicates whether the request is exempt from
// limitation.  The startWaitingTime is when the request started
// waiting in its queue, or `Time{}` if this did not happen.
func (cfgCtlr *configController) startRequest(ctx context.Context, rd RequestDigest, queueNoteFn fq.QueueNoteFn) (fs *flowcontrol.FlowSchema, pl *flowcontrol.PriorityLevelConfiguration, isExempt bool, req fq.Request, startWaitingTime time.Time, flowDistinguisher string) {
	klog.V(7).Infof("startRequest(%#+v)", rd)
	cfgCtlr.lock.RLock()
	defer cfgCtlr.lock.RUnlock()
	var selectedFlowSchema, catchAllFlowSchema *flowcontrol.FlowSchema
	for _, fs := range cfgCtlr.flowSchemas {
		if matchesFlowSchema(rd, fs) {
			selectedFlowSchema = fs
			break
		}
		if fs.Name == flowcontrol.FlowSchemaNameCatchAll {
			catchAllFlowSchema = fs
		}
	}
	if selectedFlowSchema == nil {
		// This should never happen. If the requestDigest's User is a part of
		// system:authenticated or system:unauthenticated, the catch-all flow
		// schema should match it. However, if that invariant somehow fails,
		// fall back to the catch-all flow schema anyway.
		if catchAllFlowSchema == nil {
			// This should absolutely never, ever happen! APF guarantees two
			// undeletable flow schemas at all times: an exempt flow schema and a
			// catch-all flow schema.
			panic(fmt.Sprintf("no fallback catch-all flow schema found for request %#+v and user %#+v", rd.RequestInfo, rd.User))
		}
		selectedFlowSchema = catchAllFlowSchema
		klog.Warningf("no match found for request %#+v and user %#+v; selecting catchAll=%s as fallback flow schema", rd.RequestInfo, rd.User, fcfmt.Fmt(selectedFlowSchema))
	}
	plName := selectedFlowSchema.Spec.PriorityLevelConfiguration.Name
	plState := cfgCtlr.priorityLevelStates[plName]
	if plState.pl.Spec.Type == flowcontrol.PriorityLevelEnablementExempt {
		klog.V(7).Infof("startRequest(%#+v) => fsName=%q, distMethod=%#+v, plName=%q, immediate", rd, selectedFlowSchema.Name, selectedFlowSchema.Spec.DistinguisherMethod, plName)
		return selectedFlowSchema, plState.pl, true, immediateRequest{}, time.Time{}, ""
	}
	var numQueues int32
	if plState.pl.Spec.Limited.LimitResponse.Type == flowcontrol.LimitResponseTypeQueue {
		numQueues = plState.pl.Spec.Limited.LimitResponse.Queuing.Queues
	}
	var hashValue uint64
	if numQueues > 1 {
		flowDistinguisher = computeFlowDistinguisher(rd, selectedFlowSchema.Spec.DistinguisherMethod)
		hashValue = hashFlowID(selectedFlowSchema.Name, flowDistinguisher)
	}
	startWaitingTime = time.Now()
	klog.V(7).Infof("startRequest(%#+v) => fsName=%q, distMethod=%#+v, plName=%q, numQueues=%d", rd, selectedFlowSchema.Name, selectedFlowSchema.Spec.DistinguisherMethod, plName, numQueues)
	req, idle := plState.queues.StartRequest(ctx, &rd.WorkEstimate, hashValue, flowDistinguisher, selectedFlowSchema.Name, rd.RequestInfo, rd.User, queueNoteFn)
	if idle {
		cfgCtlr.maybeReapReadLocked(plName, plState)
	}
	return selectedFlowSchema, plState.pl, false, req, startWaitingTime, flowDistinguisher
}
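
// Informal sketch of the queued (non-exempt) path above, with hypothetical
// values: a request from user "alice" matching a FlowSchema named
// "service-accounts" whose distinguisher method is ByUser gets
// flowDistinguisher "alice", then hashValue = hashFlowID("service-accounts",
// "alice"), and that hash is the entropy the QueueSet uses to shuffle-shard
// the request into one of its queues.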

// maybeReap will remove the last internal traces of the named
// priority level if it has no more use.  Call this after getting a
// clue that the given priority level is undesired and idle.
func (cfgCtlr *configController) maybeReap(plName string) {
	cfgCtlr.lock.RLock()
	defer cfgCtlr.lock.RUnlock()
	plState := cfgCtlr.priorityLevelStates[plName]
	if plState == nil {
		klog.V(7).Infof("plName=%s, plState==nil", plName)
		return
	}
	if plState.queues != nil {
		useless := plState.quiescing && plState.numPending == 0 && plState.queues.IsIdle()
		klog.V(7).Infof("plState.quiescing=%v, plState.numPending=%d, useless=%v", plState.quiescing, plState.numPending, useless)
		if !useless {
			return
		}
	}
	klog.V(3).Infof("Triggered API priority and fairness config reloading because priority level %s is undesired and idle", plName)
	cfgCtlr.configQueue.Add(0)
}

// maybeReapReadLocked requires the cfgCtlr's lock to already be held
// and will remove the last internal traces of the named priority
// level if it has no more use.  Call this if both (1) plState.queues
// is non-nil and reported being idle, and (2) cfgCtlr's lock has not
// been released since then.
func (cfgCtlr *configController) maybeReapReadLocked(plName string, plState *priorityLevelState) {
	if !(plState.quiescing && plState.numPending == 0) {
		return
	}
	klog.V(3).Infof("Triggered API priority and fairness config reloading because priority level %s is undesired and idle", plName)
	cfgCtlr.configQueue.Add(0)
}

// computeFlowDistinguisher extracts the flow distinguisher according to the given method
func computeFlowDistinguisher(rd RequestDigest, method *flowcontrol.FlowDistinguisherMethod) string {
	if method == nil {
		return ""
	}
	switch method.Type {
	case flowcontrol.FlowDistinguisherMethodByUserType:
		return rd.User.GetName()
	case flowcontrol.FlowDistinguisherMethodByNamespaceType:
		return rd.RequestInfo.Namespace
	default:
		// this should never be reached
		panic("invalid flow-distinguisher method")
	}
}

func hashFlowID(fsName, fDistinguisher string) uint64 {
	hash := sha256.New()
	var sep = [1]byte{0}
	hash.Write([]byte(fsName))
	hash.Write(sep[:])
	hash.Write([]byte(fDistinguisher))
	var sum [32]byte
	hash.Sum(sum[:0])
	return binary.LittleEndian.Uint64(sum[:8])
}
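
// Note on hashFlowID: the flow identifier is the pair (FlowSchema name, flow
// distinguisher), joined with a NUL separator so that distinct pairs cannot
// collide textually; the first 8 bytes of the SHA-256 digest, read
// little-endian, give the deterministic 64-bit hash that startRequest feeds
// to the QueueSet for shuffle sharding.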