123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890 |
- /*
- Copyright 2015 The Kubernetes Authors.
- Licensed under the Apache License, Version 2.0 (the "License");
- you may not use this file except in compliance with the License.
- You may obtain a copy of the License at
- http://www.apache.org/licenses/LICENSE-2.0
- Unless required by applicable law or agreed to in writing, software
- distributed under the License is distributed on an "AS IS" BASIS,
- WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- See the License for the specific language governing permissions and
- limitations under the License.
- */
- package podautoscaler
- import (
- "fmt"
- "math"
- "time"
- autoscalingv1 "k8s.io/api/autoscaling/v1"
- autoscalingv2 "k8s.io/api/autoscaling/v2beta2"
- v1 "k8s.io/api/core/v1"
- apiequality "k8s.io/apimachinery/pkg/api/equality"
- "k8s.io/apimachinery/pkg/api/errors"
- apimeta "k8s.io/apimachinery/pkg/api/meta"
- "k8s.io/apimachinery/pkg/api/resource"
- metav1 "k8s.io/apimachinery/pkg/apis/meta/v1"
- "k8s.io/apimachinery/pkg/labels"
- "k8s.io/apimachinery/pkg/runtime"
- "k8s.io/apimachinery/pkg/runtime/schema"
- utilruntime "k8s.io/apimachinery/pkg/util/runtime"
- "k8s.io/apimachinery/pkg/util/wait"
- autoscalinginformers "k8s.io/client-go/informers/autoscaling/v1"
- coreinformers "k8s.io/client-go/informers/core/v1"
- "k8s.io/client-go/kubernetes/scheme"
- autoscalingclient "k8s.io/client-go/kubernetes/typed/autoscaling/v1"
- v1core "k8s.io/client-go/kubernetes/typed/core/v1"
- autoscalinglisters "k8s.io/client-go/listers/autoscaling/v1"
- corelisters "k8s.io/client-go/listers/core/v1"
- scaleclient "k8s.io/client-go/scale"
- "k8s.io/client-go/tools/cache"
- "k8s.io/client-go/tools/record"
- "k8s.io/client-go/util/workqueue"
- "k8s.io/klog"
- "k8s.io/kubernetes/pkg/api/legacyscheme"
- "k8s.io/kubernetes/pkg/controller"
- metricsclient "k8s.io/kubernetes/pkg/controller/podautoscaler/metrics"
- )
- var (
- scaleUpLimitFactor = 2.0
- scaleUpLimitMinimum = 4.0
- )
- type timestampedRecommendation struct {
- recommendation int32
- timestamp time.Time
- }
- // HorizontalController is responsible for the synchronizing HPA objects stored
- // in the system with the actual deployments/replication controllers they
- // control.
- type HorizontalController struct {
- scaleNamespacer scaleclient.ScalesGetter
- hpaNamespacer autoscalingclient.HorizontalPodAutoscalersGetter
- mapper apimeta.RESTMapper
- replicaCalc *ReplicaCalculator
- eventRecorder record.EventRecorder
- downscaleStabilisationWindow time.Duration
- // hpaLister is able to list/get HPAs from the shared cache from the informer passed in to
- // NewHorizontalController.
- hpaLister autoscalinglisters.HorizontalPodAutoscalerLister
- hpaListerSynced cache.InformerSynced
- // podLister is able to list/get Pods from the shared cache from the informer passed in to
- // NewHorizontalController.
- podLister corelisters.PodLister
- podListerSynced cache.InformerSynced
- // Controllers that need to be synced
- queue workqueue.RateLimitingInterface
- // Latest unstabilized recommendations for each autoscaler.
- recommendations map[string][]timestampedRecommendation
- }
- // NewHorizontalController creates a new HorizontalController.
- func NewHorizontalController(
- evtNamespacer v1core.EventsGetter,
- scaleNamespacer scaleclient.ScalesGetter,
- hpaNamespacer autoscalingclient.HorizontalPodAutoscalersGetter,
- mapper apimeta.RESTMapper,
- metricsClient metricsclient.MetricsClient,
- hpaInformer autoscalinginformers.HorizontalPodAutoscalerInformer,
- podInformer coreinformers.PodInformer,
- resyncPeriod time.Duration,
- downscaleStabilisationWindow time.Duration,
- tolerance float64,
- cpuInitializationPeriod,
- delayOfInitialReadinessStatus time.Duration,
- ) *HorizontalController {
- broadcaster := record.NewBroadcaster()
- broadcaster.StartLogging(klog.Infof)
- broadcaster.StartRecordingToSink(&v1core.EventSinkImpl{Interface: evtNamespacer.Events("")})
- recorder := broadcaster.NewRecorder(scheme.Scheme, v1.EventSource{Component: "horizontal-pod-autoscaler"})
- hpaController := &HorizontalController{
- eventRecorder: recorder,
- scaleNamespacer: scaleNamespacer,
- hpaNamespacer: hpaNamespacer,
- downscaleStabilisationWindow: downscaleStabilisationWindow,
- queue: workqueue.NewNamedRateLimitingQueue(NewDefaultHPARateLimiter(resyncPeriod), "horizontalpodautoscaler"),
- mapper: mapper,
- recommendations: map[string][]timestampedRecommendation{},
- }
- hpaInformer.Informer().AddEventHandlerWithResyncPeriod(
- cache.ResourceEventHandlerFuncs{
- AddFunc: hpaController.enqueueHPA,
- UpdateFunc: hpaController.updateHPA,
- DeleteFunc: hpaController.deleteHPA,
- },
- resyncPeriod,
- )
- hpaController.hpaLister = hpaInformer.Lister()
- hpaController.hpaListerSynced = hpaInformer.Informer().HasSynced
- hpaController.podLister = podInformer.Lister()
- hpaController.podListerSynced = podInformer.Informer().HasSynced
- replicaCalc := NewReplicaCalculator(
- metricsClient,
- hpaController.podLister,
- tolerance,
- cpuInitializationPeriod,
- delayOfInitialReadinessStatus,
- )
- hpaController.replicaCalc = replicaCalc
- return hpaController
- }
- // Run begins watching and syncing.
- func (a *HorizontalController) Run(stopCh <-chan struct{}) {
- defer utilruntime.HandleCrash()
- defer a.queue.ShutDown()
- klog.Infof("Starting HPA controller")
- defer klog.Infof("Shutting down HPA controller")
- if !controller.WaitForCacheSync("HPA", stopCh, a.hpaListerSynced, a.podListerSynced) {
- return
- }
- // start a single worker (we may wish to start more in the future)
- go wait.Until(a.worker, time.Second, stopCh)
- <-stopCh
- }
- // obj could be an *v1.HorizontalPodAutoscaler, or a DeletionFinalStateUnknown marker item.
- func (a *HorizontalController) updateHPA(old, cur interface{}) {
- a.enqueueHPA(cur)
- }
- // obj could be an *v1.HorizontalPodAutoscaler, or a DeletionFinalStateUnknown marker item.
- func (a *HorizontalController) enqueueHPA(obj interface{}) {
- key, err := controller.KeyFunc(obj)
- if err != nil {
- utilruntime.HandleError(fmt.Errorf("couldn't get key for object %+v: %v", obj, err))
- return
- }
- // Requests are always added to queue with resyncPeriod delay. If there's already
- // request for the HPA in the queue then a new request is always dropped. Requests spend resync
- // interval in queue so HPAs are processed every resync interval.
- a.queue.AddRateLimited(key)
- }
- func (a *HorizontalController) deleteHPA(obj interface{}) {
- key, err := controller.KeyFunc(obj)
- if err != nil {
- utilruntime.HandleError(fmt.Errorf("couldn't get key for object %+v: %v", obj, err))
- return
- }
- // TODO: could we leak if we fail to get the key?
- a.queue.Forget(key)
- }
- func (a *HorizontalController) worker() {
- for a.processNextWorkItem() {
- }
- klog.Infof("horizontal pod autoscaler controller worker shutting down")
- }
- func (a *HorizontalController) processNextWorkItem() bool {
- key, quit := a.queue.Get()
- if quit {
- return false
- }
- defer a.queue.Done(key)
- deleted, err := a.reconcileKey(key.(string))
- if err != nil {
- utilruntime.HandleError(err)
- }
- // Add request processing HPA to queue with resyncPeriod delay.
- // Requests are always added to queue with resyncPeriod delay. If there's already request
- // for the HPA in the queue then a new request is always dropped. Requests spend resyncPeriod
- // in queue so HPAs are processed every resyncPeriod.
- // Request is added here just in case last resync didn't insert request into the queue. This
- // happens quite often because there is race condition between adding request after resyncPeriod
- // and removing them from queue. Request can be added by resync before previous request is
- // removed from queue. If we didn't add request here then in this case one request would be dropped
- // and HPA would processed after 2 x resyncPeriod.
- if !deleted {
- a.queue.AddRateLimited(key)
- }
- return true
- }
- // computeReplicasForMetrics computes the desired number of replicas for the metric specifications listed in the HPA,
- // returning the maximum of the computed replica counts, a description of the associated metric, and the statuses of
- // all metrics computed.
- func (a *HorizontalController) computeReplicasForMetrics(hpa *autoscalingv2.HorizontalPodAutoscaler, scale *autoscalingv1.Scale,
- metricSpecs []autoscalingv2.MetricSpec) (replicas int32, metric string, statuses []autoscalingv2.MetricStatus, timestamp time.Time, err error) {
- specReplicas := scale.Spec.Replicas
- statusReplicas := scale.Status.Replicas
- statuses = make([]autoscalingv2.MetricStatus, len(metricSpecs))
- if scale.Status.Selector == "" {
- errMsg := "selector is required"
- a.eventRecorder.Event(hpa, v1.EventTypeWarning, "SelectorRequired", errMsg)
- setCondition(hpa, autoscalingv2.ScalingActive, v1.ConditionFalse, "InvalidSelector", "the HPA target's scale is missing a selector")
- return 0, "", nil, time.Time{}, fmt.Errorf(errMsg)
- }
- selector, err := labels.Parse(scale.Status.Selector)
- if err != nil {
- errMsg := fmt.Sprintf("couldn't convert selector into a corresponding internal selector object: %v", err)
- a.eventRecorder.Event(hpa, v1.EventTypeWarning, "InvalidSelector", errMsg)
- setCondition(hpa, autoscalingv2.ScalingActive, v1.ConditionFalse, "InvalidSelector", errMsg)
- return 0, "", nil, time.Time{}, fmt.Errorf(errMsg)
- }
- invalidMetricsCount := 0
- var invalidMetricError error
- for i, metricSpec := range metricSpecs {
- replicaCountProposal, metricNameProposal, timestampProposal, err := a.computeReplicasForMetric(hpa, metricSpec, specReplicas, statusReplicas, selector, &statuses[i])
- if err != nil {
- invalidMetricsCount++
- invalidMetricError = err
- }
- if err == nil && (replicas == 0 || replicaCountProposal > replicas) {
- timestamp = timestampProposal
- replicas = replicaCountProposal
- metric = metricNameProposal
- }
- }
- // If all metrics are invalid or some are invalid and we would scale down,
- // return an error and set the condition of the hpa based on the first invalid metric.
- // Otherwise set the condition as scaling active as we're going to scale
- if invalidMetricsCount >= len(metricSpecs) || (invalidMetricsCount > 0 && replicas < specReplicas) {
- return 0, "", statuses, time.Time{}, fmt.Errorf("Invalid metrics (%v invalid out of %v), last error was: %v", invalidMetricsCount, len(metricSpecs), invalidMetricError)
- } else {
- setCondition(hpa, autoscalingv2.ScalingActive, v1.ConditionTrue, "ValidMetricFound", "the HPA was able to successfully calculate a replica count from %v", metric)
- }
- return replicas, metric, statuses, timestamp, nil
- }
- // computeReplicasForMetric computes the desired number of replicas for for a specific hpa and single metric specification.
- func (a *HorizontalController) computeReplicasForMetric(hpa *autoscalingv2.HorizontalPodAutoscaler, spec autoscalingv2.MetricSpec,
- specReplicas, statusReplicas int32, selector labels.Selector, status *autoscalingv2.MetricStatus) (replicaCountProposal int32, metricNameProposal string,
- timestampProposal time.Time, err error) {
- switch spec.Type {
- case autoscalingv2.ObjectMetricSourceType:
- metricSelector, err := metav1.LabelSelectorAsSelector(spec.Object.Metric.Selector)
- if err != nil {
- a.eventRecorder.Event(hpa, v1.EventTypeWarning, "FailedGetObjectMetric", err.Error())
- setCondition(hpa, autoscalingv2.ScalingActive, v1.ConditionFalse, "FailedGetObjectMetric", "the HPA was unable to compute the replica count: %v", err)
- return 0, "", time.Time{}, fmt.Errorf("failed to get object metric value: %v", err)
- }
- replicaCountProposal, timestampProposal, metricNameProposal, err = a.computeStatusForObjectMetric(specReplicas, statusReplicas, spec, hpa, selector, status, metricSelector)
- if err != nil {
- return 0, "", time.Time{}, fmt.Errorf("failed to get object metric value: %v", err)
- }
- case autoscalingv2.PodsMetricSourceType:
- metricSelector, err := metav1.LabelSelectorAsSelector(spec.Pods.Metric.Selector)
- if err != nil {
- a.eventRecorder.Event(hpa, v1.EventTypeWarning, "FailedGetPodsMetric", err.Error())
- setCondition(hpa, autoscalingv2.ScalingActive, v1.ConditionFalse, "FailedGetPodsMetric", "the HPA was unable to compute the replica count: %v", err)
- return 0, "", time.Time{}, fmt.Errorf("failed to get pods metric value: %v", err)
- }
- replicaCountProposal, timestampProposal, metricNameProposal, err = a.computeStatusForPodsMetric(specReplicas, spec, hpa, selector, status, metricSelector)
- if err != nil {
- return 0, "", time.Time{}, fmt.Errorf("failed to get object metric value: %v", err)
- }
- case autoscalingv2.ResourceMetricSourceType:
- replicaCountProposal, timestampProposal, metricNameProposal, err = a.computeStatusForResourceMetric(specReplicas, spec, hpa, selector, status)
- if err != nil {
- return 0, "", time.Time{}, err
- }
- case autoscalingv2.ExternalMetricSourceType:
- replicaCountProposal, timestampProposal, metricNameProposal, err = a.computeStatusForExternalMetric(specReplicas, statusReplicas, spec, hpa, selector, status)
- if err != nil {
- return 0, "", time.Time{}, err
- }
- default:
- errMsg := fmt.Sprintf("unknown metric source type %q", string(spec.Type))
- a.eventRecorder.Event(hpa, v1.EventTypeWarning, "InvalidMetricSourceType", errMsg)
- setCondition(hpa, autoscalingv2.ScalingActive, v1.ConditionFalse, "InvalidMetricSourceType", "the HPA was unable to compute the replica count: %v", fmt.Errorf(errMsg))
- return 0, "", time.Time{}, fmt.Errorf(errMsg)
- }
- return replicaCountProposal, metricNameProposal, timestampProposal, nil
- }
- func (a *HorizontalController) reconcileKey(key string) (deleted bool, err error) {
- namespace, name, err := cache.SplitMetaNamespaceKey(key)
- if err != nil {
- return true, err
- }
- hpa, err := a.hpaLister.HorizontalPodAutoscalers(namespace).Get(name)
- if errors.IsNotFound(err) {
- klog.Infof("Horizontal Pod Autoscaler %s has been deleted in %s", name, namespace)
- delete(a.recommendations, key)
- return true, nil
- }
- return false, a.reconcileAutoscaler(hpa, key)
- }
- // computeStatusForObjectMetric computes the desired number of replicas for the specified metric of type ObjectMetricSourceType.
- func (a *HorizontalController) computeStatusForObjectMetric(specReplicas, statusReplicas int32, metricSpec autoscalingv2.MetricSpec, hpa *autoscalingv2.HorizontalPodAutoscaler, selector labels.Selector, status *autoscalingv2.MetricStatus, metricSelector labels.Selector) (int32, time.Time, string, error) {
- if metricSpec.Object.Target.Type == autoscalingv2.ValueMetricType {
- replicaCountProposal, utilizationProposal, timestampProposal, err := a.replicaCalc.GetObjectMetricReplicas(specReplicas, metricSpec.Object.Target.Value.MilliValue(), metricSpec.Object.Metric.Name, hpa.Namespace, &metricSpec.Object.DescribedObject, selector, metricSelector)
- if err != nil {
- a.eventRecorder.Event(hpa, v1.EventTypeWarning, "FailedGetObjectMetric", err.Error())
- setCondition(hpa, autoscalingv2.ScalingActive, v1.ConditionFalse, "FailedGetObjectMetric", "the HPA was unable to compute the replica count: %v", err)
- return 0, timestampProposal, "", err
- }
- *status = autoscalingv2.MetricStatus{
- Type: autoscalingv2.ObjectMetricSourceType,
- Object: &autoscalingv2.ObjectMetricStatus{
- DescribedObject: metricSpec.Object.DescribedObject,
- Metric: autoscalingv2.MetricIdentifier{
- Name: metricSpec.Object.Metric.Name,
- Selector: metricSpec.Object.Metric.Selector,
- },
- Current: autoscalingv2.MetricValueStatus{
- Value: resource.NewMilliQuantity(utilizationProposal, resource.DecimalSI),
- },
- },
- }
- return replicaCountProposal, timestampProposal, fmt.Sprintf("%s metric %s", metricSpec.Object.DescribedObject.Kind, metricSpec.Object.Metric.Name), nil
- } else if metricSpec.Object.Target.Type == autoscalingv2.AverageValueMetricType {
- replicaCountProposal, utilizationProposal, timestampProposal, err := a.replicaCalc.GetObjectPerPodMetricReplicas(statusReplicas, metricSpec.Object.Target.AverageValue.MilliValue(), metricSpec.Object.Metric.Name, hpa.Namespace, &metricSpec.Object.DescribedObject, metricSelector)
- if err != nil {
- a.eventRecorder.Event(hpa, v1.EventTypeWarning, "FailedGetObjectMetric", err.Error())
- setCondition(hpa, autoscalingv2.ScalingActive, v1.ConditionFalse, "FailedGetObjectMetric", "the HPA was unable to compute the replica count: %v", err)
- return 0, time.Time{}, "", fmt.Errorf("failed to get %s object metric: %v", metricSpec.Object.Metric.Name, err)
- }
- *status = autoscalingv2.MetricStatus{
- Type: autoscalingv2.ObjectMetricSourceType,
- Object: &autoscalingv2.ObjectMetricStatus{
- Metric: autoscalingv2.MetricIdentifier{
- Name: metricSpec.Object.Metric.Name,
- Selector: metricSpec.Object.Metric.Selector,
- },
- Current: autoscalingv2.MetricValueStatus{
- AverageValue: resource.NewMilliQuantity(utilizationProposal, resource.DecimalSI),
- },
- },
- }
- return replicaCountProposal, timestampProposal, fmt.Sprintf("external metric %s(%+v)", metricSpec.Object.Metric.Name, metricSpec.Object.Metric.Selector), nil
- }
- errMsg := "invalid object metric source: neither a value target nor an average value target was set"
- a.eventRecorder.Event(hpa, v1.EventTypeWarning, "FailedGetObjectMetric", errMsg)
- setCondition(hpa, autoscalingv2.ScalingActive, v1.ConditionFalse, "FailedGetObjectMetric", "the HPA was unable to compute the replica count: %s", errMsg)
- return 0, time.Time{}, "", fmt.Errorf(errMsg)
- }
- // computeStatusForPodsMetric computes the desired number of replicas for the specified metric of type PodsMetricSourceType.
- func (a *HorizontalController) computeStatusForPodsMetric(currentReplicas int32, metricSpec autoscalingv2.MetricSpec, hpa *autoscalingv2.HorizontalPodAutoscaler, selector labels.Selector, status *autoscalingv2.MetricStatus, metricSelector labels.Selector) (int32, time.Time, string, error) {
- replicaCountProposal, utilizationProposal, timestampProposal, err := a.replicaCalc.GetMetricReplicas(currentReplicas, metricSpec.Pods.Target.AverageValue.MilliValue(), metricSpec.Pods.Metric.Name, hpa.Namespace, selector, metricSelector)
- if err != nil {
- a.eventRecorder.Event(hpa, v1.EventTypeWarning, "FailedGetPodsMetric", err.Error())
- setCondition(hpa, autoscalingv2.ScalingActive, v1.ConditionFalse, "FailedGetPodsMetric", "the HPA was unable to compute the replica count: %v", err)
- return 0, timestampProposal, "", err
- }
- *status = autoscalingv2.MetricStatus{
- Type: autoscalingv2.PodsMetricSourceType,
- Pods: &autoscalingv2.PodsMetricStatus{
- Metric: autoscalingv2.MetricIdentifier{
- Name: metricSpec.Pods.Metric.Name,
- Selector: metricSpec.Pods.Metric.Selector,
- },
- Current: autoscalingv2.MetricValueStatus{
- AverageValue: resource.NewMilliQuantity(utilizationProposal, resource.DecimalSI),
- },
- },
- }
- return replicaCountProposal, timestampProposal, fmt.Sprintf("pods metric %s", metricSpec.Pods.Metric.Name), nil
- }
- // computeStatusForResourceMetric computes the desired number of replicas for the specified metric of type ResourceMetricSourceType.
- func (a *HorizontalController) computeStatusForResourceMetric(currentReplicas int32, metricSpec autoscalingv2.MetricSpec, hpa *autoscalingv2.HorizontalPodAutoscaler, selector labels.Selector, status *autoscalingv2.MetricStatus) (int32, time.Time, string, error) {
- if metricSpec.Resource.Target.AverageValue != nil {
- var rawProposal int64
- replicaCountProposal, rawProposal, timestampProposal, err := a.replicaCalc.GetRawResourceReplicas(currentReplicas, metricSpec.Resource.Target.AverageValue.MilliValue(), metricSpec.Resource.Name, hpa.Namespace, selector)
- if err != nil {
- a.eventRecorder.Event(hpa, v1.EventTypeWarning, "FailedGetResourceMetric", err.Error())
- setCondition(hpa, autoscalingv2.ScalingActive, v1.ConditionFalse, "FailedGetResourceMetric", "the HPA was unable to compute the replica count: %v", err)
- return 0, time.Time{}, "", fmt.Errorf("failed to get %s utilization: %v", metricSpec.Resource.Name, err)
- }
- metricNameProposal := fmt.Sprintf("%s resource", metricSpec.Resource.Name)
- *status = autoscalingv2.MetricStatus{
- Type: autoscalingv2.ResourceMetricSourceType,
- Resource: &autoscalingv2.ResourceMetricStatus{
- Name: metricSpec.Resource.Name,
- Current: autoscalingv2.MetricValueStatus{
- AverageValue: resource.NewMilliQuantity(rawProposal, resource.DecimalSI),
- },
- },
- }
- return replicaCountProposal, timestampProposal, metricNameProposal, nil
- } else {
- if metricSpec.Resource.Target.AverageUtilization == nil {
- errMsg := "invalid resource metric source: neither a utilization target nor a value target was set"
- a.eventRecorder.Event(hpa, v1.EventTypeWarning, "FailedGetResourceMetric", errMsg)
- setCondition(hpa, autoscalingv2.ScalingActive, v1.ConditionFalse, "FailedGetResourceMetric", "the HPA was unable to compute the replica count: %s", errMsg)
- return 0, time.Time{}, "", fmt.Errorf(errMsg)
- }
- targetUtilization := *metricSpec.Resource.Target.AverageUtilization
- var percentageProposal int32
- var rawProposal int64
- replicaCountProposal, percentageProposal, rawProposal, timestampProposal, err := a.replicaCalc.GetResourceReplicas(currentReplicas, targetUtilization, metricSpec.Resource.Name, hpa.Namespace, selector)
- if err != nil {
- a.eventRecorder.Event(hpa, v1.EventTypeWarning, "FailedGetResourceMetric", err.Error())
- setCondition(hpa, autoscalingv2.ScalingActive, v1.ConditionFalse, "FailedGetResourceMetric", "the HPA was unable to compute the replica count: %v", err)
- return 0, time.Time{}, "", fmt.Errorf("failed to get %s utilization: %v", metricSpec.Resource.Name, err)
- }
- metricNameProposal := fmt.Sprintf("%s resource utilization (percentage of request)", metricSpec.Resource.Name)
- *status = autoscalingv2.MetricStatus{
- Type: autoscalingv2.ResourceMetricSourceType,
- Resource: &autoscalingv2.ResourceMetricStatus{
- Name: metricSpec.Resource.Name,
- Current: autoscalingv2.MetricValueStatus{
- AverageUtilization: &percentageProposal,
- AverageValue: resource.NewMilliQuantity(rawProposal, resource.DecimalSI),
- },
- },
- }
- return replicaCountProposal, timestampProposal, metricNameProposal, nil
- }
- }
- // computeStatusForExternalMetric computes the desired number of replicas for the specified metric of type ExternalMetricSourceType.
- func (a *HorizontalController) computeStatusForExternalMetric(specReplicas, statusReplicas int32, metricSpec autoscalingv2.MetricSpec, hpa *autoscalingv2.HorizontalPodAutoscaler, selector labels.Selector, status *autoscalingv2.MetricStatus) (int32, time.Time, string, error) {
- if metricSpec.External.Target.AverageValue != nil {
- replicaCountProposal, utilizationProposal, timestampProposal, err := a.replicaCalc.GetExternalPerPodMetricReplicas(statusReplicas, metricSpec.External.Target.AverageValue.MilliValue(), metricSpec.External.Metric.Name, hpa.Namespace, metricSpec.External.Metric.Selector)
- if err != nil {
- a.eventRecorder.Event(hpa, v1.EventTypeWarning, "FailedGetExternalMetric", err.Error())
- setCondition(hpa, autoscalingv2.ScalingActive, v1.ConditionFalse, "FailedGetExternalMetric", "the HPA was unable to compute the replica count: %v", err)
- return 0, time.Time{}, "", fmt.Errorf("failed to get %s external metric: %v", metricSpec.External.Metric.Name, err)
- }
- *status = autoscalingv2.MetricStatus{
- Type: autoscalingv2.ExternalMetricSourceType,
- External: &autoscalingv2.ExternalMetricStatus{
- Metric: autoscalingv2.MetricIdentifier{
- Name: metricSpec.External.Metric.Name,
- Selector: metricSpec.External.Metric.Selector,
- },
- Current: autoscalingv2.MetricValueStatus{
- AverageValue: resource.NewMilliQuantity(utilizationProposal, resource.DecimalSI),
- },
- },
- }
- return replicaCountProposal, timestampProposal, fmt.Sprintf("external metric %s(%+v)", metricSpec.External.Metric.Name, metricSpec.External.Metric.Selector), nil
- }
- if metricSpec.External.Target.Value != nil {
- replicaCountProposal, utilizationProposal, timestampProposal, err := a.replicaCalc.GetExternalMetricReplicas(specReplicas, metricSpec.External.Target.Value.MilliValue(), metricSpec.External.Metric.Name, hpa.Namespace, metricSpec.External.Metric.Selector, selector)
- if err != nil {
- a.eventRecorder.Event(hpa, v1.EventTypeWarning, "FailedGetExternalMetric", err.Error())
- setCondition(hpa, autoscalingv2.ScalingActive, v1.ConditionFalse, "FailedGetExternalMetric", "the HPA was unable to compute the replica count: %v", err)
- return 0, time.Time{}, "", fmt.Errorf("failed to get external metric %s: %v", metricSpec.External.Metric.Name, err)
- }
- *status = autoscalingv2.MetricStatus{
- Type: autoscalingv2.ExternalMetricSourceType,
- External: &autoscalingv2.ExternalMetricStatus{
- Metric: autoscalingv2.MetricIdentifier{
- Name: metricSpec.External.Metric.Name,
- Selector: metricSpec.External.Metric.Selector,
- },
- Current: autoscalingv2.MetricValueStatus{
- Value: resource.NewMilliQuantity(utilizationProposal, resource.DecimalSI),
- },
- },
- }
- return replicaCountProposal, timestampProposal, fmt.Sprintf("external metric %s(%+v)", metricSpec.External.Metric.Name, metricSpec.External.Metric.Selector), nil
- }
- errMsg := "invalid external metric source: neither a value target nor an average value target was set"
- a.eventRecorder.Event(hpa, v1.EventTypeWarning, "FailedGetExternalMetric", errMsg)
- setCondition(hpa, autoscalingv2.ScalingActive, v1.ConditionFalse, "FailedGetExternalMetric", "the HPA was unable to compute the replica count: %s", errMsg)
- return 0, time.Time{}, "", fmt.Errorf(errMsg)
- }
- func (a *HorizontalController) recordInitialRecommendation(currentReplicas int32, key string) {
- if a.recommendations[key] == nil {
- a.recommendations[key] = []timestampedRecommendation{{currentReplicas, time.Now()}}
- }
- }
- func (a *HorizontalController) reconcileAutoscaler(hpav1Shared *autoscalingv1.HorizontalPodAutoscaler, key string) error {
- // make a copy so that we never mutate the shared informer cache (conversion can mutate the object)
- hpav1 := hpav1Shared.DeepCopy()
- // then, convert to autoscaling/v2, which makes our lives easier when calculating metrics
- hpaRaw, err := unsafeConvertToVersionVia(hpav1, autoscalingv2.SchemeGroupVersion)
- if err != nil {
- a.eventRecorder.Event(hpav1, v1.EventTypeWarning, "FailedConvertHPA", err.Error())
- return fmt.Errorf("failed to convert the given HPA to %s: %v", autoscalingv2.SchemeGroupVersion.String(), err)
- }
- hpa := hpaRaw.(*autoscalingv2.HorizontalPodAutoscaler)
- hpaStatusOriginal := hpa.Status.DeepCopy()
- reference := fmt.Sprintf("%s/%s/%s", hpa.Spec.ScaleTargetRef.Kind, hpa.Namespace, hpa.Spec.ScaleTargetRef.Name)
- targetGV, err := schema.ParseGroupVersion(hpa.Spec.ScaleTargetRef.APIVersion)
- if err != nil {
- a.eventRecorder.Event(hpa, v1.EventTypeWarning, "FailedGetScale", err.Error())
- setCondition(hpa, autoscalingv2.AbleToScale, v1.ConditionFalse, "FailedGetScale", "the HPA controller was unable to get the target's current scale: %v", err)
- a.updateStatusIfNeeded(hpaStatusOriginal, hpa)
- return fmt.Errorf("invalid API version in scale target reference: %v", err)
- }
- targetGK := schema.GroupKind{
- Group: targetGV.Group,
- Kind: hpa.Spec.ScaleTargetRef.Kind,
- }
- mappings, err := a.mapper.RESTMappings(targetGK)
- if err != nil {
- a.eventRecorder.Event(hpa, v1.EventTypeWarning, "FailedGetScale", err.Error())
- setCondition(hpa, autoscalingv2.AbleToScale, v1.ConditionFalse, "FailedGetScale", "the HPA controller was unable to get the target's current scale: %v", err)
- a.updateStatusIfNeeded(hpaStatusOriginal, hpa)
- return fmt.Errorf("unable to determine resource for scale target reference: %v", err)
- }
- scale, targetGR, err := a.scaleForResourceMappings(hpa.Namespace, hpa.Spec.ScaleTargetRef.Name, mappings)
- if err != nil {
- a.eventRecorder.Event(hpa, v1.EventTypeWarning, "FailedGetScale", err.Error())
- setCondition(hpa, autoscalingv2.AbleToScale, v1.ConditionFalse, "FailedGetScale", "the HPA controller was unable to get the target's current scale: %v", err)
- a.updateStatusIfNeeded(hpaStatusOriginal, hpa)
- return fmt.Errorf("failed to query scale subresource for %s: %v", reference, err)
- }
- setCondition(hpa, autoscalingv2.AbleToScale, v1.ConditionTrue, "SucceededGetScale", "the HPA controller was able to get the target's current scale")
- currentReplicas := scale.Spec.Replicas
- a.recordInitialRecommendation(currentReplicas, key)
- var (
- metricStatuses []autoscalingv2.MetricStatus
- metricDesiredReplicas int32
- metricName string
- )
- desiredReplicas := int32(0)
- rescaleReason := ""
- rescale := true
- if scale.Spec.Replicas == 0 {
- // Autoscaling is disabled for this resource
- desiredReplicas = 0
- rescale = false
- setCondition(hpa, autoscalingv2.ScalingActive, v1.ConditionFalse, "ScalingDisabled", "scaling is disabled since the replica count of the target is zero")
- } else if currentReplicas > hpa.Spec.MaxReplicas {
- rescaleReason = "Current number of replicas above Spec.MaxReplicas"
- desiredReplicas = hpa.Spec.MaxReplicas
- } else if hpa.Spec.MinReplicas != nil && currentReplicas < *hpa.Spec.MinReplicas {
- rescaleReason = "Current number of replicas below Spec.MinReplicas"
- desiredReplicas = *hpa.Spec.MinReplicas
- } else if currentReplicas == 0 {
- rescaleReason = "Current number of replicas must be greater than 0"
- desiredReplicas = 1
- } else {
- var metricTimestamp time.Time
- metricDesiredReplicas, metricName, metricStatuses, metricTimestamp, err = a.computeReplicasForMetrics(hpa, scale, hpa.Spec.Metrics)
- if err != nil {
- a.setCurrentReplicasInStatus(hpa, currentReplicas)
- if err := a.updateStatusIfNeeded(hpaStatusOriginal, hpa); err != nil {
- utilruntime.HandleError(err)
- }
- a.eventRecorder.Event(hpa, v1.EventTypeWarning, "FailedComputeMetricsReplicas", err.Error())
- return fmt.Errorf("failed to compute desired number of replicas based on listed metrics for %s: %v", reference, err)
- }
- klog.V(4).Infof("proposing %v desired replicas (based on %s from %s) for %s", metricDesiredReplicas, metricName, metricTimestamp, reference)
- rescaleMetric := ""
- if metricDesiredReplicas > desiredReplicas {
- desiredReplicas = metricDesiredReplicas
- rescaleMetric = metricName
- }
- if desiredReplicas > currentReplicas {
- rescaleReason = fmt.Sprintf("%s above target", rescaleMetric)
- }
- if desiredReplicas < currentReplicas {
- rescaleReason = "All metrics below target"
- }
- desiredReplicas = a.normalizeDesiredReplicas(hpa, key, currentReplicas, desiredReplicas)
- rescale = desiredReplicas != currentReplicas
- }
- if rescale {
- scale.Spec.Replicas = desiredReplicas
- _, err = a.scaleNamespacer.Scales(hpa.Namespace).Update(targetGR, scale)
- if err != nil {
- a.eventRecorder.Eventf(hpa, v1.EventTypeWarning, "FailedRescale", "New size: %d; reason: %s; error: %v", desiredReplicas, rescaleReason, err.Error())
- setCondition(hpa, autoscalingv2.AbleToScale, v1.ConditionFalse, "FailedUpdateScale", "the HPA controller was unable to update the target scale: %v", err)
- a.setCurrentReplicasInStatus(hpa, currentReplicas)
- if err := a.updateStatusIfNeeded(hpaStatusOriginal, hpa); err != nil {
- utilruntime.HandleError(err)
- }
- return fmt.Errorf("failed to rescale %s: %v", reference, err)
- }
- setCondition(hpa, autoscalingv2.AbleToScale, v1.ConditionTrue, "SucceededRescale", "the HPA controller was able to update the target scale to %d", desiredReplicas)
- a.eventRecorder.Eventf(hpa, v1.EventTypeNormal, "SuccessfulRescale", "New size: %d; reason: %s", desiredReplicas, rescaleReason)
- klog.Infof("Successful rescale of %s, old size: %d, new size: %d, reason: %s",
- hpa.Name, currentReplicas, desiredReplicas, rescaleReason)
- } else {
- klog.V(4).Infof("decided not to scale %s to %v (last scale time was %s)", reference, desiredReplicas, hpa.Status.LastScaleTime)
- desiredReplicas = currentReplicas
- }
- a.setStatus(hpa, currentReplicas, desiredReplicas, metricStatuses, rescale)
- return a.updateStatusIfNeeded(hpaStatusOriginal, hpa)
- }
- // stabilizeRecommendation:
- // - replaces old recommendation with the newest recommendation,
- // - returns max of recommendations that are not older than downscaleStabilisationWindow.
- func (a *HorizontalController) stabilizeRecommendation(key string, prenormalizedDesiredReplicas int32) int32 {
- maxRecommendation := prenormalizedDesiredReplicas
- foundOldSample := false
- oldSampleIndex := 0
- cutoff := time.Now().Add(-a.downscaleStabilisationWindow)
- for i, rec := range a.recommendations[key] {
- if rec.timestamp.Before(cutoff) {
- foundOldSample = true
- oldSampleIndex = i
- } else if rec.recommendation > maxRecommendation {
- maxRecommendation = rec.recommendation
- }
- }
- if foundOldSample {
- a.recommendations[key][oldSampleIndex] = timestampedRecommendation{prenormalizedDesiredReplicas, time.Now()}
- } else {
- a.recommendations[key] = append(a.recommendations[key], timestampedRecommendation{prenormalizedDesiredReplicas, time.Now()})
- }
- return maxRecommendation
- }
- // normalizeDesiredReplicas takes the metrics desired replicas value and normalizes it based on the appropriate conditions (i.e. < maxReplicas, >
- // minReplicas, etc...)
- func (a *HorizontalController) normalizeDesiredReplicas(hpa *autoscalingv2.HorizontalPodAutoscaler, key string, currentReplicas int32, prenormalizedDesiredReplicas int32) int32 {
- stabilizedRecommendation := a.stabilizeRecommendation(key, prenormalizedDesiredReplicas)
- if stabilizedRecommendation != prenormalizedDesiredReplicas {
- setCondition(hpa, autoscalingv2.AbleToScale, v1.ConditionTrue, "ScaleDownStabilized", "recent recommendations were higher than current one, applying the highest recent recommendation")
- } else {
- setCondition(hpa, autoscalingv2.AbleToScale, v1.ConditionTrue, "ReadyForNewScale", "recommended size matches current size")
- }
- var minReplicas int32
- if hpa.Spec.MinReplicas != nil {
- minReplicas = *hpa.Spec.MinReplicas
- } else {
- minReplicas = 0
- }
- desiredReplicas, condition, reason := convertDesiredReplicasWithRules(currentReplicas, stabilizedRecommendation, minReplicas, hpa.Spec.MaxReplicas)
- if desiredReplicas == stabilizedRecommendation {
- setCondition(hpa, autoscalingv2.ScalingLimited, v1.ConditionFalse, condition, reason)
- } else {
- setCondition(hpa, autoscalingv2.ScalingLimited, v1.ConditionTrue, condition, reason)
- }
- return desiredReplicas
- }
- // convertDesiredReplicas performs the actual normalization, without depending on `HorizontalController` or `HorizontalPodAutoscaler`
- func convertDesiredReplicasWithRules(currentReplicas, desiredReplicas, hpaMinReplicas, hpaMaxReplicas int32) (int32, string, string) {
- var minimumAllowedReplicas int32
- var maximumAllowedReplicas int32
- var possibleLimitingCondition string
- var possibleLimitingReason string
- if hpaMinReplicas == 0 {
- minimumAllowedReplicas = 1
- possibleLimitingReason = "the desired replica count is zero"
- } else {
- minimumAllowedReplicas = hpaMinReplicas
- possibleLimitingReason = "the desired replica count is less than the minimum replica count"
- }
- // Do not upscale too much to prevent incorrect rapid increase of the number of master replicas caused by
- // bogus CPU usage report from heapster/kubelet (like in issue #32304).
- scaleUpLimit := calculateScaleUpLimit(currentReplicas)
- if hpaMaxReplicas > scaleUpLimit {
- maximumAllowedReplicas = scaleUpLimit
- possibleLimitingCondition = "ScaleUpLimit"
- possibleLimitingReason = "the desired replica count is increasing faster than the maximum scale rate"
- } else {
- maximumAllowedReplicas = hpaMaxReplicas
- possibleLimitingCondition = "TooManyReplicas"
- possibleLimitingReason = "the desired replica count is more than the maximum replica count"
- }
- if desiredReplicas < minimumAllowedReplicas {
- possibleLimitingCondition = "TooFewReplicas"
- return minimumAllowedReplicas, possibleLimitingCondition, possibleLimitingReason
- } else if desiredReplicas > maximumAllowedReplicas {
- return maximumAllowedReplicas, possibleLimitingCondition, possibleLimitingReason
- }
- return desiredReplicas, "DesiredWithinRange", "the desired count is within the acceptable range"
- }
- func calculateScaleUpLimit(currentReplicas int32) int32 {
- return int32(math.Max(scaleUpLimitFactor*float64(currentReplicas), scaleUpLimitMinimum))
- }
- // scaleForResourceMappings attempts to fetch the scale for the
- // resource with the given name and namespace, trying each RESTMapping
- // in turn until a working one is found. If none work, the first error
- // is returned. It returns both the scale, as well as the group-resource from
- // the working mapping.
- func (a *HorizontalController) scaleForResourceMappings(namespace, name string, mappings []*apimeta.RESTMapping) (*autoscalingv1.Scale, schema.GroupResource, error) {
- var firstErr error
- for i, mapping := range mappings {
- targetGR := mapping.Resource.GroupResource()
- scale, err := a.scaleNamespacer.Scales(namespace).Get(targetGR, name)
- if err == nil {
- return scale, targetGR, nil
- }
- // if this is the first error, remember it,
- // then go on and try other mappings until we find a good one
- if i == 0 {
- firstErr = err
- }
- }
- // make sure we handle an empty set of mappings
- if firstErr == nil {
- firstErr = fmt.Errorf("unrecognized resource")
- }
- return nil, schema.GroupResource{}, firstErr
- }
- // setCurrentReplicasInStatus sets the current replica count in the status of the HPA.
- func (a *HorizontalController) setCurrentReplicasInStatus(hpa *autoscalingv2.HorizontalPodAutoscaler, currentReplicas int32) {
- a.setStatus(hpa, currentReplicas, hpa.Status.DesiredReplicas, hpa.Status.CurrentMetrics, false)
- }
- // setStatus recreates the status of the given HPA, updating the current and
- // desired replicas, as well as the metric statuses
- func (a *HorizontalController) setStatus(hpa *autoscalingv2.HorizontalPodAutoscaler, currentReplicas, desiredReplicas int32, metricStatuses []autoscalingv2.MetricStatus, rescale bool) {
- hpa.Status = autoscalingv2.HorizontalPodAutoscalerStatus{
- CurrentReplicas: currentReplicas,
- DesiredReplicas: desiredReplicas,
- LastScaleTime: hpa.Status.LastScaleTime,
- CurrentMetrics: metricStatuses,
- Conditions: hpa.Status.Conditions,
- }
- if rescale {
- now := metav1.NewTime(time.Now())
- hpa.Status.LastScaleTime = &now
- }
- }
- // updateStatusIfNeeded calls updateStatus only if the status of the new HPA is not the same as the old status
- func (a *HorizontalController) updateStatusIfNeeded(oldStatus *autoscalingv2.HorizontalPodAutoscalerStatus, newHPA *autoscalingv2.HorizontalPodAutoscaler) error {
- // skip a write if we wouldn't need to update
- if apiequality.Semantic.DeepEqual(oldStatus, &newHPA.Status) {
- return nil
- }
- return a.updateStatus(newHPA)
- }
- // updateStatus actually does the update request for the status of the given HPA
- func (a *HorizontalController) updateStatus(hpa *autoscalingv2.HorizontalPodAutoscaler) error {
- // convert back to autoscalingv1
- hpaRaw, err := unsafeConvertToVersionVia(hpa, autoscalingv1.SchemeGroupVersion)
- if err != nil {
- a.eventRecorder.Event(hpa, v1.EventTypeWarning, "FailedConvertHPA", err.Error())
- return fmt.Errorf("failed to convert the given HPA to %s: %v", autoscalingv2.SchemeGroupVersion.String(), err)
- }
- hpav1 := hpaRaw.(*autoscalingv1.HorizontalPodAutoscaler)
- _, err = a.hpaNamespacer.HorizontalPodAutoscalers(hpav1.Namespace).UpdateStatus(hpav1)
- if err != nil {
- a.eventRecorder.Event(hpa, v1.EventTypeWarning, "FailedUpdateStatus", err.Error())
- return fmt.Errorf("failed to update status for %s: %v", hpa.Name, err)
- }
- klog.V(2).Infof("Successfully updated status for %s", hpa.Name)
- return nil
- }
- // unsafeConvertToVersionVia is like Scheme.UnsafeConvertToVersion, but it does so via an internal version first.
- // We use it since working with v2alpha1 is convenient here, but we want to use the v1 client (and
- // can't just use the internal version). Note that conversion mutates the object, so you need to deepcopy
- // *before* you call this if the input object came out of a shared cache.
- func unsafeConvertToVersionVia(obj runtime.Object, externalVersion schema.GroupVersion) (runtime.Object, error) {
- objInt, err := legacyscheme.Scheme.UnsafeConvertToVersion(obj, schema.GroupVersion{Group: externalVersion.Group, Version: runtime.APIVersionInternal})
- if err != nil {
- return nil, fmt.Errorf("failed to convert the given object to the internal version: %v", err)
- }
- objExt, err := legacyscheme.Scheme.UnsafeConvertToVersion(objInt, externalVersion)
- if err != nil {
- return nil, fmt.Errorf("failed to convert the given object back to the external version: %v", err)
- }
- return objExt, err
- }
- // setCondition sets the specific condition type on the given HPA to the specified value with the given reason
- // and message. The message and args are treated like a format string. The condition will be added if it is
- // not present.
- func setCondition(hpa *autoscalingv2.HorizontalPodAutoscaler, conditionType autoscalingv2.HorizontalPodAutoscalerConditionType, status v1.ConditionStatus, reason, message string, args ...interface{}) {
- hpa.Status.Conditions = setConditionInList(hpa.Status.Conditions, conditionType, status, reason, message, args...)
- }
- // setConditionInList sets the specific condition type on the given HPA to the specified value with the given
- // reason and message. The message and args are treated like a format string. The condition will be added if
- // it is not present. The new list will be returned.
- func setConditionInList(inputList []autoscalingv2.HorizontalPodAutoscalerCondition, conditionType autoscalingv2.HorizontalPodAutoscalerConditionType, status v1.ConditionStatus, reason, message string, args ...interface{}) []autoscalingv2.HorizontalPodAutoscalerCondition {
- resList := inputList
- var existingCond *autoscalingv2.HorizontalPodAutoscalerCondition
- for i, condition := range resList {
- if condition.Type == conditionType {
- // can't take a pointer to an iteration variable
- existingCond = &resList[i]
- break
- }
- }
- if existingCond == nil {
- resList = append(resList, autoscalingv2.HorizontalPodAutoscalerCondition{
- Type: conditionType,
- })
- existingCond = &resList[len(resList)-1]
- }
- if existingCond.Status != status {
- existingCond.LastTransitionTime = metav1.Now()
- }
- existingCond.Status = status
- existingCond.Reason = reason
- existingCond.Message = fmt.Sprintf(message, args...)
- return resList
- }
|