2017-02-01 00:45:59 +00:00
/ *
Copyright 2016 The Kubernetes Authors .
Licensed under the Apache License , Version 2.0 ( the "License" ) ;
you may not use this file except in compliance with the License .
You may obtain a copy of the License at
http : //www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing , software
distributed under the License is distributed on an "AS IS" BASIS ,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND , either express or implied .
See the License for the specific language governing permissions and
limitations under the License .
* /
package deployment
import (
"fmt"
"reflect"
"sort"
"strconv"
"github.com/golang/glog"
"k8s.io/apimachinery/pkg/api/errors"
metav1 "k8s.io/apimachinery/pkg/apis/meta/v1"
"k8s.io/apimachinery/pkg/labels"
utilerrors "k8s.io/apimachinery/pkg/util/errors"
"k8s.io/kubernetes/pkg/api"
"k8s.io/kubernetes/pkg/api/v1"
extensions "k8s.io/kubernetes/pkg/apis/extensions/v1beta1"
"k8s.io/kubernetes/pkg/controller"
deploymentutil "k8s.io/kubernetes/pkg/controller/deployment/util"
labelsutil "k8s.io/kubernetes/pkg/util/labels"
)
// syncStatusOnly only updates Deployments Status and doesn't take any mutating actions.
func ( dc * DeploymentController ) syncStatusOnly ( deployment * extensions . Deployment ) error {
newRS , oldRSs , err := dc . getAllReplicaSetsAndSyncRevision ( deployment , false )
if err != nil {
return err
}
allRSs := append ( oldRSs , newRS )
return dc . syncDeploymentStatus ( allRSs , newRS , deployment )
}
// sync is responsible for reconciling deployments on scaling events or when they
// are paused.
func ( dc * DeploymentController ) sync ( deployment * extensions . Deployment ) error {
newRS , oldRSs , err := dc . getAllReplicaSetsAndSyncRevision ( deployment , false )
if err != nil {
return err
}
if err := dc . scale ( deployment , newRS , oldRSs ) ; err != nil {
// If we get an error while trying to scale, the deployment will be requeued
// so we can abort this resync
return err
}
allRSs := append ( oldRSs , newRS )
return dc . syncDeploymentStatus ( allRSs , newRS , deployment )
}
// checkPausedConditions checks if the given deployment is paused or not and adds an appropriate condition.
// These conditions are needed so that we won't accidentally report lack of progress for resumed deployments
// that were paused for longer than progressDeadlineSeconds.
func ( dc * DeploymentController ) checkPausedConditions ( d * extensions . Deployment ) error {
if d . Spec . ProgressDeadlineSeconds == nil {
return nil
}
cond := deploymentutil . GetDeploymentCondition ( d . Status , extensions . DeploymentProgressing )
if cond != nil && cond . Reason == deploymentutil . TimedOutReason {
// If we have reported lack of progress, do not overwrite it with a paused condition.
return nil
}
pausedCondExists := cond != nil && cond . Reason == deploymentutil . PausedDeployReason
needsUpdate := false
if d . Spec . Paused && ! pausedCondExists {
condition := deploymentutil . NewDeploymentCondition ( extensions . DeploymentProgressing , v1 . ConditionUnknown , deploymentutil . PausedDeployReason , "Deployment is paused" )
deploymentutil . SetDeploymentCondition ( & d . Status , * condition )
needsUpdate = true
} else if ! d . Spec . Paused && pausedCondExists {
condition := deploymentutil . NewDeploymentCondition ( extensions . DeploymentProgressing , v1 . ConditionUnknown , deploymentutil . ResumedDeployReason , "Deployment is resumed" )
deploymentutil . SetDeploymentCondition ( & d . Status , * condition )
needsUpdate = true
}
if ! needsUpdate {
return nil
}
var err error
d , err = dc . client . Extensions ( ) . Deployments ( d . Namespace ) . UpdateStatus ( d )
return err
}
// getAllReplicaSetsAndSyncRevision returns all the replica sets for the provided deployment (new and all old), with new RS's and deployment's revision updated.
// 1. Get all old RSes this deployment targets, and calculate the max revision number among them (maxOldV).
// 2. Get new RS this deployment targets (whose pod template matches deployment's), and update new RS's revision number to (maxOldV + 1),
// only if its revision number is smaller than (maxOldV + 1). If this step failed, we'll update it in the next deployment sync loop.
// 3. Copy new RS's revision number to deployment (update deployment's revision). If this step failed, we'll update it in the next deployment sync loop.
// Note that currently the deployment controller is using caches to avoid querying the server for reads.
// This may lead to stale reads of replica sets, thus incorrect deployment status.
func ( dc * DeploymentController ) getAllReplicaSetsAndSyncRevision ( deployment * extensions . Deployment , createIfNotExisted bool ) ( * extensions . ReplicaSet , [ ] * extensions . ReplicaSet , error ) {
// List the deployment's RSes & Pods and apply pod-template-hash info to deployment's adopted RSes/Pods
rsList , podList , err := dc . rsAndPodsWithHashKeySynced ( deployment )
if err != nil {
return nil , nil , fmt . Errorf ( "error labeling replica sets and pods with pod-template-hash: %v" , err )
}
_ , allOldRSs , err := deploymentutil . FindOldReplicaSets ( deployment , rsList , podList )
if err != nil {
return nil , nil , err
}
// Get new replica set with the updated revision number
newRS , err := dc . getNewReplicaSet ( deployment , rsList , allOldRSs , createIfNotExisted )
if err != nil {
return nil , nil , err
}
return newRS , allOldRSs , nil
}
// rsAndPodsWithHashKeySynced returns the RSes and pods the given deployment targets, with pod-template-hash information synced.
func ( dc * DeploymentController ) rsAndPodsWithHashKeySynced ( deployment * extensions . Deployment ) ( [ ] * extensions . ReplicaSet , * v1 . PodList , error ) {
rsList , err := deploymentutil . ListReplicaSets ( deployment ,
2017-02-03 13:41:32 +00:00
func ( namespace string , options metav1 . ListOptions ) ( [ ] * extensions . ReplicaSet , error ) {
2017-02-01 00:45:59 +00:00
parsed , err := labels . Parse ( options . LabelSelector )
if err != nil {
return nil , err
}
return dc . rsLister . ReplicaSets ( namespace ) . List ( parsed )
} )
if err != nil {
return nil , nil , fmt . Errorf ( "error listing ReplicaSets: %v" , err )
}
syncedRSList := [ ] * extensions . ReplicaSet { }
for _ , rs := range rsList {
// Add pod-template-hash information if it's not in the RS.
// Otherwise, new RS produced by Deployment will overlap with pre-existing ones
// that aren't constrained by the pod-template-hash.
syncedRS , err := dc . addHashKeyToRSAndPods ( rs )
if err != nil {
return nil , nil , err
}
syncedRSList = append ( syncedRSList , syncedRS )
}
syncedPodList , err := dc . listPods ( deployment )
if err != nil {
return nil , nil , err
}
return syncedRSList , syncedPodList , nil
}
// addHashKeyToRSAndPods adds pod-template-hash information to the given rs, if it's not already there, with the following steps:
// 1. Add hash label to the rs's pod template, and make sure the controller sees this update so that no orphaned pods will be created
// 2. Add hash label to all pods this rs owns, wait until replicaset controller reports rs.Status.FullyLabeledReplicas equal to the desired number of replicas
// 3. Add hash label to the rs's label and selector
func ( dc * DeploymentController ) addHashKeyToRSAndPods ( rs * extensions . ReplicaSet ) ( * extensions . ReplicaSet , error ) {
// If the rs already has the new hash label in its selector, it's done syncing
if labelsutil . SelectorHasLabel ( rs . Spec . Selector , extensions . DefaultDeploymentUniqueLabelKey ) {
return rs , nil
}
hash := deploymentutil . GetReplicaSetHash ( rs )
// 1. Add hash template label to the rs. This ensures that any newly created pods will have the new label.
updatedRS , err := deploymentutil . UpdateRSWithRetries ( dc . client . Extensions ( ) . ReplicaSets ( rs . Namespace ) , dc . rsLister , rs . Namespace , rs . Name ,
func ( updated * extensions . ReplicaSet ) error {
// Precondition: the RS doesn't contain the new hash in its pod template label.
if updated . Spec . Template . Labels [ extensions . DefaultDeploymentUniqueLabelKey ] == hash {
return utilerrors . ErrPreconditionViolated
}
updated . Spec . Template . Labels = labelsutil . AddLabel ( updated . Spec . Template . Labels , extensions . DefaultDeploymentUniqueLabelKey , hash )
return nil
} )
if err != nil {
return nil , fmt . Errorf ( "error updating replica set %s/%s pod template label with template hash: %v" , rs . Namespace , rs . Name , err )
}
// Make sure rs pod template is updated so that it won't create pods without the new label (orphaned pods).
if updatedRS . Generation > updatedRS . Status . ObservedGeneration {
if err = deploymentutil . WaitForReplicaSetUpdated ( dc . client , updatedRS . Generation , updatedRS . Namespace , updatedRS . Name ) ; err != nil {
return nil , fmt . Errorf ( "error waiting for replica set %s/%s to be observed by controller: %v" , updatedRS . Namespace , updatedRS . Name , err )
}
glog . V ( 4 ) . Infof ( "Observed the update of replica set %s/%s's pod template with hash %s." , rs . Namespace , rs . Name , hash )
}
// 2. Update all pods managed by the rs to have the new hash label, so they will be correctly adopted.
selector , err := metav1 . LabelSelectorAsSelector ( updatedRS . Spec . Selector )
if err != nil {
return nil , fmt . Errorf ( "error in converting selector to label selector for replica set %s: %s" , updatedRS . Name , err )
}
2017-02-03 13:41:32 +00:00
options := metav1 . ListOptions { LabelSelector : selector . String ( ) }
2017-02-01 00:45:59 +00:00
parsed , err := labels . Parse ( options . LabelSelector )
if err != nil {
return nil , err
}
pods , err := dc . podLister . Pods ( updatedRS . Namespace ) . List ( parsed )
if err != nil {
return nil , fmt . Errorf ( "error in getting pod list for namespace %s and list options %+v: %s" , rs . Namespace , options , err )
}
podList := v1 . PodList { Items : make ( [ ] v1 . Pod , 0 , len ( pods ) ) }
for i := range pods {
podList . Items = append ( podList . Items , * pods [ i ] )
}
if err := deploymentutil . LabelPodsWithHash ( & podList , dc . client , dc . podLister , rs . Namespace , rs . Name , hash ) ; err != nil {
return nil , fmt . Errorf ( "error in adding template hash label %s to pods %+v: %s" , hash , podList , err )
}
// We need to wait for the replicaset controller to observe the pods being
// labeled with pod template hash. Because previously we've called
// WaitForReplicaSetUpdated, the replicaset controller should have dropped
// FullyLabeledReplicas to 0 already, we only need to wait it to increase
// back to the number of replicas in the spec.
if err := deploymentutil . WaitForPodsHashPopulated ( dc . client , updatedRS . Generation , updatedRS . Namespace , updatedRS . Name ) ; err != nil {
return nil , fmt . Errorf ( "Replica set %s/%s: error waiting for replicaset controller to observe pods being labeled with template hash: %v" , updatedRS . Namespace , updatedRS . Name , err )
}
// 3. Update rs label and selector to include the new hash label
// Copy the old selector, so that we can scrub out any orphaned pods
updatedRS , err = deploymentutil . UpdateRSWithRetries ( dc . client . Extensions ( ) . ReplicaSets ( rs . Namespace ) , dc . rsLister , rs . Namespace , rs . Name , func ( updated * extensions . ReplicaSet ) error {
// Precondition: the RS doesn't contain the new hash in its label and selector.
if updated . Labels [ extensions . DefaultDeploymentUniqueLabelKey ] == hash && updated . Spec . Selector . MatchLabels [ extensions . DefaultDeploymentUniqueLabelKey ] == hash {
return utilerrors . ErrPreconditionViolated
}
updated . Labels = labelsutil . AddLabel ( updated . Labels , extensions . DefaultDeploymentUniqueLabelKey , hash )
updated . Spec . Selector = labelsutil . AddLabelToSelector ( updated . Spec . Selector , extensions . DefaultDeploymentUniqueLabelKey , hash )
return nil
} )
// If the RS isn't actually updated, that's okay, we'll retry in the
// next sync loop since its selector isn't updated yet.
if err != nil {
return nil , fmt . Errorf ( "error updating ReplicaSet %s/%s label and selector with template hash: %v" , updatedRS . Namespace , updatedRS . Name , err )
}
// TODO: look for orphaned pods and label them in the background somewhere else periodically
return updatedRS , nil
}
func ( dc * DeploymentController ) listPods ( deployment * extensions . Deployment ) ( * v1 . PodList , error ) {
return deploymentutil . ListPods ( deployment ,
2017-02-03 13:41:32 +00:00
func ( namespace string , options metav1 . ListOptions ) ( * v1 . PodList , error ) {
2017-02-01 00:45:59 +00:00
parsed , err := labels . Parse ( options . LabelSelector )
if err != nil {
return nil , err
}
pods , err := dc . podLister . Pods ( namespace ) . List ( parsed )
result := v1 . PodList { Items : make ( [ ] v1 . Pod , 0 , len ( pods ) ) }
for i := range pods {
result . Items = append ( result . Items , * pods [ i ] )
}
return & result , err
} )
}
// Returns a replica set that matches the intent of the given deployment. Returns nil if the new replica set doesn't exist yet.
// 1. Get existing new RS (the RS that the given deployment targets, whose pod template is the same as deployment's).
// 2. If there's existing new RS, update its revision number if it's smaller than (maxOldRevision + 1), where maxOldRevision is the max revision number among all old RSes.
// 3. If there's no existing new RS and createIfNotExisted is true, create one with appropriate revision number (maxOldRevision + 1) and replicas.
// Note that the pod-template-hash will be added to adopted RSes and pods.
func ( dc * DeploymentController ) getNewReplicaSet ( deployment * extensions . Deployment , rsList , oldRSs [ ] * extensions . ReplicaSet , createIfNotExisted bool ) ( * extensions . ReplicaSet , error ) {
existingNewRS , err := deploymentutil . FindNewReplicaSet ( deployment , rsList )
if err != nil {
return nil , err
}
// Calculate the max revision number among all old RSes
maxOldRevision := deploymentutil . MaxRevision ( oldRSs )
// Calculate revision number for this new replica set
newRevision := strconv . FormatInt ( maxOldRevision + 1 , 10 )
// Latest replica set exists. We need to sync its annotations (includes copying all but
// annotationsToSkip from the parent deployment, and update revision, desiredReplicas,
// and maxReplicas) and also update the revision annotation in the deployment with the
// latest revision.
if existingNewRS != nil {
objCopy , err := api . Scheme . Copy ( existingNewRS )
if err != nil {
return nil , err
}
rsCopy := objCopy . ( * extensions . ReplicaSet )
// Set existing new replica set's annotation
annotationsUpdated := deploymentutil . SetNewReplicaSetAnnotations ( deployment , rsCopy , newRevision , true )
minReadySecondsNeedsUpdate := rsCopy . Spec . MinReadySeconds != deployment . Spec . MinReadySeconds
if annotationsUpdated || minReadySecondsNeedsUpdate {
rsCopy . Spec . MinReadySeconds = deployment . Spec . MinReadySeconds
return dc . client . Extensions ( ) . ReplicaSets ( rsCopy . ObjectMeta . Namespace ) . Update ( rsCopy )
}
updateConditions := deploymentutil . SetDeploymentRevision ( deployment , newRevision )
// If no other Progressing condition has been recorded and we need to estimate the progress
// of this deployment then it is likely that old users started caring about progress. In that
// case we need to take into account the first time we noticed their new replica set.
cond := deploymentutil . GetDeploymentCondition ( deployment . Status , extensions . DeploymentProgressing )
if deployment . Spec . ProgressDeadlineSeconds != nil && cond == nil {
msg := fmt . Sprintf ( "Found new replica set %q" , rsCopy . Name )
condition := deploymentutil . NewDeploymentCondition ( extensions . DeploymentProgressing , v1 . ConditionTrue , deploymentutil . FoundNewRSReason , msg )
deploymentutil . SetDeploymentCondition ( & deployment . Status , * condition )
updateConditions = true
}
if updateConditions {
if deployment , err = dc . client . Extensions ( ) . Deployments ( deployment . Namespace ) . UpdateStatus ( deployment ) ; err != nil {
return nil , err
}
}
return rsCopy , nil
}
if ! createIfNotExisted {
return nil , nil
}
// new ReplicaSet does not exist, create one.
namespace := deployment . Namespace
podTemplateSpecHash := fmt . Sprintf ( "%d" , deploymentutil . GetPodTemplateSpecHash ( deployment . Spec . Template ) )
newRSTemplate := deploymentutil . GetNewReplicaSetTemplate ( deployment )
newRSTemplate . Labels = labelsutil . CloneAndAddLabel ( deployment . Spec . Template . Labels , extensions . DefaultDeploymentUniqueLabelKey , podTemplateSpecHash )
// Add podTemplateHash label to selector.
newRSSelector := labelsutil . CloneSelectorAndAddLabel ( deployment . Spec . Selector , extensions . DefaultDeploymentUniqueLabelKey , podTemplateSpecHash )
// Create new ReplicaSet
newRS := extensions . ReplicaSet {
2017-02-03 13:41:32 +00:00
ObjectMeta : metav1 . ObjectMeta {
2017-02-01 00:45:59 +00:00
// Make the name deterministic, to ensure idempotence
Name : deployment . Name + "-" + podTemplateSpecHash ,
Namespace : namespace ,
} ,
Spec : extensions . ReplicaSetSpec {
Replicas : func ( i int32 ) * int32 { return & i } ( 0 ) ,
MinReadySeconds : deployment . Spec . MinReadySeconds ,
Selector : newRSSelector ,
Template : newRSTemplate ,
} ,
}
var trueVar = true
controllerRef := & metav1 . OwnerReference {
APIVersion : getDeploymentKind ( ) . GroupVersion ( ) . String ( ) ,
Kind : getDeploymentKind ( ) . Kind ,
Name : deployment . Name ,
UID : deployment . UID ,
Controller : & trueVar ,
}
newRS . OwnerReferences = append ( newRS . OwnerReferences , * controllerRef )
allRSs := append ( oldRSs , & newRS )
newReplicasCount , err := deploymentutil . NewRSNewReplicas ( deployment , allRSs , & newRS )
if err != nil {
return nil , err
}
* ( newRS . Spec . Replicas ) = newReplicasCount
// Set new replica set's annotation
deploymentutil . SetNewReplicaSetAnnotations ( deployment , & newRS , newRevision , false )
createdRS , err := dc . client . Extensions ( ) . ReplicaSets ( namespace ) . Create ( & newRS )
switch {
// We may end up hitting this due to a slow cache or a fast resync of the deployment.
// TODO: Restore once https://github.com/kubernetes/kubernetes/issues/29735 is fixed
// ie. we start using a new hashing algorithm.
case errors . IsAlreadyExists ( err ) :
return nil , err
// return dc.rsLister.ReplicaSets(namespace).Get(newRS.Name)
case err != nil :
msg := fmt . Sprintf ( "Failed to create new replica set %q: %v" , newRS . Name , err )
if deployment . Spec . ProgressDeadlineSeconds != nil {
cond := deploymentutil . NewDeploymentCondition ( extensions . DeploymentProgressing , v1 . ConditionFalse , deploymentutil . FailedRSCreateReason , msg )
deploymentutil . SetDeploymentCondition ( & deployment . Status , * cond )
// We don't really care about this error at this point, since we have a bigger issue to report.
// TODO: Update the rest of the Deployment status, too. We may need to do this every time we
// error out in all other places in the controller so that we let users know that their deployments
// have been noticed by the controller, albeit with errors.
// TODO: Identify which errors are permanent and switch DeploymentIsFailed to take into account
// these reasons as well. Related issue: https://github.com/kubernetes/kubernetes/issues/18568
_ , _ = dc . client . Extensions ( ) . Deployments ( deployment . ObjectMeta . Namespace ) . UpdateStatus ( deployment )
}
dc . eventRecorder . Eventf ( deployment , v1 . EventTypeWarning , deploymentutil . FailedRSCreateReason , msg )
return nil , err
}
if newReplicasCount > 0 {
dc . eventRecorder . Eventf ( deployment , v1 . EventTypeNormal , "ScalingReplicaSet" , "Scaled up replica set %s to %d" , createdRS . Name , newReplicasCount )
}
deploymentutil . SetDeploymentRevision ( deployment , newRevision )
if deployment . Spec . ProgressDeadlineSeconds != nil {
msg := fmt . Sprintf ( "Created new replica set %q" , createdRS . Name )
condition := deploymentutil . NewDeploymentCondition ( extensions . DeploymentProgressing , v1 . ConditionTrue , deploymentutil . NewReplicaSetReason , msg )
deploymentutil . SetDeploymentCondition ( & deployment . Status , * condition )
}
_ , err = dc . client . Extensions ( ) . Deployments ( deployment . Namespace ) . UpdateStatus ( deployment )
return createdRS , err
}
// scale scales proportionally in order to mitigate risk. Otherwise, scaling up can increase the size
// of the new replica set and scaling down can decrease the sizes of the old ones, both of which would
// have the effect of hastening the rollout progress, which could produce a higher proportion of unavailable
// replicas in the event of a problem with the rolled out template. Should run only on scaling events or
// when a deployment is paused and not during the normal rollout process.
func ( dc * DeploymentController ) scale ( deployment * extensions . Deployment , newRS * extensions . ReplicaSet , oldRSs [ ] * extensions . ReplicaSet ) error {
// If there is only one active replica set then we should scale that up to the full count of the
// deployment. If there is no active replica set, then we should scale up the newest replica set.
if activeOrLatest := deploymentutil . FindActiveOrLatest ( newRS , oldRSs ) ; activeOrLatest != nil {
if * ( activeOrLatest . Spec . Replicas ) == * ( deployment . Spec . Replicas ) {
return nil
}
_ , _ , err := dc . scaleReplicaSetAndRecordEvent ( activeOrLatest , * ( deployment . Spec . Replicas ) , deployment )
return err
}
// If the new replica set is saturated, old replica sets should be fully scaled down.
// This case handles replica set adoption during a saturated new replica set.
if deploymentutil . IsSaturated ( deployment , newRS ) {
for _ , old := range controller . FilterActiveReplicaSets ( oldRSs ) {
if _ , _ , err := dc . scaleReplicaSetAndRecordEvent ( old , 0 , deployment ) ; err != nil {
return err
}
}
return nil
}
// There are old replica sets with pods and the new replica set is not saturated.
// We need to proportionally scale all replica sets (new and old) in case of a
// rolling deployment.
if deploymentutil . IsRollingUpdate ( deployment ) {
allRSs := controller . FilterActiveReplicaSets ( append ( oldRSs , newRS ) )
allRSsReplicas := deploymentutil . GetReplicaCountForReplicaSets ( allRSs )
allowedSize := int32 ( 0 )
if * ( deployment . Spec . Replicas ) > 0 {
allowedSize = * ( deployment . Spec . Replicas ) + deploymentutil . MaxSurge ( * deployment )
}
// Number of additional replicas that can be either added or removed from the total
// replicas count. These replicas should be distributed proportionally to the active
// replica sets.
deploymentReplicasToAdd := allowedSize - allRSsReplicas
// The additional replicas should be distributed proportionally amongst the active
// replica sets from the larger to the smaller in size replica set. Scaling direction
// drives what happens in case we are trying to scale replica sets of the same size.
// In such a case when scaling up, we should scale up newer replica sets first, and
// when scaling down, we should scale down older replica sets first.
var scalingOperation string
switch {
case deploymentReplicasToAdd > 0 :
sort . Sort ( controller . ReplicaSetsBySizeNewer ( allRSs ) )
scalingOperation = "up"
case deploymentReplicasToAdd < 0 :
sort . Sort ( controller . ReplicaSetsBySizeOlder ( allRSs ) )
scalingOperation = "down"
}
// Iterate over all active replica sets and estimate proportions for each of them.
// The absolute value of deploymentReplicasAdded should never exceed the absolute
// value of deploymentReplicasToAdd.
deploymentReplicasAdded := int32 ( 0 )
nameToSize := make ( map [ string ] int32 )
for i := range allRSs {
rs := allRSs [ i ]
// Estimate proportions if we have replicas to add, otherwise simply populate
// nameToSize with the current sizes for each replica set.
if deploymentReplicasToAdd != 0 {
proportion := deploymentutil . GetProportion ( rs , * deployment , deploymentReplicasToAdd , deploymentReplicasAdded )
nameToSize [ rs . Name ] = * ( rs . Spec . Replicas ) + proportion
deploymentReplicasAdded += proportion
} else {
nameToSize [ rs . Name ] = * ( rs . Spec . Replicas )
}
}
// Update all replica sets
for i := range allRSs {
rs := allRSs [ i ]
// Add/remove any leftovers to the largest replica set.
if i == 0 && deploymentReplicasToAdd != 0 {
leftover := deploymentReplicasToAdd - deploymentReplicasAdded
nameToSize [ rs . Name ] = nameToSize [ rs . Name ] + leftover
if nameToSize [ rs . Name ] < 0 {
nameToSize [ rs . Name ] = 0
}
}
// TODO: Use transactions when we have them.
if _ , _ , err := dc . scaleReplicaSet ( rs , nameToSize [ rs . Name ] , deployment , scalingOperation ) ; err != nil {
// Return as soon as we fail, the deployment is requeued
return err
}
}
}
return nil
}
func ( dc * DeploymentController ) scaleReplicaSetAndRecordEvent ( rs * extensions . ReplicaSet , newScale int32 , deployment * extensions . Deployment ) ( bool , * extensions . ReplicaSet , error ) {
// No need to scale
if * ( rs . Spec . Replicas ) == newScale {
return false , rs , nil
}
var scalingOperation string
if * ( rs . Spec . Replicas ) < newScale {
scalingOperation = "up"
} else {
scalingOperation = "down"
}
scaled , newRS , err := dc . scaleReplicaSet ( rs , newScale , deployment , scalingOperation )
return scaled , newRS , err
}
func ( dc * DeploymentController ) scaleReplicaSet ( rs * extensions . ReplicaSet , newScale int32 , deployment * extensions . Deployment , scalingOperation string ) ( bool , * extensions . ReplicaSet , error ) {
objCopy , err := api . Scheme . Copy ( rs )
if err != nil {
return false , nil , err
}
rsCopy := objCopy . ( * extensions . ReplicaSet )
sizeNeedsUpdate := * ( rsCopy . Spec . Replicas ) != newScale
// TODO: Do not mutate the replica set here, instead simply compare the annotation and if they mismatch
// call SetReplicasAnnotations inside the following if clause. Then we can also move the deep-copy from
// above inside the if too.
annotationsNeedUpdate := deploymentutil . SetReplicasAnnotations ( rsCopy , * ( deployment . Spec . Replicas ) , * ( deployment . Spec . Replicas ) + deploymentutil . MaxSurge ( * deployment ) )
scaled := false
if sizeNeedsUpdate || annotationsNeedUpdate {
* ( rsCopy . Spec . Replicas ) = newScale
rs , err = dc . client . Extensions ( ) . ReplicaSets ( rsCopy . Namespace ) . Update ( rsCopy )
if err == nil && sizeNeedsUpdate {
scaled = true
dc . eventRecorder . Eventf ( deployment , v1 . EventTypeNormal , "ScalingReplicaSet" , "Scaled %s replica set %s to %d" , scalingOperation , rs . Name , newScale )
}
}
return scaled , rs , err
}
// cleanupDeployment is responsible for cleaning up a deployment ie. retains all but the latest N old replica sets
// where N=d.Spec.RevisionHistoryLimit. Old replica sets are older versions of the podtemplate of a deployment kept
// around by default 1) for historical reasons and 2) for the ability to rollback a deployment.
func ( dc * DeploymentController ) cleanupDeployment ( oldRSs [ ] * extensions . ReplicaSet , deployment * extensions . Deployment ) error {
if deployment . Spec . RevisionHistoryLimit == nil {
return nil
}
diff := int32 ( len ( oldRSs ) ) - * deployment . Spec . RevisionHistoryLimit
if diff <= 0 {
return nil
}
sort . Sort ( controller . ReplicaSetsByCreationTimestamp ( oldRSs ) )
var errList [ ] error
// TODO: This should be parallelized.
for i := int32 ( 0 ) ; i < diff ; i ++ {
rs := oldRSs [ i ]
// Avoid delete replica set with non-zero replica counts
if rs . Status . Replicas != 0 || * ( rs . Spec . Replicas ) != 0 || rs . Generation > rs . Status . ObservedGeneration {
continue
}
if err := dc . client . Extensions ( ) . ReplicaSets ( rs . Namespace ) . Delete ( rs . Name , nil ) ; err != nil && ! errors . IsNotFound ( err ) {
glog . V ( 2 ) . Infof ( "Failed deleting old replica set %v for deployment %v: %v" , rs . Name , deployment . Name , err )
errList = append ( errList , err )
}
}
return utilerrors . NewAggregate ( errList )
}
// syncDeploymentStatus checks if the status is up-to-date and sync it if necessary
func ( dc * DeploymentController ) syncDeploymentStatus ( allRSs [ ] * extensions . ReplicaSet , newRS * extensions . ReplicaSet , d * extensions . Deployment ) error {
newStatus := calculateStatus ( allRSs , newRS , d )
if reflect . DeepEqual ( d . Status , newStatus ) {
return nil
}
newDeployment := d
newDeployment . Status = newStatus
_ , err := dc . client . Extensions ( ) . Deployments ( newDeployment . Namespace ) . UpdateStatus ( newDeployment )
return err
}
// calculateStatus calculates the latest status for the provided deployment by looking into the provided replica sets.
func calculateStatus ( allRSs [ ] * extensions . ReplicaSet , newRS * extensions . ReplicaSet , deployment * extensions . Deployment ) extensions . DeploymentStatus {
availableReplicas := deploymentutil . GetAvailableReplicaCountForReplicaSets ( allRSs )
totalReplicas := deploymentutil . GetReplicaCountForReplicaSets ( allRSs )
unavailableReplicas := totalReplicas - availableReplicas
// If unavailableReplicas is negative, then that means the Deployment has more available replicas running than
// desired, eg. whenever it scales down. In such a case we should simply default unavailableReplicas to zero.
if unavailableReplicas < 0 {
unavailableReplicas = 0
}
status := extensions . DeploymentStatus {
// TODO: Ensure that if we start retrying status updates, we won't pick up a new Generation value.
ObservedGeneration : deployment . Generation ,
Replicas : deploymentutil . GetActualReplicaCountForReplicaSets ( allRSs ) ,
UpdatedReplicas : deploymentutil . GetActualReplicaCountForReplicaSets ( [ ] * extensions . ReplicaSet { newRS } ) ,
ReadyReplicas : deploymentutil . GetReadyReplicaCountForReplicaSets ( allRSs ) ,
AvailableReplicas : availableReplicas ,
UnavailableReplicas : unavailableReplicas ,
}
// Copy conditions one by one so we won't mutate the original object.
conditions := deployment . Status . Conditions
for i := range conditions {
status . Conditions = append ( status . Conditions , conditions [ i ] )
}
if availableReplicas >= * ( deployment . Spec . Replicas ) - deploymentutil . MaxUnavailable ( * deployment ) {
minAvailability := deploymentutil . NewDeploymentCondition ( extensions . DeploymentAvailable , v1 . ConditionTrue , deploymentutil . MinimumReplicasAvailable , "Deployment has minimum availability." )
deploymentutil . SetDeploymentCondition ( & status , * minAvailability )
} else {
noMinAvailability := deploymentutil . NewDeploymentCondition ( extensions . DeploymentAvailable , v1 . ConditionFalse , deploymentutil . MinimumReplicasUnavailable , "Deployment does not have minimum availability." )
deploymentutil . SetDeploymentCondition ( & status , * noMinAvailability )
}
return status
}
// isScalingEvent checks whether the provided deployment has been updated with a scaling event
// by looking at the desired-replicas annotation in the active replica sets of the deployment.
func ( dc * DeploymentController ) isScalingEvent ( d * extensions . Deployment ) ( bool , error ) {
newRS , oldRSs , err := dc . getAllReplicaSetsAndSyncRevision ( d , false )
if err != nil {
return false , err
}
allRSs := append ( oldRSs , newRS )
for _ , rs := range controller . FilterActiveReplicaSets ( allRSs ) {
desired , ok := deploymentutil . GetDesiredReplicasAnnotation ( rs )
if ! ok {
continue
}
if desired != * ( d . Spec . Replicas ) {
return true , nil
}
}
return false , nil
}