Skip to content

Commit ea31a09

Browse files
committed
apps: deployment config stuck in the new state should respect timeoutSeconds
1 parent 05d2e14 commit ea31a09

File tree

4 files changed

+166
-0
lines changed

4 files changed

+166
-0
lines changed

pkg/apps/apis/apps/types.go

+1
Original file line numberDiff line numberDiff line change
@@ -113,6 +113,7 @@ const (
113113
DeploymentCancelledNewerDeploymentExists = "newer deployment was found running"
114114
DeploymentFailedUnrelatedDeploymentExists = "unrelated pod with the same name as this deployment is already running"
115115
DeploymentFailedDeployerPodNoLongerExists = "deployer pod no longer exists"
116+
DeploymentFailedUnableToCreateDeployerPod = "unable to create deployer pod"
116117
)
117118

118119
// DeploymentStatus describes the possible states a deployment can be in.

pkg/apps/controller/deployer/deployer_controller.go

+15
Original file line numberDiff line numberDiff line change
@@ -127,6 +127,21 @@ func (c *DeploymentController) handle(deployment *v1.ReplicationController, will
127127
}
128128
break
129129
}
130+
// In case the deployment is stuck in "new" state because we fail to create
131+
// deployer pod (quota, etc..) we should respect the timeoutSeconds in the
132+
// config strategy and transition the rollout to failed instead of waiting for
133+
// the deployment pod forever.
134+
config, err := deployutil.DecodeDeploymentConfig(deployment, c.codec)
135+
if err != nil {
136+
return err
137+
}
138+
if deployutil.RolloutExceededTimeoutSeconds(config, deployment) {
139+
nextStatus = deployapi.DeploymentStatusFailed
140+
updatedAnnotations[deployapi.DeploymentStatusReasonAnnotation] = deployapi.DeploymentFailedUnableToCreateDeployerPod
141+
c.emitDeploymentEvent(deployment, v1.EventTypeWarning, "RolloutTimeout", fmt.Sprintf("Rollout for %q failed to create deployer pod (timeoutSeconds: %ds)", deployutil.LabelForDeploymentV1(deployment), deployutil.GetTimeoutSecondsForStrategy(config)))
142+
glog.V(4).Infof("Failing deployment %s/%s as we timeout out while waiting for the deployer pod to be created", deployment.Namespace, deployment.Name)
143+
break
144+
}
130145

131146
switch {
132147
case kerrors.IsNotFound(deployerErr):

pkg/apps/util/util.go

+42
Original file line numberDiff line numberDiff line change
@@ -652,6 +652,12 @@ func IsTerminatedDeployment(deployment runtime.Object) bool {
652652
return IsCompleteDeployment(deployment) || IsFailedDeployment(deployment)
653653
}
654654

655+
// IsNewDeployment returns true if the passed deployment is in new state.
656+
func IsNewDeployment(deployment runtime.Object) bool {
657+
current := DeploymentStatusFor(deployment)
658+
return current == deployapi.DeploymentStatusNew
659+
}
660+
655661
// IsCompleteDeployment returns true if the passed deployment is in state complete.
656662
func IsCompleteDeployment(deployment runtime.Object) bool {
657663
current := DeploymentStatusFor(deployment)
@@ -782,6 +788,42 @@ func DeploymentsForCleanup(configuration *deployapi.DeploymentConfig, deployment
782788
return relevantDeployments
783789
}
784790

791+
// GetTimeoutSecondsForStrategy returns the timeout in seconds defined in the
792+
// deployment config strategy.
793+
func GetTimeoutSecondsForStrategy(config *deployapi.DeploymentConfig) int64 {
794+
var timeoutSeconds int64
795+
switch config.Spec.Strategy.Type {
796+
case deployapi.DeploymentStrategyTypeRolling:
797+
timeoutSeconds = deployapi.DefaultRollingTimeoutSeconds
798+
if t := config.Spec.Strategy.RollingParams.TimeoutSeconds; t != nil {
799+
timeoutSeconds = *t
800+
}
801+
case deployapi.DeploymentStrategyTypeRecreate:
802+
timeoutSeconds = deployapi.DefaultRecreateTimeoutSeconds
803+
if t := config.Spec.Strategy.RecreateParams.TimeoutSeconds; t != nil {
804+
timeoutSeconds = *t
805+
}
806+
case deployapi.DeploymentStrategyTypeCustom:
807+
timeoutSeconds = deployapi.DefaultRecreateTimeoutSeconds
808+
}
809+
return timeoutSeconds
810+
}
811+
812+
// RolloutExceededTimeoutSeconds returns true if the current deployment exceeded
813+
// the timeoutSeconds defined for its strategy.
814+
// Note that this is different than activeDeadlineSeconds which is the timeout
815+
// set for the deployer pod. In some cases, the deployer pod cannot be created
816+
// (like quota, etc...). In that case deployer controller use this function to
817+
// measure if the created deployment (RC) exceeded the timeout.
818+
func RolloutExceededTimeoutSeconds(config *deployapi.DeploymentConfig, latestRC *v1.ReplicationController) bool {
819+
timeoutSeconds := GetTimeoutSecondsForStrategy(config)
820+
// If user set the timeoutSeconds to 0, we assume there should be no timeout.
821+
if timeoutSeconds == 0 {
822+
return false
823+
}
824+
return int64(time.Since(latestRC.CreationTimestamp.Time).Seconds()) > timeoutSeconds
825+
}
826+
785827
// WaitForRunningDeployerPod waits a given period of time until the deployer pod
786828
// for given replication controller is not running.
787829
func WaitForRunningDeployerPod(podClient kcoreclient.PodsGetter, rc *api.ReplicationController, timeout time.Duration) error {

pkg/apps/util/util_test.go

+108
Original file line numberDiff line numberDiff line change
@@ -586,3 +586,111 @@ func TestRemoveCondition(t *testing.T) {
586586
}
587587
}
588588
}
589+
590+
func TestRolloutExceededTimeoutSeconds(t *testing.T) {
591+
now := time.Now()
592+
tests := []struct {
593+
name string
594+
config func(int64) *deployapi.DeploymentConfig
595+
timeoutSeconds int64
596+
deploymentCreationTime time.Time
597+
expectTimeout bool
598+
}{
599+
// Recreate strategy with deployment running for 20s (exceeding 10s timeout)
600+
{
601+
name: "recreate timeout",
602+
config: func(timeoutSeconds int64) *deployapi.DeploymentConfig {
603+
config := deploytest.OkDeploymentConfig(1)
604+
config.Spec.Strategy.RecreateParams.TimeoutSeconds = &timeoutSeconds
605+
return config
606+
},
607+
timeoutSeconds: int64(10),
608+
deploymentCreationTime: now.Add(-20 * time.Second),
609+
expectTimeout: true,
610+
},
611+
// Recreate strategy with no timeout
612+
{
613+
name: "recreate no timeout",
614+
config: func(timeoutSeconds int64) *deployapi.DeploymentConfig {
615+
config := deploytest.OkDeploymentConfig(1)
616+
config.Spec.Strategy.RecreateParams.TimeoutSeconds = &timeoutSeconds
617+
return config
618+
},
619+
timeoutSeconds: int64(0),
620+
deploymentCreationTime: now.Add(-700 * time.Second),
621+
expectTimeout: false,
622+
},
623+
624+
// Rolling strategy with deployment running for 20s (exceeding 10s timeout)
625+
{
626+
name: "rolling timeout",
627+
config: func(timeoutSeconds int64) *deployapi.DeploymentConfig {
628+
config := deploytest.OkDeploymentConfig(1)
629+
config.Spec.Strategy = deploytest.OkRollingStrategy()
630+
config.Spec.Strategy.RollingParams.TimeoutSeconds = &timeoutSeconds
631+
return config
632+
},
633+
timeoutSeconds: int64(10),
634+
deploymentCreationTime: now.Add(-20 * time.Second),
635+
expectTimeout: true,
636+
},
637+
// Rolling strategy with deployment with no timeout specified.
638+
{
639+
name: "rolling using default timeout",
640+
config: func(timeoutSeconds int64) *deployapi.DeploymentConfig {
641+
config := deploytest.OkDeploymentConfig(1)
642+
config.Spec.Strategy = deploytest.OkRollingStrategy()
643+
config.Spec.Strategy.RollingParams.TimeoutSeconds = nil
644+
return config
645+
},
646+
deploymentCreationTime: now.Add(-20 * time.Second),
647+
expectTimeout: false,
648+
},
649+
// Recreate strategy with deployment with no timeout specified.
650+
{
651+
name: "recreate using default timeout",
652+
config: func(timeoutSeconds int64) *deployapi.DeploymentConfig {
653+
config := deploytest.OkDeploymentConfig(1)
654+
config.Spec.Strategy.RecreateParams.TimeoutSeconds = nil
655+
return config
656+
},
657+
deploymentCreationTime: now.Add(-20 * time.Second),
658+
expectTimeout: false,
659+
},
660+
// Custom strategy with deployment with no timeout specified.
661+
{
662+
name: "custom using default timeout",
663+
config: func(timeoutSeconds int64) *deployapi.DeploymentConfig {
664+
config := deploytest.OkDeploymentConfig(1)
665+
config.Spec.Strategy = deploytest.OkCustomStrategy()
666+
return config
667+
},
668+
deploymentCreationTime: now.Add(-20 * time.Second),
669+
expectTimeout: false,
670+
},
671+
// Custom strategy use default timeout exceeding it.
672+
{
673+
name: "custom using default timeout timing out",
674+
config: func(timeoutSeconds int64) *deployapi.DeploymentConfig {
675+
config := deploytest.OkDeploymentConfig(1)
676+
config.Spec.Strategy = deploytest.OkCustomStrategy()
677+
return config
678+
},
679+
deploymentCreationTime: now.Add(-700 * time.Second),
680+
expectTimeout: true,
681+
},
682+
}
683+
684+
for _, tc := range tests {
685+
config := tc.config(tc.timeoutSeconds)
686+
deployment, err := MakeDeploymentV1(config, kapi.Codecs.LegacyCodec(deployv1.SchemeGroupVersion))
687+
if err != nil {
688+
t.Fatalf("unexpected error: %v", err)
689+
}
690+
deployment.ObjectMeta.CreationTimestamp = metav1.Time{Time: tc.deploymentCreationTime}
691+
gotTimeout := RolloutExceededTimeoutSeconds(config, deployment)
692+
if tc.expectTimeout && !gotTimeout {
693+
t.Errorf("[%s]: expected timeout, but got no timeout", tc.name)
694+
}
695+
}
696+
}

0 commit comments

Comments
 (0)