WIP: Job: calculate the job completion before calculating the activeDeadlineSeconds #121863

Open: wants to merge 3 commits into master

109 changes: 65 additions & 44 deletions pkg/controller/job/job_controller.go
@@ -855,12 +855,6 @@ func (jm *Controller) syncJob(ctx context.Context, key string) (rErr error) {
// check if the number of pod restart exceeds backoff (for restart OnFailure only)
// OR if the number of failed jobs increased since the last syncJob
jobCtx.finishedCondition = newCondition(batch.JobFailed, v1.ConditionTrue, batch.JobReasonBackoffLimitExceeded, "Job has reached the specified backoff limit", jm.clock.Now())
} else if jm.pastActiveDeadline(&job) {
jobCtx.finishedCondition = newCondition(batch.JobFailed, v1.ConditionTrue, batch.JobReasonDeadlineExceeded, "Job was active longer than specified deadline", jm.clock.Now())
} else if job.Spec.ActiveDeadlineSeconds != nil && !jobSuspended(&job) {
syncDuration := time.Duration(*job.Spec.ActiveDeadlineSeconds)*time.Second - jm.clock.Since(job.Status.StartTime.Time)
logger.V(2).Info("Job has activeDeadlineSeconds configuration. Will sync this job again", "key", key, "nextSyncIn", syncDuration)
jm.queue.AddAfter(key, syncDuration)
}
}

@@ -884,6 +878,41 @@ func (jm *Controller) syncJob(ctx context.Context, key string) (rErr error) {
}
}
}

complete := false
if jobCtx.finishedCondition == nil {
if job.Spec.Completions == nil {
// This type of job is complete when any pod exits with success.
// Each pod is capable of
// determining whether or not the entire Job is done. Subsequent pods are
// not expected to fail, but if they do, the failure is ignored. Once any
// pod succeeds, the controller waits for remaining pods to finish, and
// then the job is complete.
complete = jobCtx.succeeded > 0 && active == 0
} else {
// If job is scaled down and the number of succeeded pods already reached completions,
// job should be marked as complete here.
wantActive := active
if feature.DefaultFeatureGate.Enabled(features.ElasticIndexedJob) && satisfiedExpectations && job.DeletionTimestamp == nil {
Contributor:
Do we need this if? Maybe, if needed, it could be inside the wantActivePods function?

Member Author:
I think we should keep this if here, since wantActivePods is also called at L1478.
@mimowo WDYT?

Member Author:
@mimowo Friendly ping :)

Contributor:
My question is motivated by the fact that these two code paths could end up setting different values for wantActive. For example, if satisfiedExpectations == false, feature.DefaultFeatureGate.Enabled(features.ElasticIndexedJob) == true, and job.DeletionTimestamp == nil, you will have wantActive = active here, but wantActive = wantActivePods(&job, jobCtx) inside manageJob.

I'm wondering if we can / should avoid that. No specific failure scenario at the moment.

Member Author (@tenzen-y, Nov 30, 2023):
Ah, you're right. If we need this if, we should move the check inside wantActivePods(). Thanks!
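// Editor's sketch of the refactor floated in this thread: moving the
// ElasticIndexedJob/expectations/deletion guard inside the helper so that syncJob and
// manageJob cannot compute different wantActive values. This is illustrative only; the
// extra satisfiedExpectations parameter and the name wantActivePodsOrObserved are
// hypothetical, and the snippet assumes job_controller.go's existing imports and types.
func wantActivePodsOrObserved(job *batch.Job, jobCtx *syncJobCtx, satisfiedExpectations bool) int32 {
	// Mirror the guard used at the syncJob call site above: fall back to the observed
	// active count while the job is being deleted or expectations are not yet satisfied.
	if !feature.DefaultFeatureGate.Enabled(features.ElasticIndexedJob) ||
		!satisfiedExpectations || job.DeletionTimestamp != nil {
		return int32(len(jobCtx.activePods))
	}
	return wantActivePods(job, jobCtx)
}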

wantActive = wantActivePods(&job, jobCtx)
}
// Job specifies a number of completions. This type of job signals
// success by having that number of successes. Since we do not
// start more pods than there are remaining completions, there should
// not be any remaining active pods once this count is reached.
complete = jobCtx.succeeded >= *job.Spec.Completions && wantActive == 0
}
if !complete {
if jm.pastActiveDeadline(&job) {
jobCtx.finishedCondition = newCondition(batch.JobFailed, v1.ConditionTrue, batch.JobReasonDeadlineExceeded, "Job was active longer than specified deadline", jm.clock.Now())
} else if job.Spec.ActiveDeadlineSeconds != nil && !jobSuspended(&job) {
syncDuration := time.Duration(*job.Spec.ActiveDeadlineSeconds)*time.Second - jm.clock.Since(job.Status.StartTime.Time)
logger.V(2).Info("Job has activeDeadlineSeconds configuration. Will sync this job again", "key", key, "nextSyncIn", syncDuration)
jm.queue.AddAfter(key, syncDuration)
}
}
}

suspendCondChanged := false
// Remove active pods if Job failed.
if jobCtx.finishedCondition != nil {
Expand All @@ -901,22 +930,6 @@ func (jm *Controller) syncJob(ctx context.Context, key string) (rErr error) {
active, action, manageJobErr = jm.manageJob(ctx, &job, jobCtx)
manageJobCalled = true
}
complete := false
if job.Spec.Completions == nil {
// This type of job is complete when any pod exits with success.
// Each pod is capable of
// determining whether or not the entire Job is done. Subsequent pods are
// not expected to fail, but if they do, the failure is ignored. Once any
// pod succeeds, the controller waits for remaining pods to finish, and
// then the job is complete.
complete = jobCtx.succeeded > 0 && active == 0
} else {
// Job specifies a number of completions. This type of job signals
// success by having that number of successes. Since we do not
// start more pods than there are remaining completions, there should
// not be any remaining active pods once this count is reached.
complete = jobCtx.succeeded >= *job.Spec.Completions && active == 0
}
if complete {
jobCtx.finishedCondition = newCondition(batch.JobComplete, v1.ConditionTrue, "", "", jm.clock.Now())
} else if manageJobCalled {
@@ -1486,7 +1499,6 @@ func jobSuspended(job *batch.Job) bool {
func (jm *Controller) manageJob(ctx context.Context, job *batch.Job, jobCtx *syncJobCtx) (int32, string, error) {
logger := klog.FromContext(ctx)
active := int32(len(jobCtx.activePods))
parallelism := *job.Spec.Parallelism
jobKey, err := controller.KeyFunc(job)
if err != nil {
utilruntime.HandleError(fmt.Errorf("Couldn't get key for job %#v: %v", job, err))
@@ -1513,27 +1525,7 @@ func (jm *Controller) manageJob(ctx context.Context, job *batch.Job, jobCtx *syn
terminating = *jobCtx.terminating
}
}
wantActive := int32(0)
if job.Spec.Completions == nil {
// Job does not specify a number of completions. Therefore, number active
// should be equal to parallelism, unless the job has seen at least
// once success, in which leave whatever is running, running.
if jobCtx.succeeded > 0 {
wantActive = active
} else {
wantActive = parallelism
}
} else {
// Job specifies a specific number of completions. Therefore, number
// active should not ever exceed number of remaining completions.
wantActive = *job.Spec.Completions - jobCtx.succeeded
if wantActive > parallelism {
wantActive = parallelism
}
if wantActive < 0 {
wantActive = 0
}
}
wantActive := wantActivePods(job, jobCtx)

rmAtLeast := active - wantActive
if rmAtLeast < 0 {
@@ -1676,6 +1668,35 @@ func (jm *Controller) manageJob(ctx context.Context, job *batch.Job, jobCtx *syn
return active, metrics.JobSyncActionTracking, nil
}

// wantActivePods returns a desired number of active pods.
func wantActivePods(job *batch.Job, jobCtx *syncJobCtx) int32 {
active := int32(len(jobCtx.activePods))
parallelism := *job.Spec.Parallelism
wantActive := int32(0)

if job.Spec.Completions == nil {
// Job does not specify a number of completions. Therefore, number active
// should be equal to parallelism, unless the job has seen at least
// once success, in which leave whatever is running, running.
if jobCtx.succeeded > 0 {
wantActive = active
} else {
wantActive = parallelism
}
} else {
// Job specifies a specific number of completions. Therefore, number
// active should not ever exceed number of remaining completions.
wantActive = *job.Spec.Completions - jobCtx.succeeded
if wantActive > parallelism {
wantActive = parallelism
}
if wantActive < 0 {
wantActive = 0
}
}
return wantActive
}

// getPodCreationInfoForIndependentIndexes returns a sub-list of all indexes
// to create that contains those which can be already created. In case no indexes
// are ready to create pods, it returns the lowest remaining time to create pods
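In short, the hunks above move the completion check ahead of the activeDeadlineSeconds check in syncJob: a Job whose pods have already succeeded (for example, activeDeadlineSeconds: 10 with a start time 15 seconds in the past and succeeded equal to completions, as in the new test cases below) is now marked Complete instead of Failed with reason DeadlineExceeded. A condensed, illustrative sketch of the resulting order follows; isComplete is a hypothetical stand-in for the inline completion logic, and the snippet assumes the fields and imports of job_controller.go.

// Condensed view of the reordered logic (illustrative, not the exact controller code).
if jobCtx.finishedCondition == nil && !isComplete(&job, jobCtx, wantActive) {
	// Only jobs that are not yet complete can fail the deadline check or need a resync.
	if jm.pastActiveDeadline(&job) {
		jobCtx.finishedCondition = newCondition(batch.JobFailed, v1.ConditionTrue,
			batch.JobReasonDeadlineExceeded, "Job was active longer than specified deadline", jm.clock.Now())
	} else if job.Spec.ActiveDeadlineSeconds != nil && !jobSuspended(&job) {
		// Requeue the job for when the remaining deadline elapses so the timeout is
		// still detected promptly for jobs that never complete.
		syncDuration := time.Duration(*job.Spec.ActiveDeadlineSeconds)*time.Second - jm.clock.Since(job.Status.StartTime.Time)
		jm.queue.AddAfter(key, syncDuration)
	}
}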
29 changes: 29 additions & 0 deletions pkg/controller/job/job_controller_test.go
@@ -2089,6 +2089,35 @@ func TestSyncJobPastDeadline(t *testing.T) {
expectedCondition: batch.JobSuspended,
expectedConditionReason: "JobSuspended",
},
"nonIndexed job succeeded and exceeded activeDeadlineSeconds": {
Contributor:
For these test cases, do they reproduce the bug if this code is removed?

Member Author:
Yes, we can reproduce issues like the following:

$ go test -run "TestSyncJobPastDeadline" ./pkg/controller/job/...
?       k8s.io/kubernetes/pkg/controller/job/config     [no test files]
?       k8s.io/kubernetes/pkg/controller/job/config/v1alpha1    [no test files]
?       k8s.io/kubernetes/pkg/controller/job/metrics    [no test files]
--- FAIL: TestSyncJobPastDeadline (0.00s)
    --- FAIL: TestSyncJobPastDeadline/nonIndexed_job_succeeded_and_exceeded_activeDeadlineSeconds (0.00s)
        job_controller_test.go:2094: Expected fail condition.  Got []v1.JobCondition{v1.JobCondition{Type:"Failed", Status:"True", LastProbeTime:time.Date(2023, time.November, 14, 13, 40, 12, 766800000, time.Local), LastTransitionTime:time.Date(2023, time.November, 14, 13, 40, 12, 766800000, time.Local), Reason:"DeadlineExceeded", Message:"Job was active longer than specified deadline"}}
    --- FAIL: TestSyncJobPastDeadline/indexed_job_succeeded_and_exceeded_activeDeadlineSeconds (0.00s)
        job_controller_test.go:2094: Expected fail condition.  Got []v1.JobCondition{v1.JobCondition{Type:"Failed", Status:"True", LastProbeTime:time.Date(2023, time.November, 14, 13, 40, 12, 767083000, time.Local), LastTransitionTime:time.Date(2023, time.November, 14, 13, 40, 12, 767083000, time.Local), Reason:"DeadlineExceeded", Message:"Job was active longer than specified deadline"}}
FAIL
FAIL    k8s.io/kubernetes/pkg/controller/job    0.817s
FAIL

Contributor:
Sounds good.

parallelism: 1,
activeDeadlineSeconds: 10,
startTime: 15,
succeededPods: 1,
expectedSucceeded: 1,
expectedCondition: batch.JobComplete,
},
"indexed job succeeded and exceeded activeDeadlineSeconds": {
parallelism: 2,
completions: 2,
activeDeadlineSeconds: 10,
startTime: 15,
succeededPods: 2,
expectedSucceeded: 2,
expectedCondition: batch.JobComplete,
},
"elasticIndexed job is scaled down and exceeded activeDeadlineSeconds; the number of succeeded pods already reached the completions": {
parallelism: 1,
completions: 1,
activeDeadlineSeconds: 10,
startTime: 15,
succeededPods: 1,
activePods: 2,
expectedFailed: 2,
expectedSucceeded: 1,
expectedDeletions: 2,
expectedCondition: batch.JobComplete,
},
}

for name, tc := range testCases {