
Commit b82fd2e

Authored Jun 20, 2025

scheduler: refactor cluster reconciler to avoid hidden state mutation (#26042)

The cluster reconciler code is notoriously hard to follow because most of its methods continuously mutate fields on the allocReconciler object. Even in the top-level methods this makes the code hard to trace, and it gets really gnarly in the lower-level methods, of which there are many. This changeset refactors the reconciler so that the vast majority of those methods return explicit values instead of mutating object fields.

1 parent c8dcd3c · commit b82fd2e
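To make the shape of the change easier to see before reading the diffs, here is a minimal, self-contained sketch of the pattern using toy types. The names loosely mirror the diff below (ClusterState, Compute, a result value), but this is not the actual Nomad code: the "before" style feeds inputs in and collects outputs out through fields on the reconciler object, while the "after" style passes the cluster state in explicitly and has Compute() return the results.

// Toy sketch of the refactoring direction; not the actual Nomad reconciler API.
package main

import (
	"fmt"
	"time"
)

// ---- before: hidden state mutation ----

type mutatingReconciler struct {
	tainted map[string]bool // input smuggled in as a field
	Result  struct {        // output smuggled out as a field
		Stop []string
	}
}

func (r *mutatingReconciler) Compute() {
	for node, bad := range r.tainted {
		if bad {
			r.Result.Stop = append(r.Result.Stop, node) // hidden write to a field
		}
	}
}

// ---- after: explicit inputs and outputs ----

type clusterState struct {
	TaintedNodes map[string]bool
	Now          time.Time
}

type reconcileResults struct {
	Stop []string
}

type reconciler struct {
	state clusterState
}

func (r *reconciler) Compute() reconcileResults {
	var res reconcileResults
	for node, bad := range r.state.TaintedNodes {
		if bad {
			res.Stop = append(res.Stop, node) // result is returned, not stored on r
		}
	}
	return res
}

func main() {
	r := &reconciler{state: clusterState{
		TaintedNodes: map[string]bool{"node-1": true},
		Now:          time.Now().UTC(),
	}}
	result := r.Compute()
	fmt.Println(result.Stop) // [node-1]
}

The payoff is that each call site shows exactly which state a computation reads and which results it produces; the change to generic_sched.go below applies this shape with reconciler.ClusterState and the value returned by r.Compute().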

File tree

6 files changed (+976, -937 lines)

scheduler/generic_sched.go

Lines changed: 26 additions & 22 deletions

@@ -340,51 +340,55 @@ func (s *GenericScheduler) computeJobAllocs() error {
 
 	r := reconciler.NewAllocReconciler(s.logger,
 		genericAllocUpdateFn(s.ctx, s.stack, s.eval.ID),
-		s.batch, s.eval.JobID, s.job, s.deployment, allocs, tainted, s.eval.ID,
-		s.eval.Priority, s.planner.ServersMeetMinimumVersion(minVersionMaxClientDisconnect, true))
-	r.Compute()
-	s.logger.Debug("reconciled current state with desired state", "results", log.Fmt("%#v", r.Result))
+		s.batch, s.eval.JobID, s.job, s.deployment, allocs, s.eval.ID,
+		s.eval.Priority, reconciler.ClusterState{
+			TaintedNodes:                tainted,
+			SupportsDisconnectedClients: s.planner.ServersMeetMinimumVersion(minVersionMaxClientDisconnect, true),
+			Now:                         time.Now().UTC(),
+		})
+	result := r.Compute()
+	s.logger.Debug("reconciled current state with desired state", "results", log.Fmt("%#v", result))
 
 	if s.eval.AnnotatePlan {
 		s.plan.Annotations = &structs.PlanAnnotations{
-			DesiredTGUpdates: r.Result.DesiredTGUpdates,
+			DesiredTGUpdates: result.DesiredTGUpdates,
 		}
 	}
 
 	// Add the deployment changes to the plan
-	s.plan.Deployment = r.Result.Deployment
-	s.plan.DeploymentUpdates = r.Result.DeploymentUpdates
+	s.plan.Deployment = result.Deployment
+	s.plan.DeploymentUpdates = result.DeploymentUpdates
 
 	// Store all the follow up evaluations from rescheduled allocations
-	if len(r.Result.DesiredFollowupEvals) > 0 {
-		for _, evals := range r.Result.DesiredFollowupEvals {
+	if len(result.DesiredFollowupEvals) > 0 {
+		for _, evals := range result.DesiredFollowupEvals {
 			s.followUpEvals = append(s.followUpEvals, evals...)
 		}
 	}
 
 	// Update the stored deployment
-	if r.Result.Deployment != nil {
-		s.deployment = r.Result.Deployment
+	if result.Deployment != nil {
+		s.deployment = result.Deployment
 	}
 
 	// Handle the stop
-	for _, stop := range r.Result.Stop {
+	for _, stop := range result.Stop {
 		s.plan.AppendStoppedAlloc(stop.Alloc, stop.StatusDescription, stop.ClientStatus, stop.FollowupEvalID)
 	}
 
 	// Handle disconnect updates
-	for _, update := range r.Result.DisconnectUpdates {
+	for _, update := range result.DisconnectUpdates {
 		s.plan.AppendUnknownAlloc(update)
 	}
 
 	// Handle reconnect updates.
 	// Reconnected allocs have a new AllocState entry.
-	for _, update := range r.Result.ReconnectUpdates {
+	for _, update := range result.ReconnectUpdates {
 		s.ctx.Plan().AppendAlloc(update, nil)
 	}
 
 	// Handle the in-place updates
-	for _, update := range r.Result.InplaceUpdate {
+	for _, update := range result.InplaceUpdate {
 		if update.DeploymentID != s.deployment.GetID() {
 			update.DeploymentID = s.deployment.GetID()
 			update.DeploymentStatus = nil
@@ -393,12 +397,12 @@ func (s *GenericScheduler) computeJobAllocs() error {
 	}
 
 	// Handle the annotation updates
-	for _, update := range r.Result.AttributeUpdates {
+	for _, update := range result.AttributeUpdates {
 		s.ctx.Plan().AppendAlloc(update, nil)
 	}
 
 	// Nothing remaining to do if placement is not required
-	if len(r.Result.Place)+len(r.Result.DestructiveUpdate) == 0 {
+	if len(result.Place)+len(result.DestructiveUpdate) == 0 {
 		// If the job has been purged we don't have access to the job. Otherwise
 		// set the queued allocs to zero. This is true if the job is being
 		// stopped as well.
@@ -411,18 +415,18 @@ func (s *GenericScheduler) computeJobAllocs() error {
 	}
 
 	// Compute the placements
-	place := make([]reconciler.PlacementResult, 0, len(r.Result.Place))
-	for _, p := range r.Result.Place {
+	place := make([]reconciler.PlacementResult, 0, len(result.Place))
+	for _, p := range result.Place {
 		s.queuedAllocs[p.TaskGroup().Name] += 1
 		place = append(place, p)
 	}
 
-	destructive := make([]reconciler.PlacementResult, 0, len(r.Result.DestructiveUpdate))
-	for _, p := range r.Result.DestructiveUpdate {
+	destructive := make([]reconciler.PlacementResult, 0, len(result.DestructiveUpdate))
+	for _, p := range result.DestructiveUpdate {
		s.queuedAllocs[p.TaskGroup().Name] += 1
 		destructive = append(destructive, p)
 	}
-	return s.computePlacements(destructive, place, r.Result.TaskGroupAllocNameIndexes)
+	return s.computePlacements(destructive, place, result.TaskGroupAllocNameIndexes)
 }
 
 // downgradedJobForPlacement returns the previous stable version of the job for
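Condensed from the hunks above, the call shape in computeJobAllocs after this change is roughly the following excerpt; every identifier here appears in the diff, and the surrounding plan construction and error handling are elided:

r := reconciler.NewAllocReconciler(s.logger,
	genericAllocUpdateFn(s.ctx, s.stack, s.eval.ID),
	s.batch, s.eval.JobID, s.job, s.deployment, allocs, s.eval.ID,
	s.eval.Priority, reconciler.ClusterState{
		TaintedNodes:                tainted,
		SupportsDisconnectedClients: s.planner.ServersMeetMinimumVersion(minVersionMaxClientDisconnect, true),
		Now:                         time.Now().UTC(),
	})

result := r.Compute()

// Downstream plan construction reads from the returned value rather than
// from fields on the reconciler, for example:
s.plan.Deployment = result.Deployment
s.plan.DeploymentUpdates = result.DeploymentUpdates

Because the cluster state is passed in as one value and the results come back as one value, nothing in the scheduler needs to know which fields Compute() touched internally.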

scheduler/reconciler/allocs.go

Lines changed: 0 additions & 255 deletions

@@ -224,235 +224,6 @@ func (a allocSet) fromKeys(keys ...[]string) allocSet {
 	return from
 }
 
-// filterByTainted takes a set of tainted nodes and filters the allocation set
-// into the following groups:
-// 1. Those that exist on untainted nodes
-// 2. Those exist on nodes that are draining
-// 3. Those that exist on lost nodes or have expired
-// 4. Those that are on nodes that are disconnected, but have not had their ClientState set to unknown
-// 5. Those that are on a node that has reconnected.
-// 6. Those that are in a state that results in a noop.
-func (a allocSet) filterByTainted(taintedNodes map[string]*structs.Node, serverSupportsDisconnectedClients bool, now time.Time) (untainted, migrate, lost, disconnecting, reconnecting, ignore, expiring allocSet) {
-	untainted = make(map[string]*structs.Allocation)
-	migrate = make(map[string]*structs.Allocation)
-	lost = make(map[string]*structs.Allocation)
-	disconnecting = make(map[string]*structs.Allocation)
-	reconnecting = make(map[string]*structs.Allocation)
-	ignore = make(map[string]*structs.Allocation)
-	expiring = make(map[string]*structs.Allocation)
-
-	for _, alloc := range a {
-		// make sure we don't apply any reconnect logic to task groups
-		// without max_client_disconnect
-		supportsDisconnectedClients := alloc.SupportsDisconnectedClients(serverSupportsDisconnectedClients)
-
-		reconnect := false
-
-		// Only compute reconnect for unknown, running, and failed since they
-		// need to go through the reconnect logic.
-		if supportsDisconnectedClients &&
-			(alloc.ClientStatus == structs.AllocClientStatusUnknown ||
-				alloc.ClientStatus == structs.AllocClientStatusRunning ||
-				alloc.ClientStatus == structs.AllocClientStatusFailed) {
-			reconnect = alloc.NeedsToReconnect()
-		}
-
-		// Failed allocs that need to be reconnected must be added to
-		// reconnecting so that they can be handled as a failed reconnect.
-		if supportsDisconnectedClients &&
-			reconnect &&
-			alloc.DesiredStatus == structs.AllocDesiredStatusRun &&
-			alloc.ClientStatus == structs.AllocClientStatusFailed {
-			reconnecting[alloc.ID] = alloc
-			continue
-		}
-
-		taintedNode, nodeIsTainted := taintedNodes[alloc.NodeID]
-		if taintedNode != nil && taintedNode.Status == structs.NodeStatusDisconnected {
-			// Group disconnecting
-			if supportsDisconnectedClients {
-				// Filter running allocs on a node that is disconnected to be marked as unknown.
-				if alloc.ClientStatus == structs.AllocClientStatusRunning {
-					disconnecting[alloc.ID] = alloc
-					continue
-				}
-				// Filter pending allocs on a node that is disconnected to be marked as lost.
-				if alloc.ClientStatus == structs.AllocClientStatusPending {
-					lost[alloc.ID] = alloc
-					continue
-				}
-
-			} else {
-				if alloc.PreventReplaceOnDisconnect() {
-					if alloc.ClientStatus == structs.AllocClientStatusRunning {
-						disconnecting[alloc.ID] = alloc
-						continue
-					}
-
-					untainted[alloc.ID] = alloc
-					continue
-				}
-
-				lost[alloc.ID] = alloc
-				continue
-			}
-		}
-
-		if alloc.TerminalStatus() && !reconnect {
-			// Server-terminal allocs, if supportsDisconnectedClient and not reconnect,
-			// are probably stopped replacements and should be ignored
-			if supportsDisconnectedClients && alloc.ServerTerminalStatus() {
-				ignore[alloc.ID] = alloc
-				continue
-			}
-
-			// Terminal canaries that have been marked for migration need to be
-			// migrated, otherwise we block deployments from progressing by
-			// counting them as running canaries.
-			if alloc.DeploymentStatus.IsCanary() && alloc.DesiredTransition.ShouldMigrate() {
-				migrate[alloc.ID] = alloc
-				continue
-			}
-
-			// Terminal allocs, if not reconnect, are always untainted as they
-			// should never be migrated.
-			untainted[alloc.ID] = alloc
-			continue
-		}
-
-		// Non-terminal allocs that should migrate should always migrate
-		if alloc.DesiredTransition.ShouldMigrate() {
-			migrate[alloc.ID] = alloc
-			continue
-		}
-
-		if supportsDisconnectedClients && alloc.Expired(now) {
-			expiring[alloc.ID] = alloc
-			continue
-		}
-
-		// Acknowledge unknown allocs that we want to reconnect eventually.
-		if supportsDisconnectedClients &&
-			alloc.ClientStatus == structs.AllocClientStatusUnknown &&
-			alloc.DesiredStatus == structs.AllocDesiredStatusRun {
-			untainted[alloc.ID] = alloc
-			continue
-		}
-
-		// Ignore failed allocs that need to be reconnected and that have been
-		// marked to stop by the server.
-		if supportsDisconnectedClients &&
-			reconnect &&
-			alloc.ClientStatus == structs.AllocClientStatusFailed &&
-			alloc.DesiredStatus == structs.AllocDesiredStatusStop {
-			ignore[alloc.ID] = alloc
-			continue
-		}
-
-		if !nodeIsTainted || (taintedNode != nil && taintedNode.Status == structs.NodeStatusReady) {
-			// Filter allocs on a node that is now re-connected to be resumed.
-			if reconnect {
-				// Expired unknown allocs should be processed depending on the max client disconnect
-				// and/or avoid reschedule on lost configurations, they are both treated as
-				// expiring.
-				if alloc.Expired(now) {
-					expiring[alloc.ID] = alloc
-					continue
-				}
-
-				reconnecting[alloc.ID] = alloc
-				continue
-			}
-
-			// Otherwise, Node is untainted so alloc is untainted
-			untainted[alloc.ID] = alloc
-			continue
-		}
-
-		// Allocs on GC'd (nil) or lost nodes are Lost
-		if taintedNode == nil {
-			lost[alloc.ID] = alloc
-			continue
-		}
-
-		// Allocs on terminal nodes that can't be rescheduled need to be treated
-		// differently than those that can.
-		if taintedNode.TerminalStatus() {
-			if alloc.PreventReplaceOnDisconnect() {
-				if alloc.ClientStatus == structs.AllocClientStatusUnknown {
-					untainted[alloc.ID] = alloc
-					continue
-				} else if alloc.ClientStatus == structs.AllocClientStatusRunning {
-					disconnecting[alloc.ID] = alloc
-					continue
-				}
-			}
-
-			lost[alloc.ID] = alloc
-			continue
-		}
-
-		// All other allocs are untainted
-		untainted[alloc.ID] = alloc
-	}
-
-	return
-}
-
-// filterByRescheduleable filters the allocation set to return the set of allocations that are either
-// untainted or a set of allocations that must be rescheduled now. Allocations that can be rescheduled
-// at a future time are also returned so that we can create follow up evaluations for them. Allocs are
-// skipped or considered untainted according to logic defined in shouldFilter method.
-func (a allocSet) filterByRescheduleable(isBatch, isDisconnecting bool, now time.Time, evalID string, deployment *structs.Deployment) (allocSet, allocSet, []*delayedRescheduleInfo) {
-	untainted := make(map[string]*structs.Allocation)
-	rescheduleNow := make(map[string]*structs.Allocation)
-	rescheduleLater := []*delayedRescheduleInfo{}
-
-	for _, alloc := range a {
-		// Ignore disconnecting allocs that are already unknown. This can happen
-		// in the case of canaries that are interrupted by a disconnect.
-		if isDisconnecting && alloc.ClientStatus == structs.AllocClientStatusUnknown {
-			continue
-		}
-
-		var eligibleNow, eligibleLater bool
-		var rescheduleTime time.Time
-
-		// Ignore failing allocs that have already been rescheduled.
-		// Only failed or disconnecting allocs should be rescheduled.
-		// Protects against a bug allowing rescheduling running allocs.
-		if alloc.NextAllocation != "" && alloc.TerminalStatus() {
-			continue
-		}
-
-		isUntainted, ignore := shouldFilter(alloc, isBatch)
-		if isUntainted && !isDisconnecting {
-			untainted[alloc.ID] = alloc
-			continue // these allocs can never be rescheduled, so skip checking
-		}
-
-		if ignore {
-			continue
-		}
-
-		eligibleNow, eligibleLater, rescheduleTime = updateByReschedulable(alloc, now, evalID, deployment, isDisconnecting)
-		if eligibleNow {
-			rescheduleNow[alloc.ID] = alloc
-			continue
-		}
-
-		// If the failed alloc is not eligible for rescheduling now we
-		// add it to the untainted set.
-		untainted[alloc.ID] = alloc
-
-		if eligibleLater {
-			rescheduleLater = append(rescheduleLater, &delayedRescheduleInfo{alloc.ID, alloc, rescheduleTime})
-		}
-
-	}
-	return untainted, rescheduleNow, rescheduleLater
-}
-
 // shouldFilter returns whether the alloc should be ignored or considered untainted.
 //
 // Ignored allocs are filtered out.
@@ -550,32 +321,6 @@ func updateByReschedulable(alloc *structs.Allocation, now time.Time, evalID stri
 	return
 }
 
-// filterByTerminal filters out terminal allocs
-func filterByTerminal(untainted allocSet) (nonTerminal allocSet) {
-	nonTerminal = make(map[string]*structs.Allocation)
-	for id, alloc := range untainted {
-		if !alloc.TerminalStatus() {
-			nonTerminal[id] = alloc
-		}
-	}
-	return
-}
-
-// filterByDeployment filters allocations into two sets, those that match the
-// given deployment ID and those that don't
-func (a allocSet) filterByDeployment(id string) (match, nonmatch allocSet) {
-	match = make(map[string]*structs.Allocation)
-	nonmatch = make(map[string]*structs.Allocation)
-	for _, alloc := range a {
-		if alloc.DeploymentID == id {
-			match[alloc.ID] = alloc
-		} else {
-			nonmatch[alloc.ID] = alloc
-		}
-	}
-	return
-}
-
 // delayByStopAfter returns a delay for any lost allocation that's got a
 // disconnect.stop_on_client_after configured
 func (a allocSet) delayByStopAfter() (later []*delayedRescheduleInfo) {
(The remainder of the diff, covering the other 4 changed files, did not load and is not shown here.)
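Because the rest of the changeset is not visible above, it is not shown here where filterByTainted and the other removed helpers end up. Purely as a hypothetical illustration of the commit's stated direction (explicit values rather than a seven-value positional return), a bundled result type could look like the toy sketch below; none of these names or types come from this commit.

// Hypothetical sketch only; invented toy types, not code added by this commit.
package main

import "fmt"

type alloc struct {
	ID       string
	NodeDown bool
	Terminal bool
}

// clusterFilterResult bundles the groups that filterByTainted used to
// return as seven separate named sets.
type clusterFilterResult struct {
	Untainted     map[string]alloc
	Migrate       map[string]alloc
	Lost          map[string]alloc
	Disconnecting map[string]alloc
	Reconnecting  map[string]alloc
	Ignore        map[string]alloc
	Expiring      map[string]alloc
}

// classify is a drastically simplified stand-in for the real filtering
// logic; it only populates three of the groups to keep the sketch short.
func classify(allocs []alloc) clusterFilterResult {
	res := clusterFilterResult{
		Untainted: map[string]alloc{},
		Lost:      map[string]alloc{},
		Ignore:    map[string]alloc{},
	}
	for _, a := range allocs {
		switch {
		case a.Terminal:
			res.Ignore[a.ID] = a
		case a.NodeDown:
			res.Lost[a.ID] = a
		default:
			res.Untainted[a.ID] = a
		}
	}
	return res
}

func main() {
	out := classify([]alloc{{ID: "a1"}, {ID: "a2", NodeDown: true}})
	fmt.Println(len(out.Untainted), len(out.Lost)) // 1 1
}

A single result value like this keeps call sites readable and avoids the hidden-state problem the commit message describes, since callers name the group they care about instead of tracking positional return values or mutated fields.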
