From dfc76b3e1f1887def8691e2ad27f7529db42fd80 Mon Sep 17 00:00:00 2001 From: Preetha Appan Date: Mon, 8 Oct 2018 21:03:49 -0500 Subject: [PATCH] Fix bug in reconciler where terminal allocs on a job already stopped were unnecessarily updated --- scheduler/reconcile.go | 1 + scheduler/reconcile_test.go | 62 +++++++++++++++++++++++++++++++++++++ 2 files changed, 63 insertions(+) diff --git a/scheduler/reconcile.go b/scheduler/reconcile.go index 9826751f319..43a73a2109c 100644 --- a/scheduler/reconcile.go +++ b/scheduler/reconcile.go @@ -272,6 +272,7 @@ func (a *allocReconciler) cancelDeployments() { // handleStop marks all allocations to be stopped, handling the lost case func (a *allocReconciler) handleStop(m allocMatrix) { for group, as := range m { + as = filterByTerminal(as) untainted, migrate, lost := as.filterByTainted(a.taintedNodes) a.markStop(untainted, "", allocNotNeeded) a.markStop(migrate, "", allocNotNeeded) diff --git a/scheduler/reconcile_test.go b/scheduler/reconcile_test.go index ea103dd9b1a..c0503b24c6e 100644 --- a/scheduler/reconcile_test.go +++ b/scheduler/reconcile_test.go @@ -1095,6 +1095,68 @@ func TestReconciler_JobStopped(t *testing.T) { } } +// Tests the reconciler doesn't update allocs in terminal state +// when job is stopped or nil +func TestReconciler_JobStopped_TerminalAllocs(t *testing.T) { + job := mock.Job() + job.Stop = true + + cases := []struct { + name string + job *structs.Job + jobID, taskGroup string + }{ + { + name: "stopped job", + job: job, + jobID: job.ID, + taskGroup: job.TaskGroups[0].Name, + }, + { + name: "nil job", + job: nil, + jobID: "foo", + taskGroup: "bar", + }, + } + + for _, c := range cases { + t.Run(c.name, func(t *testing.T) { + // Create 10 terminal allocations + var allocs []*structs.Allocation + for i := 0; i < 10; i++ { + alloc := mock.Alloc() + alloc.Job = c.job + alloc.JobID = c.jobID + alloc.NodeID = uuid.Generate() + alloc.Name = structs.AllocName(c.jobID, c.taskGroup, uint(i)) + alloc.TaskGroup = c.taskGroup + if i%2 == 0 { + alloc.DesiredStatus = structs.AllocDesiredStatusStop + } else { + alloc.ClientStatus = structs.AllocClientStatusFailed + } + allocs = append(allocs, alloc) + } + + reconciler := NewAllocReconciler(testlog.HCLogger(t), allocUpdateFnIgnore, false, c.jobID, c.job, nil, allocs, nil, "") + r := reconciler.Compute() + require.Len(t, r.stop, 0) + // Assert the correct results + assertResults(t, r, &resultExpectation{ + createDeployment: nil, + deploymentUpdates: nil, + place: 0, + inplace: 0, + stop: 0, + desiredTGUpdates: map[string]*structs.DesiredUpdates{ + c.taskGroup: {}, + }, + }) + }) + } +} + // Tests the reconciler properly handles jobs with multiple task groups func TestReconciler_MultiTG(t *testing.T) { job := mock.Job()