From 59335284049f94f6db0c4a36d215660294e162b7 Mon Sep 17 00:00:00 2001 From: Danielle Lancashire Date: Wed, 12 Jun 2019 16:00:21 +0200 Subject: [PATCH 1/2] trhooks: Add TaskStopHook interface to services We currently only run cleanup Service Hooks when a task is either Killed, or Exited. However, due to the implementation of a task runner, tasks are only Exited if they every correctly started running, which is not true when you recieve an error early in the task start flow, such as not being able to pull secrets from Vault. This updates the service hook to also call consul deregistration routines during a task Stop lifecycle event, to ensure that any registered checks and services are cleared in such cases. fixes #5770 --- client/allocrunner/alloc_runner_unix_test.go | 3 ++- client/allocrunner/taskrunner/service_hook.go | 12 ++++++++++++ client/allocrunner/taskrunner/task_runner_test.go | 6 +++++- 3 files changed, 19 insertions(+), 2 deletions(-) diff --git a/client/allocrunner/alloc_runner_unix_test.go b/client/allocrunner/alloc_runner_unix_test.go index ecb387d34e8..e0608efc75c 100644 --- a/client/allocrunner/alloc_runner_unix_test.go +++ b/client/allocrunner/alloc_runner_unix_test.go @@ -116,8 +116,9 @@ func TestAllocRunner_Restore_RunningTerminal(t *testing.T) { // Assert consul was cleaned up: // 2 removals (canary+noncanary) during prekill // 2 removals (canary+noncanary) during exited + // 2 removals (canary+noncanary) during stop consulOps := conf2.Consul.(*consul.MockConsulServiceClient).GetOps() - require.Len(t, consulOps, 4) + require.Len(t, consulOps, 6) for _, op := range consulOps { require.Equal(t, "remove", op.Op) } diff --git a/client/allocrunner/taskrunner/service_hook.go b/client/allocrunner/taskrunner/service_hook.go index c5def6b29a3..a8911041710 100644 --- a/client/allocrunner/taskrunner/service_hook.go +++ b/client/allocrunner/taskrunner/service_hook.go @@ -16,6 +16,11 @@ import ( "github.com/hashicorp/nomad/plugins/drivers" ) +var _ interfaces.TaskPoststartHook = &serviceHook{} +var _ interfaces.TaskPreKillHook = &serviceHook{} +var _ interfaces.TaskExitedHook = &serviceHook{} +var _ interfaces.TaskStopHook = &serviceHook{} + type serviceHookConfig struct { alloc *structs.Allocation task *structs.Task @@ -179,6 +184,13 @@ func (h *serviceHook) deregister() { } +func (h *serviceHook) Stop(ctx context.Context, req *interfaces.TaskStopRequest, resp *interfaces.TaskStopResponse) error { + h.mu.Lock() + defer h.mu.Unlock() + h.deregister() + return nil +} + func (h *serviceHook) getTaskServices() *agentconsul.TaskServices { // Interpolate with the task's environment interpolatedServices := interpolateServices(h.taskEnv, h.services) diff --git a/client/allocrunner/taskrunner/task_runner_test.go b/client/allocrunner/taskrunner/task_runner_test.go index 7d2bd5275e6..234aa70bd30 100644 --- a/client/allocrunner/taskrunner/task_runner_test.go +++ b/client/allocrunner/taskrunner/task_runner_test.go @@ -1991,7 +1991,7 @@ func TestTaskRunner_UnregisterConsul_Retries(t *testing.T) { consul := conf.Consul.(*consulapi.MockConsulServiceClient) consulOps := consul.GetOps() - require.Len(t, consulOps, 6) + require.Len(t, consulOps, 8) // Initial add require.Equal(t, "add", consulOps[0].Op) @@ -2006,6 +2006,10 @@ func TestTaskRunner_UnregisterConsul_Retries(t *testing.T) { // Removing canary and non-canary entries on retry require.Equal(t, "remove", consulOps[4].Op) require.Equal(t, "remove", consulOps[5].Op) + + // Removing canary and non-canary entries on stop + require.Equal(t, "remove", consulOps[1].Op) + require.Equal(t, "remove", consulOps[2].Op) } // testWaitForTaskToStart waits for the task to be running or fails the test From 1aa6bc80d8cdfedec0a097cdb666f912a909c5f0 Mon Sep 17 00:00:00 2001 From: Danielle Lancashire Date: Wed, 12 Jun 2019 17:06:11 +0200 Subject: [PATCH 2/2] trt: Fix test --- client/allocrunner/taskrunner/task_runner_test.go | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/client/allocrunner/taskrunner/task_runner_test.go b/client/allocrunner/taskrunner/task_runner_test.go index 234aa70bd30..b3506d1b36c 100644 --- a/client/allocrunner/taskrunner/task_runner_test.go +++ b/client/allocrunner/taskrunner/task_runner_test.go @@ -2008,8 +2008,8 @@ func TestTaskRunner_UnregisterConsul_Retries(t *testing.T) { require.Equal(t, "remove", consulOps[5].Op) // Removing canary and non-canary entries on stop - require.Equal(t, "remove", consulOps[1].Op) - require.Equal(t, "remove", consulOps[2].Op) + require.Equal(t, "remove", consulOps[6].Op) + require.Equal(t, "remove", consulOps[7].Op) } // testWaitForTaskToStart waits for the task to be running or fails the test