Skip to content

Commit

Permalink
client: run alloc pre-kill hooks on last pass despite no live tasks
Browse files Browse the repository at this point in the history
This PR fixes a bug where alloc pre-kill hooks were not run in the
edge case where there are no live tasks remaining, but it is also
the final update to process for the (terminal) allocation. We need
to run cleanup hooks here, otherwise they will not run until the
allocation gets garbage collected (i.e. via Destroy()), possibly
at a distant time in the future.

Fixes #15477
  • Loading branch information
shoenig committed Jan 23, 2023
1 parent 43fa28a commit 6d6d5df
Show file tree
Hide file tree
Showing 4 changed files with 55 additions and 2 deletions.
12 changes: 11 additions & 1 deletion client/allocrunner/alloc_runner.go
Original file line number Diff line number Diff line change
Expand Up @@ -125,7 +125,7 @@ type allocRunner struct {
allocDir *allocdir.AllocDir

// runnerHooks are alloc runner lifecycle hooks that should be run on state
// transistions.
// transitions.
runnerHooks []interfaces.RunnerHook

// hookState is the output of allocrunner hooks
Expand Down Expand Up @@ -546,7 +546,9 @@ func (ar *allocRunner) handleTaskStateUpdates() {
}
}

// kill remaining live tasks
if len(liveRunners) > 0 {

// if all live runners are sidecars - kill alloc
onlySidecarsRemaining := hasSidecars && !hasNonSidecarTasks(liveRunners)
if killEvent == nil && onlySidecarsRemaining {
Expand Down Expand Up @@ -586,6 +588,14 @@ func (ar *allocRunner) handleTaskStateUpdates() {
}
}
} else {
// there are no live runners left

// run AR pre-kill hooks if this alloc is terminal; any post-stop
// tasks would regularly run in this state anyway (?)
if done {
ar.preKillHooks()
}

// If there are no live runners left kill all non-poststop task
// runners to unblock them from the alloc restart loop.
for _, tr := range ar.tasks {
Expand Down
1 change: 1 addition & 0 deletions client/allocrunner/alloc_runner_hooks.go
Original file line number Diff line number Diff line change
Expand Up @@ -329,6 +329,7 @@ func (ar *allocRunner) destroy() error {
func (ar *allocRunner) preKillHooks() {
for _, hook := range ar.runnerHooks {
pre, ok := hook.(interfaces.RunnerPreKillHook)

if !ok {
continue
}
Expand Down
43 changes: 43 additions & 0 deletions client/allocrunner/alloc_runner_test.go
Original file line number Diff line number Diff line change
Expand Up @@ -6,6 +6,7 @@ import (
"io/ioutil"
"os"
"path/filepath"
"sync/atomic"
"testing"
"time"

Expand All @@ -23,6 +24,8 @@ import (
"github.com/hashicorp/nomad/nomad/mock"
"github.com/hashicorp/nomad/nomad/structs"
"github.com/hashicorp/nomad/testutil"
"github.com/shoenig/test/must"
"github.com/shoenig/test/wait"
"github.com/stretchr/testify/require"
)

Expand Down Expand Up @@ -2398,3 +2401,43 @@ func TestHasSidecarTasks(t *testing.T) {
})
}
}

// allocPreKillHook is a test-only runner hook that records whether its
// PreKill method has been invoked.
type allocPreKillHook struct {
// ran is set to true once PreKill has been called. It is an atomic because
// the test reads it while the alloc runner executes in another goroutine.
ran atomic.Bool
}

// Name returns the fixed identifier of this test hook.
func (*allocPreKillHook) Name() string { return "test_prekill" }

// PreKill marks the hook as having run.
func (h *allocPreKillHook) PreKill() {
h.ran.Store(true)
}

// TestAllocRunner_PreKill_RunOnDone verifies that a pre-kill hook attached to
// the alloc runner is invoked for an allocation whose desired status is
// "stop" and whose only task exits almost immediately.
func TestAllocRunner_PreKill_RunOnDone(t *testing.T) {
	ci.Parallel(t)

	// Build an alloc that is already marked to stop, with a single mock
	// driver task configured to run for only 2ms.
	alloc := mock.Alloc()
	alloc.DesiredStatus = "stop"
	mockTask := alloc.Job.TaskGroups[0].Tasks[0]
	mockTask.Driver = "mock_driver"
	mockTask.Config = map[string]interface{}{"run_for": "2ms"}

	conf, cleanup := testAllocRunnerConfig(t, alloc.Copy())
	t.Cleanup(cleanup)

	ar, err := NewAllocRunner(conf)
	must.NoError(t, err)

	// Register the recording hook alongside whatever hooks the runner
	// already carries.
	preKill := &allocPreKillHook{}
	ar.runnerHooks = append(ar.runnerHooks, preKill)

	go ar.Run()
	defer destroy(ar)

	// Poll until the hook reports that it ran, or fail once the timeout
	// elapses.
	must.Wait(t, wait.InitialSuccess(
		wait.BoolFunc(preKill.ran.Load),
		wait.Timeout(5*time.Second),
		wait.Gap(500*time.Millisecond),
	))
}
1 change: 0 additions & 1 deletion client/allocrunner/alloc_runner_unix_test.go
Original file line number Diff line number Diff line change
@@ -1,5 +1,4 @@
//go:build !windows
// +build !windows

package allocrunner

Expand Down

0 comments on commit 6d6d5df

Please sign in to comment.