support script checks for task group services (#6197)

In Nomad prior to Consul Connect, all Consul checks work the same way
except for Script checks. Because the Task being checked is running in
its own container namespaces, the check is executed by Nomad in the
Task's context. If the Script check passes, Nomad uses the TTL check
feature of Consul to update the check status. This means that in order
to run a Script check, we need to know which Task to execute it in.

To support Consul Connect, we need Group Services, and these need to
be registered in Consul along with their checks. We could push the
Service down into the Task, but this doesn't work if someone wants to
associate a service with one task's ports but run script checks in
another task in the allocation.

Because Nomad, not Consul, handles the Script check anyway, this
change moves script check handling into the task runner so that the
task runner can own the script check's configuration and lifecycle.
This allows us to pass the group service check configuration down
into a task without associating the service itself with the task.

When tasks are checked for script checks, we walk back through their
task group to see if there are script checks associated with the
task. If so, we spin off script check tasklets for them. The
group-level service and any restart behaviors it needs are entirely
encapsulated within the group service hook.
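
A sketch of what one evaluation looks like under this model
(illustrative only: the evalScriptCheck helper is hypothetical, the
executor signature is an assumption, and the status mapping mirrors
TestScript_Exec_Codes in the tests below):

    // evalScriptCheck runs one script check inside the task and reports
    // the result to Consul through its TTL check endpoint.
    // (Hypothetical helper, for illustration only.)
    func evalScriptCheck(hb heartbeater, exec interfaces.ScriptExecutor,
            checkID string, check *structs.ServiceCheck) error {
            // Execute the command in the task's context, bounded by the
            // check's timeout. (Assumed executor signature.)
            output, code, err := exec.Exec(check.Timeout, check.Command, check.Args)

            // Translate the result into a Consul health status. Any executor
            // error, including a timeout, is critical, and its message
            // replaces the script's output.
            state := api.HealthCritical
            switch {
            case err != nil:
                    output = []byte(err.Error())
            case code == 0:
                    state = api.HealthPassing
            case code == 1:
                    state = api.HealthWarning
            }

            // Heartbeat the result via Consul's TTL check feature.
            return hb.UpdateTTL(checkID, string(output), state)
    }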

package taskrunner

import (
	"context"
	"fmt"
	"sync/atomic"
	"testing"
	"time"

	"github.com/hashicorp/consul/api"
	hclog "github.com/hashicorp/go-hclog"
	"github.com/hashicorp/nomad/client/allocrunner/taskrunner/interfaces"
	"github.com/hashicorp/nomad/client/consul"
	"github.com/hashicorp/nomad/client/taskenv"
	agentconsul "github.com/hashicorp/nomad/command/agent/consul"
	"github.com/hashicorp/nomad/helper/testlog"
	"github.com/hashicorp/nomad/nomad/mock"
	"github.com/hashicorp/nomad/nomad/structs"
	"github.com/stretchr/testify/require"
)
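
// newScriptMock returns a scriptCheck that reports to the given heartbeater
// and runs its command through the given ScriptExecutor, using the supplied
// check interval and timeout.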
func newScriptMock(hb heartbeater, exec interfaces.ScriptExecutor, logger hclog.Logger, interval, timeout time.Duration) *scriptCheck {
	script := newScriptCheck(&scriptCheckConfig{
		allocID:   "allocid",
		taskName:  "testtask",
		serviceID: "serviceid",
		check: &structs.ServiceCheck{
			Interval: interval,
			Timeout:  timeout,
		},
		agent:      hb,
		driverExec: exec,
		taskEnv:    &taskenv.TaskEnv{},
		logger:     logger,
		shutdownCh: nil,
	})
	script.callback = newScriptCheckCallback(script)
	script.lastCheckOk = true
	return script
}

// fakeHeartbeater implements the heartbeater interface to allow mocking out
// Consul in script executor tests.
type fakeHeartbeater struct {
	heartbeats chan heartbeat
}

func (f *fakeHeartbeater) UpdateTTL(checkID, output, status string) error {
	f.heartbeats <- heartbeat{checkID: checkID, output: output, status: status}
	return nil
}

func newFakeHeartbeater() *fakeHeartbeater {
	return &fakeHeartbeater{heartbeats: make(chan heartbeat)}
}

// heartbeat records the arguments of a single UpdateTTL call so tests can
// assert on them.
type heartbeat struct {
	checkID string
	output  string
	status  string
}

// TestScript_Exec_Cancel asserts that cancelling a script check
// short-circuits any running scripts.
func TestScript_Exec_Cancel(t *testing.T) {
	exec, cancel := newBlockingScriptExec()
	defer cancel()

	logger := testlog.HCLogger(t)
	script := newScriptMock(nil, // heartbeater should never be called
		exec, logger, time.Hour, time.Hour)

	handle := script.run()
	<-exec.running  // wait until Exec is called
	handle.cancel() // cancel now that we're blocked in exec

	select {
	case <-handle.wait():
	case <-time.After(3 * time.Second):
		t.Fatalf("timed out waiting for script check to exit")
	}

	// The underlying ScriptExecutor (newBlockingScriptExec) *cannot* be
	// canceled. Only a wrapper around it obeys the context cancelation.
	require.NotEqual(t, atomic.LoadInt32(&exec.exited), 1,
		"expected script executor to still be running after timeout")
}

// TestScript_Exec_TimeoutBasic asserts a script will be killed when the
// timeout is reached.
func TestScript_Exec_TimeoutBasic(t *testing.T) {
	t.Parallel()
	exec, cancel := newBlockingScriptExec()
	defer cancel()

	logger := testlog.HCLogger(t)
	hb := newFakeHeartbeater()
	script := newScriptMock(hb, exec, logger, time.Hour, time.Second)

	handle := script.run()
	defer handle.cancel() // cleanup
	<-exec.running        // wait until Exec is called

	// Check for UpdateTTL call
	select {
	case update := <-hb.heartbeats:
		require.Equal(t, update.output, context.DeadlineExceeded.Error())
		require.Equal(t, update.status, api.HealthCritical)
	case <-time.After(3 * time.Second):
		t.Fatalf("timed out waiting for script check to exit")
	}

	// The underlying ScriptExecutor (newBlockingScriptExec) *cannot* be
	// canceled. Only a wrapper around it obeys the context cancelation.
	require.NotEqual(t, atomic.LoadInt32(&exec.exited), 1,
		"expected script executor to still be running after timeout")

	// Cancel and watch for exit
	handle.cancel()
	select {
	case <-handle.wait(): // ok!
	case update := <-hb.heartbeats:
		t.Errorf("unexpected UpdateTTL call on exit with status=%q", update)
	case <-time.After(3 * time.Second):
		t.Fatalf("timed out waiting for script check to exit")
	}
}

// TestScript_Exec_TimeoutCritical asserts a script will be killed when the
// timeout is reached and that a critical status is always set regardless of
// what Exec returns.
func TestScript_Exec_TimeoutCritical(t *testing.T) {
	t.Parallel()
	logger := testlog.HCLogger(t)
	hb := newFakeHeartbeater()
	script := newScriptMock(hb, sleeperExec{}, logger, time.Hour, time.Nanosecond)

	handle := script.run()
	defer handle.cancel() // cleanup

	// Check for UpdateTTL call
	select {
	case update := <-hb.heartbeats:
		require.Equal(t, update.output, context.DeadlineExceeded.Error())
		require.Equal(t, update.status, api.HealthCritical)
	case <-time.After(3 * time.Second):
		t.Fatalf("timed out waiting for script check to timeout")
	}
}

// TestScript_Exec_Shutdown asserts a script will be executed once more
// when told to shutdown.
func TestScript_Exec_Shutdown(t *testing.T) {
	shutdown := make(chan struct{})
	exec := newSimpleExec(0, nil)
	logger := testlog.HCLogger(t)
	hb := newFakeHeartbeater()
	script := newScriptMock(hb, exec, logger, time.Hour, 3*time.Second)
	script.shutdownCh = shutdown

	handle := script.run()
	defer handle.cancel() // cleanup
	close(shutdown)       // tell scriptCheck to exit

	select {
	case update := <-hb.heartbeats:
		require.Equal(t, update.output, "code=0 err=<nil>")
		require.Equal(t, update.status, api.HealthPassing)
	case <-time.After(3 * time.Second):
		t.Fatalf("timed out waiting for script check to exit")
	}

	select {
	case <-handle.wait(): // ok!
	case <-time.After(3 * time.Second):
		t.Fatalf("timed out waiting for script check to exit")
	}
}

// TestScript_Exec_Codes asserts script exit codes are translated to their
// corresponding Consul health check status.
func TestScript_Exec_Codes(t *testing.T) {
	exec := newScriptedExec([]execResult{
		{[]byte("output"), 1, nil},
		{[]byte("output"), 0, nil},
		{[]byte("output"), 0, context.DeadlineExceeded},
		{[]byte("output"), 0, nil},
		{[]byte("<ignored output>"), 2, fmt.Errorf("some error")},
		{[]byte("output"), 0, nil},
		{[]byte("error9000"), 9000, nil},
	})
	logger := testlog.HCLogger(t)
	hb := newFakeHeartbeater()
	script := newScriptMock(
		hb, exec, logger, time.Nanosecond, 3*time.Second)

	handle := script.run()
	defer handle.cancel() // cleanup
	deadline := time.After(3 * time.Second)

	expected := []heartbeat{
		{script.id, "output", api.HealthWarning},
		{script.id, "output", api.HealthPassing},
		{script.id, context.DeadlineExceeded.Error(), api.HealthCritical},
		{script.id, "output", api.HealthPassing},
		{script.id, "some error", api.HealthCritical},
		{script.id, "output", api.HealthPassing},
		{script.id, "error9000", api.HealthCritical},
	}

	for i := range expected {
		select {
		case update := <-hb.heartbeats:
			require.Equal(t, update, expected[i],
				"expected update %d to be '%s' but received '%s'",
				i, expected[i], update)
		case <-deadline:
			t.Fatalf("timed out waiting for all script checks to finish")
		}
	}
}

// TestScript_TaskEnvInterpolation asserts that script check hooks are
// interpolated in the same way that services are.
func TestScript_TaskEnvInterpolation(t *testing.T) {
	logger := testlog.HCLogger(t)
	consulClient := consul.NewMockConsulServiceClient(t, logger)
	exec, cancel := newBlockingScriptExec()
	defer cancel()

	alloc := mock.ConnectAlloc()
	task := alloc.Job.TaskGroups[0].Tasks[0]

	task.Services[0].Name = "${NOMAD_JOB_NAME}-${TASK}-${SVC_NAME}"
	task.Services[0].Checks[0].Name = "${NOMAD_JOB_NAME}-${SVC_NAME}-check"
	alloc.Job.Canonicalize() // need to re-canonicalize b/c the mock already did it

	env := taskenv.NewBuilder(mock.Node(), alloc, task, "global").SetHookEnv(
		"script_check",
		map[string]string{"SVC_NAME": "frontend"}).Build()

	svcHook := newServiceHook(serviceHookConfig{
		alloc:  alloc,
		task:   task,
		consul: consulClient,
		logger: logger,
	})
	// emulate prestart having been fired
	svcHook.taskEnv = env

	scHook := newScriptCheckHook(scriptCheckHookConfig{
		alloc:        alloc,
		task:         task,
		consul:       consulClient,
		logger:       logger,
		shutdownWait: time.Hour, // heartbeater will never be called
	})
	// emulate prestart having been fired
	scHook.taskEnv = env
	scHook.driverExec = exec

	expectedSvc := svcHook.getWorkloadServices().Services[0]
	expected := agentconsul.MakeCheckID(agentconsul.MakeAllocServiceID(
		alloc.ID, task.Name, expectedSvc), expectedSvc.Checks[0])

	actual := scHook.newScriptChecks()
	check, ok := actual[expected]
	require.True(t, ok)
	require.Equal(t, "my-job-frontend-check", check.check.Name)

	// emulate an update
	env = taskenv.NewBuilder(mock.Node(), alloc, task, "global").SetHookEnv(
		"script_check",
		map[string]string{"SVC_NAME": "backend"}).Build()
	scHook.taskEnv = env
	svcHook.taskEnv = env

	expectedSvc = svcHook.getWorkloadServices().Services[0]
	expected = agentconsul.MakeCheckID(agentconsul.MakeAllocServiceID(
		alloc.ID, task.Name, expectedSvc), expectedSvc.Checks[0])

	actual = scHook.newScriptChecks()
	check, ok = actual[expected]
	require.True(t, ok)
	require.Equal(t, "my-job-backend-check", check.check.Name)
}
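
// TestScript_associated exercises the associated() helper, which decides
// whether a script check belongs to a task. Per the cases below, the
// check-level task field takes precedence over the service-level task
// field when both are set.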
func TestScript_associated(t *testing.T) {
	t.Run("neither set", func(t *testing.T) {
		require.False(t, new(scriptCheckHook).associated("task1", "", ""))
	})

	t.Run("service set", func(t *testing.T) {
		require.True(t, new(scriptCheckHook).associated("task1", "task1", ""))
		require.False(t, new(scriptCheckHook).associated("task1", "task2", ""))
	})

	t.Run("check set", func(t *testing.T) {
		require.True(t, new(scriptCheckHook).associated("task1", "", "task1"))
		require.False(t, new(scriptCheckHook).associated("task1", "", "task2"))
	})

	t.Run("both set", func(t *testing.T) {
		// ensure check.task takes precedence over service.task
		require.True(t, new(scriptCheckHook).associated("task1", "task1", "task1"))
		require.False(t, new(scriptCheckHook).associated("task1", "task1", "task2"))
		require.True(t, new(scriptCheckHook).associated("task1", "task2", "task1"))
		require.False(t, new(scriptCheckHook).associated("task1", "task2", "task2"))
	})
}