open-nomad/command/monitor.go

package command

import (
	"fmt"
	"sync"
	"time"

	"github.com/hashicorp/nomad/api"
	"github.com/hashicorp/nomad/nomad/structs"
	"github.com/mitchellh/cli"
)

const (
	// dateFmt is the format we use when printing the date in
	// status update messages during monitoring.
	dateFmt = "2006/01/02 15:04:05"
)

// monitor wraps an evaluation monitor and holds metadata and
// state information.
type monitor struct {
	ui     cli.Ui
	client *api.Client
	state  *monitorState

	sync.Mutex
}

// newMonitor returns a new monitor. The returned monitor will
// write output information to the provided ui.
func newMonitor(ui cli.Ui, client *api.Client) *monitor {
	return &monitor{
		ui:     ui,
		client: client,
		state: &monitorState{
			allocs: make(map[string]*allocState),
		},
	}
}

// output is used to write informational messages to the ui.
func (m *monitor) output(msg string) {
	m.ui.Output(fmt.Sprintf("    %s %s", time.Now().Format(dateFmt), msg))
}

// monitorState is used to store the current "state of the world"
// in the context of monitoring an evaluation.
type monitorState struct {
	status string
	nodeID string
	allocs map[string]*allocState
	wait   time.Duration
}

// allocState is used to track the state of an allocation
type allocState struct {
	group   string
	node    string
	desired string
	client  string
}

// update is used to update our monitor with new state. It can be
// called whether the passed information is new or not, and will
// only dump update messages when state changes.
func (m *monitor) update(eval *api.Evaluation, allocs []*api.AllocationListStub) {
	m.Lock()
	defer m.Unlock()

	existing := m.state

	// Create the new state
	update := &monitorState{
		status: eval.Status,
		nodeID: eval.NodeID,
		allocs: make(map[string]*allocState),
		wait:   eval.Wait,
	}
	for _, alloc := range allocs {
		update.allocs[alloc.ID] = &allocState{
			group:   alloc.TaskGroup,
			node:    alloc.NodeID,
			desired: alloc.DesiredStatus,
			client:  alloc.ClientStatus,
		}
	}
	defer func() { m.state = update }()

	// Check the allocations
	for allocID, alloc := range update.allocs {
		if _, ok := existing.allocs[allocID]; !ok {
			// Check if this is a failure indication allocation
			if alloc.desired == structs.AllocDesiredStatusFailed {
				m.output("Scheduling failed")
			} else {
				m.output(fmt.Sprintf("Allocated task group %q on node %q",
					alloc.group, alloc.node))
			}
		}
	}

	// Check if the status changed
	if existing.status != update.status {
		m.output(fmt.Sprintf("Evaluation changed status from %q to %q",
			existing.status, eval.Status))
	}

	// Check if the wait time is different
	if existing.wait == 0 && update.wait != 0 {
		m.output(fmt.Sprintf("Waiting %s before running eval",
			eval.Wait))
	}

	// Check if the nodeID changed
	if existing.nodeID == "" && update.nodeID != "" {
		m.output(fmt.Sprintf("Evaluation was assigned node ID %q",
			eval.NodeID))
	}
}

// monitor is used to start monitoring the given evaluation ID. It
// writes output directly to the monitor's ui, and returns the
// exit code for the command. The return code is 0 if monitoring
// succeeded and exited successfully, or 1 if an error was encountered
// or the eval status was returned as failed.
func (m *monitor) monitor(evalID string) int {
	m.ui.Info(fmt.Sprintf("Monitoring evaluation %q", evalID))
	for {
		// Check the current state of things
		eval, _, err := m.client.Evaluations().Info(evalID, nil)
		if err != nil {
			m.ui.Error(fmt.Sprintf("Error reading evaluation: %s", err))
			return 1
		}

		allocs, _, err := m.client.Evaluations().Allocations(evalID, nil)
		if err != nil {
			m.ui.Error(fmt.Sprintf("Error reading allocations: %s", err))
			return 1
		}

		// Update the state
		m.update(eval, allocs)

		switch eval.Status {
		case structs.EvalStatusComplete, structs.EvalStatusFailed:
			m.ui.Info(fmt.Sprintf("Evaluation %q finished with status %q",
				eval.ID, eval.Status))
		default:
			// Wait for the next update
			time.Sleep(time.Second)
			continue
		}

		// Monitor the next eval, if it exists.
		if eval.NextEval != "" {
			return m.monitor(eval.NextEval)
		}

		// Check if the eval is complete
		switch eval.Status {
		case structs.EvalStatusComplete:
			return 0
		case structs.EvalStatusFailed:
			return 1
		}
	}

	return 0
}
command: start implementing eval monitoring for run 2015-09-16 20:58:33 +00:00			`package command`

			`import (`
			`"fmt"`
			`"sync"`
			`"time"`

			`"github.com/hashicorp/nomad/api"`
			`"github.com/hashicorp/nomad/nomad/structs"`
			`"github.com/mitchellh/cli"`
			`)`

			`const (`
			`// dateFmt is the format we use when printing the date in`
			`// status update messages during monitoring.`
			`dateFmt = "2006/01/02 15:04:05"`
			`)`

			`// monitor wraps an evaluation monitor and holds metadata and`
			`// state information.`
			`type monitor struct {`
			`ui cli.Ui`
			`client *api.Client`
			`state *monitorState`

			`sync.Mutex`
			`}`

			`// newMonitor returns a new monitor. The returned monitor will`
			`// write output information to the provided ui.`
			`func newMonitor(ui cli.Ui, client api.Client) monitor {`
			`return &monitor{`
			`ui: ui,`
			`client: client,`
command: working on monitor 2015-09-16 21:45:21 +00:00			`state: &monitorState{`
			`allocs: make(map[string]*allocState),`
			`},`
command: start implementing eval monitoring for run 2015-09-16 20:58:33 +00:00			`}`
			`}`

			`// output is used to write informational messages to the ui.`
			`func (m *monitor) output(msg string) {`
command: working on monitor 2015-09-16 21:45:21 +00:00			`m.ui.Output(fmt.Sprintf(" %s %s", time.Now().Format(dateFmt), msg))`
command: start implementing eval monitoring for run 2015-09-16 20:58:33 +00:00			`}`

			`// monitorState is used to store the current "state of the world"`
			`// in the context of monitoring an evaluation.`
			`type monitorState struct {`
			`status string`
			`nodeID string`
command: working on monitor 2015-09-16 21:45:21 +00:00			`allocs map[string]*allocState`
command: start implementing eval monitoring for run 2015-09-16 20:58:33 +00:00			`wait time.Duration`
			`}`

command: working on monitor 2015-09-16 21:45:21 +00:00			`// allocState is used to track the state of an allocation`
			`type allocState struct {`
			`group string`
			`node string`
			`desired string`
			`client string`
			`}`

command: start implementing eval monitoring for run 2015-09-16 20:58:33 +00:00			`// update is used to update our monitor with new state. It can be`
			`// called whether the passed information is new or not, and will`
			`// only dump update messages when state changes.`
command: working on monitor 2015-09-16 21:45:21 +00:00			`func (m monitor) update(eval api.Evaluation, allocs []*api.AllocationListStub) {`
command: start implementing eval monitoring for run 2015-09-16 20:58:33 +00:00			`m.Lock()`
			`defer m.Unlock()`

			`existing := m.state`

			`// Create the new state`
			`update := &monitorState{`
			`status: eval.Status,`
			`nodeID: eval.NodeID,`
command: working on monitor 2015-09-16 21:45:21 +00:00			`allocs: make(map[string]*allocState),`
command: start implementing eval monitoring for run 2015-09-16 20:58:33 +00:00			`wait: eval.Wait,`
			`}`
command: working on monitor 2015-09-16 21:45:21 +00:00			`for _, alloc := range allocs {`
			`update.allocs[alloc.ID] = &allocState{`
			`group: alloc.TaskGroup,`
			`node: alloc.NodeID,`
			`desired: alloc.DesiredStatus,`
			`client: alloc.ClientStatus,`
			`}`
			`}`
command: start implementing eval monitoring for run 2015-09-16 20:58:33 +00:00			`defer func() { m.state = update }()`

command: working on monitor 2015-09-16 21:45:21 +00:00			`// Check the allocations`
			`for allocID, alloc := range update.allocs {`
			`if _, ok := existing.allocs[allocID]; !ok {`
			`// Check if this is a failure indication allocation`
			`if alloc.desired == structs.AllocDesiredStatusFailed {`
			`m.output("Scheduling failed")`
			`} else {`
			`m.output(fmt.Sprintf("Allocated task group %q on node %q",`
			`alloc.group, alloc.node))`
			`}`
			`}`
			`}`

command: start implementing eval monitoring for run 2015-09-16 20:58:33 +00:00			`// Check if the status changed`
			`if existing.status != update.status {`
			`m.output(fmt.Sprintf("Evaluation changed status from %q to %q",`
			`existing.status, eval.Status))`
			`}`

			`// Check if the wait time is different`
			`if existing.wait == 0 && update.wait != 0 {`
			`m.output(fmt.Sprintf("Waiting %s before running eval",`
			`eval.Wait))`
			`}`

			`// Check if the nodeID changed`
			`if existing.nodeID == "" && update.nodeID != "" {`
			`m.output(fmt.Sprintf("Evaluation was assigned node ID %q",`
			`eval.NodeID))`
			`}`
			`}`

			`// monitor is used to start monitoring the given evaluation ID. It`
			`// writes output directly to the monitor's ui, and returns the`
			`// exit code for the command. The return code is 0 if monitoring`
			`// succeeded and exited successfully, or 1 if an error was encountered`
			`// or the eval status was returned as failed.`
			`func (m *monitor) monitor(evalID string) int {`
command: working on monitor 2015-09-16 21:45:21 +00:00			`m.ui.Info(fmt.Sprintf("Monitoring evaluation %q", evalID))`
command: start implementing eval monitoring for run 2015-09-16 20:58:33 +00:00			`for {`
			`// Check the current state of things`
			`eval, _, err := m.client.Evaluations().Info(evalID, nil)`
			`if err != nil {`
			`m.ui.Error(fmt.Sprintf("Error reading evaluation: %s", err))`
			`return 1`
			`}`

command: working on monitor 2015-09-16 21:45:21 +00:00			`allocs, _, err := m.client.Evaluations().Allocations(evalID, nil)`
			`if err != nil {`
			`m.ui.Error(fmt.Sprintf("Error reading allocations: %s", err))`
			`return 1`
			`}`

command: start implementing eval monitoring for run 2015-09-16 20:58:33 +00:00			`// Update the state`
command: working on monitor 2015-09-16 21:45:21 +00:00			`m.update(eval, allocs)`

			`switch eval.Status {`
			`case structs.EvalStatusComplete, structs.EvalStatusFailed:`
			`m.ui.Info(fmt.Sprintf("Evaluation %q finished with status %q",`
			`eval.ID, eval.Status))`
			`default:`
			`// Wait for the next update`
			`time.Sleep(time.Second)`
			`continue`
			`}`

			`// Monitor the next eval, if it exists.`
			`if eval.NextEval != "" {`
			`return m.monitor(eval.NextEval)`
			`}`
command: start implementing eval monitoring for run 2015-09-16 20:58:33 +00:00
			`// Check if the eval is complete`
			`switch eval.Status {`
			`case structs.EvalStatusComplete:`
			`return 0`
			`case structs.EvalStatusFailed:`
			`return 1`
			`}`
			`}`

			`return 0`
			`}`