open-nomad/nomad/plan_apply.go

package nomad

import (
	"fmt"
	"time"

	"github.com/armon/go-metrics"
	"github.com/hashicorp/go-multierror"
	"github.com/hashicorp/nomad/nomad/state"
	"github.com/hashicorp/nomad/nomad/structs"
	"github.com/hashicorp/raft"
)

// planApply is a long lived goroutine that reads plan allocations from
// the plan queue, determines if they can be applied safely and applies
// them via Raft.
//
// Naively, we could simply dequeue a plan, verify, apply and then respond.
// However, the plan application is bounded by the Raft apply time and
// subject to some latency. This creates a stall condition, where we are
// not evaluating, but simply waiting for a transaction to apply.
//
// To avoid this, we overlap verification with apply. This means once
// we've verified plan N we attempt to apply it. However, while waiting
// for apply, we begin to verify plan N+1 under the assumption that plan
// N has succeeded.
//
// In this sense, we track two parallel versions of the world. One is
// the pessimistic one driven by the Raft log which is replicated. The
// other is optimistic and assumes our transactions will succeed. In the
// happy path, this lets us do productive work during the latency of
// apply.
//
// In the unhappy path (Raft transaction fails), effectively we only
// wasted work during a time we would have been waiting anyways. However,
// in anticipation of this case we cannot respond to the plan until
// the Raft log is updated. This means our schedulers will stall,
// but there are many of those and only a single plan verifier.
//
func (s *Server) planApply() {
	// waitCh is used to track an outstanding application while snap
	// holds an optimistic state which includes that plan application.
	// waitCh is nil when no apply is being tracked; it is closed by
	// asyncPlanWait once the tracked Raft future has resolved.
	var waitCh chan struct{}
	var snap *state.StateSnapshot
	// The evaluation pool is created once for the lifetime of this goroutine
	// and shut down when the loop exits.
	pool := NewEvaluatePool(workerPoolSize, workerPoolBufferSize)
	defer pool.Shutdown()

	for {
		// Pull the next pending plan, exit if we are no longer leader
		// NOTE(review): the 0 argument is presumably "no timeout" — confirm
		// against the plan queue implementation.
		pending, err := s.planQueue.Dequeue(0)
		if err != nil {
			return
		}

		// Verify the evaluation is outstanding, and that the tokens match.
		// A mismatch is reported back to the submitter and the plan is dropped.
		if err := s.evalBroker.OutstandingReset(pending.plan.EvalID, pending.plan.EvalToken); err != nil {
			s.logger.Printf("[ERR] nomad: plan rejected for evaluation %s: %v",
				pending.plan.EvalID, err)
			pending.respond(nil, err)
			continue
		}

		// Check if our last plan has completed. This is a non-blocking poll:
		// a receive on a nil waitCh never proceeds, so the default branch is
		// taken when nothing is outstanding. Once the previous apply is done
		// the optimistic snapshot is discarded so a fresh one is taken below.
		select {
		case <-waitCh:
			waitCh = nil
			snap = nil
		default:
		}

		// Snapshot the state so that we have a consistent view of the world
		// if no snapshot is available. While an apply is still in flight the
		// existing optimistic snapshot is reused instead.
		if waitCh == nil || snap == nil {
			snap, err = s.fsm.State().Snapshot()
			if err != nil {
				s.logger.Printf("[ERR] nomad: failed to snapshot state: %v", err)
				pending.respond(nil, err)
				continue
			}
		}

		// Evaluate the plan against the (possibly optimistic) snapshot
		result, err := evaluatePlan(pool, snap, pending.plan)
		if err != nil {
			s.logger.Printf("[ERR] nomad: failed to evaluate plan: %v", err)
			pending.respond(nil, err)
			continue
		}

		// Fast-path the response if there is nothing to do; no Raft
		// transaction is needed so the submitter is answered immediately.
		if result.IsNoOp() {
			pending.respond(result, nil)
			continue
		}

		// Ensure any parallel apply is complete before starting the next one.
		// This also limits how out of date our snapshot can be.
		// The snapshot is retaken after the wait so that the optimistic apply
		// below is layered on the state as it stands once that apply is done.
		// waitCh is left closed (not nil) on the error paths below; the poll
		// at the top of the next iteration observes the close and resets it.
		if waitCh != nil {
			<-waitCh
			snap, err = s.fsm.State().Snapshot()
			if err != nil {
				s.logger.Printf("[ERR] nomad: failed to snapshot state: %v", err)
				pending.respond(nil, err)
				continue
			}
		}

		// Dispatch the Raft transaction for the plan. applyPlan also writes
		// the allocations into snap so the next plan is verified as if this
		// one had already succeeded.
		future, err := s.applyPlan(result, snap)
		if err != nil {
			s.logger.Printf("[ERR] nomad: failed to submit plan: %v", err)
			pending.respond(nil, err)
			continue
		}

		// Respond to the plan in async. The new waitCh is closed by
		// asyncPlanWait when the future resolves, which is how later
		// iterations learn that this apply has finished.
		waitCh = make(chan struct{})
		go s.asyncPlanWait(waitCh, future, result, pending)
	}
}

// applyPlan submits the allocations carried by a plan result to Raft and
// returns the future tracking that submission. When snap is non-nil the same
// allocations are also written into it, so that subsequent plans can be
// verified against a view that assumes this plan succeeds.
//
// A nil future is returned only when dispatching to Raft fails.
// NOTE(review): if the optimistic write to snap fails, the error is returned
// together with a live future, i.e. after the Raft request was already
// dispatched. planApply in this file treats any error as a failed submission.
func (s *Server) applyPlan(result *structs.PlanResult, snap *state.StateSnapshot) (raft.ApplyFuture, error) {
	// Flatten the result into one list: per-node updates first, then
	// per-node allocations, then the failed allocations.
	var allocs []*structs.Allocation
	for _, updates := range result.NodeUpdate {
		allocs = append(allocs, updates...)
	}
	for _, placed := range result.NodeAllocation {
		allocs = append(allocs, placed...)
	}
	allocs = append(allocs, result.FailedAllocs...)

	// Stamp allocations that have never been applied before. The creation
	// time can be used to approximate the scheduling time.
	createTime := time.Now().UTC().UnixNano()
	for i := range allocs {
		if a := allocs[i]; a.CreateTime == 0 {
			a.CreateTime = createTime
		}
	}

	// Hand the request off to Raft.
	req := structs.AllocUpdateRequest{Alloc: allocs}
	future, err := s.raftApplyFuture(structs.AllocUpdateRequestType, &req)
	if err != nil {
		return nil, err
	}

	// Without a snapshot there is no optimistic view to maintain.
	if snap == nil {
		return future, nil
	}

	// Mirror the write into the optimistic view, using the index right after
	// the one Raft reports as most recently applied.
	if err := snap.UpsertAllocs(s.raft.AppliedIndex()+1, allocs); err != nil {
		return future, err
	}
	return future, nil
}

// asyncPlanWait blocks until the Raft future for a dispatched plan resolves
// and then answers the pending plan: with the result (stamped with the index
// reported by the future) on success, or with the apply error on failure.
// waitCh is closed on every exit path so that planApply can observe that the
// apply has finished. The elapsed time is recorded under nomad.plan.apply.
func (s *Server) asyncPlanWait(waitCh chan struct{}, future raft.ApplyFuture,
	result *structs.PlanResult, pending *pendingPlan) {
	start := time.Now()
	defer metrics.MeasureSince([]string{"nomad", "plan", "apply"}, start)
	defer close(waitCh)

	// Block until Raft reports the outcome of the apply.
	applyErr := future.Error()
	if applyErr == nil {
		// Success: record where the allocations landed and respond.
		result.AllocIndex = future.Index()
		pending.respond(result, nil)
		return
	}

	// Failure: surface the error to the submitter.
	s.logger.Printf("[ERR] nomad: failed to apply plan: %v", applyErr)
	pending.respond(nil, applyErr)
}

// evaluatePlan is used to determine what portions of a plan
// can be applied if any. Returns if there should be a plan application
// which may be partial or if there was an error.
//
// Every node referenced by the plan (through NodeUpdate or NodeAllocation) is
// submitted to the evaluation pool. Nodes whose portion of the plan fits are
// copied into the result; nodes that do not fit are left out and the result's
// RefreshIndex is set. If the plan is AllAtOnce, a single node that does not
// fit empties the result. Any evaluation error aborts processing and is
// returned (aggregated) alongside the partially built result.
func evaluatePlan(pool *EvaluatePool, snap *state.StateSnapshot, plan *structs.Plan) (*structs.PlanResult, error) {
	defer metrics.MeasureSince([]string{"nomad", "plan", "evaluate"}, time.Now())

	// Create a result holder for the plan
	result := &structs.PlanResult{
		NodeUpdate:     make(map[string][]*structs.Allocation),
		NodeAllocation: make(map[string][]*structs.Allocation),
		FailedAllocs:   plan.FailedAllocs,
	}

	// Collect all the nodeIDs, de-duplicating nodes that appear in both maps
	nodeIDs := make(map[string]struct{})
	for nodeID := range plan.NodeUpdate {
		nodeIDs[nodeID] = struct{}{}
	}
	for nodeID := range plan.NodeAllocation {
		nodeIDs[nodeID] = struct{}{}
	}

	// Flatten the set into a list of nodes still waiting to be submitted.
	// A node is only removed from this list once its request has actually
	// been handed to the pool.
	pendingIDs := make([]string, 0, len(nodeIDs))
	for nodeID := range nodeIDs {
		pendingIDs = append(pendingIDs, nodeID)
	}

	// Setup a multierror to handle potentially getting many
	// errors since we are processing in parallel.
	var mErr multierror.Error

	// handleResult is used to process the result of evaluateNodePlan.
	// It returns true when further evaluation is pointless and the
	// remaining work should be cancelled.
	handleResult := func(nodeID string, fit bool, err error) (cancel bool) {
		// Evaluate the plan for this node
		if err != nil {
			mErr.Errors = append(mErr.Errors, err)
			return true
		}
		if !fit {
			// Scheduler must have stale data, RefreshIndex should force
			// the latest view of allocations and nodes
			allocIndex, err := snap.Index("allocs")
			if err != nil {
				mErr.Errors = append(mErr.Errors, err)
				return true
			}
			nodeIndex, err := snap.Index("nodes")
			if err != nil {
				mErr.Errors = append(mErr.Errors, err)
				return true
			}
			result.RefreshIndex = maxUint64(nodeIndex, allocIndex)

			// If we require all-at-once scheduling, there is no point
			// to continue the evaluation, as we've already failed.
			if plan.AllAtOnce {
				result.NodeUpdate = nil
				result.NodeAllocation = nil
				return true
			}

			// Skip this node, since it cannot be used.
			return false
		}

		// Add this to the plan result
		if nodeUpdate := plan.NodeUpdate[nodeID]; len(nodeUpdate) > 0 {
			result.NodeUpdate[nodeID] = nodeUpdate
		}
		if nodeAlloc := plan.NodeAllocation[nodeID]; len(nodeAlloc) > 0 {
			result.NodeAllocation[nodeID] = nodeAlloc
		}
		return false
	}

	// Get the pool channels
	req := pool.RequestCh()
	resp := pool.ResultCh()
	outstanding := 0
	didCancel := false

	// Evaluate each node in the plan, handling results as
	// they are ready to avoid blocking.
	//
	// The loop is driven by the pending list rather than by ranging over the
	// set: when a result is received instead of a request being sent, the
	// current node must stay queued, otherwise it would never be evaluated.
	// The labeled break is required because a bare break would only leave
	// the select, letting handleResult run again after a cancel (and write
	// to the result maps that an AllAtOnce failure has set to nil).
OUTER:
	for len(pendingIDs) > 0 {
		nodeID := pendingIDs[0]
		select {
		case req <- evaluateRequest{snap, plan, nodeID}:
			outstanding++
			pendingIDs = pendingIDs[1:]
		case r := <-resp:
			outstanding--

			// Handle a result that allows us to cancel evaluation,
			// which may save time processing additional entries.
			if cancel := handleResult(r.nodeID, r.fit, r.err); cancel {
				didCancel = true
				break OUTER
			}
		}
	}

	// Drain the remaining results. Every submitted request is always read
	// back; after a cancel the results are discarded rather than processed.
	for outstanding > 0 {
		r := <-resp
		if !didCancel {
			if cancel := handleResult(r.nodeID, r.fit, r.err); cancel {
				didCancel = true
			}
		}
		outstanding--
	}
	return result, mErr.ErrorOrNil()
}

// evaluateNodePlan evaluates the portion of a plan that targets a single
// node. It reports whether that portion can be applied given the state in
// snap, or an error if the state could not be read.
func evaluateNodePlan(snap *state.StateSnapshot, plan *structs.Plan, nodeID string) (bool, error) {
	// A plan that places nothing on this node only removes things, so it
	// always 'fits'.
	placements := plan.NodeAllocation[nodeID]
	if len(placements) == 0 {
		return true, nil
	}

	// Look up the node itself
	node, err := snap.NodeByID(nodeID)
	if err != nil {
		return false, fmt.Errorf("failed to get node '%s': %v", nodeID, err)
	}

	// A node that is missing, not ready for scheduling, or draining is not fit.
	// XXX: There is a potential race between when we do this check and when
	// the Raft commit happens.
	if node == nil {
		return false, nil
	}
	if node.Status != structs.NodeStatusReady || node.Drain {
		return false, nil
	}

	// Fetch the node's existing non-terminal allocations
	existing, err := snap.AllocsByNodeTerminal(nodeID, false)
	if err != nil {
		return false, fmt.Errorf("failed to get existing allocations for '%s': %v", nodeID, err)
	}

	// Build the proposed allocation set: drop everything the plan updates on
	// this node as well as any prior version of an allocation the plan
	// re-places, then add the planned allocations.
	var remove []*structs.Allocation
	remove = append(remove, plan.NodeUpdate[nodeID]...)
	remove = append(remove, placements...)

	proposed := structs.RemoveAllocs(existing, remove)
	proposed = append(proposed, placements...)

	// Check whether the proposed set fits on the node
	fits, _, _, err := structs.AllocsFit(node, proposed, nil)
	return fits, err
}
nomad: adding skeleton no-op plan evaluator 2015-07-27 22:31:09 +00:00			`package nomad`

nomad: first pass at plan eval and apply 2015-08-04 23:32:46 +00:00			`import (`
			`"fmt"`
nomad: add some profiling 2015-08-04 23:35:49 +00:00			`"time"`
nomad: first pass at plan eval and apply 2015-08-04 23:32:46 +00:00
nomad: add some profiling 2015-08-04 23:35:49 +00:00			`"github.com/armon/go-metrics"`
nomad: plan apply uses the EvaluatePool 2016-02-20 21:12:14 +00:00			`"github.com/hashicorp/go-multierror"`
nomad: move state and mocks into shared packages 2015-08-11 21:27:14 +00:00			`"github.com/hashicorp/nomad/nomad/state"`
nomad: first pass at plan eval and apply 2015-08-04 23:32:46 +00:00			`"github.com/hashicorp/nomad/nomad/structs"`
nomad: plan apply uses raw Raft future 2015-10-11 21:48:18 +00:00			`"github.com/hashicorp/raft"`
nomad: first pass at plan eval and apply 2015-08-04 23:32:46 +00:00			`)`
nomad: adding skeleton no-op plan evaluator 2015-07-27 22:31:09 +00:00
			`// planApply is a long lived goroutine that reads plan allocations from`
			`// the plan queue, determines if they can be applied safely and applies`
			`// them via Raft.`
nomad: plan apply uses raw Raft future 2015-10-11 21:48:18 +00:00			`//`
			`// Naively, we could simply dequeue a plan, verify, apply and then respond.`
			`// However, the plan application is bounded by the Raft apply time and`
			`// subject to some latency. This creates a stall condition, where we are`
nomad: comment cleanups 2015-10-12 21:35:17 +00:00			`// not evaluating, but simply waiting for a transaction to apply.`
nomad: plan apply uses raw Raft future 2015-10-11 21:48:18 +00:00			`//`
			`// To avoid this, we overlap verification with apply. This means once`
			`// we've verified plan N we attempt to apply it. However, while waiting`
			`// for apply, we begin to verify plan N+1 under the assumption that plan`
			`// N has succeeded.`
			`//`
			`// In this sense, we track two parallel versions of the world. One is`
			`// the pessimistic one driven by the Raft log which is replicated. The`
			`// other is optimistic and assumes our transactions will succeed. In the`
			`// happy path, this lets us do productive work during the latency of`
			`// apply.`
			`//`
			`// In the unhappy path (Raft transaction fails), effectively we only`
			`// wasted work during a time we would have been waiting anyways. However,`
			`// in anticipation of this case we cannot respond to the plan until`
			`// the Raft log is updated. This means our schedulers will stall,`
			`// but there are many of those and only a single plan verifier.`
			`//`
nomad: adding skeleton no-op plan evaluator 2015-07-27 22:31:09 +00:00			`func (s *Server) planApply() {`
nomad: comment cleanups 2015-10-12 21:35:17 +00:00			`// waitCh is used to track an outstanding application while snap`
			`// holds an optimistic state which includes that plan application.`
nomad: overlap plan evaluation with apply 2015-10-11 22:34:52 +00:00			`var waitCh chan struct{}`
			`var snap *state.StateSnapshot`
nomad: plan apply uses the EvaluatePool 2016-02-20 21:12:14 +00:00			`pool := NewEvaluatePool(workerPoolSize, workerPoolBufferSize)`
			`defer pool.Shutdown()`
nomad: overlap plan evaluation with apply 2015-10-11 22:34:52 +00:00
nomad: adding skeleton no-op plan evaluator 2015-07-27 22:31:09 +00:00			`for {`
			`// Pull the next pending plan, exit if we are no longer leader`
			`pending, err := s.planQueue.Dequeue(0)`
			`if err != nil {`
			`return`
			`}`

nomad: avoid split-brain in plan processing due to leader transition or eval retry 2015-08-12 22:44:36 +00:00			`// Verify the evaluation is outstanding, and that the tokens match.`
nomad: use OutstandingReset in Eval endpoints and Plan apply 2015-10-23 17:22:44 +00:00			`if err := s.evalBroker.OutstandingReset(pending.plan.EvalID, pending.plan.EvalToken); err != nil {`
			`s.logger.Printf("[ERR] nomad: plan rejected for evaluation %s: %v",`
			`pending.plan.EvalID, err)`
			`pending.respond(nil, err)`
nomad: avoid split-brain in plan processing due to leader transition or eval retry 2015-08-12 22:44:36 +00:00			`continue`
			`}`

nomad: overlap plan evaluation with apply 2015-10-11 22:34:52 +00:00			`// Check if out last plan has completed`
			`select {`
			`case <-waitCh:`
			`waitCh = nil`
			`snap = nil`
			`default:`
			`}`

nomad: testing plan evaluation 2015-08-05 01:30:05 +00:00			`// Snapshot the state so that we have a consistent view of the world`
nomad: overlap plan evaluation with apply 2015-10-11 22:34:52 +00:00			`// if no snapshot is available`
nomad: refresh snapshot under error return 2015-10-11 22:38:07 +00:00			`if waitCh == nil \|\| snap == nil {`
nomad: overlap plan evaluation with apply 2015-10-11 22:34:52 +00:00			`snap, err = s.fsm.State().Snapshot()`
			`if err != nil {`
			`s.logger.Printf("[ERR] nomad: failed to snapshot state: %v", err)`
			`pending.respond(nil, err)`
			`continue`
			`}`
nomad: testing plan evaluation 2015-08-05 01:30:05 +00:00			`}`

nomad: first pass at plan eval and apply 2015-08-04 23:32:46 +00:00			`// Evaluate the plan`
nomad: plan apply uses the EvaluatePool 2016-02-20 21:12:14 +00:00			`result, err := evaluatePlan(pool, snap, pending.plan)`
nomad: first pass at plan eval and apply 2015-08-04 23:32:46 +00:00			`if err != nil {`
			`s.logger.Printf("[ERR] nomad: failed to evaluate plan: %v", err)`
			`pending.respond(nil, err)`
			`continue`
			`}`
nomad: adding skeleton no-op plan evaluator 2015-07-27 22:31:09 +00:00
nomad: wait for plan to apply async 2015-10-11 21:57:36 +00:00			`// Fast-path the response if there is nothing to do`
			`if result.IsNoOp() {`
			`pending.respond(result, nil)`
			`continue`
			`}`

nomad: comment cleanups 2015-10-12 21:35:17 +00:00			`// Ensure any parallel apply is complete before starting the next one.`
			`// This also limits how out of date our snapshot can be.`
nomad: overlap plan evaluation with apply 2015-10-11 22:34:52 +00:00			`if waitCh != nil {`
			`<-waitCh`
			`snap, err = s.fsm.State().Snapshot()`
			`if err != nil {`
			`s.logger.Printf("[ERR] nomad: failed to snapshot state: %v", err)`
			`pending.respond(nil, err)`
			`continue`
			`}`
			`}`

nomad: wait for plan to apply async 2015-10-11 21:57:36 +00:00			`// Dispatch the Raft transaction for the plan`
nomad: optimistically apply plan to state snapshot 2015-10-11 22:19:01 +00:00			`future, err := s.applyPlan(result, snap)`
nomad: wait for plan to apply async 2015-10-11 21:57:36 +00:00			`if err != nil {`
			`s.logger.Printf("[ERR] nomad: failed to submit plan: %v", err)`
			`pending.respond(nil, err)`
			`continue`
nomad: adding skeleton no-op plan evaluator 2015-07-27 22:31:09 +00:00			`}`

nomad: wait for plan to apply async 2015-10-11 21:57:36 +00:00			`// Respond to the plan in async`
nomad: overlap plan evaluation with apply 2015-10-11 22:34:52 +00:00			`waitCh = make(chan struct{})`
nomad: wait for plan to apply async 2015-10-11 21:57:36 +00:00			`go s.asyncPlanWait(waitCh, future, result, pending)`
nomad: adding skeleton no-op plan evaluator 2015-07-27 22:31:09 +00:00			`}`
			`}`
nomad: first pass at plan eval and apply 2015-08-04 23:32:46 +00:00
nomad: testing plan evaluation 2015-08-05 01:30:05 +00:00			`// applyPlan is used to apply the plan result and to return the alloc index`
nomad: optimistically apply plan to state snapshot 2015-10-11 22:19:01 +00:00			`func (s Server) applyPlan(result structs.PlanResult, snap *state.StateSnapshot) (raft.ApplyFuture, error) {`
nomad: testing plan evaluation 2015-08-05 01:30:05 +00:00			`req := structs.AllocUpdateRequest{}`
nomad: updating for new alloc representation 2015-08-26 00:36:52 +00:00			`for _, updateList := range result.NodeUpdate {`
			`req.Alloc = append(req.Alloc, updateList...)`
nomad: testing plan evaluation 2015-08-05 01:30:05 +00:00			`}`
			`for _, allocList := range result.NodeAllocation {`
			`req.Alloc = append(req.Alloc, allocList...)`
			`}`
nomad: thread through failed allocations 2015-08-15 20:33:20 +00:00			`req.Alloc = append(req.Alloc, result.FailedAllocs...)`
nomad: testing plan evaluation 2015-08-05 01:30:05 +00:00
Store alloc creation time 2016-02-09 05:58:05 +00:00			`// Set the time the alloc was applied for the first time. This can be used`
			`// to approximate the scheduling time.`
			`now := time.Now().UTC().UnixNano()`
			`for _, alloc := range req.Alloc {`
			`if alloc.CreateTime == 0 {`
			`alloc.CreateTime = now`
			`}`
			`}`

nomad: optimistically apply plan to state snapshot 2015-10-11 22:19:01 +00:00			`// Dispatch the Raft transaction`
			`future, err := s.raftApplyFuture(structs.AllocUpdateRequestType, &req)`
			`if err != nil {`
			`return nil, err`
			`}`

			`// Optimistically apply to our state view`
			`if snap != nil {`
			`nextIdx := s.raft.AppliedIndex() + 1`
			`if err := snap.UpsertAllocs(nextIdx, req.Alloc); err != nil {`
			`return future, err`
			`}`
			`}`
			`return future, nil`
nomad: plan apply uses raw Raft future 2015-10-11 21:48:18 +00:00			`}`

nomad: wait for plan to apply async 2015-10-11 21:57:36 +00:00			`// asyncPlanWait is used to apply and respond to a plan async`
			`func (s *Server) asyncPlanWait(waitCh chan struct{}, future raft.ApplyFuture,`
			`result structs.PlanResult, pending pendingPlan) {`
nomad: plan apply uses raw Raft future 2015-10-11 21:48:18 +00:00			`defer metrics.MeasureSince([]string{"nomad", "plan", "apply"}, time.Now())`
nomad: wait for plan to apply async 2015-10-11 21:57:36 +00:00			`defer close(waitCh)`

			`// Wait for the plan to apply`
nomad: plan apply uses raw Raft future 2015-10-11 21:48:18 +00:00			`if err := future.Error(); err != nil {`
nomad: wait for plan to apply async 2015-10-11 21:57:36 +00:00			`s.logger.Printf("[ERR] nomad: failed to apply plan: %v", err)`
			`pending.respond(nil, err)`
			`return`
nomad: plan apply uses raw Raft future 2015-10-11 21:48:18 +00:00			`}`
nomad: wait for plan to apply async 2015-10-11 21:57:36 +00:00
			`// Respond to the plan`
			`result.AllocIndex = future.Index()`
			`pending.respond(result, nil)`
nomad: testing plan evaluation 2015-08-05 01:30:05 +00:00			`}`

nomad: first pass at plan eval and apply 2015-08-04 23:32:46 +00:00			`// evaluatePlan is used to determine what portions of a plan`
			`// can be applied if any. Returns if there should be a plan application`
			`// which may be partial or if there was an error`
nomad: plan apply uses the EvaluatePool 2016-02-20 21:12:14 +00:00			`func evaluatePlan(pool EvaluatePool, snap state.StateSnapshot, plan structs.Plan) (structs.PlanResult, error) {`
nomad: add some profiling 2015-08-04 23:35:49 +00:00			`defer metrics.MeasureSince([]string{"nomad", "plan", "evaluate"}, time.Now())`
nomad: test evaluation of node plan 2015-08-05 01:10:57 +00:00
nomad: first pass at plan eval and apply 2015-08-04 23:32:46 +00:00			`// Create a result holder for the plan`
			`result := &structs.PlanResult{`
nomad: updating for new alloc representation 2015-08-26 00:36:52 +00:00			`NodeUpdate: make(map[string][]*structs.Allocation),`
nomad: first pass at plan eval and apply 2015-08-04 23:32:46 +00:00			`NodeAllocation: make(map[string][]*structs.Allocation),`
nomad: thread through failed allocations 2015-08-15 20:33:20 +00:00			`FailedAllocs: plan.FailedAllocs,`
nomad: first pass at plan eval and apply 2015-08-04 23:32:46 +00:00			`}`

nomad: updating for new alloc representation 2015-08-26 00:36:52 +00:00			`// Collect all the nodeIDs`
			`nodeIDs := make(map[string]struct{})`
			`for nodeID := range plan.NodeUpdate {`
			`nodeIDs[nodeID] = struct{}{}`
			`}`
nomad: test evaluation of node plan 2015-08-05 01:10:57 +00:00			`for nodeID := range plan.NodeAllocation {`
nomad: updating for new alloc representation 2015-08-26 00:36:52 +00:00			`nodeIDs[nodeID] = struct{}{}`
			`}`

nomad: plan apply uses the EvaluatePool 2016-02-20 21:12:14 +00:00			`// Setup a multierror to handle potentially getting many`
			`// errors since we are processing in parallel.`
			`var mErr multierror.Error`

			`// handleResult is used to process the result of evaluateNodePlan`
			`handleResult := func(nodeID string, fit bool, err error) (cancel bool) {`
nomad: test evaluation of node plan 2015-08-05 01:10:57 +00:00			`// Evaluate the plan for this node`
nomad: first pass at plan eval and apply 2015-08-04 23:32:46 +00:00			`if err != nil {`
nomad: plan apply uses the EvaluatePool 2016-02-20 21:12:14 +00:00			`mErr.Errors = append(mErr.Errors, err)`
			`return true`
nomad: first pass at plan eval and apply 2015-08-04 23:32:46 +00:00			`}`
nomad: test evaluation of node plan 2015-08-05 01:10:57 +00:00			`if !fit {`
nomad: first pass at plan eval and apply 2015-08-04 23:32:46 +00:00			`// Scheduler must have stale data, RefreshIndex should force`
			`// the latest view of allocations and nodes`
nomad: unifying the state store API 2015-09-07 03:56:38 +00:00			`allocIndex, err := snap.Index("allocs")`
nomad: first pass at plan eval and apply 2015-08-04 23:32:46 +00:00			`if err != nil {`
nomad: plan apply uses the EvaluatePool 2016-02-20 21:12:14 +00:00			`mErr.Errors = append(mErr.Errors, err)`
			`return true`
nomad: first pass at plan eval and apply 2015-08-04 23:32:46 +00:00			`}`
nomad: unifying the state store API 2015-09-07 03:56:38 +00:00			`nodeIndex, err := snap.Index("nodes")`
nomad: first pass at plan eval and apply 2015-08-04 23:32:46 +00:00			`if err != nil {`
nomad: plan apply uses the EvaluatePool 2016-02-20 21:12:14 +00:00			`mErr.Errors = append(mErr.Errors, err)`
			`return true`
nomad: first pass at plan eval and apply 2015-08-04 23:32:46 +00:00			`}`
nomad: move and test max function 2015-08-05 00:13:40 +00:00			`result.RefreshIndex = maxUint64(nodeIndex, allocIndex)`
nomad: first pass at plan eval and apply 2015-08-04 23:32:46 +00:00
			`// If we require all-at-once scheduling, there is no point`
			`// to continue the evaluation, as we've already failed.`
			`if plan.AllAtOnce {`
nomad: updating for new alloc representation 2015-08-26 00:36:52 +00:00			`result.NodeUpdate = nil`
nomad: testing plan evaluation 2015-08-05 01:30:05 +00:00			`result.NodeAllocation = nil`
nomad: plan apply uses the EvaluatePool 2016-02-20 21:12:14 +00:00			`return true`
nomad: first pass at plan eval and apply 2015-08-04 23:32:46 +00:00			`}`

			`// Skip this node, since it cannot be used.`
nomad: plan apply uses the EvaluatePool 2016-02-20 21:12:14 +00:00			`return`
nomad: first pass at plan eval and apply 2015-08-04 23:32:46 +00:00			`}`

			`// Add this to the plan result`
nomad: updating for new alloc representation 2015-08-26 00:36:52 +00:00			`if nodeUpdate := plan.NodeUpdate[nodeID]; len(nodeUpdate) > 0 {`
			`result.NodeUpdate[nodeID] = nodeUpdate`
nomad: planner can fast-path evict-only plans 2015-08-07 16:37:45 +00:00			`}`
			`if nodeAlloc := plan.NodeAllocation[nodeID]; len(nodeAlloc) > 0 {`
			`result.NodeAllocation[nodeID] = nodeAlloc`
			`}`
nomad: plan apply uses the EvaluatePool 2016-02-20 21:12:14 +00:00			`return`
			`}`

			`// Get the pool channels`
			`req := pool.RequestCh()`
			`resp := pool.ResultCh()`
			`outstanding := 0`
			`didCancel := false`

			`// Evalute each node in the plan, handling results as`
			`// they are ready to avoid blocking.`
			`for nodeID := range nodeIDs {`
			`select {`
			`case req <- evaluateRequest{snap, plan, nodeID}:`
			`outstanding++`
			`case r := <-resp:`
			`outstanding--`
nomad: extra comment 2016-02-20 21:41:49 +00:00
			`// Handle a result that allows us to cancel evaluation,`
			`// which may save time processing additional entries.`
nomad: plan apply uses the EvaluatePool 2016-02-20 21:12:14 +00:00			`if cancel := handleResult(r.nodeID, r.fit, r.err); cancel {`
			`didCancel = true`
			`break`
			`}`
			`}`
			`}`

			`// Drain the remaining results`
			`for outstanding > 0 {`
			`r := <-resp`
			`if !didCancel {`
			`if cancel := handleResult(r.nodeID, r.fit, r.err); cancel {`
			`didCancel = true`
			`}`
			`}`
			`outstanding--`
nomad: first pass at plan eval and apply 2015-08-04 23:32:46 +00:00			`}`
nomad: plan apply uses the EvaluatePool 2016-02-20 21:12:14 +00:00			`return result, mErr.ErrorOrNil()`
nomad: first pass at plan eval and apply 2015-08-04 23:32:46 +00:00			`}`

nomad: test evaluation of node plan 2015-08-05 01:10:57 +00:00			`// evaluateNodePlan is used to evalute the plan for a single node,`
			`// returning if the plan is valid or if an error is encountered`
nomad: move state and mocks into shared packages 2015-08-11 21:27:14 +00:00			`func evaluateNodePlan(snap state.StateSnapshot, plan structs.Plan, nodeID string) (bool, error) {`
nomad: planner can fast-path evict-only plans 2015-08-07 16:37:45 +00:00			`// If this is an evict-only plan, it always 'fits' since we are removing things.`
			`if len(plan.NodeAllocation[nodeID]) == 0 {`
			`return true, nil`
			`}`

nomad: test evaluation of node plan 2015-08-05 01:10:57 +00:00			`// Get the node itself`
nomad: unifying the state store API 2015-09-07 03:56:38 +00:00			`node, err := snap.NodeByID(nodeID)`
nomad: test evaluation of node plan 2015-08-05 01:10:57 +00:00			`if err != nil {`
Fix vet warnings 2015-10-07 10:18:19 +00:00			`return false, fmt.Errorf("failed to get node '%s': %v", nodeID, err)`
nomad: test evaluation of node plan 2015-08-05 01:10:57 +00:00			`}`

			`// If the node does not exist or is not ready for schduling it is not fit`
nomad: document some potential races 2015-08-16 01:03:05 +00:00			`// XXX: There is a potential race between when we do this check and when`
			`// the Raft commit happens.`
nomad: adding drain as node property 2015-09-07 02:47:02 +00:00			`if node == nil \|\| node.Status != structs.NodeStatusReady \|\| node.Drain {`
nomad: test evaluation of node plan 2015-08-05 01:10:57 +00:00			`return false, nil`
			`}`

nomad: Use AllocsByNodeTerminal in plan apply 2016-02-20 19:26:38 +00:00			`// Get the existing allocations that are non-terminal`
			`existingAlloc, err := snap.AllocsByNodeTerminal(nodeID, false)`
nomad: test evaluation of node plan 2015-08-05 01:10:57 +00:00			`if err != nil {`
Fix vet warnings 2015-10-07 10:18:19 +00:00			`return false, fmt.Errorf("failed to get existing allocations for '%s': %v", nodeID, err)`
nomad: test evaluation of node plan 2015-08-05 01:10:57 +00:00			`}`

			`// Determine the proposed allocation by first removing allocations`
			`// that are planned evictions and adding the new allocations.`
			`proposed := existingAlloc`
nomad: updating for new alloc representation 2015-08-26 00:36:52 +00:00			`var remove []*structs.Allocation`
			`if update := plan.NodeUpdate[nodeID]; len(update) > 0 {`
			`remove = append(remove, update...)`
nomad: test evaluation of node plan 2015-08-05 01:10:57 +00:00			`}`
nomad: plan apply handles update of existing allocation 2015-08-23 02:37:21 +00:00			`if updated := plan.NodeAllocation[nodeID]; len(updated) > 0 {`
			`for _, alloc := range updated {`
nomad: updating for new alloc representation 2015-08-26 00:36:52 +00:00			`remove = append(remove, alloc)`
nomad: plan apply handles update of existing allocation 2015-08-23 02:37:21 +00:00			`}`
			`}`
			`proposed = structs.RemoveAllocs(existingAlloc, remove)`
nomad: test evaluation of node plan 2015-08-05 01:10:57 +00:00			`proposed = append(proposed, plan.NodeAllocation[nodeID]...)`

			`// Check if these allocations fit`
nomad: fixing unit tests 2015-09-14 01:46:40 +00:00			`fit, _, _, err := structs.AllocsFit(node, proposed, nil)`
scheduler: working on bin pack 2015-08-13 18:54:59 +00:00			`return fit, err`
nomad: test evaluation of node plan 2015-08-05 01:10:57 +00:00			`}`