2015-08-16 20:54:49 +00:00
|
|
|
package agent
|
|
|
|
|
2015-08-16 23:40:04 +00:00
|
|
|
import (
|
2015-08-24 00:40:27 +00:00
|
|
|
"fmt"
|
2015-08-16 23:40:04 +00:00
|
|
|
"io"
|
|
|
|
"log"
|
2015-08-31 01:10:23 +00:00
|
|
|
"net"
|
2016-10-17 17:48:04 +00:00
|
|
|
"os"
|
2015-08-31 01:10:23 +00:00
|
|
|
"path/filepath"
|
2016-03-10 07:25:31 +00:00
|
|
|
"runtime"
|
2016-05-11 22:24:37 +00:00
|
|
|
"strconv"
|
2016-06-15 00:13:15 +00:00
|
|
|
"strings"
|
2015-08-16 23:40:04 +00:00
|
|
|
"sync"
|
2016-11-09 00:21:52 +00:00
|
|
|
"sync/atomic"
|
2015-10-29 13:47:06 +00:00
|
|
|
"time"
|
2015-08-16 21:34:38 +00:00
|
|
|
|
2015-08-23 23:53:15 +00:00
|
|
|
"github.com/hashicorp/nomad/client"
|
2016-02-12 21:21:56 +00:00
|
|
|
clientconfig "github.com/hashicorp/nomad/client/config"
|
2016-06-08 06:02:37 +00:00
|
|
|
"github.com/hashicorp/nomad/command/agent/consul"
|
2015-08-16 23:40:04 +00:00
|
|
|
"github.com/hashicorp/nomad/nomad"
|
2015-08-31 01:10:23 +00:00
|
|
|
"github.com/hashicorp/nomad/nomad/structs"
|
2015-08-16 23:40:04 +00:00
|
|
|
)
|
|
|
|
|
2016-06-17 00:34:25 +00:00
|
|
|
// Intervals and timeouts of the health checks that the agent attaches to the
// client and server services it hands to the Consul syncer.
const (
	// HTTP check on the client service.
	clientHttpCheckInterval time.Duration = 10 * time.Second
	clientHttpCheckTimeout  time.Duration = 3 * time.Second

	// HTTP check on the server service.
	serverHttpCheckInterval time.Duration = 10 * time.Second
	serverHttpCheckTimeout  time.Duration = 6 * time.Second

	// TCP check on the server RPC address.
	serverRpcCheckInterval time.Duration = 10 * time.Second
	serverRpcCheckTimeout  time.Duration = 3 * time.Second

	// TCP check on the server Serf address.
	serverSerfCheckInterval time.Duration = 10 * time.Second
	serverSerfCheckTimeout  time.Duration = 3 * time.Second
)
|
|
|
|
|
2015-08-16 23:40:04 +00:00
|
|
|
// Agent is a long running daemon that is used to run both
|
|
|
|
// clients and servers. Servers are responsible for managing
|
|
|
|
// state and making scheduling decisions. Clients can be
|
|
|
|
// scheduled to, and are responsible for interfacing with
|
|
|
|
// servers to run allocations.
|
2015-08-16 20:54:49 +00:00
|
|
|
type Agent struct {
|
2015-08-16 23:40:04 +00:00
|
|
|
config *Config
|
|
|
|
logger *log.Logger
|
|
|
|
logOutput io.Writer
|
|
|
|
|
2016-05-23 18:09:31 +00:00
|
|
|
// consulSyncer registers the Nomad agent with the Consul Agent
|
|
|
|
consulSyncer *consul.Syncer
|
|
|
|
|
2016-11-04 22:24:28 +00:00
|
|
|
client *client.Client
|
2016-05-11 22:24:37 +00:00
|
|
|
|
2016-11-04 22:24:28 +00:00
|
|
|
server *nomad.Server
|
2015-08-16 23:40:04 +00:00
|
|
|
|
|
|
|
shutdown bool
|
2016-05-27 10:47:49 +00:00
|
|
|
shutdownCh chan struct{}
|
2015-08-16 23:40:04 +00:00
|
|
|
shutdownLock sync.Mutex
|
2015-08-16 20:54:49 +00:00
|
|
|
}
|
|
|
|
|
2015-08-16 23:40:04 +00:00
|
|
|
// NewAgent is used to create a new agent with the given configuration
|
2015-08-16 21:34:38 +00:00
|
|
|
func NewAgent(config *Config, logOutput io.Writer) (*Agent, error) {
|
2015-08-16 23:40:04 +00:00
|
|
|
a := &Agent{
|
|
|
|
config: config,
|
2016-06-22 22:20:56 +00:00
|
|
|
logger: log.New(logOutput, "", log.LstdFlags|log.Lmicroseconds),
|
2015-08-16 23:40:04 +00:00
|
|
|
logOutput: logOutput,
|
2016-06-17 06:15:41 +00:00
|
|
|
shutdownCh: make(chan struct{}),
|
2015-08-16 23:40:04 +00:00
|
|
|
}
|
2015-08-24 00:40:27 +00:00
|
|
|
|
2016-06-17 06:15:41 +00:00
|
|
|
if err := a.setupConsulSyncer(); err != nil {
|
2016-06-08 06:31:19 +00:00
|
|
|
return nil, fmt.Errorf("Failed to initialize Consul syncer task: %v", err)
|
2016-05-23 18:09:31 +00:00
|
|
|
}
|
2015-08-24 00:40:27 +00:00
|
|
|
if err := a.setupServer(); err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
if err := a.setupClient(); err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
if a.client == nil && a.server == nil {
|
|
|
|
return nil, fmt.Errorf("must have at least client or server mode enabled")
|
|
|
|
}
|
2016-06-08 06:31:19 +00:00
|
|
|
|
2016-06-13 05:30:52 +00:00
|
|
|
// The Nomad Agent runs the consul.Syncer regardless of whether or not the
|
|
|
|
// Agent is running in Client or Server mode (or both), and regardless of
|
2016-06-14 19:11:38 +00:00
|
|
|
// the consul.auto_advertise parameter. The Client and Server both reuse the
|
2016-06-13 05:30:52 +00:00
|
|
|
// same consul.Syncer instance. This Syncer task periodically executes
|
|
|
|
// callbacks that update Consul. The reason the Syncer is always running is
|
|
|
|
// because one of the callbacks is attempts to self-bootstrap Nomad using
|
|
|
|
// information found in Consul.
|
2016-05-24 04:45:13 +00:00
|
|
|
go a.consulSyncer.Run()
|
2016-05-22 15:24:54 +00:00
|
|
|
|
2015-08-16 21:34:38 +00:00
|
|
|
return a, nil
|
|
|
|
}
|
|
|
|
|
2017-02-01 22:20:14 +00:00
|
|
|
// convertServerConfig takes an agent config and log output and returns a Nomad
|
|
|
|
// Config.
|
|
|
|
func convertServerConfig(agentConfig *Config, logOutput io.Writer) (*nomad.Config, error) {
|
|
|
|
conf := agentConfig.NomadConfig
|
2015-09-06 01:41:00 +00:00
|
|
|
if conf == nil {
|
|
|
|
conf = nomad.DefaultConfig()
|
|
|
|
}
|
2017-02-01 22:20:14 +00:00
|
|
|
conf.LogOutput = logOutput
|
|
|
|
conf.DevMode = agentConfig.DevMode
|
|
|
|
conf.Build = fmt.Sprintf("%s%s", agentConfig.Version, agentConfig.VersionPrerelease)
|
|
|
|
if agentConfig.Region != "" {
|
|
|
|
conf.Region = agentConfig.Region
|
2015-08-31 01:14:40 +00:00
|
|
|
}
|
2017-02-01 22:20:14 +00:00
|
|
|
if agentConfig.Datacenter != "" {
|
|
|
|
conf.Datacenter = agentConfig.Datacenter
|
2015-08-31 01:14:40 +00:00
|
|
|
}
|
2017-02-01 22:20:14 +00:00
|
|
|
if agentConfig.NodeName != "" {
|
|
|
|
conf.NodeName = agentConfig.NodeName
|
2015-08-31 01:14:40 +00:00
|
|
|
}
|
2017-02-01 22:20:14 +00:00
|
|
|
if agentConfig.Server.BootstrapExpect > 0 {
|
|
|
|
if agentConfig.Server.BootstrapExpect == 1 {
|
2015-09-22 21:25:43 +00:00
|
|
|
conf.Bootstrap = true
|
|
|
|
} else {
|
2017-02-01 22:20:14 +00:00
|
|
|
atomic.StoreInt32(&conf.BootstrapExpect, int32(agentConfig.Server.BootstrapExpect))
|
2015-09-22 21:25:43 +00:00
|
|
|
}
|
2015-08-31 01:10:23 +00:00
|
|
|
}
|
2017-02-01 22:20:14 +00:00
|
|
|
if agentConfig.DataDir != "" {
|
|
|
|
conf.DataDir = filepath.Join(agentConfig.DataDir, "server")
|
2015-08-31 01:10:23 +00:00
|
|
|
}
|
2017-02-01 22:20:14 +00:00
|
|
|
if agentConfig.Server.DataDir != "" {
|
|
|
|
conf.DataDir = agentConfig.Server.DataDir
|
2015-08-31 01:10:23 +00:00
|
|
|
}
|
2017-02-01 22:20:14 +00:00
|
|
|
if agentConfig.Server.ProtocolVersion != 0 {
|
|
|
|
conf.ProtocolVersion = uint8(agentConfig.Server.ProtocolVersion)
|
2015-08-31 01:10:23 +00:00
|
|
|
}
|
2017-02-01 22:20:14 +00:00
|
|
|
if agentConfig.Server.NumSchedulers != 0 {
|
|
|
|
conf.NumSchedulers = agentConfig.Server.NumSchedulers
|
2015-08-31 01:10:23 +00:00
|
|
|
}
|
2017-02-01 22:20:14 +00:00
|
|
|
if len(agentConfig.Server.EnabledSchedulers) != 0 {
|
|
|
|
conf.EnabledSchedulers = agentConfig.Server.EnabledSchedulers
|
2015-08-31 01:10:23 +00:00
|
|
|
}
|
2015-09-11 01:37:42 +00:00
|
|
|
|
|
|
|
// Set up the bind addresses
|
2017-02-01 22:20:14 +00:00
|
|
|
rpcAddr, err := net.ResolveTCPAddr("tcp", agentConfig.normalizedAddrs.RPC)
|
2016-09-02 23:23:45 +00:00
|
|
|
if err != nil {
|
2017-02-01 22:20:14 +00:00
|
|
|
return nil, fmt.Errorf("Failed to parse RPC address %q: %v", agentConfig.normalizedAddrs.RPC, err)
|
2016-05-27 08:35:10 +00:00
|
|
|
}
|
2017-02-01 22:20:14 +00:00
|
|
|
serfAddr, err := net.ResolveTCPAddr("tcp", agentConfig.normalizedAddrs.Serf)
|
2016-05-27 08:35:10 +00:00
|
|
|
if err != nil {
|
2017-02-01 22:20:14 +00:00
|
|
|
return nil, fmt.Errorf("Failed to parse Serf address %q: %v", agentConfig.normalizedAddrs.Serf, err)
|
2016-05-27 08:35:10 +00:00
|
|
|
}
|
2016-09-02 23:23:45 +00:00
|
|
|
conf.RPCAddr.Port = rpcAddr.Port
|
|
|
|
conf.RPCAddr.IP = rpcAddr.IP
|
|
|
|
conf.SerfConfig.MemberlistConfig.BindPort = serfAddr.Port
|
|
|
|
conf.SerfConfig.MemberlistConfig.BindAddr = serfAddr.IP.String()
|
2016-05-27 08:35:10 +00:00
|
|
|
|
2016-09-02 23:23:45 +00:00
|
|
|
// Set up the advertise addresses
|
2017-02-01 22:20:14 +00:00
|
|
|
rpcAddr, err = net.ResolveTCPAddr("tcp", agentConfig.AdvertiseAddrs.RPC)
|
2016-05-27 07:42:31 +00:00
|
|
|
if err != nil {
|
2017-02-01 22:20:14 +00:00
|
|
|
return nil, fmt.Errorf("Failed to parse RPC advertise address %q: %v", agentConfig.AdvertiseAddrs.RPC, err)
|
2016-05-27 07:42:31 +00:00
|
|
|
}
|
2017-02-01 22:20:14 +00:00
|
|
|
serfAddr, err = net.ResolveTCPAddr("tcp", agentConfig.AdvertiseAddrs.Serf)
|
2016-09-02 23:23:45 +00:00
|
|
|
if err != nil {
|
2017-02-01 22:20:14 +00:00
|
|
|
return nil, fmt.Errorf("Failed to parse Serf advertise address %q: %v", agentConfig.AdvertiseAddrs.Serf, err)
|
2016-06-01 08:08:15 +00:00
|
|
|
}
|
2016-09-10 17:53:53 +00:00
|
|
|
conf.RPCAdvertise = rpcAddr
|
|
|
|
conf.SerfConfig.MemberlistConfig.AdvertiseAddr = serfAddr.IP.String()
|
|
|
|
conf.SerfConfig.MemberlistConfig.AdvertisePort = serfAddr.Port
|
2016-06-01 08:08:15 +00:00
|
|
|
|
2016-09-02 23:23:45 +00:00
|
|
|
// Set up gc threshold and heartbeat grace period
|
2017-02-01 22:20:14 +00:00
|
|
|
if gcThreshold := agentConfig.Server.NodeGCThreshold; gcThreshold != "" {
|
2015-10-29 13:47:06 +00:00
|
|
|
dur, err := time.ParseDuration(gcThreshold)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
conf.NodeGCThreshold = dur
|
|
|
|
}
|
2017-02-27 19:58:10 +00:00
|
|
|
if gcThreshold := agentConfig.Server.JobGCThreshold; gcThreshold != "" {
|
|
|
|
dur, err := time.ParseDuration(gcThreshold)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
conf.JobGCThreshold = dur
|
|
|
|
}
|
|
|
|
if gcThreshold := agentConfig.Server.EvalGCThreshold; gcThreshold != "" {
|
|
|
|
dur, err := time.ParseDuration(gcThreshold)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
conf.EvalGCThreshold = dur
|
|
|
|
}
|
2015-10-29 13:47:06 +00:00
|
|
|
|
2017-02-01 22:20:14 +00:00
|
|
|
if heartbeatGrace := agentConfig.Server.HeartbeatGrace; heartbeatGrace != "" {
|
2016-03-04 23:44:12 +00:00
|
|
|
dur, err := time.ParseDuration(heartbeatGrace)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
conf.HeartbeatGrace = dur
|
|
|
|
}
|
|
|
|
|
2017-02-01 22:20:14 +00:00
|
|
|
if *agentConfig.Consul.AutoAdvertise && agentConfig.Consul.ServerServiceName == "" {
|
2016-06-14 19:11:38 +00:00
|
|
|
return nil, fmt.Errorf("server_service_name must be set when auto_advertise is enabled")
|
|
|
|
}
|
|
|
|
|
2016-08-09 21:35:40 +00:00
|
|
|
// Add the Consul and Vault configs
|
2017-02-01 22:20:14 +00:00
|
|
|
conf.ConsulConfig = agentConfig.Consul
|
|
|
|
conf.VaultConfig = agentConfig.Vault
|
2016-06-14 19:11:38 +00:00
|
|
|
|
2016-10-25 22:57:38 +00:00
|
|
|
// Set the TLS config
|
2017-02-01 22:20:14 +00:00
|
|
|
conf.TLSConfig = agentConfig.TLSConfig
|
2016-10-24 05:22:00 +00:00
|
|
|
|
2015-09-11 19:02:22 +00:00
|
|
|
return conf, nil
|
|
|
|
}
|
|
|
|
|
2017-02-01 22:20:14 +00:00
|
|
|
// serverConfig is used to generate a new server configuration struct
|
|
|
|
// for initializing a nomad server.
|
|
|
|
func (a *Agent) serverConfig() (*nomad.Config, error) {
|
|
|
|
return convertServerConfig(a.config, a.logOutput)
|
|
|
|
}
|
|
|
|
|
2016-02-16 21:42:48 +00:00
|
|
|
// clientConfig is used to generate a new client configuration struct
|
2016-05-22 15:24:54 +00:00
|
|
|
// for initializing a Nomad client.
|
2016-02-16 21:42:48 +00:00
|
|
|
func (a *Agent) clientConfig() (*clientconfig.Config, error) {
|
2015-08-24 00:40:27 +00:00
|
|
|
// Setup the configuration
|
2015-09-06 01:41:00 +00:00
|
|
|
conf := a.config.ClientConfig
|
|
|
|
if conf == nil {
|
2016-05-31 18:58:02 +00:00
|
|
|
conf = clientconfig.DefaultConfig()
|
2015-09-06 01:41:00 +00:00
|
|
|
}
|
2015-08-24 00:40:27 +00:00
|
|
|
if a.server != nil {
|
|
|
|
conf.RPCHandler = a.server
|
|
|
|
}
|
|
|
|
conf.LogOutput = a.logOutput
|
2017-01-09 19:21:51 +00:00
|
|
|
conf.LogLevel = a.config.LogLevel
|
2015-08-24 00:40:27 +00:00
|
|
|
conf.DevMode = a.config.DevMode
|
2015-08-31 01:14:40 +00:00
|
|
|
if a.config.Region != "" {
|
|
|
|
conf.Region = a.config.Region
|
|
|
|
}
|
|
|
|
if a.config.DataDir != "" {
|
|
|
|
conf.StateDir = filepath.Join(a.config.DataDir, "client")
|
|
|
|
conf.AllocDir = filepath.Join(a.config.DataDir, "alloc")
|
|
|
|
}
|
|
|
|
if a.config.Client.StateDir != "" {
|
|
|
|
conf.StateDir = a.config.Client.StateDir
|
|
|
|
}
|
|
|
|
if a.config.Client.AllocDir != "" {
|
|
|
|
conf.AllocDir = a.config.Client.AllocDir
|
|
|
|
}
|
2015-08-31 01:10:23 +00:00
|
|
|
conf.Servers = a.config.Client.Servers
|
2015-10-02 07:29:18 +00:00
|
|
|
if a.config.Client.NetworkInterface != "" {
|
|
|
|
conf.NetworkInterface = a.config.Client.NetworkInterface
|
2015-10-01 15:31:47 +00:00
|
|
|
}
|
2016-08-02 02:58:32 +00:00
|
|
|
conf.ChrootEnv = a.config.Client.ChrootEnv
|
2015-09-28 23:45:32 +00:00
|
|
|
conf.Options = a.config.Client.Options
|
2016-06-15 00:13:15 +00:00
|
|
|
// Logging deprecation messages about consul related configuration in client
|
|
|
|
// options
|
|
|
|
var invalidConsulKeys []string
|
|
|
|
for key := range conf.Options {
|
|
|
|
if strings.HasPrefix(key, "consul") {
|
|
|
|
invalidConsulKeys = append(invalidConsulKeys, fmt.Sprintf("options.%s", key))
|
|
|
|
}
|
|
|
|
}
|
|
|
|
if len(invalidConsulKeys) > 0 {
|
|
|
|
a.logger.Printf("[WARN] agent: Invalid keys: %v", strings.Join(invalidConsulKeys, ","))
|
2016-11-01 12:53:13 +00:00
|
|
|
a.logger.Printf(`Nomad client ignores consul related configuration in client options.
|
|
|
|
Please refer to the guide https://www.nomadproject.io/docs/agent/configuration/consul.html
|
2016-06-15 00:13:15 +00:00
|
|
|
to configure Nomad to work with Consul.`)
|
|
|
|
}
|
|
|
|
|
2015-10-03 00:32:11 +00:00
|
|
|
if a.config.Client.NetworkSpeed != 0 {
|
|
|
|
conf.NetworkSpeed = a.config.Client.NetworkSpeed
|
|
|
|
}
|
2017-03-14 19:56:31 +00:00
|
|
|
if a.config.Client.CpuCompute != 0 {
|
|
|
|
conf.CpuCompute = a.config.Client.CpuCompute
|
|
|
|
}
|
2015-12-23 00:10:30 +00:00
|
|
|
if a.config.Client.MaxKillTimeout != "" {
|
|
|
|
dur, err := time.ParseDuration(a.config.Client.MaxKillTimeout)
|
|
|
|
if err != nil {
|
2016-11-15 23:28:21 +00:00
|
|
|
return nil, fmt.Errorf("Error parsing max kill timeout: %s", err)
|
2015-12-23 00:10:30 +00:00
|
|
|
}
|
|
|
|
conf.MaxKillTimeout = dur
|
|
|
|
}
|
2016-03-09 20:25:30 +00:00
|
|
|
conf.ClientMaxPort = uint(a.config.Client.ClientMaxPort)
|
|
|
|
conf.ClientMinPort = uint(a.config.Client.ClientMinPort)
|
2015-08-31 01:10:23 +00:00
|
|
|
|
|
|
|
// Setup the node
|
|
|
|
conf.Node = new(structs.Node)
|
|
|
|
conf.Node.Datacenter = a.config.Datacenter
|
|
|
|
conf.Node.Name = a.config.NodeName
|
|
|
|
conf.Node.Meta = a.config.Client.Meta
|
|
|
|
conf.Node.NodeClass = a.config.Client.NodeClass
|
2016-03-19 07:54:19 +00:00
|
|
|
|
2016-09-02 23:23:45 +00:00
|
|
|
// Set up the HTTP advertise address
|
2016-11-09 19:37:41 +00:00
|
|
|
conf.Node.HTTPAddr = a.config.AdvertiseAddrs.HTTP
|
2016-03-14 02:05:41 +00:00
|
|
|
|
|
|
|
// Reserve resources on the node.
|
|
|
|
r := conf.Node.Reserved
|
|
|
|
if r == nil {
|
|
|
|
r = new(structs.Resources)
|
|
|
|
conf.Node.Reserved = r
|
|
|
|
}
|
|
|
|
r.CPU = a.config.Client.Reserved.CPU
|
|
|
|
r.MemoryMB = a.config.Client.Reserved.MemoryMB
|
|
|
|
r.DiskMB = a.config.Client.Reserved.DiskMB
|
|
|
|
r.IOPS = a.config.Client.Reserved.IOPS
|
|
|
|
conf.GloballyReservedPorts = a.config.Client.Reserved.ParsedReservedPorts
|
|
|
|
|
2016-03-23 00:12:30 +00:00
|
|
|
conf.Version = fmt.Sprintf("%s%s", a.config.Version, a.config.VersionPrerelease)
|
|
|
|
conf.Revision = a.config.Revision
|
2016-03-19 07:54:19 +00:00
|
|
|
|
2017-01-18 23:55:14 +00:00
|
|
|
if *a.config.Consul.AutoAdvertise && a.config.Consul.ClientServiceName == "" {
|
2016-06-14 19:11:38 +00:00
|
|
|
return nil, fmt.Errorf("client_service_name must be set when auto_advertise is enabled")
|
|
|
|
}
|
|
|
|
|
2016-05-27 10:49:29 +00:00
|
|
|
conf.ConsulConfig = a.config.Consul
|
2016-08-09 22:00:50 +00:00
|
|
|
conf.VaultConfig = a.config.Vault
|
2016-06-16 20:30:29 +00:00
|
|
|
conf.StatsCollectionInterval = a.config.Telemetry.collectionInterval
|
2016-08-02 02:49:01 +00:00
|
|
|
conf.PublishNodeMetrics = a.config.Telemetry.PublishNodeMetrics
|
|
|
|
conf.PublishAllocationMetrics = a.config.Telemetry.PublishAllocationMetrics
|
2016-10-24 05:22:00 +00:00
|
|
|
|
|
|
|
// Set the TLS related configs
|
2016-10-25 22:57:38 +00:00
|
|
|
conf.TLSConfig = a.config.TLSConfig
|
2016-10-26 18:13:53 +00:00
|
|
|
conf.Node.TLSEnabled = conf.TLSConfig.EnableHTTP
|
2016-10-24 05:22:00 +00:00
|
|
|
|
2017-01-31 23:32:20 +00:00
|
|
|
// Set the GC related configs
|
|
|
|
conf.GCInterval = a.config.Client.GCInterval
|
2017-03-11 00:27:00 +00:00
|
|
|
conf.GCParallelDestroys = a.config.Client.GCParallelDestroys
|
2017-01-31 23:32:20 +00:00
|
|
|
conf.GCDiskUsageThreshold = a.config.Client.GCDiskUsageThreshold
|
|
|
|
conf.GCInodeUsageThreshold = a.config.Client.GCInodeUsageThreshold
|
2017-02-27 21:42:37 +00:00
|
|
|
conf.NoHostUUID = a.config.Client.NoHostUUID
|
2017-01-31 23:32:20 +00:00
|
|
|
|
2016-02-16 21:42:48 +00:00
|
|
|
return conf, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
// setupServer is used to setup the server if enabled
|
|
|
|
func (a *Agent) setupServer() error {
|
|
|
|
if !a.config.Server.Enabled {
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
|
|
|
// Setup the configuration
|
|
|
|
conf, err := a.serverConfig()
|
|
|
|
if err != nil {
|
|
|
|
return fmt.Errorf("server config setup failed: %s", err)
|
|
|
|
}
|
|
|
|
|
2016-10-17 17:48:04 +00:00
|
|
|
// Sets up the keyring for gossip encryption
|
|
|
|
if err := a.setupKeyrings(conf); err != nil {
|
|
|
|
return fmt.Errorf("failed to configure keyring: %v", err)
|
|
|
|
}
|
|
|
|
|
2016-02-16 21:42:48 +00:00
|
|
|
// Create the server
|
2016-06-17 06:29:23 +00:00
|
|
|
server, err := nomad.NewServer(conf, a.consulSyncer, a.logger)
|
2016-02-16 21:42:48 +00:00
|
|
|
if err != nil {
|
|
|
|
return fmt.Errorf("server setup failed: %v", err)
|
|
|
|
}
|
|
|
|
a.server = server
|
2016-06-10 01:12:02 +00:00
|
|
|
|
2016-11-04 22:24:28 +00:00
|
|
|
// Consul check addresses default to bind but can be toggled to use advertise
|
2016-11-09 19:37:41 +00:00
|
|
|
httpCheckAddr := a.config.normalizedAddrs.HTTP
|
|
|
|
rpcCheckAddr := a.config.normalizedAddrs.RPC
|
|
|
|
serfCheckAddr := a.config.normalizedAddrs.Serf
|
2017-01-18 23:55:14 +00:00
|
|
|
if *a.config.Consul.ChecksUseAdvertise {
|
2016-11-04 22:24:28 +00:00
|
|
|
httpCheckAddr = a.config.AdvertiseAddrs.HTTP
|
|
|
|
rpcCheckAddr = a.config.AdvertiseAddrs.RPC
|
|
|
|
serfCheckAddr = a.config.AdvertiseAddrs.Serf
|
2016-09-02 23:23:45 +00:00
|
|
|
}
|
|
|
|
|
2016-06-10 01:12:02 +00:00
|
|
|
// Create the Nomad Server services for Consul
|
2016-10-26 23:30:29 +00:00
|
|
|
// TODO re-introduce HTTP/S checks when Consul 0.7.1 comes out
|
2017-01-18 23:55:14 +00:00
|
|
|
if *a.config.Consul.AutoAdvertise {
|
2016-06-13 23:29:07 +00:00
|
|
|
httpServ := &structs.Service{
|
|
|
|
Name: a.config.Consul.ServerServiceName,
|
2016-11-04 22:24:28 +00:00
|
|
|
PortLabel: a.config.AdvertiseAddrs.HTTP,
|
2016-06-13 23:29:07 +00:00
|
|
|
Tags: []string{consul.ServiceTagHTTP},
|
2016-06-17 00:34:25 +00:00
|
|
|
Checks: []*structs.ServiceCheck{
|
|
|
|
&structs.ServiceCheck{
|
2016-09-02 23:23:45 +00:00
|
|
|
Name: "Nomad Server HTTP Check",
|
2016-11-04 00:33:58 +00:00
|
|
|
Type: "http",
|
|
|
|
Path: "/v1/status/peers",
|
|
|
|
Protocol: "http",
|
2016-09-02 23:23:45 +00:00
|
|
|
Interval: serverHttpCheckInterval,
|
|
|
|
Timeout: serverHttpCheckTimeout,
|
|
|
|
PortLabel: httpCheckAddr,
|
2016-06-17 00:34:25 +00:00
|
|
|
},
|
|
|
|
},
|
2016-06-13 23:29:07 +00:00
|
|
|
}
|
|
|
|
rpcServ := &structs.Service{
|
|
|
|
Name: a.config.Consul.ServerServiceName,
|
2016-11-04 22:24:28 +00:00
|
|
|
PortLabel: a.config.AdvertiseAddrs.RPC,
|
2016-06-13 23:29:07 +00:00
|
|
|
Tags: []string{consul.ServiceTagRPC},
|
2016-06-17 00:34:25 +00:00
|
|
|
Checks: []*structs.ServiceCheck{
|
|
|
|
&structs.ServiceCheck{
|
2016-09-02 23:23:45 +00:00
|
|
|
Name: "Nomad Server RPC Check",
|
|
|
|
Type: "tcp",
|
|
|
|
Interval: serverRpcCheckInterval,
|
|
|
|
Timeout: serverRpcCheckTimeout,
|
|
|
|
PortLabel: rpcCheckAddr,
|
2016-06-17 00:34:25 +00:00
|
|
|
},
|
|
|
|
},
|
2016-06-13 23:29:07 +00:00
|
|
|
}
|
|
|
|
serfServ := &structs.Service{
|
|
|
|
Name: a.config.Consul.ServerServiceName,
|
2016-11-04 22:24:28 +00:00
|
|
|
PortLabel: a.config.AdvertiseAddrs.Serf,
|
2016-06-13 23:29:07 +00:00
|
|
|
Tags: []string{consul.ServiceTagSerf},
|
2016-06-17 00:34:25 +00:00
|
|
|
Checks: []*structs.ServiceCheck{
|
|
|
|
&structs.ServiceCheck{
|
2016-09-02 23:23:45 +00:00
|
|
|
Name: "Nomad Server Serf Check",
|
|
|
|
Type: "tcp",
|
|
|
|
Interval: serverSerfCheckInterval,
|
|
|
|
Timeout: serverSerfCheckTimeout,
|
|
|
|
PortLabel: serfCheckAddr,
|
2016-06-17 00:34:25 +00:00
|
|
|
},
|
|
|
|
},
|
2016-06-13 23:29:07 +00:00
|
|
|
}
|
2016-09-02 23:23:45 +00:00
|
|
|
|
2016-11-04 00:33:58 +00:00
|
|
|
// Add the http port check if TLS isn't enabled
|
|
|
|
// TODO Add TLS check when Consul 0.7.1 comes out.
|
|
|
|
consulServices := map[consul.ServiceKey]*structs.Service{
|
2016-06-13 23:29:07 +00:00
|
|
|
consul.GenerateServiceKey(rpcServ): rpcServ,
|
|
|
|
consul.GenerateServiceKey(serfServ): serfServ,
|
2016-11-04 00:33:58 +00:00
|
|
|
}
|
|
|
|
if !conf.TLSConfig.EnableHTTP {
|
|
|
|
consulServices[consul.GenerateServiceKey(httpServ)] = httpServ
|
|
|
|
}
|
|
|
|
a.consulSyncer.SetServices(consul.ServerDomain, consulServices)
|
2016-06-10 01:12:02 +00:00
|
|
|
}
|
|
|
|
|
2016-02-16 21:42:48 +00:00
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2016-10-17 17:48:04 +00:00
|
|
|
// setupKeyrings is used to initialize and load keyrings during agent startup
|
|
|
|
func (a *Agent) setupKeyrings(config *nomad.Config) error {
|
|
|
|
file := filepath.Join(a.config.DataDir, serfKeyring)
|
|
|
|
|
|
|
|
if a.config.Server.EncryptKey == "" {
|
|
|
|
goto LOAD
|
|
|
|
}
|
|
|
|
if _, err := os.Stat(file); err != nil {
|
|
|
|
if err := initKeyring(file, a.config.Server.EncryptKey); err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
LOAD:
|
|
|
|
if _, err := os.Stat(file); err == nil {
|
|
|
|
config.SerfConfig.KeyringFile = file
|
|
|
|
}
|
|
|
|
if err := loadKeyringFile(config.SerfConfig); err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
// Success!
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2016-02-16 21:42:48 +00:00
|
|
|
// setupClient is used to setup the client if enabled
|
|
|
|
func (a *Agent) setupClient() error {
|
|
|
|
if !a.config.Client.Enabled {
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
|
|
|
// Setup the configuration
|
|
|
|
conf, err := a.clientConfig()
|
|
|
|
if err != nil {
|
|
|
|
return fmt.Errorf("client setup failed: %v", err)
|
|
|
|
}
|
2015-08-31 01:10:23 +00:00
|
|
|
|
2016-03-10 07:25:31 +00:00
|
|
|
// Reserve some ports for the plugins if we are on Windows
|
|
|
|
if runtime.GOOS == "windows" {
|
|
|
|
if err := a.reservePortsForClient(conf); err != nil {
|
|
|
|
return err
|
|
|
|
}
|
2016-02-05 23:17:15 +00:00
|
|
|
}
|
|
|
|
|
2015-08-31 01:10:23 +00:00
|
|
|
// Create the client
|
2016-06-17 06:29:23 +00:00
|
|
|
client, err := client.NewClient(conf, a.consulSyncer, a.logger)
|
2015-08-24 00:40:27 +00:00
|
|
|
if err != nil {
|
|
|
|
return fmt.Errorf("client setup failed: %v", err)
|
|
|
|
}
|
|
|
|
a.client = client
|
2016-06-10 01:12:02 +00:00
|
|
|
|
2016-09-02 23:23:45 +00:00
|
|
|
// Resolve the http check address
|
2016-11-09 19:37:41 +00:00
|
|
|
httpCheckAddr := a.config.normalizedAddrs.HTTP
|
2017-01-18 23:55:14 +00:00
|
|
|
if *a.config.Consul.ChecksUseAdvertise {
|
2016-11-04 22:24:28 +00:00
|
|
|
httpCheckAddr = a.config.AdvertiseAddrs.HTTP
|
2016-09-02 23:23:45 +00:00
|
|
|
}
|
|
|
|
|
2016-06-14 00:32:18 +00:00
|
|
|
// Create the Nomad Client services for Consul
|
2016-10-26 23:30:29 +00:00
|
|
|
// TODO think how we can re-introduce HTTP/S checks when Consul 0.7.1 comes
|
|
|
|
// out
|
2017-01-18 23:55:14 +00:00
|
|
|
if *a.config.Consul.AutoAdvertise {
|
2016-06-13 23:29:07 +00:00
|
|
|
httpServ := &structs.Service{
|
|
|
|
Name: a.config.Consul.ClientServiceName,
|
2016-11-04 22:24:28 +00:00
|
|
|
PortLabel: a.config.AdvertiseAddrs.HTTP,
|
2016-06-13 23:29:07 +00:00
|
|
|
Tags: []string{consul.ServiceTagHTTP},
|
2016-06-17 00:34:25 +00:00
|
|
|
Checks: []*structs.ServiceCheck{
|
|
|
|
&structs.ServiceCheck{
|
2016-09-02 23:23:45 +00:00
|
|
|
Name: "Nomad Client HTTP Check",
|
2016-11-04 00:33:58 +00:00
|
|
|
Type: "http",
|
|
|
|
Path: "/v1/agent/servers",
|
|
|
|
Protocol: "http",
|
2016-09-02 23:23:45 +00:00
|
|
|
Interval: clientHttpCheckInterval,
|
|
|
|
Timeout: clientHttpCheckTimeout,
|
|
|
|
PortLabel: httpCheckAddr,
|
2016-06-17 00:34:25 +00:00
|
|
|
},
|
|
|
|
},
|
2016-06-13 23:29:07 +00:00
|
|
|
}
|
2016-11-04 00:33:58 +00:00
|
|
|
if !conf.TLSConfig.EnableHTTP {
|
|
|
|
a.consulSyncer.SetServices(consul.ClientDomain, map[consul.ServiceKey]*structs.Service{
|
|
|
|
consul.GenerateServiceKey(httpServ): httpServ,
|
|
|
|
})
|
|
|
|
}
|
2016-06-10 01:12:02 +00:00
|
|
|
}
|
|
|
|
|
2015-08-24 00:40:27 +00:00
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2016-06-01 10:08:39 +00:00
|
|
|
// reservePortsForClient reserves a range of ports for the client to use when
|
2016-02-12 22:25:32 +00:00
|
|
|
// it creates various plugins for log collection, executors, drivers, etc
|
2016-02-12 21:21:56 +00:00
|
|
|
func (a *Agent) reservePortsForClient(conf *clientconfig.Config) error {
|
2016-02-12 22:25:32 +00:00
|
|
|
// finding the device name for loopback
|
2016-02-12 21:21:56 +00:00
|
|
|
deviceName, addr, mask, err := a.findLoopbackDevice()
|
|
|
|
if err != nil {
|
|
|
|
return fmt.Errorf("error finding the device name for loopback: %v", err)
|
|
|
|
}
|
2016-02-12 22:25:32 +00:00
|
|
|
|
|
|
|
// seeing if the user has already reserved some resources on this device
|
2016-02-12 21:21:56 +00:00
|
|
|
var nr *structs.NetworkResource
|
|
|
|
if conf.Node.Reserved == nil {
|
|
|
|
conf.Node.Reserved = &structs.Resources{}
|
|
|
|
}
|
|
|
|
for _, n := range conf.Node.Reserved.Networks {
|
|
|
|
if n.Device == deviceName {
|
|
|
|
nr = n
|
|
|
|
}
|
|
|
|
}
|
2016-02-12 22:25:32 +00:00
|
|
|
// If the user hasn't already created the device, we create it
|
2016-02-12 21:21:56 +00:00
|
|
|
if nr == nil {
|
|
|
|
nr = &structs.NetworkResource{
|
|
|
|
Device: deviceName,
|
|
|
|
IP: addr,
|
|
|
|
CIDR: mask,
|
|
|
|
ReservedPorts: make([]structs.Port, 0),
|
|
|
|
}
|
|
|
|
}
|
2016-02-12 22:25:32 +00:00
|
|
|
// appending the port ranges we want to use for the client to the list of
|
|
|
|
// reserved ports for this device
|
2016-02-12 21:21:56 +00:00
|
|
|
for i := conf.ClientMinPort; i <= conf.ClientMaxPort; i++ {
|
|
|
|
nr.ReservedPorts = append(nr.ReservedPorts, structs.Port{Label: fmt.Sprintf("plugin-%d", i), Value: int(i)})
|
|
|
|
}
|
|
|
|
conf.Node.Reserved.Networks = append(conf.Node.Reserved.Networks, nr)
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2016-02-12 22:25:32 +00:00
|
|
|
// findLoopbackDevice iterates through all the interfaces on a machine and
|
|
|
|
// returns the ip addr, mask of the loopback device
|
2016-02-12 21:21:56 +00:00
|
|
|
func (a *Agent) findLoopbackDevice() (string, string, string, error) {
|
2016-02-05 23:17:15 +00:00
|
|
|
var ifcs []net.Interface
|
|
|
|
var err error
|
|
|
|
ifcs, err = net.Interfaces()
|
|
|
|
if err != nil {
|
2016-02-12 21:21:56 +00:00
|
|
|
return "", "", "", err
|
2016-02-05 23:17:15 +00:00
|
|
|
}
|
|
|
|
for _, ifc := range ifcs {
|
|
|
|
addrs, err := ifc.Addrs()
|
|
|
|
if err != nil {
|
2016-02-12 22:25:32 +00:00
|
|
|
return "", "", "", err
|
2016-02-05 23:17:15 +00:00
|
|
|
}
|
|
|
|
for _, addr := range addrs {
|
2016-02-12 21:21:56 +00:00
|
|
|
var ip net.IP
|
|
|
|
switch v := addr.(type) {
|
|
|
|
case *net.IPNet:
|
|
|
|
ip = v.IP
|
|
|
|
case *net.IPAddr:
|
|
|
|
ip = v.IP
|
|
|
|
}
|
|
|
|
if ip.IsLoopback() {
|
2016-02-12 22:25:32 +00:00
|
|
|
if ip.To4() == nil {
|
|
|
|
continue
|
|
|
|
}
|
2016-02-12 21:21:56 +00:00
|
|
|
return ifc.Name, ip.String(), addr.String(), nil
|
2016-02-05 23:17:15 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
2016-02-12 21:21:56 +00:00
|
|
|
|
2016-02-12 22:25:32 +00:00
|
|
|
return "", "", "", fmt.Errorf("no loopback devices with IPV4 addr found")
|
2016-02-05 23:17:15 +00:00
|
|
|
}
|
|
|
|
|
2015-08-16 23:40:04 +00:00
|
|
|
// Leave is used gracefully exit. Clients will inform servers
|
|
|
|
// of their departure so that allocations can be rescheduled.
|
2015-08-16 20:54:49 +00:00
|
|
|
func (a *Agent) Leave() error {
|
2015-08-23 23:53:15 +00:00
|
|
|
if a.client != nil {
|
|
|
|
if err := a.client.Leave(); err != nil {
|
|
|
|
a.logger.Printf("[ERR] agent: client leave failed: %v", err)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
if a.server != nil {
|
|
|
|
if err := a.server.Leave(); err != nil {
|
|
|
|
a.logger.Printf("[ERR] agent: server leave failed: %v", err)
|
|
|
|
}
|
|
|
|
}
|
2015-08-16 20:54:49 +00:00
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2015-08-16 23:40:04 +00:00
|
|
|
// Shutdown is used to terminate the agent.
|
2015-08-16 20:54:49 +00:00
|
|
|
func (a *Agent) Shutdown() error {
|
2015-08-16 23:40:04 +00:00
|
|
|
a.shutdownLock.Lock()
|
|
|
|
defer a.shutdownLock.Unlock()
|
|
|
|
|
|
|
|
if a.shutdown {
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
|
|
|
a.logger.Println("[INFO] agent: requesting shutdown")
|
2015-08-23 23:53:15 +00:00
|
|
|
if a.client != nil {
|
|
|
|
if err := a.client.Shutdown(); err != nil {
|
|
|
|
a.logger.Printf("[ERR] agent: client shutdown failed: %v", err)
|
|
|
|
}
|
|
|
|
}
|
2015-08-16 23:40:04 +00:00
|
|
|
if a.server != nil {
|
2015-08-23 23:53:15 +00:00
|
|
|
if err := a.server.Shutdown(); err != nil {
|
|
|
|
a.logger.Printf("[ERR] agent: server shutdown failed: %v", err)
|
|
|
|
}
|
2015-08-16 23:40:04 +00:00
|
|
|
}
|
|
|
|
|
2016-06-10 03:35:07 +00:00
|
|
|
if err := a.consulSyncer.Shutdown(); err != nil {
|
|
|
|
a.logger.Printf("[ERR] agent: shutting down consul service failed: %v", err)
|
2016-05-11 22:24:37 +00:00
|
|
|
}
|
|
|
|
|
2015-08-16 23:40:04 +00:00
|
|
|
a.logger.Println("[INFO] agent: shutdown complete")
|
|
|
|
a.shutdown = true
|
|
|
|
close(a.shutdownCh)
|
2015-08-23 23:53:15 +00:00
|
|
|
return nil
|
2015-08-16 23:40:04 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
// RPC is used to make an RPC call to the Nomad servers
|
|
|
|
func (a *Agent) RPC(method string, args interface{}, reply interface{}) error {
|
|
|
|
if a.server != nil {
|
|
|
|
return a.server.RPC(method, args, reply)
|
|
|
|
}
|
|
|
|
return a.client.RPC(method, args, reply)
|
2015-08-16 20:54:49 +00:00
|
|
|
}
|
2015-08-24 00:40:27 +00:00
|
|
|
|
|
|
|
// Client returns the configured client or nil
|
|
|
|
func (a *Agent) Client() *client.Client {
|
|
|
|
return a.client
|
|
|
|
}
|
|
|
|
|
|
|
|
// Server returns the configured server or nil
|
|
|
|
func (a *Agent) Server() *nomad.Server {
|
|
|
|
return a.server
|
|
|
|
}
|
2015-08-31 01:20:00 +00:00
|
|
|
|
|
|
|
// Stats is used to return statistics for debugging and insight
|
|
|
|
// for various sub-systems
|
|
|
|
func (a *Agent) Stats() map[string]map[string]string {
|
|
|
|
stats := make(map[string]map[string]string)
|
|
|
|
if a.server != nil {
|
|
|
|
subStat := a.server.Stats()
|
|
|
|
for k, v := range subStat {
|
|
|
|
stats[k] = v
|
|
|
|
}
|
|
|
|
}
|
|
|
|
if a.client != nil {
|
|
|
|
subStat := a.client.Stats()
|
|
|
|
for k, v := range subStat {
|
|
|
|
stats[k] = v
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return stats
|
|
|
|
}
|
2016-05-11 22:24:37 +00:00
|
|
|
|
2016-06-10 01:12:02 +00:00
|
|
|
// setupConsulSyncer creates the Consul tasks used by this Nomad Agent
|
2016-06-08 06:31:19 +00:00
|
|
|
// (either Client or Server mode).
|
2016-06-17 06:15:41 +00:00
|
|
|
func (a *Agent) setupConsulSyncer() error {
|
2016-06-08 06:31:19 +00:00
|
|
|
var err error
|
2016-06-17 06:15:41 +00:00
|
|
|
a.consulSyncer, err = consul.NewSyncer(a.config.Consul, a.shutdownCh, a.logger)
|
2016-06-08 06:31:19 +00:00
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
2016-05-11 22:24:37 +00:00
|
|
|
|
2016-05-24 04:43:09 +00:00
|
|
|
a.consulSyncer.SetAddrFinder(func(portLabel string) (string, int) {
|
2016-05-14 07:36:26 +00:00
|
|
|
host, port, err := net.SplitHostPort(portLabel)
|
2016-05-11 22:24:37 +00:00
|
|
|
if err != nil {
|
2016-06-07 14:55:35 +00:00
|
|
|
p, err := strconv.Atoi(port)
|
|
|
|
if err != nil {
|
|
|
|
return "", 0
|
|
|
|
}
|
|
|
|
return "", p
|
2016-05-11 22:24:37 +00:00
|
|
|
}
|
2016-05-15 00:08:19 +00:00
|
|
|
|
2016-06-07 14:55:35 +00:00
|
|
|
// If the addr for the service is ":port", then we fall back
|
|
|
|
// to Nomad's default address resolution protocol.
|
|
|
|
//
|
|
|
|
// TODO(sean@): This should poll Consul to figure out what
|
|
|
|
// its advertise address is and use that in order to handle
|
|
|
|
// the case where there is something funky like NAT on this
|
|
|
|
// host. For now we just use the BindAddr if set, otherwise
|
|
|
|
// we fall back to a loopback addr.
|
2016-05-15 00:08:19 +00:00
|
|
|
if host == "" {
|
2016-06-07 14:55:35 +00:00
|
|
|
if a.config.BindAddr != "" {
|
2016-06-08 06:31:19 +00:00
|
|
|
host = a.config.BindAddr
|
2016-06-07 14:55:35 +00:00
|
|
|
} else {
|
|
|
|
host = "127.0.0.1"
|
|
|
|
}
|
2016-05-15 00:08:19 +00:00
|
|
|
}
|
2016-05-11 22:24:37 +00:00
|
|
|
p, err := strconv.Atoi(port)
|
|
|
|
if err != nil {
|
2016-06-07 14:55:35 +00:00
|
|
|
return host, 0
|
2016-05-11 22:24:37 +00:00
|
|
|
}
|
|
|
|
return host, p
|
|
|
|
})
|
|
|
|
|
2016-06-10 01:12:02 +00:00
|
|
|
return nil
|
2016-05-11 22:24:37 +00:00
|
|
|
}
|