2018-01-11 19:24:57 +00:00
|
|
|
package client
|
|
|
|
|
|
|
|
import (
|
2018-01-11 21:23:57 +00:00
|
|
|
"io"
|
2018-01-11 19:24:57 +00:00
|
|
|
"net"
|
|
|
|
"net/rpc"
|
|
|
|
"strings"
|
2018-01-09 23:26:53 +00:00
|
|
|
"time"
|
2018-01-11 19:24:57 +00:00
|
|
|
|
2018-01-11 21:23:57 +00:00
|
|
|
metrics "github.com/armon/go-metrics"
|
2018-01-09 23:26:53 +00:00
|
|
|
"github.com/hashicorp/consul/lib"
|
2018-01-11 19:24:57 +00:00
|
|
|
"github.com/hashicorp/nomad/helper/codec"
|
2018-01-12 21:58:44 +00:00
|
|
|
"github.com/hashicorp/nomad/helper/pool"
|
2018-01-09 23:26:53 +00:00
|
|
|
"github.com/hashicorp/nomad/nomad"
|
|
|
|
"github.com/hashicorp/nomad/nomad/structs"
|
2018-01-11 21:23:57 +00:00
|
|
|
"github.com/hashicorp/yamux"
|
2018-01-11 19:24:57 +00:00
|
|
|
)
|
|
|
|
|
|
|
|
// rpcEndpoints holds the RPC endpoints
|
|
|
|
type rpcEndpoints struct {
|
|
|
|
ClientStats *ClientStats
|
|
|
|
}
|
|
|
|
|
|
|
|
// ClientRPC is used to make a local, client only RPC call
|
|
|
|
func (c *Client) ClientRPC(method string, args interface{}, reply interface{}) error {
|
|
|
|
codec := &codec.InmemCodec{
|
|
|
|
Method: method,
|
|
|
|
Args: args,
|
|
|
|
Reply: reply,
|
|
|
|
}
|
|
|
|
if err := c.rpcServer.ServeRequest(codec); err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
return codec.Err
|
|
|
|
}
|
|
|
|
|
|
|
|
// RPC is used to forward an RPC call to a nomad server, or fail if no servers.
|
|
|
|
func (c *Client) RPC(method string, args interface{}, reply interface{}) error {
|
|
|
|
// Invoke the RPCHandler if it exists
|
|
|
|
if c.config.RPCHandler != nil {
|
|
|
|
return c.config.RPCHandler.RPC(method, args, reply)
|
|
|
|
}
|
|
|
|
|
2018-01-09 23:26:53 +00:00
|
|
|
// This is subtle but we start measuring the time on the client side
|
|
|
|
// right at the time of the first request, vs. on the first retry as
|
|
|
|
// is done on the server side inside forward(). This is because the
|
|
|
|
// servers may already be applying the RPCHoldTimeout up there, so by
|
|
|
|
// starting the timer here we won't potentially double up the delay.
|
|
|
|
firstCheck := time.Now()
|
|
|
|
|
|
|
|
TRY:
|
|
|
|
server := c.servers.FindServer()
|
|
|
|
if server == nil {
|
2018-01-11 19:24:57 +00:00
|
|
|
return noServersErr
|
|
|
|
}
|
|
|
|
|
2018-01-09 23:26:53 +00:00
|
|
|
// Make the request.
|
|
|
|
rpcErr := c.connPool.RPC(c.Region(), server.Addr, c.RPCMajorVersion(), method, args, reply)
|
|
|
|
if rpcErr == nil {
|
2018-01-11 19:24:57 +00:00
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2018-01-09 23:26:53 +00:00
|
|
|
// Move off to another server, and see if we can retry.
|
|
|
|
c.logger.Printf("[ERR] nomad: %q RPC failed to server %s: %v", method, server.Addr, rpcErr)
|
|
|
|
c.servers.NotifyFailedServer(server)
|
|
|
|
if retry := canRetry(args, rpcErr); !retry {
|
|
|
|
return rpcErr
|
|
|
|
}
|
|
|
|
|
|
|
|
// We can wait a bit and retry!
|
|
|
|
// TODO(alexdadgar): Plumb through the RPCHoldTimeout config
|
|
|
|
//if time.Since(firstCheck) < c.config.RPCHoldTimeout {
|
|
|
|
if time.Since(firstCheck) < 5*time.Second {
|
|
|
|
jitter := lib.RandomStagger(5 * time.Second / nomad.JitterFraction)
|
|
|
|
select {
|
|
|
|
case <-time.After(jitter):
|
|
|
|
goto TRY
|
|
|
|
case <-c.shutdownCh:
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return rpcErr
|
|
|
|
}
|
|
|
|
|
|
|
|
// canRetry returns true if the given situation is safe for a retry.
|
|
|
|
func canRetry(args interface{}, err error) bool {
|
|
|
|
// No leader errors are always safe to retry since no state could have
|
|
|
|
// been changed.
|
|
|
|
if structs.IsErrNoLeader(err) {
|
|
|
|
return true
|
|
|
|
}
|
|
|
|
|
|
|
|
// Reads are safe to retry for stream errors, such as if a server was
|
|
|
|
// being shut down.
|
|
|
|
info, ok := args.(structs.RPCInfo)
|
|
|
|
if ok && info.IsRead() && lib.IsErrEOF(err) {
|
|
|
|
return true
|
|
|
|
}
|
|
|
|
|
|
|
|
return false
|
2018-01-11 19:24:57 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
// setupClientRpc is used to setup the Client's RPC endpoints
|
|
|
|
func (c *Client) setupClientRpc() {
|
|
|
|
// Initialize the RPC handlers
|
|
|
|
c.endpoints.ClientStats = &ClientStats{c}
|
|
|
|
|
|
|
|
// Create the RPC Server
|
|
|
|
c.rpcServer = rpc.NewServer()
|
|
|
|
|
|
|
|
// Register the endpoints with the RPC server
|
|
|
|
c.setupClientRpcServer(c.rpcServer)
|
2018-01-11 21:23:57 +00:00
|
|
|
|
|
|
|
go c.rpcConnListener()
|
|
|
|
}
|
|
|
|
|
|
|
|
// rpcConnListener is a long lived function that listens for new connections
|
|
|
|
// being made on the connection pool and starts an RPC listener for each
|
|
|
|
// connection.
|
|
|
|
func (c *Client) rpcConnListener() {
|
|
|
|
// Make a channel for new connections.
|
|
|
|
conns := make(chan *yamux.Session, 4)
|
|
|
|
c.connPool.SetConnListener(conns)
|
|
|
|
|
|
|
|
for {
|
|
|
|
select {
|
|
|
|
case <-c.shutdownCh:
|
|
|
|
return
|
|
|
|
case session, ok := <-conns:
|
|
|
|
if !ok {
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
|
|
|
|
go c.listenConn(session)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// listenConn is used to listen for connections being made from the server on
|
|
|
|
// pre-existing connection. This should be called in a goroutine.
|
|
|
|
func (c *Client) listenConn(s *yamux.Session) {
|
|
|
|
for {
|
|
|
|
conn, err := s.Accept()
|
|
|
|
if err != nil {
|
|
|
|
if s.IsClosed() {
|
|
|
|
return
|
|
|
|
}
|
|
|
|
|
|
|
|
c.logger.Printf("[ERR] client.rpc: failed to accept RPC conn: %v", err)
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
|
|
|
|
go c.handleConn(conn)
|
|
|
|
metrics.IncrCounter([]string{"client", "rpc", "accept_conn"}, 1)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// handleConn is used to handle an individual connection.
|
|
|
|
func (c *Client) handleConn(conn net.Conn) {
|
|
|
|
defer conn.Close()
|
2018-01-12 21:58:44 +00:00
|
|
|
rpcCodec := pool.NewServerCodec(conn)
|
2018-01-11 21:23:57 +00:00
|
|
|
for {
|
|
|
|
select {
|
|
|
|
case <-c.shutdownCh:
|
|
|
|
return
|
|
|
|
default:
|
|
|
|
}
|
|
|
|
|
|
|
|
if err := c.rpcServer.ServeRequest(rpcCodec); err != nil {
|
|
|
|
if err != io.EOF && !strings.Contains(err.Error(), "closed") {
|
|
|
|
c.logger.Printf("[ERR] client.rpc: RPC error: %v (%v)", err, conn)
|
|
|
|
metrics.IncrCounter([]string{"client", "rpc", "request_error"}, 1)
|
|
|
|
}
|
|
|
|
return
|
|
|
|
}
|
|
|
|
metrics.IncrCounter([]string{"client", "rpc", "request"}, 1)
|
|
|
|
}
|
2018-01-11 19:24:57 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
// setupClientRpcServer is used to populate a client RPC server with endpoints.
|
|
|
|
func (c *Client) setupClientRpcServer(server *rpc.Server) {
|
|
|
|
// Register the endpoints
|
|
|
|
server.Register(c.endpoints.ClientStats)
|
|
|
|
}
|
|
|
|
|
|
|
|
// resolveServer given a sever's address as a string, return it's resolved
|
|
|
|
// net.Addr or an error.
|
|
|
|
func resolveServer(s string) (net.Addr, error) {
|
|
|
|
const defaultClientPort = "4647" // default client RPC port
|
|
|
|
host, port, err := net.SplitHostPort(s)
|
|
|
|
if err != nil {
|
|
|
|
if strings.Contains(err.Error(), "missing port") {
|
|
|
|
host = s
|
|
|
|
port = defaultClientPort
|
|
|
|
} else {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return net.ResolveTCPAddr("tcp", net.JoinHostPort(host, port))
|
|
|
|
}
|
2018-01-09 23:26:53 +00:00
|
|
|
|
|
|
|
// Ping is used to ping a particular server and returns whether it is healthy or
|
|
|
|
// a potential error.
|
|
|
|
func (c *Client) Ping(srv net.Addr) (bool, error) {
|
|
|
|
var reply struct{}
|
|
|
|
err := c.connPool.RPC(c.Region(), srv, c.RPCMajorVersion(), "Status.Ping", struct{}{}, &reply)
|
|
|
|
return err == nil, err
|
|
|
|
}
|