333 lines
9.1 KiB
Go
333 lines
9.1 KiB
Go
package nomad
|
|
|
|
import (
|
|
"errors"
|
|
"fmt"
|
|
"net"
|
|
"time"
|
|
|
|
"github.com/hashicorp/go-msgpack/codec"
|
|
multierror "github.com/hashicorp/go-multierror"
|
|
msgpackrpc "github.com/hashicorp/net-rpc-msgpackrpc"
|
|
"github.com/hashicorp/nomad/helper/pool"
|
|
"github.com/hashicorp/nomad/nomad/structs"
|
|
"github.com/hashicorp/yamux"
|
|
)
|
|
|
|
// nodeConnState is used to track connection information about a Nomad Client.
|
|
type nodeConnState struct {
|
|
// Session holds the multiplexed yamux Session for dialing back.
|
|
Session *yamux.Session
|
|
|
|
// Established is when the connection was established.
|
|
Established time.Time
|
|
|
|
// Ctx is the full RPC context
|
|
Ctx *RPCContext
|
|
}
|
|
|
|
// getNodeConn returns the connection to the given node and whether it exists.
|
|
func (s *Server) getNodeConn(nodeID string) (*nodeConnState, bool) {
|
|
s.nodeConnsLock.RLock()
|
|
defer s.nodeConnsLock.RUnlock()
|
|
conns, ok := s.nodeConns[nodeID]
|
|
if !ok {
|
|
return nil, false
|
|
}
|
|
|
|
// Return the latest conn
|
|
var state *nodeConnState
|
|
for _, conn := range conns {
|
|
if state == nil || state.Established.Before(conn.Established) {
|
|
state = conn
|
|
}
|
|
}
|
|
|
|
// Shouldn't happen but rather be safe
|
|
if state == nil {
|
|
s.logger.Named("client_rpc").Warn("node exists in node connection map without any connection", "node_id", nodeID)
|
|
return nil, false
|
|
}
|
|
|
|
return state, ok
|
|
}
|
|
|
|
// connectedNodes returns the set of nodes we have a connection with.
|
|
func (s *Server) connectedNodes() map[string]time.Time {
|
|
s.nodeConnsLock.RLock()
|
|
defer s.nodeConnsLock.RUnlock()
|
|
nodes := make(map[string]time.Time, len(s.nodeConns))
|
|
for nodeID, conns := range s.nodeConns {
|
|
for _, conn := range conns {
|
|
if nodes[nodeID].Before(conn.Established) {
|
|
nodes[nodeID] = conn.Established
|
|
}
|
|
}
|
|
}
|
|
return nodes
|
|
}
|
|
|
|
// addNodeConn adds the mapping between a node and its session.
|
|
func (s *Server) addNodeConn(ctx *RPCContext) {
|
|
// Hotpath the no-op
|
|
if ctx == nil || ctx.NodeID == "" {
|
|
return
|
|
}
|
|
|
|
s.nodeConnsLock.Lock()
|
|
defer s.nodeConnsLock.Unlock()
|
|
|
|
// Capture the tracked connections so far
|
|
currentConns := s.nodeConns[ctx.NodeID]
|
|
|
|
// Check if we already have the connection. If we do, just update the
|
|
// establish time.
|
|
for _, c := range currentConns {
|
|
if c.Ctx.Conn.LocalAddr().String() == ctx.Conn.LocalAddr().String() &&
|
|
c.Ctx.Conn.RemoteAddr().String() == ctx.Conn.RemoteAddr().String() {
|
|
c.Established = time.Now()
|
|
return
|
|
}
|
|
}
|
|
|
|
// Add the new conn
|
|
s.nodeConns[ctx.NodeID] = append(s.nodeConns[ctx.NodeID], &nodeConnState{
|
|
Session: ctx.Session,
|
|
Established: time.Now(),
|
|
Ctx: ctx,
|
|
})
|
|
}
|
|
|
|
// removeNodeConn removes the mapping between a node and its session.
|
|
func (s *Server) removeNodeConn(ctx *RPCContext) {
|
|
// Hotpath the no-op
|
|
if ctx == nil || ctx.NodeID == "" {
|
|
return
|
|
}
|
|
|
|
s.nodeConnsLock.Lock()
|
|
defer s.nodeConnsLock.Unlock()
|
|
conns, ok := s.nodeConns[ctx.NodeID]
|
|
if !ok {
|
|
return
|
|
}
|
|
|
|
// It is important that we check that the connection being removed is the
|
|
// actual stored connection for the client. It is possible for the client to
|
|
// dial various addresses that all route to the same server. The most common
|
|
// case for this is the original address the client uses to connect to the
|
|
// server differs from the advertised address sent by the heartbeat.
|
|
for i, conn := range conns {
|
|
if conn.Ctx.Conn.LocalAddr().String() == ctx.Conn.LocalAddr().String() &&
|
|
conn.Ctx.Conn.RemoteAddr().String() == ctx.Conn.RemoteAddr().String() {
|
|
|
|
if len(conns) == 1 {
|
|
// We are deleting the last conn, remove it from the map
|
|
delete(s.nodeConns, ctx.NodeID)
|
|
} else {
|
|
// Slice out the connection we are deleting
|
|
s.nodeConns[ctx.NodeID] = append(s.nodeConns[ctx.NodeID][:i], s.nodeConns[ctx.NodeID][i+1:]...)
|
|
}
|
|
|
|
return
|
|
}
|
|
}
|
|
}
|
|
|
|
// serverWithNodeConn is used to determine which remote server has the most
|
|
// recent connection to the given node. The local server is not queried.
|
|
// ErrNoNodeConn is returned if all local peers could be queried but did not
|
|
// have a connection to the node. Otherwise if a connection could not be found
|
|
// and there were RPC errors, an error is returned.
|
|
func (s *Server) serverWithNodeConn(nodeID, region string) (*serverParts, error) {
|
|
// We skip ourselves.
|
|
selfAddr := s.LocalMember().Addr.String()
|
|
|
|
// Build the request
|
|
req := &structs.NodeSpecificRequest{
|
|
NodeID: nodeID,
|
|
QueryOptions: structs.QueryOptions{
|
|
Region: s.config.Region,
|
|
},
|
|
}
|
|
|
|
// Select the list of servers to check based on what region we are querying
|
|
s.peerLock.RLock()
|
|
|
|
var rawTargets []*serverParts
|
|
if region == s.Region() {
|
|
rawTargets = make([]*serverParts, 0, len(s.localPeers))
|
|
for _, srv := range s.localPeers {
|
|
rawTargets = append(rawTargets, srv)
|
|
}
|
|
} else {
|
|
peers, ok := s.peers[region]
|
|
if !ok {
|
|
s.peerLock.RUnlock()
|
|
return nil, structs.ErrNoRegionPath
|
|
}
|
|
rawTargets = peers
|
|
}
|
|
|
|
targets := make([]*serverParts, 0, len(rawTargets))
|
|
for _, target := range rawTargets {
|
|
targets = append(targets, target.Copy())
|
|
}
|
|
s.peerLock.RUnlock()
|
|
|
|
// connections is used to store the servers that have connections to the
|
|
// requested node.
|
|
var mostRecentServer *serverParts
|
|
var mostRecent time.Time
|
|
|
|
var rpcErr multierror.Error
|
|
for _, server := range targets {
|
|
if server.Addr.String() == selfAddr {
|
|
continue
|
|
}
|
|
|
|
// Make the RPC
|
|
var resp structs.NodeConnQueryResponse
|
|
err := s.connPool.RPC(s.config.Region, server.Addr, "Status.HasNodeConn", &req, &resp)
|
|
if err != nil {
|
|
multierror.Append(&rpcErr, fmt.Errorf("failed querying server %q: %v", server.Addr.String(), err))
|
|
continue
|
|
}
|
|
|
|
if resp.Connected && resp.Established.After(mostRecent) {
|
|
mostRecentServer = server
|
|
mostRecent = resp.Established
|
|
}
|
|
}
|
|
|
|
// Return an error if there is no route to the node.
|
|
if mostRecentServer == nil {
|
|
if err := rpcErr.ErrorOrNil(); err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
return nil, structs.ErrNoNodeConn
|
|
}
|
|
|
|
return mostRecentServer, nil
|
|
}
|
|
|
|
// forwardClientRPC forwards the RPC specified by method to the node specified
|
|
// by nodeID. Must be done after region forwarding, metrics, and permissions
|
|
// checks.
|
|
//
|
|
// This is a wrapper method for getNodeForRpc, getNodeConn, etc that Client
|
|
// RPCs which only need Servers to forward requests can use.
|
|
func (s *Server) forwardClientRPC(method, nodeID string, args, reply any) error {
|
|
if nodeID == "" {
|
|
return errors.New("missing NodeID")
|
|
}
|
|
|
|
// Check if the node even exists and is compatible with NodeRpc
|
|
snap, err := s.State().Snapshot()
|
|
if err != nil {
|
|
return err
|
|
}
|
|
|
|
// Make sure Node is new enough to support RPC
|
|
_, err = getNodeForRpc(snap, nodeID)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
|
|
// Get the connection to the client
|
|
state, ok := s.getNodeConn(nodeID)
|
|
if !ok {
|
|
// Make the RPC via another server
|
|
return findNodeConnAndForward(s, nodeID, method, args, reply)
|
|
}
|
|
|
|
// Make the RPC
|
|
return NodeRpc(state.Session, method, args, reply)
|
|
}
|
|
|
|
// NodeRpc is used to make an RPC call to a node. The method takes the
|
|
// Yamux session for the node and the method to be called.
|
|
func NodeRpc(session *yamux.Session, method string, args, reply interface{}) error {
|
|
// Open a new session
|
|
stream, err := session.Open()
|
|
if err != nil {
|
|
return fmt.Errorf("session open: %v", err)
|
|
}
|
|
defer stream.Close()
|
|
|
|
// Write the RpcNomad byte to set the mode
|
|
if _, err := stream.Write([]byte{byte(pool.RpcNomad)}); err != nil {
|
|
stream.Close()
|
|
return fmt.Errorf("set mode: %v", err)
|
|
}
|
|
|
|
// Make the RPC
|
|
err = msgpackrpc.CallWithCodec(pool.NewClientCodec(stream), method, args, reply)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
|
|
return nil
|
|
}
|
|
|
|
// NodeStreamingRpc is used to make a streaming RPC call to a node. The method
|
|
// takes the Yamux session for the node and the method to be called. It conducts
|
|
// the initial handshake and returns a connection to be used or an error. It is
|
|
// the callers responsibility to close the connection if there is no error.
|
|
func NodeStreamingRpc(session *yamux.Session, method string) (net.Conn, error) {
|
|
// Open a new session
|
|
stream, err := session.Open()
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
// Write the RpcNomad byte to set the mode
|
|
if _, err := stream.Write([]byte{byte(pool.RpcStreaming)}); err != nil {
|
|
stream.Close()
|
|
return nil, err
|
|
}
|
|
|
|
// Send the header
|
|
encoder := codec.NewEncoder(stream, structs.MsgpackHandle)
|
|
decoder := codec.NewDecoder(stream, structs.MsgpackHandle)
|
|
header := structs.StreamingRpcHeader{
|
|
Method: method,
|
|
}
|
|
if err := encoder.Encode(header); err != nil {
|
|
stream.Close()
|
|
return nil, err
|
|
}
|
|
|
|
// Wait for the acknowledgement
|
|
var ack structs.StreamingRpcAck
|
|
if err := decoder.Decode(&ack); err != nil {
|
|
stream.Close()
|
|
return nil, err
|
|
}
|
|
|
|
if ack.Error != "" {
|
|
stream.Close()
|
|
return nil, errors.New(ack.Error)
|
|
}
|
|
|
|
return stream, nil
|
|
}
|
|
|
|
// findNodeConnAndForward is a helper for finding the server with a connection
|
|
// to the given node and forwarding the RPC to the correct server. This does not
|
|
// work for streaming RPCs.
|
|
func findNodeConnAndForward(srv *Server, nodeID, method string, args, reply interface{}) error {
|
|
// Determine the Server that has a connection to the node.
|
|
srvWithConn, err := srv.serverWithNodeConn(nodeID, srv.Region())
|
|
if err != nil {
|
|
return err
|
|
}
|
|
|
|
if srvWithConn == nil {
|
|
return structs.ErrNoNodeConn
|
|
}
|
|
|
|
return srv.forwardServer(srvWithConn, method, args, reply)
|
|
}
|