open-consul/agent/rpc/middleware/interceptors.go

package middleware

import (
	"net"
	"reflect"
	"strconv"
	"strings"
	"time"

	"github.com/armon/go-metrics"
	"github.com/armon/go-metrics/prometheus"
	"github.com/hashicorp/consul-net-rpc/net/rpc"
	rpcRate "github.com/hashicorp/consul/agent/consul/rate"
	"github.com/hashicorp/go-hclog"
)

// Known RPC type identifiers.
const (
	// RPCTypeInternal marks a "request" that originates from an internal
	// operation running on the cluster leader. Strictly speaking it is not an
	// RPC, but such raft.Apply operations affect blocking queries and streaming
	// subscriptions the same way an RPC does, so they are tracked with the same
	// metric and logs. What is really being measured is a "cluster operation";
	// "RPC" is the historical term for it and is kept here.
	RPCTypeInternal = "internal"

	// RPCTypeNetRPC marks a request that was served over net/rpc.
	RPCTypeNetRPC = "net/rpc"
)

var (
	// metricRPCRequest is the key under which RPC request timings are emitted.
	metricRPCRequest = []string{"rpc", "server", "call"}

	// requestLogName is the metric key joined with underscores. It is used as
	// the message of the trace log line written for each recorded request.
	requestLogName = strings.Join(metricRPCRequest, "_")
)

// OneTwelveRPCSummary holds the Prometheus summary definition for the
// metricRPCRequest ("rpc", "server", "call") metric that
// RequestRecorder.Record emits.
// NOTE(review): presumably exported so the metric can be pre-registered with
// the Prometheus sink, and named after the release that introduced it —
// confirm against the call sites.
var OneTwelveRPCSummary = []prometheus.SummaryDefinition{
	{
		Name: metricRPCRequest,
		Help: "Measures the time an RPC service call takes to make in milliseconds. Labels mark which RPC method was called and metadata about the call.",
	},
}

// RequestRecorder emits one timing sample and one trace log line for every
// request handed to Record.
//
// Fields:
//   - Logger receives the trace-level entry written per recorded request.
//   - RecorderFunc is invoked with the metric key, the elapsed time in
//     milliseconds and the request labels; NewRequestRecorder sets it to
//     metrics.AddSampleWithLabels.
//   - serverIsLeader reports whether this server is the leader; when it is
//     nil the "leader" label is reported as "unreported".
//   - localDC is compared with a request's target datacenter to choose the
//     "locality" label ("local" or "forwarded").
type RequestRecorder struct {
	Logger         hclog.Logger
	RecorderFunc   func(key []string, val float32, labels []metrics.Label)
	serverIsLeader func() bool
	localDC        string
}

// NewRequestRecorder returns a RequestRecorder that logs to logger, emits
// samples through metrics.AddSampleWithLabels, asks isLeader for the value of
// the "leader" label and treats localDC as the datacenter of this server.
func NewRequestRecorder(logger hclog.Logger, isLeader func() bool, localDC string) *RequestRecorder {
	rec := new(RequestRecorder)
	rec.Logger = logger
	rec.RecorderFunc = metrics.AddSampleWithLabels
	rec.serverIsLeader = isLeader
	rec.localDC = localDC
	return rec
}

// Record reports a finished request: it emits a timing sample through
// RecorderFunc and writes a trace log line carrying the same labels.
//
// requestName is stored in the "method" label and rpcType in "rpc_type".
// start is the moment the request began; the sample value is the time elapsed
// since then, in milliseconds. request is inspected to derive the
// "request_type" label and any optional labels, and respErrored becomes the
// "errored" label.
func (r *RequestRecorder) Record(requestName string, rpcType string, start time.Time, request interface{}, respErrored bool) {
	// Measure in microseconds so that calls shorter than 1ms are reported as a
	// fractional millisecond value rather than being truncated to zero.
	micros := time.Since(start).Microseconds()
	// The int64 -> float32 conversion cannot overflow:
	// math.MaxInt64 < math.MaxFloat32.
	durationMs := float32(micros) / 1000

	baseLabels := []metrics.Label{
		{Name: "method", Value: requestName},
		{Name: "errored", Value: strconv.FormatBool(respErrored)},
		{Name: "request_type", Value: requestType(request)},
		{Name: "rpc_type", Value: rpcType},
		{Name: "leader", Value: r.getServerLeadership()},
	}
	allLabels := r.addOptionalLabels(request, baseLabels)

	r.RecorderFunc(metricRPCRequest, durationMs, allLabels)

	// The log line mirrors the metric: same name, same labels.
	r.Logger.Trace(requestLogName, flattenLabels(allLabels)...)
}

// flattenLabels converts labels into the alternating key/value argument list
// expected by the logger: name0, value0, name1, value1, ...
//
// It returns nil when labels is empty. Otherwise the result is allocated once
// with room for exactly two entries per label, so the slice does not have to
// grow repeatedly for every recorded request.
func flattenLabels(labels []metrics.Label) []interface{} {
	if len(labels) == 0 {
		return nil
	}

	flat := make([]interface{}, 0, 2*len(labels))
	for _, label := range labels {
		flat = append(flat, label.Name, label.Value)
	}

	return flat
}

// addOptionalLabels appends the labels that only apply to some request types
// and returns the extended slice.
//
// Requests implementing readQuery gain "allow_stale" and "blocking" (true
// when the minimum query index is greater than zero). Requests implementing
// targetDC gain "target_datacenter" and "locality", which is "local" when the
// target matches the recorder's datacenter and "forwarded" otherwise.
func (r *RequestRecorder) addOptionalLabels(request interface{}, labels []metrics.Label) []metrics.Label {
	if query, isReadQuery := request.(readQuery); isReadQuery {
		allowStale := metrics.Label{Name: "allow_stale", Value: strconv.FormatBool(query.AllowStaleRead())}
		blocking := metrics.Label{Name: "blocking", Value: strconv.FormatBool(query.GetMinQueryIndex() > 0)}
		labels = append(labels, allowStale, blocking)
	}

	target, hasTarget := request.(targetDC)
	if !hasTarget {
		return labels
	}

	dc := target.RequestDatacenter()
	locality := "forwarded"
	if dc == r.localDC {
		locality = "local"
	}

	return append(labels,
		metrics.Label{Name: "target_datacenter", Value: dc},
		metrics.Label{Name: "locality", Value: locality},
	)
}

// requestType classifies req for the "request_type" label. It returns "read"
// or "write" according to the request's IsRead method, and "unreported" when
// req does not provide one.
func requestType(req interface{}) string {
	reader, ok := req.(interface{ IsRead() bool })

	switch {
	case !ok:
		// Not expected in practice: the underlying request does not implement
		// the interface. Surface it as its own value instead of hiding it
		// under "read" or "write".
		return "unreported"
	case reader.IsRead():
		return "read"
	default:
		return "write"
	}
}

// getServerLeadership returns the value of the "leader" label: "true" or
// "false" as reported by serverIsLeader, or "unreported" when no such
// function was provided.
func (r *RequestRecorder) getServerLeadership() string {
	if r.serverIsLeader == nil {
		// Not expected in practice: no way to check whether the server
		// handling the request was the leader has been plumbed down.
		return "unreported"
	}

	return strconv.FormatBool(r.serverIsLeader())
}

// readQuery is satisfied by requests that expose a minimum query index and a
// stale-read flag. addOptionalLabels uses it to derive the "blocking" and
// "allow_stale" labels.
type readQuery interface {
	// GetMinQueryIndex returns the request's minimum query index; a value
	// greater than zero is labelled as a blocking request.
	GetMinQueryIndex() uint64
	// AllowStaleRead reports the value recorded in the "allow_stale" label.
	AllowStaleRead() bool
}

// targetDC is satisfied by requests that name the datacenter they are aimed
// at. addOptionalLabels uses it to derive the "target_datacenter" and
// "locality" labels.
type targetDC interface {
	// RequestDatacenter returns the datacenter the request targets.
	RequestDatacenter() string
}

// GetNetRPCInterceptor returns a net/rpc service-call interceptor that times
// each call and reports it through recorder.
//
// The returned function runs handler, then records the call under
// RPCTypeNetRPC with the request value taken from argv, marking it as errored
// when handler returned a non-nil error.
func GetNetRPCInterceptor(recorder *RequestRecorder) rpc.ServerServiceCallInterceptor {
	intercept := func(reqServiceMethod string, argv, replyv reflect.Value, handler func() error) {
		startedAt := time.Now()
		failed := handler() != nil
		recorder.Record(reqServiceMethod, RPCTypeNetRPC, startedAt, argv.Interface(), failed)
	}
	return intercept
}

// GetNetRPCRateLimitingInterceptor returns a net/rpc pre-body interceptor
// that asks requestLimitsHandler whether the incoming call is allowed.
//
// The operation handed to the limiter carries the method name, the source
// address and the type and category registered for that method in
// rpcRateLimitSpecs. Any panic raised while the interceptor runs is recovered
// and turned into the returned error by panicHandler.
func GetNetRPCRateLimitingInterceptor(requestLimitsHandler rpcRate.RequestLimitsHandler, panicHandler RecoveryHandlerFunc) rpc.PreBodyInterceptor {
	return func(reqServiceMethod string, sourceAddr net.Addr) (retErr error) {
		// retErr is a named result so the deferred function can replace it
		// after a panic has been recovered.
		defer func() {
			recovered := recover()
			if recovered == nil {
				return
			}
			retErr = panicHandler(recovered)
		}()

		spec := rpcRateLimitSpecs[reqServiceMethod]

		// net/rpc does not provide a way to encode the nuances of the
		// error response (retry or retry elsewhere) so the error string
		// from the rate limiter is all that we have.
		return requestLimitsHandler.Allow(rpcRate.Operation{
			Name:       reqServiceMethod,
			SourceAddr: sourceAddr,
			Type:       spec.Type,
			Category:   spec.Category,
		})
	}
}
[sync oss] add net/rpc interceptor implementation (#12573) * sync ent changes from 866dcb0667 Signed-off-by: FFMMM <FFMMM@users.noreply.github.com> * update oss go.mod Signed-off-by: FFMMM <FFMMM@users.noreply.github.com> 2022-03-17 23:02:26 +00:00			`package middleware`

			`import (`
Wire up the rate limiter to net/rpc calls (#15879) 2023-01-04 19:38:44 +00:00			`"net"`
[sync oss] add net/rpc interceptor implementation (#12573) * sync ent changes from 866dcb0667 Signed-off-by: FFMMM <FFMMM@users.noreply.github.com> * update oss go.mod Signed-off-by: FFMMM <FFMMM@users.noreply.github.com> 2022-03-17 23:02:26 +00:00			`"reflect"`
			`"strconv"`
polish rpc.service.call metric behavior (#12624) 2022-03-31 17:49:37 +00:00			`"strings"`
[sync oss] add net/rpc interceptor implementation (#12573) * sync ent changes from 866dcb0667 Signed-off-by: FFMMM <FFMMM@users.noreply.github.com> * update oss go.mod Signed-off-by: FFMMM <FFMMM@users.noreply.github.com> 2022-03-17 23:02:26 +00:00			`"time"`

			`"github.com/armon/go-metrics"`
pre register new rpc metric, rename metric (#12582) 2022-03-22 00:26:32 +00:00			`"github.com/armon/go-metrics/prometheus"`
[sync oss] add net/rpc interceptor implementation (#12573) * sync ent changes from 866dcb0667 Signed-off-by: FFMMM <FFMMM@users.noreply.github.com> * update oss go.mod Signed-off-by: FFMMM <FFMMM@users.noreply.github.com> 2022-03-17 23:02:26 +00:00			`"github.com/hashicorp/consul-net-rpc/net/rpc"`
Wire up the rate limiter to net/rpc calls (#15879) 2023-01-04 19:38:44 +00:00			`rpcRate "github.com/hashicorp/consul/agent/consul/rate"`
[sync oss] add net/rpc interceptor implementation (#12573) * sync ent changes from 866dcb0667 Signed-off-by: FFMMM <FFMMM@users.noreply.github.com> * update oss go.mod Signed-off-by: FFMMM <FFMMM@users.noreply.github.com> 2022-03-17 23:02:26 +00:00			`"github.com/hashicorp/go-hclog"`
			`)`

			`// RPCTypeInternal identifies the "RPC" request as coming from some internal`
			`// operation that runs on the cluster leader. Technically this is not an RPC`
			`// request, but these raft.Apply operations have the same impact on blocking`
			`// queries, and streaming subscriptions, so need to be tracked by the same metric`
			`// and logs.`
			`// Really what we are measuring here is a "cluster operation". The term we have`
			`// used for this historically is "RPC", so we continue to use that here.`
			`const RPCTypeInternal = "internal"`
factor out recording func, add unit tests (#12585) Signed-off-by: FFMMM <FFMMM@users.noreply.github.com> 2022-03-22 16:31:54 +00:00			`const RPCTypeNetRPC = "net/rpc"`
[sync oss] add net/rpc interceptor implementation (#12573) * sync ent changes from 866dcb0667 Signed-off-by: FFMMM <FFMMM@users.noreply.github.com> * update oss go.mod Signed-off-by: FFMMM <FFMMM@users.noreply.github.com> 2022-03-17 23:02:26 +00:00
pre register new rpc metric, rename metric (#12582) 2022-03-22 00:26:32 +00:00			`var metricRPCRequest = []string{"rpc", "server", "call"}`
polish rpc.service.call metric behavior (#12624) 2022-03-31 17:49:37 +00:00			`var requestLogName = strings.Join(metricRPCRequest, "_")`
[sync oss] add net/rpc interceptor implementation (#12573) * sync ent changes from 866dcb0667 Signed-off-by: FFMMM <FFMMM@users.noreply.github.com> * update oss go.mod Signed-off-by: FFMMM <FFMMM@users.noreply.github.com> 2022-03-17 23:02:26 +00:00
polish rpc.service.call metric behavior (#12624) 2022-03-31 17:49:37 +00:00			`var OneTwelveRPCSummary = []prometheus.SummaryDefinition{`
pre register new rpc metric, rename metric (#12582) 2022-03-22 00:26:32 +00:00			`{`
			`Name: metricRPCRequest,`
polish rpc.service.call metric behavior (#12624) 2022-03-31 17:49:37 +00:00			`Help: "Measures the time an RPC service call takes to make in milliseconds. Labels mark which RPC method was called and metadata about the call.",`
pre register new rpc metric, rename metric (#12582) 2022-03-22 00:26:32 +00:00			`},`
			`}`

[sync oss] add net/rpc interceptor implementation (#12573) * sync ent changes from 866dcb0667 Signed-off-by: FFMMM <FFMMM@users.noreply.github.com> * update oss go.mod Signed-off-by: FFMMM <FFMMM@users.noreply.github.com> 2022-03-17 23:02:26 +00:00			`type RequestRecorder struct {`
add more labels to RequestRecorder (#12727) Co-authored-by: Daniel Nephin <dnephin@hashicorp.com> Signed-off-by: FFMMM <FFMMM@users.noreply.github.com> 2022-04-12 17:50:25 +00:00			`Logger hclog.Logger`
			`RecorderFunc func(key []string, val float32, labels []metrics.Label)`
			`serverIsLeader func() bool`
			`localDC string`
[sync oss] add net/rpc interceptor implementation (#12573) * sync ent changes from 866dcb0667 Signed-off-by: FFMMM <FFMMM@users.noreply.github.com> * update oss go.mod Signed-off-by: FFMMM <FFMMM@users.noreply.github.com> 2022-03-17 23:02:26 +00:00			`}`

add more labels to RequestRecorder (#12727) Co-authored-by: Daniel Nephin <dnephin@hashicorp.com> Signed-off-by: FFMMM <FFMMM@users.noreply.github.com> 2022-04-12 17:50:25 +00:00			`func NewRequestRecorder(logger hclog.Logger, isLeader func() bool, localDC string) *RequestRecorder {`
			`return &RequestRecorder{`
			`Logger: logger,`
			`RecorderFunc: metrics.AddSampleWithLabels,`
			`serverIsLeader: isLeader,`
			`localDC: localDC,`
			`}`
[sync oss] add net/rpc interceptor implementation (#12573) * sync ent changes from 866dcb0667 Signed-off-by: FFMMM <FFMMM@users.noreply.github.com> * update oss go.mod Signed-off-by: FFMMM <FFMMM@users.noreply.github.com> 2022-03-17 23:02:26 +00:00			`}`

			`func (r *RequestRecorder) Record(requestName string, rpcType string, start time.Time, request interface{}, respErrored bool) {`
Middleware: `RequestRecorder` reports calls below 1ms as decimal value (#12905) * Typos * Test failing * Convert values <1ms to decimal * Fix test * Update docs and test error msg * Applied suggested changes to test case * Changelog file and suggested changes * Update .changelog/12905.txt Co-authored-by: Chris S. Kim <kisunji92@gmail.com> * suggested change - start duration with microseconds instead of nanoseconds * fix error * suggested change - floats Co-authored-by: alex <8968914+acpana@users.noreply.github.com> Co-authored-by: Chris S. Kim <kisunji92@gmail.com> 2022-09-15 17:04:37 +00:00			`elapsed := time.Since(start).Microseconds()`
			`elapsedMs := float32(elapsed) / 1000`
[sync oss] add net/rpc interceptor implementation (#12573) * sync ent changes from 866dcb0667 Signed-off-by: FFMMM <FFMMM@users.noreply.github.com> * update oss go.mod Signed-off-by: FFMMM <FFMMM@users.noreply.github.com> 2022-03-17 23:02:26 +00:00			`reqType := requestType(request)`
add more labels to RequestRecorder (#12727) Co-authored-by: Daniel Nephin <dnephin@hashicorp.com> Signed-off-by: FFMMM <FFMMM@users.noreply.github.com> 2022-04-12 17:50:25 +00:00			`isLeader := r.getServerLeadership()`
[sync oss] add net/rpc interceptor implementation (#12573) * sync ent changes from 866dcb0667 Signed-off-by: FFMMM <FFMMM@users.noreply.github.com> * update oss go.mod Signed-off-by: FFMMM <FFMMM@users.noreply.github.com> 2022-03-17 23:02:26 +00:00
			`labels := []metrics.Label{`
			`{Name: "method", Value: requestName},`
			`{Name: "errored", Value: strconv.FormatBool(respErrored)},`
			`{Name: "request_type", Value: reqType},`
			`{Name: "rpc_type", Value: rpcType},`
add more labels to RequestRecorder (#12727) Co-authored-by: Daniel Nephin <dnephin@hashicorp.com> Signed-off-by: FFMMM <FFMMM@users.noreply.github.com> 2022-04-12 17:50:25 +00:00			`{Name: "leader", Value: isLeader},`
[sync oss] add net/rpc interceptor implementation (#12573) * sync ent changes from 866dcb0667 Signed-off-by: FFMMM <FFMMM@users.noreply.github.com> * update oss go.mod Signed-off-by: FFMMM <FFMMM@users.noreply.github.com> 2022-03-17 23:02:26 +00:00			`}`

add more labels to RequestRecorder (#12727) Co-authored-by: Daniel Nephin <dnephin@hashicorp.com> Signed-off-by: FFMMM <FFMMM@users.noreply.github.com> 2022-04-12 17:50:25 +00:00			`labels = r.addOptionalLabels(request, labels)`

polish rpc.service.call metric behavior (#12624) 2022-03-31 17:49:37 +00:00			`// math.MaxInt64 < math.MaxFloat32 is true so we should be good!`
Middleware: `RequestRecorder` reports calls below 1ms as decimal value (#12905) * Typos * Test failing * Convert values <1ms to decimal * Fix test * Update docs and test error msg * Applied suggested changes to test case * Changelog file and suggested changes * Update .changelog/12905.txt Co-authored-by: Chris S. Kim <kisunji92@gmail.com> * suggested change - start duration with microseconds instead of nanoseconds * fix error * suggested change - floats Co-authored-by: alex <8968914+acpana@users.noreply.github.com> Co-authored-by: Chris S. Kim <kisunji92@gmail.com> 2022-09-15 17:04:37 +00:00			`r.RecorderFunc(metricRPCRequest, elapsedMs, labels)`
add more labels to RequestRecorder (#12727) Co-authored-by: Daniel Nephin <dnephin@hashicorp.com> Signed-off-by: FFMMM <FFMMM@users.noreply.github.com> 2022-04-12 17:50:25 +00:00
			`labelsArr := flattenLabels(labels)`
			`r.Logger.Trace(requestLogName, labelsArr...)`

			`}`

			`func flattenLabels(labels []metrics.Label) []interface{} {`

			`var labelArr []interface{}`
			`for _, label := range labels {`
			`labelArr = append(labelArr, label.Name, label.Value)`
			`}`

			`return labelArr`
			`}`

			`func (r *RequestRecorder) addOptionalLabels(request interface{}, labels []metrics.Label) []metrics.Label {`
			`if rq, ok := request.(readQuery); ok {`
			`labels = append(labels,`
			`metrics.Label{`
			`Name: "allow_stale",`
			`Value: strconv.FormatBool(rq.AllowStaleRead()),`
			`},`
			`metrics.Label{`
			`Name: "blocking",`
			`Value: strconv.FormatBool(rq.GetMinQueryIndex() > 0),`
			`})`
			`}`

			`if td, ok := request.(targetDC); ok {`
			`requestDC := td.RequestDatacenter()`
			`labels = append(labels, metrics.Label{Name: "target_datacenter", Value: requestDC})`

			`if r.localDC == requestDC {`
			`labels = append(labels, metrics.Label{Name: "locality", Value: "local"})`
			`} else {`
			`labels = append(labels, metrics.Label{Name: "locality", Value: "forwarded"})`
			`}`
			`}`

			`return labels`
[sync oss] add net/rpc interceptor implementation (#12573) * sync ent changes from 866dcb0667 Signed-off-by: FFMMM <FFMMM@users.noreply.github.com> * update oss go.mod Signed-off-by: FFMMM <FFMMM@users.noreply.github.com> 2022-03-17 23:02:26 +00:00			`}`

			`func requestType(req interface{}) string {`
polish rpc.service.call metric behavior (#12624) 2022-03-31 17:49:37 +00:00			`if r, ok := req.(interface{ IsRead() bool }); ok {`
			`if r.IsRead() {`
			`return "read"`
			`} else {`
			`return "write"`
			`}`
[sync oss] add net/rpc interceptor implementation (#12573) * sync ent changes from 866dcb0667 Signed-off-by: FFMMM <FFMMM@users.noreply.github.com> * update oss go.mod Signed-off-by: FFMMM <FFMMM@users.noreply.github.com> 2022-03-17 23:02:26 +00:00			`}`
polish rpc.service.call metric behavior (#12624) 2022-03-31 17:49:37 +00:00
			`// This logical branch should not happen. If it happens`
			`// it means an underlying request is not implementing the interface.`
			`// Rather than swallowing it up in a "read" or "write", let's be aware of it.`
			`return "unreported"`
[sync oss] add net/rpc interceptor implementation (#12573) * sync ent changes from 866dcb0667 Signed-off-by: FFMMM <FFMMM@users.noreply.github.com> * update oss go.mod Signed-off-by: FFMMM <FFMMM@users.noreply.github.com> 2022-03-17 23:02:26 +00:00			`}`

add more labels to RequestRecorder (#12727) Co-authored-by: Daniel Nephin <dnephin@hashicorp.com> Signed-off-by: FFMMM <FFMMM@users.noreply.github.com> 2022-04-12 17:50:25 +00:00			`func (r *RequestRecorder) getServerLeadership() string {`
			`if r.serverIsLeader != nil {`
			`if r.serverIsLeader() {`
			`return "true"`
			`} else {`
			`return "false"`
			`}`
			`}`

			`// This logical branch should not happen. If it happens`
			`// it means that we have not plumbed down a way to verify`
			`// whether the server handling the request was a leader or not`
			`return "unreported"`
			`}`

			`type readQuery interface {`
			`GetMinQueryIndex() uint64`
			`AllowStaleRead() bool`
			`}`

			`type targetDC interface {`
			`RequestDatacenter() string`
			`}`

[sync oss] add net/rpc interceptor implementation (#12573) * sync ent changes from 866dcb0667 Signed-off-by: FFMMM <FFMMM@users.noreply.github.com> * update oss go.mod Signed-off-by: FFMMM <FFMMM@users.noreply.github.com> 2022-03-17 23:02:26 +00:00			`func GetNetRPCInterceptor(recorder *RequestRecorder) rpc.ServerServiceCallInterceptor {`
			`return func(reqServiceMethod string, argv, replyv reflect.Value, handler func() error) {`
			`reqStart := time.Now()`

			`err := handler()`

factor out recording func, add unit tests (#12585) Signed-off-by: FFMMM <FFMMM@users.noreply.github.com> 2022-03-22 16:31:54 +00:00			`recorder.Record(reqServiceMethod, RPCTypeNetRPC, reqStart, argv.Interface(), err != nil)`
[sync oss] add net/rpc interceptor implementation (#12573) * sync ent changes from 866dcb0667 Signed-off-by: FFMMM <FFMMM@users.noreply.github.com> * update oss go.mod Signed-off-by: FFMMM <FFMMM@users.noreply.github.com> 2022-03-17 23:02:26 +00:00			`}`
			`}`
Wire up the rate limiter to net/rpc calls (#15879) 2023-01-04 19:38:44 +00:00
feat: panic handler in rpc rate limit interceptor (#16022) * feat: handle panic in rpc rate limit interceptor * test: additional test cases to rpc rate limiting interceptor * refactor: remove unused listener 2023-01-25 19:13:38 +00:00			`func GetNetRPCRateLimitingInterceptor(requestLimitsHandler rpcRate.RequestLimitsHandler, panicHandler RecoveryHandlerFunc) rpc.PreBodyInterceptor {`

			`return func(reqServiceMethod string, sourceAddr net.Addr) (retErr error) {`

			`defer func() {`
			`if r := recover(); r != nil {`
			`retErr = panicHandler(r)`
			`}`
			`}()`
Wire up the rate limiter to net/rpc calls (#15879) 2023-01-04 19:38:44 +00:00
			`op := rpcRate.Operation{`
			`Name: reqServiceMethod,`
			`SourceAddr: sourceAddr,`
feat: add category annotation to RPC and gRPC methods (#16646) 2023-03-20 15:24:29 +00:00			`Type: rpcRateLimitSpecs[reqServiceMethod].Type,`
			`Category: rpcRateLimitSpecs[reqServiceMethod].Category,`
Wire up the rate limiter to net/rpc calls (#15879) 2023-01-04 19:38:44 +00:00			`}`

			`// net/rpc does not provide a way to encode the nuances of the`
			`// error response (retry or retry elsewhere) so the error string`
			`// from the rate limiter is all that we have.`
			`return requestLimitsHandler.Allow(op)`
			`}`
			`}`