open-vault/physical/gcs/gcs_ha.go

package gcs

import (
	"context"
	"encoding/json"
	"fmt"
	"sync"
	"time"

	"cloud.google.com/go/storage"
	metrics "github.com/armon/go-metrics"
	"github.com/hashicorp/errwrap"
	uuid "github.com/hashicorp/go-uuid"
	"github.com/hashicorp/vault/physical"
	"github.com/pkg/errors"
	"google.golang.org/api/googleapi"
)

// Compile-time checks that Backend implements physical.HABackend and that
// Lock implements physical.Lock.
var _ physical.HABackend = (*Backend)(nil)
var _ physical.Lock = (*Lock)(nil)

const (
	// LockRenewInterval is the default time between lock renewals; it is the
	// period of the ticker that drives renewLock.
	LockRenewInterval = 5 * time.Second

	// LockRetryInterval is the default time between acquisition attempts; it
	// is the period of the ticker that drives attemptLock.
	LockRetryInterval = 5 * time.Second

	// LockTTL is the default lock TTL. A lock record written by another
	// identity may be taken over once its timestamp is at least this old.
	LockTTL = 15 * time.Second

	// LockWatchRetryInterval is the default period of the ticker that drives
	// watchLock. Every check of the lock record, including a retry after a
	// failed read, waits for one tick of this interval.
	LockWatchRetryInterval = 5 * time.Second

	// LockWatchRetryMax is the default bound on failed watch reads.
	// watchLock signals that leadership is lost once the number of failed
	// reads reaches LockWatchRetryMax-1.
	LockWatchRetryMax = 5
)

var (
	// metricLockUnlock is the metric key used to time Lock.Unlock.
	metricLockUnlock = []string{"gcs", "lock", "unlock"}

	// metricLockLock is the metric key used to time Lock.Lock (acquisition).
	metricLockLock = []string{"gcs", "lock", "lock"}

	// metricLockValue is the metric key used to time Lock.Value (reading the
	// current lock record).
	metricLockValue = []string{"gcs", "lock", "value"}
)

// Lock is the HA lock. It is created by Backend.LockWith and implements
// physical.Lock.
type Lock struct {
	// backend is the underlying physical backend.
	backend *Backend

	// key is the name of the object that stores the lock. value is the value
	// recorded in the lock record when this instance writes it.
	key, value string

	// held is a boolean indicating if the lock is currently held. It is read
	// and written by Lock and Unlock while they hold the lock mutex below.
	held bool

	// identity is the internal identity of this key (unique to this server
	// instance). It is a UUID generated in LockWith and is compared against
	// the identity stored in the lock record to decide ownership.
	identity string

	// lock is an internal mutex that serializes Lock and Unlock.
	lock sync.Mutex

	// stopCh is the channel that stops all operations. It may be closed in the
	// event of a leader loss or graceful shutdown. stopped is a boolean
	// indicating if we are stopped - it exists to prevent double closing the
	// channel; LockWith initializes it to true because no channel exists
	// until the lock is acquired. stopLock is the mutex that guards creating
	// and closing stopCh and updating stopped.
	stopCh   chan struct{}
	stopped  bool
	stopLock sync.Mutex

	// Allow modifying the Lock durations for ease of unit testing. LockWith
	// fills these in from the package-level Lock* defaults.
	renewInterval      time.Duration
	retryInterval      time.Duration
	ttl                time.Duration
	watchRetryInterval time.Duration
	watchRetryMax      int
}

// LockRecord is the struct that corresponds to a lock. It is serialized as
// JSON and stored under the "lock" key of the lock object's metadata.
type LockRecord struct {
	// Key is the lock key, Value the holder-supplied value, Identity the
	// identity of the Lock instance that wrote the record, and Timestamp the
	// UTC time at which the record was last written.
	Key       string    `json:"key"`
	Value     string    `json:"value"`
	Identity  string    `json:"identity"`
	Timestamp time.Time `json:"timestamp"`

	// attrs are the internal object attributes. This is stored internally, for
	// internal consumption only. Being unexported, it is not part of the JSON
	// encoding; get populates it and writeLock uses its generation numbers
	// for compare-and-swap writes.
	attrs *storage.ObjectAttrs
}

// HAEnabled implements HABackend. It reports the backend's haEnabled setting,
// i.e. whether this backend instance was configured for high availability.
func (b *Backend) HAEnabled() bool {
	return b.haEnabled
}

// LockWith builds a new, not-yet-acquired Lock for the given key. The value is
// what will be stored in the lock record once the lock is acquired. Each call
// generates a fresh UUID identity for the returned lock; an error is returned
// only if that UUID cannot be generated.
func (b *Backend) LockWith(key, value string) (physical.Lock, error) {
	id, genErr := uuid.GenerateUUID()
	if genErr != nil {
		return nil, errwrap.Wrapf("lock with: {{err}}", genErr)
	}

	lk := &Lock{
		backend:  b,
		key:      key,
		value:    value,
		identity: id,

		// No stop channel exists until the lock is acquired, so the lock
		// starts out in the stopped state.
		stopped: true,
	}

	// Timing defaults; kept as fields so tests can shorten them.
	lk.renewInterval = LockRenewInterval
	lk.retryInterval = LockRetryInterval
	lk.ttl = LockTTL
	lk.watchRetryInterval = LockWatchRetryInterval
	lk.watchRetryMax = LockWatchRetryMax

	return lk, nil
}

// Lock blocks until the lock is acquired, an error occurs, or stopCh is
// closed. stopCh is optional; closing it interrupts the acquisition attempt,
// in which case both return values are nil.
//
// On success the returned channel is the lock's stop channel: it is closed
// when leadership is lost or when Unlock is called. Calling Lock while the
// lock is already held returns an error.
func (l *Lock) Lock(stopCh <-chan struct{}) (<-chan struct{}, error) {
	defer metrics.MeasureSince(metricLockLock, time.Now())

	l.lock.Lock()
	defer l.lock.Unlock()

	if l.held {
		return nil, errors.New("lock already held")
	}

	// attemptLock only returns once the lock is ours, the attempt failed, or
	// the caller asked us to stop.
	switch ok, err := l.attemptLock(stopCh); {
	case err != nil:
		return nil, errwrap.Wrapf("lock: {{err}}", err)
	case !ok:
		return nil, nil
	}

	l.held = true

	// Install a fresh stop channel for this period of leadership.
	leaderCh := make(chan struct{})
	l.stopLock.Lock()
	l.stopCh = leaderCh
	l.stopped = false
	l.stopLock.Unlock()

	// Background workers: one keeps the record fresh, the other notices when
	// the record no longer belongs to us.
	go l.renewLock()
	go l.watchLock()

	return leaderCh, nil
}

// Unlock releases the lock. It is a no-op if the lock is not held.
//
// Unlock first closes the stop channel (if it is not already closed) so that
// renewal and watching stop, then removes the lock object from the bucket.
// The removal is a compare-and-swap: the record is re-read and the object is
// deleted only if it still carries this lock's identity and has not changed
// since that read. This prevents deleting a lock that another instance took
// over after this one lost leadership (for example after the TTL expired).
//
// An error is returned if the record cannot be read or the delete fails for a
// reason other than the object being gone or having changed; in that case the
// lock is still marked as held so that Unlock can be retried.
func (l *Lock) Unlock() error {
	defer metrics.MeasureSince(metricLockUnlock, time.Now())

	l.lock.Lock()
	defer l.lock.Unlock()
	if !l.held {
		return nil
	}

	// Stop any existing locking or renewal attempts
	l.stopLock.Lock()
	if !l.stopped {
		l.stopped = true
		close(l.stopCh)
	}
	l.stopLock.Unlock()

	// Read the current record so the delete can be conditioned on it.
	ctx := context.Background()
	r, err := l.get(ctx)
	if err != nil {
		return errwrap.Wrapf("unlock: failed to read lock for deletion: {{err}}", err)
	}

	// Only delete a record that is still ours. A missing record or one with a
	// different identity means there is nothing of ours left to release.
	if r != nil && r.Identity == l.identity {
		conds := storage.Conditions{
			GenerationMatch:     r.attrs.Generation,
			MetagenerationMatch: r.attrs.Metageneration,
		}
		obj := l.backend.client.Bucket(l.backend.bucket).Object(l.key)

		// get has already released its permit, so this does not nest.
		l.backend.permitPool.Acquire()
		err := obj.If(conds).Delete(ctx)
		l.backend.permitPool.Release()

		if err != nil && err != storage.ErrObjectNotExist {
			// A failed precondition (HTTP 412) means the object changed after
			// we read it, i.e. someone else now owns the lock; leave it alone.
			terr, ok := err.(*googleapi.Error)
			if !ok || terr.Code != 412 {
				return errwrap.Wrapf("unlock: failed to delete lock: {{err}}", err)
			}
		}
	}

	// We are no longer holding the lock
	l.held = false

	return nil
}

// Value reads the current lock record from storage. It returns whether a
// record exists and, if so, the value stored in it. When no record exists it
// returns (false, "", nil); a read or decode failure is returned as the error.
func (l *Lock) Value() (bool, string, error) {
	defer metrics.MeasureSince(metricLockValue, time.Now())

	record, err := l.get(context.Background())
	switch {
	case err != nil:
		return false, "", err
	case record == nil:
		// No lock object: nobody holds the lock.
		return false, "", nil
	}

	return true, record.Value, nil
}

// attemptLock tries to take the lock once per retryInterval tick until it
// succeeds, fails with an error, or stopCh is closed. It returns (true, nil)
// on acquisition and (false, nil) when interrupted by stopCh. Note that the
// first attempt happens on the first tick, not immediately.
func (l *Lock) attemptLock(stopCh <-chan struct{}) (bool, error) {
	retry := time.NewTicker(l.retryInterval)
	defer retry.Stop()

	for {
		// Wait for either the next attempt slot or a request to give up.
		select {
		case <-stopCh:
			return false, nil
		case <-retry.C:
		}

		ok, err := l.writeLock()
		if err != nil {
			return false, errwrap.Wrapf("attempt lock: {{err}}", err)
		}
		if ok {
			return true, nil
		}
		// Someone else holds a live lock; try again on the next tick.
	}
}

// renewLock rewrites the lock record once per renewInterval tick, refreshing
// its timestamp, and returns when the stop channel is closed.
func (l *Lock) renewLock() {
	renew := time.NewTicker(l.renewInterval)
	defer renew.Stop()

	for {
		select {
		case <-l.stopCh:
			return
		case <-renew.C:
			// Renewal is best-effort: the outcome is deliberately discarded
			// here and the next tick simply tries again.
			_, _ = l.writeLock()
		}
	}
}

// watchLock polls the lock record once per watchRetryInterval tick and closes
// the stop (leader) channel when leadership is lost, i.e. when the record is
// gone or carries a different identity. Read errors are counted, and once the
// count reaches watchRetryMax-1 leadership is treated as lost as well.
//
// watchLock also returns promptly when the stop channel is closed by someone
// else (for example by Unlock), and always stops its ticker on exit.
func (l *Lock) watchLock() {
	retries := 0
	ticker := time.NewTicker(l.watchRetryInterval)
	defer ticker.Stop()

loop:
	for {
		// Exit right away if the channel is already closed, in preference to
		// performing another read.
		select {
		case <-l.stopCh:
			break loop
		default:
		}

		// Check if we've exceeded retries
		if retries >= l.watchRetryMax-1 {
			break loop
		}

		// Wait for the next poll, but stay interruptible by the stop channel
		// so this goroutine does not outlive the lock.
		select {
		case <-ticker.C:
		case <-l.stopCh:
			break loop
		}

		// Attempt to read the key
		r, err := l.get(context.Background())
		if err != nil {
			retries++
			continue
		}

		// A missing record or a foreign identity means we are no longer the
		// holder.
		if r == nil || r.Identity != l.identity {
			break loop
		}
	}

	// Signal loss of leadership, unless the channel was already closed.
	l.stopLock.Lock()
	defer l.stopLock.Unlock()
	if !l.stopped {
		l.stopped = true
		close(l.stopCh)
	}
}

// writeLock writes the given lock using the following algorithm:
//
// - lock does not exist
//   - write the lock, on the condition that it still does not exist
// - lock exists
//   - if key is empty or identity is the same or timestamp exceeds TTL
//     - update the lock to self, on the condition that the object has not
//       changed since it was read
//   - otherwise leave it alone
//
// It returns true if the record was written and now names this lock as the
// holder, false with a nil error if another holder has a live lock or won the
// race to write, and a non-nil error for any other failure. The operation is
// cancelled if the stop channel is closed while it is in flight.
func (l *Lock) writeLock() (bool, error) {
	// Create a transaction to read and the update (maybe)
	ctx, cancel := context.WithCancel(context.Background())
	defer cancel()

	// The operation may be retried, so we need to stop it if we lose leadership.
	go func() {
		select {
		case <-l.stopCh:
			cancel()
		case <-ctx.Done():
		}
	}()

	// Build up the list of conditions
	var conds storage.Conditions

	// Read the record. get takes (and releases) its own permit, so no permit
	// is held across this call.
	r, err := l.get(ctx)
	if err != nil {
		return false, errwrap.Wrapf("write lock: {{err}}", err)
	}
	if r != nil {
		// If the key is empty or the identity is ours or the ttl expired, we can
		// write. Otherwise, return now because we cannot.
		if r.Key != "" && r.Identity != l.identity && time.Now().UTC().Sub(r.Timestamp) < l.ttl {
			return false, nil
		}

		// CAS operation
		conds.GenerationMatch = r.attrs.Generation
		conds.MetagenerationMatch = r.attrs.Metageneration
	} else {
		// Ensure no one created while we were working
		conds.DoesNotExist = true
	}

	// Update the lock to now
	lockData, err := json.Marshal(&LockRecord{
		Key:       l.key,
		Value:     l.value,
		Identity:  l.identity,
		Timestamp: time.Now().UTC(),
	})
	if err != nil {
		return false, errwrap.Wrapf("write lock: failed to encode JSON: {{err}}", err)
	}

	// Pooling. The permit is taken only for the write: taking it before the
	// read above would mean holding one permit while get waits for a second
	// one from the same pool, which can stall when the pool is exhausted.
	l.backend.permitPool.Acquire()
	defer l.backend.permitPool.Release()

	// Write the object. The record lives in the object's metadata; the object
	// body itself is left empty.
	obj := l.backend.client.Bucket(l.backend.bucket).Object(l.key)
	w := obj.If(conds).NewWriter(ctx)
	w.ObjectAttrs.CacheControl = "no-cache; no-store; max-age=0"
	w.ObjectAttrs.Metadata = map[string]string{
		"lock": string(lockData),
	}
	if err := w.Close(); err != nil {
		// A failed precondition (HTTP 412) means the object was created or
		// changed between our read and this write, so another writer got
		// there first. That is a lost race, not an error.
		if terr, ok := err.(*googleapi.Error); ok && terr.Code == 412 {
			return false, nil
		}
		return false, errwrap.Wrapf("write lock: {{err}}", err)
	}

	return true, nil
}

// get fetches the lock object's attributes and decodes the lock record stored
// in its "lock" metadata entry. It returns (nil, nil) when the object does not
// exist, and an error when the attributes cannot be read or the metadata is
// not valid JSON. The returned record carries the object attributes so that
// callers can issue conditional writes against the generation that was read.
func (l *Lock) get(ctx context.Context) (*LockRecord, error) {
	// Bound concurrent storage calls through the backend's permit pool.
	l.backend.permitPool.Acquire()
	defer l.backend.permitPool.Release()

	obj := l.backend.client.Bucket(l.backend.bucket).Object(l.key)
	attrs, err := obj.Attrs(ctx)
	switch {
	case err == storage.ErrObjectNotExist:
		// No object means no lock.
		return nil, nil
	case err != nil:
		return nil, errwrap.Wrapf(fmt.Sprintf("failed to read attrs for %q: {{err}}", l.key), err)
	}

	// The object exists, so decode the record kept in its metadata.
	record := &LockRecord{attrs: attrs}
	if err := json.Unmarshal([]byte(attrs.Metadata["lock"]), record); err != nil {
		return nil, errwrap.Wrapf("failed to decode lock: {{err}}", err)
	}
	return record, nil
}
Add HA support to the Google Cloud Storage backend (#4226) 2018-03-30 16:36:37 +00:00			`package gcs`

			`import (`
Use context from stdlib in google physical backends (#4922) * Use context from stdlib in google physical backends * Do not prefix logs (Vault will do it) 2018-07-13 15:00:38 +00:00			`"context"`
Add HA support to the Google Cloud Storage backend (#4226) 2018-03-30 16:36:37 +00:00			`"encoding/json"`
			`"fmt"`
			`"sync"`
			`"time"`

			`"cloud.google.com/go/storage"`
			`metrics "github.com/armon/go-metrics"`
			`"github.com/hashicorp/errwrap"`
			`uuid "github.com/hashicorp/go-uuid"`
			`"github.com/hashicorp/vault/physical"`
			`"github.com/pkg/errors"`
			`"google.golang.org/api/googleapi"`
			`)`

			`// Verify Backend satisfies the correct interfaces`
			`var _ physical.HABackend = (*Backend)(nil)`
			`var _ physical.Lock = (*Lock)(nil)`

			`const (`
			`// LockRenewInterval is the time to wait between lock renewals.`
			`LockRenewInterval = 5 * time.Second`

			`// LockRetryInterval is the amount of time to wait if the lock fails before`
			`// trying again.`
			`LockRetryInterval = 5 * time.Second`

			`// LockTTL is the default lock TTL.`
			`LockTTL = 15 * time.Second`

			`// LockWatchRetryInterval is the amount of time to wait if a watch fails`
			`// before trying again.`
			`LockWatchRetryInterval = 5 * time.Second`

			`// LockWatchRetryMax is the number of times to retry a failed watch before`
			`// signaling that leadership is lost.`
			`LockWatchRetryMax = 5`
			`)`

			`var (`
			`// metricLockUnlock is the metric to register for a lock delete.`
			`metricLockUnlock = []string{"gcs", "lock", "unlock"}`

			`// metricLockGet is the metric to register for a lock get.`
			`metricLockLock = []string{"gcs", "lock", "lock"}`

			`// metricLockValue is the metric to register for a lock create/update.`
			`metricLockValue = []string{"gcs", "lock", "value"}`
			`)`

			`// Lock is the HA lock.`
			`type Lock struct {`
			`// backend is the underlying physical backend.`
			`backend *Backend`

			`// key is the name of the key. value is the value of the key.`
			`key, value string`

			`// held is a boolean indicating if the lock is currently held.`
			`held bool`

			`// identity is the internal identity of this key (unique to this server`
			`// instance).`
			`identity string`

			`// lock is an internal lock`
			`lock sync.Mutex`

			`// stopCh is the channel that stops all operations. It may be closed in the`
			`// event of a leader loss or graceful shutdown. stopped is a boolean`
			`// indicating if we are stopped - it exists to prevent double closing the`
			`// channel. stopLock is a mutex around the locks.`
			`stopCh chan struct{}`
			`stopped bool`
			`stopLock sync.Mutex`

			`// Allow modifying the Lock durations for ease of unit testing.`
			`renewInterval time.Duration`
			`retryInterval time.Duration`
			`ttl time.Duration`
			`watchRetryInterval time.Duration`
			`watchRetryMax int`
			`}`

			`// LockRecord is the struct that corresponds to a lock.`
			`type LockRecord struct {`
			Key string `json:"key"`
			Value string `json:"value"`
			Identity string `json:"identity"`
			Timestamp time.Time `json:"timestamp"`

			`// attrs are the internal object attributes. This is stored internally, for`
			`// internal consumption only.`
			`attrs *storage.ObjectAttrs`
			`}`

			`// HAEnabled implements HABackend and indicates that this backend supports high`
			`// availability.`
			`func (b *Backend) HAEnabled() bool {`
			`return b.haEnabled`
			`}`

			`// LockWith acquires a mutual exclusion based on the given key.`
			`func (b *Backend) LockWith(key, value string) (physical.Lock, error) {`
			`identity, err := uuid.GenerateUUID()`
			`if err != nil {`
			`return nil, errwrap.Wrapf("lock with: {{err}}", err)`
			`}`
			`return &Lock{`
			`backend: b,`
			`key: key,`
			`value: value,`
			`identity: identity,`
			`stopped: true,`

			`renewInterval: LockRenewInterval,`
			`retryInterval: LockRetryInterval,`
			`ttl: LockTTL,`
			`watchRetryInterval: LockWatchRetryInterval,`
			`watchRetryMax: LockWatchRetryMax,`
			`}, nil`
			`}`

			`// Lock acquires the given lock. The stopCh is optional. If closed, it`
			`// interrupts the lock acquisition attempt. The returned channel should be`
			`// closed when leadership is lost.`
			`func (l *Lock) Lock(stopCh <-chan struct{}) (<-chan struct{}, error) {`
			`defer metrics.MeasureSince(metricLockLock, time.Now())`

			`l.lock.Lock()`
			`defer l.lock.Unlock()`
			`if l.held {`
			`return nil, errors.New("lock already held")`
			`}`

			`// Attempt to lock - this function blocks until a lock is acquired or an error`
			`// occurs.`
			`acquired, err := l.attemptLock(stopCh)`
			`if err != nil {`
			`return nil, errwrap.Wrapf("lock: {{err}}", err)`
			`}`
			`if !acquired {`
			`return nil, nil`
			`}`

			`// We have the lock now`
			`l.held = true`

			`// Build the locks`
			`l.stopLock.Lock()`
			`l.stopCh = make(chan struct{})`
			`l.stopped = false`
			`l.stopLock.Unlock()`

			`// Periodically renew and watch the lock`
			`go l.renewLock()`
			`go l.watchLock()`

			`return l.stopCh, nil`
			`}`

			`// Unlock releases the lock.`
			`func (l *Lock) Unlock() error {`
			`defer metrics.MeasureSince(metricLockUnlock, time.Now())`

			`l.lock.Lock()`
			`defer l.lock.Unlock()`
			`if !l.held {`
			`return nil`
			`}`

			`// Stop any existing locking or renewal attempts`
			`l.stopLock.Lock()`
			`if !l.stopped {`
			`l.stopped = true`
			`close(l.stopCh)`
			`}`
			`l.stopLock.Unlock()`

			`// Delete`
			`ctx := context.Background()`
			`if err := l.backend.Delete(ctx, l.key); err != nil {`
			`return err`
			`}`

			`// We are no longer holding the lock`
			`l.held = false`

			`return nil`
			`}`

			`// Value returns the value of the lock and if it is held.`
			`func (l *Lock) Value() (bool, string, error) {`
			`defer metrics.MeasureSince(metricLockValue, time.Now())`

			`r, err := l.get(context.Background())`
			`if err != nil {`
			`return false, "", err`
			`}`
			`if r == nil {`
			`return false, "", err`
			`}`
			`return true, string(r.Value), nil`
			`}`

			`// attemptLock attempts to acquire a lock. If the given channel is closed, the`
			`// acquisition attempt stops. This function returns when a lock is acquired or`
			`// an error occurs.`
			`func (l *Lock) attemptLock(stopCh <-chan struct{}) (bool, error) {`
			`ticker := time.NewTicker(l.retryInterval)`
			`defer ticker.Stop()`

			`for {`
			`select {`
			`case <-ticker.C:`
			`acquired, err := l.writeLock()`
			`if err != nil {`
			`return false, errwrap.Wrapf("attempt lock: {{err}}", err)`
			`}`
			`if !acquired {`
			`continue`
			`}`

			`return true, nil`
			`case <-stopCh:`
			`return false, nil`
			`}`
			`}`
			`}`

			`// renewLock renews the given lock until the channel is closed.`
			`func (l *Lock) renewLock() {`
			`ticker := time.NewTicker(l.renewInterval)`
			`defer ticker.Stop()`

			`for {`
			`select {`
			`case <-ticker.C:`
			`l.writeLock()`
			`case <-l.stopCh:`
			`return`
			`}`
			`}`
			`}`

			`// watchLock checks whether the lock has changed in the table and closes the`
			`// leader channel accordingly. If an error occurs during the check, watchLock`
			`// will retry the operation and then close the leader channel if it can't`
			`// succeed after retries.`
			`func (l *Lock) watchLock() {`
			`retries := 0`
			`ticker := time.NewTicker(l.watchRetryInterval)`

			`for {`
			`// Check if the channel is already closed`
			`select {`
			`case <-l.stopCh:`
			`default:`
			`}`

			`// Check if we've exceeded retries`
			`if retries >= l.watchRetryMax-1 {`
			`break`
			`}`

			`// Wait for the timer`
			`<-ticker.C`

			`// Attempt to read the key`
			`r, err := l.get(context.Background())`
			`if err != nil {`
			`retries++`
			`continue`
			`}`

			`// Verify the identity is the same`
			`if r == nil \|\| r.Identity != l.identity {`
			`break`
			`}`
			`}`

			`l.stopLock.Lock()`
			`defer l.stopLock.Unlock()`
			`if !l.stopped {`
			`l.stopped = true`
			`close(l.stopCh)`
			`}`
			`}`

			`// writeLock writes the given lock using the following algorithm:`
			`//`
			`// - lock does not exist`
			`// - write the lock`
			`// - lock exists`
			`// - if key is empty or identity is the same or timestamp exceeds TTL`
			`// - update the lock to self`
			`func (l *Lock) writeLock() (bool, error) {`
			`// Pooling`
			`l.backend.permitPool.Acquire()`
			`defer l.backend.permitPool.Release()`

			`// Create a transaction to read and the update (maybe)`
			`ctx, cancel := context.WithCancel(context.Background())`
			`defer cancel()`

			`// The operation may be retried, so we need to stop it if we lose leadership.`
			`go func() {`
			`select {`
			`case <-l.stopCh:`
			`cancel()`
			`case <-ctx.Done():`
			`}`
			`}()`

			`// Build up the list of conditions`
			`var conds storage.Conditions`

			`// Read the record`
			`r, err := l.get(ctx)`
			`if err != nil {`
			`return false, errwrap.Wrapf("write lock: {{err}}", err)`
			`}`
			`if r != nil {`
			`// If the key is empty or the identity is ours or the ttl expired, we can`
			`// write. Otherwise, return now because we cannot.`
			`if r.Key != "" && r.Identity != l.identity && time.Now().UTC().Sub(r.Timestamp) < l.ttl {`
			`return false, nil`
			`}`

			`// CAS operation`
			`conds.GenerationMatch = r.attrs.Generation`
			`conds.MetagenerationMatch = r.attrs.Metageneration`
			`} else {`
			`// Ensure no one created while we were working`
			`conds.DoesNotExist = true`
			`}`

			`// Update the lock to now`
			`lockData, err := json.Marshal(&LockRecord{`
			`Key: l.key,`
			`Value: l.value,`
			`Identity: l.identity,`
			`Timestamp: time.Now().UTC(),`
			`})`
			`if err != nil {`
			`return false, errwrap.Wrapf("write lock: failed to encode JSON: {{err}}", err)`
			`}`

			`// Write the object`
			`obj := l.backend.client.Bucket(l.backend.bucket).Object(l.key)`
			`w := obj.If(conds).NewWriter(ctx)`
			`w.ObjectAttrs.CacheControl = "no-cache; no-store; max-age=0"`
			`w.ObjectAttrs.Metadata = map[string]string{`
			`"lock": string(lockData),`
			`}`
			`if err := w.Close(); err != nil {`
			`// If the pre-condition failed, it means that we already have a lock.`
			`if terr, ok := err.(*googleapi.Error); ok && terr.Code == 412 {`
			`return false, nil`
			`}`
			`return false, err`
			`}`

			`return true, nil`
			`}`

			`// get retrieves the value for the lock.`
			`func (l Lock) get(ctx context.Context) (LockRecord, error) {`
			`// Pooling`
			`l.backend.permitPool.Acquire()`
			`defer l.backend.permitPool.Release()`

			`// Read`
			`attrs, err := l.backend.client.Bucket(l.backend.bucket).Object(l.key).Attrs(ctx)`
			`if err == storage.ErrObjectNotExist {`
			`return nil, nil`
			`}`
			`if err != nil {`
			`return nil, errwrap.Wrapf(fmt.Sprintf("failed to read attrs for %q: {{err}}", l.key), err)`
			`}`

			`// If we got this far, we have attributes, meaning the lockfile exists.`
			`var r LockRecord`
			`r.attrs = attrs`
			`lockData := []byte(attrs.Metadata["lock"])`
			`if err := json.Unmarshal(lockData, &r); err != nil {`
			`return nil, errwrap.Wrapf("failed to decode lock: {{err}}", err)`
			`}`
			`return &r, nil`
			`}`