Support persistent watches
Implements the new persistent watch types introduced in 3.6, along with corresponding TreeCache and
NodeCache utilities that try to keep in sync with the remote state.
PapaCharlie committed Nov 17, 2022
1 parent 9cb9752 commit 70046d1
Showing 17 changed files with 2,434 additions and 100 deletions.
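For context: before ZooKeeper 3.6, watches were one-shot, so a client had to re-register a watch after every event and could miss changes that landed in the window between the event firing and the next registration. The sketch below shows that classic re-watch loop using the pre-existing go-zookeeper API (Conn.GetW); the persistent watch types this commit implements remove the need for it. This is an illustrative sketch, not code from the commit, and it assumes the module is imported as github.com/go-zookeeper/zk and an ensemble is reachable at 127.0.0.1:2181.

package main

import (
	"fmt"
	"time"

	"github.com/go-zookeeper/zk"
)

// watchLoop demonstrates the pre-3.6 pattern this commit obviates: GetW sets a
// one-shot watch, so the watch must be re-armed after every event, and updates
// that occur between the event and the next GetW call are never observed.
func watchLoop(conn *zk.Conn, path string) error {
	for {
		data, _, events, err := conn.GetW(path)
		if err != nil {
			return err
		}
		fmt.Printf("current data: %q\n", data)

		ev := <-events // the watch fires exactly once...
		fmt.Printf("event: %v\n", ev.Type)
		// ...so loop around to re-arm it, racing any concurrent updates.
	}
}

func main() {
	conn, _, err := zk.Connect([]string{"127.0.0.1:2181"}, time.Second)
	if err != nil {
		panic(err)
	}
	defer conn.Close()
	_ = watchLoop(conn, "/example")
}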
2 changes: 1 addition & 1 deletion Makefile
@@ -1,5 +1,5 @@
 # make file to hold the logic of build and test setup
-ZK_VERSION ?= 3.5.6
+ZK_VERSION ?= 3.6.3

 # Apache changed the name of the archive in version 3.5.x and separated out
 # src and binary packages
202 changes: 202 additions & 0 deletions cache_utils.go
@@ -0,0 +1,202 @@
package zk

import (
	"math"
	"math/rand"
	"strings"
	"sync"
	"sync/atomic"
	"time"
)

// ErrorFilter determines whether the given error can be retried, or if the call should be abandoned.
type ErrorFilter func(err error) (canRetry bool)

// BackoffPolicy computes how long ExecuteWithRetries should wait between failed attempts. If this returns a negative
// value, ExecuteWithRetries will exit with the last encountered error.
type BackoffPolicy func(attempt int) (backoff time.Duration)

// ExecuteWithRetries simply retries the given call as many times as the given ErrorFilter will allow, waiting in
// between attempts according to the BackoffPolicy. If the error filter says an error cannot be retried, the policy
// returns a negative backoff, or stopChan is closed, the last encountered error is returned.
func ExecuteWithRetries(
	filter ErrorFilter,
	policy BackoffPolicy,
	stopChan <-chan struct{},
	call func() (err error),
) (err error) {
	for attempt := 0; ; attempt++ {
		err = call()
		if err == nil {
			return nil
		}

		if !filter(err) {
			return err
		}

		backoff := policy(attempt)
		if backoff < 0 {
			return err
		}

		select {
		case <-stopChan:
			return err
		case <-time.After(backoff):
			continue
		}
	}
}

// The DefaultWatcherBackoffPolicy is an ExponentialBackoffPolicy with infinite retries. The reasoning behind infinite
// retries by default is that if any network connectivity issues arise, the watcher itself will likely be impacted or
// stop receiving events altogether. Retrying forever is the best bet to keep everything in sync.
var DefaultWatcherBackoffPolicy BackoffPolicy = (&ExponentialBackoffPolicy{
	InitialBackoff: 100 * time.Millisecond,
	MaxBackoff:     5 * time.Second,
	MaxAttempts:    math.MaxInt64,
}).ComputeBackoff

// RetryPolicyFunc adapts an ordinary function into a policy with a ComputeBackoff method. Unlike BackoffPolicy, it is
// also passed the last error encountered, allowing the backoff to depend on the failure itself.
type RetryPolicyFunc func(attempt int, lastError error) time.Duration

func (r RetryPolicyFunc) ComputeBackoff(attempt int, lastError error) (backoff time.Duration) {
	return r(attempt, lastError)
}

// ExponentialBackoffPolicy is a BackoffPolicy that implements exponential backoff and jitter (see "Full Jitter" in
// https://aws.amazon.com/blogs/architecture/exponential-backoff-and-jitter/). Retries are capped by MaxAttempts; the
// policy itself does not inspect the errors encountered.
type ExponentialBackoffPolicy struct {
	// The initial backoff duration and the value that will be multiplied when calculating the backoff for a specific
	// attempt.
	InitialBackoff time.Duration
	// The maximum duration to backoff.
	MaxBackoff time.Duration
	// How many times to retry a given call before bailing.
	MaxAttempts int
	// If non-nil, this rand.Rand will be used to generate the jitter. Otherwise, the global rand is used.
	Rand *rand.Rand
}

func (e *ExponentialBackoffPolicy) ComputeBackoff(attempt int) (backoff time.Duration) {
	if attempt > e.MaxAttempts {
		return -1
	}

	backoff = e.InitialBackoff << attempt
	if backoff < e.InitialBackoff /* check for overflow from left shift */ || backoff > e.MaxBackoff {
		backoff = e.MaxBackoff
	}

	if e.Rand != nil {
		backoff = time.Duration(e.Rand.Int63n(int64(backoff)))
	} else {
		backoff = time.Duration(rand.Int63n(int64(backoff)))
	}

	return backoff
}

// GetWithRetries attempts to fetch the given node's data using ExecuteWithRetries. It will attempt to retry all but
// the following three errors:
//   - zk.ErrNoNode: Retrying fetches on a node that doesn't exist isn't going to yield very interesting results,
//     especially in the context of a watch where an eventual zk.EventNodeCreated will notify the watcher of the
//     node's reappearance.
//   - zk.ErrConnectionClosed: This error is returned by any call made after Close() is called on a zk.Conn. This
//     call will never succeed.
//   - zk.ErrNoAuth: If a zk.Conn does not have the required authentication to access a node, retrying the call will
//     not succeed until authentication is added. It's best to report this as early as possible instead of blocking
//     the process.
func GetWithRetries(
	policy BackoffPolicy,
	stopChan chan struct{},
	conn *Conn,
	nodePath string,
) (data []byte, stat *Stat, err error) {
	err = ExecuteWithRetries(
		func(err error) bool {
			return err != ErrNoNode && err != ErrConnectionClosed && err != ErrNoAuth
		},
		policy,
		stopChan,
		func() (err error) {
			data, stat, err = conn.Get(nodePath)
			return err
		},
	)
	return data, stat, err
}

// MultiReadWithRetries batches the given ops by the given batchLimit and executes each batch in parallel. As with
// Conn.MultiRead, each MultiReadResponse corresponds to the ReadOp in the same position.
func MultiReadWithRetries(
	policy BackoffPolicy,
	stopChan chan struct{},
	conn *Conn,
	batchLimit int,
	ops ...ReadOp,
) (responses []MultiReadResponse, err error) {
	var firstErr atomic.Pointer[error]

	responses = make([]MultiReadResponse, len(ops))
	wg := sync.WaitGroup{}

	for offset := 0; offset < len(ops); offset += batchLimit {
		start := offset
		end := offset + batchLimit
		if end > len(ops) {
			end = len(ops)
		}

		wg.Add(1)
		go func() {
			defer wg.Done()
			var batchRes []MultiReadResponse
			err := ExecuteWithRetries(
				func(err error) (canRetry bool) {
					return err != ErrConnectionClosed
				},
				policy,
				stopChan,
				func() (err error) {
					batchRes, err = conn.MultiRead(ops[start:end]...)
					return err
				},
			)
			if err != nil {
				firstErr.CompareAndSwap(nil, &err)
				return
			}
			copy(responses[start:end], batchRes)
		}()
	}
	wg.Wait()
	if errPtr := firstErr.Load(); errPtr != nil {
		return nil, *errPtr
	}
	return responses, nil
}

// JoinPath joins the given parent and child into a single path, ensuring exactly one "/" separates them.
func JoinPath(parent, child string) string {
	if !strings.HasSuffix(parent, "/") {
		parent += "/"
	}
	if strings.HasPrefix(child, "/") {
		child = child[1:]
	}
	return parent + child
}

// SplitPath splits the given path into the parent directory and the final path element.
func SplitPath(path string) (dir, name string) {
	i := strings.LastIndex(path, "/")
	if i == 0 {
		dir, name = "/", path[1:]
	} else {
		dir, name = path[:i], path[i+1:]
	}
	return dir, name
}
73 changes: 73 additions & 0 deletions cache_utils_test.go
@@ -0,0 +1,73 @@
package zk

import (
	"fmt"
	"testing"
	"time"
)

func TestExecuteWithRetries(t *testing.T) {
	errors := make([]error, 5)
	for i := range errors {
		errors[i] = fmt.Errorf("%d", i)
	}
	idx := 0
	call := func() error {
		err := errors[idx]
		idx++
		return err
	}

	stopChan := make(chan struct{})

	err := ExecuteWithRetries(
		func(error) bool { return false },
		func(int) time.Duration { return 0 },
		stopChan,
		call,
	)
	if err != errors[0] {
		t.Fatalf("Did not get correct error: %+v", err)
	}

	idx = 0
	attempts := 0
	err = ExecuteWithRetries(
		func(error) bool {
			return idx <= 2
		},
		func(int) time.Duration {
			attempts++
			return 0
		},
		stopChan,
		call,
	)
	if err != errors[2] {
		t.Fatalf("Did not get correct error: %+v", err)
	}
	if attempts != 2 {
		t.Fatalf("Did not get correct attempt count: %d", attempts)
	}

	idx = 0
	attempts = 0
	err = ExecuteWithRetries(
		func(error) bool {
			return true
		},
		func(int) time.Duration {
			attempts++
			// If call is called again after stopChan is closed, it will panic because no more errors remain
			if attempts == 5 {
				close(stopChan)
			}
			return 0
		},
		stopChan,
		call,
	)
	if err != errors[4] {
		t.Fatalf("Did not get correct error: %+v", err)
	}
}
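The last test case above exercises the stopChan escape hatch: closing the channel makes the next backoff wait return the last encountered error. In application code, a natural way to drive it is from a context.Context, as in this sketch; the bridging goroutine and the synthetic error are illustrative, not part of the commit.

package main

import (
	"context"
	"errors"
	"fmt"
	"time"

	"github.com/go-zookeeper/zk"
)

func main() {
	ctx, cancel := context.WithTimeout(context.Background(), 2*time.Second)
	defer cancel()

	// Bridge the context to the stopChan that ExecuteWithRetries understands.
	stopChan := make(chan struct{})
	go func() {
		<-ctx.Done()
		close(stopChan)
	}()

	transient := errors.New("transient failure")
	err := zk.ExecuteWithRetries(
		func(err error) bool { return true }, // retry everything...
		zk.DefaultWatcherBackoffPolicy,       // ...forever, per the default policy
		stopChan,                             // ...until the context expires
		func() error { return transient },
	)
	fmt.Println(err) // "transient failure", after roughly 2 seconds
}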