Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Etcd2Topo: Use node's ModRevision consistently for in-memory topo.Version value #15847

Merged
merged 4 commits into from
May 12, 2024
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
11 changes: 7 additions & 4 deletions go/vt/topo/etcd2topo/watch.go
Original file line number Diff line number Diff line change
Expand Up @@ -51,7 +51,10 @@ func (s *Server) Watch(ctx context.Context, filePath string) (*topo.WatchData, <
}
wd := &topo.WatchData{
Contents: initial.Kvs[0].Value,
Version: EtcdVersion(initial.Kvs[0].Version),
// ModRevision is used for the topo.Version value as we get the new Revision value back
// when updating the file/key within a transaction in file.go and so this is the opaque
// version that we can use to enforce serializable writes for the file/key.
Version: EtcdVersion(initial.Kvs[0].ModRevision),
}

// Create an outer context that will be canceled on return and will cancel all inner watches.
Expand Down Expand Up @@ -133,7 +136,7 @@ func (s *Server) Watch(ctx context.Context, filePath string) (*topo.WatchData, <
case mvccpb.PUT:
notifications <- &topo.WatchData{
Contents: ev.Kv.Value,
Version: EtcdVersion(ev.Kv.Version),
Version: EtcdVersion(ev.Kv.ModRevision),
}
case mvccpb.DELETE:
// Node is gone, send a final notice.
Expand Down Expand Up @@ -174,7 +177,7 @@ func (s *Server) WatchRecursive(ctx context.Context, dirpath string) ([]*topo.Wa
var wd topo.WatchDataRecursive
wd.Path = string(kv.Key)
wd.Contents = kv.Value
wd.Version = EtcdVersion(initial.Kvs[0].Version)
wd.Version = EtcdVersion(initial.Kvs[0].ModRevision)
initialwd = append(initialwd, &wd)
}

Expand Down Expand Up @@ -256,7 +259,7 @@ func (s *Server) WatchRecursive(ctx context.Context, dirpath string) ([]*topo.Wa
Path: string(ev.Kv.Key),
WatchData: topo.WatchData{
Contents: ev.Kv.Value,
Version: EtcdVersion(ev.Kv.Version),
Version: EtcdVersion(ev.Kv.ModRevision),
},
}
case mvccpb.DELETE:
Expand Down
159 changes: 159 additions & 0 deletions go/vt/topo/etcd2topo/watch_test.go
Original file line number Diff line number Diff line change
@@ -0,0 +1,159 @@
/*
Copyright 2024 The Vitess Authors.

Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
*/

package etcd2topo

import (
"context"
"fmt"
"path"
"sync/atomic"
"testing"
"time"

"github.com/stretchr/testify/require"

clientv3 "go.etcd.io/etcd/client/v3"

"vitess.io/vitess/go/test/utils"
"vitess.io/vitess/go/vt/topo"
)

// TestWatchTopoVersion tests how the topo.Version values work within the etcd2topo
// Watch implementation. Today, those logical versions are based on the key's
// ModRevision value, which is a monotonically increasing int64 value. See
// https://github.com/vitessio/vitess/pull/15847 for additional details and the
// current reasoning behind using ModRevision. This can be changed in the future
// but should be done so intentionally, thus this test ensures we don't change the
// behavior accidentally/unintentionally.
//
// The test creates a key, watches it through Server.Watch, and has a background
// goroutine write a batch of updates, delete the key, and then write a second
// batch. The main goroutine asserts that every watch notification carries a
// version exactly one higher than the previous one, and that the number of
// notifications seen matches the number of changes made.
func TestWatchTopoVersion(t *testing.T) {
	ctx := utils.LeakCheckContext(t)
	etcdServerAddr, _ := startEtcd(t, 0)
	root := "/vitess/test"
	name := "testkey"
	// Named keyPath rather than path so the imported path package is not shadowed.
	keyPath := path.Join(root, name)
	value := "testval"
	// We use these two variables to ensure that we receive all of the changes in
	// our watch.
	changesMade := atomic.Int64{} // This is accessed across goroutines
	changesSeen := int64(0)
	client, err := clientv3.New(clientv3.Config{
		Endpoints:   []string{etcdServerAddr},
		DialTimeout: 5 * time.Second,
	})
	require.NoError(t, err)
	serverRunningCh := make(chan struct{})
	server := &Server{
		cli:     client,
		root:    root,
		running: serverRunningCh,
	}
	defer server.Close()

	// Create the key as the vitess topo server requires that it exist before you
	// can watch it (the lower level etcd watch does not require this).
	_, err = client.Put(ctx, keyPath, fmt.Sprintf("%s-%d", value, changesMade.Load()))
	require.NoError(t, err, "initial Put of %s failed", keyPath)
	changesMade.Add(1)

	var data <-chan *topo.WatchData
	_, data, err = server.Watch(ctx, name)
	require.NoError(t, err, "Server.Watch() error = %v", err)

	// Coordinate between the goroutines on the delete so that we don't miss
	// N changes when restarting the watch.
	token := make(chan struct{})
	defer close(token)

	// Run a goroutine that updates the key we're watching.
	//
	// Errors from Put/Delete are deliberately not asserted in here: require
	// ends the test via FailNow, which must only be called from the goroutine
	// running the test. A failed write is still counted in changesMade, so it
	// is expected to surface as a changesMade/changesSeen mismatch in the
	// final assertion below.
	go func() {
		cur := changesMade.Load() + 1
		batchSize := int64(10)
		for i := cur; i <= cur+batchSize; i++ {
			client.Put(ctx, keyPath, fmt.Sprintf("%s-%d", value, i))
			changesMade.Add(1)
			select {
			case <-ctx.Done():
				return
			default:
			}
		}
		// Delete the key to ensure that our version continues to be monotonically
		// increasing.
		client.Delete(ctx, keyPath)
		changesMade.Add(1)
		// Let the main goroutine process the delete and restart the watch before
		// we make more changes. The channel is unbuffered, so this send blocks
		// until the main goroutine receives from it.
		token <- struct{}{}
		cur = changesMade.Load() + 1
		for i := cur; i <= cur+batchSize; i++ {
			client.Put(ctx, keyPath, fmt.Sprintf("%s-%d", value, i))
			changesMade.Add(1)
			select {
			case <-ctx.Done():
				return
			default:
			}
		}
	}()

	// When using ModRevision as the logical key version, the Revision is initially
	// 1 as we're at the first change of the keyspace (it has been created). This
	// means that the first time we receive a change in the watch, we should expect
	// the key's topo.Version to be 2 as it's the second change to the keyspace.
	// We start with 1 as we increment this every time we receive a change in the
	// watch.
	expectedVersion := int64(1)

	// Consider the test done when we've been watching the key for 10 seconds. We
	// should receive all of the changes made within 1 second but we allow for a lot
	// of extra time to prevent flakiness when the host is very slow for any reason.
	watchCtx, cancel := context.WithTimeout(ctx, 10*time.Second)
	defer cancel()
	for {
		select {
		case <-watchCtx.Done():
			require.Equal(t, changesMade.Load(), changesSeen, "expected %d changes, got %d", changesMade.Load(), changesSeen)
			return // Success, we're done
		case <-ctx.Done():
			require.FailNow(t, "test context cancelled")
		case <-serverRunningCh:
			require.FailNow(t, "topo server is no longer running")
		case wd := <-data:
			// Every notification, including the one for the delete, counts as a
			// change and advances the expected version by one.
			changesSeen++
			expectedVersion++
			if wd.Err != nil {
				if topo.IsErrType(wd.Err, topo.NoNode) {
					// This was our delete. We'll restart the watch.
					// Note that the lower level etcd watch doesn't treat delete as
					// any special kind of change/event, it's another change to the
					// key, but our topo server Watch treats this as an implicit end
					// of the watch and it terminates it.
					// We create the key again as the vitess topo server requires
					// that it exist before watching it.
					_, err = client.Put(ctx, keyPath, fmt.Sprintf("%s-%d", value, changesMade.Load()))
					require.NoError(t, err, "Put to recreate %s after delete failed", keyPath)
					changesMade.Add(1)
					_, data, err = server.Watch(ctx, name)
					require.NoError(t, err, "Server.Watch() error = %v", err)
					<-token // Tell the goroutine making changes to continue
					continue
				}
				require.FailNow(t, "unexpected error in watch data", "error: %v", wd.Err)
			}
			gotVersion := int64(wd.Version.(EtcdVersion))
			require.Equal(t, expectedVersion, gotVersion, "expected version %d, got %d", expectedVersion, gotVersion)
		}
	}
}
Loading