Skip to content

Commit 4a9ad47

Browse files
committed
tests/integration: deflake etcd-io#15409
The cluster version will be initialized after the member becomes leader. The update is handled asynchronously. It might not be updated if the member has been closed and the Go runtime picks the `s.stopping` channel first.

```go
// https://github.com/etcd-io/etcd/blob/e2a5df534cf6b0a12859e61bfc2758d56a1e1971/server/etcdserver/server.go#L2170
func (s *EtcdServer) monitorClusterVersions() {
	...
	for {
		select {
		case <-s.firstCommitInTerm.Receive():
		case <-time.After(monitorVersionInterval):
		case <-s.stopping:
			return
		}
		...
	}
}
```

Or, after `s.stopping` has been closed, the [UpdateClusterVersion][1] won't fire GoAttach successfully. For etcd-io#15409, we can see the warn log `server has stopped; skipping GoAttach` from GoAttach:

```plain
https://github.com/etcd-io/etcd/actions/runs/4340931587/jobs/7580103902
logger.go:130: 2023-03-06T07:36:44.253Z WARN default stopping grpc server due to error {"error": "accept tcp 127.0.0.1:2379: use of closed network connection"}
logger.go:130: 2023-03-06T07:36:44.253Z WARN default stopped grpc server due to error {"error": "accept tcp 127.0.0.1:2379: use of closed network connection"}
logger.go:130: 2023-03-06T07:36:44.253Z ERROR default setting up serving from embedded etcd failed. {"error": "accept tcp 127.0.0.1:2379: use of closed network connection"}
logger.go:130: 2023-03-06T07:36:44.253Z ERROR default setting up serving from embedded etcd failed. {"error": "http: Server closed"}
logger.go:130: 2023-03-06T07:36:44.253Z INFO default skipped leadership transfer for single voting member cluster {"local-member-id": "8e9e05c52164694d", "current-leader-member-id": "8e9e05c52164694d"}
logger.go:130: 2023-03-06T07:36:44.253Z WARN default server has stopped; skipping GoAttach
...
```

If the cluster version isn't updated, the minimum storage version will be v3.5 because [AuthStatus][2] was introduced in [v3.5][3]. The comparison will fail.
To fix this issue, we should wait for the cluster version to become ready after the server is ready to serve requests.

[1]: <https://github.com/etcd-io/etcd/blob/e2a5df534cf6b0a12859e61bfc2758d56a1e1971/server/etcdserver/adapters.go#L45>
[2]: <etcd-io@071e70c>
[3]: <etcd-io@1b4e54c>

Signed-off-by: Wei Fu <[email protected]>
1 parent e2a5df5 commit 4a9ad47

File tree

1 file changed

+38
-3
lines changed

1 file changed

+38
-3
lines changed

tests/integration/utl_wal_version_test.go

Lines changed: 38 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -28,6 +28,7 @@ import (
2828
"go.etcd.io/etcd/server/v3/embed"
2929
"go.etcd.io/etcd/server/v3/storage/wal"
3030
"go.etcd.io/etcd/server/v3/storage/wal/walpb"
31+
framecfg "go.etcd.io/etcd/tests/v3/framework/config"
3132
"go.etcd.io/etcd/tests/v3/framework/integration"
3233
)
3334

@@ -45,28 +46,62 @@ func TestEtcdVersionFromWAL(t *testing.T) {
4546
t.Fatalf("failed to start embed.Etcd for test")
4647
}
4748

49+
// When the member becomes leader, it will update the cluster version
50+
// with the cluster's minimum version. As it's updated asynchronously,
51+
// it might not be updated in time before close. Wait for it to become
52+
// ready.
53+
if err := waitForClusterVersionReady(srv); err != nil {
54+
srv.Close()
55+
t.Fatalf("failed to wait for cluster version to become ready: %v", err)
56+
}
57+
4858
ccfg := clientv3.Config{Endpoints: []string{cfg.ACUrls[0].String()}}
4959
cli, err := integration.NewClient(t, ccfg)
5060
if err != nil {
5161
srv.Close()
5262
t.Fatal(err)
5363
}
54-
// Get auth status to increase etcd version of proto stored in wal
64+
65+
// Once the cluster version has been updated, any entity's storage
66+
// version should be aligned with the cluster version.
5567
ctx, cancel := context.WithTimeout(context.Background(), testutil.RequestTimeout)
56-
cli.AuthStatus(ctx)
68+
_, err = cli.AuthStatus(ctx)
5769
cancel()
70+
if err != nil {
71+
srv.Close()
72+
t.Fatalf("failed to get auth status: %v", err)
73+
}
5874

5975
cli.Close()
6076
srv.Close()
6177

6278
w, err := wal.Open(zap.NewNop(), cfg.Dir+"/member/wal", walpb.Snapshot{})
6379
if err != nil {
64-
panic(err)
80+
t.Fatal(err)
6581
}
6682
defer w.Close()
83+
6784
walVersion, err := wal.ReadWALVersion(w)
6885
if err != nil {
6986
t.Fatal(err)
7087
}
7188
assert.Equal(t, &semver.Version{Major: 3, Minor: 6}, walVersion.MinimalEtcdVersion())
7289
}
90+
91+
func waitForClusterVersionReady(srv *embed.Etcd) error {
92+
ctx, cancel := context.WithTimeout(context.Background(), 10*time.Second)
93+
defer cancel()
94+
95+
for {
96+
select {
97+
case <-ctx.Done():
98+
return ctx.Err()
99+
default:
100+
}
101+
102+
if srv.Server.ClusterVersion() != nil {
103+
return nil
104+
}
105+
time.Sleep(framecfg.TickDuration)
106+
}
107+
}

0 commit comments

Comments
 (0)