keyring: fix flake in replication-after-election test (#13749)

The test for simulating a key rotation across leader elections was flaky because we weren't waiting for a leader election and was checking the server configs rather than raft for which server was currently the leader. Fixing the flake revealed a bug in the test that we weren't ensuring the new leader was running its own replication, so it wouldn't pick up the key material from the previous follower.
2026-01-06 10:25:42 +03:00 · 2022-07-15 11:09:09 -04:00
parent 573aa4519e
commit 7967c65dd2
1 changed files with 8 additions and 12 deletions
--- a/nomad/encrypter_test.go
+++ b/nomad/encrypter_test.go
@@ -189,15 +189,11 @@ func TestKeyringReplicator(t *testing.T) {
 	checkReplicationFn := func(keyID string) func() bool {
 		return func() bool {
 			for _, srv := range servers {
-				if srv == leader {
-					continue
-				}
 				keyPath := filepath.Join(srv.GetConfig().DataDir, "keystore",
 					keyID+nomadKeystoreExtension)
 				if _, err := os.Stat(keyPath); err != nil {
 					return false
 				}
-
 			}
 			return true
 		}
@@ -245,9 +241,6 @@ func TestKeyringReplicator(t *testing.T) {
 	// key, and triggering a leader election.

 	for _, srv := range servers {
-		if srv == leader {
-			continue
-		}
 		srv.keyringReplicator.stop()
 	}

@@ -258,14 +251,17 @@ func TestKeyringReplicator(t *testing.T) {
 	err = leader.leadershipTransfer()
 	require.NoError(t, err)

+	testutil.WaitForLeader(t, leader.RPC)
+
 	for _, srv := range servers {
-		if ok, _ := srv.getLeader(); !ok {
-			ctx, cancel := context.WithCancel(context.Background())
-			defer cancel()
-			go srv.keyringReplicator.run(ctx)
-		} else {
+		if ok, _ := srv.getLeader(); ok {
 			t.Logf("new leader is %s", srv.config.NodeName)
 		}
+
+		ctx, cancel := context.WithCancel(context.Background())
+		defer cancel()
+		t.Logf("replicating on %s", srv.config.NodeName)
+		go srv.keyringReplicator.run(ctx)
 	}

 	require.Eventually(t, checkReplicationFn(keyID3),