test(notifier): add regression test for stale unregister on re-register

Add TestNotifierReRegisterKeepsNewestSlot to reproduce the race where
an old unregister callback can remove a newer worker registration.

This test fails without the follow-up notifier fix.
This commit is contained in:
Matthew Buckingham-Bishop 2026-03-05 00:16:14 -08:00
parent 5691835f67
commit 42c6b723f6
1 changed files with 33 additions and 0 deletions

View File

@ -47,3 +47,36 @@ func TestNotifier(t *testing.T) {
wg.Wait()
}
func TestNotifierReRegisterKeepsNewestSlot(t *testing.T) {
ctx := context.Background()
watcher := notifier.NewNotifier(zap.NewNop().Sugar())
const worker = "worker-a"
_, staleCancel := watcher.Register(ctx, worker)
newestCh, newestCancel := watcher.Register(ctx, worker)
defer newestCancel()
// Simulate stale connection cleanup arriving after the worker has already re-registered.
staleCancel()
notifyCtx, notifyCancel := context.WithTimeout(ctx, 300*time.Millisecond)
defer notifyCancel()
notifyErrCh := make(chan error, 1)
go func() {
notifyErrCh <- watcher.Notify(notifyCtx, worker, nil)
}()
select {
case <-newestCh:
case err := <-notifyErrCh:
require.NoError(t, err)
t.Fatal("notify returned before delivering message to newest registration")
case <-time.After(time.Second):
t.Fatal("timed out waiting for notify delivery")
}
require.NoError(t, <-notifyErrCh)
}