m/p/supervisor: wait for runnables to exit in TestHarness This ensures that tests which aren't marked as parallel won't interfere with each other due to still running runnables (for example, gracefully terminating gRPC services listening on some stable port number). To implement this, we add the Liquidator, a goroutine responsible for maintaining a minimum viable supervisor processor which records all runnables' exits. These can then be inspected by the TestHarness to ensure that all runnables are truly dead. Change-Id: I436f9608d1e0e04796f7198b641e7d625df885f8 Reviewed-on: https://review.monogon.dev/c/monogon/+/625 Reviewed-by: Leopold Schabel <leo@nexantic.com>

commit: ec19b60842e905a4400e5f8b46b783a54d0a025a [log] [tgz]
author: Serge Bazanski <serge@monogon.tech> Wed Mar 09 20:41:31 2022 +0100
committer: Sergiusz Bazanski <serge@monogon.tech> Fri Mar 11 11:00:50 2022 +0000
tree: b4c0d22ef5dc693a21fef4e987d9c82457d816f6
parent: 662182fd732fb523ee76bdc069f603bc378a6d2e [diff] [blame]
diff --git a/metropolis/pkg/supervisor/supervisor_testhelpers.go b/metropolis/pkg/supervisor/supervisor_testhelpers.go
index 85361c2..1bfb6c0 100644
--- a/metropolis/pkg/supervisor/supervisor_testhelpers.go
+++ b/metropolis/pkg/supervisor/supervisor_testhelpers.go

@@ -19,7 +19,10 @@
 import (
 	"context"
 	"errors"
+	"log"
+	"sort"
 	"testing"
+	"time"
 
 	"source.monogon.dev/metropolis/pkg/logtree"
 )
@@ -32,9 +35,10 @@
 // error, the harness will throw a test error, but will not abort the test.
 //
 // The harness also returns a context cancel function that can be used to
-// terminate the started supervisor early.  Regardless of manual cancellation,
+// terminate the started supervisor early. Regardless of manual cancellation,
 // the supervisor will always be terminated up at the end of the test/benchmark
-// it's running in.
+// it's running in. The supervision tree will also be cleaned up and the test
+// will block until all runnables have exited.
 //
 // The second returned value is the logtree used by this supervisor. It can be
 // used to assert some log messages are emitted in tests that exercise some
@@ -43,12 +47,11 @@
 	t.Helper()
 
 	ctx, ctxC := context.WithCancel(context.Background())
-	t.Cleanup(ctxC)
 
 	lt := logtree.New()
 	logtree.PipeAllToStderr(t, lt)
 
-	New(ctx, func(ctx context.Context) error {
+	sup := New(ctx, func(ctx context.Context) error {
 		Logger(ctx).Infof("Starting test %s...", t.Name())
 		if err := r(ctx); err != nil && !errors.Is(err, ctx.Err()) {
 			t.Errorf("Supervised runnable in harness returned error: %v", err)
@@ -56,5 +59,31 @@
 		}
 		return nil
 	}, WithExistingLogtree(lt))
+
+	t.Cleanup(func() {
+		log.Printf("supervisor.TestHarness: Canceling context...")
+		ctxC()
+		log.Printf("supervisor.TestHarness: Waiting for supervisor runnables to die...")
+		timeoutNag := time.Now().Add(5 * time.Second)
+
+		for {
+			live := sup.liveRunnables()
+			if len(live) == 0 {
+				log.Printf("supervisor.TestHarness: All done.")
+				return
+			}
+
+			if time.Now().After(timeoutNag) {
+				timeoutNag = time.Now().Add(5 * time.Second)
+				sort.Strings(live)
+				log.Printf("supervisor.TestHarness: Still live:")
+				for _, l := range live {
+					log.Printf("supervisor.TestHarness: - %s", l)
+				}
+			}
+
+			time.Sleep(time.Second)
+		}
+	})
 	return ctxC, lt
 }
commit	ec19b60842e905a4400e5f8b46b783a54d0a025a	[log] [tgz]
author	Serge Bazanski <serge@monogon.tech>	Wed Mar 09 20:41:31 2022 +0100
committer	Sergiusz Bazanski <serge@monogon.tech>	Fri Mar 11 11:00:50 2022 +0000
tree	b4c0d22ef5dc693a21fef4e987d9c82457d816f6
parent	662182fd732fb523ee76bdc069f603bc378a6d2e [diff] [blame]