diff --git a/connectivity/suite.go b/connectivity/suite.go index c25688c200..079a26f085 100644 --- a/connectivity/suite.go +++ b/connectivity/suite.go @@ -217,6 +217,8 @@ func Run(ctx context.Context, ct *check.ConnectivityTest, addExtraTests func(*ch // include --include-upgrade-tests" return ct.Run(ctx) } + + ct.NewTest("no-missed-tail-calls").WithScenarios(tests.NoMissedTailCalls()) } // Run all tests without any policies in place. diff --git a/connectivity/tests/errors.go b/connectivity/tests/errors.go index 1fd1671201..ffd207dbf3 100644 --- a/connectivity/tests/errors.go +++ b/connectivity/tests/errors.go @@ -5,10 +5,12 @@ package tests import ( "context" + "strconv" "strings" "time" "github.com/cilium/cilium-cli/connectivity/check" + "github.com/cilium/cilium-cli/defaults" ) // NoErrorsInLogs checks whether there are no error messages in cilium-agent @@ -41,6 +43,50 @@ func (n *noErrorsInLogs) Run(ctx context.Context, t *check.Test) { } +// NoMissedTailCalls checks whether there were no drops due to missed (BPF) +// tail calls. +func NoMissedTailCalls() check.Scenario { + return &noMissedTailCalls{} +} + +type noMissedTailCalls struct{} + +func (n *noMissedTailCalls) Name() string { + return "no-missed-tail-calls" +} + +func (n *noMissedTailCalls) Run(ctx context.Context, t *check.Test) { + ct := t.Context() + cmd := []string{ + "/bin/sh", "-c", + "cilium metrics list -o json | jq '.[] | select( .name == \"cilium_drop_count_total\" and .labels.reason == \"Missed tail call\" ).value'", + } + + for _, pod := range ct.CiliumPods() { + pod := pod + stdout, err := pod.K8sClient.ExecInPod(ctx, pod.Pod.Namespace, pod.Pod.Name, defaults.AgentContainerName, cmd) + if err != nil { + t.Fatalf("Error fetching missed tail call drop counts: %s", err) + } + countStr := stdout.String() + t.NewAction(n, pod.Pod.Name, nil, nil, check.IPFamilyNone).Run(func(a *check.Action) { + if countStr == "" { + return + } + + count, err := strconv.Atoi(countStr) + if err != nil { + a.Fatalf("Failed to convert missed tail call drops %q to int: %s", countStr, err) + } + + if count != 0 { + a.Fatalf("Detected drops due to missed tail calls: %d", count) + } + }) + } + +} + func checkErrorsInLogs(logs string, a *check.Action) { uniqueFailures := make(map[string]int) for _, msg := range strings.Split(logs, "\n") {