ory · aeneasr · Dec 20, 2022 · Dec 19, 2022 · Dec 19, 2022 · Dec 20, 2022
@@ -274,29 +274,36 @@ func (e *WebHook) execute(ctx context.Context, data *templateContext) error {
 			attribute.String("webhook.identity.nid", data.Identity.NID.String()),
 		)
 	}
+
 	var (
-		httpClient                       = e.deps.HTTPClient(ctx)
-		async                            = gjson.GetBytes(e.conf, "response.ignore").Bool()
-		parseResponse                    = gjson.GetBytes(e.conf, "can_interrupt").Bool()
-		tracer                           = trace.SpanFromContext(ctx).TracerProvider().Tracer("kratos-webhooks")
-		cancel        context.CancelFunc = func() {}
-		spanOpts                         = []trace.SpanStartOption{trace.WithAttributes(attrs...)}
-		errChan                          = make(chan error, 1)
+		httpClient     = e.deps.HTTPClient(ctx)
+		ignoreResponse = gjson.GetBytes(e.conf, "response.ignore").Bool()
+		canInterrupt   = gjson.GetBytes(e.conf, "can_interrupt").Bool()
+		tracer         = trace.SpanFromContext(ctx).TracerProvider().Tracer("kratos-webhooks")
+		spanOpts       = []trace.SpanStartOption{trace.WithAttributes(attrs...)}
+		errChan        = make(chan error, 1)
 	)
-	if async {
-		// dissociate the context from the one passed into this function
-		ctx, cancel = context.WithTimeout(context.Background(), 5*time.Minute)
-		spanOpts = append(spanOpts, trace.WithNewRoot())
-	}
+
 	ctx, span := tracer.Start(ctx, "Webhook", spanOpts...)
 	e.deps.Logger().WithRequest(req.Request).Info("Dispatching webhook")
-	t0 := time.Now()
+
+	req = req.WithContext(ctx)
+	if ignoreResponse {
+		// This is one of the few places where spawning a context.Background() is ok. We need to do this
+		// because the function runs asynchronously and we don't want to cancel the request if the
+		// incoming request context is cancelled.
+		//
+		// The webhook will still cancel after 30 seconds as that is the configured timeout for the HTTP client.
+		req = req.WithContext(context.Background())
+		// spanOpts = append(spanOpts, trace.WithNewRoot())
+	}
+
+	startTime := time.Now()
 	go func() {
 		defer close(errChan)
-		defer cancel()
 		defer span.End()
 
-		resp, err := httpClient.Do(req.WithContext(ctx))
+		resp, err := httpClient.Do(req)
 		if err != nil {
 			span.SetStatus(codes.Error, err.Error())
 			errChan <- errors.WithStack(err)
@@ -307,7 +314,7 @@ func (e *WebHook) execute(ctx context.Context, data *templateContext) error {
 
 		if resp.StatusCode >= http.StatusBadRequest {
 			span.SetStatus(codes.Error, "HTTP status code >= 400")
-			if parseResponse {
+			if canInterrupt {
 				if err := parseWebhookResponse(resp); err != nil {
 					span.SetStatus(codes.Error, err.Error())
 					errChan <- err
@@ -320,16 +327,17 @@ func (e *WebHook) execute(ctx context.Context, data *templateContext) error {
 		errChan <- nil
 	}()
 
-	if async {
+	if ignoreResponse {
 		traceID, spanID := span.SpanContext().TraceID(), span.SpanContext().SpanID()
+		logger := e.deps.Logger().WithField("otel", map[string]string{
+			"trace_id": traceID.String(),
+			"span_id":  spanID.String(),
+		})
 		go func() {
 			if err := <-errChan; err != nil {
-				e.deps.Logger().WithField("otel", map[string]string{
-					"trace_id": traceID.String(),
-					"span_id":  spanID.String(),
-				}).WithError(err).Warning("Webhook request failed but the error was ignored because the configuration indicated that the upstream response should be ignored.")
+				logger.WithField("duration", time.Since(startTime)).WithError(err).Warning("Webhook request failed but the error was ignored because the configuration indicated that the upstream response should be ignored.")
 			} else {
-				e.deps.Logger().WithField("duration", time.Since(t0)).Info("Webhook request succeeded")
+				logger.WithField("duration", time.Since(startTime)).Info("Webhook request succeeded")
 			}
 		}()
 		return nil

@@ -861,13 +861,15 @@ func TestAsyncWebhook(t *testing.T) {
 		URL:    &url.URL{Path: "/some_end_point"},
 		Method: http.MethodPost,
 	}
+
 	incomingCtx, incomingCancel := context.WithCancel(context.Background())
 	if deadline, ok := t.Deadline(); ok {
 		// cancel this context one second before test timeout for clean shutdown
 		var cleanup context.CancelFunc
 		incomingCtx, cleanup = context.WithDeadline(incomingCtx, deadline.Add(-time.Second))
 		defer cleanup()
 	}
+
 	req = req.WithContext(incomingCtx)
 	s := &session.Session{ID: x.NewUUID(), Identity: &identity.Identity{ID: x.NewUUID()}}
 	f := &login.Flow{ID: x.NewUUID()}
@@ -899,36 +901,23 @@ func TestAsyncWebhook(t *testing.T) {
 	}
 	// at this point, a goroutine is in the middle of the call to our test handler and waiting for a response
 	incomingCancel() // simulate the incoming Kratos request having finished
+	close(blockHandlerOnExit)
 	timeout := time.After(200 * time.Millisecond)
-	for done := false; !done; {
-		if last := logHook.LastEntry(); last != nil {
-			msg, err := last.String()
-			require.NoError(t, err)
-			assert.Contains(t, msg, "Dispatching webhook")
+	var found bool
+	for !found {
+		for _, entry := range logHook.AllEntries() {
+			if entry.Message == "Webhook request succeeded" {
+				found = true
+				break
+			}
 		}
 
-		select {
-		case <-timeout:
-			done = true
-		case <-time.After(50 * time.Millisecond):
-			// continue loop
-		}
-	}
-	logHook.Reset()
-	close(blockHandlerOnExit)
-	timeout = time.After(200 * time.Millisecond)
-	for {
-		if last := logHook.LastEntry(); last != nil {
-			msg, err := last.String()
-			require.NoError(t, err)
-			assert.Contains(t, msg, "Webhook request succeeded")
-			break
-		}
 		select {
 		case <-timeout:
 			t.Fatal("timed out waiting for successful webhook completion")
 		case <-time.After(50 * time.Millisecond):
 			// continue loop
 		}
 	}
+	require.True(t, found)
 }