Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Increase scheduler worker cancellation chan cap #741

Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
1 change: 1 addition & 0 deletions CHANGELOG.md
Original file line number Diff line number Diff line change
Expand Up @@ -200,6 +200,7 @@
* [BUGFIX] Ruler: fix formatting of rule groups in `/ruler/rule_groups` endpoint. #655
* [BUGFIX] Querier: Disable query scheduler SRV DNS lookup. #689
* [BUGFIX] Query-frontend: fix API error messages that were mentioning Prometheus `--enable-feature=promql-negative-offset` and `--enable-feature=promql-at-modifier` flags. #688
* [BUGFIX] Query-frontend: worker's cancellation channels are now buffered to ensure that all request cancellations are properly handled. #741

### Mixin (changes since `grafana/cortex-jsonnet` `1.9.0`)

Expand Down
12 changes: 3 additions & 9 deletions pkg/frontend/v2/frontend.go
Original file line number Diff line number Diff line change
Expand Up @@ -196,21 +196,14 @@ func (f *Frontend) RoundTripGRPC(ctx context.Context, req *httpgrpc.HTTPRequest)
retries := f.cfg.WorkerConcurrency + 1 // To make sure we hit at least two different schedulers.

enqueueAgain:
var cancelCh chan<- uint64
select {
case <-ctx.Done():
return nil, ctx.Err()

case f.requestsCh <- freq:
// Enqueued, let's wait for response.
}

var cancelCh chan<- uint64

select {
case <-ctx.Done():
return nil, ctx.Err()

case enqRes := <-freq.enqueue:
enqRes := <-freq.enqueue
colega marked this conversation as resolved.
Show resolved Hide resolved
if enqRes.status == waitForResponse {
cancelCh = enqRes.cancelCh
break // go wait for response.
Expand All @@ -232,6 +225,7 @@ enqueueAgain:
// cancellation sent.
default:
// failed to cancel, ignore.
level.Warn(f.log).Log("msg", "failed to send cancellation request to scheduler, queue full")
}
}
return nil, ctx.Err()
Expand Down
13 changes: 11 additions & 2 deletions pkg/frontend/v2/frontend_scheduler_worker.go
Original file line number Diff line number Diff line change
Expand Up @@ -26,7 +26,12 @@ import (
"github.com/grafana/mimir/pkg/util"
)

const schedulerAddressLabel = "scheduler_address"
// schedulerAddressLabel names the scheduler-address attribute attached to
// worker-related diagnostics (presumably logs/metrics — confirm at usage sites).
const schedulerAddressLabel = "scheduler_address"

// schedulerWorkerCancelChanCapacity should be at least as big as the number of
// sub-queries issued by a single query per scheduler (after splitting and
// sharding), so that all of them can be canceled while the scheduler worker is
// busy.
const schedulerWorkerCancelChanCapacity = 1000

type frontendSchedulerWorkers struct {
services.Service
Expand Down Expand Up @@ -197,7 +202,7 @@ func newFrontendSchedulerWorker(conn *grpc.ClientConn, schedulerAddr string, fro
schedulerAddr: schedulerAddr,
frontendAddr: frontendAddr,
requestCh: requestCh,
cancelCh: make(chan uint64),
cancelCh: make(chan uint64, schedulerWorkerCancelChanCapacity),
enqueuedRequests: enqueuedRequests,
}
w.ctx, w.cancel = context.WithCancel(context.Background())
Expand Down Expand Up @@ -331,6 +336,10 @@ func (w *frontendSchedulerWorker) schedulerLoop(loop schedulerpb.SchedulerForFro
Body: []byte("too many outstanding requests"),
},
}

default:
level.Error(w.log).Log("msg", "unknown response status from the scheduler", "resp", resp, "queryID", req.queryID)
req.enqueue <- enqueueResult{status: failed}
}

case reqID := <-w.cancelCh:
Expand Down
49 changes: 49 additions & 0 deletions pkg/frontend/v2/frontend_test.go
Original file line number Diff line number Diff line change
Expand Up @@ -228,6 +228,55 @@ func TestFrontendCancellation(t *testing.T) {
})
}

// When the frontendWorker that processed the request is busy (processing a new
// request or cancelling a previous one) we still need to make sure that the
// cancellation reaches the scheduler at some point.
// Issue: https://github.com/grafana/mimir/issues/740
func TestFrontendWorkerCancellation(t *testing.T) {
	f, ms := setupFrontend(t, nil, nil)

	ctx, cancel := context.WithTimeout(context.Background(), 200*time.Millisecond)
	defer cancel()

	// Send more requests than the scheduler's max concurrency, so that all frontend
	// workers are kept busy serving requests while the context deadline expires.
	reqCount := testFrontendWorkerConcurrency + 5
	var wg sync.WaitGroup
	for i := 0; i < reqCount; i++ {
		wg.Add(1)
		go func() {
			defer wg.Done()
			resp, err := f.RoundTripGRPC(user.InjectOrgID(ctx, "test"), &httpgrpc.HTTPRequest{})
			// Don't use require.* here: require calls t.FailNow(), which must only be
			// invoked from the goroutine running the test function. t.Errorf is
			// goroutine-safe.
			if err == nil || err.Error() != context.DeadlineExceeded.Error() {
				t.Errorf("expected error %v, got %v", context.DeadlineExceeded, err)
			}
			if resp != nil {
				t.Errorf("expected nil response, got %v", resp)
			}
		}()
	}

	wg.Wait()

	// Wait a bit to make sure the scheduler receives the cancellation requests.
	// 2 * reqCount because every enqueued request should be followed by a
	// corresponding cancel request.
	test.Poll(t, 5*time.Second, 2*reqCount, func() interface{} {
		ms.mu.Lock()
		defer ms.mu.Unlock()

		return len(ms.msgs)
	})

	ms.checkWithLock(func() {
		require.Equal(t, 2*reqCount, len(ms.msgs))
		msgTypeCounts := map[schedulerpb.FrontendToSchedulerType]int{}
		for _, msg := range ms.msgs {
			msgTypeCounts[msg.Type]++
		}
		expectedMsgTypeCounts := map[schedulerpb.FrontendToSchedulerType]int{
			schedulerpb.ENQUEUE: reqCount,
			schedulerpb.CANCEL:  reqCount,
		}
		require.Equalf(t, expectedMsgTypeCounts, msgTypeCounts,
			"Should receive %d enqueue (%d) requests, and %d cancel (%d) requests.", reqCount, schedulerpb.ENQUEUE, reqCount, schedulerpb.CANCEL,
		)
	})
}

func TestFrontendFailedCancellation(t *testing.T) {
f, ms := setupFrontend(t, nil, nil)

Expand Down