query laning and load shedding #9407

Merged

Changes from 6 commits

Commits (38)
6220985
prototype
clintropolis Jan 29, 2020
3f41001
merge QueryScheduler and QueryManager
clintropolis Jan 31, 2020
feae8b1
everything in its right place
clintropolis Feb 25, 2020
554b8b5
adjustments
clintropolis Feb 25, 2020
0597c3f
docs
clintropolis Feb 26, 2020
405c94e
fixes
clintropolis Feb 27, 2020
e22ece1
doc fixes
clintropolis Feb 28, 2020
e98cad7
use resilience4j instead of semaphore
clintropolis Feb 28, 2020
2069437
more tests
clintropolis Feb 28, 2020
eaf1449
simplify
clintropolis Feb 28, 2020
688ca43
checkstyle
clintropolis Feb 28, 2020
f0b3f9f
spelling
clintropolis Feb 28, 2020
87c6cbd
oops heh
clintropolis Feb 28, 2020
5e91bcb
remove unused
clintropolis Feb 28, 2020
912b7bc
simplify
clintropolis Feb 29, 2020
1e384bf
concurrency tests
clintropolis Mar 2, 2020
60861a4
add SqlResource tests, refactor error response
clintropolis Mar 3, 2020
9aed16e
add json config tests
clintropolis Mar 4, 2020
419ab98
use LongAdder instead of AtomicLong
clintropolis Mar 4, 2020
f0d39e1
remove test only stuffs from scheduler
clintropolis Mar 4, 2020
2afaaf1
javadocs, etc
clintropolis Mar 4, 2020
ef029c4
style
clintropolis Mar 4, 2020
059a2d4
partial review stuffs
clintropolis Mar 6, 2020
0ec8a26
adjust
clintropolis Mar 6, 2020
5711fce
review stuffs
clintropolis Mar 7, 2020
aa73a14
more javadoc
clintropolis Mar 7, 2020
50847af
error response documentation
clintropolis Mar 7, 2020
abe3631
spelling
clintropolis Mar 7, 2020
86501ef
preserve user specified lane for NoSchedulingStrategy
clintropolis Mar 7, 2020
8b7b70d
more test, why not
clintropolis Mar 7, 2020
91ad9d9
doc adjustment
clintropolis Mar 7, 2020
373fd11
style
clintropolis Mar 7, 2020
2741501
missed review for make a thing a constant
clintropolis Mar 9, 2020
8575cf8
fixes and tests
clintropolis Mar 9, 2020
25a8bda
fix test
clintropolis Mar 10, 2020
32965a4
Update docs/configuration/index.md
clintropolis Mar 10, 2020
361e06e
Merge remote-tracking branch 'upstream/master' into query-laning-and-…
clintropolis Mar 10, 2020
3ba7808
doc update
clintropolis Mar 10, 2020
@@ -104,7 +104,9 @@
import org.apache.druid.query.topn.TopNResultValue;
import org.apache.druid.segment.QueryableIndex;
import org.apache.druid.segment.QueryableIndexSegment;
import org.apache.druid.server.QueryScheduler;
import org.apache.druid.server.coordination.ServerType;
import org.apache.druid.server.scheduling.NoQueryLaningStrategy;
import org.apache.druid.timeline.DataSegment;
import org.apache.druid.timeline.DataSegment.PruneSpecsHolder;
import org.apache.druid.timeline.SegmentId;
@@ -338,7 +340,8 @@ public <T, QueryType extends Query<T>> QueryToolChest<T, QueryType> getToolChest
new CacheConfig(),
new DruidHttpClientConfig(),
processingConfig,
forkJoinPool
forkJoinPool,
new QueryScheduler(Integer.MAX_VALUE, NoQueryLaningStrategy.INSTANCE)
);
}

24 changes: 23 additions & 1 deletion docs/configuration/index.md
@@ -1476,9 +1476,31 @@ These Broker configurations can be defined in the `broker/runtime.properties` file
|`druid.broker.select.tier`|`highestPriority`, `lowestPriority`, `custom`|If segments are cross-replicated across tiers in a cluster, you can tell the broker to prefer to select segments in a tier with a certain priority.|`highestPriority`|
|`druid.broker.select.tier.custom.priorities`|`An array of integer priorities.`|Select servers in tiers with a custom priority list.|None|

##### Query laning

Druid provides facilities to aid in query capacity reservation for heterogeneous query workloads in the form of 'laning' strategies, which provide a variety of mechanisms to examine and classify a query at the broker, assigning it to a 'lane'. Lanes are defined with capacity limits which the broker will enforce, causing requests in excess of the capacity to be discarded with an HTTP 429 status code, reserving resources for other lanes or for interactive queries (with no lane).

Review comment:

> a variety of mechanisms examine

I believe a "to" is missing here?


|Property|Description|Default|
|--------|-----------|-------|
|`druid.query.scheduler.numThreads`|Maximum number of HTTP threads to dedicate to query processing. To save HTTP thread capacity, this should be lower than `druid.server.http.numThreads`.|Unbounded|
Contributor:

In what use case would I ever want to set it to something other than `druid.server.http.numThreads`? If the recommendation is to set it lower than `druid.server.http.numThreads`, then why isn't the default value set to `druid.server.http.numThreads - 1`?
I guess, as a user, I don't quite understand the importance of setting this higher/same/lower compared to `druid.server.http.numThreads` and when I should choose one vs the other.

Member Author:

> In what use case would I ever want to set it to something other than `druid.server.http.numThreads`?

I actually think we might always want to set it lower than `druid.server.http.numThreads`, but I was too nervous to make this the default and made it opt-in behavior instead (since it grabs and releases locks for each query; if there is some bug in releasing locks, a broker would eventually stop accepting queries entirely). The primary reason I think we want it lower than `druid.server.http.numThreads` is to save some 'slack' space for non-query HTTP connections, like accepting health checks, lookup management, and other such things that can be starved when long running queries start to pile up.

> If the recommendation is to set it lower than `druid.server.http.numThreads`, then why isn't the default value set to `druid.server.http.numThreads - 1`?

See my above nervousness, but I think `druid.server.http.numThreads - 1` would probably be a good default. This might want to be adjusted even lower depending on how much other non-query HTTP traffic the server is receiving (e.g. frequently polled/updated lookups, etc.).

> I guess, as a user, I don't quite understand the importance of setting this higher/same/lower compared to `druid.server.http.numThreads` and when I should choose one vs the other.

I would agree the current documentation doesn't quite adequately describe how this stuff might be utilized; in a future PR I want to add a section to the cluster tuning docs to more properly advise on when and how to set this up.

Contributor:

Thanks, I understand the reasoning now.
Lookup endpoints already have a QoS filter so they never consume more than two threads from Jetty; I wonder if in this world it makes sense to set up a QoS filter for non-query endpoints (say, hardcoded to 2) so that we can ensure they don't end up consuming more Jetty threads than intended.
Then the default could be `druid.query.scheduler.numThreads = druid.server.http.numThreads - numReservedForOthers` (with `numReservedForOthers=4`), and users would likely never be expected to touch `druid.query.scheduler.numThreads`.

The major behavior change with lane usage is really losing the queuing of requests to handle spikes and instead sending 429s immediately. In the future, we could introduce a mechanism to maintain statically/dynamically sized [per lane] waiting queues ourselves, along with the concurrency limits in the lane strategy.

Member Author (@clintropolis, Mar 12, 2020):

I wonder if it would make sense to instead move towards automatically computing druid.server.http.numThreads, since maybe it is easier for operators to only have to think about the number of concurrent queries to serve and just set druid.query.scheduler.numThreads? Druid could probably automatically figure out how many more http threads it needs based on configuration.

> The major behavior change with lane usage is really losing the queuing of requests to handle spikes and instead sending 429s immediately. In the future, we could introduce a mechanism to maintain statically/dynamically sized [per lane] waiting queues ourselves, along with the concurrency limits in the lane strategy.

Yeah, the current behavior is definitely a hard stop if you are over the line. I agree it would make sense to allow some sort of timed-out queuing behavior, which is what the Jetty QoS filter can sort of provide; that is a large part of why I am still wondering if `druid.query.scheduler.numThreads` should be a QoS filter instead of being enforced as an actual lane like it is currently.

Contributor:

It is fine to let the user provide `druid.query.scheduler.numThreads` and compute `druid.server.http.numThreads`; it's just that one of those should not be touched by the user in most cases.

There are a few advantages to maintaining the queues ourselves and not letting Jetty do it:

  • We have no control over the Jetty queue; if a request is dropped, the end user sees that as a TCP connection close and not an HTTP 429, so to the client it is not clear whether to retry or back off.
  • We don't know how much time a request waited in the Jetty queue; consequently, request time metrics don't account for that.
  • The Jetty queue is [probably] static in size; if we managed it ourselves, we would have the option of keeping dynamically sized queues and potentially doing other cool things.

|`druid.query.scheduler.laning.type`|Query laning strategy to use to assign queries to a lane in order to control capacities for certain classes of queries.|`none`|
Contributor:

Perhaps the setting name ("type") and the name in the docs ("strategy") should be made consistent.

In terms of documentation flow, it may be helpful to add a section below (e.g. "Laning strategy") and reference it here. "No laning strategy", etc. would be children of this new section.

Member Author:

druid.query.scheduler.laning.strategy seems reasonable, will switch

Member Author:

With regards to documentation flow, I had made the suggested change in a branch I intend to follow up with: clintropolis/druid@query-laning-and-load-shedding...clintropolis:query-auto-prioritization

I wasn't sure if it made sense to break it down yet in this branch because only the laning strategy exists, whereas in that branch the scheduler also now has a prioritization strategy. I can go ahead and pull that part of the doc change back into this PR though.


###### No laning strategy

In this mode, queries are never assigned a lane and are only limited by `druid.server.http.numThreads` or, if set, `druid.query.scheduler.numThreads`. This is the default Druid query scheduler operating mode.
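
For example, this default strategy can be selected explicitly with a single property (an illustrative snippet, echoing the suggestion in the review comment below):

```properties
# Explicitly select the default (no-op) laning strategy; equivalent to leaving it unset.
druid.query.scheduler.laning.type=none
```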

Contributor:

Consider adding:

> This strategy can be enabled by setting `druid.query.scheduler.laning.type` to `none`.

###### 'High/Low' laning strategy

This laning strategy automatically assigns queries with a `priority` below zero to a `low` query lane. The limit on `low` queries can be set to some desired fraction of the total capacity (or HTTP thread pool size), reserving capacity for interactive queries. Queries in the `low` lane are _not_ guaranteed their capacity, which may be consumed by interactive queries, but they may use up to this limit if total capacity is available.

This strategy can be enabled by setting `druid.query.scheduler.laning.type` to `hilo`.

|Property|Description|Default|
|--------|-----------|-------|
|`druid.query.scheduler.laning.maxLowThreads`|Maximum number of HTTP threads that can be used by queries with a priority lower than 0.|No default, must be set if using this mode|
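
For example, a broker `runtime.properties` using the properties documented in this table might look like the following sketch (values are illustrative only, and note that `maxLowThreads` is renamed later in this review thread):

```properties
# Optional overall limit on concurrently processed queries (druid.query.scheduler.numThreads above).
druid.query.scheduler.numThreads=40
# Automatically assign queries with a priority below zero to the 'low' lane.
druid.query.scheduler.laning.type=hilo
# Allow at most 10 HTTP threads for 'low' lane queries; requests beyond that limit receive HTTP 429.
druid.query.scheduler.laning.maxLowThreads=10
```
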
Contributor:

Perhaps rename to maxLowHttpThreads so that it's not confused with the number of processing threads

Member Author:

I'm not sure I agree that it is particularly confusing, since the HTTP setting is `druid.server.http.numThreads` and the new scheduler 'total' lane is `druid.query.scheduler.numThreads`. Are you considering the hypothetical case of extending the concept of laning to the processing pool, I guess?

Would this setting be better as a percentage, so one property could be applicable to either usage? It doesn't seem like it would be hard to switch; it would just need `QueryLaningStrategy.getLaneLimits` to take the 'total' limit, and `ServerConfig` made available to the `QueryScheduler` so it could fall back to `druid.server.http.numThreads` if `druid.query.scheduler.numThreads` isn't set. `ServerConfig` should probably already be provided to `QueryScheduler` so it can treat the case where `druid.query.scheduler.numThreads` is higher than `druid.server.http.numThreads` the same as not setting the scheduler `numThreads` at all and ignoring the total limiter.

Member Author:

reworked/renamed to maxLowPercent to be more flexible


##### Server Configuration

Druid uses Jetty to serve HTTP requests.
Druid uses Jetty to serve HTTP requests. Each query being processed consumes a single thread from `druid.server.http.numThreads`, so consider setting `druid.query.scheduler.numThreads` to a lower value in order to reserve HTTP threads for responding to health checks, lookup loading, and other non-query HTTP requests, which in most cases are comparatively short-lived.
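
For example, an illustrative (not prescriptive) pairing of the two settings that leaves slack for non-query traffic might be:

```properties
# Jetty HTTP thread pool shared by all requests (queries, health checks, lookup updates, ...).
druid.server.http.numThreads=50
# Keep the query scheduler limit below the Jetty pool so roughly 10 threads stay free for
# non-query requests even when long running queries pile up.
druid.query.scheduler.numThreads=40
```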

|Property|Description|Default|
|--------|-----------|-------|
@@ -65,7 +65,9 @@
import org.apache.druid.query.timeseries.TimeseriesQuery;
import org.apache.druid.query.timeseries.TimeseriesResultValue;
import org.apache.druid.server.ClientQuerySegmentWalker;
import org.apache.druid.server.QueryScheduler;
import org.apache.druid.server.initialization.ServerConfig;
import org.apache.druid.server.scheduling.NoQueryLaningStrategy;
import org.apache.druid.testing.InitializedNullHandlingTest;
import org.apache.druid.timeline.TimelineLookup;
import org.hamcrest.core.IsInstanceOf;
@@ -361,7 +363,8 @@ public String getFormatString()
return null;
}
},
ForkJoinPool.commonPool()
ForkJoinPool.commonPool(),
new QueryScheduler(Integer.MAX_VALUE, NoQueryLaningStrategy.INSTANCE)
);

ClientQuerySegmentWalker walker = new ClientQuerySegmentWalker(
@@ -909,7 +909,7 @@ private TaskToolbox makeToolbox(
new QueryWatcher()
{
@Override
public void registerQuery(Query query, ListenableFuture future)
public void registerQueryFuture(Query query, ListenableFuture future)
{
// do nothing
}
@@ -144,7 +144,7 @@ public Iterable<T> call()
)
);

queryWatcher.registerQuery(query, futures);
queryWatcher.registerQueryFuture(query, futures);

try {
return new MergeIterable<>(
@@ -178,7 +178,7 @@ private void waitForFutureCompletion(
)
{
try {
queryWatcher.registerQuery(query, future);
queryWatcher.registerQueryFuture(query, future);
if (QueryContexts.hasTimeout(query)) {
future.get(QueryContexts.getTimeout(query), TimeUnit.MILLISECONDS);
} else {
@@ -35,6 +35,7 @@
public class QueryContexts
{
public static final String PRIORITY_KEY = "priority";
public static final String LANE_KEY = "lane";
Contributor:

Was this added to the docs?

Member Author:

No, I hadn't documented it since I hadn't decided whether or not a lane specified in the query context by the user should override the laning strategy, or if it should be laning-strategy specific; see the other comment about this.

public static final String TIMEOUT_KEY = "timeout";
public static final String MAX_SCATTER_GATHER_BYTES_KEY = "maxScatterGatherBytes";
public static final String MAX_QUEUED_BYTES_KEY = "maxQueuedBytes";
@@ -200,6 +201,11 @@ public static <T> int getPriority(Query<T> query, int defaultValue)
return parseInt(query, PRIORITY_KEY, defaultValue);
}

public static <T> String getLane(Query<T> query)
{
return (String) query.getContextValue(LANE_KEY);
}

public static <T> boolean getEnableParallelMerges(Query<T> query)
{
return parseBoolean(query, BROKER_PARALLEL_MERGE_KEY, DEFAULT_ENABLE_PARALLEL_MERGE);
@@ -43,5 +43,5 @@ public interface QueryWatcher
* @param query a query, which may be a subset of a larger query, as long as the underlying queryId is unchanged
* @param future the future holding the execution status of the query
*/
void registerQuery(Query query, ListenableFuture future);
void registerQueryFuture(Query<?> query, ListenableFuture<?> future);
}
@@ -346,7 +346,7 @@ private void waitForFutureCompletion(
{
try {
if (queryWatcher != null) {
queryWatcher.registerQuery(query, future);
queryWatcher.registerQueryFuture(query, future);
}

if (hasTimeout && timeout <= 0) {
@@ -219,7 +219,7 @@ public Sequence<SegmentAnalysis> call()
}
);
try {
queryWatcher.registerQuery(query, future);
queryWatcher.registerQueryFuture(query, future);
if (QueryContexts.hasTimeout(query)) {
return future.get(QueryContexts.getTimeout(query), TimeUnit.MILLISECONDS);
} else {
@@ -84,7 +84,7 @@ public int getNumThreads()

Capture<ListenableFuture> capturedFuture = EasyMock.newCapture();
QueryWatcher watcher = EasyMock.createStrictMock(QueryWatcher.class);
watcher.registerQuery(
watcher.registerQueryFuture(
EasyMock.anyObject(),
EasyMock.and(EasyMock.anyObject(), EasyMock.capture(capturedFuture))
);
@@ -207,7 +207,7 @@ public int getNumThreads()

Capture<ListenableFuture> capturedFuture = Capture.newInstance();
QueryWatcher watcher = EasyMock.createStrictMock(QueryWatcher.class);
watcher.registerQuery(
watcher.registerQueryFuture(
EasyMock.anyObject(),
EasyMock.and(EasyMock.anyObject(), EasyMock.capture(capturedFuture))
);
@@ -676,7 +676,7 @@ public static <T, QueryType extends Query<T>> QueryRunner<T> makeQueryRunner(
public static final QueryWatcher NOOP_QUERYWATCHER = new QueryWatcher()
{
@Override
public void registerQuery(Query query, ListenableFuture future)
public void registerQueryFuture(Query query, ListenableFuture future)
{

}
@@ -411,7 +411,7 @@ public static <T, QueryType extends Query<T>> QueryRunner<T> makeQueryRunner(
public static final QueryWatcher NOOP_QUERYWATCHER = new QueryWatcher()
{
@Override
public void registerQuery(Query query, ListenableFuture future)
public void registerQueryFuture(Query query, ListenableFuture future)
{

}